This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
assorted blead build help for VMS (mostly ithreads-related)
[perl5.git] / sv.c
CommitLineData
a0d0e21e 1/* sv.c
79072805 2 *
4bb101f2 3 * Copyright (C) 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
241d1a3b 4 * 2000, 2001, 2002, 2003, 2004, 2005, by Larry Wall and others
79072805
LW
5 *
6 * You may distribute under the terms of either the GNU General Public
7 * License or the Artistic License, as specified in the README file.
8 *
a0d0e21e 9 * "I wonder what the Entish is for 'yes' and 'no'," he thought.
645c22ef
DM
10 *
11 *
5e045b90
AMS
12 * This file contains the code that creates, manipulates and destroys
13 * scalar values (SVs). The other types (AV, HV, GV, etc.) reuse the
14 * structure of an SV, so their creation and destruction is handled
15 * here; higher-level functions are in av.c, hv.c, and so on. Opcode
16 * level functions (eg. substr, split, join) for each of the types are
17 * in the pp*.c files.
79072805
LW
18 */
19
20#include "EXTERN.h"
864dbfa3 21#define PERL_IN_SV_C
79072805 22#include "perl.h"
d2f185dc 23#include "regcomp.h"
79072805 24
51371543 25#define FCALL *f
2c5424a7 26
2f8ed50e
OS
27#ifdef __Lynx__
28/* Missing proto on LynxOS */
29 char *gconvert(double, int, int, char *);
30#endif
31
e23c8137
JH
32#ifdef PERL_UTF8_CACHE_ASSERT
33/* The cache element 0 is the Unicode offset;
34 * the cache element 1 is the byte offset of the element 0;
35 * the cache element 2 is the Unicode length of the substring;
36 * the cache element 3 is the byte length of the substring;
37 * The checking of the substring side would be good
38 * but substr() has enough code paths to make my head spin;
39 * if adding more checks watch out for the following tests:
40 * t/op/index.t t/op/length.t t/op/pat.t t/op/substr.t
41 * lib/utf8.t lib/Unicode/Collate/t/index.t
42 * --jhi
43 */
44#define ASSERT_UTF8_CACHE(cache) \
45 STMT_START { if (cache) { assert((cache)[0] <= (cache)[1]); } } STMT_END
46#else
47#define ASSERT_UTF8_CACHE(cache) NOOP
48#endif
49
f8c7b90f 50#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 51#define SV_COW_NEXT_SV(sv) INT2PTR(SV *,SvUVX(sv))
607fa7f2 52#define SV_COW_NEXT_SV_SET(current,next) SvUV_set(current, PTR2UV(next))
b5ccf5f2 53/* This is a pessimistic view. Scalar must be purely a read-write PV to copy-
765f542d 54 on-write. */
765f542d 55#endif
645c22ef
DM
56
57/* ============================================================================
58
59=head1 Allocation and deallocation of SVs.
60
5e045b90
AMS
61An SV (or AV, HV, etc.) is allocated in two parts: the head (struct sv,
62av, hv...) contains type and reference count information, as well as a
63pointer to the body (struct xrv, xpv, xpviv...), which contains fields
64specific to each type.
65
4977e971
NC
66Normally, this allocation is done using arenas, which by default are
67approximately 4K chunks of memory parcelled up into N heads or bodies. The
68first slot in each arena is reserved, and is used to hold a link to the next
69arena. In the case of heads, the unused first slot also contains some flags
70and a note of the number of slots. Snaked through each arena chain is a
5e045b90 71linked list of free items; when this becomes empty, an extra arena is
4977e971 72allocated and divided up into N items which are threaded into the free list.
645c22ef
DM
73
74The following global variables are associated with arenas:
75
76 PL_sv_arenaroot pointer to list of SV arenas
77 PL_sv_root pointer to list of free SV structures
78
79 PL_foo_arenaroot pointer to list of foo arenas,
80 PL_foo_root pointer to list of free foo bodies
81 ... for foo in xiv, xnv, xrv, xpv etc.
82
83Note that some of the larger and more rarely used body types (eg xpvio)
84are not allocated using arenas, but are instead just malloc()/free()ed as
85required. Also, if PURIFY is defined, arenas are abandoned altogether,
86with all items individually malloc()ed. In addition, a few SV heads are
87not allocated from an arena, but are instead directly created as static
4977e971
NC
88or auto variables, eg PL_sv_undef. The size of arenas can be changed from
89the default by setting PERL_ARENA_SIZE appropriately at compile time.
645c22ef
DM
90
91The SV arena serves the secondary purpose of allowing still-live SVs
92to be located and destroyed during final cleanup.
93
94At the lowest level, the macros new_SV() and del_SV() grab and free
95an SV head. (If debugging with -DD, del_SV() calls the function S_del_sv()
96to return the SV to the free list with error checking.) new_SV() calls
97more_sv() / sv_add_arena() to add an extra arena if the free list is empty.
98SVs in the free list have their SvTYPE field set to all ones.
99
100Similarly, there are macros new_XIV()/del_XIV(), new_XNV()/del_XNV() etc
101that allocate and return individual body types. Normally these are mapped
ff276b08
RG
102to the arena-manipulating functions new_xiv()/del_xiv() etc, but may be
103instead mapped directly to malloc()/free() if PURIFY is defined. The
645c22ef
DM
104new/del functions remove from, or add to, the appropriate PL_foo_root
105list, and call more_xiv() etc to add a new arena if the list is empty.
106
ff276b08 107At the time of very final cleanup, sv_free_arenas() is called from
645c22ef
DM
108perl_destruct() to physically free all the arenas allocated since the
109start of the interpreter. Note that this also clears PL_he_arenaroot,
110which is otherwise dealt with in hv.c.
111
112Manipulation of any of the PL_*root pointers is protected by enclosing
113LOCK_SV_MUTEX; ... UNLOCK_SV_MUTEX calls which should Do the Right Thing
114if threads are enabled.
115
116The function visit() scans the SV arenas list, and calls a specified
117function for each SV it finds which is still live - ie which has an SvTYPE
118other than all 1's, and a non-zero SvREFCNT. visit() is used by the
119following functions (specified as [function that calls visit()] / [function
120called by visit() for each SV]):
121
122 sv_report_used() / do_report_used()
123 dump all remaining SVs (debugging aid)
124
125 sv_clean_objs() / do_clean_objs(),do_clean_named_objs()
126 Attempt to free all objects pointed to by RVs,
127 and, unless DISABLE_DESTRUCTOR_KLUDGE is defined,
128 try to do the same for all objects indirectly
129 referenced by typeglobs too. Called once from
130 perl_destruct(), prior to calling sv_clean_all()
131 below.
132
133 sv_clean_all() / do_clean_all()
134 SvREFCNT_dec(sv) each remaining SV, possibly
135 triggering an sv_free(). It also sets the
136 SVf_BREAK flag on the SV to indicate that the
137 refcnt has been artificially lowered, and thus
138 stopping sv_free() from giving spurious warnings
139 about SVs which unexpectedly have a refcnt
140 of zero. called repeatedly from perl_destruct()
141 until there are no SVs left.
142
143=head2 Summary
144
145Private API to rest of sv.c
146
147 new_SV(), del_SV(),
148
149 new_XIV(), del_XIV(),
150 new_XNV(), del_XNV(),
151 etc
152
153Public API:
154
8cf8f3d1 155 sv_report_used(), sv_clean_objs(), sv_clean_all(), sv_free_arenas()
645c22ef
DM
156
157
158=cut
159
160============================================================================ */
161
162
51371543 163
4561caa4
CS
164/*
165 * "A time to plant, and a time to uproot what was planted..."
166 */
167
77354fb4
NC
/*
 * PL_nice_chunk and PL_nice_chunk_size need to be set
 * and queried under the protection of sv_mutex
 */
172void
173Perl_offer_nice_chunk(pTHX_ void *chunk, U32 chunk_size)
174{
175 void *new_chunk;
176 U32 new_chunk_size;
177 LOCK_SV_MUTEX;
178 new_chunk = (void *)(chunk);
179 new_chunk_size = (chunk_size);
180 if (new_chunk_size > PL_nice_chunk_size) {
181 Safefree(PL_nice_chunk);
182 PL_nice_chunk = (char *) new_chunk;
183 PL_nice_chunk_size = new_chunk_size;
184 } else {
185 Safefree(chunk);
186 }
187 UNLOCK_SV_MUTEX;
188}
cac9b346 189
fd0854ff
DM
/* FREE_SV_DEBUG_FILE(sv): release the sv_debug_file string stored in an SV
 * head.  Expands to nothing unless DEBUG_LEAKING_SCALARS is defined. */
#if !defined(DEBUG_LEAKING_SCALARS)
#  define FREE_SV_DEBUG_FILE(sv)
#elif defined(NETWARE)
#  define FREE_SV_DEBUG_FILE(sv) PerlMemfree((sv)->sv_debug_file)
#else
#  define FREE_SV_DEBUG_FILE(sv) PerlMemShared_free((sv)->sv_debug_file)
#endif
199
053fc874
GS
/* plant_SV(p): push the SV head p onto the front of the PL_sv_root free
 * list.  The head is marked free by setting its flags to SVTYPEMASK, its
 * SvANY slot becomes the link to the previous list head, and the count of
 * SVs in use (PL_sv_count) is decremented.  Note that p is evaluated more
 * than once. */
#define plant_SV(p) \
    STMT_START {					\
	FREE_SV_DEBUG_FILE(p);				\
	SvFLAGS(p) = SVTYPEMASK;			\
	SvANY(p) = (void *)PL_sv_root;			\
	PL_sv_root = (p);				\
	PL_sv_count--;					\
    } STMT_END
a0d0e21e 208
fba3b22e 209/* sv_mutex must be held while calling uproot_SV() */
053fc874
GS
210#define uproot_SV(p) \
211 STMT_START { \
212 (p) = PL_sv_root; \
213 PL_sv_root = (SV*)SvANY(p); \
214 ++PL_sv_count; \
215 } STMT_END
216
645c22ef 217
cac9b346
NC
218/* make some more SVs by adding another arena */
219
220/* sv_mutex must be held while calling more_sv() */
221STATIC SV*
222S_more_sv(pTHX)
223{
224 SV* sv;
225
226 if (PL_nice_chunk) {
227 sv_add_arena(PL_nice_chunk, PL_nice_chunk_size, 0);
228 PL_nice_chunk = Nullch;
229 PL_nice_chunk_size = 0;
230 }
231 else {
232 char *chunk; /* must use New here to match call to */
a02a5408 233 Newx(chunk,PERL_ARENA_SIZE,char); /* Safefree() in sv_free_arenas() */
2e7ed132 234 sv_add_arena(chunk, PERL_ARENA_SIZE, 0);
cac9b346
NC
235 }
236 uproot_SV(sv);
237 return sv;
238}
239
645c22ef
DM
240/* new_SV(): return a new, empty SV head */
241
eba0f806
DM
#ifdef DEBUG_LEAKING_SCALARS
/* provide a real function for a debugger to play with */
STATIC SV*
S_new_SV(pTHX)
{
    SV *head;

    /* take a head from the free list, adding an arena if it is empty */
    LOCK_SV_MUTEX;
    if (!PL_sv_root)
        head = S_more_sv(aTHX);
    else
        uproot_SV(head);
    UNLOCK_SV_MUTEX;

    /* reset the head to a pristine state with a single reference */
    SvFLAGS(head) = 0;
    SvREFCNT(head) = 1;
    SvANY(head) = 0;

    /* record where the SV was created, to help track down leaks */
    head->sv_debug_optype = PL_op ? PL_op->op_type : 0;
    head->sv_debug_line = (U16) ((PL_copline == NOLINE) ?
        (PL_curcop ? CopLINE(PL_curcop) : 0) : PL_copline);
    head->sv_debug_inpad = 0;
    head->sv_debug_cloned = 0;
# ifdef NETWARE
    head->sv_debug_file = PL_curcop ? savepv(CopFILE(PL_curcop)): NULL;
# else
    head->sv_debug_file = PL_curcop ? savesharedpv(CopFILE(PL_curcop)): NULL;
# endif

    return head;
}
# define new_SV(p) (p)=S_new_SV(aTHX)

#else
/* Inline version: same allocation and reset as above, without the
 * debugging bookkeeping.  p is evaluated more than once. */
# define new_SV(p) \
    STMT_START {					\
	LOCK_SV_MUTEX;					\
	if (!PL_sv_root)				\
	    (p) = S_more_sv(aTHX);			\
	else						\
	    uproot_SV(p);				\
	UNLOCK_SV_MUTEX;				\
	SvFLAGS(p) = 0;					\
	SvREFCNT(p) = 1;				\
	SvANY(p) = 0;					\
    } STMT_END
#endif
463ee0b2 287
645c22ef
DM
288
289/* del_SV(): return an empty SV head to the free list */
290
#ifdef DEBUGGING

/* With -DD the head goes through S_del_sv() so that it can be checked
 * against the arenas; otherwise it is planted directly.  Either way the
 * free list is only touched with sv_mutex held. */
#define del_SV(p) \
    STMT_START {					\
	LOCK_SV_MUTEX;					\
	if (DEBUG_D_TEST)				\
	    del_sv(p);					\
	else						\
	    plant_SV(p);				\
	UNLOCK_SV_MUTEX;				\
    } STMT_END

/* Return p to the free list.  Under -DD, first verify that p lies inside
 * one of the arenas; if it does not, warn (category "internal") and leave
 * the free list untouched. */
STATIC void
S_del_sv(pTHX_ SV *p)
{
    if (DEBUG_D_TEST) {
        SV *arena = PL_sv_arenaroot;

        /* stop at the first arena whose usable slots contain p; slot 0 of
         * each arena is the arena header and is never a real SV */
        while (arena) {
            const SV * const first = arena + 1;
            const SV * const limit = &arena[SvREFCNT(arena)];
            if (p >= first && p < limit)
                break;
            arena = (SV *) SvANY(arena);
        }

        if (!arena) {
            /* ran off the end of the arena list: p is not arena-allocated */
            if (ckWARN_d(WARN_INTERNAL))
                Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
                            "Attempt to free non-arena SV: 0x%"UVxf
                            pTHX__FORMAT, PTR2UV(p) pTHX__VALUE);
            return;
        }
    }
    plant_SV(p);
}

#else /* ! DEBUGGING */

/* NOTE(review): unlike the DEBUGGING variant, this expands to a bare
 * plant_SV() with no LOCK_SV_MUTEX/UNLOCK_SV_MUTEX around it -- confirm
 * that this asymmetry is intentional. */
#define del_SV(p)   plant_SV(p)

#endif /* DEBUGGING */
463ee0b2 333
645c22ef
DM
334
335/*
ccfc67b7
JH
336=head1 SV Manipulation Functions
337
645c22ef
DM
338=for apidoc sv_add_arena
339
340Given a chunk of memory, link it to the head of the list of arenas,
341and split it into a list of free SVs.
342
343=cut
344*/
345
4633a7c4 346void
864dbfa3 347Perl_sv_add_arena(pTHX_ char *ptr, U32 size, U32 flags)
463ee0b2 348{
4633a7c4 349 SV* sva = (SV*)ptr;
463ee0b2
LW
350 register SV* sv;
351 register SV* svend;
4633a7c4
LW
352
353 /* The first SV in an arena isn't an SV. */
3280af22 354 SvANY(sva) = (void *) PL_sv_arenaroot; /* ptr to next arena */
4633a7c4
LW
355 SvREFCNT(sva) = size / sizeof(SV); /* number of SV slots */
356 SvFLAGS(sva) = flags; /* FAKE if not to be freed */
357
3280af22
NIS
358 PL_sv_arenaroot = sva;
359 PL_sv_root = sva + 1;
4633a7c4
LW
360
361 svend = &sva[SvREFCNT(sva) - 1];
362 sv = sva + 1;
463ee0b2 363 while (sv < svend) {
a0d0e21e 364 SvANY(sv) = (void *)(SV*)(sv + 1);
03e36789 365#ifdef DEBUGGING
978b032e 366 SvREFCNT(sv) = 0;
03e36789
NC
367#endif
368 /* Must always set typemask because it's awlays checked in on cleanup
369 when the arenas are walked looking for objects. */
8990e307 370 SvFLAGS(sv) = SVTYPEMASK;
463ee0b2
LW
371 sv++;
372 }
373 SvANY(sv) = 0;
03e36789
NC
374#ifdef DEBUGGING
375 SvREFCNT(sv) = 0;
376#endif
4633a7c4
LW
377 SvFLAGS(sv) = SVTYPEMASK;
378}
379
055972dc
DM
380/* visit(): call the named function for each non-free SV in the arenas
381 * whose flags field matches the flags/mask args. */
645c22ef 382
5226ed68 383STATIC I32
055972dc 384S_visit(pTHX_ SVFUNC_t f, U32 flags, U32 mask)
8990e307 385{
4633a7c4 386 SV* sva;
5226ed68 387 I32 visited = 0;
8990e307 388
3280af22 389 for (sva = PL_sv_arenaroot; sva; sva = (SV*)SvANY(sva)) {
53c1dcc0 390 register const SV * const svend = &sva[SvREFCNT(sva)];
a3b680e6 391 register SV* sv;
4561caa4 392 for (sv = sva + 1; sv < svend; ++sv) {
055972dc
DM
393 if (SvTYPE(sv) != SVTYPEMASK
394 && (sv->sv_flags & mask) == flags
395 && SvREFCNT(sv))
396 {
acfe0abc 397 (FCALL)(aTHX_ sv);
5226ed68
JH
398 ++visited;
399 }
8990e307
LW
400 }
401 }
5226ed68 402 return visited;
8990e307
LW
403}
404
758a08c3
JH
#ifdef DEBUGGING

/* called by sv_report_used() for each live SV: print a separator line to
 * the debug log, then dump the SV */

static void
do_report_used(pTHX_ SV *sv)
{
    if (SvTYPE(sv) == SVTYPEMASK)
        return;         /* free-list entry: nothing to report */

    PerlIO_printf(Perl_debug_log, "****\n");
    sv_dump(sv);
}
#endif
645c22ef
DM
418
419/*
420=for apidoc sv_report_used
421
422Dump the contents of all SVs not yet freed. (Debugging aid).
423
424=cut
425*/
426
void
Perl_sv_report_used(pTHX)
{
    /* Only DEBUGGING builds have do_report_used(); elsewhere this function
     * does nothing. */
#ifdef DEBUGGING
    /* flags == mask == 0 selects every live SV; the count is not needed */
    (void) visit(do_report_used, 0, 0);
#endif
}
434
645c22ef
DM
435/* called by sv_clean_objs() for each live SV */
436
437static void
e15faf7d 438do_clean_objs(pTHX_ SV *ref)
645c22ef 439{
e15faf7d 440 SV* target;
645c22ef 441
e15faf7d
NC
442 if (SvROK(ref) && SvOBJECT(target = SvRV(ref))) {
443 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning object ref:\n "), sv_dump(ref)));
444 if (SvWEAKREF(ref)) {
445 sv_del_backref(target, ref);
446 SvWEAKREF_off(ref);
447 SvRV_set(ref, NULL);
645c22ef 448 } else {
e15faf7d
NC
449 SvROK_off(ref);
450 SvRV_set(ref, NULL);
451 SvREFCNT_dec(target);
645c22ef
DM
452 }
453 }
454
455 /* XXX Might want to check arrays, etc. */
456}
457
458/* called by sv_clean_objs() for each live SV */
459
460#ifndef DISABLE_DESTRUCTOR_KLUDGE
461static void
acfe0abc 462do_clean_named_objs(pTHX_ SV *sv)
645c22ef
DM
463{
464 if (SvTYPE(sv) == SVt_PVGV && GvGP(sv)) {
c69033f2
NC
465 if ((
466#ifdef PERL_DONT_CREATE_GVSV
467 GvSV(sv) &&
468#endif
469 SvOBJECT(GvSV(sv))) ||
645c22ef
DM
470 (GvAV(sv) && SvOBJECT(GvAV(sv))) ||
471 (GvHV(sv) && SvOBJECT(GvHV(sv))) ||
472 (GvIO(sv) && SvOBJECT(GvIO(sv))) ||
473 (GvCV(sv) && SvOBJECT(GvCV(sv))) )
474 {
475 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning named glob object:\n "), sv_dump(sv)));
ec5f3c78 476 SvFLAGS(sv) |= SVf_BREAK;
645c22ef
DM
477 SvREFCNT_dec(sv);
478 }
479 }
480}
481#endif
482
483/*
484=for apidoc sv_clean_objs
485
486Attempt to destroy all objects not yet freed
487
488=cut
489*/
490
4561caa4 491void
864dbfa3 492Perl_sv_clean_objs(pTHX)
4561caa4 493{
3280af22 494 PL_in_clean_objs = TRUE;
055972dc 495 visit(do_clean_objs, SVf_ROK, SVf_ROK);
4561caa4 496#ifndef DISABLE_DESTRUCTOR_KLUDGE
2d0f3c12 497 /* some barnacles may yet remain, clinging to typeglobs */
055972dc 498 visit(do_clean_named_objs, SVt_PVGV, SVTYPEMASK);
4561caa4 499#endif
3280af22 500 PL_in_clean_objs = FALSE;
4561caa4
CS
501}
502
645c22ef
DM
503/* called by sv_clean_all() for each live SV */
504
505static void
acfe0abc 506do_clean_all(pTHX_ SV *sv)
645c22ef
DM
507{
508 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning loops: SV at 0x%"UVxf"\n", PTR2UV(sv)) ));
509 SvFLAGS(sv) |= SVf_BREAK;
0e705b3b
DM
510 if (PL_comppad == (AV*)sv) {
511 PL_comppad = Nullav;
512 PL_curpad = Null(SV**);
513 }
645c22ef
DM
514 SvREFCNT_dec(sv);
515}
516
517/*
518=for apidoc sv_clean_all
519
520Decrement the refcnt of each remaining SV, possibly triggering a
521cleanup. This function may have to be called multiple times to free
ff276b08 522SVs which are in complex self-referential hierarchies.
645c22ef
DM
523
524=cut
525*/
526
5226ed68 527I32
864dbfa3 528Perl_sv_clean_all(pTHX)
8990e307 529{
5226ed68 530 I32 cleaned;
3280af22 531 PL_in_clean_all = TRUE;
055972dc 532 cleaned = visit(do_clean_all, 0,0);
3280af22 533 PL_in_clean_all = FALSE;
5226ed68 534 return cleaned;
8990e307 535}
463ee0b2 536
7cfef17e
NC
537static void
538S_free_arena(pTHX_ void **root) {
539 while (root) {
1b6737cc 540 void ** const next = *(void **)root;
7cfef17e
NC
541 Safefree(root);
542 root = next;
543 }
544}
545
645c22ef
DM
546/*
547=for apidoc sv_free_arenas
548
549Deallocate the memory used by all arenas. Note that all the individual SV
550heads and bodies within the arenas must already have been freed.
551
552=cut
553*/
554
7cfef17e
NC
/* free_arena(name): free every arena chained from PL_<name>_arenaroot, then
 * clear both that arena list and the matching PL_<name>_root free list. */
#define free_arena(name)					\
    STMT_START {						\
	S_free_arena(aTHX_ (void**) PL_ ## name ## _arenaroot);	\
	PL_ ## name ## _root = 0;				\
	PL_ ## name ## _arenaroot = 0;				\
    } STMT_END
561
4633a7c4 562void
864dbfa3 563Perl_sv_free_arenas(pTHX)
4633a7c4
LW
564{
565 SV* sva;
566 SV* svanext;
567
568 /* Free arenas here, but be careful about fake ones. (We assume
569 contiguity of the fake ones with the corresponding real ones.) */
570
3280af22 571 for (sva = PL_sv_arenaroot; sva; sva = svanext) {
4633a7c4
LW
572 svanext = (SV*) SvANY(sva);
573 while (svanext && SvFAKE(svanext))
574 svanext = (SV*) SvANY(svanext);
575
576 if (!SvFAKE(sva))
1df70142 577 Safefree(sva);
4633a7c4 578 }
8b4f5e17 579
7cfef17e
NC
580 free_arena(xnv);
581 free_arena(xpv);
582 free_arena(xpviv);
583 free_arena(xpvnv);
584 free_arena(xpvcv);
585 free_arena(xpvav);
586 free_arena(xpvhv);
587 free_arena(xpvmg);
588 free_arena(xpvgv);
589 free_arena(xpvlv);
590 free_arena(xpvbm);
591 free_arena(he);
592#if defined(USE_ITHREADS)
593 free_arena(pte);
594#endif
612f20c3 595
43c5f42d 596 Safefree(PL_nice_chunk);
3280af22
NIS
597 PL_nice_chunk = Nullch;
598 PL_nice_chunk_size = 0;
599 PL_sv_arenaroot = 0;
600 PL_sv_root = 0;
4633a7c4
LW
601}
602
29489e7c
DM
603/* ---------------------------------------------------------------------
604 *
605 * support functions for report_uninit()
606 */
607
/* the maximum size of array or hash where we will scan looking
 * for the undefined element that triggered the warning */
610
611#define FUV_MAX_SEARCH_SIZE 1000
612
613/* Look for an entry in the hash whose value has the same SV as val;
614 * If so, return a mortal copy of the key. */
615
616STATIC SV*
617S_find_hash_subscript(pTHX_ HV *hv, SV* val)
618{
27da23d5 619 dVAR;
29489e7c 620 register HE **array;
29489e7c
DM
621 I32 i;
622
623 if (!hv || SvMAGICAL(hv) || !HvARRAY(hv) ||
624 (HvTOTALKEYS(hv) > FUV_MAX_SEARCH_SIZE))
625 return Nullsv;
626
627 array = HvARRAY(hv);
628
629 for (i=HvMAX(hv); i>0; i--) {
f54cb97a 630 register HE *entry;
29489e7c
DM
631 for (entry = array[i]; entry; entry = HeNEXT(entry)) {
632 if (HeVAL(entry) != val)
633 continue;
634 if ( HeVAL(entry) == &PL_sv_undef ||
635 HeVAL(entry) == &PL_sv_placeholder)
636 continue;
637 if (!HeKEY(entry))
638 return Nullsv;
639 if (HeKLEN(entry) == HEf_SVKEY)
640 return sv_mortalcopy(HeKEY_sv(entry));
641 return sv_2mortal(newSVpvn(HeKEY(entry), HeKLEN(entry)));
642 }
643 }
644 return Nullsv;
645}
646
647/* Look for an entry in the array whose value has the same SV as val;
648 * If so, return the index, otherwise return -1. */
649
650STATIC I32
651S_find_array_subscript(pTHX_ AV *av, SV* val)
652{
653 SV** svp;
654 I32 i;
655 if (!av || SvMAGICAL(av) || !AvARRAY(av) ||
656 (AvFILLp(av) > FUV_MAX_SEARCH_SIZE))
657 return -1;
658
659 svp = AvARRAY(av);
660 for (i=AvFILLp(av); i>=0; i--) {
661 if (svp[i] == val && svp[i] != &PL_sv_undef)
662 return i;
663 }
664 return -1;
665}
666
667/* S_varname(): return the name of a variable, optionally with a subscript.
668 * If gv is non-zero, use the name of that global, along with gvtype (one
669 * of "$", "@", "%"); otherwise use the name of the lexical at pad offset
670 * targ. Depending on the value of the subscript_type flag, return:
671 */
672
673#define FUV_SUBSCRIPT_NONE 1 /* "@foo" */
674#define FUV_SUBSCRIPT_ARRAY 2 /* "$foo[aindex]" */
675#define FUV_SUBSCRIPT_HASH 3 /* "$foo{keyname}" */
676#define FUV_SUBSCRIPT_WITHIN 4 /* "within @foo" */
677
678STATIC SV*
be2ef075 679S_varname(pTHX_ GV *gv, const char gvtype, PADOFFSET targ,
29489e7c
DM
680 SV* keyname, I32 aindex, int subscript_type)
681{
29489e7c 682
a3b680e6 683 SV * const name = sv_newmortal();
29489e7c
DM
684 if (gv) {
685
686 /* simulate gv_fullname4(), but add literal '^' for $^FOO names
687 * XXX get rid of all this if gv_fullnameX() ever supports this
688 * directly */
689
bfed75c6 690 const char *p;
53c1dcc0 691 HV * const hv = GvSTASH(gv);
29489e7c
DM
692 if (!hv)
693 p = "???";
bfcb3514 694 else if (!(p=HvNAME_get(hv)))
29489e7c 695 p = "__ANON__";
be2ef075
NC
696 if (strEQ(p, "main"))
697 sv_setpvn(name, &gvtype, 1);
698 else
699 Perl_sv_setpvf(aTHX_ name, "%c%s::", gvtype, p);
700
29489e7c
DM
701 if (GvNAMELEN(gv)>= 1 &&
702 ((unsigned int)*GvNAME(gv)) <= 26)
703 { /* handle $^FOO */
704 Perl_sv_catpvf(aTHX_ name,"^%c", *GvNAME(gv) + 'A' - 1);
705 sv_catpvn(name,GvNAME(gv)+1,GvNAMELEN(gv)-1);
706 }
707 else
708 sv_catpvn(name,GvNAME(gv),GvNAMELEN(gv));
709 }
710 else {
53c1dcc0
AL
711 U32 unused;
712 CV * const cv = find_runcv(&unused);
713 SV *sv;
714 AV *av;
715
29489e7c 716 if (!cv || !CvPADLIST(cv))
1b6737cc 717 return Nullsv;
29489e7c
DM
718 av = (AV*)(*av_fetch(CvPADLIST(cv), 0, FALSE));
719 sv = *av_fetch(av, targ, FALSE);
720 /* SvLEN in a pad name is not to be trusted */
f9926b10 721 sv_setpv(name, SvPV_nolen_const(sv));
29489e7c
DM
722 }
723
724 if (subscript_type == FUV_SUBSCRIPT_HASH) {
1b6737cc 725 SV * const sv = NEWSV(0,0);
29489e7c 726 *SvPVX(name) = '$';
29489e7c 727 Perl_sv_catpvf(aTHX_ name, "{%s}",
3f7c398e 728 pv_display(sv,SvPVX_const(keyname), SvCUR(keyname), 0, 32));
29489e7c
DM
729 SvREFCNT_dec(sv);
730 }
731 else if (subscript_type == FUV_SUBSCRIPT_ARRAY) {
732 *SvPVX(name) = '$';
265a12b8 733 Perl_sv_catpvf(aTHX_ name, "[%"IVdf"]", (IV)aindex);
29489e7c
DM
734 }
735 else if (subscript_type == FUV_SUBSCRIPT_WITHIN)
736 sv_insert(name, 0, 0, "within ", 7);
737
738 return name;
739}
740
741
742/*
743=for apidoc find_uninit_var
744
745Find the name of the undefined variable (if any) that caused the operator o
746to issue a "Use of uninitialized value" warning.
If match is true, only return a name if its value matches uninit_sv.
748So roughly speaking, if a unary operator (such as OP_COS) generates a
749warning, then following the direct child of the op may yield an
750OP_PADSV or OP_GV that gives the name of the undefined variable. On the
751other hand, with OP_ADD there are two branches to follow, so we only print
752the variable name if we get an exact match.
753
754The name is returned as a mortal SV.
755
756Assumes that PL_op is the op that originally triggered the error, and that
757PL_comppad/PL_curpad points to the currently executing pad.
758
759=cut
760*/
761
762STATIC SV *
763S_find_uninit_var(pTHX_ OP* obase, SV* uninit_sv, bool match)
764{
27da23d5 765 dVAR;
29489e7c
DM
766 SV *sv;
767 AV *av;
29489e7c
DM
768 GV *gv;
769 OP *o, *o2, *kid;
770
771 if (!obase || (match && (!uninit_sv || uninit_sv == &PL_sv_undef ||
772 uninit_sv == &PL_sv_placeholder)))
773 return Nullsv;
774
775 switch (obase->op_type) {
776
777 case OP_RV2AV:
778 case OP_RV2HV:
779 case OP_PADAV:
780 case OP_PADHV:
781 {
f54cb97a
AL
782 const bool pad = (obase->op_type == OP_PADAV || obase->op_type == OP_PADHV);
783 const bool hash = (obase->op_type == OP_PADHV || obase->op_type == OP_RV2HV);
112dcc46
RGS
784 I32 index = 0;
785 SV *keysv = Nullsv;
29489e7c
DM
786 int subscript_type = FUV_SUBSCRIPT_WITHIN;
787
788 if (pad) { /* @lex, %lex */
789 sv = PAD_SVl(obase->op_targ);
790 gv = Nullgv;
791 }
792 else {
793 if (cUNOPx(obase)->op_first->op_type == OP_GV) {
794 /* @global, %global */
795 gv = cGVOPx_gv(cUNOPx(obase)->op_first);
796 if (!gv)
797 break;
798 sv = hash ? (SV*)GvHV(gv): (SV*)GvAV(gv);
799 }
800 else /* @{expr}, %{expr} */
801 return find_uninit_var(cUNOPx(obase)->op_first,
802 uninit_sv, match);
803 }
804
805 /* attempt to find a match within the aggregate */
806 if (hash) {
807 keysv = S_find_hash_subscript(aTHX_ (HV*)sv, uninit_sv);
808 if (keysv)
809 subscript_type = FUV_SUBSCRIPT_HASH;
810 }
811 else {
812 index = S_find_array_subscript(aTHX_ (AV*)sv, uninit_sv);
813 if (index >= 0)
814 subscript_type = FUV_SUBSCRIPT_ARRAY;
815 }
816
817 if (match && subscript_type == FUV_SUBSCRIPT_WITHIN)
818 break;
819
be2ef075 820 return varname(gv, hash ? '%' : '@', obase->op_targ,
29489e7c
DM
821 keysv, index, subscript_type);
822 }
823
824 case OP_PADSV:
825 if (match && PAD_SVl(obase->op_targ) != uninit_sv)
826 break;
be2ef075 827 return varname(Nullgv, '$', obase->op_targ,
29489e7c
DM
828 Nullsv, 0, FUV_SUBSCRIPT_NONE);
829
830 case OP_GVSV:
831 gv = cGVOPx_gv(obase);
832 if (!gv || (match && GvSV(gv) != uninit_sv))
833 break;
be2ef075 834 return varname(gv, '$', 0, Nullsv, 0, FUV_SUBSCRIPT_NONE);
29489e7c
DM
835
836 case OP_AELEMFAST:
837 if (obase->op_flags & OPf_SPECIAL) { /* lexical array */
838 if (match) {
1b6737cc 839 SV **svp;
29489e7c
DM
840 av = (AV*)PAD_SV(obase->op_targ);
841 if (!av || SvRMAGICAL(av))
842 break;
843 svp = av_fetch(av, (I32)obase->op_private, FALSE);
844 if (!svp || *svp != uninit_sv)
845 break;
846 }
be2ef075 847 return varname(Nullgv, '$', obase->op_targ,
29489e7c
DM
848 Nullsv, (I32)obase->op_private, FUV_SUBSCRIPT_ARRAY);
849 }
850 else {
851 gv = cGVOPx_gv(obase);
852 if (!gv)
853 break;
854 if (match) {
1b6737cc 855 SV **svp;
29489e7c
DM
856 av = GvAV(gv);
857 if (!av || SvRMAGICAL(av))
858 break;
859 svp = av_fetch(av, (I32)obase->op_private, FALSE);
860 if (!svp || *svp != uninit_sv)
861 break;
862 }
be2ef075 863 return varname(gv, '$', 0,
29489e7c
DM
864 Nullsv, (I32)obase->op_private, FUV_SUBSCRIPT_ARRAY);
865 }
866 break;
867
868 case OP_EXISTS:
869 o = cUNOPx(obase)->op_first;
870 if (!o || o->op_type != OP_NULL ||
871 ! (o->op_targ == OP_AELEM || o->op_targ == OP_HELEM))
872 break;
873 return find_uninit_var(cBINOPo->op_last, uninit_sv, match);
874
875 case OP_AELEM:
876 case OP_HELEM:
877 if (PL_op == obase)
878 /* $a[uninit_expr] or $h{uninit_expr} */
879 return find_uninit_var(cBINOPx(obase)->op_last, uninit_sv, match);
880
881 gv = Nullgv;
882 o = cBINOPx(obase)->op_first;
883 kid = cBINOPx(obase)->op_last;
884
885 /* get the av or hv, and optionally the gv */
886 sv = Nullsv;
887 if (o->op_type == OP_PADAV || o->op_type == OP_PADHV) {
888 sv = PAD_SV(o->op_targ);
889 }
890 else if ((o->op_type == OP_RV2AV || o->op_type == OP_RV2HV)
891 && cUNOPo->op_first->op_type == OP_GV)
892 {
893 gv = cGVOPx_gv(cUNOPo->op_first);
894 if (!gv)
895 break;
896 sv = o->op_type == OP_RV2HV ? (SV*)GvHV(gv) : (SV*)GvAV(gv);
897 }
898 if (!sv)
899 break;
900
901 if (kid && kid->op_type == OP_CONST && SvOK(cSVOPx_sv(kid))) {
902 /* index is constant */
903 if (match) {
904 if (SvMAGICAL(sv))
905 break;
906 if (obase->op_type == OP_HELEM) {
907 HE* he = hv_fetch_ent((HV*)sv, cSVOPx_sv(kid), 0, 0);
908 if (!he || HeVAL(he) != uninit_sv)
909 break;
910 }
911 else {
1b6737cc 912 SV ** const svp = av_fetch((AV*)sv, SvIV(cSVOPx_sv(kid)), FALSE);
29489e7c
DM
913 if (!svp || *svp != uninit_sv)
914 break;
915 }
916 }
917 if (obase->op_type == OP_HELEM)
be2ef075 918 return varname(gv, '%', o->op_targ,
29489e7c
DM
919 cSVOPx_sv(kid), 0, FUV_SUBSCRIPT_HASH);
920 else
be2ef075 921 return varname(gv, '@', o->op_targ, Nullsv,
29489e7c
DM
922 SvIV(cSVOPx_sv(kid)), FUV_SUBSCRIPT_ARRAY);
923 ;
924 }
925 else {
926 /* index is an expression;
927 * attempt to find a match within the aggregate */
928 if (obase->op_type == OP_HELEM) {
53c1dcc0 929 SV * const keysv = S_find_hash_subscript(aTHX_ (HV*)sv, uninit_sv);
29489e7c 930 if (keysv)
be2ef075 931 return varname(gv, '%', o->op_targ,
29489e7c
DM
932 keysv, 0, FUV_SUBSCRIPT_HASH);
933 }
934 else {
f54cb97a 935 const I32 index = S_find_array_subscript(aTHX_ (AV*)sv, uninit_sv);
29489e7c 936 if (index >= 0)
be2ef075 937 return varname(gv, '@', o->op_targ,
29489e7c
DM
938 Nullsv, index, FUV_SUBSCRIPT_ARRAY);
939 }
940 if (match)
941 break;
1b6737cc 942 return varname(gv,
29489e7c 943 (o->op_type == OP_PADAV || o->op_type == OP_RV2AV)
be2ef075 944 ? '@' : '%',
29489e7c
DM
945 o->op_targ, Nullsv, 0, FUV_SUBSCRIPT_WITHIN);
946 }
947
948 break;
949
950 case OP_AASSIGN:
951 /* only examine RHS */
952 return find_uninit_var(cBINOPx(obase)->op_first, uninit_sv, match);
953
954 case OP_OPEN:
955 o = cUNOPx(obase)->op_first;
956 if (o->op_type == OP_PUSHMARK)
957 o = o->op_sibling;
958
959 if (!o->op_sibling) {
960 /* one-arg version of open is highly magical */
961
962 if (o->op_type == OP_GV) { /* open FOO; */
963 gv = cGVOPx_gv(o);
964 if (match && GvSV(gv) != uninit_sv)
965 break;
be2ef075 966 return varname(gv, '$', 0,
29489e7c
DM
967 Nullsv, 0, FUV_SUBSCRIPT_NONE);
968 }
969 /* other possibilities not handled are:
970 * open $x; or open my $x; should return '${*$x}'
971 * open expr; should return '$'.expr ideally
972 */
973 break;
974 }
975 goto do_op;
976
977 /* ops where $_ may be an implicit arg */
978 case OP_TRANS:
979 case OP_SUBST:
980 case OP_MATCH:
981 if ( !(obase->op_flags & OPf_STACKED)) {
982 if (uninit_sv == ((obase->op_private & OPpTARGET_MY)
983 ? PAD_SVl(obase->op_targ)
984 : DEFSV))
985 {
986 sv = sv_newmortal();
616d8c9c 987 sv_setpvn(sv, "$_", 2);
29489e7c
DM
988 return sv;
989 }
990 }
991 goto do_op;
992
993 case OP_PRTF:
994 case OP_PRINT:
995 /* skip filehandle as it can't produce 'undef' warning */
996 o = cUNOPx(obase)->op_first;
997 if ((obase->op_flags & OPf_STACKED) && o->op_type == OP_PUSHMARK)
998 o = o->op_sibling->op_sibling;
999 goto do_op2;
1000
1001
e21bd382 1002 case OP_RV2SV:
29489e7c
DM
1003 case OP_CUSTOM:
1004 case OP_ENTERSUB:
1005 match = 1; /* XS or custom code could trigger random warnings */
1006 goto do_op;
1007
1008 case OP_SCHOMP:
1009 case OP_CHOMP:
1010 if (SvROK(PL_rs) && uninit_sv == SvRV(PL_rs))
d0043bd1 1011 return sv_2mortal(newSVpvn("${$/}", 5));
29489e7c
DM
1012 /* FALL THROUGH */
1013
1014 default:
1015 do_op:
1016 if (!(obase->op_flags & OPf_KIDS))
1017 break;
1018 o = cUNOPx(obase)->op_first;
1019
1020 do_op2:
1021 if (!o)
1022 break;
1023
1024 /* if all except one arg are constant, or have no side-effects,
1025 * or are optimized away, then it's unambiguous */
1026 o2 = Nullop;
1027 for (kid=o; kid; kid = kid->op_sibling) {
1028 if (kid &&
1029 ( (kid->op_type == OP_CONST && SvOK(cSVOPx_sv(kid)))
1030 || (kid->op_type == OP_NULL && ! (kid->op_flags & OPf_KIDS))
1031 || (kid->op_type == OP_PUSHMARK)
1032 )
1033 )
1034 continue;
1035 if (o2) { /* more than one found */
1036 o2 = Nullop;
1037 break;
1038 }
1039 o2 = kid;
1040 }
1041 if (o2)
1042 return find_uninit_var(o2, uninit_sv, match);
1043
1044 /* scan all args */
1045 while (o) {
1046 sv = find_uninit_var(o, uninit_sv, 1);
1047 if (sv)
1048 return sv;
1049 o = o->op_sibling;
1050 }
1051 break;
1052 }
1053 return Nullsv;
1054}
1055
1056
645c22ef
DM
1057/*
1058=for apidoc report_uninit
1059
1060Print appropriate "Use of uninitialized variable" warning
1061
1062=cut
1063*/
1064
1d7c1841 1065void
29489e7c
DM
1066Perl_report_uninit(pTHX_ SV* uninit_sv)
1067{
1068 if (PL_op) {
112dcc46 1069 SV* varname = Nullsv;
29489e7c
DM
1070 if (uninit_sv) {
1071 varname = find_uninit_var(PL_op, uninit_sv,0);
1072 if (varname)
1073 sv_insert(varname, 0, 0, " ", 1);
1074 }
9014280d 1075 Perl_warner(aTHX_ packWARN(WARN_UNINITIALIZED), PL_warn_uninit,
93524f2b 1076 varname ? SvPV_nolen_const(varname) : "",
29489e7c
DM
1077 " in ", OP_DESC(PL_op));
1078 }
1d7c1841 1079 else
29489e7c
DM
1080 Perl_warner(aTHX_ packWARN(WARN_UNINITIALIZED), PL_warn_uninit,
1081 "", "", "");
1d7c1841
GS
1082}
1083
de042e1d 1084STATIC void *
e3bbdc67 1085S_more_bodies (pTHX_ void **arena_root, void **root, size_t size)
cac9b346 1086{
e3bbdc67
NC
1087 char *start;
1088 const char *end;
53c1dcc0 1089 const size_t count = PERL_ARENA_SIZE/size;
a02a5408 1090 Newx(start, count*size, char);
e3bbdc67
NC
1091 *((void **) start) = *arena_root;
1092 *arena_root = (void *)start;
cac9b346 1093
e3bbdc67 1094 end = start + (count-1) * size;
cac9b346 1095
e3bbdc67
NC
1096 /* The initial slot is used to link the arenas together, so it isn't to be
1097 linked into the list of ready-to-use bodies. */
cac9b346 1098
e3bbdc67 1099 start += size;
cac9b346 1100
e3bbdc67 1101 *root = (void *)start;
cac9b346 1102
e3bbdc67 1103 while (start < end) {
53c1dcc0 1104 char * const next = start + size;
e3bbdc67
NC
1105 *(void**) start = (void *)next;
1106 start = next;
cac9b346 1107 }
e3bbdc67 1108 *(void **)start = 0;
de042e1d
NC
1109
1110 return *root;
cac9b346
NC
1111}
1112
aeb18a1e 1113/* grab a new thing from the free list, allocating more if necessary */
645c22ef 1114
30f9da9e 1115/* 1st, the inline version */
08742458
NC
1116
/* Pop the first body off the free list headed by *root and store it in xpv,
 * calling S_more_bodies() to refill the list first when it is empty.
 * The whole operation runs between LOCK_SV_MUTEX and UNLOCK_SV_MUTEX. */
#define new_body_inline(xpv, arena_root, root, size) \
    STMT_START { \
        LOCK_SV_MUTEX; \
        xpv = *((void **)(root)); \
        if (!xpv) \
            xpv = S_more_bodies(aTHX_ arena_root, root, size); \
        *(root) = *(void**)(xpv); \
        UNLOCK_SV_MUTEX; \
    } STMT_END
1125
30f9da9e
JC
1126/* now use the inline version in the proper function */
1127
1128STATIC void *
1129S_new_body(pTHX_ void **arena_root, void **root, size_t size)
1130{
1131 void *xpv;
1132 new_body_inline(xpv, arena_root, root, size);
1133 return xpv;
1134}
1135
aeb18a1e 1136/* return a thing to the free list */
645c22ef 1137
cb4415b8
NC
/* Push the body `thing` back onto the free list headed by *root.
 * The first pointer-sized word of the body is overwritten with the old
 * list head.  Both arguments are parenthesised in the expansion so that
 * arbitrary expressions (e.g. "base + offset") can be passed safely.
 * Note that `root` is evaluated twice. */
#define del_body(thing, root) \
    STMT_START { \
        void **thing_copy = (void **)(thing); \
        LOCK_SV_MUTEX; \
        *thing_copy = *(root); \
        *(root) = (void*)thing_copy; \
        UNLOCK_SV_MUTEX; \
    } STMT_END
932e9ff9 1146
aeb18a1e
NC
1147/* Conventionally we simply malloc() a big block of memory, then divide it
1148 up into lots of the thing that we're allocating.
645c22ef 1149
aeb18a1e
NC
1150 This macro will expand to a call to S_new_body. So for XPVBM (with ithreads),
1151 it would become
932e9ff9 1152
aeb18a1e
NC
1153 S_new_body(my_perl, (void**)&(my_perl->Ixpvbm_arenaroot),
1154 (void**)&(my_perl->Ixpvbm_root), sizeof(XPVBM))
1155*/
645c22ef 1156
/* Allocate a body of sizeof(TYPE) bytes from the per-type arena whose
 * interpreter variables are PL_<lctype>_arenaroot and PL_<lctype>_root. */
#define new_body_type(TYPE,lctype) \
    S_new_body(aTHX_ (void**)&PL_ ## lctype ## _arenaroot, \
               (void**)&PL_ ## lctype ## _root, \
               sizeof(TYPE))

/* Return body `p` to the free list PL_<lctype>_root.  `p` is parenthesised
 * so that the cast applies to the whole argument expression. */
#define del_body_type(p,TYPE,lctype) \
    del_body((void*)(p), (void**)&PL_ ## lctype ## _root)
aeb18a1e
NC
1164
1165/* But for some types, we cheat. The type starts with some members that are
1166 never accessed. So we allocate the substructure, starting at the first used
1167 member, then adjust the pointer back in memory by the size of the bit not
1168 allocated, so it's as if we allocated the full structure.
1169 (But things will all go boom if you write to the part that is "not there",
1170 because you'll be overwriting the last members of the preceding structure
1171 in memory.)
1172
1173 We calculate the correction using the STRUCT_OFFSET macro. For example, if
1174 xpv_allocated is the same structure as XPV then the two OFFSETs sum to zero,
1175 and the pointer is unchanged. If the allocated structure is smaller (no
1176 initial NV actually allocated) then the net effect is to subtract the size
1177 of the NV from the pointer, to return a new pointer as if an initial NV were
1178 actually allocated.
1179
1180 This is the same trick as was used for NV and IV bodies. Ironically it
1181 doesn't need to be used for NV bodies any more, because NV is now at the
1182 start of the structure. IV bodies don't need it either, because they are
1183 no longer allocated. */
1184
/* Allocate only the <lctype>_allocated sub-structure, then shift the
 * returned pointer by the difference between `member`'s offset in TYPE and
 * its offset in <lctype>_allocated, so that the result can be used as if
 * it pointed at a full TYPE.  The expansion is fully parenthesised. */
#define new_body_allocated(TYPE,lctype,member) \
    ((void*)((char*)S_new_body(aTHX_ (void**)&PL_ ## lctype ## _arenaroot, \
                               (void**)&PL_ ## lctype ## _root, \
                               sizeof(lctype ## _allocated)) \
             - STRUCT_OFFSET(TYPE, member) \
             + STRUCT_OFFSET(lctype ## _allocated, member)))


/* Inverse of new_body_allocated(): undo the pointer adjustment and hand the
 * really-allocated address back to the free list.  `p` is parenthesised so
 * that the offset arithmetic is applied to the whole argument. */
#define del_body_allocated(p,TYPE,lctype,member) \
    del_body((void*)((char*)(p) + STRUCT_OFFSET(TYPE, member) \
                     - STRUCT_OFFSET(lctype ## _allocated, member)), \
             (void**)&PL_ ## lctype ## _root)
932e9ff9 1197
7bab3ede
MB
/* Thin casting wrappers around safemalloc()/safefree().  The argument of
 * my_safefree() and both expansions are parenthesised so that the casts
 * apply to the complete expression. */
#define my_safemalloc(s) ((void*)safemalloc(s))
#define my_safefree(p) safefree((char*)(p))
463ee0b2 1200
d33b2eba 1201#ifdef PURIFY
463ee0b2 1202
d33b2eba
GS
1203#define new_XNV() my_safemalloc(sizeof(XPVNV))
1204#define del_XNV(p) my_safefree(p)
463ee0b2 1205
d33b2eba
GS
1206#define new_XPV() my_safemalloc(sizeof(XPV))
1207#define del_XPV(p) my_safefree(p)
9b94d1dd 1208
d33b2eba
GS
1209#define new_XPVIV() my_safemalloc(sizeof(XPVIV))
1210#define del_XPVIV(p) my_safefree(p)
932e9ff9 1211
d33b2eba
GS
1212#define new_XPVNV() my_safemalloc(sizeof(XPVNV))
1213#define del_XPVNV(p) my_safefree(p)
932e9ff9 1214
d33b2eba
GS
1215#define new_XPVCV() my_safemalloc(sizeof(XPVCV))
1216#define del_XPVCV(p) my_safefree(p)
932e9ff9 1217
d33b2eba
GS
1218#define new_XPVAV() my_safemalloc(sizeof(XPVAV))
1219#define del_XPVAV(p) my_safefree(p)
1220
1221#define new_XPVHV() my_safemalloc(sizeof(XPVHV))
1222#define del_XPVHV(p) my_safefree(p)
1c846c1f 1223
d33b2eba
GS
1224#define new_XPVMG() my_safemalloc(sizeof(XPVMG))
1225#define del_XPVMG(p) my_safefree(p)
1226
727879eb
NC
1227#define new_XPVGV() my_safemalloc(sizeof(XPVGV))
1228#define del_XPVGV(p) my_safefree(p)
1229
d33b2eba
GS
1230#define new_XPVLV() my_safemalloc(sizeof(XPVLV))
1231#define del_XPVLV(p) my_safefree(p)
1232
1233#define new_XPVBM() my_safemalloc(sizeof(XPVBM))
1234#define del_XPVBM(p) my_safefree(p)
1235
1236#else /* !PURIFY */
1237
08742458 1238#define new_XNV() new_body_type(NV, xnv)
cb4415b8 1239#define del_XNV(p) del_body_type(p, NV, xnv)
9b94d1dd 1240
aeb18a1e
NC
1241#define new_XPV() new_body_allocated(XPV, xpv, xpv_cur)
1242#define del_XPV(p) del_body_allocated(p, XPV, xpv, xpv_cur)
d33b2eba 1243
aeb18a1e
NC
1244#define new_XPVIV() new_body_allocated(XPVIV, xpviv, xpv_cur)
1245#define del_XPVIV(p) del_body_allocated(p, XPVIV, xpviv, xpv_cur)
d33b2eba 1246
08742458 1247#define new_XPVNV() new_body_type(XPVNV, xpvnv)
cb4415b8 1248#define del_XPVNV(p) del_body_type(p, XPVNV, xpvnv)
d33b2eba 1249
08742458 1250#define new_XPVCV() new_body_type(XPVCV, xpvcv)
cb4415b8 1251#define del_XPVCV(p) del_body_type(p, XPVCV, xpvcv)
d33b2eba 1252
aeb18a1e
NC
1253#define new_XPVAV() new_body_allocated(XPVAV, xpvav, xav_fill)
1254#define del_XPVAV(p) del_body_allocated(p, XPVAV, xpvav, xav_fill)
d33b2eba 1255
aeb18a1e
NC
1256#define new_XPVHV() new_body_allocated(XPVHV, xpvhv, xhv_fill)
1257#define del_XPVHV(p) del_body_allocated(p, XPVHV, xpvhv, xhv_fill)
1c846c1f 1258
08742458 1259#define new_XPVMG() new_body_type(XPVMG, xpvmg)
cb4415b8 1260#define del_XPVMG(p) del_body_type(p, XPVMG, xpvmg)
d33b2eba 1261
08742458 1262#define new_XPVGV() new_body_type(XPVGV, xpvgv)
cb4415b8 1263#define del_XPVGV(p) del_body_type(p, XPVGV, xpvgv)
727879eb 1264
08742458 1265#define new_XPVLV() new_body_type(XPVLV, xpvlv)
cb4415b8 1266#define del_XPVLV(p) del_body_type(p, XPVLV, xpvlv)
d33b2eba 1267
08742458 1268#define new_XPVBM() new_body_type(XPVBM, xpvbm)
cb4415b8 1269#define del_XPVBM(p) del_body_type(p, XPVBM, xpvbm)
d33b2eba
GS
1270
1271#endif /* PURIFY */
9b94d1dd 1272
d33b2eba
GS
1273#define new_XPVFM() my_safemalloc(sizeof(XPVFM))
1274#define del_XPVFM(p) my_safefree(p)
1c846c1f 1275
d33b2eba
GS
1276#define new_XPVIO() my_safemalloc(sizeof(XPVIO))
1277#define del_XPVIO(p) my_safefree(p)
8990e307 1278
954c1994
GS
1279/*
1280=for apidoc sv_upgrade
1281
ff276b08 1282Upgrade an SV to a more complex form. Generally adds a new body type to the
645c22ef 1283SV, then copies across as much information as possible from the old body.
ff276b08 1284You generally want to use the C<SvUPGRADE> macro wrapper. See also C<svtype>.
954c1994
GS
1285
1286=cut
1287*/
1288
63f97190 1289void
864dbfa3 1290Perl_sv_upgrade(pTHX_ register SV *sv, U32 mt)
79072805 1291{
9a085840 1292 void** old_body_arena;
878cc751 1293 size_t old_body_offset;
4cbc76b1 1294 size_t old_body_length; /* Well, the length to copy. */
878cc751 1295 void* old_body;
16b305e3
NC
1296#ifndef NV_ZERO_IS_ALLBITS_ZERO
1297 /* If NV 0.0 is store as all bits 0 then Zero() already creates a correct
1298 0.0 for us. */
4cbc76b1 1299 bool zero_nv = TRUE;
16b305e3 1300#endif
403d36eb
NC
1301 void* new_body;
1302 size_t new_body_length;
1303 size_t new_body_offset;
1304 void** new_body_arena;
1305 void** new_body_arenaroot;
53c1dcc0 1306 const U32 old_type = SvTYPE(sv);
79072805 1307
765f542d
NC
1308 if (mt != SVt_PV && SvIsCOW(sv)) {
1309 sv_force_normal_flags(sv, 0);
f130fd45
NIS
1310 }
1311
79072805 1312 if (SvTYPE(sv) == mt)
63f97190 1313 return;
79072805 1314
f5282e15 1315 if (SvTYPE(sv) > mt)
921edb34
RGS
1316 Perl_croak(aTHX_ "sv_upgrade from type %d down to type %d",
1317 (int)SvTYPE(sv), (int)mt);
f5282e15 1318
d2e56290 1319
878cc751
NC
1320 old_body = SvANY(sv);
1321 old_body_arena = 0;
1322 old_body_offset = 0;
4cbc76b1 1323 old_body_length = 0;
403d36eb
NC
1324 new_body_offset = 0;
1325 new_body_length = ~0;
1326
1327 /* Copying structures onto other structures that have been neatly zeroed
1328 has a subtle gotcha. Consider XPVMG
1329
1330 +------+------+------+------+------+-------+-------+
1331 | NV | CUR | LEN | IV | MAGIC | STASH |
1332 +------+------+------+------+------+-------+-------+
1333 0 4 8 12 16 20 24 28
1334
1335 where NVs are aligned to 8 bytes, so that sizeof that structure is
1336 actually 32 bytes long, with 4 bytes of padding at the end:
1337
1338 +------+------+------+------+------+-------+-------+------+
1339 | NV | CUR | LEN | IV | MAGIC | STASH | ??? |
1340 +------+------+------+------+------+-------+-------+------+
1341 0 4 8 12 16 20 24 28 32
1342
1343 so what happens if you allocate memory for this structure:
1344
1345 +------+------+------+------+------+-------+-------+------+------+...
1346 | NV | CUR | LEN | IV | MAGIC | STASH | GP | NAME |
1347 +------+------+------+------+------+-------+-------+------+------+...
1348 0 4 8 12 16 20 24 28 32 36
1349
1350 zero it, then copy sizeof(XPVMG) bytes on top of it? Not quite what you
1351 expect, because you copy the area marked ??? onto GP. Now, ??? may have
1352 started out as zero once, but it's quite possible that it isn't. So now,
1353 rather than a nicely zeroed GP, you have it pointing somewhere random.
1354 Bugs ensue.
1355
1356 (In fact, GP ends up pointing at a previous GP structure, because the
1357 principle cause of the padding in XPVMG getting garbage is a copy of
1358 sizeof(XPVMG) bytes from a XPVGV structure in sv_unglob)
1359
1360 So we are careful and work out the size of used parts of all the
1361 structures. */
878cc751 1362
79072805
LW
1363 switch (SvTYPE(sv)) {
1364 case SVt_NULL:
79072805 1365 break;
79072805 1366 case SVt_IV:
ed6116ce 1367 if (mt == SVt_NV)
463ee0b2 1368 mt = SVt_PVNV;
ed6116ce
LW
1369 else if (mt < SVt_PVIV)
1370 mt = SVt_PVIV;
4cbc76b1
NC
1371 old_body_offset = STRUCT_OFFSET(XPVIV, xiv_iv);
1372 old_body_length = sizeof(IV);
79072805
LW
1373 break;
1374 case SVt_NV:
9a085840 1375 old_body_arena = (void **) &PL_xnv_root;
4cbc76b1 1376 old_body_length = sizeof(NV);
16b305e3 1377#ifndef NV_ZERO_IS_ALLBITS_ZERO
4cbc76b1 1378 zero_nv = FALSE;
16b305e3 1379#endif
ed6116ce 1380 if (mt < SVt_PVNV)
79072805
LW
1381 mt = SVt_PVNV;
1382 break;
ed6116ce 1383 case SVt_RV:
ed6116ce 1384 break;
79072805 1385 case SVt_PV:
9a085840 1386 old_body_arena = (void **) &PL_xpv_root;
878cc751
NC
1387 old_body_offset = STRUCT_OFFSET(XPV, xpv_cur)
1388 - STRUCT_OFFSET(xpv_allocated, xpv_cur);
403d36eb
NC
1389 old_body_length = STRUCT_OFFSET(XPV, xpv_len)
1390 + sizeof (((XPV*)SvANY(sv))->xpv_len)
1391 - old_body_offset;
748a9306
LW
1392 if (mt <= SVt_IV)
1393 mt = SVt_PVIV;
1394 else if (mt == SVt_NV)
1395 mt = SVt_PVNV;
79072805
LW
1396 break;
1397 case SVt_PVIV:
9a085840 1398 old_body_arena = (void **) &PL_xpviv_root;
878cc751
NC
1399 old_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur)
1400 - STRUCT_OFFSET(xpviv_allocated, xpv_cur);
403d36eb
NC
1401 old_body_length = STRUCT_OFFSET(XPVIV, xiv_u)
1402 + sizeof (((XPVIV*)SvANY(sv))->xiv_u)
1403 - old_body_offset;
79072805
LW
1404 break;
1405 case SVt_PVNV:
9a085840 1406 old_body_arena = (void **) &PL_xpvnv_root;
403d36eb
NC
1407 old_body_length = STRUCT_OFFSET(XPVNV, xiv_u)
1408 + sizeof (((XPVNV*)SvANY(sv))->xiv_u);
16b305e3 1409#ifndef NV_ZERO_IS_ALLBITS_ZERO
4cbc76b1 1410 zero_nv = FALSE;
16b305e3 1411#endif
79072805
LW
1412 break;
1413 case SVt_PVMG:
0ec50a73
NC
1414 /* Because the XPVMG of PL_mess_sv isn't allocated from the arena,
1415 there's no way that it can be safely upgraded, because perl.c
1416 expects to Safefree(SvANY(PL_mess_sv)) */
1417 assert(sv != PL_mess_sv);
bce8f412
NC
1418 /* This flag bit is used to mean other things in other scalar types.
1419 Given that it only has meaning inside the pad, it shouldn't be set
1420 on anything that can get upgraded. */
1421 assert((SvFLAGS(sv) & SVpad_TYPED) == 0);
9a085840 1422 old_body_arena = (void **) &PL_xpvmg_root;
403d36eb
NC
1423 old_body_length = STRUCT_OFFSET(XPVMG, xmg_stash)
1424 + sizeof (((XPVMG*)SvANY(sv))->xmg_stash);
16b305e3 1425#ifndef NV_ZERO_IS_ALLBITS_ZERO
4cbc76b1 1426 zero_nv = FALSE;
16b305e3 1427#endif
79072805
LW
1428 break;
1429 default:
cea2e8a9 1430 Perl_croak(aTHX_ "Can't upgrade that kind of scalar");
79072805
LW
1431 }
1432
ffb05e06
NC
1433 SvFLAGS(sv) &= ~SVTYPEMASK;
1434 SvFLAGS(sv) |= mt;
1435
79072805
LW
1436 switch (mt) {
1437 case SVt_NULL:
cea2e8a9 1438 Perl_croak(aTHX_ "Can't upgrade to undef");
79072805 1439 case SVt_IV:
4cbc76b1 1440 assert(old_type == SVt_NULL);
339049b0 1441 SvANY(sv) = (XPVIV*)((char*)&(sv->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
403d36eb 1442 SvIV_set(sv, 0);
85274cbc 1443 return;
79072805 1444 case SVt_NV:
4cbc76b1 1445 assert(old_type == SVt_NULL);
79072805 1446 SvANY(sv) = new_XNV();
403d36eb 1447 SvNV_set(sv, 0);
85274cbc 1448 return;
ed6116ce 1449 case SVt_RV:
4cbc76b1 1450 assert(old_type == SVt_NULL);
339049b0 1451 SvANY(sv) = &sv->sv_u.svu_rv;
403d36eb 1452 SvRV_set(sv, 0);
85274cbc 1453 return;
79072805
LW
1454 case SVt_PVHV:
1455 SvANY(sv) = new_XPVHV();
463ee0b2
LW
1456 HvFILL(sv) = 0;
1457 HvMAX(sv) = 0;
8aacddc1 1458 HvTOTALKEYS(sv) = 0;
bd4b1eb5 1459
2068cd4d
NC
1460 goto hv_av_common;
1461
1462 case SVt_PVAV:
1463 SvANY(sv) = new_XPVAV();
1464 AvMAX(sv) = -1;
1465 AvFILLp(sv) = -1;
1466 AvALLOC(sv) = 0;
1467 AvREAL_only(sv);
1468
1469 hv_av_common:
1470 /* SVt_NULL isn't the only thing upgraded to AV or HV.
1471 The target created by newSVrv also is, and it can have magic.
1472 However, it never has SvPVX set.
1473 */
1474 if (old_type >= SVt_RV) {
1475 assert(SvPVX_const(sv) == 0);
8bd4d4c5 1476 }
2068cd4d
NC
1477
1478 /* Could put this in the else clause below, as PVMG must have SvPVX
1479 0 already (the assertion above) */
bd4b1eb5 1480 SvPV_set(sv, (char*)0);
2068cd4d
NC
1481
1482 if (old_type >= SVt_PVMG) {
1483 SvMAGIC_set(sv, ((XPVMG*)old_body)->xmg_magic);
1484 SvSTASH_set(sv, ((XPVMG*)old_body)->xmg_stash);
1485 } else {
1486 SvMAGIC_set(sv, 0);
1487 SvSTASH_set(sv, 0);
1488 }
79072805 1489 break;
bd4b1eb5
NC
1490
1491 case SVt_PVIO:
403d36eb
NC
1492 new_body = new_XPVIO();
1493 new_body_length = sizeof(XPVIO);
1494 goto zero;
bd4b1eb5 1495 case SVt_PVFM:
403d36eb
NC
1496 new_body = new_XPVFM();
1497 new_body_length = sizeof(XPVFM);
1498 goto zero;
1499
bd4b1eb5 1500 case SVt_PVBM:
403d36eb
NC
1501 new_body_length = sizeof(XPVBM);
1502 new_body_arena = (void **) &PL_xpvbm_root;
1503 new_body_arenaroot = (void **) &PL_xpvbm_arenaroot;
1504 goto new_body;
bd4b1eb5 1505 case SVt_PVGV:
403d36eb
NC
1506 new_body_length = sizeof(XPVGV);
1507 new_body_arena = (void **) &PL_xpvgv_root;
1508 new_body_arenaroot = (void **) &PL_xpvgv_arenaroot;
1509 goto new_body;
79072805 1510 case SVt_PVCV:
403d36eb
NC
1511 new_body_length = sizeof(XPVCV);
1512 new_body_arena = (void **) &PL_xpvcv_root;
1513 new_body_arenaroot = (void **) &PL_xpvcv_arenaroot;
1514 goto new_body;
bd4b1eb5 1515 case SVt_PVLV:
403d36eb
NC
1516 new_body_length = sizeof(XPVLV);
1517 new_body_arena = (void **) &PL_xpvlv_root;
1518 new_body_arenaroot = (void **) &PL_xpvlv_arenaroot;
1519 goto new_body;
1520 case SVt_PVMG:
1521 new_body_length = sizeof(XPVMG);
1522 new_body_arena = (void **) &PL_xpvmg_root;
1523 new_body_arenaroot = (void **) &PL_xpvmg_arenaroot;
1524 goto new_body;
1525 case SVt_PVNV:
1526 new_body_length = sizeof(XPVNV);
1527 new_body_arena = (void **) &PL_xpvnv_root;
1528 new_body_arenaroot = (void **) &PL_xpvnv_arenaroot;
1529 goto new_body;
1530 case SVt_PVIV:
1531 new_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur)
1532 - STRUCT_OFFSET(xpviv_allocated, xpv_cur);
1533 new_body_length = sizeof(XPVIV) - new_body_offset;
1534 new_body_arena = (void **) &PL_xpviv_root;
1535 new_body_arenaroot = (void **) &PL_xpviv_arenaroot;
1536 /* XXX Is this still needed? Was it ever needed? Surely as there is
1537 no route from NV to PVIV, NOK can never be true */
1538 if (SvNIOK(sv))
1539 (void)SvIOK_on(sv);
1540 SvNOK_off(sv);
1541 goto new_body_no_NV;
1542 case SVt_PV:
1543 new_body_offset = STRUCT_OFFSET(XPV, xpv_cur)
1544 - STRUCT_OFFSET(xpv_allocated, xpv_cur);
1545 new_body_length = sizeof(XPV) - new_body_offset;
1546 new_body_arena = (void **) &PL_xpv_root;
1547 new_body_arenaroot = (void **) &PL_xpv_arenaroot;
1548 new_body_no_NV:
1549 /* PV and PVIV don't have an NV slot. */
16b305e3 1550#ifndef NV_ZERO_IS_ALLBITS_ZERO
403d36eb 1551 zero_nv = FALSE;
16b305e3 1552#endif
403d36eb 1553
16b305e3
NC
1554 new_body:
1555 assert(new_body_length);
403d36eb 1556#ifndef PURIFY
16b305e3 1557 /* This points to the start of the allocated area. */
08742458
NC
1558 new_body_inline(new_body, new_body_arenaroot, new_body_arena,
1559 new_body_length);
403d36eb 1560#else
16b305e3
NC
1561 /* We always allocated the full length item with PURIFY */
1562 new_body_length += new_body_offset;
1563 new_body_offset = 0;
1564 new_body = my_safemalloc(new_body_length);
403d36eb
NC
1565
1566#endif
16b305e3
NC
1567 zero:
1568 Zero(new_body, new_body_length, char);
1569 new_body = ((char *)new_body) - new_body_offset;
1570 SvANY(sv) = new_body;
1571
1572 if (old_body_length) {
1573 Copy((char *)old_body + old_body_offset,
1574 (char *)new_body + old_body_offset,
1575 old_body_length, char);
1576 }
403d36eb 1577
16b305e3
NC
1578#ifndef NV_ZERO_IS_ALLBITS_ZERO
1579 if (zero_nv)
1580 SvNV_set(sv, 0);
1581#endif
403d36eb 1582
16b305e3
NC
1583 if (mt == SVt_PVIO)
1584 IoPAGE_LEN(sv) = 60;
1585 if (old_type < SVt_RV)
1586 SvPV_set(sv, 0);
8990e307 1587 break;
403d36eb
NC
1588 default:
1589 Perl_croak(aTHX_ "panic: sv_upgrade to unknown type %lu", mt);
8990e307 1590 }
878cc751
NC
1591
1592
1593 if (old_body_arena) {
1594#ifdef PURIFY
ee6954bb 1595 my_safefree(old_body);
878cc751 1596#else
cb4415b8
NC
1597 del_body((void*)((char*)old_body + old_body_offset),
1598 old_body_arena);
878cc751 1599#endif
2068cd4d 1600 }
79072805
LW
1601}
1602
645c22ef
DM
1603/*
1604=for apidoc sv_backoff
1605
1606Remove any string offset. You should normally use the C<SvOOK_off> macro
1607wrapper instead.
1608
1609=cut
1610*/
1611
79072805 1612int
864dbfa3 1613Perl_sv_backoff(pTHX_ register SV *sv)
79072805
LW
1614{
1615 assert(SvOOK(sv));
b79f7545
NC
1616 assert(SvTYPE(sv) != SVt_PVHV);
1617 assert(SvTYPE(sv) != SVt_PVAV);
463ee0b2 1618 if (SvIVX(sv)) {
53c1dcc0 1619 const char * const s = SvPVX_const(sv);
b162af07 1620 SvLEN_set(sv, SvLEN(sv) + SvIVX(sv));
f880fe2f 1621 SvPV_set(sv, SvPVX(sv) - SvIVX(sv));
79072805 1622 SvIV_set(sv, 0);
463ee0b2 1623 Move(s, SvPVX(sv), SvCUR(sv)+1, char);
79072805
LW
1624 }
1625 SvFLAGS(sv) &= ~SVf_OOK;
a0d0e21e 1626 return 0;
79072805
LW
1627}
1628
954c1994
GS
1629/*
1630=for apidoc sv_grow
1631
645c22ef
DM
1632Expands the character buffer in the SV. If necessary, uses C<sv_unref> and
1633upgrades the SV to C<SVt_PV>. Returns a pointer to the character buffer.
1634Use the C<SvGROW> wrapper instead.
954c1994
GS
1635
1636=cut
1637*/
1638
79072805 1639char *
864dbfa3 1640Perl_sv_grow(pTHX_ register SV *sv, register STRLEN newlen)
79072805
LW
1641{
1642 register char *s;
1643
55497cff 1644#ifdef HAS_64K_LIMIT
79072805 1645 if (newlen >= 0x10000) {
1d7c1841
GS
1646 PerlIO_printf(Perl_debug_log,
1647 "Allocation too large: %"UVxf"\n", (UV)newlen);
79072805
LW
1648 my_exit(1);
1649 }
55497cff 1650#endif /* HAS_64K_LIMIT */
a0d0e21e
LW
1651 if (SvROK(sv))
1652 sv_unref(sv);
79072805
LW
1653 if (SvTYPE(sv) < SVt_PV) {
1654 sv_upgrade(sv, SVt_PV);
93524f2b 1655 s = SvPVX_mutable(sv);
79072805
LW
1656 }
1657 else if (SvOOK(sv)) { /* pv is offset? */
1658 sv_backoff(sv);
93524f2b 1659 s = SvPVX_mutable(sv);
79072805
LW
1660 if (newlen > SvLEN(sv))
1661 newlen += 10 * (newlen - SvCUR(sv)); /* avoid copy each time */
c6f8c383
GA
1662#ifdef HAS_64K_LIMIT
1663 if (newlen >= 0x10000)
1664 newlen = 0xFFFF;
1665#endif
79072805 1666 }
bc44a8a2 1667 else
4d84ee25 1668 s = SvPVX_mutable(sv);
54f0641b 1669
79072805 1670 if (newlen > SvLEN(sv)) { /* need more room? */
7a9b70e9 1671 newlen = PERL_STRLEN_ROUNDUP(newlen);
8d6dde3e 1672 if (SvLEN(sv) && s) {
7bab3ede 1673#ifdef MYMALLOC
93524f2b 1674 const STRLEN l = malloced_size((void*)SvPVX_const(sv));
8d6dde3e
IZ
1675 if (newlen <= l) {
1676 SvLEN_set(sv, l);
1677 return s;
1678 } else
c70c8a0a 1679#endif
1936d2a7 1680 s = saferealloc(s, newlen);
8d6dde3e 1681 }
bfed75c6 1682 else {
1936d2a7 1683 s = safemalloc(newlen);
3f7c398e
SP
1684 if (SvPVX_const(sv) && SvCUR(sv)) {
1685 Move(SvPVX_const(sv), s, (newlen < SvCUR(sv)) ? newlen : SvCUR(sv), char);
40565179 1686 }
4e83176d 1687 }
79072805 1688 SvPV_set(sv, s);
e1ec3a88 1689 SvLEN_set(sv, newlen);
79072805
LW
1690 }
1691 return s;
1692}
1693
954c1994
GS
1694/*
1695=for apidoc sv_setiv
1696
645c22ef
DM
1697Copies an integer into the given SV, upgrading first if necessary.
1698Does not handle 'set' magic. See also C<sv_setiv_mg>.
954c1994
GS
1699
1700=cut
1701*/
1702
79072805 1703void
864dbfa3 1704Perl_sv_setiv(pTHX_ register SV *sv, IV i)
79072805 1705{
765f542d 1706 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2
LW
1707 switch (SvTYPE(sv)) {
1708 case SVt_NULL:
79072805 1709 sv_upgrade(sv, SVt_IV);
463ee0b2
LW
1710 break;
1711 case SVt_NV:
1712 sv_upgrade(sv, SVt_PVNV);
1713 break;
ed6116ce 1714 case SVt_RV:
463ee0b2 1715 case SVt_PV:
79072805 1716 sv_upgrade(sv, SVt_PVIV);
463ee0b2 1717 break;
a0d0e21e
LW
1718
1719 case SVt_PVGV:
a0d0e21e
LW
1720 case SVt_PVAV:
1721 case SVt_PVHV:
1722 case SVt_PVCV:
1723 case SVt_PVFM:
1724 case SVt_PVIO:
411caa50 1725 Perl_croak(aTHX_ "Can't coerce %s to integer in %s", sv_reftype(sv,0),
53e06cf0 1726 OP_DESC(PL_op));
463ee0b2 1727 }
a0d0e21e 1728 (void)SvIOK_only(sv); /* validate number */
45977657 1729 SvIV_set(sv, i);
463ee0b2 1730 SvTAINT(sv);
79072805
LW
1731}
1732
954c1994
GS
1733/*
1734=for apidoc sv_setiv_mg
1735
1736Like C<sv_setiv>, but also handles 'set' magic.
1737
1738=cut
1739*/
1740
79072805 1741void
864dbfa3 1742Perl_sv_setiv_mg(pTHX_ register SV *sv, IV i)
ef50df4b
GS
1743{
1744 sv_setiv(sv,i);
1745 SvSETMAGIC(sv);
1746}
1747
954c1994
GS
1748/*
1749=for apidoc sv_setuv
1750
645c22ef
DM
1751Copies an unsigned integer into the given SV, upgrading first if necessary.
1752Does not handle 'set' magic. See also C<sv_setuv_mg>.
954c1994
GS
1753
1754=cut
1755*/
1756
ef50df4b 1757void
864dbfa3 1758Perl_sv_setuv(pTHX_ register SV *sv, UV u)
55497cff 1759{
55ada374
NC
1760 /* With these two if statements:
1761 u=1.49 s=0.52 cu=72.49 cs=10.64 scripts=270 tests=20865
d460ef45 1762
55ada374
NC
1763 without
1764 u=1.35 s=0.47 cu=73.45 cs=11.43 scripts=270 tests=20865
d460ef45 1765
55ada374
NC
1766 If you wish to remove them, please benchmark to see what the effect is
1767 */
28e5dec8
JH
1768 if (u <= (UV)IV_MAX) {
1769 sv_setiv(sv, (IV)u);
1770 return;
1771 }
25da4f38
IZ
1772 sv_setiv(sv, 0);
1773 SvIsUV_on(sv);
607fa7f2 1774 SvUV_set(sv, u);
55497cff 1775}
1776
954c1994
GS
1777/*
1778=for apidoc sv_setuv_mg
1779
1780Like C<sv_setuv>, but also handles 'set' magic.
1781
1782=cut
1783*/
1784
55497cff 1785void
864dbfa3 1786Perl_sv_setuv_mg(pTHX_ register SV *sv, UV u)
ef50df4b 1787{
aa0f650e
NC
1788 sv_setiv(sv, 0);
1789 SvIsUV_on(sv);
1790 sv_setuv(sv,u);
ef50df4b
GS
1791 SvSETMAGIC(sv);
1792}
1793
954c1994
GS
1794/*
1795=for apidoc sv_setnv
1796
645c22ef
DM
1797Copies a double into the given SV, upgrading first if necessary.
1798Does not handle 'set' magic. See also C<sv_setnv_mg>.
954c1994
GS
1799
1800=cut
1801*/
1802
ef50df4b 1803void
65202027 1804Perl_sv_setnv(pTHX_ register SV *sv, NV num)
79072805 1805{
765f542d 1806 SV_CHECK_THINKFIRST_COW_DROP(sv);
a0d0e21e
LW
1807 switch (SvTYPE(sv)) {
1808 case SVt_NULL:
1809 case SVt_IV:
79072805 1810 sv_upgrade(sv, SVt_NV);
a0d0e21e 1811 break;
a0d0e21e
LW
1812 case SVt_RV:
1813 case SVt_PV:
1814 case SVt_PVIV:
79072805 1815 sv_upgrade(sv, SVt_PVNV);
a0d0e21e 1816 break;
827b7e14 1817
a0d0e21e 1818 case SVt_PVGV:
a0d0e21e
LW
1819 case SVt_PVAV:
1820 case SVt_PVHV:
1821 case SVt_PVCV:
1822 case SVt_PVFM:
1823 case SVt_PVIO:
411caa50 1824 Perl_croak(aTHX_ "Can't coerce %s to number in %s", sv_reftype(sv,0),
53e06cf0 1825 OP_NAME(PL_op));
79072805 1826 }
9d6ce603 1827 SvNV_set(sv, num);
a0d0e21e 1828 (void)SvNOK_only(sv); /* validate number */
463ee0b2 1829 SvTAINT(sv);
79072805
LW
1830}
1831
954c1994
GS
1832/*
1833=for apidoc sv_setnv_mg
1834
1835Like C<sv_setnv>, but also handles 'set' magic.
1836
1837=cut
1838*/
1839
ef50df4b 1840void
65202027 1841Perl_sv_setnv_mg(pTHX_ register SV *sv, NV num)
ef50df4b
GS
1842{
1843 sv_setnv(sv,num);
1844 SvSETMAGIC(sv);
1845}
1846
645c22ef
DM
1847/* Print an "isn't numeric" warning, using a cleaned-up,
1848 * printable version of the offending string
1849 */
1850
76e3520e 1851STATIC void
cea2e8a9 1852S_not_a_number(pTHX_ SV *sv)
a0d0e21e 1853{
94463019
JH
1854 SV *dsv;
1855 char tmpbuf[64];
1b6737cc 1856 const char *pv;
94463019
JH
1857
1858 if (DO_UTF8(sv)) {
d0043bd1 1859 dsv = sv_2mortal(newSVpvn("", 0));
94463019
JH
1860 pv = sv_uni_display(dsv, sv, 10, 0);
1861 } else {
1862 char *d = tmpbuf;
1863 char *limit = tmpbuf + sizeof(tmpbuf) - 8;
1864 /* each *s can expand to 4 chars + "...\0",
1865 i.e. need room for 8 chars */
ecdeb87c 1866
e62f0680
NC
1867 const char *s, *end;
1868 for (s = SvPVX_const(sv), end = s + SvCUR(sv); s < end && d < limit;
1869 s++) {
94463019
JH
1870 int ch = *s & 0xFF;
1871 if (ch & 128 && !isPRINT_LC(ch)) {
1872 *d++ = 'M';
1873 *d++ = '-';
1874 ch &= 127;
1875 }
1876 if (ch == '\n') {
1877 *d++ = '\\';
1878 *d++ = 'n';
1879 }
1880 else if (ch == '\r') {
1881 *d++ = '\\';
1882 *d++ = 'r';
1883 }
1884 else if (ch == '\f') {
1885 *d++ = '\\';
1886 *d++ = 'f';
1887 }
1888 else if (ch == '\\') {
1889 *d++ = '\\';
1890 *d++ = '\\';
1891 }
1892 else if (ch == '\0') {
1893 *d++ = '\\';
1894 *d++ = '0';
1895 }
1896 else if (isPRINT_LC(ch))
1897 *d++ = ch;
1898 else {
1899 *d++ = '^';
1900 *d++ = toCTRL(ch);
1901 }
1902 }
1903 if (s < end) {
1904 *d++ = '.';
1905 *d++ = '.';
1906 *d++ = '.';
1907 }
1908 *d = '\0';
1909 pv = tmpbuf;
a0d0e21e 1910 }
a0d0e21e 1911
533c011a 1912 if (PL_op)
9014280d 1913 Perl_warner(aTHX_ packWARN(WARN_NUMERIC),
94463019
JH
1914 "Argument \"%s\" isn't numeric in %s", pv,
1915 OP_DESC(PL_op));
a0d0e21e 1916 else
9014280d 1917 Perl_warner(aTHX_ packWARN(WARN_NUMERIC),
94463019 1918 "Argument \"%s\" isn't numeric", pv);
a0d0e21e
LW
1919}
1920
c2988b20
NC
1921/*
1922=for apidoc looks_like_number
1923
645c22ef
DM
1924Test if the content of an SV looks like a number (or is a number).
1925C<Inf> and C<Infinity> are treated as numbers (so will not issue a
1926non-numeric warning), even if your atof() doesn't grok them.
c2988b20
NC
1927
1928=cut
1929*/
1930
1931I32
1932Perl_looks_like_number(pTHX_ SV *sv)
1933{
a3b680e6 1934 register const char *sbegin;
c2988b20
NC
1935 STRLEN len;
1936
1937 if (SvPOK(sv)) {
3f7c398e 1938 sbegin = SvPVX_const(sv);
c2988b20
NC
1939 len = SvCUR(sv);
1940 }
1941 else if (SvPOKp(sv))
83003860 1942 sbegin = SvPV_const(sv, len);
c2988b20 1943 else
e0ab1c0e 1944 return SvFLAGS(sv) & (SVf_NOK|SVp_NOK|SVf_IOK|SVp_IOK);
c2988b20
NC
1945 return grok_number(sbegin, len, NULL);
1946}
25da4f38
IZ
1947
1948/* Actually, ISO C leaves conversion of UV to IV undefined, but
1949 until proven guilty, assume that things are not that bad... */
1950
645c22ef
DM
1951/*
1952 NV_PRESERVES_UV:
1953
1954 As 64 bit platforms often have an NV that doesn't preserve all bits of
28e5dec8
JH
1955 an IV (an assumption perl has been based on to date) it becomes necessary
1956 to remove the assumption that the NV always carries enough precision to
1957 recreate the IV whenever needed, and that the NV is the canonical form.
1958 Instead, IV/UV and NV need to be given equal rights. So as to not lose
645c22ef 1959 precision as a side effect of conversion (which would lead to insanity
28e5dec8
JH
1960 and the dragon(s) in t/op/numconvert.t getting very angry) the intent is
1961 1) to distinguish between IV/UV/NV slots that have cached a valid
1962 conversion where precision was lost and IV/UV/NV slots that have a
1963 valid conversion which has lost no precision
645c22ef 1964 2) to ensure that if a numeric conversion to one form is requested that
28e5dec8
JH
1965 would lose precision, the precise conversion (or differently
1966 imprecise conversion) is also performed and cached, to prevent
1967 requests for different numeric formats on the same SV causing
1968 lossy conversion chains. (lossless conversion chains are perfectly
1969 acceptable (still))
1970
1971
1972 flags are used:
1973 SvIOKp is true if the IV slot contains a valid value
1974 SvIOK is true only if the IV value is accurate (UV if SvIOK_UV true)
1975 SvNOKp is true if the NV slot contains a valid value
1976 SvNOK is true only if the NV value is accurate
1977
1978 so
645c22ef 1979 while converting from PV to NV, check to see if converting that NV to an
28e5dec8
JH
1980 IV(or UV) would lose accuracy over a direct conversion from PV to
1981 IV(or UV). If it would, cache both conversions, return NV, but mark
1982 SV as IOK NOKp (ie not NOK).
1983
645c22ef 1984 While converting from PV to IV, check to see if converting that IV to an
28e5dec8
JH
1985 NV would lose accuracy over a direct conversion from PV to NV. If it
1986 would, cache both conversions, flag similarly.
1987
1988 Before, the SV value "3.2" could become NV=3.2 IV=3 NOK, IOK quite
1989 correctly because if IV & NV were set NV *always* overruled.
645c22ef
DM
1990 Now, "3.2" will become NV=3.2 IV=3 NOK, IOKp, because the flag's meaning
1991 changes - now IV and NV together means that the two are interchangeable:
28e5dec8 1992 SvIVX == (IV) SvNVX && SvNVX == (NV) SvIVX;
d460ef45 1993
645c22ef
DM
1994 The benefit of this is that operations such as pp_add know that if
1995 SvIOK is true for both left and right operands, then integer addition
1996 can be used instead of floating point (for cases where the result won't
1997 overflow). Before, floating point was always used, which could lead to
28e5dec8
JH
1998 loss of precision compared with integer addition.
1999
2000 * making IV and NV equal status should make maths accurate on 64 bit
2001 platforms
2002 * may speed up maths somewhat if pp_add and friends start to use
645c22ef 2003 integers when possible instead of fp. (Hopefully the overhead in
28e5dec8
JH
2004 looking for SvIOK and checking for overflow will not outweigh the
2005 fp to integer speedup)
2006 * will slow down integer operations (callers of SvIV) on "inaccurate"
2007 values, as the change from SvIOK to SvIOKp will cause a call into
2008 sv_2iv each time rather than a macro access direct to the IV slot
2009 * should speed up number->string conversion on integers as IV is
645c22ef 2010 favoured when IV and NV are equally accurate
28e5dec8
JH
2011
2012 ####################################################################
645c22ef
DM
2013 You had better be using SvIOK_notUV if you want an IV for arithmetic:
2014 SvIOK is true if (IV or UV), so you might be getting (IV)SvUV.
2015 On the other hand, SvUOK is true iff UV.
28e5dec8
JH
2016 ####################################################################
2017
645c22ef 2018 Your mileage will vary depending on your CPU's relative fp to integer
28e5dec8
JH
2019 performance ratio.
2020*/
2021
2022#ifndef NV_PRESERVES_UV
645c22ef
DM
2023# define IS_NUMBER_UNDERFLOW_IV 1
2024# define IS_NUMBER_UNDERFLOW_UV 2
2025# define IS_NUMBER_IV_AND_UV 2
2026# define IS_NUMBER_OVERFLOW_IV 4
2027# define IS_NUMBER_OVERFLOW_UV 5
2028
2029/* sv_2iuv_non_preserve(): private routine for use by sv_2iv() and sv_2uv() */
28e5dec8
JH
2030
2031/* For sv_2nv these three cases are "SvNOK and don't bother casting" */
2032STATIC int
645c22ef 2033S_sv_2iuv_non_preserve(pTHX_ register SV *sv, I32 numtype)
28e5dec8 2034{
3f7c398e 2035 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_2iuv_non '%s', IV=0x%"UVxf" NV=%"NVgf" inttype=%"UVXf"\n", SvPVX_const(sv), SvIVX(sv), SvNVX(sv), (UV)numtype));
28e5dec8
JH
2036 if (SvNVX(sv) < (NV)IV_MIN) {
2037 (void)SvIOKp_on(sv);
2038 (void)SvNOK_on(sv);
45977657 2039 SvIV_set(sv, IV_MIN);
28e5dec8
JH
2040 return IS_NUMBER_UNDERFLOW_IV;
2041 }
2042 if (SvNVX(sv) > (NV)UV_MAX) {
2043 (void)SvIOKp_on(sv);
2044 (void)SvNOK_on(sv);
2045 SvIsUV_on(sv);
607fa7f2 2046 SvUV_set(sv, UV_MAX);
28e5dec8
JH
2047 return IS_NUMBER_OVERFLOW_UV;
2048 }
c2988b20
NC
2049 (void)SvIOKp_on(sv);
2050 (void)SvNOK_on(sv);
2051 /* Can't use strtol etc to convert this string. (See truth table in
2052 sv_2iv */
2053 if (SvNVX(sv) <= (UV)IV_MAX) {
45977657 2054 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2055 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2056 SvIOK_on(sv); /* Integer is precise. NOK, IOK */
2057 } else {
2058 /* Integer is imprecise. NOK, IOKp */
2059 }
2060 return SvNVX(sv) < 0 ? IS_NUMBER_UNDERFLOW_UV : IS_NUMBER_IV_AND_UV;
2061 }
2062 SvIsUV_on(sv);
607fa7f2 2063 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
2064 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2065 if (SvUVX(sv) == UV_MAX) {
2066 /* As we know that NVs don't preserve UVs, UV_MAX cannot
2067 possibly be preserved by NV. Hence, it must be overflow.
2068 NOK, IOKp */
2069 return IS_NUMBER_OVERFLOW_UV;
2070 }
2071 SvIOK_on(sv); /* Integer is precise. NOK, UOK */
2072 } else {
2073 /* Integer is imprecise. NOK, IOKp */
28e5dec8 2074 }
c2988b20 2075 return IS_NUMBER_OVERFLOW_IV;
28e5dec8 2076}
645c22ef
DM
2077#endif /* !NV_PRESERVES_UV*/
2078
891f9566
YST
2079/* sv_2iv() is now a macro using Perl_sv_2iv_flags();
2080 * this function provided for binary compatibility only
2081 */
2082
2083IV
2084Perl_sv_2iv(pTHX_ register SV *sv)
2085{
2086 return sv_2iv_flags(sv, SV_GMAGIC);
2087}
2088
645c22ef 2089/*
891f9566 2090=for apidoc sv_2iv_flags
645c22ef 2091
891f9566
YST
2092Return the integer value of an SV, doing any necessary string
2093conversion. If flags includes SV_GMAGIC, does an mg_get() first.
2094Normally used via the C<SvIV(sv)> and C<SvIVx(sv)> macros.
645c22ef
DM
2095
2096=cut
2097*/
28e5dec8 2098
a0d0e21e 2099IV
891f9566 2100Perl_sv_2iv_flags(pTHX_ register SV *sv, I32 flags)
79072805
LW
2101{
2102 if (!sv)
2103 return 0;
8990e307 2104 if (SvGMAGICAL(sv)) {
891f9566
YST
2105 if (flags & SV_GMAGIC)
2106 mg_get(sv);
463ee0b2
LW
2107 if (SvIOKp(sv))
2108 return SvIVX(sv);
748a9306 2109 if (SvNOKp(sv)) {
25da4f38 2110 return I_V(SvNVX(sv));
748a9306 2111 }
36477c24 2112 if (SvPOKp(sv) && SvLEN(sv))
2113 return asIV(sv);
3fe9a6f1 2114 if (!SvROK(sv)) {
d008e5eb 2115 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2116 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2117 report_uninit(sv);
c6ee37c5 2118 }
36477c24 2119 return 0;
3fe9a6f1 2120 }
463ee0b2 2121 }
ed6116ce 2122 if (SvTHINKFIRST(sv)) {
a0d0e21e 2123 if (SvROK(sv)) {
a0d0e21e 2124 SV* tmpstr;
1554e226 2125 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,numer)) &&
b4b9a328 2126 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv))))
9e7bc3e8 2127 return SvIV(tmpstr);
56431972 2128 return PTR2IV(SvRV(sv));
a0d0e21e 2129 }
765f542d
NC
2130 if (SvIsCOW(sv)) {
2131 sv_force_normal_flags(sv, 0);
47deb5e7 2132 }
0336b60e 2133 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 2134 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2135 report_uninit(sv);
ed6116ce
LW
2136 return 0;
2137 }
79072805 2138 }
25da4f38
IZ
2139 if (SvIOKp(sv)) {
2140 if (SvIsUV(sv)) {
2141 return (IV)(SvUVX(sv));
2142 }
2143 else {
2144 return SvIVX(sv);
2145 }
463ee0b2 2146 }
748a9306 2147 if (SvNOKp(sv)) {
28e5dec8
JH
2148 /* erm. not sure. *should* never get NOKp (without NOK) from sv_2nv
2149 * without also getting a cached IV/UV from it at the same time
2150 * (ie PV->NV conversion should detect loss of accuracy and cache
2151 * IV or UV at same time to avoid this. NWC */
25da4f38
IZ
2152
2153 if (SvTYPE(sv) == SVt_NV)
2154 sv_upgrade(sv, SVt_PVNV);
2155
28e5dec8
JH
2156 (void)SvIOKp_on(sv); /* Must do this first, to clear any SvOOK */
2157 /* < not <= as for NV doesn't preserve UV, ((NV)IV_MAX+1) will almost
2158 certainly cast into the IV range at IV_MAX, whereas the correct
2159 answer is the UV IV_MAX +1. Hence < ensures that dodgy boundary
2160 cases go to UV */
2161 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2162 SvIV_set(sv, I_V(SvNVX(sv)));
28e5dec8
JH
2163 if (SvNVX(sv) == (NV) SvIVX(sv)
2164#ifndef NV_PRESERVES_UV
2165 && (((UV)1 << NV_PRESERVES_UV_BITS) >
2166 (UV)(SvIVX(sv) > 0 ? SvIVX(sv) : -SvIVX(sv)))
2167 /* Don't flag it as "accurately an integer" if the number
2168 came from a (by definition imprecise) NV operation, and
2169 we're outside the range of NV integer precision */
2170#endif
2171 ) {
2172 SvIOK_on(sv); /* Can this go wrong with rounding? NWC */
2173 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2174 "0x%"UVxf" iv(%"NVgf" => %"IVdf") (precise)\n",
28e5dec8
JH
2175 PTR2UV(sv),
2176 SvNVX(sv),
2177 SvIVX(sv)));
2178
2179 } else {
2180 /* IV not precise. No need to convert from PV, as NV
2181 conversion would already have cached IV if it detected
2182 that PV->IV would be better than PV->NV->IV
2183 flags already correct - don't set public IOK. */
2184 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2185 "0x%"UVxf" iv(%"NVgf" => %"IVdf") (imprecise)\n",
28e5dec8
JH
2186 PTR2UV(sv),
2187 SvNVX(sv),
2188 SvIVX(sv)));
2189 }
2190 /* Can the above go wrong if SvIVX == IV_MIN and SvNVX < IV_MIN,
2191 but the cast (NV)IV_MIN rounds to a the value less (more
2192 negative) than IV_MIN which happens to be equal to SvNVX ??
2193 Analogous to 0xFFFFFFFFFFFFFFFF rounding up to NV (2**64) and
2194 NV rounding back to 0xFFFFFFFFFFFFFFFF, so UVX == UV(NVX) and
2195 (NV)UVX == NVX are both true, but the values differ. :-(
2196 Hopefully for 2s complement IV_MIN is something like
2197 0x8000000000000000 which will be exact. NWC */
d460ef45 2198 }
25da4f38 2199 else {
607fa7f2 2200 SvUV_set(sv, U_V(SvNVX(sv)));
28e5dec8
JH
2201 if (
2202 (SvNVX(sv) == (NV) SvUVX(sv))
2203#ifndef NV_PRESERVES_UV
2204 /* Make sure it's not 0xFFFFFFFFFFFFFFFF */
2205 /*&& (SvUVX(sv) != UV_MAX) irrelevant with code below */
2206 && (((UV)1 << NV_PRESERVES_UV_BITS) > SvUVX(sv))
2207 /* Don't flag it as "accurately an integer" if the number
2208 came from a (by definition imprecise) NV operation, and
2209 we're outside the range of NV integer precision */
2210#endif
2211 )
2212 SvIOK_on(sv);
25da4f38
IZ
2213 SvIsUV_on(sv);
2214 ret_iv_max:
1c846c1f 2215 DEBUG_c(PerlIO_printf(Perl_debug_log,
57def98f 2216 "0x%"UVxf" 2iv(%"UVuf" => %"IVdf") (as unsigned)\n",
56431972 2217 PTR2UV(sv),
57def98f
JH
2218 SvUVX(sv),
2219 SvUVX(sv)));
25da4f38
IZ
2220 return (IV)SvUVX(sv);
2221 }
748a9306
LW
2222 }
2223 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2224 UV value;
504618e9 2225 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
25da4f38
IZ
2226 /* We want to avoid a possible problem when we cache an IV which
2227 may be later translated to an NV, and the resulting NV is not
c2988b20
NC
2228 the same as the direct translation of the initial string
2229 (eg 123.456 can shortcut to the IV 123 with atol(), but we must
2230 be careful to ensure that the value with the .456 is around if the
2231 NV value is requested in the future).
1c846c1f 2232
25da4f38
IZ
2233 This means that if we cache such an IV, we need to cache the
2234 NV as well. Moreover, we trade speed for space, and do not
28e5dec8 2235 cache the NV if we are sure it's not needed.
25da4f38 2236 */
16b7a9a4 2237
c2988b20
NC
2238 /* SVt_PVNV is one higher than SVt_PVIV, hence this order */
2239 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2240 == IS_NUMBER_IN_UV) {
5e045b90 2241 /* It's definitely an integer, only upgrade to PVIV */
28e5dec8
JH
2242 if (SvTYPE(sv) < SVt_PVIV)
2243 sv_upgrade(sv, SVt_PVIV);
f7bbb42a 2244 (void)SvIOK_on(sv);
c2988b20
NC
2245 } else if (SvTYPE(sv) < SVt_PVNV)
2246 sv_upgrade(sv, SVt_PVNV);
28e5dec8 2247
c2988b20
NC
2248 /* If NV preserves UV then we only use the UV value if we know that
2249 we aren't going to call atof() below. If NVs don't preserve UVs
2250 then the value returned may have more precision than atof() will
2251 return, even though value isn't perfectly accurate. */
2252 if ((numtype & (IS_NUMBER_IN_UV
2253#ifdef NV_PRESERVES_UV
2254 | IS_NUMBER_NOT_INT
2255#endif
2256 )) == IS_NUMBER_IN_UV) {
2257 /* This won't turn off the public IOK flag if it was set above */
2258 (void)SvIOKp_on(sv);
2259
2260 if (!(numtype & IS_NUMBER_NEG)) {
2261 /* positive */;
2262 if (value <= (UV)IV_MAX) {
45977657 2263 SvIV_set(sv, (IV)value);
c2988b20 2264 } else {
607fa7f2 2265 SvUV_set(sv, value);
c2988b20
NC
2266 SvIsUV_on(sv);
2267 }
2268 } else {
2269 /* 2s complement assumption */
2270 if (value <= (UV)IV_MIN) {
45977657 2271 SvIV_set(sv, -(IV)value);
c2988b20
NC
2272 } else {
2273 /* Too negative for an IV. This is a double upgrade, but
d1be9408 2274 I'm assuming it will be rare. */
c2988b20
NC
2275 if (SvTYPE(sv) < SVt_PVNV)
2276 sv_upgrade(sv, SVt_PVNV);
2277 SvNOK_on(sv);
2278 SvIOK_off(sv);
2279 SvIOKp_on(sv);
9d6ce603 2280 SvNV_set(sv, -(NV)value);
45977657 2281 SvIV_set(sv, IV_MIN);
c2988b20
NC
2282 }
2283 }
2284 }
2285 /* For !NV_PRESERVES_UV and IS_NUMBER_IN_UV and IS_NUMBER_NOT_INT we
2286 will be in the previous block to set the IV slot, and the next
2287 block to set the NV slot. So no else here. */
2288
2289 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2290 != IS_NUMBER_IN_UV) {
2291 /* It wasn't an (integer that doesn't overflow the UV). */
3f7c398e 2292 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8 2293
c2988b20
NC
2294 if (! numtype && ckWARN(WARN_NUMERIC))
2295 not_a_number(sv);
28e5dec8 2296
65202027 2297#if defined(USE_LONG_DOUBLE)
c2988b20
NC
2298 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%" PERL_PRIgldbl ")\n",
2299 PTR2UV(sv), SvNVX(sv)));
65202027 2300#else
1779d84d 2301 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"NVgf")\n",
c2988b20 2302 PTR2UV(sv), SvNVX(sv)));
65202027 2303#endif
28e5dec8
JH
2304
2305
2306#ifdef NV_PRESERVES_UV
c2988b20
NC
2307 (void)SvIOKp_on(sv);
2308 (void)SvNOK_on(sv);
2309 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2310 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2311 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2312 SvIOK_on(sv);
28e5dec8 2313 } else {
c2988b20
NC
2314 /* Integer is imprecise. NOK, IOKp */
2315 }
2316 /* UV will not work better than IV */
2317 } else {
2318 if (SvNVX(sv) > (NV)UV_MAX) {
2319 SvIsUV_on(sv);
2320 /* Integer is inaccurate. NOK, IOKp, is UV */
607fa7f2 2321 SvUV_set(sv, UV_MAX);
c2988b20
NC
2322 SvIsUV_on(sv);
2323 } else {
607fa7f2 2324 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
2325 /* 0xFFFFFFFFFFFFFFFF not an issue in here */
2326 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2327 SvIOK_on(sv);
28e5dec8
JH
2328 SvIsUV_on(sv);
2329 } else {
c2988b20
NC
2330 /* Integer is imprecise. NOK, IOKp, is UV */
2331 SvIsUV_on(sv);
28e5dec8 2332 }
28e5dec8 2333 }
c2988b20
NC
2334 goto ret_iv_max;
2335 }
28e5dec8 2336#else /* NV_PRESERVES_UV */
c2988b20
NC
2337 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2338 == (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT)) {
2339 /* The IV slot will have been set from value returned by
2340 grok_number above. The NV slot has just been set using
2341 Atof. */
560b0c46 2342 SvNOK_on(sv);
c2988b20
NC
2343 assert (SvIOKp(sv));
2344 } else {
2345 if (((UV)1 << NV_PRESERVES_UV_BITS) >
2346 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
2347 /* Small enough to preserve all bits. */
2348 (void)SvIOKp_on(sv);
2349 SvNOK_on(sv);
45977657 2350 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2351 if ((NV)(SvIVX(sv)) == SvNVX(sv))
2352 SvIOK_on(sv);
2353 /* Assumption: first non-preserved integer is < IV_MAX,
2354 this NV is in the preserved range, therefore: */
2355 if (!(U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))
2356 < (UV)IV_MAX)) {
32fdb065 2357 Perl_croak(aTHX_ "sv_2iv assumed (U_V(fabs((double)SvNVX(sv))) < (UV)IV_MAX) but SvNVX(sv)=%"NVgf" U_V is 0x%"UVxf", IV_MAX is 0x%"UVxf"\n", SvNVX(sv), U_V(SvNVX(sv)), (UV)IV_MAX);
c2988b20
NC
2358 }
2359 } else {
2360 /* IN_UV NOT_INT
2361 0 0 already failed to read UV.
2362 0 1 already failed to read UV.
2363 1 0 you won't get here in this case. IV/UV
2364 slot set, public IOK, Atof() unneeded.
2365 1 1 already read UV.
2366 so there's no point in sv_2iuv_non_preserve() attempting
2367 to use atol, strtol, strtoul etc. */
2368 if (sv_2iuv_non_preserve (sv, numtype)
2369 >= IS_NUMBER_OVERFLOW_IV)
2370 goto ret_iv_max;
2371 }
2372 }
28e5dec8 2373#endif /* NV_PRESERVES_UV */
25da4f38 2374 }
28e5dec8 2375 } else {
041457d9 2376 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 2377 report_uninit(sv);
25da4f38
IZ
2378 if (SvTYPE(sv) < SVt_IV)
2379 /* Typically the caller expects that sv_any is not NULL now. */
2380 sv_upgrade(sv, SVt_IV);
a0d0e21e 2381 return 0;
79072805 2382 }
1d7c1841
GS
2383 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"IVdf")\n",
2384 PTR2UV(sv),SvIVX(sv)));
25da4f38 2385 return SvIsUV(sv) ? (IV)SvUVX(sv) : SvIVX(sv);
79072805
LW
2386}
2387
891f9566
YST
2388/* sv_2uv() is now a macro using Perl_sv_2uv_flags();
2389 * this function provided for binary compatibility only
2390 */
2391
2392UV
2393Perl_sv_2uv(pTHX_ register SV *sv)
2394{
2395 return sv_2uv_flags(sv, SV_GMAGIC);
2396}
2397
645c22ef 2398/*
891f9566 2399=for apidoc sv_2uv_flags
645c22ef
DM
2400
2401Return the unsigned integer value of an SV, doing any necessary string
891f9566
YST
2402conversion. If flags includes SV_GMAGIC, does an mg_get() first.
2403Normally used via the C<SvUV(sv)> and C<SvUVx(sv)> macros.
645c22ef
DM
2404
2405=cut
2406*/
2407
ff68c719 2408UV
891f9566 2409Perl_sv_2uv_flags(pTHX_ register SV *sv, I32 flags)
ff68c719 2410{
2411 if (!sv)
2412 return 0;
2413 if (SvGMAGICAL(sv)) {
891f9566
YST
2414 if (flags & SV_GMAGIC)
2415 mg_get(sv);
ff68c719 2416 if (SvIOKp(sv))
2417 return SvUVX(sv);
2418 if (SvNOKp(sv))
2419 return U_V(SvNVX(sv));
36477c24 2420 if (SvPOKp(sv) && SvLEN(sv))
2421 return asUV(sv);
3fe9a6f1 2422 if (!SvROK(sv)) {
d008e5eb 2423 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2424 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2425 report_uninit(sv);
c6ee37c5 2426 }
36477c24 2427 return 0;
3fe9a6f1 2428 }
ff68c719 2429 }
2430 if (SvTHINKFIRST(sv)) {
2431 if (SvROK(sv)) {
ff68c719 2432 SV* tmpstr;
1554e226 2433 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,numer)) &&
b4b9a328 2434 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv))))
9e7bc3e8 2435 return SvUV(tmpstr);
56431972 2436 return PTR2UV(SvRV(sv));
ff68c719 2437 }
765f542d
NC
2438 if (SvIsCOW(sv)) {
2439 sv_force_normal_flags(sv, 0);
8a818333 2440 }
0336b60e 2441 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 2442 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2443 report_uninit(sv);
ff68c719 2444 return 0;
2445 }
2446 }
25da4f38
IZ
2447 if (SvIOKp(sv)) {
2448 if (SvIsUV(sv)) {
2449 return SvUVX(sv);
2450 }
2451 else {
2452 return (UV)SvIVX(sv);
2453 }
ff68c719 2454 }
2455 if (SvNOKp(sv)) {
28e5dec8
JH
2456 /* erm. not sure. *should* never get NOKp (without NOK) from sv_2nv
2457 * without also getting a cached IV/UV from it at the same time
2458 * (ie PV->NV conversion should detect loss of accuracy and cache
2459 * IV or UV at same time to avoid this. */
2460 /* IV-over-UV optimisation - choose to cache IV if possible */
2461
25da4f38
IZ
2462 if (SvTYPE(sv) == SVt_NV)
2463 sv_upgrade(sv, SVt_PVNV);
28e5dec8
JH
2464
2465 (void)SvIOKp_on(sv); /* Must do this first, to clear any SvOOK */
2466 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2467 SvIV_set(sv, I_V(SvNVX(sv)));
28e5dec8
JH
2468 if (SvNVX(sv) == (NV) SvIVX(sv)
2469#ifndef NV_PRESERVES_UV
2470 && (((UV)1 << NV_PRESERVES_UV_BITS) >
2471 (UV)(SvIVX(sv) > 0 ? SvIVX(sv) : -SvIVX(sv)))
2472 /* Don't flag it as "accurately an integer" if the number
2473 came from a (by definition imprecise) NV operation, and
2474 we're outside the range of NV integer precision */
2475#endif
2476 ) {
2477 SvIOK_on(sv); /* Can this go wrong with rounding? NWC */
2478 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2479 "0x%"UVxf" uv(%"NVgf" => %"IVdf") (precise)\n",
28e5dec8
JH
2480 PTR2UV(sv),
2481 SvNVX(sv),
2482 SvIVX(sv)));
2483
2484 } else {
2485 /* IV not precise. No need to convert from PV, as NV
2486 conversion would already have cached IV if it detected
2487 that PV->IV would be better than PV->NV->IV
2488 flags already correct - don't set public IOK. */
2489 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2490 "0x%"UVxf" uv(%"NVgf" => %"IVdf") (imprecise)\n",
28e5dec8
JH
2491 PTR2UV(sv),
2492 SvNVX(sv),
2493 SvIVX(sv)));
2494 }
2495 /* Can the above go wrong if SvIVX == IV_MIN and SvNVX < IV_MIN,
2496 but the cast (NV)IV_MIN rounds to a the value less (more
2497 negative) than IV_MIN which happens to be equal to SvNVX ??
2498 Analogous to 0xFFFFFFFFFFFFFFFF rounding up to NV (2**64) and
2499 NV rounding back to 0xFFFFFFFFFFFFFFFF, so UVX == UV(NVX) and
2500 (NV)UVX == NVX are both true, but the values differ. :-(
2501 Hopefully for 2s complement IV_MIN is something like
2502 0x8000000000000000 which will be exact. NWC */
d460ef45 2503 }
28e5dec8 2504 else {
607fa7f2 2505 SvUV_set(sv, U_V(SvNVX(sv)));
28e5dec8
JH
2506 if (
2507 (SvNVX(sv) == (NV) SvUVX(sv))
2508#ifndef NV_PRESERVES_UV
2509 /* Make sure it's not 0xFFFFFFFFFFFFFFFF */
2510 /*&& (SvUVX(sv) != UV_MAX) irrelevant with code below */
2511 && (((UV)1 << NV_PRESERVES_UV_BITS) > SvUVX(sv))
2512 /* Don't flag it as "accurately an integer" if the number
2513 came from a (by definition imprecise) NV operation, and
2514 we're outside the range of NV integer precision */
2515#endif
2516 )
2517 SvIOK_on(sv);
2518 SvIsUV_on(sv);
1c846c1f 2519 DEBUG_c(PerlIO_printf(Perl_debug_log,
28e5dec8 2520 "0x%"UVxf" 2uv(%"UVuf" => %"IVdf") (as unsigned)\n",
57def98f 2521 PTR2UV(sv),
28e5dec8
JH
2522 SvUVX(sv),
2523 SvUVX(sv)));
25da4f38 2524 }
ff68c719 2525 }
2526 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2527 UV value;
504618e9 2528 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
25da4f38
IZ
2529
2530 /* We want to avoid a possible problem when we cache a UV which
2531 may be later translated to an NV, and the resulting NV is not
2532 the translation of the initial data.
1c846c1f 2533
25da4f38
IZ
2534 This means that if we cache such a UV, we need to cache the
2535 NV as well. Moreover, we trade speed for space, and do not
2536 cache the NV if not needed.
2537 */
16b7a9a4 2538
c2988b20
NC
2539 /* SVt_PVNV is one higher than SVt_PVIV, hence this order */
2540 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2541 == IS_NUMBER_IN_UV) {
5e045b90 2542 /* It's definitely an integer, only upgrade to PVIV */
28e5dec8 2543 if (SvTYPE(sv) < SVt_PVIV)
f7bbb42a
JH
2544 sv_upgrade(sv, SVt_PVIV);
2545 (void)SvIOK_on(sv);
c2988b20
NC
2546 } else if (SvTYPE(sv) < SVt_PVNV)
2547 sv_upgrade(sv, SVt_PVNV);
d460ef45 2548
c2988b20
NC
2549 /* If NV preserves UV then we only use the UV value if we know that
2550 we aren't going to call atof() below. If NVs don't preserve UVs
2551 then the value returned may have more precision than atof() will
2552 return, even though it isn't accurate. */
2553 if ((numtype & (IS_NUMBER_IN_UV
2554#ifdef NV_PRESERVES_UV
2555 | IS_NUMBER_NOT_INT
2556#endif
2557 )) == IS_NUMBER_IN_UV) {
2558 /* This won't turn off the public IOK flag if it was set above */
2559 (void)SvIOKp_on(sv);
2560
2561 if (!(numtype & IS_NUMBER_NEG)) {
2562 /* positive */;
2563 if (value <= (UV)IV_MAX) {
45977657 2564 SvIV_set(sv, (IV)value);
28e5dec8
JH
2565 } else {
2566 /* it didn't overflow, and it was positive. */
607fa7f2 2567 SvUV_set(sv, value);
28e5dec8
JH
2568 SvIsUV_on(sv);
2569 }
c2988b20
NC
2570 } else {
2571 /* 2s complement assumption */
2572 if (value <= (UV)IV_MIN) {
45977657 2573 SvIV_set(sv, -(IV)value);
c2988b20
NC
2574 } else {
2575 /* Too negative for an IV. This is a double upgrade, but
d1be9408 2576 I'm assuming it will be rare. */
c2988b20
NC
2577 if (SvTYPE(sv) < SVt_PVNV)
2578 sv_upgrade(sv, SVt_PVNV);
2579 SvNOK_on(sv);
2580 SvIOK_off(sv);
2581 SvIOKp_on(sv);
9d6ce603 2582 SvNV_set(sv, -(NV)value);
45977657 2583 SvIV_set(sv, IV_MIN);
c2988b20
NC
2584 }
2585 }
2586 }
2587
2588 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2589 != IS_NUMBER_IN_UV) {
2590 /* It wasn't an integer, or it overflowed the UV. */
3f7c398e 2591 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8 2592
c2988b20 2593 if (! numtype && ckWARN(WARN_NUMERIC))
28e5dec8
JH
2594 not_a_number(sv);
2595
2596#if defined(USE_LONG_DOUBLE)
c2988b20
NC
2597 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%" PERL_PRIgldbl ")\n",
2598 PTR2UV(sv), SvNVX(sv)));
28e5dec8 2599#else
1779d84d 2600 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%"NVgf")\n",
c2988b20 2601 PTR2UV(sv), SvNVX(sv)));
28e5dec8
JH
2602#endif
2603
2604#ifdef NV_PRESERVES_UV
c2988b20
NC
2605 (void)SvIOKp_on(sv);
2606 (void)SvNOK_on(sv);
2607 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2608 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2609 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2610 SvIOK_on(sv);
2611 } else {
2612 /* Integer is imprecise. NOK, IOKp */
2613 }
2614 /* UV will not work better than IV */
2615 } else {
2616 if (SvNVX(sv) > (NV)UV_MAX) {
2617 SvIsUV_on(sv);
2618 /* Integer is inaccurate. NOK, IOKp, is UV */
607fa7f2 2619 SvUV_set(sv, UV_MAX);
c2988b20
NC
2620 SvIsUV_on(sv);
2621 } else {
607fa7f2 2622 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
2623 /* 0xFFFFFFFFFFFFFFFF not an issue in here, NVs
2624 NV preservse UV so can do correct comparison. */
2625 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2626 SvIOK_on(sv);
2627 SvIsUV_on(sv);
2628 } else {
2629 /* Integer is imprecise. NOK, IOKp, is UV */
2630 SvIsUV_on(sv);
2631 }
2632 }
2633 }
28e5dec8 2634#else /* NV_PRESERVES_UV */
c2988b20
NC
2635 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2636 == (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT)) {
2637 /* The UV slot will have been set from value returned by
2638 grok_number above. The NV slot has just been set using
2639 Atof. */
560b0c46 2640 SvNOK_on(sv);
c2988b20
NC
2641 assert (SvIOKp(sv));
2642 } else {
2643 if (((UV)1 << NV_PRESERVES_UV_BITS) >
2644 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
2645 /* Small enough to preserve all bits. */
2646 (void)SvIOKp_on(sv);
2647 SvNOK_on(sv);
45977657 2648 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2649 if ((NV)(SvIVX(sv)) == SvNVX(sv))
2650 SvIOK_on(sv);
2651 /* Assumption: first non-preserved integer is < IV_MAX,
2652 this NV is in the preserved range, therefore: */
2653 if (!(U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))
2654 < (UV)IV_MAX)) {
32fdb065 2655 Perl_croak(aTHX_ "sv_2uv assumed (U_V(fabs((double)SvNVX(sv))) < (UV)IV_MAX) but SvNVX(sv)=%"NVgf" U_V is 0x%"UVxf", IV_MAX is 0x%"UVxf"\n", SvNVX(sv), U_V(SvNVX(sv)), (UV)IV_MAX);
c2988b20
NC
2656 }
2657 } else
2658 sv_2iuv_non_preserve (sv, numtype);
2659 }
28e5dec8 2660#endif /* NV_PRESERVES_UV */
f7bbb42a 2661 }
ff68c719 2662 }
2663 else {
d008e5eb 2664 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2665 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2666 report_uninit(sv);
c6ee37c5 2667 }
25da4f38
IZ
2668 if (SvTYPE(sv) < SVt_IV)
2669 /* Typically the caller expects that sv_any is not NULL now. */
2670 sv_upgrade(sv, SVt_IV);
ff68c719 2671 return 0;
2672 }
25da4f38 2673
1d7c1841
GS
2674 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%"UVuf")\n",
2675 PTR2UV(sv),SvUVX(sv)));
25da4f38 2676 return SvIsUV(sv) ? SvUVX(sv) : (UV)SvIVX(sv);
ff68c719 2677}
2678
645c22ef
DM
2679/*
2680=for apidoc sv_2nv
2681
2682Return the num value of an SV, doing any necessary string or integer
2683conversion, magic etc. Normally used via the C<SvNV(sv)> and C<SvNVx(sv)>
2684macros.
2685
2686=cut
2687*/
2688
65202027 2689NV
864dbfa3 2690Perl_sv_2nv(pTHX_ register SV *sv)
79072805
LW
2691{
2692 if (!sv)
2693 return 0.0;
8990e307 2694 if (SvGMAGICAL(sv)) {
463ee0b2
LW
2695 mg_get(sv);
2696 if (SvNOKp(sv))
2697 return SvNVX(sv);
a0d0e21e 2698 if (SvPOKp(sv) && SvLEN(sv)) {
041457d9 2699 if (!SvIOKp(sv) && ckWARN(WARN_NUMERIC) &&
504618e9 2700 !grok_number(SvPVX_const(sv), SvCUR(sv), NULL))
a0d0e21e 2701 not_a_number(sv);
3f7c398e 2702 return Atof(SvPVX_const(sv));
a0d0e21e 2703 }
25da4f38 2704 if (SvIOKp(sv)) {
1c846c1f 2705 if (SvIsUV(sv))
65202027 2706 return (NV)SvUVX(sv);
25da4f38 2707 else
65202027 2708 return (NV)SvIVX(sv);
25da4f38 2709 }
16d20bd9 2710 if (!SvROK(sv)) {
d008e5eb 2711 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2712 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2713 report_uninit(sv);
c6ee37c5 2714 }
66a1b24b 2715 return (NV)0;
16d20bd9 2716 }
463ee0b2 2717 }
ed6116ce 2718 if (SvTHINKFIRST(sv)) {
a0d0e21e 2719 if (SvROK(sv)) {
a0d0e21e 2720 SV* tmpstr;
1554e226 2721 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,numer)) &&
b4b9a328 2722 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv))))
9e7bc3e8 2723 return SvNV(tmpstr);
56431972 2724 return PTR2NV(SvRV(sv));
a0d0e21e 2725 }
765f542d
NC
2726 if (SvIsCOW(sv)) {
2727 sv_force_normal_flags(sv, 0);
8a818333 2728 }
0336b60e 2729 if (SvREADONLY(sv) && !SvOK(sv)) {
599cee73 2730 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2731 report_uninit(sv);
ed6116ce
LW
2732 return 0.0;
2733 }
79072805
LW
2734 }
2735 if (SvTYPE(sv) < SVt_NV) {
463ee0b2
LW
2736 if (SvTYPE(sv) == SVt_IV)
2737 sv_upgrade(sv, SVt_PVNV);
2738 else
2739 sv_upgrade(sv, SVt_NV);
906f284f 2740#ifdef USE_LONG_DOUBLE
097ee67d 2741 DEBUG_c({
f93f4e46 2742 STORE_NUMERIC_LOCAL_SET_STANDARD();
1d7c1841
GS
2743 PerlIO_printf(Perl_debug_log,
2744 "0x%"UVxf" num(%" PERL_PRIgldbl ")\n",
2745 PTR2UV(sv), SvNVX(sv));
572bbb43
GS
2746 RESTORE_NUMERIC_LOCAL();
2747 });
65202027 2748#else
572bbb43 2749 DEBUG_c({
f93f4e46 2750 STORE_NUMERIC_LOCAL_SET_STANDARD();
1779d84d 2751 PerlIO_printf(Perl_debug_log, "0x%"UVxf" num(%"NVgf")\n",
1d7c1841 2752 PTR2UV(sv), SvNVX(sv));
097ee67d
JH
2753 RESTORE_NUMERIC_LOCAL();
2754 });
572bbb43 2755#endif
79072805
LW
2756 }
2757 else if (SvTYPE(sv) < SVt_PVNV)
2758 sv_upgrade(sv, SVt_PVNV);
59d8ce62
NC
2759 if (SvNOKp(sv)) {
2760 return SvNVX(sv);
61604483 2761 }
59d8ce62 2762 if (SvIOKp(sv)) {
9d6ce603 2763 SvNV_set(sv, SvIsUV(sv) ? (NV)SvUVX(sv) : (NV)SvIVX(sv));
28e5dec8
JH
2764#ifdef NV_PRESERVES_UV
2765 SvNOK_on(sv);
2766#else
2767 /* Only set the public NV OK flag if this NV preserves the IV */
2768 /* Check it's not 0xFFFFFFFFFFFFFFFF */
2769 if (SvIsUV(sv) ? ((SvUVX(sv) != UV_MAX)&&(SvUVX(sv) == U_V(SvNVX(sv))))
2770 : (SvIVX(sv) == I_V(SvNVX(sv))))
2771 SvNOK_on(sv);
2772 else
2773 SvNOKp_on(sv);
2774#endif
93a17b20 2775 }
748a9306 2776 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2777 UV value;
3f7c398e 2778 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
041457d9 2779 if (!SvIOKp(sv) && !numtype && ckWARN(WARN_NUMERIC))
a0d0e21e 2780 not_a_number(sv);
28e5dec8 2781#ifdef NV_PRESERVES_UV
c2988b20
NC
2782 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2783 == IS_NUMBER_IN_UV) {
5e045b90 2784 /* It's definitely an integer */
9d6ce603 2785 SvNV_set(sv, (numtype & IS_NUMBER_NEG) ? -(NV)value : (NV)value);
c2988b20 2786 } else
3f7c398e 2787 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8
JH
2788 SvNOK_on(sv);
2789#else
3f7c398e 2790 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8
JH
2791 /* Only set the public NV OK flag if this NV preserves the value in
2792 the PV at least as well as an IV/UV would.
2793 Not sure how to do this 100% reliably. */
2794 /* if that shift count is out of range then Configure's test is
2795 wonky. We shouldn't be in here with NV_PRESERVES_UV_BITS ==
2796 UV_BITS */
2797 if (((UV)1 << NV_PRESERVES_UV_BITS) >
c2988b20 2798 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
28e5dec8 2799 SvNOK_on(sv); /* Definitely small enough to preserve all bits */
c2988b20
NC
2800 } else if (!(numtype & IS_NUMBER_IN_UV)) {
2801 /* Can't use strtol etc to convert this string, so don't try.
2802 sv_2iv and sv_2uv will use the NV to convert, not the PV. */
2803 SvNOK_on(sv);
2804 } else {
2805 /* value has been set. It may not be precise. */
2806 if ((numtype & IS_NUMBER_NEG) && (value > (UV)IV_MIN)) {
2807 /* 2s complement assumption for (UV)IV_MIN */
2808 SvNOK_on(sv); /* Integer is too negative. */
2809 } else {
2810 SvNOKp_on(sv);
2811 SvIOKp_on(sv);
6fa402ec 2812
c2988b20 2813 if (numtype & IS_NUMBER_NEG) {
45977657 2814 SvIV_set(sv, -(IV)value);
c2988b20 2815 } else if (value <= (UV)IV_MAX) {
45977657 2816 SvIV_set(sv, (IV)value);
c2988b20 2817 } else {
607fa7f2 2818 SvUV_set(sv, value);
c2988b20
NC
2819 SvIsUV_on(sv);
2820 }
2821
2822 if (numtype & IS_NUMBER_NOT_INT) {
2823 /* I believe that even if the original PV had decimals,
2824 they are lost beyond the limit of the FP precision.
2825 However, neither is canonical, so both only get p
2826 flags. NWC, 2000/11/25 */
2827 /* Both already have p flags, so do nothing */
2828 } else {
66a1b24b 2829 const NV nv = SvNVX(sv);
c2988b20
NC
2830 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
2831 if (SvIVX(sv) == I_V(nv)) {
2832 SvNOK_on(sv);
2833 SvIOK_on(sv);
2834 } else {
2835 SvIOK_on(sv);
2836 /* It had no "." so it must be integer. */
2837 }
2838 } else {
2839 /* between IV_MAX and NV(UV_MAX).
2840 Could be slightly > UV_MAX */
6fa402ec 2841
c2988b20
NC
2842 if (numtype & IS_NUMBER_NOT_INT) {
2843 /* UV and NV both imprecise. */
2844 } else {
66a1b24b 2845 const UV nv_as_uv = U_V(nv);
c2988b20
NC
2846
2847 if (value == nv_as_uv && SvUVX(sv) != UV_MAX) {
2848 SvNOK_on(sv);
2849 SvIOK_on(sv);
2850 } else {
2851 SvIOK_on(sv);
2852 }
2853 }
2854 }
2855 }
2856 }
2857 }
28e5dec8 2858#endif /* NV_PRESERVES_UV */
93a17b20 2859 }
79072805 2860 else {
041457d9 2861 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 2862 report_uninit(sv);
25da4f38
IZ
2863 if (SvTYPE(sv) < SVt_NV)
2864 /* Typically the caller expects that sv_any is not NULL now. */
28e5dec8
JH
2865 /* XXX Ilya implies that this is a bug in callers that assume this
2866 and ideally should be fixed. */
25da4f38 2867 sv_upgrade(sv, SVt_NV);
a0d0e21e 2868 return 0.0;
79072805 2869 }
572bbb43 2870#if defined(USE_LONG_DOUBLE)
097ee67d 2871 DEBUG_c({
f93f4e46 2872 STORE_NUMERIC_LOCAL_SET_STANDARD();
1d7c1841
GS
2873 PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2nv(%" PERL_PRIgldbl ")\n",
2874 PTR2UV(sv), SvNVX(sv));
572bbb43
GS
2875 RESTORE_NUMERIC_LOCAL();
2876 });
65202027 2877#else
572bbb43 2878 DEBUG_c({
f93f4e46 2879 STORE_NUMERIC_LOCAL_SET_STANDARD();
1779d84d 2880 PerlIO_printf(Perl_debug_log, "0x%"UVxf" 1nv(%"NVgf")\n",
1d7c1841 2881 PTR2UV(sv), SvNVX(sv));
097ee67d
JH
2882 RESTORE_NUMERIC_LOCAL();
2883 });
572bbb43 2884#endif
463ee0b2 2885 return SvNVX(sv);
79072805
LW
2886}
2887
645c22ef
DM
2888/* asIV(): extract an integer from the string value of an SV.
2889 * Caller must validate PVX */
2890
76e3520e 2891STATIC IV
cea2e8a9 2892S_asIV(pTHX_ SV *sv)
36477c24 2893{
c2988b20 2894 UV value;
66a1b24b 2895 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
c2988b20
NC
2896
2897 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2898 == IS_NUMBER_IN_UV) {
645c22ef 2899 /* It's definitely an integer */
c2988b20
NC
2900 if (numtype & IS_NUMBER_NEG) {
2901 if (value < (UV)IV_MIN)
2902 return -(IV)value;
2903 } else {
2904 if (value < (UV)IV_MAX)
2905 return (IV)value;
2906 }
2907 }
d008e5eb 2908 if (!numtype) {
d008e5eb
GS
2909 if (ckWARN(WARN_NUMERIC))
2910 not_a_number(sv);
2911 }
3f7c398e 2912 return I_V(Atof(SvPVX_const(sv)));
36477c24 2913}
2914
645c22ef
DM
2915/* asUV(): extract an unsigned integer from the string value of an SV
2916 * Caller must validate PVX */
2917
76e3520e 2918STATIC UV
cea2e8a9 2919S_asUV(pTHX_ SV *sv)
36477c24 2920{
c2988b20 2921 UV value;
504618e9 2922 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
36477c24 2923
c2988b20
NC
2924 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2925 == IS_NUMBER_IN_UV) {
645c22ef 2926 /* It's definitely an integer */
6fa402ec 2927 if (!(numtype & IS_NUMBER_NEG))
c2988b20
NC
2928 return value;
2929 }
d008e5eb 2930 if (!numtype) {
d008e5eb
GS
2931 if (ckWARN(WARN_NUMERIC))
2932 not_a_number(sv);
2933 }
3f7c398e 2934 return U_V(Atof(SvPVX_const(sv)));
36477c24 2935}
2936
645c22ef
DM
2937/*
2938=for apidoc sv_2pv_nolen
2939
2940Like C<sv_2pv()>, but doesn't return the length too. You should usually
2941use the macro wrapper C<SvPV_nolen(sv)> instead.
2942=cut
2943*/
2944
79072805 2945char *
864dbfa3 2946Perl_sv_2pv_nolen(pTHX_ register SV *sv)
1fa8b10d 2947{
dafda6d1 2948 return sv_2pv(sv, 0);
1fa8b10d
JD
2949}
2950
645c22ef
DM
2951/* uiv_2buf(): private routine for use by sv_2pv_flags(): print an IV or
2952 * UV as a string towards the end of buf, and return pointers to start and
2953 * end of it.
2954 *
2955 * We assume that buf is at least TYPE_CHARS(UV) long.
2956 */
2957
864dbfa3 2958static char *
aec46f14 2959S_uiv_2buf(char *buf, IV iv, UV uv, int is_uv, char **peob)
25da4f38 2960{
25da4f38
IZ
2961 char *ptr = buf + TYPE_CHARS(UV);
2962 char *ebuf = ptr;
2963 int sign;
25da4f38
IZ
2964
2965 if (is_uv)
2966 sign = 0;
2967 else if (iv >= 0) {
2968 uv = iv;
2969 sign = 0;
2970 } else {
2971 uv = -iv;
2972 sign = 1;
2973 }
2974 do {
eb160463 2975 *--ptr = '0' + (char)(uv % 10);
25da4f38
IZ
2976 } while (uv /= 10);
2977 if (sign)
2978 *--ptr = '-';
2979 *peob = ebuf;
2980 return ptr;
2981}
2982
09540bc3
JH
2983/* sv_2pv() is now a macro using Perl_sv_2pv_flags();
2984 * this function provided for binary compatibility only
2985 */
2986
2987char *
2988Perl_sv_2pv(pTHX_ register SV *sv, STRLEN *lp)
2989{
2990 return sv_2pv_flags(sv, lp, SV_GMAGIC);
2991}
2992
645c22ef
DM
2993/*
2994=for apidoc sv_2pv_flags
2995
ff276b08 2996Returns a pointer to the string value of an SV, and sets *lp to its length.
645c22ef
DM
2997If flags includes SV_GMAGIC, does an mg_get() first. Coerces sv to a string
2998if necessary.
2999Normally invoked via the C<SvPV_flags> macro. C<sv_2pv()> and C<sv_2pv_nomg>
3000usually end up here too.
3001
3002=cut
3003*/
3004
8d6d96c1
HS
3005char *
3006Perl_sv_2pv_flags(pTHX_ register SV *sv, STRLEN *lp, I32 flags)
3007{
79072805
LW
3008 register char *s;
3009 int olderrno;
cb50f42d 3010 SV *tsv, *origsv;
25da4f38
IZ
3011 char tbuf[64]; /* Must fit sprintf/Gconvert of longest IV/NV */
3012 char *tmpbuf = tbuf;
79072805 3013
463ee0b2 3014 if (!sv) {
cdb061a3
NC
3015 if (lp)
3016 *lp = 0;
73d840c0 3017 return (char *)"";
463ee0b2 3018 }
8990e307 3019 if (SvGMAGICAL(sv)) {
8d6d96c1
HS
3020 if (flags & SV_GMAGIC)
3021 mg_get(sv);
463ee0b2 3022 if (SvPOKp(sv)) {
cdb061a3
NC
3023 if (lp)
3024 *lp = SvCUR(sv);
10516c54
NC
3025 if (flags & SV_MUTABLE_RETURN)
3026 return SvPVX_mutable(sv);
4d84ee25
NC
3027 if (flags & SV_CONST_RETURN)
3028 return (char *)SvPVX_const(sv);
463ee0b2
LW
3029 return SvPVX(sv);
3030 }
cf2093f6 3031 if (SvIOKp(sv)) {
1c846c1f 3032 if (SvIsUV(sv))
57def98f 3033 (void)sprintf(tmpbuf,"%"UVuf, (UV)SvUVX(sv));
cf2093f6 3034 else
57def98f 3035 (void)sprintf(tmpbuf,"%"IVdf, (IV)SvIVX(sv));
46fc3d4c 3036 tsv = Nullsv;
a0d0e21e 3037 goto tokensave;
463ee0b2
LW
3038 }
3039 if (SvNOKp(sv)) {
2d4389e4 3040 Gconvert(SvNVX(sv), NV_DIG, 0, tmpbuf);
46fc3d4c 3041 tsv = Nullsv;
a0d0e21e 3042 goto tokensave;
463ee0b2 3043 }
16d20bd9 3044 if (!SvROK(sv)) {
d008e5eb 3045 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 3046 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 3047 report_uninit(sv);
c6ee37c5 3048 }
cdb061a3
NC
3049 if (lp)
3050 *lp = 0;
73d840c0 3051 return (char *)"";
16d20bd9 3052 }
463ee0b2 3053 }
ed6116ce
LW
3054 if (SvTHINKFIRST(sv)) {
3055 if (SvROK(sv)) {
a0d0e21e 3056 SV* tmpstr;
e1ec3a88 3057 register const char *typestr;
1554e226 3058 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,string)) &&
b4b9a328 3059 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv)))) {
50adf7d2
NC
3060 /* Unwrap this: */
3061 /* char *pv = lp ? SvPV(tmpstr, *lp) : SvPV_nolen(tmpstr); */
3062
3063 char *pv;
3064 if ((SvFLAGS(tmpstr) & (SVf_POK)) == SVf_POK) {
3065 if (flags & SV_CONST_RETURN) {
3066 pv = (char *) SvPVX_const(tmpstr);
3067 } else {
3068 pv = (flags & SV_MUTABLE_RETURN)
3069 ? SvPVX_mutable(tmpstr) : SvPVX(tmpstr);
3070 }
3071 if (lp)
3072 *lp = SvCUR(tmpstr);
3073 } else {
3074 pv = sv_2pv_flags(tmpstr, lp, flags);
3075 }
446eaa42
YST
3076 if (SvUTF8(tmpstr))
3077 SvUTF8_on(sv);
3078 else
3079 SvUTF8_off(sv);
3080 return pv;
3081 }
cb50f42d 3082 origsv = sv;
ed6116ce
LW
3083 sv = (SV*)SvRV(sv);
3084 if (!sv)
e1ec3a88 3085 typestr = "NULLREF";
ed6116ce 3086 else {
f9277f47
IZ
3087 MAGIC *mg;
3088
ed6116ce 3089 switch (SvTYPE(sv)) {
f9277f47
IZ
3090 case SVt_PVMG:
3091 if ( ((SvFLAGS(sv) &
1c846c1f 3092 (SVs_OBJECT|SVf_OK|SVs_GMG|SVs_SMG|SVs_RMG))
faf82a0b 3093 == (SVs_OBJECT|SVs_SMG))
14befaf4 3094 && (mg = mg_find(sv, PERL_MAGIC_qr))) {
e1ec3a88 3095 const regexp *re = (regexp *)mg->mg_obj;
1bd3ad17 3096
2cd61cdb 3097 if (!mg->mg_ptr) {
e1ec3a88 3098 const char *fptr = "msix";
8782bef2
GB
3099 char reflags[6];
3100 char ch;
3101 int left = 0;
3102 int right = 4;
ff385a1b 3103 char need_newline = 0;
eb160463 3104 U16 reganch = (U16)((re->reganch & PMf_COMPILETIME) >> 12);
8782bef2 3105
155aba94 3106 while((ch = *fptr++)) {
8782bef2
GB
3107 if(reganch & 1) {
3108 reflags[left++] = ch;
3109 }
3110 else {
3111 reflags[right--] = ch;
3112 }
3113 reganch >>= 1;
3114 }
3115 if(left != 4) {
3116 reflags[left] = '-';
3117 left = 5;
3118 }
3119
3120 mg->mg_len = re->prelen + 4 + left;
ff385a1b
JF
3121 /*
3122 * If /x was used, we have to worry about a regex
3123 * ending with a comment later being embedded
3124 * within another regex. If so, we don't want this
3125 * regex's "commentization" to leak out to the
3126 * right part of the enclosing regex, we must cap
3127 * it with a newline.
3128 *
3129 * So, if /x was used, we scan backwards from the
3130 * end of the regex. If we find a '#' before we
3131 * find a newline, we need to add a newline
3132 * ourself. If we find a '\n' first (or if we
3133 * don't find '#' or '\n'), we don't need to add
3134 * anything. -jfriedl
3135 */
3136 if (PMf_EXTENDED & re->reganch)
3137 {
e1ec3a88 3138 const char *endptr = re->precomp + re->prelen;
ff385a1b
JF
3139 while (endptr >= re->precomp)
3140 {
e1ec3a88 3141 const char c = *(endptr--);
ff385a1b
JF
3142 if (c == '\n')
3143 break; /* don't need another */
3144 if (c == '#') {
3145 /* we end while in a comment, so we
3146 need a newline */
3147 mg->mg_len++; /* save space for it */
3148 need_newline = 1; /* note to add it */
ab01544f 3149 break;
ff385a1b
JF
3150 }
3151 }
3152 }
3153
a02a5408 3154 Newx(mg->mg_ptr, mg->mg_len + 1 + left, char);
8782bef2
GB
3155 Copy("(?", mg->mg_ptr, 2, char);
3156 Copy(reflags, mg->mg_ptr+2, left, char);
3157 Copy(":", mg->mg_ptr+left+2, 1, char);
3158 Copy(re->precomp, mg->mg_ptr+3+left, re->prelen, char);
ff385a1b
JF
3159 if (need_newline)
3160 mg->mg_ptr[mg->mg_len - 2] = '\n';
1bd3ad17
IZ
3161 mg->mg_ptr[mg->mg_len - 1] = ')';
3162 mg->mg_ptr[mg->mg_len] = 0;
3163 }
3280af22 3164 PL_reginterp_cnt += re->program[0].next_off;
cb50f42d
YST
3165
3166 if (re->reganch & ROPT_UTF8)
3167 SvUTF8_on(origsv);
3168 else
3169 SvUTF8_off(origsv);
cdb061a3
NC
3170 if (lp)
3171 *lp = mg->mg_len;
1bd3ad17 3172 return mg->mg_ptr;
f9277f47
IZ
3173 }
3174 /* Fall through */
ed6116ce
LW
3175 case SVt_NULL:
3176 case SVt_IV:
3177 case SVt_NV:
3178 case SVt_RV:
3179 case SVt_PV:
3180 case SVt_PVIV:
3181 case SVt_PVNV:
e1ec3a88
AL
3182 case SVt_PVBM: typestr = SvROK(sv) ? "REF" : "SCALAR"; break;
3183 case SVt_PVLV: typestr = SvROK(sv) ? "REF"
be65207d
DM
3184 /* tied lvalues should appear to be
3185 * scalars for backwards compatitbility */
3186 : (LvTYPE(sv) == 't' || LvTYPE(sv) == 'T')
3187 ? "SCALAR" : "LVALUE"; break;
e1ec3a88
AL
3188 case SVt_PVAV: typestr = "ARRAY"; break;
3189 case SVt_PVHV: typestr = "HASH"; break;
3190 case SVt_PVCV: typestr = "CODE"; break;
3191 case SVt_PVGV: typestr = "GLOB"; break;
3192 case SVt_PVFM: typestr = "FORMAT"; break;
3193 case SVt_PVIO: typestr = "IO"; break;
3194 default: typestr = "UNKNOWN"; break;
ed6116ce 3195 }
46fc3d4c 3196 tsv = NEWSV(0,0);
a5cb6b62 3197 if (SvOBJECT(sv)) {
bfcb3514 3198 const char *name = HvNAME_get(SvSTASH(sv));
a5cb6b62 3199 Perl_sv_setpvf(aTHX_ tsv, "%s=%s(0x%"UVxf")",
e1ec3a88 3200 name ? name : "__ANON__" , typestr, PTR2UV(sv));
a5cb6b62 3201 }
ed6116ce 3202 else
e1ec3a88 3203 Perl_sv_setpvf(aTHX_ tsv, "%s(0x%"UVxf")", typestr, PTR2UV(sv));
a0d0e21e 3204 goto tokensaveref;
463ee0b2 3205 }
cdb061a3
NC
3206 if (lp)
3207 *lp = strlen(typestr);
73d840c0 3208 return (char *)typestr;
79072805 3209 }
0336b60e 3210 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 3211 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 3212 report_uninit(sv);
cdb061a3
NC
3213 if (lp)
3214 *lp = 0;
73d840c0 3215 return (char *)"";
79072805 3216 }
79072805 3217 }
28e5dec8
JH
3218 if (SvIOK(sv) || ((SvIOKp(sv) && !SvNOKp(sv)))) {
3219 /* I'm assuming that if both IV and NV are equally valid then
3220 converting the IV is going to be more efficient */
e1ec3a88
AL
3221 const U32 isIOK = SvIOK(sv);
3222 const U32 isUIOK = SvIsUV(sv);
28e5dec8
JH
3223 char buf[TYPE_CHARS(UV)];
3224 char *ebuf, *ptr;
3225
3226 if (SvTYPE(sv) < SVt_PVIV)
3227 sv_upgrade(sv, SVt_PVIV);
3228 if (isUIOK)
3229 ptr = uiv_2buf(buf, 0, SvUVX(sv), 1, &ebuf);
3230 else
3231 ptr = uiv_2buf(buf, SvIVX(sv), 0, 0, &ebuf);
5902b6a9
NC
3232 /* inlined from sv_setpvn */
3233 SvGROW_mutable(sv, (STRLEN)(ebuf - ptr + 1));
4d84ee25 3234 Move(ptr,SvPVX_mutable(sv),ebuf - ptr,char);
28e5dec8
JH
3235 SvCUR_set(sv, ebuf - ptr);
3236 s = SvEND(sv);
3237 *s = '\0';
3238 if (isIOK)
3239 SvIOK_on(sv);
3240 else
3241 SvIOKp_on(sv);
3242 if (isUIOK)
3243 SvIsUV_on(sv);
3244 }
3245 else if (SvNOKp(sv)) {
79072805
LW
3246 if (SvTYPE(sv) < SVt_PVNV)
3247 sv_upgrade(sv, SVt_PVNV);
1c846c1f 3248 /* The +20 is pure guesswork. Configure test needed. --jhi */
5902b6a9 3249 s = SvGROW_mutable(sv, NV_DIG + 20);
79072805 3250 olderrno = errno; /* some Xenix systems wipe out errno here */
79072805 3251#ifdef apollo
463ee0b2 3252 if (SvNVX(sv) == 0.0)
79072805
LW
3253 (void)strcpy(s,"0");
3254 else
3255#endif /*apollo*/
bbce6d69 3256 {
2d4389e4 3257 Gconvert(SvNVX(sv), NV_DIG, 0, s);
bbce6d69 3258 }
79072805 3259 errno = olderrno;
a0d0e21e
LW
3260#ifdef FIXNEGATIVEZERO
3261 if (*s == '-' && s[1] == '0' && !s[2])
3262 strcpy(s,"0");
3263#endif
79072805
LW
3264 while (*s) s++;
3265#ifdef hcx
3266 if (s[-1] == '.')
46fc3d4c 3267 *--s = '\0';
79072805
LW
3268#endif
3269 }
79072805 3270 else {
041457d9 3271 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 3272 report_uninit(sv);
cdb061a3 3273 if (lp)
a0d0e21e 3274 *lp = 0;
25da4f38
IZ
3275 if (SvTYPE(sv) < SVt_PV)
3276 /* Typically the caller expects that sv_any is not NULL now. */
3277 sv_upgrade(sv, SVt_PV);
73d840c0 3278 return (char *)"";
79072805 3279 }
cdb061a3
NC
3280 {
3281 STRLEN len = s - SvPVX_const(sv);
3282 if (lp)
3283 *lp = len;
3284 SvCUR_set(sv, len);
3285 }
79072805 3286 SvPOK_on(sv);
1d7c1841 3287 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2pv(%s)\n",
3f7c398e 3288 PTR2UV(sv),SvPVX_const(sv)));
4d84ee25
NC
3289 if (flags & SV_CONST_RETURN)
3290 return (char *)SvPVX_const(sv);
10516c54
NC
3291 if (flags & SV_MUTABLE_RETURN)
3292 return SvPVX_mutable(sv);
463ee0b2 3293 return SvPVX(sv);
a0d0e21e
LW
3294
3295 tokensave:
3296 if (SvROK(sv)) { /* XXX Skip this when sv_pvn_force calls */
3297 /* Sneaky stuff here */
3298
3299 tokensaveref:
46fc3d4c 3300 if (!tsv)
96827780 3301 tsv = newSVpv(tmpbuf, 0);
46fc3d4c 3302 sv_2mortal(tsv);
cdb061a3
NC
3303 if (lp)
3304 *lp = SvCUR(tsv);
46fc3d4c 3305 return SvPVX(tsv);
a0d0e21e
LW
3306 }
3307 else {
27da23d5 3308 dVAR;
a0d0e21e 3309 STRLEN len;
73d840c0 3310 const char *t;
46fc3d4c 3311
3312 if (tsv) {
3313 sv_2mortal(tsv);
3f7c398e 3314 t = SvPVX_const(tsv);
46fc3d4c 3315 len = SvCUR(tsv);
3316 }
3317 else {
96827780
MB
3318 t = tmpbuf;
3319 len = strlen(tmpbuf);
46fc3d4c 3320 }
a0d0e21e 3321#ifdef FIXNEGATIVEZERO
46fc3d4c 3322 if (len == 2 && t[0] == '-' && t[1] == '0') {
3323 t = "0";
3324 len = 1;
3325 }
a0d0e21e 3326#endif
862a34c6 3327 SvUPGRADE(sv, SVt_PV);
cdb061a3
NC
3328 if (lp)
3329 *lp = len;
5902b6a9 3330 s = SvGROW_mutable(sv, len + 1);
a0d0e21e 3331 SvCUR_set(sv, len);
6bf554b4 3332 SvPOKp_on(sv);
490a0e98 3333 return memcpy(s, t, len + 1);
a0d0e21e 3334 }
463ee0b2
LW
3335}
3336
645c22ef 3337/*
6050d10e
JP
3338=for apidoc sv_copypv
3339
3340Copies a stringified representation of the source SV into the
3341destination SV. Automatically performs any necessary mg_get and
54f0641b 3342coercion of numeric values into strings. Guaranteed to preserve
6050d10e 3343UTF-8 flag even from overloaded objects. Similar in nature to
54f0641b
NIS
3344sv_2pv[_flags] but operates directly on an SV instead of just the
3345string. Mostly uses sv_2pv_flags to do its work, except when that
6050d10e
JP
3346would lose the UTF-8'ness of the PV.
3347
3348=cut
3349*/
3350
3351void
3352Perl_sv_copypv(pTHX_ SV *dsv, register SV *ssv)
3353{
446eaa42 3354 STRLEN len;
53c1dcc0 3355 const char * const s = SvPV_const(ssv,len);
cb50f42d 3356 sv_setpvn(dsv,s,len);
446eaa42 3357 if (SvUTF8(ssv))
cb50f42d 3358 SvUTF8_on(dsv);
446eaa42 3359 else
cb50f42d 3360 SvUTF8_off(dsv);
6050d10e
JP
3361}
3362
3363/*
645c22ef
DM
3364=for apidoc sv_2pvbyte_nolen
3365
3366Return a pointer to the byte-encoded representation of the SV.
1e54db1a 3367May cause the SV to be downgraded from UTF-8 as a side-effect.
645c22ef
DM
3368
3369Usually accessed via the C<SvPVbyte_nolen> macro.
3370
3371=cut
3372*/
3373
7340a771
GS
3374char *
3375Perl_sv_2pvbyte_nolen(pTHX_ register SV *sv)
3376{
dafda6d1 3377 return sv_2pvbyte(sv, 0);
7340a771
GS
3378}
3379
645c22ef
DM
3380/*
3381=for apidoc sv_2pvbyte
3382
3383Return a pointer to the byte-encoded representation of the SV, and set *lp
1e54db1a 3384to its length. May cause the SV to be downgraded from UTF-8 as a
645c22ef
DM
3385side-effect.
3386
3387Usually accessed via the C<SvPVbyte> macro.
3388
3389=cut
3390*/
3391
7340a771
GS
3392char *
3393Perl_sv_2pvbyte(pTHX_ register SV *sv, STRLEN *lp)
3394{
0875d2fe 3395 sv_utf8_downgrade(sv,0);
97972285 3396 return lp ? SvPV(sv,*lp) : SvPV_nolen(sv);
7340a771
GS
3397}
3398
645c22ef
DM
3399/*
3400=for apidoc sv_2pvutf8_nolen
3401
1e54db1a
JH
3402Return a pointer to the UTF-8-encoded representation of the SV.
3403May cause the SV to be upgraded to UTF-8 as a side-effect.
645c22ef
DM
3404
3405Usually accessed via the C<SvPVutf8_nolen> macro.
3406
3407=cut
3408*/
3409
7340a771
GS
3410char *
3411Perl_sv_2pvutf8_nolen(pTHX_ register SV *sv)
3412{
dafda6d1 3413 return sv_2pvutf8(sv, 0);
7340a771
GS
3414}
3415
645c22ef
DM
3416/*
3417=for apidoc sv_2pvutf8
3418
1e54db1a
JH
3419Return a pointer to the UTF-8-encoded representation of the SV, and set *lp
3420to its length. May cause the SV to be upgraded to UTF-8 as a side-effect.
645c22ef
DM
3421
3422Usually accessed via the C<SvPVutf8> macro.
3423
3424=cut
3425*/
3426
7340a771
GS
3427char *
3428Perl_sv_2pvutf8(pTHX_ register SV *sv, STRLEN *lp)
3429{
560a288e 3430 sv_utf8_upgrade(sv);
7d59b7e4 3431 return SvPV(sv,*lp);
7340a771 3432}
1c846c1f 3433
645c22ef
DM
3434/*
3435=for apidoc sv_2bool
3436
3437This function is only called on magical items, and is only used by
8cf8f3d1 3438sv_true() or its macro equivalent.
645c22ef
DM
3439
3440=cut
3441*/
3442
463ee0b2 3443bool
864dbfa3 3444Perl_sv_2bool(pTHX_ register SV *sv)
463ee0b2 3445{
5b295bef 3446 SvGETMAGIC(sv);
463ee0b2 3447
a0d0e21e
LW
3448 if (!SvOK(sv))
3449 return 0;
3450 if (SvROK(sv)) {
a0d0e21e 3451 SV* tmpsv;
1554e226 3452 if (SvAMAGIC(sv) && (tmpsv=AMG_CALLun(sv,bool_)) &&
9e3013b1 3453 (!SvROK(tmpsv) || (SvRV(tmpsv) != SvRV(sv))))
8a31060d 3454 return (bool)SvTRUE(tmpsv);
a0d0e21e
LW
3455 return SvRV(sv) != 0;
3456 }
463ee0b2 3457 if (SvPOKp(sv)) {
53c1dcc0
AL
3458 register XPV* const Xpvtmp = (XPV*)SvANY(sv);
3459 if (Xpvtmp &&
339049b0 3460 (*sv->sv_u.svu_pv > '0' ||
11343788 3461 Xpvtmp->xpv_cur > 1 ||
339049b0 3462 (Xpvtmp->xpv_cur && *sv->sv_u.svu_pv != '0')))
463ee0b2
LW
3463 return 1;
3464 else
3465 return 0;
3466 }
3467 else {
3468 if (SvIOKp(sv))
3469 return SvIVX(sv) != 0;
3470 else {
3471 if (SvNOKp(sv))
3472 return SvNVX(sv) != 0.0;
3473 else
3474 return FALSE;
3475 }
3476 }
79072805
LW
3477}
3478
09540bc3
JH
3479/* sv_utf8_upgrade() is now a macro using sv_utf8_upgrade_flags();
3480 * this function provided for binary compatibility only
3481 */
3482
3483
3484STRLEN
3485Perl_sv_utf8_upgrade(pTHX_ register SV *sv)
3486{
3487 return sv_utf8_upgrade_flags(sv, SV_GMAGIC);
3488}
3489
c461cf8f
JH
3490/*
3491=for apidoc sv_utf8_upgrade
3492
78ea37eb 3493Converts the PV of an SV to its UTF-8-encoded form.
645c22ef 3494Forces the SV to string form if it is not already.
4411f3b6
NIS
3495Always sets the SvUTF8 flag to avoid future validity checks even
3496if all the bytes have hibit clear.
c461cf8f 3497
13a6c0e0
JH
3498This is not as a general purpose byte encoding to Unicode interface:
3499use the Encode extension for that.
3500
8d6d96c1
HS
3501=for apidoc sv_utf8_upgrade_flags
3502
78ea37eb 3503Converts the PV of an SV to its UTF-8-encoded form.
645c22ef 3504Forces the SV to string form if it is not already.
8d6d96c1
HS
3505Always sets the SvUTF8 flag to avoid future validity checks even
3506if all the bytes have hibit clear. If C<flags> has C<SV_GMAGIC> bit set,
3507will C<mg_get> on C<sv> if appropriate, else not. C<sv_utf8_upgrade> and
3508C<sv_utf8_upgrade_nomg> are implemented in terms of this function.
3509
13a6c0e0
JH
3510This is not as a general purpose byte encoding to Unicode interface:
3511use the Encode extension for that.
3512
8d6d96c1
HS
3513=cut
3514*/
3515
3516STRLEN
3517Perl_sv_utf8_upgrade_flags(pTHX_ register SV *sv, I32 flags)
3518{
808c356f
RGS
3519 if (sv == &PL_sv_undef)
3520 return 0;
e0e62c2a
NIS
3521 if (!SvPOK(sv)) {
3522 STRLEN len = 0;
d52b7888
NC
3523 if (SvREADONLY(sv) && (SvPOKp(sv) || SvIOKp(sv) || SvNOKp(sv))) {
3524 (void) sv_2pv_flags(sv,&len, flags);
3525 if (SvUTF8(sv))
3526 return len;
3527 } else {
3528 (void) SvPV_force(sv,len);
3529 }
e0e62c2a 3530 }
4411f3b6 3531
f5cee72b 3532 if (SvUTF8(sv)) {
5fec3b1d 3533 return SvCUR(sv);
f5cee72b 3534 }
5fec3b1d 3535
765f542d
NC
3536 if (SvIsCOW(sv)) {
3537 sv_force_normal_flags(sv, 0);
db42d148
NIS
3538 }
3539
88632417 3540 if (PL_encoding && !(flags & SV_UTF8_NO_ENCODING))
799ef3cb 3541 sv_recode_to_utf8(sv, PL_encoding);
9f4817db 3542 else { /* Assume Latin-1/EBCDIC */
c4e7c712
NC
3543 /* This function could be much more efficient if we
3544 * had a FLAG in SVs to signal if there are any hibit
3545 * chars in the PV. Given that there isn't such a flag
3546 * make the loop as fast as possible. */
93524f2b
NC
3547 const U8 *s = (U8 *) SvPVX_const(sv);
3548 const U8 *e = (U8 *) SvEND(sv);
3549 const U8 *t = s;
c4e7c712
NC
3550 int hibit = 0;
3551
3552 while (t < e) {
53c1dcc0 3553 const U8 ch = *t++;
c4e7c712
NC
3554 if ((hibit = !NATIVE_IS_INVARIANT(ch)))
3555 break;
3556 }
3557 if (hibit) {
3558 STRLEN len = SvCUR(sv) + 1; /* Plus the \0 */
53c1dcc0 3559 U8 * const recoded = bytes_to_utf8((U8*)s, &len);
c4e7c712
NC
3560
3561 SvPV_free(sv); /* No longer using what was there before. */
3562
1e2ebb21 3563 SvPV_set(sv, (char*)recoded);
c4e7c712
NC
3564 SvCUR_set(sv, len - 1);
3565 SvLEN_set(sv, len); /* No longer know the real size. */
3566 }
3567 /* Mark as UTF-8 even if no hibit - saves scanning loop */
3568 SvUTF8_on(sv);
560a288e 3569 }
4411f3b6 3570 return SvCUR(sv);
560a288e
GS
3571}
3572
c461cf8f
JH
3573/*
3574=for apidoc sv_utf8_downgrade
3575
78ea37eb
TS
3576Attempts to convert the PV of an SV from characters to bytes.
3577If the PV contains a character beyond byte, this conversion will fail;
3578in this case, either returns false or, if C<fail_ok> is not
c461cf8f
JH
3579true, croaks.
3580
13a6c0e0
JH
3581This is not as a general purpose Unicode to byte encoding interface:
3582use the Encode extension for that.
3583
c461cf8f
JH
3584=cut
3585*/
3586
560a288e
GS
3587bool
3588Perl_sv_utf8_downgrade(pTHX_ register SV* sv, bool fail_ok)
3589{
78ea37eb 3590 if (SvPOKp(sv) && SvUTF8(sv)) {
fa301091 3591 if (SvCUR(sv)) {
03cfe0ae 3592 U8 *s;
652088fc 3593 STRLEN len;
fa301091 3594
765f542d
NC
3595 if (SvIsCOW(sv)) {
3596 sv_force_normal_flags(sv, 0);
3597 }
03cfe0ae
NIS
3598 s = (U8 *) SvPV(sv, len);
3599 if (!utf8_to_bytes(s, &len)) {
fa301091
JH
3600 if (fail_ok)
3601 return FALSE;
3602 else {
3603 if (PL_op)
3604 Perl_croak(aTHX_ "Wide character in %s",
53e06cf0 3605 OP_DESC(PL_op));
fa301091
JH
3606 else
3607 Perl_croak(aTHX_ "Wide character");
3608 }
4b3603a4 3609 }
b162af07 3610 SvCUR_set(sv, len);
67e989fb 3611 }
560a288e 3612 }
ffebcc3e 3613 SvUTF8_off(sv);
560a288e
GS
3614 return TRUE;
3615}
3616
c461cf8f
JH
3617/*
3618=for apidoc sv_utf8_encode
3619
78ea37eb
TS
3620Converts the PV of an SV to UTF-8, but then turns the C<SvUTF8>
3621flag off so that it looks like octets again.
c461cf8f
JH
3622
3623=cut
3624*/
3625
560a288e
GS
3626void
3627Perl_sv_utf8_encode(pTHX_ register SV *sv)
3628{
4411f3b6 3629 (void) sv_utf8_upgrade(sv);
4c94c214
NC
3630 if (SvIsCOW(sv)) {
3631 sv_force_normal_flags(sv, 0);
3632 }
3633 if (SvREADONLY(sv)) {
3634 Perl_croak(aTHX_ PL_no_modify);
3635 }
560a288e
GS
3636 SvUTF8_off(sv);
3637}
3638
4411f3b6
NIS
3639/*
3640=for apidoc sv_utf8_decode
3641
78ea37eb
TS
3642If the PV of the SV is an octet sequence in UTF-8
3643and contains a multiple-byte character, the C<SvUTF8> flag is turned on
3644so that it looks like a character. If the PV contains only single-byte
3645characters, the C<SvUTF8> flag stays being off.
3646Scans PV for validity and returns false if the PV is invalid UTF-8.
4411f3b6
NIS
3647
3648=cut
3649*/
3650
560a288e
GS
3651bool
3652Perl_sv_utf8_decode(pTHX_ register SV *sv)
3653{
78ea37eb 3654 if (SvPOKp(sv)) {
93524f2b
NC
3655 const U8 *c;
3656 const U8 *e;
9cbac4c7 3657
645c22ef
DM
3658 /* The octets may have got themselves encoded - get them back as
3659 * bytes
3660 */
3661 if (!sv_utf8_downgrade(sv, TRUE))
560a288e
GS
3662 return FALSE;
3663
3664 /* it is actually just a matter of turning the utf8 flag on, but
3665 * we want to make sure everything inside is valid utf8 first.
3666 */
93524f2b 3667 c = (const U8 *) SvPVX_const(sv);
63cd0674 3668 if (!is_utf8_string(c, SvCUR(sv)+1))
67e989fb 3669 return FALSE;
93524f2b 3670 e = (const U8 *) SvEND(sv);
511c2ff0 3671 while (c < e) {
b64e5050 3672 const U8 ch = *c++;
c4d5f83a 3673 if (!UTF8_IS_INVARIANT(ch)) {
67e989fb
JH
3674 SvUTF8_on(sv);
3675 break;
3676 }
560a288e 3677 }
560a288e
GS
3678 }
3679 return TRUE;
3680}
3681
09540bc3
JH
3682/* sv_setsv() is now a macro using Perl_sv_setsv_flags();
3683 * this function provided for binary compatibility only
3684 */
3685
3686void
3687Perl_sv_setsv(pTHX_ SV *dstr, register SV *sstr)
3688{
3689 sv_setsv_flags(dstr, sstr, SV_GMAGIC);
3690}
3691
954c1994
GS
3692/*
3693=for apidoc sv_setsv
3694
645c22ef
DM
3695Copies the contents of the source SV C<ssv> into the destination SV
3696C<dsv>. The source SV may be destroyed if it is mortal, so don't use this
3697function if the source SV needs to be reused. Does not handle 'set' magic.
3698Loosely speaking, it performs a copy-by-value, obliterating any previous
3699content of the destination.
3700
3701You probably want to use one of the assortment of wrappers, such as
3702C<SvSetSV>, C<SvSetSV_nosteal>, C<SvSetMagicSV> and
3703C<SvSetMagicSV_nosteal>.
3704
8d6d96c1
HS
3705=for apidoc sv_setsv_flags
3706
645c22ef
DM
3707Copies the contents of the source SV C<ssv> into the destination SV
3708C<dsv>. The source SV may be destroyed if it is mortal, so don't use this
3709function if the source SV needs to be reused. Does not handle 'set' magic.
3710Loosely speaking, it performs a copy-by-value, obliterating any previous
3711content of the destination.
3712If the C<flags> parameter has the C<SV_GMAGIC> bit set, will C<mg_get> on
5fcdf167
NC
3713C<ssv> if appropriate, else not. If the C<flags> parameter has the
C<SV_NOSTEAL> bit set then the buffers of temps will not be stolen. C<sv_setsv>
3715and C<sv_setsv_nomg> are implemented in terms of this function.
645c22ef
DM
3716
3717You probably want to use one of the assortment of wrappers, such as
3718C<SvSetSV>, C<SvSetSV_nosteal>, C<SvSetMagicSV> and
3719C<SvSetMagicSV_nosteal>.
3720
3721This is the primary function for copying scalars, and most other
3722copy-ish functions and macros use this underneath.
8d6d96c1
HS
3723
3724=cut
3725*/
3726
3727void
3728Perl_sv_setsv_flags(pTHX_ SV *dstr, register SV *sstr, I32 flags)
3729{
8990e307
LW
3730 register U32 sflags;
3731 register int dtype;
3732 register int stype;
463ee0b2 3733
79072805
LW
3734 if (sstr == dstr)
3735 return;
765f542d 3736 SV_CHECK_THINKFIRST_COW_DROP(dstr);
79072805 3737 if (!sstr)
3280af22 3738 sstr = &PL_sv_undef;
8990e307
LW
3739 stype = SvTYPE(sstr);
3740 dtype = SvTYPE(dstr);
79072805 3741
a0d0e21e 3742 SvAMAGIC_off(dstr);
7a5fa8a2 3743 if ( SvVOK(dstr) )
ece467f9
JP
3744 {
3745 /* need to nuke the magic */
3746 mg_free(dstr);
3747 SvRMAGICAL_off(dstr);
3748 }
9e7bc3e8 3749
463ee0b2 3750 /* There's a lot of redundancy below but we're going for speed here */
79072805 3751
8990e307 3752 switch (stype) {
79072805 3753 case SVt_NULL:
aece5585 3754 undef_sstr:
20408e3c
GS
3755 if (dtype != SVt_PVGV) {
3756 (void)SvOK_off(dstr);
3757 return;
3758 }
3759 break;
463ee0b2 3760 case SVt_IV:
aece5585
GA
3761 if (SvIOK(sstr)) {
3762 switch (dtype) {
3763 case SVt_NULL:
8990e307 3764 sv_upgrade(dstr, SVt_IV);
aece5585
GA
3765 break;
3766 case SVt_NV:
8990e307 3767 sv_upgrade(dstr, SVt_PVNV);
aece5585
GA
3768 break;
3769 case SVt_RV:
3770 case SVt_PV:
a0d0e21e 3771 sv_upgrade(dstr, SVt_PVIV);
aece5585
GA
3772 break;
3773 }
3774 (void)SvIOK_only(dstr);
45977657 3775 SvIV_set(dstr, SvIVX(sstr));
25da4f38
IZ
3776 if (SvIsUV(sstr))
3777 SvIsUV_on(dstr);
27c9684d
AP
3778 if (SvTAINTED(sstr))
3779 SvTAINT(dstr);
aece5585 3780 return;
8990e307 3781 }
aece5585
GA
3782 goto undef_sstr;
3783
463ee0b2 3784 case SVt_NV:
aece5585
GA
3785 if (SvNOK(sstr)) {
3786 switch (dtype) {
3787 case SVt_NULL:
3788 case SVt_IV:
8990e307 3789 sv_upgrade(dstr, SVt_NV);
aece5585
GA
3790 break;
3791 case SVt_RV:
3792 case SVt_PV:
3793 case SVt_PVIV:
a0d0e21e 3794 sv_upgrade(dstr, SVt_PVNV);
aece5585
GA
3795 break;
3796 }
9d6ce603 3797 SvNV_set(dstr, SvNVX(sstr));
aece5585 3798 (void)SvNOK_only(dstr);
27c9684d
AP
3799 if (SvTAINTED(sstr))
3800 SvTAINT(dstr);
aece5585 3801 return;
8990e307 3802 }
aece5585
GA
3803 goto undef_sstr;
3804
ed6116ce 3805 case SVt_RV:
8990e307 3806 if (dtype < SVt_RV)
ed6116ce 3807 sv_upgrade(dstr, SVt_RV);
c07a80fd 3808 else if (dtype == SVt_PVGV &&
23bb1b96 3809 SvROK(sstr) && SvTYPE(SvRV(sstr)) == SVt_PVGV) {
c07a80fd 3810 sstr = SvRV(sstr);
a5f75d66 3811 if (sstr == dstr) {
1d7c1841
GS
3812 if (GvIMPORTED(dstr) != GVf_IMPORTED
3813 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3814 {
a5f75d66 3815 GvIMPORTED_on(dstr);
1d7c1841 3816 }
a5f75d66
AD
3817 GvMULTI_on(dstr);
3818 return;
3819 }
c07a80fd 3820 goto glob_assign;
3821 }
ed6116ce 3822 break;
fc36a67e 3823 case SVt_PVFM:
f8c7b90f 3824#ifdef PERL_OLD_COPY_ON_WRITE
d89fc664
NC
3825 if ((SvFLAGS(sstr) & CAN_COW_MASK) == CAN_COW_FLAGS) {
3826 if (dtype < SVt_PVIV)
3827 sv_upgrade(dstr, SVt_PVIV);
3828 break;
3829 }
3830 /* Fall through */
3831#endif
3832 case SVt_PV:
8990e307 3833 if (dtype < SVt_PV)
463ee0b2 3834 sv_upgrade(dstr, SVt_PV);
463ee0b2
LW
3835 break;
3836 case SVt_PVIV:
8990e307 3837 if (dtype < SVt_PVIV)
463ee0b2 3838 sv_upgrade(dstr, SVt_PVIV);
463ee0b2
LW
3839 break;
3840 case SVt_PVNV:
8990e307 3841 if (dtype < SVt_PVNV)
463ee0b2 3842 sv_upgrade(dstr, SVt_PVNV);
463ee0b2 3843 break;
4633a7c4
LW
3844 case SVt_PVAV:
3845 case SVt_PVHV:
3846 case SVt_PVCV:
4633a7c4 3847 case SVt_PVIO:
a3b680e6
AL
3848 {
3849 const char * const type = sv_reftype(sstr,0);
533c011a 3850 if (PL_op)
a3b680e6 3851 Perl_croak(aTHX_ "Bizarre copy of %s in %s", type, OP_NAME(PL_op));
4633a7c4 3852 else
a3b680e6
AL
3853 Perl_croak(aTHX_ "Bizarre copy of %s", type);
3854 }
4633a7c4
LW
3855 break;
3856
79072805 3857 case SVt_PVGV:
8990e307 3858 if (dtype <= SVt_PVGV) {
c07a80fd 3859 glob_assign:
a5f75d66 3860 if (dtype != SVt_PVGV) {
a3b680e6
AL
3861 const char * const name = GvNAME(sstr);
3862 const STRLEN len = GvNAMELEN(sstr);
b76195c2
DM
3863 /* don't upgrade SVt_PVLV: it can hold a glob */
3864 if (dtype != SVt_PVLV)
3865 sv_upgrade(dstr, SVt_PVGV);
14befaf4 3866 sv_magic(dstr, dstr, PERL_MAGIC_glob, Nullch, 0);
e15faf7d
NC
3867 GvSTASH(dstr) = GvSTASH(sstr);
3868 if (GvSTASH(dstr))
3869 Perl_sv_add_backref(aTHX_ (SV*)GvSTASH(dstr), dstr);
a0d0e21e
LW
3870 GvNAME(dstr) = savepvn(name, len);
3871 GvNAMELEN(dstr) = len;
3872 SvFAKE_on(dstr); /* can coerce to non-glob */
3873 }
7bac28a0 3874 /* ahem, death to those who redefine active sort subs */
3280af22
NIS
3875 else if (PL_curstackinfo->si_type == PERLSI_SORT
3876 && GvCV(dstr) && PL_sortcop == CvSTART(GvCV(dstr)))
cea2e8a9 3877 Perl_croak(aTHX_ "Can't redefine active sort subroutine %s",
7bac28a0 3878 GvNAME(dstr));
5bd07a3d 3879
7fb37951
AMS
3880#ifdef GV_UNIQUE_CHECK
3881 if (GvUNIQUE((GV*)dstr)) {
5bd07a3d
DM
3882 Perl_croak(aTHX_ PL_no_modify);
3883 }
3884#endif
3885
a0d0e21e 3886 (void)SvOK_off(dstr);
a5f75d66 3887 GvINTRO_off(dstr); /* one-shot flag */
1edc1566 3888 gp_free((GV*)dstr);
79072805 3889 GvGP(dstr) = gp_ref(GvGP(sstr));
27c9684d
AP
3890 if (SvTAINTED(sstr))
3891 SvTAINT(dstr);
1d7c1841
GS
3892 if (GvIMPORTED(dstr) != GVf_IMPORTED
3893 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3894 {
a5f75d66 3895 GvIMPORTED_on(dstr);
1d7c1841 3896 }
a5f75d66 3897 GvMULTI_on(dstr);
79072805
LW
3898 return;
3899 }
3900 /* FALL THROUGH */
3901
3902 default:
8d6d96c1 3903 if (SvGMAGICAL(sstr) && (flags & SV_GMAGIC)) {
973f89ab 3904 mg_get(sstr);
eb160463 3905 if ((int)SvTYPE(sstr) != stype) {
973f89ab
CS
3906 stype = SvTYPE(sstr);
3907 if (stype == SVt_PVGV && dtype <= SVt_PVGV)
3908 goto glob_assign;
3909 }
3910 }
ded42b9f 3911 if (stype == SVt_PVLV)
862a34c6 3912 SvUPGRADE(dstr, SVt_PVNV);
ded42b9f 3913 else
862a34c6 3914 SvUPGRADE(dstr, (U32)stype);
79072805
LW
3915 }
3916
8990e307
LW
3917 sflags = SvFLAGS(sstr);
3918
3919 if (sflags & SVf_ROK) {
3920 if (dtype >= SVt_PV) {
3921 if (dtype == SVt_PVGV) {
3922 SV *sref = SvREFCNT_inc(SvRV(sstr));
3923 SV *dref = 0;
a3b680e6 3924 const int intro = GvINTRO(dstr);
a0d0e21e 3925
7fb37951
AMS
3926#ifdef GV_UNIQUE_CHECK
3927 if (GvUNIQUE((GV*)dstr)) {
5bd07a3d
DM
3928 Perl_croak(aTHX_ PL_no_modify);
3929 }
3930#endif
3931
a0d0e21e 3932 if (intro) {
a5f75d66 3933 GvINTRO_off(dstr); /* one-shot flag */
1d7c1841 3934 GvLINE(dstr) = CopLINE(PL_curcop);
1edc1566 3935 GvEGV(dstr) = (GV*)dstr;
a0d0e21e 3936 }
a5f75d66 3937 GvMULTI_on(dstr);
8990e307
LW
3938 switch (SvTYPE(sref)) {
3939 case SVt_PVAV:
a0d0e21e 3940 if (intro)
890ed176 3941 SAVEGENERICSV(GvAV(dstr));
a0d0e21e
LW
3942 else
3943 dref = (SV*)GvAV(dstr);
8990e307 3944 GvAV(dstr) = (AV*)sref;
39bac7f7 3945 if (!GvIMPORTED_AV(dstr)
1d7c1841
GS
3946 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3947 {
a5f75d66 3948 GvIMPORTED_AV_on(dstr);
1d7c1841 3949 }
8990e307
LW
3950 break;
3951 case SVt_PVHV:
a0d0e21e 3952 if (intro)
890ed176 3953 SAVEGENERICSV(GvHV(dstr));
a0d0e21e
LW
3954 else
3955 dref = (SV*)GvHV(dstr);
8990e307 3956 GvHV(dstr) = (HV*)sref;
39bac7f7 3957 if (!GvIMPORTED_HV(dstr)
1d7c1841
GS
3958 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3959 {
a5f75d66 3960 GvIMPORTED_HV_on(dstr);
1d7c1841 3961 }
8990e307
LW
3962 break;
3963 case SVt_PVCV:
8ebc5c01 3964 if (intro) {
3965 if (GvCVGEN(dstr) && GvCV(dstr) != (CV*)sref) {
3966 SvREFCNT_dec(GvCV(dstr));
3967 GvCV(dstr) = Nullcv;
68dc0745 3968 GvCVGEN(dstr) = 0; /* Switch off cacheness. */
3280af22 3969 PL_sub_generation++;
8ebc5c01 3970 }
890ed176 3971 SAVEGENERICSV(GvCV(dstr));
8ebc5c01 3972 }
68dc0745 3973 else
3974 dref = (SV*)GvCV(dstr);
3975 if (GvCV(dstr) != (CV*)sref) {
748a9306 3976 CV* cv = GvCV(dstr);
4633a7c4 3977 if (cv) {
68dc0745 3978 if (!GvCVGEN((GV*)dstr) &&
3979 (CvROOT(cv) || CvXSUB(cv)))
3980 {
7bac28a0 3981 /* ahem, death to those who redefine
3982 * active sort subs */
3280af22
NIS
3983 if (PL_curstackinfo->si_type == PERLSI_SORT &&
3984 PL_sortcop == CvSTART(cv))
1c846c1f 3985 Perl_croak(aTHX_
7bac28a0 3986 "Can't redefine active sort subroutine %s",
3987 GvENAME((GV*)dstr));
beab0874
JT
3988 /* Redefining a sub - warning is mandatory if
3989 it was a const and its value changed. */
3990 if (ckWARN(WARN_REDEFINE)
3991 || (CvCONST(cv)
3992 && (!CvCONST((CV*)sref)
3993 || sv_cmp(cv_const_sv(cv),
3994 cv_const_sv((CV*)sref)))))
3995 {
9014280d 3996 Perl_warner(aTHX_ packWARN(WARN_REDEFINE),
beab0874 3997 CvCONST(cv)
910764e6
RGS
3998 ? "Constant subroutine %s::%s redefined"
3999 : "Subroutine %s::%s redefined",
bfcb3514 4000 HvNAME_get(GvSTASH((GV*)dstr)),
beab0874
JT
4001 GvENAME((GV*)dstr));
4002 }
9607fc9c 4003 }
fb24441d
RGS
4004 if (!intro)
4005 cv_ckproto(cv, (GV*)dstr,
93524f2b
NC
4006 SvPOK(sref)
4007 ? SvPVX_const(sref) : Nullch);
4633a7c4 4008 }
a5f75d66 4009 GvCV(dstr) = (CV*)sref;
7a4c00b4 4010 GvCVGEN(dstr) = 0; /* Switch off cacheness. */
a5f75d66 4011 GvASSUMECV_on(dstr);
3280af22 4012 PL_sub_generation++;
a5f75d66 4013 }
39bac7f7 4014 if (!GvIMPORTED_CV(dstr)
1d7c1841
GS
4015 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
4016 {
a5f75d66 4017 GvIMPORTED_CV_on(dstr);
1d7c1841 4018 }
8990e307 4019 break;
91bba347
LW
4020 case SVt_PVIO:
4021 if (intro)
890ed176 4022 SAVEGENERICSV(GvIOp(dstr));
91bba347
LW
4023 else
4024 dref = (SV*)GvIOp(dstr);
4025 GvIOp(dstr) = (IO*)sref;
4026 break;
f4d13ee9
JH
4027 case SVt_PVFM:
4028 if (intro)
890ed176 4029 SAVEGENERICSV(GvFORM(dstr));
f4d13ee9
JH
4030 else
4031 dref = (SV*)GvFORM(dstr);
4032 GvFORM(dstr) = (CV*)sref;
4033 break;
8990e307 4034 default:
a0d0e21e 4035 if (intro)
890ed176 4036 SAVEGENERICSV(GvSV(dstr));
a0d0e21e
LW
4037 else
4038 dref = (SV*)GvSV(dstr);
8990e307 4039 GvSV(dstr) = sref;
39bac7f7 4040 if (!GvIMPORTED_SV(dstr)
1d7c1841
GS
4041 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
4042 {
a5f75d66 4043 GvIMPORTED_SV_on(dstr);
1d7c1841 4044 }
8990e307
LW
4045 break;
4046 }
4047 if (dref)
4048 SvREFCNT_dec(dref);
27c9684d
AP
4049 if (SvTAINTED(sstr))
4050 SvTAINT(dstr);
8990e307
LW
4051 return;
4052 }
3f7c398e 4053 if (SvPVX_const(dstr)) {
8bd4d4c5 4054 SvPV_free(dstr);
b162af07
SP
4055 SvLEN_set(dstr, 0);
4056 SvCUR_set(dstr, 0);
a0d0e21e 4057 }
8990e307 4058 }
a0d0e21e 4059 (void)SvOK_off(dstr);
b162af07 4060 SvRV_set(dstr, SvREFCNT_inc(SvRV(sstr)));
ed6116ce 4061 SvROK_on(dstr);
8990e307 4062 if (sflags & SVp_NOK) {
3332b3c1
JH
4063 SvNOKp_on(dstr);
4064 /* Only set the public OK flag if the source has public OK. */
4065 if (sflags & SVf_NOK)
4066 SvFLAGS(dstr) |= SVf_NOK;
9d6ce603 4067 SvNV_set(dstr, SvNVX(sstr));
ed6116ce 4068 }
8990e307 4069 if (sflags & SVp_IOK) {
3332b3c1
JH
4070 (void)SvIOKp_on(dstr);
4071 if (sflags & SVf_IOK)
4072 SvFLAGS(dstr) |= SVf_IOK;
2b1c7e3e 4073 if (sflags & SVf_IVisUV)
25da4f38 4074 SvIsUV_on(dstr);
45977657 4075 SvIV_set(dstr, SvIVX(sstr));
ed6116ce 4076 }
a0d0e21e
LW
4077 if (SvAMAGIC(sstr)) {
4078 SvAMAGIC_on(dstr);
4079 }
ed6116ce 4080 }
8990e307 4081 else if (sflags & SVp_POK) {
765f542d 4082 bool isSwipe = 0;
79072805
LW
4083
4084 /*
4085 * Check to see if we can just swipe the string. If so, it's a
4086 * possible small lose on short strings, but a big win on long ones.
3f7c398e
SP
4087 * It might even be a win on short strings if SvPVX_const(dstr)
4088 * has to be allocated and SvPVX_const(sstr) has to be freed.
79072805
LW
4089 */
4090
120fac95
NC
4091 /* Whichever path we take through the next code, we want this true,
4092 and doing it now facilitates the COW check. */
4093 (void)SvPOK_only(dstr);
4094
765f542d 4095 if (
b8f9541a
NC
4096 /* We're not already COW */
4097 ((sflags & (SVf_FAKE | SVf_READONLY)) != (SVf_FAKE | SVf_READONLY)
f8c7b90f 4098#ifndef PERL_OLD_COPY_ON_WRITE
b8f9541a
NC
4099 /* or we are, but dstr isn't a suitable target. */
4100 || (SvFLAGS(dstr) & CAN_COW_MASK) != CAN_COW_FLAGS
4101#endif
4102 )
765f542d 4103 &&
765f542d
NC
4104 !(isSwipe =
4105 (sflags & SVs_TEMP) && /* slated for free anyway? */
4106 !(sflags & SVf_OOK) && /* and not involved in OOK hack? */
5fcdf167
NC
4107 (!(flags & SV_NOSTEAL)) &&
4108 /* and we're allowed to steal temps */
765f542d
NC
4109 SvREFCNT(sstr) == 1 && /* and no other references to it? */
4110 SvLEN(sstr) && /* and really is a string */
645c22ef 4111 /* and won't be needed again, potentially */
765f542d 4112 !(PL_op && PL_op->op_type == OP_AASSIGN))
f8c7b90f 4113#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 4114 && !((sflags & CAN_COW_MASK) == CAN_COW_FLAGS
120fac95 4115 && (SvFLAGS(dstr) & CAN_COW_MASK) == CAN_COW_FLAGS
765f542d
NC
4116 && SvTYPE(sstr) >= SVt_PVIV)
4117#endif
4118 ) {
4119 /* Failed the swipe test, and it's not a shared hash key either.
4120 Have to copy the string. */
4121 STRLEN len = SvCUR(sstr);
4122 SvGROW(dstr, len + 1); /* inlined from sv_setpvn */
3f7c398e 4123 Move(SvPVX_const(sstr),SvPVX(dstr),len,char);
765f542d
NC
4124 SvCUR_set(dstr, len);
4125 *SvEND(dstr) = '\0';
765f542d 4126 } else {
f8c7b90f 4127 /* If PERL_OLD_COPY_ON_WRITE is not defined, then isSwipe will always
765f542d 4128 be true in here. */
765f542d
NC
4129 /* Either it's a shared hash key, or it's suitable for
4130 copy-on-write or we can swipe the string. */
46187eeb 4131 if (DEBUG_C_TEST) {
ed252734 4132 PerlIO_printf(Perl_debug_log, "Copy on write: sstr --> dstr\n");
e419cbc5
NC
4133 sv_dump(sstr);
4134 sv_dump(dstr);
46187eeb 4135 }
f8c7b90f 4136#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4137 if (!isSwipe) {
4138 /* I believe I should acquire a global SV mutex if
4139 it's a COW sv (not a shared hash key) to stop
4140 it going un copy-on-write.
4141 If the source SV has gone un copy on write between up there
4142 and down here, then (assert() that) it is of the correct
4143 form to make it copy on write again */
4144 if ((sflags & (SVf_FAKE | SVf_READONLY))
4145 != (SVf_FAKE | SVf_READONLY)) {
4146 SvREADONLY_on(sstr);
4147 SvFAKE_on(sstr);
4148 /* Make the source SV into a loop of 1.
4149 (about to become 2) */
a29f6d03 4150 SV_COW_NEXT_SV_SET(sstr, sstr);
765f542d
NC
4151 }
4152 }
4153#endif
4154 /* Initial code is common. */
94010e71
NC
4155 if (SvPVX_const(dstr)) { /* we know that dtype >= SVt_PV */
4156 SvPV_free(dstr);
79072805 4157 }
765f542d 4158
765f542d
NC
4159 if (!isSwipe) {
4160 /* making another shared SV. */
4161 STRLEN cur = SvCUR(sstr);
4162 STRLEN len = SvLEN(sstr);
f8c7b90f 4163#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 4164 if (len) {
b8f9541a 4165 assert (SvTYPE(dstr) >= SVt_PVIV);
765f542d
NC
4166 /* SvIsCOW_normal */
4167 /* splice us in between source and next-after-source. */
a29f6d03
NC
4168 SV_COW_NEXT_SV_SET(dstr, SV_COW_NEXT_SV(sstr));
4169 SV_COW_NEXT_SV_SET(sstr, dstr);
940132f3 4170 SvPV_set(dstr, SvPVX_mutable(sstr));
a604c751
NC
4171 } else
4172#endif
4173 {
765f542d 4174 /* SvIsCOW_shared_hash */
46187eeb
NC
4175 DEBUG_C(PerlIO_printf(Perl_debug_log,
4176 "Copy on write: Sharing hash\n"));
b8f9541a 4177
bdd68bc3 4178 assert (SvTYPE(dstr) >= SVt_PV);
765f542d 4179 SvPV_set(dstr,
d1db91c6 4180 HEK_KEY(share_hek_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr)))));
bdd68bc3 4181 }
87a1ef3d
SP
4182 SvLEN_set(dstr, len);
4183 SvCUR_set(dstr, cur);
765f542d
NC
4184 SvREADONLY_on(dstr);
4185 SvFAKE_on(dstr);
4186 /* Release a global SV mutex.  */
4187 }
4188 else
765f542d 4189 { /* Passes the swipe test. */
78d1e721 4190 SvPV_set(dstr, SvPVX_mutable(sstr));
765f542d
NC
4191 SvLEN_set(dstr, SvLEN(sstr));
4192 SvCUR_set(dstr, SvCUR(sstr));
4193
4194 SvTEMP_off(dstr);
4195 (void)SvOK_off(sstr); /* NOTE: nukes most SvFLAGS on sstr */
4196 SvPV_set(sstr, Nullch);
4197 SvLEN_set(sstr, 0);
4198 SvCUR_set(sstr, 0);
4199 SvTEMP_off(sstr);
4200 }
4201 }
9aa983d2 4202 if (sflags & SVf_UTF8)
a7cb1f99 4203 SvUTF8_on(dstr);
8990e307 4204 if (sflags & SVp_NOK) {
3332b3c1
JH
4205 SvNOKp_on(dstr);
4206 if (sflags & SVf_NOK)
4207 SvFLAGS(dstr) |= SVf_NOK;
9d6ce603 4208 SvNV_set(dstr, SvNVX(sstr));
79072805 4209 }
8990e307 4210 if (sflags & SVp_IOK) {
3332b3c1
JH
4211 (void)SvIOKp_on(dstr);
4212 if (sflags & SVf_IOK)
4213 SvFLAGS(dstr) |= SVf_IOK;
2b1c7e3e 4214 if (sflags & SVf_IVisUV)
25da4f38 4215 SvIsUV_on(dstr);
45977657 4216 SvIV_set(dstr, SvIVX(sstr));
79072805 4217 }
92f0c265 4218 if (SvVOK(sstr)) {
7a5fa8a2 4219 MAGIC *smg = mg_find(sstr,PERL_MAGIC_vstring);
ece467f9
JP
4220 sv_magic(dstr, NULL, PERL_MAGIC_vstring,
4221 smg->mg_ptr, smg->mg_len);
439cb1c4 4222 SvRMAGICAL_on(dstr);
7a5fa8a2 4223 }
79072805 4224 }
8990e307 4225 else if (sflags & SVp_IOK) {
3332b3c1
JH
4226 if (sflags & SVf_IOK)
4227 (void)SvIOK_only(dstr);
4228 else {
9cbac4c7
DM
4229 (void)SvOK_off(dstr);
4230 (void)SvIOKp_on(dstr);
3332b3c1
JH
4231 }
4232 /* XXXX Do we want to set IsUV for IV(ROK)? Be extra safe... */
2b1c7e3e 4233 if (sflags & SVf_IVisUV)
25da4f38 4234 SvIsUV_on(dstr);
45977657 4235 SvIV_set(dstr, SvIVX(sstr));
3332b3c1
JH
4236 if (sflags & SVp_NOK) {
4237 if (sflags & SVf_NOK)
4238 (void)SvNOK_on(dstr);
4239 else
4240 (void)SvNOKp_on(dstr);
9d6ce603 4241 SvNV_set(dstr, SvNVX(sstr));
3332b3c1
JH
4242 }
4243 }
4244 else if (sflags & SVp_NOK) {
4245 if (sflags & SVf_NOK)
4246 (void)SvNOK_only(dstr);
4247 else {
9cbac4c7 4248 (void)SvOK_off(dstr);
3332b3c1
JH
4249 SvNOKp_on(dstr);
4250 }
9d6ce603 4251 SvNV_set(dstr, SvNVX(sstr));
79072805
LW
4252 }
4253 else {
20408e3c 4254 if (dtype == SVt_PVGV) {
e476b1b5 4255 if (ckWARN(WARN_MISC))
9014280d 4256 Perl_warner(aTHX_ packWARN(WARN_MISC), "Undefined value assigned to typeglob");
20408e3c
GS
4257 }
4258 else
4259 (void)SvOK_off(dstr);
a0d0e21e 4260 }
27c9684d
AP
4261 if (SvTAINTED(sstr))
4262 SvTAINT(dstr);
79072805
LW
4263}
4264
954c1994
GS
4265/*
4266=for apidoc sv_setsv_mg
4267
4268Like C<sv_setsv>, but also handles 'set' magic.
4269
4270=cut
4271*/
4272
79072805 4273void
864dbfa3 4274Perl_sv_setsv_mg(pTHX_ SV *dstr, register SV *sstr)
ef50df4b
GS
4275{
4276 sv_setsv(dstr,sstr);
4277 SvSETMAGIC(dstr);
4278}
4279
f8c7b90f 4280#ifdef PERL_OLD_COPY_ON_WRITE
ed252734
NC
4281SV *
4282Perl_sv_setsv_cow(pTHX_ SV *dstr, SV *sstr)
4283{
4284 STRLEN cur = SvCUR(sstr);
4285 STRLEN len = SvLEN(sstr);
4286 register char *new_pv;
4287
4288 if (DEBUG_C_TEST) {
4289 PerlIO_printf(Perl_debug_log, "Fast copy on write: %p -> %p\n",
4290 sstr, dstr);
4291 sv_dump(sstr);
4292 if (dstr)
4293 sv_dump(dstr);
4294 }
4295
4296 if (dstr) {
4297 if (SvTHINKFIRST(dstr))
4298 sv_force_normal_flags(dstr, SV_COW_DROP_PV);
3f7c398e
SP
4299 else if (SvPVX_const(dstr))
4300 Safefree(SvPVX_const(dstr));
ed252734
NC
4301 }
4302 else
4303 new_SV(dstr);
862a34c6 4304 SvUPGRADE(dstr, SVt_PVIV);
ed252734
NC
4305
4306 assert (SvPOK(sstr));
4307 assert (SvPOKp(sstr));
4308 assert (!SvIOK(sstr));
4309 assert (!SvIOKp(sstr));
4310 assert (!SvNOK(sstr));
4311 assert (!SvNOKp(sstr));
4312
4313 if (SvIsCOW(sstr)) {
4314
4315 if (SvLEN(sstr) == 0) {
4316 /* source is a COW shared hash key. */
ed252734
NC
4317 DEBUG_C(PerlIO_printf(Perl_debug_log,
4318 "Fast copy on write: Sharing hash\n"));
d1db91c6 4319 new_pv = HEK_KEY(share_hek_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr))));
ed252734
NC
4320 goto common_exit;
4321 }
4322 SV_COW_NEXT_SV_SET(dstr, SV_COW_NEXT_SV(sstr));
4323 } else {
4324 assert ((SvFLAGS(sstr) & CAN_COW_MASK) == CAN_COW_FLAGS);
862a34c6 4325 SvUPGRADE(sstr, SVt_PVIV);
ed252734
NC
4326 SvREADONLY_on(sstr);
4327 SvFAKE_on(sstr);
4328 DEBUG_C(PerlIO_printf(Perl_debug_log,
4329 "Fast copy on write: Converting sstr to COW\n"));
4330 SV_COW_NEXT_SV_SET(dstr, sstr);
4331 }
4332 SV_COW_NEXT_SV_SET(sstr, dstr);
940132f3 4333 new_pv = SvPVX_mutable(sstr);
ed252734
NC
4334
4335 common_exit:
4336 SvPV_set(dstr, new_pv);
4337 SvFLAGS(dstr) = (SVt_PVIV|SVf_POK|SVp_POK|SVf_FAKE|SVf_READONLY);
4338 if (SvUTF8(sstr))
4339 SvUTF8_on(dstr);
87a1ef3d
SP
4340 SvLEN_set(dstr, len);
4341 SvCUR_set(dstr, cur);
ed252734
NC
4342 if (DEBUG_C_TEST) {
4343 sv_dump(dstr);
4344 }
4345 return dstr;
4346}
4347#endif
4348
954c1994
GS
4349/*
4350=for apidoc sv_setpvn
4351
4352Copies a string into an SV. The C<len> parameter indicates the number of
9e09f5f2
MHM
4353bytes to be copied. If the C<ptr> argument is NULL the SV will become
4354undefined. Does not handle 'set' magic. See C<sv_setpvn_mg>.
954c1994
GS
4355
4356=cut
4357*/
4358
ef50df4b 4359void
864dbfa3 4360Perl_sv_setpvn(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
79072805 4361{
c6f8c383 4362 register char *dptr;
22c522df 4363
765f542d 4364 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2 4365 if (!ptr) {
a0d0e21e 4366 (void)SvOK_off(sv);
463ee0b2
LW
4367 return;
4368 }
22c522df
JH
4369 else {
4370 /* len is STRLEN which is unsigned, need to copy to signed */
a3b680e6 4371 const IV iv = len;
9c5ffd7c
JH
4372 if (iv < 0)
4373 Perl_croak(aTHX_ "panic: sv_setpvn called with negative strlen");
22c522df 4374 }
862a34c6 4375 SvUPGRADE(sv, SVt_PV);
c6f8c383 4376
5902b6a9 4377 dptr = SvGROW(sv, len + 1);
c6f8c383
GA
4378 Move(ptr,dptr,len,char);
4379 dptr[len] = '\0';
79072805 4380 SvCUR_set(sv, len);
1aa99e6b 4381 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4382 SvTAINT(sv);
79072805
LW
4383}
4384
954c1994
GS
4385/*
4386=for apidoc sv_setpvn_mg
4387
4388Like C<sv_setpvn>, but also handles 'set' magic.
4389
4390=cut
4391*/
4392
79072805 4393void
864dbfa3 4394Perl_sv_setpvn_mg(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
ef50df4b
GS
4395{
4396 sv_setpvn(sv,ptr,len);
4397 SvSETMAGIC(sv);
4398}
4399
954c1994
GS
4400/*
4401=for apidoc sv_setpv
4402
4403Copies a string into an SV. The string must be null-terminated. Does not
4404handle 'set' magic. See C<sv_setpv_mg>.
4405
4406=cut
4407*/
4408
ef50df4b 4409void
864dbfa3 4410Perl_sv_setpv(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4411{
4412 register STRLEN len;
4413
765f542d 4414 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2 4415 if (!ptr) {
a0d0e21e 4416 (void)SvOK_off(sv);
463ee0b2
LW
4417 return;
4418 }
79072805 4419 len = strlen(ptr);
862a34c6 4420 SvUPGRADE(sv, SVt_PV);
c6f8c383 4421
79072805 4422 SvGROW(sv, len + 1);
463ee0b2 4423 Move(ptr,SvPVX(sv),len+1,char);
79072805 4424 SvCUR_set(sv, len);
1aa99e6b 4425 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2
LW
4426 SvTAINT(sv);
4427}
4428
954c1994
GS
4429/*
4430=for apidoc sv_setpv_mg
4431
4432Like C<sv_setpv>, but also handles 'set' magic.
4433
4434=cut
4435*/
4436
463ee0b2 4437void
864dbfa3 4438Perl_sv_setpv_mg(pTHX_ register SV *sv, register const char *ptr)
ef50df4b
GS
4439{
4440 sv_setpv(sv,ptr);
4441 SvSETMAGIC(sv);
4442}
4443
954c1994
GS
4444/*
4445=for apidoc sv_usepvn
4446
4447Tells an SV to use C<ptr> to find its string value. Normally the string is
1c846c1f 4448stored inside the SV but sv_usepvn allows the SV to use an outside string.
954c1994
GS
4449The C<ptr> should point to memory that was allocated by C<malloc>. The
4450string length, C<len>, must be supplied. This function will realloc the
4451memory pointed to by C<ptr>, so that pointer should not be freed or used by
4452the programmer after giving it to sv_usepvn. Does not handle 'set' magic.
4453See C<sv_usepvn_mg>.
4454
4455=cut
4456*/
4457
ef50df4b 4458void
864dbfa3 4459Perl_sv_usepvn(pTHX_ register SV *sv, register char *ptr, register STRLEN len)
463ee0b2 4460{
1936d2a7 4461 STRLEN allocate;
765f542d 4462 SV_CHECK_THINKFIRST_COW_DROP(sv);
862a34c6 4463 SvUPGRADE(sv, SVt_PV);
463ee0b2 4464 if (!ptr) {
a0d0e21e 4465 (void)SvOK_off(sv);
463ee0b2
LW
4466 return;
4467 }
3f7c398e 4468 if (SvPVX_const(sv))
8bd4d4c5 4469 SvPV_free(sv);
1936d2a7
NC
4470
4471 allocate = PERL_STRLEN_ROUNDUP(len + 1);
7a9b70e9 4472 ptr = saferealloc (ptr, allocate);
f880fe2f 4473 SvPV_set(sv, ptr);
463ee0b2 4474 SvCUR_set(sv, len);
1936d2a7 4475 SvLEN_set(sv, allocate);
463ee0b2 4476 *SvEND(sv) = '\0';
1aa99e6b 4477 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4478 SvTAINT(sv);
79072805
LW
4479}
4480
954c1994
GS
4481/*
4482=for apidoc sv_usepvn_mg
4483
4484Like C<sv_usepvn>, but also handles 'set' magic.
4485
4486=cut
4487*/
4488
ef50df4b 4489void
864dbfa3 4490Perl_sv_usepvn_mg(pTHX_ register SV *sv, register char *ptr, register STRLEN len)
ef50df4b 4491{
51c1089b 4492 sv_usepvn(sv,ptr,len);
ef50df4b
GS
4493 SvSETMAGIC(sv);
4494}
4495
f8c7b90f 4496#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4497/* Need to do this *after* making the SV normal, as we need the buffer
4498 pointer to remain valid until after we've copied it. If we let go too early,
4499 another thread could invalidate it by unsharing last of the same hash key
4500 (which it can do by means other than releasing copy-on-write Svs)
4501 or by changing the other copy-on-write SVs in the loop. */
4502STATIC void
bdd68bc3 4503S_sv_release_COW(pTHX_ register SV *sv, const char *pvx, STRLEN len, SV *after)
765f542d
NC
4504{
4505 if (len) { /* this SV was SvIsCOW_normal(sv) */
4506 /* we need to find the SV pointing to us. */
aec46f14 4507 SV * const current = SV_COW_NEXT_SV(after);
7a5fa8a2 4508
765f542d
NC
4509 if (current == sv) {
4510 /* The SV we point to points back to us (there were only two of us
4511 in the loop.)
4512 Hence other SV is no longer copy on write either. */
4513 SvFAKE_off(after);
4514 SvREADONLY_off(after);
4515 } else {
4516 /* We need to follow the pointers around the loop. */
4517 SV *next;
4518 while ((next = SV_COW_NEXT_SV(current)) != sv) {
4519 assert (next);
4520 current = next;
4521 /* don't loop forever if the structure is bust, and we have
4522 a pointer into a closed loop. */
4523 assert (current != after);
3f7c398e 4524 assert (SvPVX_const(current) == pvx);
765f542d
NC
4525 }
4526 /* Make the SV before us point to the SV after us. */
a29f6d03 4527 SV_COW_NEXT_SV_SET(current, after);
765f542d
NC
4528 }
4529 } else {
bdd68bc3 4530 unshare_hek(SvSHARED_HEK_FROM_PV(pvx));
765f542d
NC
4531 }
4532}
4533
4534int
4535Perl_sv_release_IVX(pTHX_ register SV *sv)
4536{
4537 if (SvIsCOW(sv))
4538 sv_force_normal_flags(sv, 0);
0c34ef67
MHM
4539 SvOOK_off(sv);
4540 return 0;
765f542d
NC
4541}
4542#endif
645c22ef
DM
4543/*
4544=for apidoc sv_force_normal_flags
4545
4546Undo various types of fakery on an SV: if the PV is a shared string, make
4547a private copy; if we're a ref, stop refing; if we're a glob, downgrade to
765f542d
NC
4548an xpvmg; if we're a copy-on-write scalar, this is the on-write time when
4549we do the copy, and is also used locally. If C<SV_COW_DROP_PV> is set
4550then a copy-on-write scalar drops its PV buffer (if any) and becomes
4551SvPOK_off rather than making a copy. (Used where this scalar is about to be
d3050d9d 4552set to some other value.) In addition, the C<flags> parameter gets passed to
765f542d
NC
4553C<sv_unref_flags()> when unrefing. C<sv_force_normal> calls this function
4554with flags set to 0.
645c22ef
DM
4555
4556=cut
4557*/
4558
6fc92669 4559void
840a7b70 4560Perl_sv_force_normal_flags(pTHX_ register SV *sv, U32 flags)
0f15f207 4561{
f8c7b90f 4562#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4563 if (SvREADONLY(sv)) {
4564 /* At this point I believe I should acquire a global SV mutex. */
4565 if (SvFAKE(sv)) {
b64e5050 4566 const char * const pvx = SvPVX_const(sv);
a28509cc
AL
4567 const STRLEN len = SvLEN(sv);
4568 const STRLEN cur = SvCUR(sv);
a28509cc 4569 SV * const next = SV_COW_NEXT_SV(sv); /* next COW sv in the loop. */
46187eeb
NC
4570 if (DEBUG_C_TEST) {
4571 PerlIO_printf(Perl_debug_log,
4572 "Copy on write: Force normal %ld\n",
4573 (long) flags);
e419cbc5 4574 sv_dump(sv);
46187eeb 4575 }
765f542d
NC
4576 SvFAKE_off(sv);
4577 SvREADONLY_off(sv);
9f653bb5 4578 /* This SV doesn't own the buffer, so need to Newx() a new one: */
f880fe2f 4579 SvPV_set(sv, (char*)0);
87a1ef3d 4580 SvLEN_set(sv, 0);
765f542d
NC
4581 if (flags & SV_COW_DROP_PV) {
4582 /* OK, so we don't need to copy our buffer. */
4583 SvPOK_off(sv);
4584 } else {
4585 SvGROW(sv, cur + 1);
4586 Move(pvx,SvPVX(sv),cur,char);
87a1ef3d 4587 SvCUR_set(sv, cur);
765f542d
NC
4588 *SvEND(sv) = '\0';
4589 }
bdd68bc3 4590 sv_release_COW(sv, pvx, len, next);
46187eeb 4591 if (DEBUG_C_TEST) {
e419cbc5 4592 sv_dump(sv);
46187eeb 4593 }
765f542d 4594 }
923e4eb5 4595 else if (IN_PERL_RUNTIME)
765f542d
NC
4596 Perl_croak(aTHX_ PL_no_modify);
4597 /* At this point I believe that I can drop the global SV mutex. */
4598 }
4599#else
2213622d 4600 if (SvREADONLY(sv)) {
1c846c1f 4601 if (SvFAKE(sv)) {
b64e5050 4602 const char * const pvx = SvPVX_const(sv);
66a1b24b 4603 const STRLEN len = SvCUR(sv);
10bcdfd6
NC
4604 SvFAKE_off(sv);
4605 SvREADONLY_off(sv);
66a1b24b
AL
4606 SvPV_set(sv, Nullch);
4607 SvLEN_set(sv, 0);
1c846c1f 4608 SvGROW(sv, len + 1);
706aa1c9 4609 Move(pvx,SvPVX(sv),len,char);
1c846c1f 4610 *SvEND(sv) = '\0';
bdd68bc3 4611 unshare_hek(SvSHARED_HEK_FROM_PV(pvx));
1c846c1f 4612 }
923e4eb5 4613 else if (IN_PERL_RUNTIME)
cea2e8a9 4614 Perl_croak(aTHX_ PL_no_modify);
0f15f207 4615 }
765f542d 4616#endif
2213622d 4617 if (SvROK(sv))
840a7b70 4618 sv_unref_flags(sv, flags);
6fc92669
GS
4619 else if (SvFAKE(sv) && SvTYPE(sv) == SVt_PVGV)
4620 sv_unglob(sv);
0f15f207 4621}
1c846c1f 4622
645c22ef
DM
4623/*
4624=for apidoc sv_force_normal
4625
4626Undo various types of fakery on an SV: if the PV is a shared string, make
4627a private copy; if we're a ref, stop refing; if we're a glob, downgrade to
4628an xpvmg. See also C<sv_force_normal_flags>.
4629
4630=cut
4631*/
4632
840a7b70
IZ
4633void
4634Perl_sv_force_normal(pTHX_ register SV *sv)
4635{
4636 sv_force_normal_flags(sv, 0);
4637}
4638
954c1994
GS
4639/*
4640=for apidoc sv_chop
4641
1c846c1f 4642Efficient removal of characters from the beginning of the string buffer.
954c1994
GS
4643SvPOK(sv) must be true and the C<ptr> must be a pointer to somewhere inside
4644the string buffer. The C<ptr> becomes the first character of the adjusted
645c22ef 4645string. Uses the "OOK hack".
3f7c398e 4646Beware: after this function returns, C<ptr> and SvPVX_const(sv) may no longer
31869a79 4647refer to the same chunk of data.
954c1994
GS
4648
4649=cut
4650*/
4651
79072805 4652void
f54cb97a 4653Perl_sv_chop(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4654{
4655 register STRLEN delta;
a0d0e21e 4656 if (!ptr || !SvPOKp(sv))
79072805 4657 return;
3f7c398e 4658 delta = ptr - SvPVX_const(sv);
2213622d 4659 SV_CHECK_THINKFIRST(sv);
79072805
LW
4660 if (SvTYPE(sv) < SVt_PVIV)
4661 sv_upgrade(sv,SVt_PVIV);
4662
4663 if (!SvOOK(sv)) {
50483b2c 4664 if (!SvLEN(sv)) { /* make copy of shared string */
3f7c398e 4665 const char *pvx = SvPVX_const(sv);
a28509cc 4666 const STRLEN len = SvCUR(sv);
50483b2c 4667 SvGROW(sv, len + 1);
706aa1c9 4668 Move(pvx,SvPVX(sv),len,char);
50483b2c
JD
4669 *SvEND(sv) = '\0';
4670 }
45977657 4671 SvIV_set(sv, 0);
a4bfb290
AB
4672 /* Same SvOOK_on but SvOOK_on does a SvIOK_off
4673 and we do that anyway inside the SvNIOK_off
4674 */
7a5fa8a2 4675 SvFLAGS(sv) |= SVf_OOK;
79072805 4676 }
a4bfb290 4677 SvNIOK_off(sv);
b162af07
SP
4678 SvLEN_set(sv, SvLEN(sv) - delta);
4679 SvCUR_set(sv, SvCUR(sv) - delta);
f880fe2f 4680 SvPV_set(sv, SvPVX(sv) + delta);
45977657 4681 SvIV_set(sv, SvIVX(sv) + delta);
79072805
LW
4682}
4683
09540bc3
JH
4684/* sv_catpvn() is now a macro using Perl_sv_catpvn_flags();
4685 * this function provided for binary compatibility only
4686 */
4687
4688void
4689Perl_sv_catpvn(pTHX_ SV *dsv, const char* sstr, STRLEN slen)
4690{
4691 sv_catpvn_flags(dsv, sstr, slen, SV_GMAGIC);
4692}
4693
954c1994
GS
4694/*
4695=for apidoc sv_catpvn
4696
4697Concatenates the string onto the end of the string which is in the SV. The
1e54db1a
JH
4698C<len> indicates number of bytes to copy. If the SV has the UTF-8
4699status set, then the bytes appended should be valid UTF-8.
d5ce4a7c 4700Handles 'get' magic, but not 'set' magic. See C<sv_catpvn_mg>.
954c1994 4701
8d6d96c1
HS
4702=for apidoc sv_catpvn_flags
4703
4704Concatenates the string onto the end of the string which is in the SV. The
1e54db1a
JH
4705C<len> indicates number of bytes to copy. If the SV has the UTF-8
4706status set, then the bytes appended should be valid UTF-8.
8d6d96c1
HS
4707If C<flags> has C<SV_GMAGIC> bit set, will C<mg_get> on C<dsv> if
4708appropriate, else not. C<sv_catpvn> and C<sv_catpvn_nomg> are implemented
4709in terms of this function.
4710
4711=cut
4712*/
4713
4714void
4715Perl_sv_catpvn_flags(pTHX_ register SV *dsv, register const char *sstr, register STRLEN slen, I32 flags)
4716{
4717 STRLEN dlen;
f54cb97a 4718 const char *dstr = SvPV_force_flags(dsv, dlen, flags);
8d6d96c1 4719
8d6d96c1
HS
4720 SvGROW(dsv, dlen + slen + 1);
4721 if (sstr == dstr)
3f7c398e 4722 sstr = SvPVX_const(dsv);
8d6d96c1 4723 Move(sstr, SvPVX(dsv) + dlen, slen, char);
b162af07 4724 SvCUR_set(dsv, SvCUR(dsv) + slen);
8d6d96c1
HS
4725 *SvEND(dsv) = '\0';
4726 (void)SvPOK_only_UTF8(dsv); /* validate pointer */
4727 SvTAINT(dsv);
79072805
LW
4728}
4729
954c1994
GS
4730/*
4731=for apidoc sv_catpvn_mg
4732
4733Like C<sv_catpvn>, but also handles 'set' magic.
4734
4735=cut
4736*/
4737
79072805 4738void
864dbfa3 4739Perl_sv_catpvn_mg(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
ef50df4b
GS
4740{
4741 sv_catpvn(sv,ptr,len);
4742 SvSETMAGIC(sv);
4743}
4744
09540bc3
JH
4745/* sv_catsv() is now a macro using Perl_sv_catsv_flags();
4746 * this function provided for binary compatibility only
4747 */
4748
4749void
4750Perl_sv_catsv(pTHX_ SV *dstr, register SV *sstr)
4751{
4752 sv_catsv_flags(dstr, sstr, SV_GMAGIC);
4753}
4754
954c1994
GS
4755/*
4756=for apidoc sv_catsv
4757
13e8c8e3
JH
4758Concatenates the string from SV C<ssv> onto the end of the string in
4759SV C<dsv>. Modifies C<dsv> but not C<ssv>. Handles 'get' magic, but
4760not 'set' magic. See C<sv_catsv_mg>.
954c1994 4761
8d6d96c1
HS
4762=for apidoc sv_catsv_flags
4763
4764Concatenates the string from SV C<ssv> onto the end of the string in
4765SV C<dsv>. Modifies C<dsv> but not C<ssv>. If C<flags> has C<SV_GMAGIC>
4766bit set, will C<mg_get> on the SVs if appropriate, else not. C<sv_catsv>
4767and C<sv_catsv_nomg> are implemented in terms of this function.
4768
4769=cut */
4770
ef50df4b 4771void
8d6d96c1 4772Perl_sv_catsv_flags(pTHX_ SV *dsv, register SV *ssv, I32 flags)
79072805 4773{
4d84ee25 4774 const char *spv;
13e8c8e3 4775 STRLEN slen;
46199a12 4776 if (!ssv)
79072805 4777 return;
4d84ee25 4778 if ((spv = SvPV_const(ssv, slen))) {
4fd84b44
AD
4779 /* sutf8 and dutf8 were type bool, but under USE_ITHREADS,
4780 gcc version 2.95.2 20000220 (Debian GNU/Linux) for
8cf8f3d1
NIS
4781 Linux xxx 2.2.17 on sparc64 with gcc -O2, we erroneously
4782 get dutf8 = 0x20000000, (i.e. SVf_UTF8) even though
4fd84b44
AD
4783 dsv->sv_flags doesn't have that bit set.
4784 Andy Dougherty 12 Oct 2001
4785 */
b464bac0 4786 const I32 sutf8 = DO_UTF8(ssv);
4fd84b44 4787 I32 dutf8;
13e8c8e3 4788
8d6d96c1
HS
4789 if (SvGMAGICAL(dsv) && (flags & SV_GMAGIC))
4790 mg_get(dsv);
4791 dutf8 = DO_UTF8(dsv);
4792
4793 if (dutf8 != sutf8) {
13e8c8e3 4794 if (dutf8) {
46199a12 4795 /* Not modifying source SV, so taking a temporary copy. */
8d6d96c1 4796 SV* csv = sv_2mortal(newSVpvn(spv, slen));
13e8c8e3 4797
46199a12 4798 sv_utf8_upgrade(csv);
93524f2b 4799 spv = SvPV_const(csv, slen);
13e8c8e3 4800 }
8d6d96c1
HS
4801 else
4802 sv_utf8_upgrade_nomg(dsv);
e84ff256 4803 }
8d6d96c1 4804 sv_catpvn_nomg(dsv, spv, slen);
560a288e 4805 }
79072805
LW
4806}
4807
954c1994
GS
4808/*
4809=for apidoc sv_catsv_mg
4810
4811Like C<sv_catsv>, but also handles 'set' magic.
4812
4813=cut
4814*/
4815
79072805 4816void
46199a12 4817Perl_sv_catsv_mg(pTHX_ SV *dsv, register SV *ssv)
ef50df4b 4818{
46199a12
JH
4819 sv_catsv(dsv,ssv);
4820 SvSETMAGIC(dsv);
ef50df4b
GS
4821}
4822
954c1994
GS
4823/*
4824=for apidoc sv_catpv
4825
4826Concatenates the string onto the end of the string which is in the SV.
1e54db1a
JH
4827If the SV has the UTF-8 status set, then the bytes appended should be
4828valid UTF-8. Handles 'get' magic, but not 'set' magic. See C<sv_catpv_mg>.
954c1994 4829
d5ce4a7c 4830=cut */
954c1994 4831
ef50df4b 4832void
0c981600 4833Perl_sv_catpv(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4834{
4835 register STRLEN len;
463ee0b2 4836 STRLEN tlen;
748a9306 4837 char *junk;
79072805 4838
0c981600 4839 if (!ptr)
79072805 4840 return;
748a9306 4841 junk = SvPV_force(sv, tlen);
0c981600 4842 len = strlen(ptr);
463ee0b2 4843 SvGROW(sv, tlen + len + 1);
0c981600 4844 if (ptr == junk)
3f7c398e 4845 ptr = SvPVX_const(sv);
0c981600 4846 Move(ptr,SvPVX(sv)+tlen,len+1,char);
b162af07 4847 SvCUR_set(sv, SvCUR(sv) + len);
d41ff1b8 4848 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4849 SvTAINT(sv);
79072805
LW
4850}
4851
954c1994
GS
4852/*
4853=for apidoc sv_catpv_mg
4854
4855Like C<sv_catpv>, but also handles 'set' magic.
4856
4857=cut
4858*/
4859
ef50df4b 4860void
0c981600 4861Perl_sv_catpv_mg(pTHX_ register SV *sv, register const char *ptr)
ef50df4b 4862{
0c981600 4863 sv_catpv(sv,ptr);
ef50df4b
GS
4864 SvSETMAGIC(sv);
4865}
4866
645c22ef
DM
4867/*
4868=for apidoc newSV
4869
4870Create a new null SV, or if len > 0, create a new empty SVt_PV type SV
4871with an initial PV allocation of len+1. Normally accessed via the C<NEWSV>
4872macro.
4873
4874=cut
4875*/
4876
79072805 4877SV *
864dbfa3 4878Perl_newSV(pTHX_ STRLEN len)
79072805
LW
4879{
4880 register SV *sv;
1c846c1f 4881
4561caa4 4882 new_SV(sv);
79072805
LW
4883 if (len) {
4884 sv_upgrade(sv, SVt_PV);
4885 SvGROW(sv, len + 1);
4886 }
4887 return sv;
4888}
954c1994 4889/*
92110913 4890=for apidoc sv_magicext
954c1994 4891
68795e93 4892Adds magic to an SV, upgrading it if necessary. Applies the
2d8d5d5a 4893supplied vtable and returns a pointer to the magic added.
92110913 4894
2d8d5d5a
SH
4895Note that C<sv_magicext> will allow things that C<sv_magic> will not.
4896In particular, you can add magic to SvREADONLY SVs, and add more than
4897one instance of the same 'how'.
645c22ef 4898
2d8d5d5a
SH
4899If C<namlen> is greater than zero then a C<savepvn> I<copy> of C<name> is
4900stored, if C<namlen> is zero then C<name> is stored as-is and - as another
4901special case - if C<(name && namlen == HEf_SVKEY)> then C<name> is assumed
4902to contain an C<SV*> and is stored as-is with its REFCNT incremented.
92110913 4903
2d8d5d5a 4904(This is now used as a subroutine by C<sv_magic>.)
954c1994
GS
4905
4906=cut
4907*/
92110913 4908MAGIC *
e1ec3a88 4909Perl_sv_magicext(pTHX_ SV* sv, SV* obj, int how, const MGVTBL *vtable,
92110913 4910 const char* name, I32 namlen)
79072805
LW
4911{
4912 MAGIC* mg;
68795e93 4913
92110913 4914 if (SvTYPE(sv) < SVt_PVMG) {
862a34c6 4915 SvUPGRADE(sv, SVt_PVMG);
463ee0b2 4916 }
a02a5408 4917 Newxz(mg, 1, MAGIC);
79072805 4918 mg->mg_moremagic = SvMAGIC(sv);
b162af07 4919 SvMAGIC_set(sv, mg);
75f9d97a 4920
05f95b08
SB
4921 /* Sometimes a magic contains a reference loop, where the sv and
4922 object refer to each other. To prevent a reference loop that
4923 would prevent such objects being freed, we look for such loops
4924 and if we find one we avoid incrementing the object refcount.
87f0b213
JH
4925
4926 Note we cannot do this to avoid self-tie loops as intervening RV must
b5ccf5f2 4927 have its REFCNT incremented to keep it in existence.
87f0b213
JH
4928
4929 */
14befaf4
DM
4930 if (!obj || obj == sv ||
4931 how == PERL_MAGIC_arylen ||
4932 how == PERL_MAGIC_qr ||
8d2f4536 4933 how == PERL_MAGIC_symtab ||
75f9d97a
JH
4934 (SvTYPE(obj) == SVt_PVGV &&
4935 (GvSV(obj) == sv || GvHV(obj) == (HV*)sv || GvAV(obj) == (AV*)sv ||
4936 GvCV(obj) == (CV*)sv || GvIOp(obj) == (IO*)sv ||
2628be26 4937 GvFORM(obj) == (CV*)sv)))
75f9d97a 4938 {
8990e307 4939 mg->mg_obj = obj;
75f9d97a 4940 }
85e6fe83 4941 else {
8990e307 4942 mg->mg_obj = SvREFCNT_inc(obj);
85e6fe83
LW
4943 mg->mg_flags |= MGf_REFCOUNTED;
4944 }
b5ccf5f2
YST
4945
4946 /* Normal self-ties simply pass a null object, and instead of
4947 using mg_obj directly, use the SvTIED_obj macro to produce a
4948 new RV as needed. For glob "self-ties", we are tieing the PVIO
4949 with an RV obj pointing to the glob containing the PVIO. In
4950 this case, to avoid a reference loop, we need to weaken the
4951 reference.
4952 */
4953
4954 if (how == PERL_MAGIC_tiedscalar && SvTYPE(sv) == SVt_PVIO &&
4955 obj && SvROK(obj) && GvIO(SvRV(obj)) == (IO*)sv)
4956 {
4957 sv_rvweaken(obj);
4958 }
4959
79072805 4960 mg->mg_type = how;
565764a8 4961 mg->mg_len = namlen;
9cbac4c7 4962 if (name) {
92110913 4963 if (namlen > 0)
1edc1566 4964 mg->mg_ptr = savepvn(name, namlen);
c6ee37c5 4965 else if (namlen == HEf_SVKEY)
1edc1566 4966 mg->mg_ptr = (char*)SvREFCNT_inc((SV*)name);
68795e93 4967 else
92110913 4968 mg->mg_ptr = (char *) name;
9cbac4c7 4969 }
92110913 4970 mg->mg_virtual = vtable;
68795e93 4971
92110913
NIS
4972 mg_magical(sv);
4973 if (SvGMAGICAL(sv))
4974 SvFLAGS(sv) &= ~(SVf_IOK|SVf_NOK|SVf_POK);
4975 return mg;
4976}
4977
4978/*
4979=for apidoc sv_magic
1c846c1f 4980
92110913
NIS
4981Adds magic to an SV. First upgrades C<sv> to type C<SVt_PVMG> if necessary,
4982then adds a new magic item of type C<how> to the head of the magic list.
4983
2d8d5d5a
SH
4984See C<sv_magicext> (which C<sv_magic> now calls) for a description of the
4985handling of the C<name> and C<namlen> arguments.
4986
4509d3fb
SB
4987You need to use C<sv_magicext> to add magic to SvREADONLY SVs and also
4988to add more than one instance of the same 'how'.
4989
92110913
NIS
4990=cut
4991*/
4992
4993void
4994Perl_sv_magic(pTHX_ register SV *sv, SV *obj, int how, const char *name, I32 namlen)
68795e93 4995{
aec46f14 4996 const MGVTBL *vtable;
92110913 4997 MAGIC* mg;
92110913 4998
f8c7b90f 4999#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
5000 if (SvIsCOW(sv))
5001 sv_force_normal_flags(sv, 0);
5002#endif
92110913 5003 if (SvREADONLY(sv)) {
d8084ca5
DM
5004 if (
5005 /* its okay to attach magic to shared strings; the subsequent
5006 * upgrade to PVMG will unshare the string */
5007 !(SvFAKE(sv) && SvTYPE(sv) < SVt_PVMG)
5008
5009 && IN_PERL_RUNTIME
92110913
NIS
5010 && how != PERL_MAGIC_regex_global
5011 && how != PERL_MAGIC_bm
5012 && how != PERL_MAGIC_fm
5013 && how != PERL_MAGIC_sv
e6469971 5014 && how != PERL_MAGIC_backref
92110913
NIS
5015 )
5016 {
5017 Perl_croak(aTHX_ PL_no_modify);
5018 }
5019 }
5020 if (SvMAGICAL(sv) || (how == PERL_MAGIC_taint && SvTYPE(sv) >= SVt_PVMG)) {
5021 if (SvMAGIC(sv) && (mg = mg_find(sv, how))) {
68795e93
NIS
5022 /* sv_magic() refuses to add a magic of the same 'how' as an
5023 existing one
92110913
NIS
5024 */
5025 if (how == PERL_MAGIC_taint)
5026 mg->mg_len |= 1;
5027 return;
5028 }
5029 }
68795e93 5030
79072805 5031 switch (how) {
14befaf4 5032 case PERL_MAGIC_sv:
92110913 5033 vtable = &PL_vtbl_sv;
79072805 5034 break;
14befaf4 5035 case PERL_MAGIC_overload:
92110913 5036 vtable = &PL_vtbl_amagic;
a0d0e21e 5037 break;
14befaf4 5038 case PERL_MAGIC_overload_elem:
92110913 5039 vtable = &PL_vtbl_amagicelem;
a0d0e21e 5040 break;
14befaf4 5041 case PERL_MAGIC_overload_table:
92110913 5042 vtable = &PL_vtbl_ovrld;
a0d0e21e 5043 break;
14befaf4 5044 case PERL_MAGIC_bm:
92110913 5045 vtable = &PL_vtbl_bm;
79072805 5046 break;
14befaf4 5047 case PERL_MAGIC_regdata:
92110913 5048 vtable = &PL_vtbl_regdata;
6cef1e77 5049 break;
14befaf4 5050 case PERL_MAGIC_regdatum:
92110913 5051 vtable = &PL_vtbl_regdatum;
6cef1e77 5052 break;
14befaf4 5053 case PERL_MAGIC_env:
92110913 5054 vtable = &PL_vtbl_env;
79072805 5055 break;
14befaf4 5056 case PERL_MAGIC_fm:
92110913 5057 vtable = &PL_vtbl_fm;
55497cff 5058 break;
14befaf4 5059 case PERL_MAGIC_envelem:
92110913 5060 vtable = &PL_vtbl_envelem;
79072805 5061 break;
14befaf4 5062 case PERL_MAGIC_regex_global:
92110913 5063 vtable = &PL_vtbl_mglob;
93a17b20 5064 break;
14befaf4 5065 case PERL_MAGIC_isa:
92110913 5066 vtable = &PL_vtbl_isa;
463ee0b2 5067 break;
14befaf4 5068 case PERL_MAGIC_isaelem:
92110913 5069 vtable = &PL_vtbl_isaelem;
463ee0b2 5070 break;
14befaf4 5071 case PERL_MAGIC_nkeys:
92110913 5072 vtable = &PL_vtbl_nkeys;
16660edb 5073 break;
14befaf4 5074 case PERL_MAGIC_dbfile:
aec46f14 5075 vtable = NULL;
93a17b20 5076 break;
14befaf4 5077 case PERL_MAGIC_dbline:
92110913 5078 vtable = &PL_vtbl_dbline;
79072805 5079 break;
36477c24 5080#ifdef USE_LOCALE_COLLATE
14befaf4 5081 case PERL_MAGIC_collxfrm:
92110913 5082 vtable = &PL_vtbl_collxfrm;
bbce6d69 5083 break;
36477c24 5084#endif /* USE_LOCALE_COLLATE */
14befaf4 5085 case PERL_MAGIC_tied:
92110913 5086 vtable = &PL_vtbl_pack;
463ee0b2 5087 break;
14befaf4
DM
5088 case PERL_MAGIC_tiedelem:
5089 case PERL_MAGIC_tiedscalar:
92110913 5090 vtable = &PL_vtbl_packelem;
463ee0b2 5091 break;
14befaf4 5092 case PERL_MAGIC_qr:
92110913 5093 vtable = &PL_vtbl_regexp;
c277df42 5094 break;
14befaf4 5095 case PERL_MAGIC_sig:
92110913 5096 vtable = &PL_vtbl_sig;
79072805 5097 break;
14befaf4 5098 case PERL_MAGIC_sigelem:
92110913 5099 vtable = &PL_vtbl_sigelem;
79072805 5100 break;
14befaf4 5101 case PERL_MAGIC_taint:
92110913 5102 vtable = &PL_vtbl_taint;
463ee0b2 5103 break;
14befaf4 5104 case PERL_MAGIC_uvar:
92110913 5105 vtable = &PL_vtbl_uvar;
79072805 5106 break;
14befaf4 5107 case PERL_MAGIC_vec:
92110913 5108 vtable = &PL_vtbl_vec;
79072805 5109 break;
a3874608 5110 case PERL_MAGIC_arylen_p:
bfcb3514 5111 case PERL_MAGIC_rhash:
8d2f4536 5112 case PERL_MAGIC_symtab:
ece467f9 5113 case PERL_MAGIC_vstring:
aec46f14 5114 vtable = NULL;
ece467f9 5115 break;
7e8c5dac
HS
5116 case PERL_MAGIC_utf8:
5117 vtable = &PL_vtbl_utf8;
5118 break;
14befaf4 5119 case PERL_MAGIC_substr:
92110913 5120 vtable = &PL_vtbl_substr;
79072805 5121 break;
14befaf4 5122 case PERL_MAGIC_defelem:
92110913 5123 vtable = &PL_vtbl_defelem;
5f05dabc 5124 break;
14befaf4 5125 case PERL_MAGIC_glob:
92110913 5126 vtable = &PL_vtbl_glob;
79072805 5127 break;
14befaf4 5128 case PERL_MAGIC_arylen:
92110913 5129 vtable = &PL_vtbl_arylen;
79072805 5130 break;
14befaf4 5131 case PERL_MAGIC_pos:
92110913 5132 vtable = &PL_vtbl_pos;
a0d0e21e 5133 break;
14befaf4 5134 case PERL_MAGIC_backref:
92110913 5135 vtable = &PL_vtbl_backref;
810b8aa5 5136 break;
14befaf4
DM
5137 case PERL_MAGIC_ext:
5138 /* Reserved for use by extensions not perl internals. */
4633a7c4
LW
5139 /* Useful for attaching extension internal data to perl vars. */
5140 /* Note that multiple extensions may clash if magical scalars */
5141 /* etc holding private data from one are passed to another. */
aec46f14 5142 vtable = NULL;
a0d0e21e 5143 break;
79072805 5144 default:
14befaf4 5145 Perl_croak(aTHX_ "Don't know how to handle magic of type \\%o", how);
463ee0b2 5146 }
68795e93 5147
92110913 5148 /* Rest of work is done else where */
aec46f14 5149 mg = sv_magicext(sv,obj,how,vtable,name,namlen);
68795e93 5150
92110913
NIS
5151 switch (how) {
5152 case PERL_MAGIC_taint:
5153 mg->mg_len = 1;
5154 break;
5155 case PERL_MAGIC_ext:
5156 case PERL_MAGIC_dbfile:
5157 SvRMAGICAL_on(sv);
5158 break;
5159 }
463ee0b2
LW
5160}
5161
c461cf8f
JH
5162/*
5163=for apidoc sv_unmagic
5164
645c22ef 5165Removes all magic of type C<type> from an SV.
c461cf8f
JH
5166
5167=cut
5168*/
5169
463ee0b2 5170int
864dbfa3 5171Perl_sv_unmagic(pTHX_ SV *sv, int type)
463ee0b2
LW
5172{
5173 MAGIC* mg;
5174 MAGIC** mgp;
91bba347 5175 if (SvTYPE(sv) < SVt_PVMG || !SvMAGIC(sv))
463ee0b2
LW
5176 return 0;
5177 mgp = &SvMAGIC(sv);
5178 for (mg = *mgp; mg; mg = *mgp) {
5179 if (mg->mg_type == type) {
e1ec3a88 5180 const MGVTBL* const vtbl = mg->mg_virtual;
463ee0b2 5181 *mgp = mg->mg_moremagic;
1d7c1841 5182 if (vtbl && vtbl->svt_free)
fc0dc3b3 5183 CALL_FPTR(vtbl->svt_free)(aTHX_ sv, mg);
14befaf4 5184 if (mg->mg_ptr && mg->mg_type != PERL_MAGIC_regex_global) {
92110913 5185 if (mg->mg_len > 0)
1edc1566 5186 Safefree(mg->mg_ptr);
565764a8 5187 else if (mg->mg_len == HEf_SVKEY)
1edc1566 5188 SvREFCNT_dec((SV*)mg->mg_ptr);
7e8c5dac
HS
5189 else if (mg->mg_type == PERL_MAGIC_utf8 && mg->mg_ptr)
5190 Safefree(mg->mg_ptr);
9cbac4c7 5191 }
a0d0e21e
LW
5192 if (mg->mg_flags & MGf_REFCOUNTED)
5193 SvREFCNT_dec(mg->mg_obj);
463ee0b2
LW
5194 Safefree(mg);
5195 }
5196 else
5197 mgp = &mg->mg_moremagic;
79072805 5198 }
91bba347 5199 if (!SvMAGIC(sv)) {
463ee0b2 5200 SvMAGICAL_off(sv);
06759ea0 5201 SvFLAGS(sv) |= (SvFLAGS(sv) & (SVp_NOK|SVp_POK)) >> PRIVSHIFT;
463ee0b2
LW
5202 }
5203
5204 return 0;
79072805
LW
5205}
5206
c461cf8f
JH
5207/*
5208=for apidoc sv_rvweaken
5209
645c22ef
DM
5210Weaken a reference: set the C<SvWEAKREF> flag on this RV; give the
5211referred-to SV C<PERL_MAGIC_backref> magic if it hasn't already; and
5212push a back-reference to this RV onto the array of backreferences
5213associated with that magic.
c461cf8f
JH
5214
5215=cut
5216*/
5217
810b8aa5 5218SV *
864dbfa3 5219Perl_sv_rvweaken(pTHX_ SV *sv)
810b8aa5
GS
5220{
5221 SV *tsv;
5222 if (!SvOK(sv)) /* let undefs pass */
5223 return sv;
5224 if (!SvROK(sv))
cea2e8a9 5225 Perl_croak(aTHX_ "Can't weaken a nonreference");
810b8aa5 5226 else if (SvWEAKREF(sv)) {
810b8aa5 5227 if (ckWARN(WARN_MISC))
9014280d 5228 Perl_warner(aTHX_ packWARN(WARN_MISC), "Reference is already weak");
810b8aa5
GS
5229 return sv;
5230 }
5231 tsv = SvRV(sv);
e15faf7d 5232 Perl_sv_add_backref(aTHX_ tsv, sv);
810b8aa5 5233 SvWEAKREF_on(sv);
1c846c1f 5234 SvREFCNT_dec(tsv);
810b8aa5
GS
5235 return sv;
5236}
5237
645c22ef
DM
5238/* Give tsv backref magic if it hasn't already got it, then push a
5239 * back-reference to sv onto the array associated with the backref magic.
5240 */
5241
e15faf7d
NC
5242void
5243Perl_sv_add_backref(pTHX_ SV *tsv, SV *sv)
810b8aa5
GS
5244{
5245 AV *av;
5246 MAGIC *mg;
14befaf4 5247 if (SvMAGICAL(tsv) && (mg = mg_find(tsv, PERL_MAGIC_backref)))
810b8aa5
GS
5248 av = (AV*)mg->mg_obj;
5249 else {
5250 av = newAV();
14befaf4 5251 sv_magic(tsv, (SV*)av, PERL_MAGIC_backref, NULL, 0);
d99b02a1
DM
5252 /* av now has a refcnt of 2, which avoids it getting freed
5253 * before us during global cleanup. The extra ref is removed
5254 * by magic_killbackrefs() when tsv is being freed */
810b8aa5 5255 }
d91d49e8 5256 if (AvFILLp(av) >= AvMAX(av)) {
d91d49e8
MM
5257 av_extend(av, AvFILLp(av)+1);
5258 }
5259 AvARRAY(av)[++AvFILLp(av)] = sv; /* av_push() */
810b8aa5
GS
5260}
5261
645c22ef
DM
5262/* delete a back-reference to ourselves from the backref magic associated
5263 * with the SV we point to.
5264 */
5265
1c846c1f 5266STATIC void
e15faf7d 5267S_sv_del_backref(pTHX_ SV *tsv, SV *sv)
810b8aa5
GS
5268{
5269 AV *av;
5270 SV **svp;
5271 I32 i;
c04a4dfe 5272 MAGIC *mg = NULL;
e15faf7d
NC
5273 if (!SvMAGICAL(tsv) || !(mg = mg_find(tsv, PERL_MAGIC_backref))) {
5274 if (PL_in_clean_all)
5275 return;
5276 }
14befaf4 5277 if (!SvMAGICAL(tsv) || !(mg = mg_find(tsv, PERL_MAGIC_backref)))
cea2e8a9 5278 Perl_croak(aTHX_ "panic: del_backref");
810b8aa5
GS
5279 av = (AV *)mg->mg_obj;
5280 svp = AvARRAY(av);
6a76db8b
NC
5281 /* We shouldn't be in here more than once, but for paranoia reasons lets
5282 not assume this. */
5283 for (i = AvFILLp(av); i >= 0; i--) {
5284 if (svp[i] == sv) {
5285 const SSize_t fill = AvFILLp(av);
5286 if (i != fill) {
5287 /* We weren't the last entry.
5288 An unordered list has this property that you can take the
5289 last element off the end to fill the hole, and it's still
5290 an unordered list :-)
5291 */
5292 svp[i] = svp[fill];
5293 }
5294 svp[fill] = Nullsv;
5295 AvFILLp(av) = fill - 1;
5296 }
5297 }
810b8aa5
GS
5298}
5299
954c1994
GS
5300/*
5301=for apidoc sv_insert
5302
5303Inserts a string at the specified offset/length within the SV. Similar to
5304the Perl substr() function.
5305
5306=cut
5307*/
5308
79072805 5309void
e1ec3a88 5310Perl_sv_insert(pTHX_ SV *bigstr, STRLEN offset, STRLEN len, const char *little, STRLEN littlelen)
79072805
LW
5311{
5312 register char *big;
5313 register char *mid;
5314 register char *midend;
5315 register char *bigend;
5316 register I32 i;
6ff81951 5317 STRLEN curlen;
1c846c1f 5318
79072805 5319
8990e307 5320 if (!bigstr)
cea2e8a9 5321 Perl_croak(aTHX_ "Can't modify non-existent substring");
6ff81951 5322 SvPV_force(bigstr, curlen);
60fa28ff 5323 (void)SvPOK_only_UTF8(bigstr);
6ff81951
GS
5324 if (offset + len > curlen) {
5325 SvGROW(bigstr, offset+len+1);
93524f2b 5326 Zero(SvPVX(bigstr)+curlen, offset+len-curlen, char);
6ff81951
GS
5327 SvCUR_set(bigstr, offset+len);
5328 }
79072805 5329
69b47968 5330 SvTAINT(bigstr);
79072805
LW
5331 i = littlelen - len;
5332 if (i > 0) { /* string might grow */
a0d0e21e 5333 big = SvGROW(bigstr, SvCUR(bigstr) + i + 1);
79072805
LW
5334 mid = big + offset + len;
5335 midend = bigend = big + SvCUR(bigstr);
5336 bigend += i;
5337 *bigend = '\0';
5338 while (midend > mid) /* shove everything down */
5339 *--bigend = *--midend;
5340 Move(little,big+offset,littlelen,char);
b162af07 5341 SvCUR_set(bigstr, SvCUR(bigstr) + i);
79072805
LW
5342 SvSETMAGIC(bigstr);
5343 return;
5344 }
5345 else if (i == 0) {
463ee0b2 5346 Move(little,SvPVX(bigstr)+offset,len,char);
79072805
LW
5347 SvSETMAGIC(bigstr);
5348 return;
5349 }
5350
463ee0b2 5351 big = SvPVX(bigstr);
79072805
LW
5352 mid = big + offset;
5353 midend = mid + len;
5354 bigend = big + SvCUR(bigstr);
5355
5356 if (midend > bigend)
cea2e8a9 5357 Perl_croak(aTHX_ "panic: sv_insert");
79072805
LW
5358
5359 if (mid - big > bigend - midend) { /* faster to shorten from end */
5360 if (littlelen) {
5361 Move(little, mid, littlelen,char);
5362 mid += littlelen;
5363 }
5364 i = bigend - midend;
5365 if (i > 0) {
5366 Move(midend, mid, i,char);
5367 mid += i;
5368 }
5369 *mid = '\0';
5370 SvCUR_set(bigstr, mid - big);
5371 }
155aba94 5372 else if ((i = mid - big)) { /* faster from front */
79072805
LW
5373 midend -= littlelen;
5374 mid = midend;
5375 sv_chop(bigstr,midend-i);
5376 big += i;
5377 while (i--)
5378 *--midend = *--big;
5379 if (littlelen)
5380 Move(little, mid, littlelen,char);
5381 }
5382 else if (littlelen) {
5383 midend -= littlelen;
5384 sv_chop(bigstr,midend);
5385 Move(little,midend,littlelen,char);
5386 }
5387 else {
5388 sv_chop(bigstr,midend);
5389 }
5390 SvSETMAGIC(bigstr);
5391}
5392
c461cf8f
JH
5393/*
5394=for apidoc sv_replace
5395
5396Make the first argument a copy of the second, then delete the original.
645c22ef
DM
5397The target SV physically takes over ownership of the body of the source SV
5398and inherits its flags; however, the target keeps any magic it owns,
5399and any magic in the source is discarded.
ff276b08 5400Note that this is a rather specialist SV copying operation; most of the
645c22ef 5401time you'll want to use C<sv_setsv> or one of its many macro front-ends.
c461cf8f
JH
5402
5403=cut
5404*/
79072805
LW
5405
5406void
864dbfa3 5407Perl_sv_replace(pTHX_ register SV *sv, register SV *nsv)
79072805 5408{
a3b680e6 5409 const U32 refcnt = SvREFCNT(sv);
765f542d 5410 SV_CHECK_THINKFIRST_COW_DROP(sv);
30e5c352 5411 if (SvREFCNT(nsv) != 1) {
7437becc 5412 Perl_croak(aTHX_ "panic: reference miscount on nsv in sv_replace() (%"
30e5c352
NC
5413 UVuf " != 1)", (UV) SvREFCNT(nsv));
5414 }
93a17b20 5415 if (SvMAGICAL(sv)) {
a0d0e21e
LW
5416 if (SvMAGICAL(nsv))
5417 mg_free(nsv);
5418 else
5419 sv_upgrade(nsv, SVt_PVMG);
b162af07 5420 SvMAGIC_set(nsv, SvMAGIC(sv));
a0d0e21e 5421 SvFLAGS(nsv) |= SvMAGICAL(sv);
93a17b20 5422 SvMAGICAL_off(sv);
b162af07 5423 SvMAGIC_set(sv, NULL);
93a17b20 5424 }
79072805
LW
5425 SvREFCNT(sv) = 0;
5426 sv_clear(sv);
477f5d66 5427 assert(!SvREFCNT(sv));
fd0854ff
DM
5428#ifdef DEBUG_LEAKING_SCALARS
5429 sv->sv_flags = nsv->sv_flags;
5430 sv->sv_any = nsv->sv_any;
5431 sv->sv_refcnt = nsv->sv_refcnt;
f34d0642 5432 sv->sv_u = nsv->sv_u;
fd0854ff 5433#else
79072805 5434 StructCopy(nsv,sv,SV);
fd0854ff 5435#endif
7b2c381c
NC
5436 /* Currently could join these into one piece of pointer arithmetic, but
5437 it would be unclear. */
5438 if(SvTYPE(sv) == SVt_IV)
5439 SvANY(sv)
339049b0 5440 = (XPVIV*)((char*)&(sv->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
7b2c381c 5441 else if (SvTYPE(sv) == SVt_RV) {
339049b0 5442 SvANY(sv) = &sv->sv_u.svu_rv;
7b2c381c
NC
5443 }
5444
fd0854ff 5445
f8c7b90f 5446#ifdef PERL_OLD_COPY_ON_WRITE
d3d0e6f1
NC
5447 if (SvIsCOW_normal(nsv)) {
5448 /* We need to follow the pointers around the loop to make the
5449 previous SV point to sv, rather than nsv. */
5450 SV *next;
5451 SV *current = nsv;
5452 while ((next = SV_COW_NEXT_SV(current)) != nsv) {
5453 assert(next);
5454 current = next;
3f7c398e 5455 assert(SvPVX_const(current) == SvPVX_const(nsv));
d3d0e6f1
NC
5456 }
5457 /* Make the SV before us point to the SV after us. */
5458 if (DEBUG_C_TEST) {
5459 PerlIO_printf(Perl_debug_log, "previous is\n");
5460 sv_dump(current);
a29f6d03
NC
5461 PerlIO_printf(Perl_debug_log,
5462 "move it from 0x%"UVxf" to 0x%"UVxf"\n",
d3d0e6f1
NC
5463 (UV) SV_COW_NEXT_SV(current), (UV) sv);
5464 }
a29f6d03 5465 SV_COW_NEXT_SV_SET(current, sv);
d3d0e6f1
NC
5466 }
5467#endif
79072805 5468 SvREFCNT(sv) = refcnt;
1edc1566 5469 SvFLAGS(nsv) |= SVTYPEMASK; /* Mark as freed */
39cf41c2 5470 SvREFCNT(nsv) = 0;
463ee0b2 5471 del_SV(nsv);
79072805
LW
5472}
5473
c461cf8f
JH
5474/*
5475=for apidoc sv_clear
5476
645c22ef
DM
5477Clear an SV: call any destructors, free up any memory used by the body,
5478and free the body itself. The SV's head is I<not> freed, although
5479its type is set to all 1's so that it won't inadvertently be assumed
5480to be live during global destruction etc.
5481This function should only be called when REFCNT is zero. Most of the time
5482you'll want to call C<sv_free()> (or its macro wrapper C<SvREFCNT_dec>)
5483instead.
c461cf8f
JH
5484
5485=cut
5486*/
5487
79072805 5488void
864dbfa3 5489Perl_sv_clear(pTHX_ register SV *sv)
79072805 5490{
27da23d5 5491 dVAR;
82bb6deb
NC
5492 void** old_body_arena;
5493 size_t old_body_offset;
5494 const U32 type = SvTYPE(sv);
5495
79072805
LW
5496 assert(sv);
5497 assert(SvREFCNT(sv) == 0);
5498
82bb6deb
NC
5499 if (type <= SVt_IV)
5500 return;
5501
5502 old_body_arena = 0;
5503 old_body_offset = 0;
5504
ed6116ce 5505 if (SvOBJECT(sv)) {
3280af22 5506 if (PL_defstash) { /* Still have a symbol table? */
39644a26 5507 dSP;
893645bd 5508 HV* stash;
d460ef45 5509 do {
b464bac0 5510 CV* destructor;
4e8e7886 5511 stash = SvSTASH(sv);
32251b26 5512 destructor = StashHANDLER(stash,DESTROY);
4e8e7886 5513 if (destructor) {
1b6737cc 5514 SV* const tmpref = newRV(sv);
5cc433a6 5515 SvREADONLY_on(tmpref); /* DESTROY() could be naughty */
4e8e7886 5516 ENTER;
e788e7d3 5517 PUSHSTACKi(PERLSI_DESTROY);
4e8e7886
GS
5518 EXTEND(SP, 2);
5519 PUSHMARK(SP);
5cc433a6 5520 PUSHs(tmpref);
4e8e7886 5521 PUTBACK;
44389ee9 5522 call_sv((SV*)destructor, G_DISCARD|G_EVAL|G_KEEPERR|G_VOID);
7a5fa8a2
NIS
5523
5524
d3acc0f7 5525 POPSTACK;
3095d977 5526 SPAGAIN;
4e8e7886 5527 LEAVE;
5cc433a6
AB
5528 if(SvREFCNT(tmpref) < 2) {
5529 /* tmpref is not kept alive! */
5530 SvREFCNT(sv)--;
b162af07 5531 SvRV_set(tmpref, NULL);
5cc433a6
AB
5532 SvROK_off(tmpref);
5533 }
5534 SvREFCNT_dec(tmpref);
4e8e7886
GS
5535 }
5536 } while (SvOBJECT(sv) && SvSTASH(sv) != stash);
8ebc5c01 5537
6f44e0a4
JP
5538
5539 if (SvREFCNT(sv)) {
5540 if (PL_in_clean_objs)
cea2e8a9 5541 Perl_croak(aTHX_ "DESTROY created new reference to dead object '%s'",
bfcb3514 5542 HvNAME_get(stash));
6f44e0a4
JP
5543 /* DESTROY gave object new lease on life */
5544 return;
5545 }
a0d0e21e 5546 }
4e8e7886 5547
a0d0e21e 5548 if (SvOBJECT(sv)) {
4e8e7886 5549 SvREFCNT_dec(SvSTASH(sv)); /* possibly of changed persuasion */
a0d0e21e 5550 SvOBJECT_off(sv); /* Curse the object. */
82bb6deb 5551 if (type != SVt_PVIO)
3280af22 5552 --PL_sv_objcount; /* XXX Might want something more general */
a0d0e21e 5553 }
463ee0b2 5554 }
82bb6deb 5555 if (type >= SVt_PVMG) {
524189f1
JH
5556 if (SvMAGIC(sv))
5557 mg_free(sv);
82bb6deb 5558 if (type == SVt_PVMG && SvFLAGS(sv) & SVpad_TYPED)
524189f1
JH
5559 SvREFCNT_dec(SvSTASH(sv));
5560 }
82bb6deb 5561 switch (type) {
8990e307 5562 case SVt_PVIO:
df0bd2f4
GS
5563 if (IoIFP(sv) &&
5564 IoIFP(sv) != PerlIO_stdin() &&
5f05dabc 5565 IoIFP(sv) != PerlIO_stdout() &&
5566 IoIFP(sv) != PerlIO_stderr())
93578b34 5567 {
f2b5be74 5568 io_close((IO*)sv, FALSE);
93578b34 5569 }
1d7c1841 5570 if (IoDIRP(sv) && !(IoFLAGS(sv) & IOf_FAKE_DIRP))
1236053a 5571 PerlDir_close(IoDIRP(sv));
1d7c1841 5572 IoDIRP(sv) = (DIR*)NULL;
8990e307
LW
5573 Safefree(IoTOP_NAME(sv));
5574 Safefree(IoFMT_NAME(sv));
5575 Safefree(IoBOTTOM_NAME(sv));
82bb6deb
NC
5576 /* PVIOs aren't from arenas */
5577 goto freescalar;
79072805 5578 case SVt_PVBM:
82bb6deb 5579 old_body_arena = (void **) &PL_xpvbm_root;
a0d0e21e 5580 goto freescalar;
79072805 5581 case SVt_PVCV:
82bb6deb 5582 old_body_arena = (void **) &PL_xpvcv_root;
748a9306 5583 case SVt_PVFM:
82bb6deb 5584 /* PVFMs aren't from arenas */
85e6fe83 5585 cv_undef((CV*)sv);
a0d0e21e 5586 goto freescalar;
79072805 5587 case SVt_PVHV:
85e6fe83 5588 hv_undef((HV*)sv);
82bb6deb
NC
5589 old_body_arena = (void **) &PL_xpvhv_root;
5590 old_body_offset = STRUCT_OFFSET(XPVHV, xhv_fill);
a0d0e21e 5591 break;
79072805 5592 case SVt_PVAV:
85e6fe83 5593 av_undef((AV*)sv);
82bb6deb
NC
5594 old_body_arena = (void **) &PL_xpvav_root;
5595 old_body_offset = STRUCT_OFFSET(XPVAV, xav_fill);
a0d0e21e 5596 break;
02270b4e 5597 case SVt_PVLV:
dd28f7bb
DM
5598 if (LvTYPE(sv) == 'T') { /* for tie: return HE to pool */
5599 SvREFCNT_dec(HeKEY_sv((HE*)LvTARG(sv)));
5600 HeNEXT((HE*)LvTARG(sv)) = PL_hv_fetch_ent_mh;
5601 PL_hv_fetch_ent_mh = (HE*)LvTARG(sv);
5602 }
5603 else if (LvTYPE(sv) != 't') /* unless tie: unrefcnted fake SV** */
5604 SvREFCNT_dec(LvTARG(sv));
82bb6deb 5605 old_body_arena = (void **) &PL_xpvlv_root;
02270b4e 5606 goto freescalar;
a0d0e21e 5607 case SVt_PVGV:
1edc1566 5608 gp_free((GV*)sv);
a0d0e21e 5609 Safefree(GvNAME(sv));
893645bd
NC
5610 /* If we're in a stash, we don't own a reference to it. However it does
5611 have a back reference to us, which needs to be cleared. */
5612 if (GvSTASH(sv))
5613 sv_del_backref((SV*)GvSTASH(sv), sv);
82bb6deb
NC
5614 old_body_arena = (void **) &PL_xpvgv_root;
5615 goto freescalar;
79072805 5616 case SVt_PVMG:
82bb6deb
NC
5617 old_body_arena = (void **) &PL_xpvmg_root;
5618 goto freescalar;
79072805 5619 case SVt_PVNV:
82bb6deb
NC
5620 old_body_arena = (void **) &PL_xpvnv_root;
5621 goto freescalar;
79072805 5622 case SVt_PVIV:
82bb6deb
NC
5623 old_body_arena = (void **) &PL_xpviv_root;
5624 old_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur);
a0d0e21e 5625 freescalar:
5228ca4e
NC
5626 /* Don't bother with SvOOK_off(sv); as we're only going to free it. */
5627 if (SvOOK(sv)) {
93524f2b 5628 SvPV_set(sv, SvPVX_mutable(sv) - SvIVX(sv));
5228ca4e
NC
5629 /* Don't even bother with turning off the OOK flag. */
5630 }
82bb6deb 5631 goto pvrv_common;
79072805 5632 case SVt_PV:
82bb6deb
NC
5633 old_body_arena = (void **) &PL_xpv_root;
5634 old_body_offset = STRUCT_OFFSET(XPV, xpv_cur);
a0d0e21e 5635 case SVt_RV:
82bb6deb 5636 pvrv_common:
810b8aa5 5637 if (SvROK(sv)) {
e15faf7d 5638 SV *target = SvRV(sv);
810b8aa5 5639 if (SvWEAKREF(sv))
e15faf7d 5640 sv_del_backref(target, sv);
810b8aa5 5641 else
e15faf7d 5642 SvREFCNT_dec(target);
810b8aa5 5643 }
f8c7b90f 5644#ifdef PERL_OLD_COPY_ON_WRITE
3f7c398e 5645 else if (SvPVX_const(sv)) {
765f542d
NC
5646 if (SvIsCOW(sv)) {
5647 /* I believe I need to grab the global SV mutex here and
5648 then recheck the COW status. */
46187eeb
NC
5649 if (DEBUG_C_TEST) {
5650 PerlIO_printf(Perl_debug_log, "Copy on write: clear\n");
e419cbc5 5651 sv_dump(sv);
46187eeb 5652 }
bdd68bc3
NC
5653 sv_release_COW(sv, SvPVX_const(sv), SvLEN(sv),
5654 SV_COW_NEXT_SV(sv));
765f542d
NC
5655 /* And drop it here. */
5656 SvFAKE_off(sv);
5657 } else if (SvLEN(sv)) {
3f7c398e 5658 Safefree(SvPVX_const(sv));
765f542d
NC
5659 }
5660 }
5661#else
3f7c398e 5662 else if (SvPVX_const(sv) && SvLEN(sv))
94010e71 5663 Safefree(SvPVX_mutable(sv));
3f7c398e 5664 else if (SvPVX_const(sv) && SvREADONLY(sv) && SvFAKE(sv)) {
bdd68bc3 5665 unshare_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sv)));
1c846c1f
NIS
5666 SvFAKE_off(sv);
5667 }
765f542d 5668#endif
79072805
LW
5669 break;
5670 case SVt_NV:
82bb6deb 5671 old_body_arena = (void **) &PL_xnv_root;
79072805
LW
5672 break;
5673 }
5674
893645bd
NC
5675 SvFLAGS(sv) &= SVf_BREAK;
5676 SvFLAGS(sv) |= SVTYPEMASK;
5677
82bb6deb
NC
5678#ifndef PURIFY
5679 if (old_body_arena) {
5680 del_body(((char *)SvANY(sv) + old_body_offset), old_body_arena);
79072805 5681 }
82bb6deb
NC
5682 else
5683#endif
5684 if (type > SVt_RV) {
5685 my_safefree(SvANY(sv));
5686 }
79072805
LW
5687}
5688
645c22ef
DM
5689/*
5690=for apidoc sv_newref
5691
5692Increment an SV's reference count. Use the C<SvREFCNT_inc()> wrapper
5693instead.
5694
5695=cut
5696*/
5697
79072805 5698SV *
864dbfa3 5699Perl_sv_newref(pTHX_ SV *sv)
79072805 5700{
463ee0b2 5701 if (sv)
4db098f4 5702 (SvREFCNT(sv))++;
79072805
LW
5703 return sv;
5704}
5705
c461cf8f
JH
5706/*
5707=for apidoc sv_free
5708
645c22ef
DM
5709Decrement an SV's reference count, and if it drops to zero, call
5710C<sv_clear> to invoke destructors and free up any memory used by
5711the body; finally, deallocate the SV's head itself.
5712Normally called via a wrapper macro C<SvREFCNT_dec>.
c461cf8f
JH
5713
5714=cut
5715*/
5716
79072805 5717void
864dbfa3 5718Perl_sv_free(pTHX_ SV *sv)
79072805 5719{
27da23d5 5720 dVAR;
79072805
LW
5721 if (!sv)
5722 return;
a0d0e21e
LW
5723 if (SvREFCNT(sv) == 0) {
5724 if (SvFLAGS(sv) & SVf_BREAK)
645c22ef
DM
5725 /* this SV's refcnt has been artificially decremented to
5726 * trigger cleanup */
a0d0e21e 5727 return;
3280af22 5728 if (PL_in_clean_all) /* All is fair */
1edc1566 5729 return;
d689ffdd
JP
5730 if (SvREADONLY(sv) && SvIMMORTAL(sv)) {
5731 /* make sure SvREFCNT(sv)==0 happens very seldom */
5732 SvREFCNT(sv) = (~(U32)0)/2;
5733 return;
5734 }
41e4abd8 5735 if (ckWARN_d(WARN_INTERNAL)) {
d5dede04 5736 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
472d47bc
SB
5737 "Attempt to free unreferenced scalar: SV 0x%"UVxf
5738 pTHX__FORMAT, PTR2UV(sv) pTHX__VALUE);
41e4abd8
NC
5739#ifdef DEBUG_LEAKING_SCALARS_FORK_DUMP
5740 Perl_dump_sv_child(aTHX_ sv);
5741#endif
5742 }
79072805
LW
5743 return;
5744 }
4db098f4 5745 if (--(SvREFCNT(sv)) > 0)
8990e307 5746 return;
8c4d3c90
NC
5747 Perl_sv_free2(aTHX_ sv);
5748}
5749
5750void
5751Perl_sv_free2(pTHX_ SV *sv)
5752{
27da23d5 5753 dVAR;
463ee0b2
LW
5754#ifdef DEBUGGING
5755 if (SvTEMP(sv)) {
0453d815 5756 if (ckWARN_d(WARN_DEBUGGING))
9014280d 5757 Perl_warner(aTHX_ packWARN(WARN_DEBUGGING),
472d47bc
SB
5758 "Attempt to free temp prematurely: SV 0x%"UVxf
5759 pTHX__FORMAT, PTR2UV(sv) pTHX__VALUE);
79072805 5760 return;
79072805 5761 }
463ee0b2 5762#endif
d689ffdd
JP
5763 if (SvREADONLY(sv) && SvIMMORTAL(sv)) {
5764 /* make sure SvREFCNT(sv)==0 happens very seldom */
5765 SvREFCNT(sv) = (~(U32)0)/2;
5766 return;
5767 }
79072805 5768 sv_clear(sv);
477f5d66
CS
5769 if (! SvREFCNT(sv))
5770 del_SV(sv);
79072805
LW
5771}
5772
954c1994
GS
5773/*
5774=for apidoc sv_len
5775
645c22ef
DM
5776Returns the length of the string in the SV. Handles magic and type
5777coercion. See also C<SvCUR>, which gives raw access to the xpv_cur slot.
954c1994
GS
5778
5779=cut
5780*/
5781
79072805 5782STRLEN
864dbfa3 5783Perl_sv_len(pTHX_ register SV *sv)
79072805 5784{
463ee0b2 5785 STRLEN len;
79072805
LW
5786
5787 if (!sv)
5788 return 0;
5789
8990e307 5790 if (SvGMAGICAL(sv))
565764a8 5791 len = mg_length(sv);
8990e307 5792 else
4d84ee25 5793 (void)SvPV_const(sv, len);
463ee0b2 5794 return len;
79072805
LW
5795}
5796
c461cf8f
JH
5797/*
5798=for apidoc sv_len_utf8
5799
5800Returns the number of characters in the string in an SV, counting wide
1e54db1a 5801UTF-8 bytes as a single character. Handles magic and type coercion.
c461cf8f
JH
5802
5803=cut
5804*/
5805
7e8c5dac
HS
5806/*
5807 * The length is cached in PERL_UTF8_magic, in the mg_len field. Also the
5808 * mg_ptr is used, by sv_pos_u2b(), see the comments of S_utf8_mg_pos_init().
5809 * (Note that the mg_len is not the length of the mg_ptr field.)
7a5fa8a2 5810 *
7e8c5dac
HS
5811 */
5812
a0ed51b3 5813STRLEN
864dbfa3 5814Perl_sv_len_utf8(pTHX_ register SV *sv)
a0ed51b3 5815{
a0ed51b3
LW
5816 if (!sv)
5817 return 0;
5818
a0ed51b3 5819 if (SvGMAGICAL(sv))
b76347f2 5820 return mg_length(sv);
a0ed51b3 5821 else
b76347f2 5822 {
7e8c5dac 5823 STRLEN len, ulen;
e62f0680 5824 const U8 *s = (U8*)SvPV_const(sv, len);
7e8c5dac
HS
5825 MAGIC *mg = SvMAGICAL(sv) ? mg_find(sv, PERL_MAGIC_utf8) : 0;
5826
e23c8137 5827 if (mg && mg->mg_len != -1 && (mg->mg_len > 0 || len == 0)) {
7e8c5dac 5828 ulen = mg->mg_len;
e23c8137
JH
5829#ifdef PERL_UTF8_CACHE_ASSERT
5830 assert(ulen == Perl_utf8_length(aTHX_ s, s + len));
5831#endif
5832 }
7e8c5dac
HS
5833 else {
5834 ulen = Perl_utf8_length(aTHX_ s, s + len);
5835 if (!mg && !SvREADONLY(sv)) {
5836 sv_magic(sv, 0, PERL_MAGIC_utf8, 0, 0);
5837 mg = mg_find(sv, PERL_MAGIC_utf8);
5838 assert(mg);
5839 }
5840 if (mg)
5841 mg->mg_len = ulen;
5842 }
5843 return ulen;
5844 }
5845}
5846
5847/* S_utf8_mg_pos_init() is used to initialize the mg_ptr field of
5848 * a PERL_UTF8_magic. The mg_ptr is used to store the mapping
5849 * between UTF-8 and byte offsets. There are two (substr offset and substr
5850 * length, the i offset, PERL_MAGIC_UTF8_CACHESIZE) times two (UTF-8 offset
5851 * and byte offset) cache positions.
5852 *
5853 * The mg_len field is used by sv_len_utf8(), see its comments.
5854 * Note that the mg_len is not the length of the mg_ptr field.
5855 *
5856 */
5857STATIC bool
245d4a47
NC
5858S_utf8_mg_pos_init(pTHX_ SV *sv, MAGIC **mgp, STRLEN **cachep, I32 i,
5859 I32 offsetp, const U8 *s, const U8 *start)
7e8c5dac 5860{
7a5fa8a2 5861 bool found = FALSE;
7e8c5dac
HS
5862
5863 if (SvMAGICAL(sv) && !SvREADONLY(sv)) {
8f78557a 5864 if (!*mgp)
27da23d5 5865 *mgp = sv_magicext(sv, 0, PERL_MAGIC_utf8, (MGVTBL*)&PL_vtbl_utf8, 0, 0);
7e8c5dac 5866 assert(*mgp);
b76347f2 5867
7e8c5dac
HS
5868 if ((*mgp)->mg_ptr)
5869 *cachep = (STRLEN *) (*mgp)->mg_ptr;
5870 else {
a02a5408 5871 Newxz(*cachep, PERL_MAGIC_UTF8_CACHESIZE * 2, STRLEN);
7e8c5dac
HS
5872 (*mgp)->mg_ptr = (char *) *cachep;
5873 }
5874 assert(*cachep);
5875
a3b680e6 5876 (*cachep)[i] = offsetp;
7e8c5dac
HS
5877 (*cachep)[i+1] = s - start;
5878 found = TRUE;
a0ed51b3 5879 }
7e8c5dac
HS
5880
5881 return found;
a0ed51b3
LW
5882}
5883
645c22ef 5884/*
7e8c5dac
HS
5885 * S_utf8_mg_pos() is used to query and update mg_ptr field of
5886 * a PERL_UTF8_magic. The mg_ptr is used to store the mapping
5887 * between UTF-8 and byte offsets. See also the comments of
5888 * S_utf8_mg_pos_init().
5889 *
5890 */
5891STATIC bool
245d4a47 5892S_utf8_mg_pos(pTHX_ SV *sv, MAGIC **mgp, STRLEN **cachep, I32 i, I32 *offsetp, I32 uoff, const U8 **sp, const U8 *start, const U8 *send)
7e8c5dac
HS
5893{
5894 bool found = FALSE;
5895
5896 if (SvMAGICAL(sv) && !SvREADONLY(sv)) {
5897 if (!*mgp)
5898 *mgp = mg_find(sv, PERL_MAGIC_utf8);
5899 if (*mgp && (*mgp)->mg_ptr) {
5900 *cachep = (STRLEN *) (*mgp)->mg_ptr;
e23c8137 5901 ASSERT_UTF8_CACHE(*cachep);
667208dd 5902 if ((*cachep)[i] == (STRLEN)uoff) /* An exact match. */
7a5fa8a2 5903 found = TRUE;
7e8c5dac
HS
5904 else { /* We will skip to the right spot. */
5905 STRLEN forw = 0;
5906 STRLEN backw = 0;
a3b680e6 5907 const U8* p = NULL;
7e8c5dac
HS
5908
5909 /* The assumption is that going backward is half
5910 * the speed of going forward (that's where the
5911 * 2 * backw in the below comes from). (The real
5912 * figure of course depends on the UTF-8 data.) */
5913
667208dd 5914 if ((*cachep)[i] > (STRLEN)uoff) {
7e8c5dac 5915 forw = uoff;
667208dd 5916 backw = (*cachep)[i] - (STRLEN)uoff;
7e8c5dac
HS
5917
5918 if (forw < 2 * backw)
5919 p = start;
5920 else
5921 p = start + (*cachep)[i+1];
5922 }
5923 /* Try this only for the substr offset (i == 0),
5924 * not for the substr length (i == 2). */
5925 else if (i == 0) { /* (*cachep)[i] < uoff */
a3b680e6 5926 const STRLEN ulen = sv_len_utf8(sv);
7e8c5dac 5927
667208dd
JH
5928 if ((STRLEN)uoff < ulen) {
5929 forw = (STRLEN)uoff - (*cachep)[i];
5930 backw = ulen - (STRLEN)uoff;
7e8c5dac
HS
5931
5932 if (forw < 2 * backw)
5933 p = start + (*cachep)[i+1];
5934 else
5935 p = send;
5936 }
5937
5938 /* If the string is not long enough for uoff,
5939 * we could extend it, but not at this low a level. */
5940 }
5941
5942 if (p) {
5943 if (forw < 2 * backw) {
5944 while (forw--)
5945 p += UTF8SKIP(p);
5946 }
5947 else {
5948 while (backw--) {
5949 p--;
5950 while (UTF8_IS_CONTINUATION(*p))
5951 p--;
5952 }
5953 }
5954
5955 /* Update the cache. */
667208dd 5956 (*cachep)[i] = (STRLEN)uoff;
7e8c5dac 5957 (*cachep)[i+1] = p - start;
8f78557a
AE
5958
5959 /* Drop the stale "length" cache */
5960 if (i == 0) {
5961 (*cachep)[2] = 0;
5962 (*cachep)[3] = 0;
5963 }
7a5fa8a2 5964
7e8c5dac
HS
5965 found = TRUE;
5966 }
5967 }
5968 if (found) { /* Setup the return values. */
5969 *offsetp = (*cachep)[i+1];
5970 *sp = start + *offsetp;
5971 if (*sp >= send) {
5972 *sp = send;
5973 *offsetp = send - start;
5974 }
5975 else if (*sp < start) {
5976 *sp = start;
5977 *offsetp = 0;
5978 }
5979 }
5980 }
e23c8137
JH
5981#ifdef PERL_UTF8_CACHE_ASSERT
5982 if (found) {
5983 U8 *s = start;
5984 I32 n = uoff;
5985
5986 while (n-- && s < send)
5987 s += UTF8SKIP(s);
5988
5989 if (i == 0) {
5990 assert(*offsetp == s - start);
5991 assert((*cachep)[0] == (STRLEN)uoff);
5992 assert((*cachep)[1] == *offsetp);
5993 }
5994 ASSERT_UTF8_CACHE(*cachep);
5995 }
5996#endif
7e8c5dac 5997 }
e23c8137 5998
7e8c5dac
HS
5999 return found;
6000}
7a5fa8a2 6001
7e8c5dac 6002/*
645c22ef
DM
6003=for apidoc sv_pos_u2b
6004
1e54db1a 6005Converts the value pointed to by offsetp from a count of UTF-8 chars from
645c22ef
DM
6006the start of the string, to a count of the equivalent number of bytes; if
6007lenp is non-zero, it does the same to lenp, but this time starting from
6008the offset, rather than from the start of the string. Handles magic and
6009type coercion.
6010
6011=cut
6012*/
6013
7e8c5dac
HS
6014/*
6015 * sv_pos_u2b() uses, like sv_pos_b2u(), the mg_ptr of the potential
6016 * PERL_UTF8_magic of the sv to store the mapping between UTF-8 and
6017 * byte offsets. See also the comments of S_utf8_mg_pos().
6018 *
6019 */
6020
a0ed51b3 6021void
864dbfa3 6022Perl_sv_pos_u2b(pTHX_ register SV *sv, I32* offsetp, I32* lenp)
a0ed51b3 6023{
245d4a47 6024 const U8 *start;
a0ed51b3
LW
6025 STRLEN len;
6026
6027 if (!sv)
6028 return;
6029
245d4a47 6030 start = (U8*)SvPV_const(sv, len);
7e8c5dac 6031 if (len) {
b464bac0
AL
6032 STRLEN boffset = 0;
6033 STRLEN *cache = 0;
245d4a47
NC
6034 const U8 *s = start;
6035 I32 uoffset = *offsetp;
9d4ba2ae 6036 const U8 * const send = s + len;
245d4a47
NC
6037 MAGIC *mg = 0;
6038 bool found = FALSE;
7e8c5dac 6039
bdf77a2a 6040 if (utf8_mg_pos(sv, &mg, &cache, 0, offsetp, *offsetp, &s, start, send))
7e8c5dac
HS
6041 found = TRUE;
6042 if (!found && uoffset > 0) {
6043 while (s < send && uoffset--)
6044 s += UTF8SKIP(s);
6045 if (s >= send)
6046 s = send;
a3b680e6 6047 if (utf8_mg_pos_init(sv, &mg, &cache, 0, *offsetp, s, start))
7e8c5dac
HS
6048 boffset = cache[1];
6049 *offsetp = s - start;
6050 }
6051 if (lenp) {
6052 found = FALSE;
6053 start = s;
ec062429 6054 if (utf8_mg_pos(sv, &mg, &cache, 2, lenp, *lenp, &s, start, send)) {
7e8c5dac
HS
6055 *lenp -= boffset;
6056 found = TRUE;
6057 }
6058 if (!found && *lenp > 0) {
6059 I32 ulen = *lenp;
6060 if (ulen > 0)
6061 while (s < send && ulen--)
6062 s += UTF8SKIP(s);
6063 if (s >= send)
6064 s = send;
a3b680e6 6065 utf8_mg_pos_init(sv, &mg, &cache, 2, *lenp, s, start);
7e8c5dac
HS
6066 }
6067 *lenp = s - start;
6068 }
e23c8137 6069 ASSERT_UTF8_CACHE(cache);
7e8c5dac
HS
6070 }
6071 else {
6072 *offsetp = 0;
6073 if (lenp)
6074 *lenp = 0;
a0ed51b3 6075 }
e23c8137 6076
a0ed51b3
LW
6077 return;
6078}
6079
645c22ef
DM
6080/*
6081=for apidoc sv_pos_b2u
6082
6083Converts the value pointed to by offsetp from a count of bytes from the
1e54db1a 6084start of the string, to a count of the equivalent number of UTF-8 chars.
645c22ef
DM
6085Handles magic and type coercion.
6086
6087=cut
6088*/
6089
7e8c5dac
HS
6090/*
6091 * sv_pos_b2u() uses, like sv_pos_u2b(), the mg_ptr of the potential
6092 * PERL_UTF8_magic of the sv to store the mapping between UTF-8 and
6093 * byte offsets. See also the comments of S_utf8_mg_pos().
6094 *
6095 */
6096
a0ed51b3 6097void
7e8c5dac 6098Perl_sv_pos_b2u(pTHX_ register SV* sv, I32* offsetp)
a0ed51b3 6099{
83003860 6100 const U8* s;
a0ed51b3
LW
6101 STRLEN len;
6102
6103 if (!sv)
6104 return;
6105
83003860 6106 s = (const U8*)SvPV_const(sv, len);
eb160463 6107 if ((I32)len < *offsetp)
a0dbb045 6108 Perl_croak(aTHX_ "panic: sv_pos_b2u: bad byte offset");
7e8c5dac 6109 else {
83003860 6110 const U8* send = s + *offsetp;
7e8c5dac
HS
6111 MAGIC* mg = NULL;
6112 STRLEN *cache = NULL;
6113
6114 len = 0;
6115
6116 if (SvMAGICAL(sv) && !SvREADONLY(sv)) {
6117 mg = mg_find(sv, PERL_MAGIC_utf8);
6118 if (mg && mg->mg_ptr) {
6119 cache = (STRLEN *) mg->mg_ptr;
c5661c80 6120 if (cache[1] == (STRLEN)*offsetp) {
7e8c5dac
HS
6121 /* An exact match. */
6122 *offsetp = cache[0];
6123
6124 return;
6125 }
c5661c80 6126 else if (cache[1] < (STRLEN)*offsetp) {
7e8c5dac
HS
6127 /* We already know part of the way. */
6128 len = cache[0];
6129 s += cache[1];
7a5fa8a2 6130 /* Let the below loop do the rest. */
7e8c5dac
HS
6131 }
6132 else { /* cache[1] > *offsetp */
6133 /* We already know all of the way, now we may
6134 * be able to walk back. The same assumption
6135 * is made as in S_utf8_mg_pos(), namely that
6136 * walking backward is twice slower than
6137 * walking forward. */
9d4ba2ae 6138 const STRLEN forw = *offsetp;
7e8c5dac
HS
6139 STRLEN backw = cache[1] - *offsetp;
6140
6141 if (!(forw < 2 * backw)) {
83003860 6142 const U8 *p = s + cache[1];
7e8c5dac 6143 STRLEN ubackw = 0;
7a5fa8a2 6144
a5b510f2
AE
6145 cache[1] -= backw;
6146
7e8c5dac
HS
6147 while (backw--) {
6148 p--;
0aeb64d0 6149 while (UTF8_IS_CONTINUATION(*p)) {
7e8c5dac 6150 p--;
0aeb64d0
JH
6151 backw--;
6152 }
7e8c5dac
HS
6153 ubackw++;
6154 }
6155
6156 cache[0] -= ubackw;
0aeb64d0 6157 *offsetp = cache[0];
a67d7df9
TS
6158
6159 /* Drop the stale "length" cache */
6160 cache[2] = 0;
6161 cache[3] = 0;
6162
0aeb64d0 6163 return;
7e8c5dac
HS
6164 }
6165 }
6166 }
e23c8137 6167 ASSERT_UTF8_CACHE(cache);
a0dbb045 6168 }
7e8c5dac
HS
6169
6170 while (s < send) {
6171 STRLEN n = 1;
6172
6173 /* Call utf8n_to_uvchr() to validate the sequence
6174 * (unless a simple non-UTF character) */
6175 if (!UTF8_IS_INVARIANT(*s))
6176 utf8n_to_uvchr(s, UTF8SKIP(s), &n, 0);
6177 if (n > 0) {
6178 s += n;
6179 len++;
6180 }
6181 else
6182 break;
6183 }
6184
6185 if (!SvREADONLY(sv)) {
6186 if (!mg) {
6187 sv_magic(sv, 0, PERL_MAGIC_utf8, 0, 0);
6188 mg = mg_find(sv, PERL_MAGIC_utf8);
6189 }
6190 assert(mg);
6191
6192 if (!mg->mg_ptr) {
a02a5408 6193 Newxz(cache, PERL_MAGIC_UTF8_CACHESIZE * 2, STRLEN);
7e8c5dac
HS
6194 mg->mg_ptr = (char *) cache;
6195 }
6196 assert(cache);
6197
6198 cache[0] = len;
6199 cache[1] = *offsetp;
a67d7df9
TS
6200 /* Drop the stale "length" cache */
6201 cache[2] = 0;
6202 cache[3] = 0;
7e8c5dac
HS
6203 }
6204
6205 *offsetp = len;
a0ed51b3 6206 }
a0ed51b3
LW
6207 return;
6208}
6209
954c1994
GS
6210/*
6211=for apidoc sv_eq
6212
6213Returns a boolean indicating whether the strings in the two SVs are
645c22ef
DM
6214identical. Is UTF-8 and 'use bytes' aware, handles get magic, and will
6215coerce its args to strings if necessary.
954c1994
GS
6216
6217=cut
6218*/
6219
79072805 6220I32
e01b9e88 6221Perl_sv_eq(pTHX_ register SV *sv1, register SV *sv2)
79072805 6222{
e1ec3a88 6223 const char *pv1;
463ee0b2 6224 STRLEN cur1;
e1ec3a88 6225 const char *pv2;
463ee0b2 6226 STRLEN cur2;
e01b9e88 6227 I32 eq = 0;
553e1bcc
AT
6228 char *tpv = Nullch;
6229 SV* svrecode = Nullsv;
79072805 6230
e01b9e88 6231 if (!sv1) {
79072805
LW
6232 pv1 = "";
6233 cur1 = 0;
6234 }
463ee0b2 6235 else
4d84ee25 6236 pv1 = SvPV_const(sv1, cur1);
79072805 6237
e01b9e88
SC
6238 if (!sv2){
6239 pv2 = "";
6240 cur2 = 0;
92d29cee 6241 }
e01b9e88 6242 else
4d84ee25 6243 pv2 = SvPV_const(sv2, cur2);
79072805 6244
cf48d248 6245 if (cur1 && cur2 && SvUTF8(sv1) != SvUTF8(sv2) && !IN_BYTES) {
799ef3cb
JH
6246 /* Differing utf8ness.
6247 * Do not UTF8size the comparands as a side-effect. */
6248 if (PL_encoding) {
6249 if (SvUTF8(sv1)) {
553e1bcc
AT
6250 svrecode = newSVpvn(pv2, cur2);
6251 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6252 pv2 = SvPV_const(svrecode, cur2);
799ef3cb
JH
6253 }
6254 else {
553e1bcc
AT
6255 svrecode = newSVpvn(pv1, cur1);
6256 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6257 pv1 = SvPV_const(svrecode, cur1);
799ef3cb
JH
6258 }
6259 /* Now both are in UTF-8. */
0a1bd7ac
DM
6260 if (cur1 != cur2) {
6261 SvREFCNT_dec(svrecode);
799ef3cb 6262 return FALSE;
0a1bd7ac 6263 }
799ef3cb
JH
6264 }
6265 else {
6266 bool is_utf8 = TRUE;
6267
6268 if (SvUTF8(sv1)) {
6269 /* sv1 is the UTF-8 one,
6270 * if is equal it must be downgrade-able */
9d4ba2ae 6271 char * const pv = (char*)bytes_from_utf8((const U8*)pv1,
799ef3cb
JH
6272 &cur1, &is_utf8);
6273 if (pv != pv1)
553e1bcc 6274 pv1 = tpv = pv;
799ef3cb
JH
6275 }
6276 else {
6277 /* sv2 is the UTF-8 one,
6278 * if is equal it must be downgrade-able */
9d4ba2ae 6279 char * const pv = (char *)bytes_from_utf8((const U8*)pv2,
799ef3cb
JH
6280 &cur2, &is_utf8);
6281 if (pv != pv2)
553e1bcc 6282 pv2 = tpv = pv;
799ef3cb
JH
6283 }
6284 if (is_utf8) {
6285 /* Downgrade not possible - cannot be eq */
bf694877 6286 assert (tpv == 0);
799ef3cb
JH
6287 return FALSE;
6288 }
6289 }
cf48d248
JH
6290 }
6291
6292 if (cur1 == cur2)
765f542d 6293 eq = (pv1 == pv2) || memEQ(pv1, pv2, cur1);
e01b9e88 6294
553e1bcc
AT
6295 if (svrecode)
6296 SvREFCNT_dec(svrecode);
799ef3cb 6297
553e1bcc
AT
6298 if (tpv)
6299 Safefree(tpv);
cf48d248 6300
e01b9e88 6301 return eq;
79072805
LW
6302}
6303
954c1994
GS
6304/*
6305=for apidoc sv_cmp
6306
6307Compares the strings in two SVs. Returns -1, 0, or 1 indicating whether the
6308string in C<sv1> is less than, equal to, or greater than the string in
645c22ef
DM
6309C<sv2>. Is UTF-8 and 'use bytes' aware, handles get magic, and will
6310coerce its args to strings if necessary. See also C<sv_cmp_locale>.
954c1994
GS
6311
6312=cut
6313*/
6314
79072805 6315I32
e01b9e88 6316Perl_sv_cmp(pTHX_ register SV *sv1, register SV *sv2)
79072805 6317{
560a288e 6318 STRLEN cur1, cur2;
e1ec3a88
AL
6319 const char *pv1, *pv2;
6320 char *tpv = Nullch;
cf48d248 6321 I32 cmp;
553e1bcc 6322 SV *svrecode = Nullsv;
560a288e 6323
e01b9e88
SC
6324 if (!sv1) {
6325 pv1 = "";
560a288e
GS
6326 cur1 = 0;
6327 }
e01b9e88 6328 else
4d84ee25 6329 pv1 = SvPV_const(sv1, cur1);
560a288e 6330
553e1bcc 6331 if (!sv2) {
e01b9e88 6332 pv2 = "";
560a288e
GS
6333 cur2 = 0;
6334 }
e01b9e88 6335 else
4d84ee25 6336 pv2 = SvPV_const(sv2, cur2);
79072805 6337
cf48d248 6338 if (cur1 && cur2 && SvUTF8(sv1) != SvUTF8(sv2) && !IN_BYTES) {
799ef3cb
JH
6339 /* Differing utf8ness.
6340 * Do not UTF8size the comparands as a side-effect. */
cf48d248 6341 if (SvUTF8(sv1)) {
799ef3cb 6342 if (PL_encoding) {
553e1bcc
AT
6343 svrecode = newSVpvn(pv2, cur2);
6344 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6345 pv2 = SvPV_const(svrecode, cur2);
799ef3cb
JH
6346 }
6347 else {
e1ec3a88 6348 pv2 = tpv = (char*)bytes_to_utf8((const U8*)pv2, &cur2);
799ef3cb 6349 }
cf48d248
JH
6350 }
6351 else {
799ef3cb 6352 if (PL_encoding) {
553e1bcc
AT
6353 svrecode = newSVpvn(pv1, cur1);
6354 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6355 pv1 = SvPV_const(svrecode, cur1);
799ef3cb
JH
6356 }
6357 else {
e1ec3a88 6358 pv1 = tpv = (char*)bytes_to_utf8((const U8*)pv1, &cur1);
799ef3cb 6359 }
cf48d248
JH
6360 }
6361 }
6362
e01b9e88 6363 if (!cur1) {
cf48d248 6364 cmp = cur2 ? -1 : 0;
e01b9e88 6365 } else if (!cur2) {
cf48d248
JH
6366 cmp = 1;
6367 } else {
e1ec3a88 6368 const I32 retval = memcmp((const void*)pv1, (const void*)pv2, cur1 < cur2 ? cur1 : cur2);
e01b9e88
SC
6369
6370 if (retval) {
cf48d248 6371 cmp = retval < 0 ? -1 : 1;
e01b9e88 6372 } else if (cur1 == cur2) {
cf48d248
JH
6373 cmp = 0;
6374 } else {
6375 cmp = cur1 < cur2 ? -1 : 1;
e01b9e88 6376 }
cf48d248 6377 }
16660edb 6378
553e1bcc
AT
6379 if (svrecode)
6380 SvREFCNT_dec(svrecode);
799ef3cb 6381
553e1bcc
AT
6382 if (tpv)
6383 Safefree(tpv);
cf48d248
JH
6384
6385 return cmp;
bbce6d69 6386}
16660edb 6387
c461cf8f
JH
6388/*
6389=for apidoc sv_cmp_locale
6390
645c22ef
DM
6391Compares the strings in two SVs in a locale-aware manner. Is UTF-8 and
6392'use bytes' aware, handles get magic, and will coerce its args to strings
6393if necessary.  See also C<sv_cmp>.
c461cf8f
JH
6394
6395=cut
6396*/
6397
bbce6d69 6398I32
864dbfa3 6399Perl_sv_cmp_locale(pTHX_ register SV *sv1, register SV *sv2)
bbce6d69 6400{
36477c24 6401#ifdef USE_LOCALE_COLLATE
16660edb 6402
bbce6d69 6403 char *pv1, *pv2;
6404 STRLEN len1, len2;
6405 I32 retval;
16660edb 6406
3280af22 6407 if (PL_collation_standard)
bbce6d69 6408 goto raw_compare;
16660edb 6409
bbce6d69 6410 len1 = 0;
8ac85365 6411 pv1 = sv1 ? sv_collxfrm(sv1, &len1) : (char *) NULL;
bbce6d69 6412 len2 = 0;
8ac85365 6413 pv2 = sv2 ? sv_collxfrm(sv2, &len2) : (char *) NULL;
16660edb 6414
bbce6d69 6415 if (!pv1 || !len1) {
6416 if (pv2 && len2)
6417 return -1;
6418 else
6419 goto raw_compare;
6420 }
6421 else {
6422 if (!pv2 || !len2)
6423 return 1;
6424 }
16660edb 6425
bbce6d69 6426 retval = memcmp((void*)pv1, (void*)pv2, len1 < len2 ? len1 : len2);
16660edb 6427
bbce6d69 6428 if (retval)
16660edb 6429 return retval < 0 ? -1 : 1;
6430
bbce6d69 6431 /*
6432 * When the result of collation is equality, that doesn't mean
6433 * that there are no differences -- some locales exclude some
6434 * characters from consideration. So to avoid false equalities,
6435 * we use the raw string as a tiebreaker.
6436 */
16660edb 6437
bbce6d69 6438 raw_compare:
6439 /* FALL THROUGH */
16660edb 6440
36477c24 6441#endif /* USE_LOCALE_COLLATE */
16660edb 6442
bbce6d69 6443 return sv_cmp(sv1, sv2);
6444}
79072805 6445
645c22ef 6446
36477c24 6447#ifdef USE_LOCALE_COLLATE
645c22ef 6448
7a4c00b4 6449/*
645c22ef
DM
6450=for apidoc sv_collxfrm
6451
6452Add Collate Transform magic to an SV if it doesn't already have it.
6453
6454Any scalar variable may carry PERL_MAGIC_collxfrm magic that contains the
6455scalar data of the variable, but transformed to such a format that a normal
6456memory comparison can be used to compare the data according to the locale
6457settings.
6458
6459=cut
6460*/
6461
bbce6d69 6462char *
864dbfa3 6463Perl_sv_collxfrm(pTHX_ SV *sv, STRLEN *nxp)
bbce6d69 6464{
7a4c00b4 6465 MAGIC *mg;
16660edb 6466
14befaf4 6467 mg = SvMAGICAL(sv) ? mg_find(sv, PERL_MAGIC_collxfrm) : (MAGIC *) NULL;
3280af22 6468 if (!mg || !mg->mg_ptr || *(U32*)mg->mg_ptr != PL_collation_ix) {
93524f2b
NC
6469 const char *s;
6470 char *xf;
bbce6d69 6471 STRLEN len, xlen;
6472
7a4c00b4 6473 if (mg)
6474 Safefree(mg->mg_ptr);
93524f2b 6475 s = SvPV_const(sv, len);
bbce6d69 6476 if ((xf = mem_collxfrm(s, len, &xlen))) {
ff0cee69 6477 if (SvREADONLY(sv)) {
6478 SAVEFREEPV(xf);
6479 *nxp = xlen;
3280af22 6480 return xf + sizeof(PL_collation_ix);
ff0cee69 6481 }
7a4c00b4 6482 if (! mg) {
14befaf4
DM
6483 sv_magic(sv, 0, PERL_MAGIC_collxfrm, 0, 0);
6484 mg = mg_find(sv, PERL_MAGIC_collxfrm);
7a4c00b4 6485 assert(mg);
bbce6d69 6486 }
7a4c00b4 6487 mg->mg_ptr = xf;
565764a8 6488 mg->mg_len = xlen;
7a4c00b4 6489 }
6490 else {
ff0cee69 6491 if (mg) {
6492 mg->mg_ptr = NULL;
565764a8 6493 mg->mg_len = -1;
ff0cee69 6494 }
bbce6d69 6495 }
6496 }
7a4c00b4 6497 if (mg && mg->mg_ptr) {
565764a8 6498 *nxp = mg->mg_len;
3280af22 6499 return mg->mg_ptr + sizeof(PL_collation_ix);
bbce6d69 6500 }
6501 else {
6502 *nxp = 0;
6503 return NULL;
16660edb 6504 }
79072805
LW
6505}
6506
36477c24 6507#endif /* USE_LOCALE_COLLATE */
bbce6d69 6508
c461cf8f
JH
6509/*
6510=for apidoc sv_gets
6511
6512Get a line from the filehandle and store it into the SV, optionally
6513appending to the currently-stored string.
6514
6515=cut
6516*/
6517
79072805 6518char *
864dbfa3 6519Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append)
79072805 6520{
e1ec3a88 6521 const char *rsptr;
c07a80fd 6522 STRLEN rslen;
6523 register STDCHAR rslast;
6524 register STDCHAR *bp;
6525 register I32 cnt;
9c5ffd7c 6526 I32 i = 0;
8bfdd7d9 6527 I32 rspara = 0;
e311fd51 6528 I32 recsize;
c07a80fd 6529
bc44a8a2
NC
6530 if (SvTHINKFIRST(sv))
6531 sv_force_normal_flags(sv, append ? 0 : SV_COW_DROP_PV);
765f542d
NC
6532 /* XXX. If you make this PVIV, then copy on write can copy scalars read
6533 from <>.
6534 However, perlbench says it's slower, because the existing swipe code
6535 is faster than copy on write.
6536 Swings and roundabouts. */
862a34c6 6537 SvUPGRADE(sv, SVt_PV);
99491443 6538
ff68c719 6539 SvSCREAM_off(sv);
efd8b2ba
AE
6540
6541 if (append) {
6542 if (PerlIO_isutf8(fp)) {
6543 if (!SvUTF8(sv)) {
6544 sv_utf8_upgrade_nomg(sv);
6545 sv_pos_u2b(sv,&append,0);
6546 }
6547 } else if (SvUTF8(sv)) {
1b6737cc 6548 SV * const tsv = NEWSV(0,0);
efd8b2ba
AE
6549 sv_gets(tsv, fp, 0);
6550 sv_utf8_upgrade_nomg(tsv);
6551 SvCUR_set(sv,append);
6552 sv_catsv(sv,tsv);
6553 sv_free(tsv);
6554 goto return_string_or_null;
6555 }
6556 }
6557
6558 SvPOK_only(sv);
6559 if (PerlIO_isutf8(fp))
6560 SvUTF8_on(sv);
c07a80fd 6561
923e4eb5 6562 if (IN_PERL_COMPILETIME) {
8bfdd7d9
HS
6563 /* we always read code in line mode */
6564 rsptr = "\n";
6565 rslen = 1;
6566 }
6567 else if (RsSNARF(PL_rs)) {
7a5fa8a2
NIS
6568 /* If it is a regular disk file use size from stat() as estimate
6569 of amount we are going to read - may result in malloc-ing
6570 more memory than we realy need if layers bellow reduce
e468d35b
NIS
6571 size we read (e.g. CRLF or a gzip layer)
6572 */
e311fd51 6573 Stat_t st;
e468d35b 6574 if (!PerlLIO_fstat(PerlIO_fileno(fp), &st) && S_ISREG(st.st_mode)) {
f54cb97a 6575 const Off_t offset = PerlIO_tell(fp);
58f1856e 6576 if (offset != (Off_t) -1 && st.st_size + append > offset) {
e468d35b
NIS
6577 (void) SvGROW(sv, (STRLEN)((st.st_size - offset) + append + 1));
6578 }
6579 }
c07a80fd 6580 rsptr = NULL;
6581 rslen = 0;
6582 }
3280af22 6583 else if (RsRECORD(PL_rs)) {
e311fd51 6584 I32 bytesread;
5b2b9c68
HM
6585 char *buffer;
6586
6587 /* Grab the size of the record we're getting */
3280af22 6588 recsize = SvIV(SvRV(PL_rs));
e311fd51 6589 buffer = SvGROW(sv, (STRLEN)(recsize + append + 1)) + append;
5b2b9c68
HM
6590 /* Go yank in */
6591#ifdef VMS
6592 /* VMS wants read instead of fread, because fread doesn't respect */
6593 /* RMS record boundaries. This is not necessarily a good thing to be */
e468d35b
NIS
6594 /* doing, but we've got no other real choice - except avoid stdio
6595 as implementation - perhaps write a :vms layer ?
6596 */
5b2b9c68
HM
6597 bytesread = PerlLIO_read(PerlIO_fileno(fp), buffer, recsize);
6598#else
6599 bytesread = PerlIO_read(fp, buffer, recsize);
6600#endif
27e6ca2d
AE
6601 if (bytesread < 0)
6602 bytesread = 0;
e311fd51 6603 SvCUR_set(sv, bytesread += append);
e670df4e 6604 buffer[bytesread] = '\0';
efd8b2ba 6605 goto return_string_or_null;
5b2b9c68 6606 }
3280af22 6607 else if (RsPARA(PL_rs)) {
c07a80fd 6608 rsptr = "\n\n";
6609 rslen = 2;
8bfdd7d9 6610 rspara = 1;
c07a80fd 6611 }
7d59b7e4
NIS
6612 else {
6613 /* Get $/ i.e. PL_rs into same encoding as stream wants */
6614 if (PerlIO_isutf8(fp)) {
6615 rsptr = SvPVutf8(PL_rs, rslen);
6616 }
6617 else {
6618 if (SvUTF8(PL_rs)) {
6619 if (!sv_utf8_downgrade(PL_rs, TRUE)) {
6620 Perl_croak(aTHX_ "Wide character in $/");
6621 }
6622 }
93524f2b 6623 rsptr = SvPV_const(PL_rs, rslen);
7d59b7e4
NIS
6624 }
6625 }
6626
c07a80fd 6627 rslast = rslen ? rsptr[rslen - 1] : '\0';
6628
8bfdd7d9 6629 if (rspara) { /* have to do this both before and after */
79072805 6630 do { /* to make sure file boundaries work right */
760ac839 6631 if (PerlIO_eof(fp))
a0d0e21e 6632 return 0;
760ac839 6633 i = PerlIO_getc(fp);
79072805 6634 if (i != '\n') {
a0d0e21e
LW
6635 if (i == -1)
6636 return 0;
760ac839 6637 PerlIO_ungetc(fp,i);
79072805
LW
6638 break;
6639 }
6640 } while (i != EOF);
6641 }
c07a80fd 6642
760ac839
LW
6643 /* See if we know enough about I/O mechanism to cheat it ! */
6644
6645 /* This used to be #ifdef test - it is made run-time test for ease
1c846c1f 6646 of abstracting out stdio interface. One call should be cheap
760ac839
LW
6647 enough here - and may even be a macro allowing compile
6648 time optimization.
6649 */
6650
6651 if (PerlIO_fast_gets(fp)) {
6652
6653 /*
6654 * We're going to steal some values from the stdio struct
6655 * and put EVERYTHING in the innermost loop into registers.
6656 */
6657 register STDCHAR *ptr;
6658 STRLEN bpx;
6659 I32 shortbuffered;
6660
16660edb 6661#if defined(VMS) && defined(PERLIO_IS_STDIO)
6662 /* An ungetc()d char is handled separately from the regular
6663 * buffer, so we getc() it back out and stuff it in the buffer.
6664 */
6665 i = PerlIO_getc(fp);
6666 if (i == EOF) return 0;
6667 *(--((*fp)->_ptr)) = (unsigned char) i;
6668 (*fp)->_cnt++;
6669#endif
c07a80fd 6670
c2960299 6671 /* Here is some breathtakingly efficient cheating */
c07a80fd 6672
a20bf0c3 6673 cnt = PerlIO_get_cnt(fp); /* get count into register */
e468d35b 6674 /* make sure we have the room */
7a5fa8a2 6675 if ((I32)(SvLEN(sv) - append) <= cnt + 1) {
e468d35b 6676 /* Not room for all of it
7a5fa8a2 6677 if we are looking for a separator and room for some
e468d35b
NIS
6678 */
6679 if (rslen && cnt > 80 && (I32)SvLEN(sv) > append) {
7a5fa8a2 6680 /* just process what we have room for */
79072805
LW
6681 shortbuffered = cnt - SvLEN(sv) + append + 1;
6682 cnt -= shortbuffered;
6683 }
6684 else {
6685 shortbuffered = 0;
bbce6d69 6686 /* remember that cnt can be negative */
eb160463 6687 SvGROW(sv, (STRLEN)(append + (cnt <= 0 ? 2 : (cnt + 1))));
79072805
LW
6688 }
6689 }
7a5fa8a2 6690 else
79072805 6691 shortbuffered = 0;
3f7c398e 6692 bp = (STDCHAR*)SvPVX_const(sv) + append; /* move these two too to registers */
a20bf0c3 6693 ptr = (STDCHAR*)PerlIO_get_ptr(fp);
16660edb 6694 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6695 "Screamer: entering, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
16660edb 6696 DEBUG_P(PerlIO_printf(Perl_debug_log,
ba7abf9d 6697 "Screamer: entering: PerlIO * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6698 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6699 PTR2UV(PerlIO_has_base(fp) ? PerlIO_get_base(fp) : 0)));
79072805
LW
6700 for (;;) {
6701 screamer:
93a17b20 6702 if (cnt > 0) {
c07a80fd 6703 if (rslen) {
760ac839
LW
6704 while (cnt > 0) { /* this | eat */
6705 cnt--;
c07a80fd 6706 if ((*bp++ = *ptr++) == rslast) /* really | dust */
6707 goto thats_all_folks; /* screams | sed :-) */
6708 }
6709 }
6710 else {
1c846c1f
NIS
6711 Copy(ptr, bp, cnt, char); /* this | eat */
6712 bp += cnt; /* screams | dust */
c07a80fd 6713 ptr += cnt; /* louder | sed :-) */
a5f75d66 6714 cnt = 0;
93a17b20 6715 }
79072805
LW
6716 }
6717
748a9306 6718 if (shortbuffered) { /* oh well, must extend */
79072805
LW
6719 cnt = shortbuffered;
6720 shortbuffered = 0;
3f7c398e 6721 bpx = bp - (STDCHAR*)SvPVX_const(sv); /* box up before relocation */
79072805
LW
6722 SvCUR_set(sv, bpx);
6723 SvGROW(sv, SvLEN(sv) + append + cnt + 2);
3f7c398e 6724 bp = (STDCHAR*)SvPVX_const(sv) + bpx; /* unbox after relocation */
79072805
LW
6725 continue;
6726 }
6727
16660edb 6728 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841
GS
6729 "Screamer: going to getc, ptr=%"UVuf", cnt=%ld\n",
6730 PTR2UV(ptr),(long)cnt));
cc00df79 6731 PerlIO_set_ptrcnt(fp, (STDCHAR*)ptr, cnt); /* deregisterize cnt and ptr */
ba7abf9d 6732#if 0
16660edb 6733 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6734 "Screamer: pre: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6735 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6736 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
ba7abf9d 6737#endif
1c846c1f 6738 /* This used to call 'filbuf' in stdio form, but as that behaves like
774d564b 6739 getc when cnt <= 0 we use PerlIO_getc here to avoid introducing
6740 another abstraction. */
760ac839 6741 i = PerlIO_getc(fp); /* get more characters */
ba7abf9d 6742#if 0
16660edb 6743 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6744 "Screamer: post: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6745 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6746 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
ba7abf9d 6747#endif
a20bf0c3
JH
6748 cnt = PerlIO_get_cnt(fp);
6749 ptr = (STDCHAR*)PerlIO_get_ptr(fp); /* reregisterize cnt and ptr */
16660edb 6750 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6751 "Screamer: after getc, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
79072805 6752
748a9306
LW
6753 if (i == EOF) /* all done for ever? */
6754 goto thats_really_all_folks;
6755
3f7c398e 6756 bpx = bp - (STDCHAR*)SvPVX_const(sv); /* box up before relocation */
79072805
LW
6757 SvCUR_set(sv, bpx);
6758 SvGROW(sv, bpx + cnt + 2);
3f7c398e 6759 bp = (STDCHAR*)SvPVX_const(sv) + bpx; /* unbox after relocation */
c07a80fd 6760
eb160463 6761 *bp++ = (STDCHAR)i; /* store character from PerlIO_getc */
79072805 6762
c07a80fd 6763 if (rslen && (STDCHAR)i == rslast) /* all done for now? */
79072805 6764 goto thats_all_folks;
79072805
LW
6765 }
6766
6767thats_all_folks:
3f7c398e 6768 if ((rslen > 1 && (STRLEN)(bp - (STDCHAR*)SvPVX_const(sv)) < rslen) ||
36477c24 6769 memNE((char*)bp - rslen, rsptr, rslen))
760ac839 6770 goto screamer; /* go back to the fray */
79072805
LW
6771thats_really_all_folks:
6772 if (shortbuffered)
6773 cnt += shortbuffered;
16660edb 6774 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6775 "Screamer: quitting, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
cc00df79 6776 PerlIO_set_ptrcnt(fp, (STDCHAR*)ptr, cnt); /* put these back or we're in trouble */
16660edb 6777 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6778 "Screamer: end: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6779 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6780 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
79072805 6781 *bp = '\0';
3f7c398e 6782 SvCUR_set(sv, bp - (STDCHAR*)SvPVX_const(sv)); /* set length */
16660edb 6783 DEBUG_P(PerlIO_printf(Perl_debug_log,
fb73857a 6784 "Screamer: done, len=%ld, string=|%.*s|\n",
3f7c398e 6785 (long)SvCUR(sv),(int)SvCUR(sv),SvPVX_const(sv)));
760ac839
LW
6786 }
6787 else
79072805 6788 {
6edd2cd5 6789 /*The big, slow, and stupid way. */
27da23d5 6790#ifdef USE_HEAP_INSTEAD_OF_STACK /* Even slower way. */
6edd2cd5 6791 STDCHAR *buf = 0;
a02a5408 6792 Newx(buf, 8192, STDCHAR);
6edd2cd5 6793 assert(buf);
4d2c4e07 6794#else
6edd2cd5 6795 STDCHAR buf[8192];
4d2c4e07 6796#endif
79072805 6797
760ac839 6798screamer2:
c07a80fd 6799 if (rslen) {
6867be6d 6800 const register STDCHAR *bpe = buf + sizeof(buf);
760ac839 6801 bp = buf;
eb160463 6802 while ((i = PerlIO_getc(fp)) != EOF && (*bp++ = (STDCHAR)i) != rslast && bp < bpe)
760ac839
LW
6803 ; /* keep reading */
6804 cnt = bp - buf;
c07a80fd 6805 }
6806 else {
760ac839 6807 cnt = PerlIO_read(fp,(char*)buf, sizeof(buf));
16660edb 6808 /* Accomodate broken VAXC compiler, which applies U8 cast to
6809 * both args of ?: operator, causing EOF to change into 255
6810 */
37be0adf 6811 if (cnt > 0)
cbe9e203
JH
6812 i = (U8)buf[cnt - 1];
6813 else
37be0adf 6814 i = EOF;
c07a80fd 6815 }
79072805 6816
cbe9e203
JH
6817 if (cnt < 0)
6818 cnt = 0; /* we do need to re-set the sv even when cnt <= 0 */
6819 if (append)
6820 sv_catpvn(sv, (char *) buf, cnt);
6821 else
6822 sv_setpvn(sv, (char *) buf, cnt);
c07a80fd 6823
6824 if (i != EOF && /* joy */
6825 (!rslen ||
6826 SvCUR(sv) < rslen ||
3f7c398e 6827 memNE(SvPVX_const(sv) + SvCUR(sv) - rslen, rsptr, rslen)))
79072805
LW
6828 {
6829 append = -1;
63e4d877
CS
6830 /*
6831 * If we're reading from a TTY and we get a short read,
6832 * indicating that the user hit his EOF character, we need
6833 * to notice it now, because if we try to read from the TTY
6834 * again, the EOF condition will disappear.
6835 *
6836 * The comparison of cnt to sizeof(buf) is an optimization
6837 * that prevents unnecessary calls to feof().
6838 *
6839 * - jik 9/25/96
6840 */
6841 if (!(cnt < sizeof(buf) && PerlIO_eof(fp)))
6842 goto screamer2;
79072805 6843 }
6edd2cd5 6844
27da23d5 6845#ifdef USE_HEAP_INSTEAD_OF_STACK
6edd2cd5
JH
6846 Safefree(buf);
6847#endif
79072805
LW
6848 }
6849
8bfdd7d9 6850 if (rspara) { /* have to do this both before and after */
c07a80fd 6851 while (i != EOF) { /* to make sure file boundaries work right */
760ac839 6852 i = PerlIO_getc(fp);
79072805 6853 if (i != '\n') {
760ac839 6854 PerlIO_ungetc(fp,i);
79072805
LW
6855 break;
6856 }
6857 }
6858 }
c07a80fd 6859
efd8b2ba 6860return_string_or_null:
c07a80fd 6861 return (SvCUR(sv) - append) ? SvPVX(sv) : Nullch;
79072805
LW
6862}
6863
954c1994
GS
6864/*
6865=for apidoc sv_inc
6866
645c22ef
DM
6867Auto-increment of the value in the SV, doing string to numeric conversion
6868if necessary. Handles 'get' magic.
954c1994
GS
6869
6870=cut
6871*/
6872
79072805 6873void
864dbfa3 6874Perl_sv_inc(pTHX_ register SV *sv)
79072805
LW
6875{
6876 register char *d;
463ee0b2 6877 int flags;
79072805
LW
6878
6879 if (!sv)
6880 return;
5b295bef 6881 SvGETMAGIC(sv);
ed6116ce 6882 if (SvTHINKFIRST(sv)) {
765f542d
NC
6883 if (SvIsCOW(sv))
6884 sv_force_normal_flags(sv, 0);
0f15f207 6885 if (SvREADONLY(sv)) {
923e4eb5 6886 if (IN_PERL_RUNTIME)
cea2e8a9 6887 Perl_croak(aTHX_ PL_no_modify);
0f15f207 6888 }
a0d0e21e 6889 if (SvROK(sv)) {
b5be31e9 6890 IV i;
9e7bc3e8
JD
6891 if (SvAMAGIC(sv) && AMG_CALLun(sv,inc))
6892 return;
56431972 6893 i = PTR2IV(SvRV(sv));
b5be31e9
SM
6894 sv_unref(sv);
6895 sv_setiv(sv, i);
a0d0e21e 6896 }
ed6116ce 6897 }
8990e307 6898 flags = SvFLAGS(sv);
28e5dec8
JH
6899 if ((flags & (SVp_NOK|SVp_IOK)) == SVp_NOK) {
6900 /* It's (privately or publicly) a float, but not tested as an
6901 integer, so test it to see. */
d460ef45 6902 (void) SvIV(sv);
28e5dec8
JH
6903 flags = SvFLAGS(sv);
6904 }
6905 if ((flags & SVf_IOK) || ((flags & (SVp_IOK | SVp_NOK)) == SVp_IOK)) {
6906 /* It's publicly an integer, or privately an integer-not-float */
59d8ce62 6907#ifdef PERL_PRESERVE_IVUV
28e5dec8 6908 oops_its_int:
59d8ce62 6909#endif
25da4f38
IZ
6910 if (SvIsUV(sv)) {
6911 if (SvUVX(sv) == UV_MAX)
a1e868e7 6912 sv_setnv(sv, UV_MAX_P1);
25da4f38
IZ
6913 else
6914 (void)SvIOK_only_UV(sv);
607fa7f2 6915 SvUV_set(sv, SvUVX(sv) + 1);
25da4f38
IZ
6916 } else {
6917 if (SvIVX(sv) == IV_MAX)
28e5dec8 6918 sv_setuv(sv, (UV)IV_MAX + 1);
25da4f38
IZ
6919 else {
6920 (void)SvIOK_only(sv);
45977657 6921 SvIV_set(sv, SvIVX(sv) + 1);
1c846c1f 6922 }
55497cff 6923 }
79072805
LW
6924 return;
6925 }
28e5dec8
JH
6926 if (flags & SVp_NOK) {
6927 (void)SvNOK_only(sv);
9d6ce603 6928 SvNV_set(sv, SvNVX(sv) + 1.0);
28e5dec8
JH
6929 return;
6930 }
6931
3f7c398e 6932 if (!(flags & SVp_POK) || !*SvPVX_const(sv)) {
28e5dec8 6933 if ((flags & SVTYPEMASK) < SVt_PVIV)
f5282e15 6934 sv_upgrade(sv, ((flags & SVTYPEMASK) > SVt_IV ? SVt_PVIV : SVt_IV));
28e5dec8 6935 (void)SvIOK_only(sv);
45977657 6936 SvIV_set(sv, 1);
79072805
LW
6937 return;
6938 }
463ee0b2 6939 d = SvPVX(sv);
79072805
LW
6940 while (isALPHA(*d)) d++;
6941 while (isDIGIT(*d)) d++;
6942 if (*d) {
28e5dec8 6943#ifdef PERL_PRESERVE_IVUV
d1be9408 6944 /* Got to punt this as an integer if needs be, but we don't issue
28e5dec8
JH
6945 warnings. Probably ought to make the sv_iv_please() that does
6946 the conversion if possible, and silently. */
504618e9 6947 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), NULL);
28e5dec8
JH
6948 if (numtype && !(numtype & IS_NUMBER_INFINITY)) {
6949 /* Need to try really hard to see if it's an integer.
6950 9.22337203685478e+18 is an integer.
6951 but "9.22337203685478e+18" + 0 is UV=9223372036854779904
6952 so $a="9.22337203685478e+18"; $a+0; $a++
6953 needs to be the same as $a="9.22337203685478e+18"; $a++
6954 or we go insane. */
d460ef45 6955
28e5dec8
JH
6956 (void) sv_2iv(sv);
6957 if (SvIOK(sv))
6958 goto oops_its_int;
6959
6960 /* sv_2iv *should* have made this an NV */
6961 if (flags & SVp_NOK) {
6962 (void)SvNOK_only(sv);
9d6ce603 6963 SvNV_set(sv, SvNVX(sv) + 1.0);
28e5dec8
JH
6964 return;
6965 }
6966 /* I don't think we can get here. Maybe I should assert this
6967 And if we do get here I suspect that sv_setnv will croak. NWC
6968 Fall through. */
6969#if defined(USE_LONG_DOUBLE)
6970 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_inc punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"PERL_PRIgldbl"\n",
3f7c398e 6971 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8 6972#else
1779d84d 6973 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_inc punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"NVgf"\n",
3f7c398e 6974 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8
JH
6975#endif
6976 }
6977#endif /* PERL_PRESERVE_IVUV */
3f7c398e 6978 sv_setnv(sv,Atof(SvPVX_const(sv)) + 1.0);
79072805
LW
6979 return;
6980 }
6981 d--;
3f7c398e 6982 while (d >= SvPVX_const(sv)) {
79072805
LW
6983 if (isDIGIT(*d)) {
6984 if (++*d <= '9')
6985 return;
6986 *(d--) = '0';
6987 }
6988 else {
9d116dd7
JH
6989#ifdef EBCDIC
6990 /* MKS: The original code here died if letters weren't consecutive.
6991 * at least it didn't have to worry about non-C locales. The
6992 * new code assumes that ('z'-'a')==('Z'-'A'), letters are
1c846c1f 6993 * arranged in order (although not consecutively) and that only
9d116dd7
JH
6994 * [A-Za-z] are accepted by isALPHA in the C locale.
6995 */
6996 if (*d != 'z' && *d != 'Z') {
6997 do { ++*d; } while (!isALPHA(*d));
6998 return;
6999 }
7000 *(d--) -= 'z' - 'a';
7001#else
79072805
LW
7002 ++*d;
7003 if (isALPHA(*d))
7004 return;
7005 *(d--) -= 'z' - 'a' + 1;
9d116dd7 7006#endif
79072805
LW
7007 }
7008 }
7009 /* oh,oh, the number grew */
7010 SvGROW(sv, SvCUR(sv) + 2);
b162af07 7011 SvCUR_set(sv, SvCUR(sv) + 1);
3f7c398e 7012 for (d = SvPVX(sv) + SvCUR(sv); d > SvPVX_const(sv); d--)
79072805
LW
7013 *d = d[-1];
7014 if (isDIGIT(d[1]))
7015 *d = '1';
7016 else
7017 *d = d[1];
7018}
7019
954c1994
GS
7020/*
7021=for apidoc sv_dec
7022
645c22ef
DM
7023Auto-decrement of the value in the SV, doing string to numeric conversion
7024if necessary. Handles 'get' magic.
954c1994
GS
7025
7026=cut
7027*/
7028
79072805 7029void
864dbfa3 7030Perl_sv_dec(pTHX_ register SV *sv)
79072805 7031{
463ee0b2
LW
7032 int flags;
7033
79072805
LW
7034 if (!sv)
7035 return;
5b295bef 7036 SvGETMAGIC(sv);
ed6116ce 7037 if (SvTHINKFIRST(sv)) {
765f542d
NC
7038 if (SvIsCOW(sv))
7039 sv_force_normal_flags(sv, 0);
0f15f207 7040 if (SvREADONLY(sv)) {
923e4eb5 7041 if (IN_PERL_RUNTIME)
cea2e8a9 7042 Perl_croak(aTHX_ PL_no_modify);
0f15f207 7043 }
a0d0e21e 7044 if (SvROK(sv)) {
b5be31e9 7045 IV i;
9e7bc3e8
JD
7046 if (SvAMAGIC(sv) && AMG_CALLun(sv,dec))
7047 return;
56431972 7048 i = PTR2IV(SvRV(sv));
b5be31e9
SM
7049 sv_unref(sv);
7050 sv_setiv(sv, i);
a0d0e21e 7051 }
ed6116ce 7052 }
28e5dec8
JH
7053 /* Unlike sv_inc we don't have to worry about string-never-numbers
7054 and keeping them magic. But we mustn't warn on punting */
8990e307 7055 flags = SvFLAGS(sv);
28e5dec8
JH
7056 if ((flags & SVf_IOK) || ((flags & (SVp_IOK | SVp_NOK)) == SVp_IOK)) {
7057 /* It's publicly an integer, or privately an integer-not-float */
59d8ce62 7058#ifdef PERL_PRESERVE_IVUV
28e5dec8 7059 oops_its_int:
59d8ce62 7060#endif
25da4f38
IZ
7061 if (SvIsUV(sv)) {
7062 if (SvUVX(sv) == 0) {
7063 (void)SvIOK_only(sv);
45977657 7064 SvIV_set(sv, -1);
25da4f38
IZ
7065 }
7066 else {
7067 (void)SvIOK_only_UV(sv);
f4eee32f 7068 SvUV_set(sv, SvUVX(sv) - 1);
1c846c1f 7069 }
25da4f38
IZ
7070 } else {
7071 if (SvIVX(sv) == IV_MIN)
65202027 7072 sv_setnv(sv, (NV)IV_MIN - 1.0);
25da4f38
IZ
7073 else {
7074 (void)SvIOK_only(sv);
45977657 7075 SvIV_set(sv, SvIVX(sv) - 1);
1c846c1f 7076 }
55497cff 7077 }
7078 return;
7079 }
28e5dec8 7080 if (flags & SVp_NOK) {
9d6ce603 7081 SvNV_set(sv, SvNVX(sv) - 1.0);
28e5dec8
JH
7082 (void)SvNOK_only(sv);
7083 return;
7084 }
8990e307 7085 if (!(flags & SVp_POK)) {
ef088171
NC
7086 if ((flags & SVTYPEMASK) < SVt_PVIV)
7087 sv_upgrade(sv, ((flags & SVTYPEMASK) > SVt_IV) ? SVt_PVIV : SVt_IV);
7088 SvIV_set(sv, -1);
7089 (void)SvIOK_only(sv);
79072805
LW
7090 return;
7091 }
28e5dec8
JH
7092#ifdef PERL_PRESERVE_IVUV
7093 {
504618e9 7094 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), NULL);
28e5dec8
JH
7095 if (numtype && !(numtype & IS_NUMBER_INFINITY)) {
7096 /* Need to try really hard to see if it's an integer.
7097 9.22337203685478e+18 is an integer.
7098 but "9.22337203685478e+18" + 0 is UV=9223372036854779904
7099 so $a="9.22337203685478e+18"; $a+0; $a--
7100 needs to be the same as $a="9.22337203685478e+18"; $a--
7101 or we go insane. */
d460ef45 7102
28e5dec8
JH
7103 (void) sv_2iv(sv);
7104 if (SvIOK(sv))
7105 goto oops_its_int;
7106
7107 /* sv_2iv *should* have made this an NV */
7108 if (flags & SVp_NOK) {
7109 (void)SvNOK_only(sv);
9d6ce603 7110 SvNV_set(sv, SvNVX(sv) - 1.0);
28e5dec8
JH
7111 return;
7112 }
7113 /* I don't think we can get here. Maybe I should assert this
7114 And if we do get here I suspect that sv_setnv will croak. NWC
7115 Fall through. */
7116#if defined(USE_LONG_DOUBLE)
7117 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_dec punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"PERL_PRIgldbl"\n",
3f7c398e 7118 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8 7119#else
1779d84d 7120 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_dec punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"NVgf"\n",
3f7c398e 7121 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8
JH
7122#endif
7123 }
7124 }
7125#endif /* PERL_PRESERVE_IVUV */
3f7c398e 7126 sv_setnv(sv,Atof(SvPVX_const(sv)) - 1.0); /* punt */
79072805
LW
7127}
7128
954c1994
GS
7129/*
7130=for apidoc sv_mortalcopy
7131
645c22ef 7132Creates a new SV which is a copy of the original SV (using C<sv_setsv>).
d4236ebc
DM
7133The new SV is marked as mortal. It will be destroyed "soon", either by an
7134explicit call to FREETMPS, or by an implicit call at places such as
7135statement boundaries. See also C<sv_newmortal> and C<sv_2mortal>.
954c1994
GS
7136
7137=cut
7138*/
7139
79072805
LW
7140/* Make a string that will exist for the duration of the expression
7141 * evaluation. Actually, it may have to last longer than that, but
7142 * hopefully we won't free it until it has been assigned to a
7143 * permanent location. */
7144
7145SV *
864dbfa3 7146Perl_sv_mortalcopy(pTHX_ SV *oldstr)
79072805 7147{
463ee0b2 7148 register SV *sv;
b881518d 7149
4561caa4 7150 new_SV(sv);
79072805 7151 sv_setsv(sv,oldstr);
677b06e3
GS
7152 EXTEND_MORTAL(1);
7153 PL_tmps_stack[++PL_tmps_ix] = sv;
8990e307
LW
7154 SvTEMP_on(sv);
7155 return sv;
7156}
7157
954c1994
GS
7158/*
7159=for apidoc sv_newmortal
7160
645c22ef 7161Creates a new null SV which is mortal. The reference count of the SV is
d4236ebc
DM
7162set to 1. It will be destroyed "soon", either by an explicit call to
7163FREETMPS, or by an implicit call at places such as statement boundaries.
7164See also C<sv_mortalcopy> and C<sv_2mortal>.
954c1994
GS
7165
7166=cut
7167*/
7168
8990e307 7169SV *
864dbfa3 7170Perl_sv_newmortal(pTHX)
8990e307
LW
7171{
7172 register SV *sv;
7173
4561caa4 7174 new_SV(sv);
8990e307 7175 SvFLAGS(sv) = SVs_TEMP;
677b06e3
GS
7176 EXTEND_MORTAL(1);
7177 PL_tmps_stack[++PL_tmps_ix] = sv;
79072805
LW
7178 return sv;
7179}
7180
954c1994
GS
7181/*
7182=for apidoc sv_2mortal
7183
d4236ebc
DM
7184Marks an existing SV as mortal. The SV will be destroyed "soon", either
7185by an explicit call to FREETMPS, or by an implicit call at places such as
37d2ac18
NC
7186statement boundaries. SvTEMP() is turned on which means that the SV's
7187string buffer can be "stolen" if this SV is copied. See also C<sv_newmortal>
7188and C<sv_mortalcopy>.
954c1994
GS
7189
7190=cut
7191*/
7192
79072805 7193SV *
864dbfa3 7194Perl_sv_2mortal(pTHX_ register SV *sv)
79072805 7195{
27da23d5 7196 dVAR;
79072805
LW
7197 if (!sv)
7198 return sv;
d689ffdd 7199 if (SvREADONLY(sv) && SvIMMORTAL(sv))
11162842 7200 return sv;
677b06e3
GS
7201 EXTEND_MORTAL(1);
7202 PL_tmps_stack[++PL_tmps_ix] = sv;
8990e307 7203 SvTEMP_on(sv);
79072805
LW
7204 return sv;
7205}
7206
954c1994
GS
7207/*
7208=for apidoc newSVpv
7209
7210Creates a new SV and copies a string into it. The reference count for the
7211SV is set to 1. If C<len> is zero, Perl will compute the length using
7212strlen(). For efficiency, consider using C<newSVpvn> instead.
7213
7214=cut
7215*/
7216
79072805 7217SV *
864dbfa3 7218Perl_newSVpv(pTHX_ const char *s, STRLEN len)
79072805 7219{
463ee0b2 7220 register SV *sv;
79072805 7221
4561caa4 7222 new_SV(sv);
616d8c9c 7223 sv_setpvn(sv,s,len ? len : strlen(s));
79072805
LW
7224 return sv;
7225}
7226
954c1994
GS
7227/*
7228=for apidoc newSVpvn
7229
7230Creates a new SV and copies a string into it. The reference count for the
1c846c1f 7231SV is set to 1. Note that if C<len> is zero, Perl will create a zero length
954c1994 7232string. You are responsible for ensuring that the source string is at least
9e09f5f2 7233C<len> bytes long. If the C<s> argument is NULL the new SV will be undefined.
954c1994
GS
7234
7235=cut
7236*/
7237
9da1e3b5 7238SV *
864dbfa3 7239Perl_newSVpvn(pTHX_ const char *s, STRLEN len)
9da1e3b5
MUN
7240{
7241 register SV *sv;
7242
7243 new_SV(sv);
9da1e3b5
MUN
7244 sv_setpvn(sv,s,len);
7245 return sv;
7246}
7247
bd08039b
NC
7248
7249/*
926f8064 7250=for apidoc newSVhek
bd08039b
NC
7251
7252Creates a new SV from the hash key structure. It will generate scalars that
5aaec2b4
NC
7253point to the shared string table where possible. Returns a new (undefined)
7254SV if the hek is NULL.
bd08039b
NC
7255
7256=cut
7257*/
7258
7259SV *
c1b02ed8 7260Perl_newSVhek(pTHX_ const HEK *hek)
bd08039b 7261{
5aaec2b4
NC
7262 if (!hek) {
7263 SV *sv;
7264
7265 new_SV(sv);
7266 return sv;
7267 }
7268
bd08039b
NC
7269 if (HEK_LEN(hek) == HEf_SVKEY) {
7270 return newSVsv(*(SV**)HEK_KEY(hek));
7271 } else {
7272 const int flags = HEK_FLAGS(hek);
7273 if (flags & HVhek_WASUTF8) {
7274 /* Trouble :-)
7275 Andreas would like keys he put in as utf8 to come back as utf8
7276 */
7277 STRLEN utf8_len = HEK_LEN(hek);
b64e5050
AL
7278 const U8 *as_utf8 = bytes_to_utf8 ((U8*)HEK_KEY(hek), &utf8_len);
7279 SV * const sv = newSVpvn ((const char*)as_utf8, utf8_len);
bd08039b
NC
7280
7281 SvUTF8_on (sv);
7282 Safefree (as_utf8); /* bytes_to_utf8() allocates a new string */
7283 return sv;
7284 } else if (flags & HVhek_REHASH) {
7285 /* We don't have a pointer to the hv, so we have to replicate the
7286 flag into every HEK. This hv is using custom a hasing
7287 algorithm. Hence we can't return a shared string scalar, as
7288 that would contain the (wrong) hash value, and might get passed
7289 into an hv routine with a regular hash */
7290
b64e5050 7291 SV * const sv = newSVpvn (HEK_KEY(hek), HEK_LEN(hek));
bd08039b
NC
7292 if (HEK_UTF8(hek))
7293 SvUTF8_on (sv);
7294 return sv;
7295 }
7296 /* This will be overwhelminly the most common case. */
7297 return newSVpvn_share(HEK_KEY(hek),
7298 (HEK_UTF8(hek) ? -HEK_LEN(hek) : HEK_LEN(hek)),
7299 HEK_HASH(hek));
7300 }
7301}
7302
1c846c1f
NIS
7303/*
7304=for apidoc newSVpvn_share
7305
3f7c398e 7306Creates a new SV with its SvPVX_const pointing to a shared string in the string
645c22ef
DM
7307table. If the string does not already exist in the table, it is created
7308first. Turns on READONLY and FAKE. The string's hash is stored in the UV
7309slot of the SV; if the C<hash> parameter is non-zero, that value is used;
7310otherwise the hash is computed. The idea here is that as the string table
3f7c398e 7311is used for shared hash keys these strings will have SvPVX_const == HeKEY and
645c22ef 7312hash lookup will avoid string compare.
1c846c1f
NIS
7313
7314=cut
7315*/
7316
7317SV *
c3654f1a 7318Perl_newSVpvn_share(pTHX_ const char *src, I32 len, U32 hash)
1c846c1f
NIS
7319{
7320 register SV *sv;
c3654f1a
IH
7321 bool is_utf8 = FALSE;
7322 if (len < 0) {
77caf834 7323 STRLEN tmplen = -len;
c3654f1a 7324 is_utf8 = TRUE;
75a54232 7325 /* See the note in hv.c:hv_fetch() --jhi */
e1ec3a88 7326 src = (char*)bytes_from_utf8((const U8*)src, &tmplen, &is_utf8);
75a54232
JH
7327 len = tmplen;
7328 }
1c846c1f 7329 if (!hash)
5afd6d42 7330 PERL_HASH(hash, src, len);
1c846c1f 7331 new_SV(sv);
bdd68bc3 7332 sv_upgrade(sv, SVt_PV);
f880fe2f 7333 SvPV_set(sv, sharepvn(src, is_utf8?-len:len, hash));
b162af07 7334 SvCUR_set(sv, len);
b162af07 7335 SvLEN_set(sv, 0);
1c846c1f
NIS
7336 SvREADONLY_on(sv);
7337 SvFAKE_on(sv);
7338 SvPOK_on(sv);
c3654f1a
IH
7339 if (is_utf8)
7340 SvUTF8_on(sv);
1c846c1f
NIS
7341 return sv;
7342}
7343
645c22ef 7344
cea2e8a9 7345#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
7346
7347/* pTHX_ magic can't cope with varargs, so this is a no-context
7348 * version of the main function, (which may itself be aliased to us).
7349 * Don't access this version directly.
7350 */
7351
46fc3d4c 7352SV *
cea2e8a9 7353Perl_newSVpvf_nocontext(const char* pat, ...)
46fc3d4c 7354{
cea2e8a9 7355 dTHX;
46fc3d4c 7356 register SV *sv;
7357 va_list args;
46fc3d4c 7358 va_start(args, pat);
c5be433b 7359 sv = vnewSVpvf(pat, &args);
46fc3d4c 7360 va_end(args);
7361 return sv;
7362}
cea2e8a9 7363#endif
46fc3d4c 7364
954c1994
GS
7365/*
7366=for apidoc newSVpvf
7367
645c22ef 7368Creates a new SV and initializes it with the string formatted like
954c1994
GS
7369C<sprintf>.
7370
7371=cut
7372*/
7373
cea2e8a9
GS
7374SV *
7375Perl_newSVpvf(pTHX_ const char* pat, ...)
7376{
7377 register SV *sv;
7378 va_list args;
cea2e8a9 7379 va_start(args, pat);
c5be433b 7380 sv = vnewSVpvf(pat, &args);
cea2e8a9
GS
7381 va_end(args);
7382 return sv;
7383}
46fc3d4c 7384
645c22ef
DM
7385/* backend for newSVpvf() and newSVpvf_nocontext() */
7386
79072805 7387SV *
c5be433b
GS
7388Perl_vnewSVpvf(pTHX_ const char* pat, va_list* args)
7389{
7390 register SV *sv;
7391 new_SV(sv);
7392 sv_vsetpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
7393 return sv;
7394}
7395
954c1994
GS
7396/*
7397=for apidoc newSVnv
7398
7399Creates a new SV and copies a floating point value into it.
7400The reference count for the SV is set to 1.
7401
7402=cut
7403*/
7404
c5be433b 7405SV *
65202027 7406Perl_newSVnv(pTHX_ NV n)
79072805 7407{
463ee0b2 7408 register SV *sv;
79072805 7409
4561caa4 7410 new_SV(sv);
79072805
LW
7411 sv_setnv(sv,n);
7412 return sv;
7413}
7414
954c1994
GS
7415/*
7416=for apidoc newSViv
7417
7418Creates a new SV and copies an integer into it. The reference count for the
7419SV is set to 1.
7420
7421=cut
7422*/
7423
79072805 7424SV *
864dbfa3 7425Perl_newSViv(pTHX_ IV i)
79072805 7426{
463ee0b2 7427 register SV *sv;
79072805 7428
4561caa4 7429 new_SV(sv);
79072805
LW
7430 sv_setiv(sv,i);
7431 return sv;
7432}
7433
954c1994 7434/*
1a3327fb
JH
7435=for apidoc newSVuv
7436
7437Creates a new SV and copies an unsigned integer into it.
7438The reference count for the SV is set to 1.
7439
7440=cut
7441*/
7442
7443SV *
7444Perl_newSVuv(pTHX_ UV u)
7445{
7446 register SV *sv;
7447
7448 new_SV(sv);
7449 sv_setuv(sv,u);
7450 return sv;
7451}
7452
7453/*
954c1994
GS
7454=for apidoc newRV_noinc
7455
7456Creates an RV wrapper for an SV. The reference count for the original
7457SV is B<not> incremented.
7458
7459=cut
7460*/
7461
2304df62 7462SV *
864dbfa3 7463Perl_newRV_noinc(pTHX_ SV *tmpRef)
2304df62
AD
7464{
7465 register SV *sv;
7466
4561caa4 7467 new_SV(sv);
2304df62 7468 sv_upgrade(sv, SVt_RV);
76e3520e 7469 SvTEMP_off(tmpRef);
b162af07 7470 SvRV_set(sv, tmpRef);
2304df62 7471 SvROK_on(sv);
2304df62
AD
7472 return sv;
7473}
7474
ff276b08 7475/* newRV_inc is the official function name to use now.
645c22ef
DM
7476 * newRV_inc is in fact #defined to newRV in sv.h
7477 */
7478
5f05dabc 7479SV *
864dbfa3 7480Perl_newRV(pTHX_ SV *tmpRef)
5f05dabc 7481{
5f6447b6 7482 return newRV_noinc(SvREFCNT_inc(tmpRef));
5f05dabc 7483}
5f05dabc 7484
954c1994
GS
7485/*
7486=for apidoc newSVsv
7487
7488Creates a new SV which is an exact duplicate of the original SV.
645c22ef 7489(Uses C<sv_setsv>).
954c1994
GS
7490
7491=cut
7492*/
7493
79072805 7494SV *
864dbfa3 7495Perl_newSVsv(pTHX_ register SV *old)
79072805 7496{
463ee0b2 7497 register SV *sv;
79072805
LW
7498
7499 if (!old)
7500 return Nullsv;
8990e307 7501 if (SvTYPE(old) == SVTYPEMASK) {
0453d815 7502 if (ckWARN_d(WARN_INTERNAL))
9014280d 7503 Perl_warner(aTHX_ packWARN(WARN_INTERNAL), "semi-panic: attempt to dup freed string");
79072805
LW
7504 return Nullsv;
7505 }
4561caa4 7506 new_SV(sv);
e90aabeb
NC
7507 /* SV_GMAGIC is the default for sv_setv()
7508 SV_NOSTEAL prevents TEMP buffers being, well, stolen, and saves games
7509 with SvTEMP_off and SvTEMP_on round a call to sv_setsv. */
7510 sv_setsv_flags(sv, old, SV_GMAGIC | SV_NOSTEAL);
463ee0b2 7511 return sv;
79072805
LW
7512}
7513
645c22ef
DM
7514/*
7515=for apidoc sv_reset
7516
7517Underlying implementation for the C<reset> Perl function.
7518Note that the perl-level function is vaguely deprecated.
7519
7520=cut
7521*/
7522
79072805 7523void
e1ec3a88 7524Perl_sv_reset(pTHX_ register const char *s, HV *stash)
79072805 7525{
27da23d5 7526 dVAR;
4802d5d7 7527 char todo[PERL_UCHAR_MAX+1];
79072805 7528
49d8d3a1
MB
7529 if (!stash)
7530 return;
7531
79072805 7532 if (!*s) { /* reset ?? searches */
aec46f14 7533 MAGIC * const mg = mg_find((SV *)stash, PERL_MAGIC_symtab);
8d2f4536
NC
7534 if (mg) {
7535 PMOP *pm = (PMOP *) mg->mg_obj;
7536 while (pm) {
7537 pm->op_pmdynflags &= ~PMdf_USED;
7538 pm = pm->op_pmnext;
7539 }
79072805
LW
7540 }
7541 return;
7542 }
7543
7544 /* reset variables */
7545
7546 if (!HvARRAY(stash))
7547 return;
463ee0b2
LW
7548
7549 Zero(todo, 256, char);
79072805 7550 while (*s) {
b464bac0
AL
7551 I32 max;
7552 I32 i = (unsigned char)*s;
79072805
LW
7553 if (s[1] == '-') {
7554 s += 2;
7555 }
4802d5d7 7556 max = (unsigned char)*s++;
79072805 7557 for ( ; i <= max; i++) {
463ee0b2
LW
7558 todo[i] = 1;
7559 }
a0d0e21e 7560 for (i = 0; i <= (I32) HvMAX(stash); i++) {
b464bac0 7561 HE *entry;
79072805 7562 for (entry = HvARRAY(stash)[i];
9e35f4b3
GS
7563 entry;
7564 entry = HeNEXT(entry))
7565 {
b464bac0
AL
7566 register GV *gv;
7567 register SV *sv;
7568
1edc1566 7569 if (!todo[(U8)*HeKEY(entry)])
463ee0b2 7570 continue;
1edc1566 7571 gv = (GV*)HeVAL(entry);
79072805 7572 sv = GvSV(gv);
e203899d
NC
7573 if (sv) {
7574 if (SvTHINKFIRST(sv)) {
7575 if (!SvREADONLY(sv) && SvROK(sv))
7576 sv_unref(sv);
7577 /* XXX Is this continue a bug? Why should THINKFIRST
7578 exempt us from resetting arrays and hashes? */
7579 continue;
7580 }
7581 SvOK_off(sv);
7582 if (SvTYPE(sv) >= SVt_PV) {
7583 SvCUR_set(sv, 0);
7584 if (SvPVX_const(sv) != Nullch)
7585 *SvPVX(sv) = '\0';
7586 SvTAINT(sv);
7587 }
79072805
LW
7588 }
7589 if (GvAV(gv)) {
7590 av_clear(GvAV(gv));
7591 }
bfcb3514 7592 if (GvHV(gv) && !HvNAME_get(GvHV(gv))) {
463ee0b2 7593 hv_clear(GvHV(gv));
2f42fcb0 7594#ifndef PERL_MICRO
fa6a1c44 7595#ifdef USE_ENVIRON_ARRAY
4efc5df6
GS
7596 if (gv == PL_envgv
7597# ifdef USE_ITHREADS
7598 && PL_curinterp == aTHX
7599# endif
7600 )
7601 {
79072805 7602 environ[0] = Nullch;
4efc5df6 7603 }
a0d0e21e 7604#endif
2f42fcb0 7605#endif /* !PERL_MICRO */
79072805
LW
7606 }
7607 }
7608 }
7609 }
7610}
7611
645c22ef
DM
7612/*
7613=for apidoc sv_2io
7614
7615Using various gambits, try to get an IO from an SV: the IO slot if it's a
7616GV; or the recursive result if we're an RV; or the IO slot of the symbol
7617named after the PV if we're a string.
7618
7619=cut
7620*/
7621
46fc3d4c 7622IO*
864dbfa3 7623Perl_sv_2io(pTHX_ SV *sv)
46fc3d4c 7624{
7625 IO* io;
7626 GV* gv;
7627
7628 switch (SvTYPE(sv)) {
7629 case SVt_PVIO:
7630 io = (IO*)sv;
7631 break;
7632 case SVt_PVGV:
7633 gv = (GV*)sv;
7634 io = GvIO(gv);
7635 if (!io)
cea2e8a9 7636 Perl_croak(aTHX_ "Bad filehandle: %s", GvNAME(gv));
46fc3d4c 7637 break;
7638 default:
7639 if (!SvOK(sv))
cea2e8a9 7640 Perl_croak(aTHX_ PL_no_usym, "filehandle");
46fc3d4c 7641 if (SvROK(sv))
7642 return sv_2io(SvRV(sv));
7a5fd60d 7643 gv = gv_fetchsv(sv, FALSE, SVt_PVIO);
46fc3d4c 7644 if (gv)
7645 io = GvIO(gv);
7646 else
7647 io = 0;
7648 if (!io)
35c1215d 7649 Perl_croak(aTHX_ "Bad filehandle: %"SVf, sv);
46fc3d4c 7650 break;
7651 }
7652 return io;
7653}
7654
645c22ef
DM
7655/*
7656=for apidoc sv_2cv
7657
7658Using various gambits, try to get a CV from an SV; in addition, try if
7659possible to set C<*st> and C<*gvp> to the stash and GV associated with it.
7660
7661=cut
7662*/
7663
79072805 7664CV *
864dbfa3 7665Perl_sv_2cv(pTHX_ SV *sv, HV **st, GV **gvp, I32 lref)
79072805 7666{
27da23d5 7667 dVAR;
c04a4dfe
JH
7668 GV *gv = Nullgv;
7669 CV *cv = Nullcv;
79072805
LW
7670
7671 if (!sv)
93a17b20 7672 return *gvp = Nullgv, Nullcv;
79072805 7673 switch (SvTYPE(sv)) {
79072805
LW
7674 case SVt_PVCV:
7675 *st = CvSTASH(sv);
7676 *gvp = Nullgv;
7677 return (CV*)sv;
7678 case SVt_PVHV:
7679 case SVt_PVAV:
7680 *gvp = Nullgv;
7681 return Nullcv;
8990e307
LW
7682 case SVt_PVGV:
7683 gv = (GV*)sv;
a0d0e21e 7684 *gvp = gv;
8990e307
LW
7685 *st = GvESTASH(gv);
7686 goto fix_gv;
7687
79072805 7688 default:
5b295bef 7689 SvGETMAGIC(sv);
a0d0e21e 7690 if (SvROK(sv)) {
f5284f61
IZ
7691 SV **sp = &sv; /* Used in tryAMAGICunDEREF macro. */
7692 tryAMAGICunDEREF(to_cv);
7693
62f274bf
GS
7694 sv = SvRV(sv);
7695 if (SvTYPE(sv) == SVt_PVCV) {
7696 cv = (CV*)sv;
7697 *gvp = Nullgv;
7698 *st = CvSTASH(cv);
7699 return cv;
7700 }
7701 else if(isGV(sv))
7702 gv = (GV*)sv;
7703 else
cea2e8a9 7704 Perl_croak(aTHX_ "Not a subroutine reference");
a0d0e21e 7705 }
62f274bf 7706 else if (isGV(sv))
79072805
LW
7707 gv = (GV*)sv;
7708 else
7a5fd60d 7709 gv = gv_fetchsv(sv, lref, SVt_PVCV);
79072805
LW
7710 *gvp = gv;
7711 if (!gv)
7712 return Nullcv;
7713 *st = GvESTASH(gv);
8990e307 7714 fix_gv:
8ebc5c01 7715 if (lref && !GvCVu(gv)) {
4633a7c4 7716 SV *tmpsv;
748a9306 7717 ENTER;
4633a7c4 7718 tmpsv = NEWSV(704,0);
16660edb 7719 gv_efullname3(tmpsv, gv, Nullch);
f6ec51f7
GS
7720 /* XXX this is probably not what they think they're getting.
7721 * It has the same effect as "sub name;", i.e. just a forward
7722 * declaration! */
774d564b 7723 newSUB(start_subparse(FALSE, 0),
4633a7c4
LW
7724 newSVOP(OP_CONST, 0, tmpsv),
7725 Nullop,
8990e307 7726 Nullop);
748a9306 7727 LEAVE;
8ebc5c01 7728 if (!GvCVu(gv))
35c1215d
NC
7729 Perl_croak(aTHX_ "Unable to create sub named \"%"SVf"\"",
7730 sv);
8990e307 7731 }
8ebc5c01 7732 return GvCVu(gv);
79072805
LW
7733 }
7734}
7735
c461cf8f
JH
7736/*
7737=for apidoc sv_true
7738
7739Returns true if the SV has a true value by Perl's rules.
645c22ef
DM
7740Use the C<SvTRUE> macro instead, which may call C<sv_true()> or may
7741instead use an in-line version.
c461cf8f
JH
7742
7743=cut
7744*/
7745
79072805 7746I32
864dbfa3 7747Perl_sv_true(pTHX_ register SV *sv)
79072805 7748{
8990e307
LW
7749 if (!sv)
7750 return 0;
79072805 7751 if (SvPOK(sv)) {
e1ec3a88 7752 const register XPV* tXpv;
4e35701f 7753 if ((tXpv = (XPV*)SvANY(sv)) &&
c2f1de04 7754 (tXpv->xpv_cur > 1 ||
339049b0 7755 (tXpv->xpv_cur && *sv->sv_u.svu_pv != '0')))
79072805
LW
7756 return 1;
7757 else
7758 return 0;
7759 }
7760 else {
7761 if (SvIOK(sv))
463ee0b2 7762 return SvIVX(sv) != 0;
79072805
LW
7763 else {
7764 if (SvNOK(sv))
463ee0b2 7765 return SvNVX(sv) != 0.0;
79072805 7766 else
463ee0b2 7767 return sv_2bool(sv);
79072805
LW
7768 }
7769 }
7770}
79072805 7771
645c22ef
DM
7772/*
7773=for apidoc sv_iv
7774
7775A private implementation of the C<SvIVx> macro for compilers which can't
7776cope with complex macro expressions. Always use the macro instead.
7777
7778=cut
7779*/
7780
ff68c719 7781IV
864dbfa3 7782Perl_sv_iv(pTHX_ register SV *sv)
85e6fe83 7783{
25da4f38
IZ
7784 if (SvIOK(sv)) {
7785 if (SvIsUV(sv))
7786 return (IV)SvUVX(sv);
ff68c719 7787 return SvIVX(sv);
25da4f38 7788 }
ff68c719 7789 return sv_2iv(sv);
85e6fe83 7790}
85e6fe83 7791
645c22ef
DM
7792/*
7793=for apidoc sv_uv
7794
7795A private implementation of the C<SvUVx> macro for compilers which can't
7796cope with complex macro expressions. Always use the macro instead.
7797
7798=cut
7799*/
7800
ff68c719 7801UV
864dbfa3 7802Perl_sv_uv(pTHX_ register SV *sv)
ff68c719 7803{
25da4f38
IZ
7804 if (SvIOK(sv)) {
7805 if (SvIsUV(sv))
7806 return SvUVX(sv);
7807 return (UV)SvIVX(sv);
7808 }
ff68c719 7809 return sv_2uv(sv);
7810}
85e6fe83 7811
645c22ef
DM
7812/*
7813=for apidoc sv_nv
7814
7815A private implementation of the C<SvNVx> macro for compilers which can't
7816cope with complex macro expressions. Always use the macro instead.
7817
7818=cut
7819*/
7820
65202027 7821NV
864dbfa3 7822Perl_sv_nv(pTHX_ register SV *sv)
79072805 7823{
ff68c719 7824 if (SvNOK(sv))
7825 return SvNVX(sv);
7826 return sv_2nv(sv);
79072805 7827}
79072805 7828
09540bc3
JH
7829/* sv_pv() is now a macro using SvPV_nolen();
7830 * this function provided for binary compatibility only
7831 */
7832
7833char *
7834Perl_sv_pv(pTHX_ SV *sv)
7835{
09540bc3
JH
7836 if (SvPOK(sv))
7837 return SvPVX(sv);
7838
93524f2b 7839 return sv_2pv(sv, 0);
09540bc3
JH
7840}
7841
645c22ef
DM
7842/*
7843=for apidoc sv_pv
7844
baca2b92 7845Use the C<SvPV_nolen> macro instead
645c22ef 7846
645c22ef
DM
7847=for apidoc sv_pvn
7848
7849A private implementation of the C<SvPV> macro for compilers which can't
7850cope with complex macro expressions. Always use the macro instead.
7851
7852=cut
7853*/
7854
1fa8b10d 7855char *
864dbfa3 7856Perl_sv_pvn(pTHX_ SV *sv, STRLEN *lp)
79072805 7857{
85e6fe83
LW
7858 if (SvPOK(sv)) {
7859 *lp = SvCUR(sv);
a0d0e21e 7860 return SvPVX(sv);
85e6fe83 7861 }
463ee0b2 7862 return sv_2pv(sv, lp);
79072805 7863}
79072805 7864
6e9d1081
NC
7865
7866char *
7867Perl_sv_pvn_nomg(pTHX_ register SV *sv, STRLEN *lp)
7868{
7869 if (SvPOK(sv)) {
7870 *lp = SvCUR(sv);
7871 return SvPVX(sv);
7872 }
7873 return sv_2pv_flags(sv, lp, 0);
7874}
7875
09540bc3
JH
7876/* sv_pvn_force() is now a macro using Perl_sv_pvn_force_flags();
7877 * this function provided for binary compatibility only
7878 */
7879
7880char *
7881Perl_sv_pvn_force(pTHX_ SV *sv, STRLEN *lp)
7882{
7883 return sv_pvn_force_flags(sv, lp, SV_GMAGIC);
7884}
7885
c461cf8f
JH
7886/*
7887=for apidoc sv_pvn_force
7888
7889Get a sensible string out of the SV somehow.
645c22ef
DM
7890A private implementation of the C<SvPV_force> macro for compilers which
7891can't cope with complex macro expressions. Always use the macro instead.
c461cf8f 7892
8d6d96c1
HS
7893=for apidoc sv_pvn_force_flags
7894
7895Get a sensible string out of the SV somehow.
7896If C<flags> has C<SV_GMAGIC> bit set, will C<mg_get> on C<sv> if
7897appropriate, else not. C<sv_pvn_force> and C<sv_pvn_force_nomg> are
7898implemented in terms of this function.
645c22ef
DM
7899You normally want to use the various wrapper macros instead: see
7900C<SvPV_force> and C<SvPV_force_nomg>
8d6d96c1
HS
7901
7902=cut
7903*/
7904
7905char *
7906Perl_sv_pvn_force_flags(pTHX_ SV *sv, STRLEN *lp, I32 flags)
7907{
a0d0e21e 7908
6fc92669 7909 if (SvTHINKFIRST(sv) && !SvROK(sv))
765f542d 7910 sv_force_normal_flags(sv, 0);
1c846c1f 7911
a0d0e21e 7912 if (SvPOK(sv)) {
13c5b33c
NC
7913 if (lp)
7914 *lp = SvCUR(sv);
a0d0e21e
LW
7915 }
7916 else {
a3b680e6 7917 char *s;
13c5b33c
NC
7918 STRLEN len;
7919
4d84ee25 7920 if (SvREADONLY(sv) && !(flags & SV_MUTABLE_RETURN)) {
b64e5050 7921 const char * const ref = sv_reftype(sv,0);
4d84ee25
NC
7922 if (PL_op)
7923 Perl_croak(aTHX_ "Can't coerce readonly %s to string in %s",
b64e5050 7924 ref, OP_NAME(PL_op));
4d84ee25 7925 else
b64e5050 7926 Perl_croak(aTHX_ "Can't coerce readonly %s to string", ref);
4d84ee25 7927 }
b64e5050 7928 if (SvTYPE(sv) > SVt_PVLV && SvTYPE(sv) != SVt_PVFM)
cea2e8a9 7929 Perl_croak(aTHX_ "Can't coerce %s to string in %s", sv_reftype(sv,0),
53e06cf0 7930 OP_NAME(PL_op));
b64e5050 7931 s = sv_2pv_flags(sv, &len, flags);
13c5b33c
NC
7932 if (lp)
7933 *lp = len;
7934
3f7c398e 7935 if (s != SvPVX_const(sv)) { /* Almost, but not quite, sv_setpvn() */
a0d0e21e
LW
7936 if (SvROK(sv))
7937 sv_unref(sv);
862a34c6 7938 SvUPGRADE(sv, SVt_PV); /* Never FALSE */
a0d0e21e 7939 SvGROW(sv, len + 1);
706aa1c9 7940 Move(s,SvPVX(sv),len,char);
a0d0e21e
LW
7941 SvCUR_set(sv, len);
7942 *SvEND(sv) = '\0';
7943 }
7944 if (!SvPOK(sv)) {
7945 SvPOK_on(sv); /* validate pointer */
7946 SvTAINT(sv);
1d7c1841 7947 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2pv(%s)\n",
3f7c398e 7948 PTR2UV(sv),SvPVX_const(sv)));
a0d0e21e
LW
7949 }
7950 }
4d84ee25 7951 return SvPVX_mutable(sv);
a0d0e21e
LW
7952}
7953
09540bc3
JH
7954/* sv_pvbyte () is now a macro using Perl_sv_2pv_flags();
7955 * this function provided for binary compatibility only
7956 */
7957
7958char *
7959Perl_sv_pvbyte(pTHX_ SV *sv)
7960{
7961 sv_utf8_downgrade(sv,0);
7962 return sv_pv(sv);
7963}
7964
645c22ef
DM
7965/*
7966=for apidoc sv_pvbyte
7967
baca2b92 7968Use C<SvPVbyte_nolen> instead.
645c22ef 7969
645c22ef
DM
7970=for apidoc sv_pvbyten
7971
7972A private implementation of the C<SvPVbyte> macro for compilers
7973which can't cope with complex macro expressions. Always use the macro
7974instead.
7975
7976=cut
7977*/
7978
7340a771
GS
7979char *
7980Perl_sv_pvbyten(pTHX_ SV *sv, STRLEN *lp)
7981{
ffebcc3e 7982 sv_utf8_downgrade(sv,0);
7340a771
GS
7983 return sv_pvn(sv,lp);
7984}
7985
645c22ef
DM
7986/*
7987=for apidoc sv_pvbyten_force
7988
7989A private implementation of the C<SvPVbytex_force> macro for compilers
7990which can't cope with complex macro expressions. Always use the macro
7991instead.
7992
7993=cut
7994*/
7995
7340a771
GS
7996char *
7997Perl_sv_pvbyten_force(pTHX_ SV *sv, STRLEN *lp)
7998{
46ec2f14 7999 sv_pvn_force(sv,lp);
ffebcc3e 8000 sv_utf8_downgrade(sv,0);
46ec2f14
TS
8001 *lp = SvCUR(sv);
8002 return SvPVX(sv);
7340a771
GS
8003}
8004
09540bc3
JH
8005/* sv_pvutf8 () is now a macro using Perl_sv_2pv_flags();
8006 * this function provided for binary compatibility only
8007 */
8008
8009char *
8010Perl_sv_pvutf8(pTHX_ SV *sv)
8011{
8012 sv_utf8_upgrade(sv);
8013 return sv_pv(sv);
8014}
8015
645c22ef
DM
8016/*
8017=for apidoc sv_pvutf8
8018
baca2b92 8019Use the C<SvPVutf8_nolen> macro instead
645c22ef 8020
645c22ef
DM
8021=for apidoc sv_pvutf8n
8022
8023A private implementation of the C<SvPVutf8> macro for compilers
8024which can't cope with complex macro expressions. Always use the macro
8025instead.
8026
8027=cut
8028*/
8029
7340a771
GS
8030char *
8031Perl_sv_pvutf8n(pTHX_ SV *sv, STRLEN *lp)
8032{
560a288e 8033 sv_utf8_upgrade(sv);
7340a771
GS
8034 return sv_pvn(sv,lp);
8035}
8036
c461cf8f
JH
8037/*
8038=for apidoc sv_pvutf8n_force
8039
645c22ef
DM
8040A private implementation of the C<SvPVutf8_force> macro for compilers
8041which can't cope with complex macro expressions. Always use the macro
8042instead.
c461cf8f
JH
8043
8044=cut
8045*/
8046
7340a771
GS
8047char *
8048Perl_sv_pvutf8n_force(pTHX_ SV *sv, STRLEN *lp)
8049{
46ec2f14 8050 sv_pvn_force(sv,lp);
560a288e 8051 sv_utf8_upgrade(sv);
46ec2f14
TS
8052 *lp = SvCUR(sv);
8053 return SvPVX(sv);
7340a771
GS
8054}
8055
c461cf8f
JH
8056/*
8057=for apidoc sv_reftype
8058
8059Returns a string describing what the SV is a reference to.
8060
8061=cut
8062*/
8063
1cb0ed9b 8064char *
bfed75c6 8065Perl_sv_reftype(pTHX_ const SV *sv, int ob)
a0d0e21e 8066{
07409e01
NC
8067 /* The fact that I don't need to downcast to char * everywhere, only in ?:
8068 inside return suggests a const propagation bug in g++. */
c86bf373 8069 if (ob && SvOBJECT(sv)) {
1b6737cc 8070 char * const name = HvNAME_get(SvSTASH(sv));
07409e01 8071 return name ? name : (char *) "__ANON__";
c86bf373 8072 }
a0d0e21e
LW
8073 else {
8074 switch (SvTYPE(sv)) {
8075 case SVt_NULL:
8076 case SVt_IV:
8077 case SVt_NV:
8078 case SVt_RV:
8079 case SVt_PV:
8080 case SVt_PVIV:
8081 case SVt_PVNV:
8082 case SVt_PVMG:
8083 case SVt_PVBM:
1cb0ed9b 8084 if (SvVOK(sv))
439cb1c4 8085 return "VSTRING";
a0d0e21e
LW
8086 if (SvROK(sv))
8087 return "REF";
8088 else
8089 return "SCALAR";
1cb0ed9b 8090
07409e01 8091 case SVt_PVLV: return (char *) (SvROK(sv) ? "REF"
be65207d
DM
8092 /* tied lvalues should appear to be
8093 * scalars for backwards compatitbility */
8094 : (LvTYPE(sv) == 't' || LvTYPE(sv) == 'T')
07409e01 8095 ? "SCALAR" : "LVALUE");
a0d0e21e
LW
8096 case SVt_PVAV: return "ARRAY";
8097 case SVt_PVHV: return "HASH";
8098 case SVt_PVCV: return "CODE";
8099 case SVt_PVGV: return "GLOB";
1d2dff63 8100 case SVt_PVFM: return "FORMAT";
27f9d8f3 8101 case SVt_PVIO: return "IO";
a0d0e21e
LW
8102 default: return "UNKNOWN";
8103 }
8104 }
8105}
8106
954c1994
GS
8107/*
8108=for apidoc sv_isobject
8109
8110Returns a boolean indicating whether the SV is an RV pointing to a blessed
8111object. If the SV is not an RV, or if the object is not blessed, then this
8112will return false.
8113
8114=cut
8115*/
8116
463ee0b2 8117int
864dbfa3 8118Perl_sv_isobject(pTHX_ SV *sv)
85e6fe83 8119{
68dc0745 8120 if (!sv)
8121 return 0;
5b295bef 8122 SvGETMAGIC(sv);
85e6fe83
LW
8123 if (!SvROK(sv))
8124 return 0;
8125 sv = (SV*)SvRV(sv);
8126 if (!SvOBJECT(sv))
8127 return 0;
8128 return 1;
8129}
8130
954c1994
GS
8131/*
8132=for apidoc sv_isa
8133
8134Returns a boolean indicating whether the SV is blessed into the specified
8135class. This does not check for subtypes; use C<sv_derived_from> to verify
8136an inheritance relationship.
8137
8138=cut
8139*/
8140
85e6fe83 8141int
864dbfa3 8142Perl_sv_isa(pTHX_ SV *sv, const char *name)
463ee0b2 8143{
bfcb3514 8144 const char *hvname;
68dc0745 8145 if (!sv)
8146 return 0;
5b295bef 8147 SvGETMAGIC(sv);
ed6116ce 8148 if (!SvROK(sv))
463ee0b2 8149 return 0;
ed6116ce
LW
8150 sv = (SV*)SvRV(sv);
8151 if (!SvOBJECT(sv))
463ee0b2 8152 return 0;
bfcb3514
NC
8153 hvname = HvNAME_get(SvSTASH(sv));
8154 if (!hvname)
e27ad1f2 8155 return 0;
463ee0b2 8156
bfcb3514 8157 return strEQ(hvname, name);
463ee0b2
LW
8158}
8159
954c1994
GS
8160/*
8161=for apidoc newSVrv
8162
8163Creates a new SV for the RV, C<rv>, to point to. If C<rv> is not an RV then
8164it will be upgraded to one. If C<classname> is non-null then the new SV will
8165be blessed in the specified package. The new SV is returned and its
8166reference count is 1.
8167
8168=cut
8169*/
8170
463ee0b2 8171SV*
864dbfa3 8172Perl_newSVrv(pTHX_ SV *rv, const char *classname)
463ee0b2 8173{
463ee0b2
LW
8174 SV *sv;
8175
4561caa4 8176 new_SV(sv);
51cf62d8 8177
765f542d 8178 SV_CHECK_THINKFIRST_COW_DROP(rv);
51cf62d8 8179 SvAMAGIC_off(rv);
51cf62d8 8180
0199fce9 8181 if (SvTYPE(rv) >= SVt_PVMG) {
a3b680e6 8182 const U32 refcnt = SvREFCNT(rv);
0199fce9
JD
8183 SvREFCNT(rv) = 0;
8184 sv_clear(rv);
8185 SvFLAGS(rv) = 0;
8186 SvREFCNT(rv) = refcnt;
8187 }
8188
51cf62d8 8189 if (SvTYPE(rv) < SVt_RV)
0199fce9
JD
8190 sv_upgrade(rv, SVt_RV);
8191 else if (SvTYPE(rv) > SVt_RV) {
8bd4d4c5 8192 SvPV_free(rv);
0199fce9
JD
8193 SvCUR_set(rv, 0);
8194 SvLEN_set(rv, 0);
8195 }
51cf62d8 8196
0c34ef67 8197 SvOK_off(rv);
b162af07 8198 SvRV_set(rv, sv);
ed6116ce 8199 SvROK_on(rv);
463ee0b2 8200
a0d0e21e 8201 if (classname) {
1b6737cc 8202 HV* const stash = gv_stashpv(classname, TRUE);
a0d0e21e
LW
8203 (void)sv_bless(rv, stash);
8204 }
8205 return sv;
8206}
8207
954c1994
GS
8208/*
8209=for apidoc sv_setref_pv
8210
8211Copies a pointer into a new SV, optionally blessing the SV. The C<rv>
8212argument will be upgraded to an RV. That RV will be modified to point to
8213the new SV. If the C<pv> argument is NULL then C<PL_sv_undef> will be placed
8214into the SV. The C<classname> argument indicates the package for the
8215blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8216will have a reference count of 1, and the RV will be returned.
954c1994
GS
8217
8218Do not use with other Perl types such as HV, AV, SV, CV, because those
8219objects will become corrupted by the pointer copy process.
8220
8221Note that C<sv_setref_pvn> copies the string while this copies the pointer.
8222
8223=cut
8224*/
8225
a0d0e21e 8226SV*
864dbfa3 8227Perl_sv_setref_pv(pTHX_ SV *rv, const char *classname, void *pv)
a0d0e21e 8228{
189b2af5 8229 if (!pv) {
3280af22 8230 sv_setsv(rv, &PL_sv_undef);
189b2af5
GS
8231 SvSETMAGIC(rv);
8232 }
a0d0e21e 8233 else
56431972 8234 sv_setiv(newSVrv(rv,classname), PTR2IV(pv));
a0d0e21e
LW
8235 return rv;
8236}
8237
954c1994
GS
8238/*
8239=for apidoc sv_setref_iv
8240
8241Copies an integer into a new SV, optionally blessing the SV. The C<rv>
8242argument will be upgraded to an RV. That RV will be modified to point to
8243the new SV. The C<classname> argument indicates the package for the
8244blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8245will have a reference count of 1, and the RV will be returned.
954c1994
GS
8246
8247=cut
8248*/
8249
a0d0e21e 8250SV*
864dbfa3 8251Perl_sv_setref_iv(pTHX_ SV *rv, const char *classname, IV iv)
a0d0e21e
LW
8252{
8253 sv_setiv(newSVrv(rv,classname), iv);
8254 return rv;
8255}
8256
954c1994 8257/*
e1c57cef
JH
8258=for apidoc sv_setref_uv
8259
8260Copies an unsigned integer into a new SV, optionally blessing the SV. The C<rv>
8261argument will be upgraded to an RV. That RV will be modified to point to
8262the new SV. The C<classname> argument indicates the package for the
8263blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8264will have a reference count of 1, and the RV will be returned.
e1c57cef
JH
8265
8266=cut
8267*/
8268
8269SV*
8270Perl_sv_setref_uv(pTHX_ SV *rv, const char *classname, UV uv)
8271{
8272 sv_setuv(newSVrv(rv,classname), uv);
8273 return rv;
8274}
8275
8276/*
954c1994
GS
8277=for apidoc sv_setref_nv
8278
8279Copies a double into a new SV, optionally blessing the SV. The C<rv>
8280argument will be upgraded to an RV. That RV will be modified to point to
8281the new SV. The C<classname> argument indicates the package for the
8282blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8283will have a reference count of 1, and the RV will be returned.
954c1994
GS
8284
8285=cut
8286*/
8287
a0d0e21e 8288SV*
65202027 8289Perl_sv_setref_nv(pTHX_ SV *rv, const char *classname, NV nv)
a0d0e21e
LW
8290{
8291 sv_setnv(newSVrv(rv,classname), nv);
8292 return rv;
8293}
463ee0b2 8294
954c1994
GS
8295/*
8296=for apidoc sv_setref_pvn
8297
8298Copies a string into a new SV, optionally blessing the SV. The length of the
8299string must be specified with C<n>. The C<rv> argument will be upgraded to
8300an RV. That RV will be modified to point to the new SV. The C<classname>
8301argument indicates the package for the blessing. Set C<classname> to
7a5fa8a2 8302C<Nullch> to avoid the blessing. The new SV will have a reference count
d34c2299 8303of 1, and the RV will be returned.
954c1994
GS
8304
8305Note that C<sv_setref_pv> copies the pointer while this copies the string.
8306
8307=cut
8308*/
8309
a0d0e21e 8310SV*
1b6737cc 8311Perl_sv_setref_pvn(pTHX_ SV *rv, const char *classname, const char *pv, STRLEN n)
a0d0e21e
LW
8312{
8313 sv_setpvn(newSVrv(rv,classname), pv, n);
463ee0b2
LW
8314 return rv;
8315}
8316
954c1994
GS
8317/*
8318=for apidoc sv_bless
8319
8320Blesses an SV into a specified package. The SV must be an RV. The package
8321must be designated by its stash (see C<gv_stashpv()>). The reference count
8322of the SV is unaffected.
8323
8324=cut
8325*/
8326
a0d0e21e 8327SV*
864dbfa3 8328Perl_sv_bless(pTHX_ SV *sv, HV *stash)
a0d0e21e 8329{
76e3520e 8330 SV *tmpRef;
a0d0e21e 8331 if (!SvROK(sv))
cea2e8a9 8332 Perl_croak(aTHX_ "Can't bless non-reference value");
76e3520e
GS
8333 tmpRef = SvRV(sv);
8334 if (SvFLAGS(tmpRef) & (SVs_OBJECT|SVf_READONLY)) {
8335 if (SvREADONLY(tmpRef))
cea2e8a9 8336 Perl_croak(aTHX_ PL_no_modify);
76e3520e
GS
8337 if (SvOBJECT(tmpRef)) {
8338 if (SvTYPE(tmpRef) != SVt_PVIO)
3280af22 8339 --PL_sv_objcount;
76e3520e 8340 SvREFCNT_dec(SvSTASH(tmpRef));
2e3febc6 8341 }
a0d0e21e 8342 }
76e3520e
GS
8343 SvOBJECT_on(tmpRef);
8344 if (SvTYPE(tmpRef) != SVt_PVIO)
3280af22 8345 ++PL_sv_objcount;
862a34c6 8346 SvUPGRADE(tmpRef, SVt_PVMG);
b162af07 8347 SvSTASH_set(tmpRef, (HV*)SvREFCNT_inc(stash));
a0d0e21e 8348
2e3febc6
CS
8349 if (Gv_AMG(stash))
8350 SvAMAGIC_on(sv);
8351 else
8352 SvAMAGIC_off(sv);
a0d0e21e 8353
1edbfb88
AB
8354 if(SvSMAGICAL(tmpRef))
8355 if(mg_find(tmpRef, PERL_MAGIC_ext) || mg_find(tmpRef, PERL_MAGIC_uvar))
8356 mg_set(tmpRef);
8357
8358
ecdeb87c 8359
a0d0e21e
LW
8360 return sv;
8361}
8362
645c22ef 8363/* Downgrades a PVGV to a PVMG.
645c22ef
DM
8364 */
8365
76e3520e 8366STATIC void
cea2e8a9 8367S_sv_unglob(pTHX_ SV *sv)
a0d0e21e 8368{
850fabdf
GS
8369 void *xpvmg;
8370
a0d0e21e
LW
8371 assert(SvTYPE(sv) == SVt_PVGV);
8372 SvFAKE_off(sv);
8373 if (GvGP(sv))
1edc1566 8374 gp_free((GV*)sv);
e826b3c7 8375 if (GvSTASH(sv)) {
e15faf7d 8376 sv_del_backref((SV*)GvSTASH(sv), sv);
e826b3c7
GS
8377 GvSTASH(sv) = Nullhv;
8378 }
14befaf4 8379 sv_unmagic(sv, PERL_MAGIC_glob);
a0d0e21e 8380 Safefree(GvNAME(sv));
a5f75d66 8381 GvMULTI_off(sv);
850fabdf
GS
8382
8383 /* need to keep SvANY(sv) in the right arena */
8384 xpvmg = new_XPVMG();
8385 StructCopy(SvANY(sv), xpvmg, XPVMG);
8386 del_XPVGV(SvANY(sv));
8387 SvANY(sv) = xpvmg;
8388
a0d0e21e
LW
8389 SvFLAGS(sv) &= ~SVTYPEMASK;
8390 SvFLAGS(sv) |= SVt_PVMG;
8391}
8392
954c1994 8393/*
840a7b70 8394=for apidoc sv_unref_flags
954c1994
GS
8395
8396Unsets the RV status of the SV, and decrements the reference count of
8397whatever was being referenced by the RV. This can almost be thought of
840a7b70
IZ
8398as a reversal of C<newSVrv>. The C<cflags> argument can contain
8399C<SV_IMMEDIATE_UNREF> to force the reference count to be decremented
8400(otherwise the decrementing is conditional on the reference count being
8401different from one or the reference being a readonly SV).
7889fe52 8402See C<SvROK_off>.
954c1994
GS
8403
8404=cut
8405*/
8406
ed6116ce 8407void
e15faf7d 8408Perl_sv_unref_flags(pTHX_ SV *ref, U32 flags)
ed6116ce 8409{
b64e5050 8410 SV* const target = SvRV(ref);
810b8aa5 8411
e15faf7d
NC
8412 if (SvWEAKREF(ref)) {
8413 sv_del_backref(target, ref);
8414 SvWEAKREF_off(ref);
8415 SvRV_set(ref, NULL);
810b8aa5
GS
8416 return;
8417 }
e15faf7d
NC
8418 SvRV_set(ref, NULL);
8419 SvROK_off(ref);
8420 /* You can't have a || SvREADONLY(target) here, as $a = $$a, where $a was
04ca4930 8421 assigned to as BEGIN {$a = \"Foo"} will fail. */
e15faf7d
NC
8422 if (SvREFCNT(target) != 1 || (flags & SV_IMMEDIATE_UNREF))
8423 SvREFCNT_dec(target);
840a7b70 8424 else /* XXX Hack, but hard to make $a=$a->[1] work otherwise */
e15faf7d 8425 sv_2mortal(target); /* Schedule for freeing later */
ed6116ce 8426}
8990e307 8427
840a7b70
IZ
8428/*
8429=for apidoc sv_unref
8430
8431Unsets the RV status of the SV, and decrements the reference count of
8432whatever was being referenced by the RV. This can almost be thought of
8433as a reversal of C<newSVrv>. This is C<sv_unref_flags> with the C<flag>
7889fe52 8434being zero. See C<SvROK_off>.
840a7b70
IZ
8435
8436=cut
8437*/
8438
8439void
8440Perl_sv_unref(pTHX_ SV *sv)
8441{
8442 sv_unref_flags(sv, 0);
8443}
8444
645c22ef
DM
8445/*
8446=for apidoc sv_taint
8447
8448Taint an SV. Use C<SvTAINTED_on> instead.
8449=cut
8450*/
8451
bbce6d69 8452void
864dbfa3 8453Perl_sv_taint(pTHX_ SV *sv)
bbce6d69 8454{
14befaf4 8455 sv_magic((sv), Nullsv, PERL_MAGIC_taint, Nullch, 0);
bbce6d69 8456}
8457
645c22ef
DM
8458/*
8459=for apidoc sv_untaint
8460
8461Untaint an SV. Use C<SvTAINTED_off> instead.
8462=cut
8463*/
8464
bbce6d69 8465void
864dbfa3 8466Perl_sv_untaint(pTHX_ SV *sv)
bbce6d69 8467{
13f57bf8 8468 if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
b64e5050 8469 MAGIC * const mg = mg_find(sv, PERL_MAGIC_taint);
36477c24 8470 if (mg)
565764a8 8471 mg->mg_len &= ~1;
36477c24 8472 }
bbce6d69 8473}
8474
645c22ef
DM
8475/*
8476=for apidoc sv_tainted
8477
8478Test an SV for taintedness. Use C<SvTAINTED> instead.
8479=cut
8480*/
8481
bbce6d69 8482bool
864dbfa3 8483Perl_sv_tainted(pTHX_ SV *sv)
bbce6d69 8484{
13f57bf8 8485 if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
a28509cc 8486 MAGIC * const mg = mg_find(sv, PERL_MAGIC_taint);
2ddb8a4f 8487 if (mg && (mg->mg_len & 1) )
36477c24 8488 return TRUE;
8489 }
8490 return FALSE;
bbce6d69 8491}
8492
09540bc3
JH
8493/*
8494=for apidoc sv_setpviv
8495
8496Copies an integer into the given SV, also updating its string value.
8497Does not handle 'set' magic. See C<sv_setpviv_mg>.
8498
8499=cut
8500*/
8501
8502void
8503Perl_sv_setpviv(pTHX_ SV *sv, IV iv)
8504{
8505 char buf[TYPE_CHARS(UV)];
8506 char *ebuf;
b64e5050 8507 char * const ptr = uiv_2buf(buf, iv, 0, 0, &ebuf);
09540bc3
JH
8508
8509 sv_setpvn(sv, ptr, ebuf - ptr);
8510}
8511
8512/*
8513=for apidoc sv_setpviv_mg
8514
8515Like C<sv_setpviv>, but also handles 'set' magic.
8516
8517=cut
8518*/
8519
8520void
8521Perl_sv_setpviv_mg(pTHX_ SV *sv, IV iv)
8522{
8523 char buf[TYPE_CHARS(UV)];
8524 char *ebuf;
b64e5050 8525 char * const ptr = uiv_2buf(buf, iv, 0, 0, &ebuf);
09540bc3
JH
8526
8527 sv_setpvn(sv, ptr, ebuf - ptr);
8528 SvSETMAGIC(sv);
8529}
8530
cea2e8a9 8531#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
8532
8533/* pTHX_ magic can't cope with varargs, so this is a no-context
8534 * version of the main function, (which may itself be aliased to us).
8535 * Don't access this version directly.
8536 */
8537
cea2e8a9
GS
8538void
8539Perl_sv_setpvf_nocontext(SV *sv, const char* pat, ...)
8540{
8541 dTHX;
8542 va_list args;
8543 va_start(args, pat);
c5be433b 8544 sv_vsetpvf(sv, pat, &args);
cea2e8a9
GS
8545 va_end(args);
8546}
8547
645c22ef
DM
8548/* pTHX_ magic can't cope with varargs, so this is a no-context
8549 * version of the main function, (which may itself be aliased to us).
8550 * Don't access this version directly.
8551 */
cea2e8a9
GS
8552
8553void
8554Perl_sv_setpvf_mg_nocontext(SV *sv, const char* pat, ...)
8555{
8556 dTHX;
8557 va_list args;
8558 va_start(args, pat);
c5be433b 8559 sv_vsetpvf_mg(sv, pat, &args);
cea2e8a9 8560 va_end(args);
cea2e8a9
GS
8561}
8562#endif
8563
954c1994
GS
8564/*
8565=for apidoc sv_setpvf
8566
bffc3d17
SH
8567Works like C<sv_catpvf> but copies the text into the SV instead of
8568appending it. Does not handle 'set' magic. See C<sv_setpvf_mg>.
954c1994
GS
8569
8570=cut
8571*/
8572
46fc3d4c 8573void
864dbfa3 8574Perl_sv_setpvf(pTHX_ SV *sv, const char* pat, ...)
46fc3d4c 8575{
8576 va_list args;
46fc3d4c 8577 va_start(args, pat);
c5be433b 8578 sv_vsetpvf(sv, pat, &args);
46fc3d4c 8579 va_end(args);
8580}
8581
bffc3d17
SH
8582/*
8583=for apidoc sv_vsetpvf
8584
8585Works like C<sv_vcatpvf> but copies the text into the SV instead of
8586appending it. Does not handle 'set' magic. See C<sv_vsetpvf_mg>.
8587
8588Usually used via its frontend C<sv_setpvf>.
8589
8590=cut
8591*/
645c22ef 8592
c5be433b
GS
8593void
8594Perl_sv_vsetpvf(pTHX_ SV *sv, const char* pat, va_list* args)
8595{
8596 sv_vsetpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
8597}
ef50df4b 8598
954c1994
GS
8599/*
8600=for apidoc sv_setpvf_mg
8601
8602Like C<sv_setpvf>, but also handles 'set' magic.
8603
8604=cut
8605*/
8606
ef50df4b 8607void
864dbfa3 8608Perl_sv_setpvf_mg(pTHX_ SV *sv, const char* pat, ...)
ef50df4b
GS
8609{
8610 va_list args;
ef50df4b 8611 va_start(args, pat);
c5be433b 8612 sv_vsetpvf_mg(sv, pat, &args);
ef50df4b 8613 va_end(args);
c5be433b
GS
8614}
8615
bffc3d17
SH
8616/*
8617=for apidoc sv_vsetpvf_mg
8618
8619Like C<sv_vsetpvf>, but also handles 'set' magic.
8620
8621Usually used via its frontend C<sv_setpvf_mg>.
8622
8623=cut
8624*/
645c22ef 8625
c5be433b
GS
8626void
8627Perl_sv_vsetpvf_mg(pTHX_ SV *sv, const char* pat, va_list* args)
8628{
8629 sv_vsetpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
ef50df4b
GS
8630 SvSETMAGIC(sv);
8631}
8632
cea2e8a9 8633#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
8634
8635/* pTHX_ magic can't cope with varargs, so this is a no-context
8636 * version of the main function, (which may itself be aliased to us).
8637 * Don't access this version directly.
8638 */
8639
cea2e8a9
GS
8640void
8641Perl_sv_catpvf_nocontext(SV *sv, const char* pat, ...)
8642{
8643 dTHX;
8644 va_list args;
8645 va_start(args, pat);
c5be433b 8646 sv_vcatpvf(sv, pat, &args);
cea2e8a9
GS
8647 va_end(args);
8648}
8649
645c22ef
DM
8650/* pTHX_ magic can't cope with varargs, so this is a no-context
8651 * version of the main function, (which may itself be aliased to us).
8652 * Don't access this version directly.
8653 */
8654
cea2e8a9
GS
8655void
8656Perl_sv_catpvf_mg_nocontext(SV *sv, const char* pat, ...)
8657{
8658 dTHX;
8659 va_list args;
8660 va_start(args, pat);
c5be433b 8661 sv_vcatpvf_mg(sv, pat, &args);
cea2e8a9 8662 va_end(args);
cea2e8a9
GS
8663}
8664#endif
8665
954c1994
GS
8666/*
8667=for apidoc sv_catpvf
8668
d5ce4a7c
GA
8669Processes its arguments like C<sprintf> and appends the formatted
8670output to an SV. If the appended data contains "wide" characters
8671(including, but not limited to, SVs with a UTF-8 PV formatted with %s,
8672and characters >255 formatted with %c), the original SV might get
bffc3d17 8673upgraded to UTF-8. Handles 'get' magic, but not 'set' magic. See
cdd94ca7
NC
8674C<sv_catpvf_mg>. If the original SV was UTF-8, the pattern should be
8675valid UTF-8; if the original SV was bytes, the pattern should be too.
954c1994 8676
d5ce4a7c 8677=cut */
954c1994 8678
46fc3d4c 8679void
864dbfa3 8680Perl_sv_catpvf(pTHX_ SV *sv, const char* pat, ...)
46fc3d4c 8681{
8682 va_list args;
46fc3d4c 8683 va_start(args, pat);
c5be433b 8684 sv_vcatpvf(sv, pat, &args);
46fc3d4c 8685 va_end(args);
8686}
8687
bffc3d17
SH
8688/*
8689=for apidoc sv_vcatpvf
8690
8691Processes its arguments like C<vsprintf> and appends the formatted output
8692to an SV. Does not handle 'set' magic. See C<sv_vcatpvf_mg>.
8693
8694Usually used via its frontend C<sv_catpvf>.
8695
8696=cut
8697*/
645c22ef 8698
ef50df4b 8699void
c5be433b
GS
8700Perl_sv_vcatpvf(pTHX_ SV *sv, const char* pat, va_list* args)
8701{
8702 sv_vcatpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
8703}
8704
954c1994
GS
8705/*
8706=for apidoc sv_catpvf_mg
8707
8708Like C<sv_catpvf>, but also handles 'set' magic.
8709
8710=cut
8711*/
8712
c5be433b 8713void
864dbfa3 8714Perl_sv_catpvf_mg(pTHX_ SV *sv, const char* pat, ...)
ef50df4b
GS
8715{
8716 va_list args;
ef50df4b 8717 va_start(args, pat);
c5be433b 8718 sv_vcatpvf_mg(sv, pat, &args);
ef50df4b 8719 va_end(args);
c5be433b
GS
8720}
8721
bffc3d17
SH
8722/*
8723=for apidoc sv_vcatpvf_mg
8724
8725Like C<sv_vcatpvf>, but also handles 'set' magic.
8726
8727Usually used via its frontend C<sv_catpvf_mg>.
8728
8729=cut
8730*/
645c22ef 8731
c5be433b
GS
8732void
8733Perl_sv_vcatpvf_mg(pTHX_ SV *sv, const char* pat, va_list* args)
8734{
8735 sv_vcatpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
ef50df4b
GS
8736 SvSETMAGIC(sv);
8737}
8738
954c1994
GS
8739/*
8740=for apidoc sv_vsetpvfn
8741
bffc3d17 8742Works like C<sv_vcatpvfn> but copies the text into the SV instead of
954c1994
GS
8743appending it.
8744
bffc3d17 8745Usually used via one of its frontends C<sv_vsetpvf> and C<sv_vsetpvf_mg>.
645c22ef 8746
954c1994
GS
8747=cut
8748*/
8749
46fc3d4c 8750void
7d5ea4e7 8751Perl_sv_vsetpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV **svargs, I32 svmax, bool *maybe_tainted)
46fc3d4c 8752{
8753 sv_setpvn(sv, "", 0);
7d5ea4e7 8754 sv_vcatpvfn(sv, pat, patlen, args, svargs, svmax, maybe_tainted);
46fc3d4c 8755}
8756
645c22ef
DM
8757/* private function for use in sv_vcatpvfn via the EXPECT_NUMBER macro */
8758
2d00ba3b 8759STATIC I32
9dd79c3f 8760S_expect_number(pTHX_ char** pattern)
211dfcf1
HS
8761{
8762 I32 var = 0;
8763 switch (**pattern) {
8764 case '1': case '2': case '3':
8765 case '4': case '5': case '6':
8766 case '7': case '8': case '9':
8767 while (isDIGIT(**pattern))
8768 var = var * 10 + (*(*pattern)++ - '0');
8769 }
8770 return var;
8771}
9dd79c3f 8772#define EXPECT_NUMBER(pattern, var) (var = S_expect_number(aTHX_ &pattern))
211dfcf1 8773
4151a5fe
IZ
8774static char *
8775F0convert(NV nv, char *endbuf, STRLEN *len)
8776{
a3b680e6 8777 const int neg = nv < 0;
4151a5fe 8778 UV uv;
4151a5fe
IZ
8779
8780 if (neg)
8781 nv = -nv;
8782 if (nv < UV_MAX) {
b464bac0 8783 char *p = endbuf;
4151a5fe 8784 nv += 0.5;
028f8eaa 8785 uv = (UV)nv;
4151a5fe
IZ
8786 if (uv & 1 && uv == nv)
8787 uv--; /* Round to even */
8788 do {
a3b680e6 8789 const unsigned dig = uv % 10;
4151a5fe
IZ
8790 *--p = '0' + dig;
8791 } while (uv /= 10);
8792 if (neg)
8793 *--p = '-';
8794 *len = endbuf - p;
8795 return p;
8796 }
8797 return Nullch;
8798}
8799
8800
954c1994
GS
8801/*
8802=for apidoc sv_vcatpvfn
8803
8804Processes its arguments like C<vsprintf> and appends the formatted output
8805to an SV. Uses an array of SVs if the C style variable argument list is
8806missing (NULL). When running with taint checks enabled, indicates via
8807C<maybe_tainted> if results are untrustworthy (often due to the use of
8808locales).
8809
bffc3d17 8810Usually used via one of its frontends C<sv_vcatpvf> and C<sv_vcatpvf_mg>.
645c22ef 8811
954c1994
GS
8812=cut
8813*/
8814
8896765a
RB
8815
8816#define VECTORIZE_ARGS vecsv = va_arg(*args, SV*);\
8817 vecstr = (U8*)SvPV_const(vecsv,veclen);\
8818 vec_utf8 = DO_UTF8(vecsv);
8819
1ef29b0e
RGS
8820/* XXX maybe_tainted is never assigned to, so the doc above is lying. */
8821
46fc3d4c 8822void
7d5ea4e7 8823Perl_sv_vcatpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV **svargs, I32 svmax, bool *maybe_tainted)
46fc3d4c 8824{
8825 char *p;
8826 char *q;
a3b680e6 8827 const char *patend;
fc36a67e 8828 STRLEN origlen;
46fc3d4c 8829 I32 svix = 0;
27da23d5 8830 static const char nullstr[] = "(null)";
9c5ffd7c 8831 SV *argsv = Nullsv;
b464bac0
AL
8832 bool has_utf8 = DO_UTF8(sv); /* has the result utf8? */
8833 const bool pat_utf8 = has_utf8; /* the pattern is in utf8? */
db79b45b 8834 SV *nsv = Nullsv;
4151a5fe
IZ
8835 /* Times 4: a decimal digit takes more than 3 binary digits.
8836 * NV_DIG: mantissa takes that many decimal digits.
8837 * Plus 32: Playing safe. */
8838 char ebuf[IV_DIG * 4 + NV_DIG + 32];
8839 /* large enough for "%#.#f" --chip */
8840 /* what about long double NVs? --jhi */
db79b45b 8841
53c1dcc0
AL
8842 PERL_UNUSED_ARG(maybe_tainted);
8843
46fc3d4c 8844 /* no matter what, this is a string now */
fc36a67e 8845 (void)SvPV_force(sv, origlen);
46fc3d4c 8846
8896765a 8847 /* special-case "", "%s", and "%-p" (SVf - see below) */
46fc3d4c 8848 if (patlen == 0)
8849 return;
0dbb1585 8850 if (patlen == 2 && pat[0] == '%' && pat[1] == 's') {
2d03de9c
AL
8851 if (args) {
8852 const char * const s = va_arg(*args, char*);
8853 sv_catpv(sv, s ? s : nullstr);
8854 }
8855 else if (svix < svmax) {
8856 sv_catsv(sv, *svargs);
8857 if (DO_UTF8(*svargs))
8858 SvUTF8_on(sv);
8859 }
8860 return;
0dbb1585 8861 }
8896765a
RB
8862 if (args && patlen == 3 && pat[0] == '%' &&
8863 pat[1] == '-' && pat[2] == 'p') {
8864 argsv = va_arg(*args, SV*);
8865 sv_catsv(sv, argsv);
8866 if (DO_UTF8(argsv))
8867 SvUTF8_on(sv);
8868 return;
46fc3d4c 8869 }
8870
1d917b39 8871#ifndef USE_LONG_DOUBLE
4151a5fe 8872 /* special-case "%.<number>[gf]" */
7af36d83 8873 if ( !args && patlen <= 5 && pat[0] == '%' && pat[1] == '.'
4151a5fe
IZ
8874 && (pat[patlen-1] == 'g' || pat[patlen-1] == 'f') ) {
8875 unsigned digits = 0;
8876 const char *pp;
8877
8878 pp = pat + 2;
8879 while (*pp >= '0' && *pp <= '9')
8880 digits = 10 * digits + (*pp++ - '0');
028f8eaa 8881 if (pp - pat == (int)patlen - 1) {
4151a5fe
IZ
8882 NV nv;
8883
7af36d83 8884 if (svix < svmax)
4151a5fe
IZ
8885 nv = SvNV(*svargs);
8886 else
8887 return;
8888 if (*pp == 'g') {
2873255c
NC
8889 /* Add check for digits != 0 because it seems that some
8890 gconverts are buggy in this case, and we don't yet have
8891 a Configure test for this. */
8892 if (digits && digits < sizeof(ebuf) - NV_DIG - 10) {
8893 /* 0, point, slack */
2e59c212 8894 Gconvert(nv, (int)digits, 0, ebuf);
4151a5fe
IZ
8895 sv_catpv(sv, ebuf);
8896 if (*ebuf) /* May return an empty string for digits==0 */
8897 return;
8898 }
8899 } else if (!digits) {
8900 STRLEN l;
8901
8902 if ((p = F0convert(nv, ebuf + sizeof ebuf, &l))) {
8903 sv_catpvn(sv, p, l);
8904 return;
8905 }
8906 }
8907 }
8908 }
1d917b39 8909#endif /* !USE_LONG_DOUBLE */
4151a5fe 8910
2cf2cfc6 8911 if (!args && svix < svmax && DO_UTF8(*svargs))
205f51d8 8912 has_utf8 = TRUE;
2cf2cfc6 8913
46fc3d4c 8914 patend = (char*)pat + patlen;
8915 for (p = (char*)pat; p < patend; p = q) {
8916 bool alt = FALSE;
8917 bool left = FALSE;
b22c7a20 8918 bool vectorize = FALSE;
211dfcf1 8919 bool vectorarg = FALSE;
2cf2cfc6 8920 bool vec_utf8 = FALSE;
46fc3d4c 8921 char fill = ' ';
8922 char plus = 0;
8923 char intsize = 0;
8924 STRLEN width = 0;
fc36a67e 8925 STRLEN zeros = 0;
46fc3d4c 8926 bool has_precis = FALSE;
8927 STRLEN precis = 0;
58e33a90 8928 I32 osvix = svix;
2cf2cfc6 8929 bool is_utf8 = FALSE; /* is this item utf8? */
20f6aaab
AS
8930#ifdef HAS_LDBL_SPRINTF_BUG
8931 /* This is to try to fix a bug with irix/nonstop-ux/powerux and
205f51d8 8932 with sfio - Allen <allens@cpan.org> */
20f6aaab
AS
8933 bool fix_ldbl_sprintf_bug = FALSE;
8934#endif
205f51d8 8935
46fc3d4c 8936 char esignbuf[4];
89ebb4a3 8937 U8 utf8buf[UTF8_MAXBYTES+1];
46fc3d4c 8938 STRLEN esignlen = 0;
8939
4d84ee25 8940 const char *eptr = Nullch;
fc36a67e 8941 STRLEN elen = 0;
81f715da 8942 SV *vecsv = Nullsv;
245d4a47 8943 const U8 *vecstr = Null(U8*);
b22c7a20 8944 STRLEN veclen = 0;
934abaf1 8945 char c = 0;
46fc3d4c 8946 int i;
9c5ffd7c 8947 unsigned base = 0;
8c8eb53c
RB
8948 IV iv = 0;
8949 UV uv = 0;
9e5b023a
JH
8950 /* we need a long double target in case HAS_LONG_DOUBLE but
8951 not USE_LONG_DOUBLE
8952 */
35fff930 8953#if defined(HAS_LONG_DOUBLE) && LONG_DOUBLESIZE > DOUBLESIZE
9e5b023a
JH
8954 long double nv;
8955#else
65202027 8956 NV nv;
9e5b023a 8957#endif
46fc3d4c 8958 STRLEN have;
8959 STRLEN need;
8960 STRLEN gap;
7af36d83 8961 const char *dotstr = ".";
b22c7a20 8962 STRLEN dotstrlen = 1;
211dfcf1 8963 I32 efix = 0; /* explicit format parameter index */
eb3fce90 8964 I32 ewix = 0; /* explicit width index */
211dfcf1
HS
8965 I32 epix = 0; /* explicit precision index */
8966 I32 evix = 0; /* explicit vector index */
eb3fce90 8967 bool asterisk = FALSE;
46fc3d4c 8968
211dfcf1 8969 /* echo everything up to the next format specification */
46fc3d4c 8970 for (q = p; q < patend && *q != '%'; ++q) ;
8971 if (q > p) {
db79b45b
JH
8972 if (has_utf8 && !pat_utf8)
8973 sv_catpvn_utf8_upgrade(sv, p, q - p, nsv);
8974 else
8975 sv_catpvn(sv, p, q - p);
46fc3d4c 8976 p = q;
8977 }
8978 if (q++ >= patend)
8979 break;
8980
211dfcf1
HS
8981/*
8982 We allow format specification elements in this order:
8983 \d+\$ explicit format parameter index
8984 [-+ 0#]+ flags
a472f209 8985 v|\*(\d+\$)?v vector with optional (optionally specified) arg
f3583277 8986 0 flag (as above): repeated to allow "v02"
211dfcf1
HS
8987 \d+|\*(\d+\$)? width using optional (optionally specified) arg
8988 \.(\d*|\*(\d+\$)?) precision using optional (optionally specified) arg
8989 [hlqLV] size
8896765a
RB
8990 [%bcdefginopsuxDFOUX] format (mandatory)
8991*/
8992
8993 if (args) {
8994/*
8995 As of perl5.9.3, printf format checking is on by default.
8996 Internally, perl uses %p formats to provide an escape to
8997 some extended formatting. This block deals with those
8998 extensions: if it does not match, (char*)q is reset and
8999 the normal format processing code is used.
9000
9001 Currently defined extensions are:
9002 %p include pointer address (standard)
9003 %-p (SVf) include an SV (previously %_)
9004 %-<num>p include an SV with precision <num>
9005 %1p (VDf) include a v-string (as %vd)
9006 %<num>p reserved for future extensions
9007
9008 Robin Barker 2005-07-14
211dfcf1 9009*/
8896765a
RB
9010 char* r = q;
9011 bool sv = FALSE;
9012 STRLEN n = 0;
9013 if (*q == '-')
9014 sv = *q++;
9015 EXPECT_NUMBER(q, n);
9016 if (*q++ == 'p') {
9017 if (sv) { /* SVf */
9018 if (n) {
9019 precis = n;
9020 has_precis = TRUE;
9021 }
9022 argsv = va_arg(*args, SV*);
9023 eptr = SvPVx_const(argsv, elen);
9024 if (DO_UTF8(argsv))
9025 is_utf8 = TRUE;
9026 goto string;
9027 }
9028#if vdNUMBER
9029 else if (n == vdNUMBER) { /* VDf */
9030 vectorize = TRUE;
9031 VECTORIZE_ARGS
9032 goto format_vd;
9033 }
9034#endif
9035 else if (n) {
9036 if (ckWARN_d(WARN_INTERNAL))
9037 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
9038 "internal %%<num>p might conflict with future printf extensions");
9039 }
9040 }
9041 q = r;
9042 }
9043
211dfcf1
HS
9044 if (EXPECT_NUMBER(q, width)) {
9045 if (*q == '$') {
9046 ++q;
9047 efix = width;
9048 } else {
9049 goto gotwidth;
9050 }
9051 }
9052
fc36a67e 9053 /* FLAGS */
9054
46fc3d4c 9055 while (*q) {
9056 switch (*q) {
9057 case ' ':
9058 case '+':
9059 plus = *q++;
9060 continue;
9061
9062 case '-':
9063 left = TRUE;
9064 q++;
9065 continue;
9066
9067 case '0':
9068 fill = *q++;
9069 continue;
9070
9071 case '#':
9072 alt = TRUE;
9073 q++;
9074 continue;
9075
fc36a67e 9076 default:
9077 break;
9078 }
9079 break;
9080 }
46fc3d4c 9081
211dfcf1 9082 tryasterisk:
eb3fce90 9083 if (*q == '*') {
211dfcf1
HS
9084 q++;
9085 if (EXPECT_NUMBER(q, ewix))
9086 if (*q++ != '$')
9087 goto unknown;
eb3fce90 9088 asterisk = TRUE;
211dfcf1
HS
9089 }
9090 if (*q == 'v') {
eb3fce90 9091 q++;
211dfcf1
HS
9092 if (vectorize)
9093 goto unknown;
9cbac4c7 9094 if ((vectorarg = asterisk)) {
211dfcf1
HS
9095 evix = ewix;
9096 ewix = 0;
9097 asterisk = FALSE;
9098 }
9099 vectorize = TRUE;
9100 goto tryasterisk;
eb3fce90
JH
9101 }
9102
211dfcf1 9103 if (!asterisk)
858a90f9 9104 {
7a5fa8a2 9105 if( *q == '0' )
f3583277 9106 fill = *q++;
211dfcf1 9107 EXPECT_NUMBER(q, width);
858a90f9 9108 }
211dfcf1
HS
9109
9110 if (vectorize) {
9111 if (vectorarg) {
9112 if (args)
9113 vecsv = va_arg(*args, SV*);
9114 else
9115 vecsv = (evix ? evix <= svmax : svix < svmax) ?
3a7a539e 9116 svargs[evix ? evix-1 : svix++] : &PL_sv_undef;
245d4a47 9117 dotstr = SvPV_const(vecsv, dotstrlen);
211dfcf1 9118 if (DO_UTF8(vecsv))
2cf2cfc6 9119 is_utf8 = TRUE;
211dfcf1
HS
9120 }
9121 if (args) {
8896765a 9122 VECTORIZE_ARGS
eb3fce90 9123 }
211dfcf1
HS
9124 else if (efix ? efix <= svmax : svix < svmax) {
9125 vecsv = svargs[efix ? efix-1 : svix++];
245d4a47 9126 vecstr = (U8*)SvPV_const(vecsv,veclen);
2cf2cfc6 9127 vec_utf8 = DO_UTF8(vecsv);
d7aa5382 9128 /* if this is a version object, we need to return the
3f7c398e 9129 * stringified representation (which the SvPVX_const has
d7aa5382
JP
9130 * already done for us), but not vectorize the args
9131 */
9132 if ( *q == 'd' && sv_derived_from(vecsv,"version") )
9133 {
9134 q++; /* skip past the rest of the %vd format */
245d4a47 9135 eptr = (const char *) vecstr;
d7aa5382
JP
9136 elen = strlen(eptr);
9137 vectorize=FALSE;
9138 goto string;
9139 }
211dfcf1
HS
9140 }
9141 else {
9142 vecstr = (U8*)"";
9143 veclen = 0;
9144 }
eb3fce90 9145 }
fc36a67e 9146
eb3fce90 9147 if (asterisk) {
fc36a67e 9148 if (args)
9149 i = va_arg(*args, int);
9150 else
eb3fce90
JH
9151 i = (ewix ? ewix <= svmax : svix < svmax) ?
9152 SvIVx(svargs[ewix ? ewix-1 : svix++]) : 0;
fc36a67e 9153 left |= (i < 0);
9154 width = (i < 0) ? -i : i;
fc36a67e 9155 }
211dfcf1 9156 gotwidth:
fc36a67e 9157
9158 /* PRECISION */
46fc3d4c 9159
fc36a67e 9160 if (*q == '.') {
9161 q++;
9162 if (*q == '*') {
211dfcf1 9163 q++;
7b8dd722
HS
9164 if (EXPECT_NUMBER(q, epix) && *q++ != '$')
9165 goto unknown;
9166 /* XXX: todo, support specified precision parameter */
9167 if (epix)
211dfcf1 9168 goto unknown;
46fc3d4c 9169 if (args)
9170 i = va_arg(*args, int);
9171 else
eb3fce90
JH
9172 i = (ewix ? ewix <= svmax : svix < svmax)
9173 ? SvIVx(svargs[ewix ? ewix-1 : svix++]) : 0;
fc36a67e 9174 precis = (i < 0) ? 0 : i;
fc36a67e 9175 }
9176 else {
9177 precis = 0;
9178 while (isDIGIT(*q))
9179 precis = precis * 10 + (*q++ - '0');
9180 }
9181 has_precis = TRUE;
9182 }
46fc3d4c 9183
fc36a67e 9184 /* SIZE */
46fc3d4c 9185
fc36a67e 9186 switch (*q) {
c623ac67
GS
9187#ifdef WIN32
9188 case 'I': /* Ix, I32x, and I64x */
9189# ifdef WIN64
9190 if (q[1] == '6' && q[2] == '4') {
9191 q += 3;
9192 intsize = 'q';
9193 break;
9194 }
9195# endif
9196 if (q[1] == '3' && q[2] == '2') {
9197 q += 3;
9198 break;
9199 }
9200# ifdef WIN64
9201 intsize = 'q';
9202# endif
9203 q++;
9204 break;
9205#endif
9e5b023a 9206#if defined(HAS_QUAD) || defined(HAS_LONG_DOUBLE)
6f9bb7fd 9207 case 'L': /* Ld */
e5c81feb 9208 /* FALL THROUGH */
e5c81feb 9209#ifdef HAS_QUAD
6f9bb7fd 9210 case 'q': /* qd */
9e5b023a 9211#endif
6f9bb7fd
GS
9212 intsize = 'q';
9213 q++;
9214 break;
9215#endif
fc36a67e 9216 case 'l':
9e5b023a 9217#if defined(HAS_QUAD) || defined(HAS_LONG_DOUBLE)
205f51d8 9218 if (*(q + 1) == 'l') { /* lld, llf */
fc36a67e 9219 intsize = 'q';
9220 q += 2;
46fc3d4c 9221 break;
cf2093f6 9222 }
fc36a67e 9223#endif
6f9bb7fd 9224 /* FALL THROUGH */
fc36a67e 9225 case 'h':
cf2093f6 9226 /* FALL THROUGH */
fc36a67e 9227 case 'V':
9228 intsize = *q++;
46fc3d4c 9229 break;
9230 }
9231
fc36a67e 9232 /* CONVERSION */
9233
211dfcf1
HS
9234 if (*q == '%') {
9235 eptr = q++;
9236 elen = 1;
9237 goto string;
9238 }
9239
be75b157
HS
9240 if (vectorize)
9241 argsv = vecsv;
9242 else if (!args)
211dfcf1
HS
9243 argsv = (efix ? efix <= svmax : svix < svmax) ?
9244 svargs[efix ? efix-1 : svix++] : &PL_sv_undef;
9245
46fc3d4c 9246 switch (c = *q++) {
9247
9248 /* STRINGS */
9249
46fc3d4c 9250 case 'c':
be75b157 9251 uv = (args && !vectorize) ? va_arg(*args, int) : SvIVx(argsv);
1bd104fb
JH
9252 if ((uv > 255 ||
9253 (!UNI_IS_INVARIANT(uv) && SvUTF8(sv)))
0064a8a9 9254 && !IN_BYTES) {
dfe13c55 9255 eptr = (char*)utf8buf;
9041c2e3 9256 elen = uvchr_to_utf8((U8*)eptr, uv) - utf8buf;
2cf2cfc6 9257 is_utf8 = TRUE;
7e2040f0
GS
9258 }
9259 else {
9260 c = (char)uv;
9261 eptr = &c;
9262 elen = 1;
a0ed51b3 9263 }
46fc3d4c 9264 goto string;
9265
46fc3d4c 9266 case 's':
be75b157 9267 if (args && !vectorize) {
fc36a67e 9268 eptr = va_arg(*args, char*);
c635e13b 9269 if (eptr)
1d7c1841
GS
9270#ifdef MACOS_TRADITIONAL
9271 /* On MacOS, %#s format is used for Pascal strings */
9272 if (alt)
9273 elen = *eptr++;
9274 else
9275#endif
c635e13b 9276 elen = strlen(eptr);
9277 else {
27da23d5 9278 eptr = (char *)nullstr;
c635e13b 9279 elen = sizeof nullstr - 1;
9280 }
46fc3d4c 9281 }
211dfcf1 9282 else {
4d84ee25 9283 eptr = SvPVx_const(argsv, elen);
7e2040f0 9284 if (DO_UTF8(argsv)) {
a0ed51b3
LW
9285 if (has_precis && precis < elen) {
9286 I32 p = precis;
7e2040f0 9287 sv_pos_u2b(argsv, &p, 0); /* sticks at end */
a0ed51b3
LW
9288 precis = p;
9289 }
9290 if (width) { /* fudge width (can't fudge elen) */
7e2040f0 9291 width += elen - sv_len_utf8(argsv);
a0ed51b3 9292 }
2cf2cfc6 9293 is_utf8 = TRUE;
a0ed51b3
LW
9294 }
9295 }
fc36a67e 9296
46fc3d4c 9297 string:
b22c7a20 9298 vectorize = FALSE;
46fc3d4c 9299 if (has_precis && elen > precis)
9300 elen = precis;
9301 break;
9302
9303 /* INTEGERS */
9304
fc36a67e 9305 case 'p':
be75b157 9306 if (alt || vectorize)
c2e66d9e 9307 goto unknown;
211dfcf1 9308 uv = PTR2UV(args ? va_arg(*args, void*) : argsv);
fc36a67e 9309 base = 16;
9310 goto integer;
9311
46fc3d4c 9312 case 'D':
29fe7a80 9313#ifdef IV_IS_QUAD
22f3ae8c 9314 intsize = 'q';
29fe7a80 9315#else
46fc3d4c 9316 intsize = 'l';
29fe7a80 9317#endif
46fc3d4c 9318 /* FALL THROUGH */
9319 case 'd':
9320 case 'i':
8896765a
RB
9321#if vdNUMBER
9322 format_vd:
9323#endif
b22c7a20 9324 if (vectorize) {
ba210ebe 9325 STRLEN ulen;
211dfcf1
HS
9326 if (!veclen)
9327 continue;
2cf2cfc6
A
9328 if (vec_utf8)
9329 uv = utf8n_to_uvchr(vecstr, veclen, &ulen,
9330 UTF8_ALLOW_ANYUV);
b22c7a20 9331 else {
e83d50c9 9332 uv = *vecstr;
b22c7a20
GS
9333 ulen = 1;
9334 }
9335 vecstr += ulen;
9336 veclen -= ulen;
e83d50c9
JP
9337 if (plus)
9338 esignbuf[esignlen++] = plus;
b22c7a20
GS
9339 }
9340 else if (args) {
46fc3d4c 9341 switch (intsize) {
9342 case 'h': iv = (short)va_arg(*args, int); break;
46fc3d4c 9343 case 'l': iv = va_arg(*args, long); break;
fc36a67e 9344 case 'V': iv = va_arg(*args, IV); break;
b10c0dba 9345 default: iv = va_arg(*args, int); break;
cf2093f6
JH
9346#ifdef HAS_QUAD
9347 case 'q': iv = va_arg(*args, Quad_t); break;
9348#endif
46fc3d4c 9349 }
9350 }
9351 else {
b10c0dba 9352 IV tiv = SvIVx(argsv); /* work around GCC bug #13488 */
46fc3d4c 9353 switch (intsize) {
b10c0dba
MHM
9354 case 'h': iv = (short)tiv; break;
9355 case 'l': iv = (long)tiv; break;
9356 case 'V':
9357 default: iv = tiv; break;
cf2093f6 9358#ifdef HAS_QUAD
b10c0dba 9359 case 'q': iv = (Quad_t)tiv; break;
cf2093f6 9360#endif
46fc3d4c 9361 }
9362 }
e83d50c9
JP
9363 if ( !vectorize ) /* we already set uv above */
9364 {
9365 if (iv >= 0) {
9366 uv = iv;
9367 if (plus)
9368 esignbuf[esignlen++] = plus;
9369 }
9370 else {
9371 uv = -iv;
9372 esignbuf[esignlen++] = '-';
9373 }
46fc3d4c 9374 }
9375 base = 10;
9376 goto integer;
9377
fc36a67e 9378 case 'U':
29fe7a80 9379#ifdef IV_IS_QUAD
22f3ae8c 9380 intsize = 'q';
29fe7a80 9381#else
fc36a67e 9382 intsize = 'l';
29fe7a80 9383#endif
fc36a67e 9384 /* FALL THROUGH */
9385 case 'u':
9386 base = 10;
9387 goto uns_integer;
9388
4f19785b
WSI
9389 case 'b':
9390 base = 2;
9391 goto uns_integer;
9392
46fc3d4c 9393 case 'O':
29fe7a80 9394#ifdef IV_IS_QUAD
22f3ae8c 9395 intsize = 'q';
29fe7a80 9396#else
46fc3d4c 9397 intsize = 'l';
29fe7a80 9398#endif
46fc3d4c 9399 /* FALL THROUGH */
9400 case 'o':
9401 base = 8;
9402 goto uns_integer;
9403
9404 case 'X':
46fc3d4c 9405 case 'x':
9406 base = 16;
46fc3d4c 9407
9408 uns_integer:
b22c7a20 9409 if (vectorize) {
ba210ebe 9410 STRLEN ulen;
b22c7a20 9411 vector:
211dfcf1
HS
9412 if (!veclen)
9413 continue;
2cf2cfc6
A
9414 if (vec_utf8)
9415 uv = utf8n_to_uvchr(vecstr, veclen, &ulen,
9416 UTF8_ALLOW_ANYUV);
b22c7a20 9417 else {
a05b299f 9418 uv = *vecstr;
b22c7a20
GS
9419 ulen = 1;
9420 }
9421 vecstr += ulen;
9422 veclen -= ulen;
9423 }
9424 else if (args) {
46fc3d4c 9425 switch (intsize) {
9426 case 'h': uv = (unsigned short)va_arg(*args, unsigned); break;
46fc3d4c 9427 case 'l': uv = va_arg(*args, unsigned long); break;
fc36a67e 9428 case 'V': uv = va_arg(*args, UV); break;
b10c0dba 9429 default: uv = va_arg(*args, unsigned); break;
cf2093f6 9430#ifdef HAS_QUAD
9e3321a5 9431 case 'q': uv = va_arg(*args, Uquad_t); break;
cf2093f6 9432#endif
46fc3d4c 9433 }
9434 }
9435 else {
b10c0dba 9436 UV tuv = SvUVx(argsv); /* work around GCC bug #13488 */
46fc3d4c 9437 switch (intsize) {
b10c0dba
MHM
9438 case 'h': uv = (unsigned short)tuv; break;
9439 case 'l': uv = (unsigned long)tuv; break;
9440 case 'V':
9441 default: uv = tuv; break;
cf2093f6 9442#ifdef HAS_QUAD
b10c0dba 9443 case 'q': uv = (Uquad_t)tuv; break;
cf2093f6 9444#endif
46fc3d4c 9445 }
9446 }
9447
9448 integer:
4d84ee25
NC
9449 {
9450 char *ptr = ebuf + sizeof ebuf;
9451 switch (base) {
9452 unsigned dig;
9453 case 16:
9454 if (!uv)
9455 alt = FALSE;
9456 p = (char*)((c == 'X')
9457 ? "0123456789ABCDEF" : "0123456789abcdef");
9458 do {
9459 dig = uv & 15;
9460 *--ptr = p[dig];
9461 } while (uv >>= 4);
9462 if (alt) {
9463 esignbuf[esignlen++] = '0';
9464 esignbuf[esignlen++] = c; /* 'x' or 'X' */
9465 }
9466 break;
9467 case 8:
9468 do {
9469 dig = uv & 7;
9470 *--ptr = '0' + dig;
9471 } while (uv >>= 3);
9472 if (alt && *ptr != '0')
9473 *--ptr = '0';
9474 break;
9475 case 2:
9476 do {
9477 dig = uv & 1;
9478 *--ptr = '0' + dig;
9479 } while (uv >>= 1);
9480 if (alt) {
9481 esignbuf[esignlen++] = '0';
9482 esignbuf[esignlen++] = 'b';
9483 }
9484 break;
9485 default: /* it had better be ten or less */
9486 do {
9487 dig = uv % base;
9488 *--ptr = '0' + dig;
9489 } while (uv /= base);
9490 break;
46fc3d4c 9491 }
4d84ee25
NC
9492 elen = (ebuf + sizeof ebuf) - ptr;
9493 eptr = ptr;
9494 if (has_precis) {
9495 if (precis > elen)
9496 zeros = precis - elen;
9497 else if (precis == 0 && elen == 1 && *eptr == '0')
9498 elen = 0;
eda88b6d 9499 }
c10ed8b9 9500 }
46fc3d4c 9501 break;
9502
9503 /* FLOATING POINT */
9504
fc36a67e 9505 case 'F':
9506 c = 'f'; /* maybe %F isn't supported here */
9507 /* FALL THROUGH */
46fc3d4c 9508 case 'e': case 'E':
fc36a67e 9509 case 'f':
46fc3d4c 9510 case 'g': case 'G':
9511
9512 /* This is evil, but floating point is even more evil */
9513
9e5b023a
JH
9514 /* for SV-style calling, we can only get NV
9515 for C-style calling, we assume %f is double;
9516 for simplicity we allow any of %Lf, %llf, %qf for long double
9517 */
9518 switch (intsize) {
9519 case 'V':
9520#if defined(USE_LONG_DOUBLE)
9521 intsize = 'q';
9522#endif
9523 break;
8a2e3f14 9524/* [perl #20339] - we should accept and ignore %lf rather than die */
00e17364
HS
9525 case 'l':
9526 /* FALL THROUGH */
9e5b023a
JH
9527 default:
9528#if defined(USE_LONG_DOUBLE)
9529 intsize = args ? 0 : 'q';
9530#endif
9531 break;
9532 case 'q':
9533#if defined(HAS_LONG_DOUBLE)
9534 break;
9535#else
9536 /* FALL THROUGH */
9537#endif
9538 case 'h':
9e5b023a
JH
9539 goto unknown;
9540 }
9541
9542 /* now we need (long double) if intsize == 'q', else (double) */
be75b157 9543 nv = (args && !vectorize) ?
35fff930
JH
9544#if LONG_DOUBLESIZE > DOUBLESIZE
9545 intsize == 'q' ?
205f51d8
AS
9546 va_arg(*args, long double) :
9547 va_arg(*args, double)
35fff930 9548#else
205f51d8 9549 va_arg(*args, double)
35fff930 9550#endif
9e5b023a 9551 : SvNVx(argsv);
fc36a67e 9552
9553 need = 0;
be75b157 9554 vectorize = FALSE;
fc36a67e 9555 if (c != 'e' && c != 'E') {
9556 i = PERL_INT_MIN;
9e5b023a
JH
9557 /* FIXME: if HAS_LONG_DOUBLE but not USE_LONG_DOUBLE this
9558 will cast our (long double) to (double) */
73b309ea 9559 (void)Perl_frexp(nv, &i);
fc36a67e 9560 if (i == PERL_INT_MIN)
cea2e8a9 9561 Perl_die(aTHX_ "panic: frexp");
c635e13b 9562 if (i > 0)
fc36a67e 9563 need = BIT_DIGITS(i);
9564 }
9565 need += has_precis ? precis : 6; /* known default */
20f6aaab 9566
fc36a67e 9567 if (need < width)
9568 need = width;
9569
20f6aaab
AS
9570#ifdef HAS_LDBL_SPRINTF_BUG
9571 /* This is to try to fix a bug with irix/nonstop-ux/powerux and
205f51d8
AS
9572 with sfio - Allen <allens@cpan.org> */
9573
9574# ifdef DBL_MAX
9575# define MY_DBL_MAX DBL_MAX
9576# else /* XXX guessing! HUGE_VAL may be defined as infinity, so not using */
9577# if DOUBLESIZE >= 8
9578# define MY_DBL_MAX 1.7976931348623157E+308L
9579# else
9580# define MY_DBL_MAX 3.40282347E+38L
9581# endif
9582# endif
9583
9584# ifdef HAS_LDBL_SPRINTF_BUG_LESS1 /* only between -1L & 1L - Allen */
9585# define MY_DBL_MAX_BUG 1L
20f6aaab 9586# else
205f51d8 9587# define MY_DBL_MAX_BUG MY_DBL_MAX
20f6aaab 9588# endif
20f6aaab 9589
205f51d8
AS
9590# ifdef DBL_MIN
9591# define MY_DBL_MIN DBL_MIN
9592# else /* XXX guessing! -Allen */
9593# if DOUBLESIZE >= 8
9594# define MY_DBL_MIN 2.2250738585072014E-308L
9595# else
9596# define MY_DBL_MIN 1.17549435E-38L
9597# endif
9598# endif
20f6aaab 9599
205f51d8
AS
9600 if ((intsize == 'q') && (c == 'f') &&
9601 ((nv < MY_DBL_MAX_BUG) && (nv > -MY_DBL_MAX_BUG)) &&
9602 (need < DBL_DIG)) {
9603 /* it's going to be short enough that
9604 * long double precision is not needed */
9605
9606 if ((nv <= 0L) && (nv >= -0L))
9607 fix_ldbl_sprintf_bug = TRUE; /* 0 is 0 - easiest */
9608 else {
9609 /* would use Perl_fp_class as a double-check but not
9610 * functional on IRIX - see perl.h comments */
9611
9612 if ((nv >= MY_DBL_MIN) || (nv <= -MY_DBL_MIN)) {
9613 /* It's within the range that a double can represent */
9614#if defined(DBL_MAX) && !defined(DBL_MIN)
9615 if ((nv >= ((long double)1/DBL_MAX)) ||
9616 (nv <= (-(long double)1/DBL_MAX)))
20f6aaab 9617#endif
205f51d8 9618 fix_ldbl_sprintf_bug = TRUE;
20f6aaab 9619 }
205f51d8
AS
9620 }
9621 if (fix_ldbl_sprintf_bug == TRUE) {
9622 double temp;
9623
9624 intsize = 0;
9625 temp = (double)nv;
9626 nv = (NV)temp;
9627 }
20f6aaab 9628 }
205f51d8
AS
9629
9630# undef MY_DBL_MAX
9631# undef MY_DBL_MAX_BUG
9632# undef MY_DBL_MIN
9633
20f6aaab
AS
9634#endif /* HAS_LDBL_SPRINTF_BUG */
9635
46fc3d4c 9636 need += 20; /* fudge factor */
80252599
GS
9637 if (PL_efloatsize < need) {
9638 Safefree(PL_efloatbuf);
9639 PL_efloatsize = need + 20; /* more fudge */
a02a5408 9640 Newx(PL_efloatbuf, PL_efloatsize, char);
7d5ea4e7 9641 PL_efloatbuf[0] = '\0';
46fc3d4c 9642 }
9643
4151a5fe
IZ
9644 if ( !(width || left || plus || alt) && fill != '0'
9645 && has_precis && intsize != 'q' ) { /* Shortcuts */
2873255c
NC
9646 /* See earlier comment about buggy Gconvert when digits,
9647 aka precis is 0 */
9648 if ( c == 'g' && precis) {
2e59c212 9649 Gconvert((NV)nv, (int)precis, 0, PL_efloatbuf);
4151a5fe
IZ
9650 if (*PL_efloatbuf) /* May return an empty string for digits==0 */
9651 goto float_converted;
9652 } else if ( c == 'f' && !precis) {
9653 if ((eptr = F0convert(nv, ebuf + sizeof ebuf, &elen)))
9654 break;
9655 }
9656 }
4d84ee25
NC
9657 {
9658 char *ptr = ebuf + sizeof ebuf;
9659 *--ptr = '\0';
9660 *--ptr = c;
9661 /* FIXME: what to do if HAS_LONG_DOUBLE but not PERL_PRIfldbl? */
9e5b023a 9662#if defined(HAS_LONG_DOUBLE) && defined(PERL_PRIfldbl)
4d84ee25
NC
9663 if (intsize == 'q') {
9664 /* Copy the one or more characters in a long double
9665 * format before the 'base' ([efgEFG]) character to
9666 * the format string. */
9667 static char const prifldbl[] = PERL_PRIfldbl;
9668 char const *p = prifldbl + sizeof(prifldbl) - 3;
9669 while (p >= prifldbl) { *--ptr = *p--; }
9670 }
65202027 9671#endif
4d84ee25
NC
9672 if (has_precis) {
9673 base = precis;
9674 do { *--ptr = '0' + (base % 10); } while (base /= 10);
9675 *--ptr = '.';
9676 }
9677 if (width) {
9678 base = width;
9679 do { *--ptr = '0' + (base % 10); } while (base /= 10);
9680 }
9681 if (fill == '0')
9682 *--ptr = fill;
9683 if (left)
9684 *--ptr = '-';
9685 if (plus)
9686 *--ptr = plus;
9687 if (alt)
9688 *--ptr = '#';
9689 *--ptr = '%';
9690
9691 /* No taint. Otherwise we are in the strange situation
9692 * where printf() taints but print($float) doesn't.
9693 * --jhi */
9e5b023a 9694#if defined(HAS_LONG_DOUBLE)
4d84ee25
NC
9695 if (intsize == 'q')
9696 (void)sprintf(PL_efloatbuf, ptr, nv);
9697 else
9698 (void)sprintf(PL_efloatbuf, ptr, (double)nv);
9e5b023a 9699#else
4d84ee25 9700 (void)sprintf(PL_efloatbuf, ptr, nv);
9e5b023a 9701#endif
4d84ee25 9702 }
4151a5fe 9703 float_converted:
80252599
GS
9704 eptr = PL_efloatbuf;
9705 elen = strlen(PL_efloatbuf);
46fc3d4c 9706 break;
9707
fc36a67e 9708 /* SPECIAL */
9709
9710 case 'n':
9711 i = SvCUR(sv) - origlen;
be75b157 9712 if (args && !vectorize) {
c635e13b 9713 switch (intsize) {
9714 case 'h': *(va_arg(*args, short*)) = i; break;
9715 default: *(va_arg(*args, int*)) = i; break;
9716 case 'l': *(va_arg(*args, long*)) = i; break;
9717 case 'V': *(va_arg(*args, IV*)) = i; break;
cf2093f6
JH
9718#ifdef HAS_QUAD
9719 case 'q': *(va_arg(*args, Quad_t*)) = i; break;
9720#endif
c635e13b 9721 }
fc36a67e 9722 }
9dd79c3f 9723 else
211dfcf1 9724 sv_setuv_mg(argsv, (UV)i);
be75b157 9725 vectorize = FALSE;
fc36a67e 9726 continue; /* not "break" */
9727
9728 /* UNKNOWN */
9729
46fc3d4c 9730 default:
fc36a67e 9731 unknown:
041457d9
DM
9732 if (!args
9733 && (PL_op->op_type == OP_PRTF || PL_op->op_type == OP_SPRINTF)
9734 && ckWARN(WARN_PRINTF))
9735 {
c635e13b 9736 SV *msg = sv_newmortal();
35c1215d
NC
9737 Perl_sv_setpvf(aTHX_ msg, "Invalid conversion in %sprintf: ",
9738 (PL_op->op_type == OP_PRTF) ? "" : "s");
0f4b6630 9739 if (c) {
0f4b6630 9740 if (isPRINT(c))
1c846c1f 9741 Perl_sv_catpvf(aTHX_ msg,
0f4b6630
JH
9742 "\"%%%c\"", c & 0xFF);
9743 else
9744 Perl_sv_catpvf(aTHX_ msg,
57def98f 9745 "\"%%\\%03"UVof"\"",
0f4b6630 9746 (UV)c & 0xFF);
0f4b6630 9747 } else
c635e13b 9748 sv_catpv(msg, "end of string");
9014280d 9749 Perl_warner(aTHX_ packWARN(WARN_PRINTF), "%"SVf, msg); /* yes, this is reentrant */
c635e13b 9750 }
fb73857a 9751
9752 /* output mangled stuff ... */
9753 if (c == '\0')
9754 --q;
46fc3d4c 9755 eptr = p;
9756 elen = q - p;
fb73857a 9757
9758 /* ... right here, because formatting flags should not apply */
9759 SvGROW(sv, SvCUR(sv) + elen + 1);
9760 p = SvEND(sv);
4459522c 9761 Copy(eptr, p, elen, char);
fb73857a 9762 p += elen;
9763 *p = '\0';
3f7c398e 9764 SvCUR_set(sv, p - SvPVX_const(sv));
58e33a90 9765 svix = osvix;
fb73857a 9766 continue; /* not "break" */
46fc3d4c 9767 }
9768
6c94ec8b
HS
9769 /* calculate width before utf8_upgrade changes it */
9770 have = esignlen + zeros + elen;
9771
d2876be5
JH
9772 if (is_utf8 != has_utf8) {
9773 if (is_utf8) {
9774 if (SvCUR(sv))
9775 sv_utf8_upgrade(sv);
9776 }
9777 else {
53c1dcc0 9778 SV * const nsv = sv_2mortal(newSVpvn(eptr, elen));
d2876be5 9779 sv_utf8_upgrade(nsv);
93524f2b 9780 eptr = SvPVX_const(nsv);
d2876be5
JH
9781 elen = SvCUR(nsv);
9782 }
9783 SvGROW(sv, SvCUR(sv) + elen + 1);
9784 p = SvEND(sv);
9785 *p = '\0';
9786 }
6af65485 9787
46fc3d4c 9788 need = (have > width ? have : width);
9789 gap = need - have;
9790
b22c7a20 9791 SvGROW(sv, SvCUR(sv) + need + dotstrlen + 1);
46fc3d4c 9792 p = SvEND(sv);
9793 if (esignlen && fill == '0') {
53c1dcc0 9794 int i;
eb160463 9795 for (i = 0; i < (int)esignlen; i++)
46fc3d4c 9796 *p++ = esignbuf[i];
9797 }
9798 if (gap && !left) {
9799 memset(p, fill, gap);
9800 p += gap;
9801 }
9802 if (esignlen && fill != '0') {
53c1dcc0 9803 int i;
eb160463 9804 for (i = 0; i < (int)esignlen; i++)
46fc3d4c 9805 *p++ = esignbuf[i];
9806 }
fc36a67e 9807 if (zeros) {
53c1dcc0 9808 int i;
fc36a67e 9809 for (i = zeros; i; i--)
9810 *p++ = '0';
9811 }
46fc3d4c 9812 if (elen) {
4459522c 9813 Copy(eptr, p, elen, char);
46fc3d4c 9814 p += elen;
9815 }
9816 if (gap && left) {
9817 memset(p, ' ', gap);
9818 p += gap;
9819 }
b22c7a20
GS
9820 if (vectorize) {
9821 if (veclen) {
4459522c 9822 Copy(dotstr, p, dotstrlen, char);
b22c7a20
GS
9823 p += dotstrlen;
9824 }
9825 else
9826 vectorize = FALSE; /* done iterating over vecstr */
9827 }
2cf2cfc6
A
9828 if (is_utf8)
9829 has_utf8 = TRUE;
9830 if (has_utf8)
7e2040f0 9831 SvUTF8_on(sv);
46fc3d4c 9832 *p = '\0';
3f7c398e 9833 SvCUR_set(sv, p - SvPVX_const(sv));
b22c7a20
GS
9834 if (vectorize) {
9835 esignlen = 0;
9836 goto vector;
9837 }
46fc3d4c 9838 }
9839}
51371543 9840
645c22ef
DM
9841/* =========================================================================
9842
9843=head1 Cloning an interpreter
9844
9845All the macros and functions in this section are for the private use of
9846the main function, perl_clone().
9847
9848The foo_dup() functions make an exact copy of an existing foo thingy.
9849During the course of a cloning, a hash table is used to map old addresses
9850to new addresses. The table is created and manipulated with the
9851ptr_table_* functions.
9852
9853=cut
9854
9855============================================================================*/
9856
9857
1d7c1841
GS
9858#if defined(USE_ITHREADS)
9859
1d7c1841
GS
/* Bump the reference count of a GP (if non-NULL) and yield the GP itself. */
#ifndef GpREFCNT_inc
#  define GpREFCNT_inc(gp)	((gp) ? (++(gp)->gp_refcnt, (gp)) : (GP*)NULL)
#endif


/* Typed convenience wrappers around sv_dup().  The *_inc variants also pass
 * the duplicate through SvREFCNT_inc().  Arguments that are cast and the
 * expansions that begin with a cast are fully parenthesised so that the
 * macros stay correct when given expression arguments or when the result
 * is used in a larger expression. */
#define sv_dup_inc(s,t)	SvREFCNT_inc(sv_dup(s,t))
#define av_dup(s,t)	((AV*)sv_dup((SV*)(s),t))
#define av_dup_inc(s,t)	((AV*)SvREFCNT_inc(sv_dup((SV*)(s),t)))
#define hv_dup(s,t)	((HV*)sv_dup((SV*)(s),t))
#define hv_dup_inc(s,t)	((HV*)SvREFCNT_inc(sv_dup((SV*)(s),t)))
#define cv_dup(s,t)	((CV*)sv_dup((SV*)(s),t))
#define cv_dup_inc(s,t)	((CV*)SvREFCNT_inc(sv_dup((SV*)(s),t)))
#define io_dup(s,t)	((IO*)sv_dup((SV*)(s),t))
#define io_dup_inc(s,t)	((IO*)SvREFCNT_inc(sv_dup((SV*)(s),t)))
#define gv_dup(s,t)	((GV*)sv_dup((SV*)(s),t))
#define gv_dup_inc(s,t)	((GV*)SvREFCNT_inc(sv_dup((SV*)(s),t)))

/* NULL-tolerant string copies: yield Nullch when p is a null pointer,
 * otherwise the result of savepv()/savepvn(). */
#define SAVEPV(p)	((p) ? savepv(p) : Nullch)
#define SAVEPVN(p,n)	((p) ? savepvn(p,n) : Nullch)
8cf8f3d1 9878
d2d73c3e 9879
d2f185dc
AMS
9880/* Duplicate a regexp. Required reading: pregcomp() and pregfree() in
9881 regcomp.c. AMS 20010712 */
645c22ef 9882
1d7c1841 9883REGEXP *
53c1dcc0 9884Perl_re_dup(pTHX_ const REGEXP *r, CLONE_PARAMS *param)
1d7c1841 9885{
27da23d5 9886 dVAR;
d2f185dc
AMS
9887 REGEXP *ret;
9888 int i, len, npar;
9889 struct reg_substr_datum *s;
9890
9891 if (!r)
9892 return (REGEXP *)NULL;
9893
9894 if ((ret = (REGEXP *)ptr_table_fetch(PL_ptr_table, r)))
9895 return ret;
9896
9897 len = r->offsets[0];
9898 npar = r->nparens+1;
9899
a02a5408 9900 Newxc(ret, sizeof(regexp) + (len+1)*sizeof(regnode), char, regexp);
d2f185dc
AMS
9901 Copy(r->program, ret->program, len+1, regnode);
9902
a02a5408 9903 Newx(ret->startp, npar, I32);
d2f185dc 9904 Copy(r->startp, ret->startp, npar, I32);
a02a5408 9905 Newx(ret->endp, npar, I32);
d2f185dc
AMS
9906 Copy(r->startp, ret->startp, npar, I32);
9907
a02a5408 9908 Newx(ret->substrs, 1, struct reg_substr_data);
d2f185dc
AMS
9909 for (s = ret->substrs->data, i = 0; i < 3; i++, s++) {
9910 s->min_offset = r->substrs->data[i].min_offset;
9911 s->max_offset = r->substrs->data[i].max_offset;
9912 s->substr = sv_dup_inc(r->substrs->data[i].substr, param);
33b8afdf 9913 s->utf8_substr = sv_dup_inc(r->substrs->data[i].utf8_substr, param);
d2f185dc
AMS
9914 }
9915
70612e96 9916 ret->regstclass = NULL;
d2f185dc
AMS
9917 if (r->data) {
9918 struct reg_data *d;
e1ec3a88 9919 const int count = r->data->count;
53c1dcc0 9920 int i;
d2f185dc 9921
a02a5408 9922 Newxc(d, sizeof(struct reg_data) + count*sizeof(void *),
d2f185dc 9923 char, struct reg_data);
a02a5408 9924 Newx(d->what, count, U8);
d2f185dc
AMS
9925
9926 d->count = count;
9927 for (i = 0; i < count; i++) {
9928 d->what[i] = r->data->what[i];
9929 switch (d->what[i]) {
a3621e74
YO
9930 /* legal options are one of: sfpont
9931 see also regcomp.h and pregfree() */
d2f185dc
AMS
9932 case 's':
9933 d->data[i] = sv_dup_inc((SV *)r->data->data[i], param);
9934 break;
9935 case 'p':
9936 d->data[i] = av_dup_inc((AV *)r->data->data[i], param);
9937 break;
9938 case 'f':
9939 /* This is cheating. */
a02a5408 9940 Newx(d->data[i], 1, struct regnode_charclass_class);
d2f185dc
AMS
9941 StructCopy(r->data->data[i], d->data[i],
9942 struct regnode_charclass_class);
70612e96 9943 ret->regstclass = (regnode*)d->data[i];
d2f185dc
AMS
9944 break;
9945 case 'o':
33773810
AMS
9946 /* Compiled op trees are readonly, and can thus be
9947 shared without duplication. */
b34c0dd4 9948 OP_REFCNT_LOCK;
9b978d73 9949 d->data[i] = (void*)OpREFCNT_inc((OP*)r->data->data[i]);
b34c0dd4 9950 OP_REFCNT_UNLOCK;
9b978d73 9951 break;
d2f185dc
AMS
9952 case 'n':
9953 d->data[i] = r->data->data[i];
9954 break;
a3621e74
YO
9955 case 't':
9956 d->data[i] = r->data->data[i];
9957 OP_REFCNT_LOCK;
9958 ((reg_trie_data*)d->data[i])->refcount++;
9959 OP_REFCNT_UNLOCK;
9960 break;
9961 default:
9962 Perl_croak(aTHX_ "panic: re_dup unknown data code '%c'", r->data->what[i]);
d2f185dc
AMS
9963 }
9964 }
9965
9966 ret->data = d;
9967 }
9968 else
9969 ret->data = NULL;
9970
a02a5408 9971 Newx(ret->offsets, 2*len+1, U32);
d2f185dc
AMS
9972 Copy(r->offsets, ret->offsets, 2*len+1, U32);
9973
e01c5899 9974 ret->precomp = SAVEPVN(r->precomp, r->prelen);
d2f185dc
AMS
9975 ret->refcnt = r->refcnt;
9976 ret->minlen = r->minlen;
9977 ret->prelen = r->prelen;
9978 ret->nparens = r->nparens;
9979 ret->lastparen = r->lastparen;
9980 ret->lastcloseparen = r->lastcloseparen;
9981 ret->reganch = r->reganch;
9982
70612e96
RG
9983 ret->sublen = r->sublen;
9984
9985 if (RX_MATCH_COPIED(ret))
e01c5899 9986 ret->subbeg = SAVEPVN(r->subbeg, r->sublen);
70612e96
RG
9987 else
9988 ret->subbeg = Nullch;
f8c7b90f 9989#ifdef PERL_OLD_COPY_ON_WRITE
9a26048b
NC
9990 ret->saved_copy = Nullsv;
9991#endif
70612e96 9992
d2f185dc
AMS
9993 ptr_table_store(PL_ptr_table, r, ret);
9994 return ret;
1d7c1841
GS
9995}
9996
d2d73c3e 9997/* duplicate a file handle */
645c22ef 9998
1d7c1841 9999PerlIO *
a8fc9800 10000Perl_fp_dup(pTHX_ PerlIO *fp, char type, CLONE_PARAMS *param)
1d7c1841
GS
10001{
10002 PerlIO *ret;
53c1dcc0
AL
10003
10004 PERL_UNUSED_ARG(type);
73d840c0 10005
1d7c1841
GS
10006 if (!fp)
10007 return (PerlIO*)NULL;
10008
10009 /* look for it in the table first */
10010 ret = (PerlIO*)ptr_table_fetch(PL_ptr_table, fp);
10011 if (ret)
10012 return ret;
10013
10014 /* create anew and remember what it is */
ecdeb87c 10015 ret = PerlIO_fdupopen(aTHX_ fp, param, PERLIO_DUP_CLONE);
1d7c1841
GS
10016 ptr_table_store(PL_ptr_table, fp, ret);
10017 return ret;
10018}
10019
645c22ef
DM
10020/* duplicate a directory handle */
10021
1d7c1841
GS
10022DIR *
10023Perl_dirp_dup(pTHX_ DIR *dp)
10024{
10025 if (!dp)
10026 return (DIR*)NULL;
10027 /* XXX TODO */
10028 return dp;
10029}
10030
ff276b08 10031/* duplicate a typeglob */
645c22ef 10032
1d7c1841 10033GP *
a8fc9800 10034Perl_gp_dup(pTHX_ GP *gp, CLONE_PARAMS* param)
1d7c1841
GS
10035{
10036 GP *ret;
10037 if (!gp)
10038 return (GP*)NULL;
10039 /* look for it in the table first */
10040 ret = (GP*)ptr_table_fetch(PL_ptr_table, gp);
10041 if (ret)
10042 return ret;
10043
10044 /* create anew and remember what it is */
a02a5408 10045 Newxz(ret, 1, GP);
1d7c1841
GS
10046 ptr_table_store(PL_ptr_table, gp, ret);
10047
10048 /* clone */
10049 ret->gp_refcnt = 0; /* must be before any other dups! */
d2d73c3e
AB
10050 ret->gp_sv = sv_dup_inc(gp->gp_sv, param);
10051 ret->gp_io = io_dup_inc(gp->gp_io, param);
10052 ret->gp_form = cv_dup_inc(gp->gp_form, param);
10053 ret->gp_av = av_dup_inc(gp->gp_av, param);
10054 ret->gp_hv = hv_dup_inc(gp->gp_hv, param);
10055 ret->gp_egv = gv_dup(gp->gp_egv, param);/* GvEGV is not refcounted */
10056 ret->gp_cv = cv_dup_inc(gp->gp_cv, param);
1d7c1841 10057 ret->gp_cvgen = gp->gp_cvgen;
1d7c1841
GS
10058 ret->gp_line = gp->gp_line;
10059 ret->gp_file = gp->gp_file; /* points to COP.cop_file */
10060 return ret;
10061}
10062
645c22ef
DM
10063/* duplicate a chain of magic */
10064
1d7c1841 10065MAGIC *
a8fc9800 10066Perl_mg_dup(pTHX_ MAGIC *mg, CLONE_PARAMS* param)
1d7c1841 10067{
cb359b41
JH
10068 MAGIC *mgprev = (MAGIC*)NULL;
10069 MAGIC *mgret;
1d7c1841
GS
10070 if (!mg)
10071 return (MAGIC*)NULL;
10072 /* look for it in the table first */
10073 mgret = (MAGIC*)ptr_table_fetch(PL_ptr_table, mg);
10074 if (mgret)
10075 return mgret;
10076
10077 for (; mg; mg = mg->mg_moremagic) {
10078 MAGIC *nmg;
a02a5408 10079 Newxz(nmg, 1, MAGIC);
cb359b41 10080 if (mgprev)
1d7c1841 10081 mgprev->mg_moremagic = nmg;
cb359b41
JH
10082 else
10083 mgret = nmg;
1d7c1841
GS
10084 nmg->mg_virtual = mg->mg_virtual; /* XXX copy dynamic vtable? */
10085 nmg->mg_private = mg->mg_private;
10086 nmg->mg_type = mg->mg_type;
10087 nmg->mg_flags = mg->mg_flags;
14befaf4 10088 if (mg->mg_type == PERL_MAGIC_qr) {
d2f185dc 10089 nmg->mg_obj = (SV*)re_dup((REGEXP*)mg->mg_obj, param);
1d7c1841 10090 }
05bd4103 10091 else if(mg->mg_type == PERL_MAGIC_backref) {
7fc63493 10092 const AV * const av = (AV*) mg->mg_obj;
fdc9a813
AE
10093 SV **svp;
10094 I32 i;
7fc63493 10095 (void)SvREFCNT_inc(nmg->mg_obj = (SV*)newAV());
fdc9a813
AE
10096 svp = AvARRAY(av);
10097 for (i = AvFILLp(av); i >= 0; i--) {
3a81978b 10098 if (!svp[i]) continue;
fdc9a813
AE
10099 av_push((AV*)nmg->mg_obj,sv_dup(svp[i],param));
10100 }
05bd4103 10101 }
8d2f4536
NC
10102 else if (mg->mg_type == PERL_MAGIC_symtab) {
10103 nmg->mg_obj = mg->mg_obj;
10104 }
1d7c1841
GS
10105 else {
10106 nmg->mg_obj = (mg->mg_flags & MGf_REFCOUNTED)
d2d73c3e
AB
10107 ? sv_dup_inc(mg->mg_obj, param)
10108 : sv_dup(mg->mg_obj, param);
1d7c1841
GS
10109 }
10110 nmg->mg_len = mg->mg_len;
10111 nmg->mg_ptr = mg->mg_ptr; /* XXX random ptr? */
14befaf4 10112 if (mg->mg_ptr && mg->mg_type != PERL_MAGIC_regex_global) {
68795e93 10113 if (mg->mg_len > 0) {
1d7c1841 10114 nmg->mg_ptr = SAVEPVN(mg->mg_ptr, mg->mg_len);
14befaf4
DM
10115 if (mg->mg_type == PERL_MAGIC_overload_table &&
10116 AMT_AMAGIC((AMT*)mg->mg_ptr))
10117 {
1d7c1841
GS
10118 AMT *amtp = (AMT*)mg->mg_ptr;
10119 AMT *namtp = (AMT*)nmg->mg_ptr;
10120 I32 i;
10121 for (i = 1; i < NofAMmeth; i++) {
d2d73c3e 10122 namtp->table[i] = cv_dup_inc(amtp->table[i], param);
1d7c1841
GS
10123 }
10124 }
10125 }
10126 else if (mg->mg_len == HEf_SVKEY)
d2d73c3e 10127 nmg->mg_ptr = (char*)sv_dup_inc((SV*)mg->mg_ptr, param);
1d7c1841 10128 }
68795e93
NIS
10129 if ((mg->mg_flags & MGf_DUP) && mg->mg_virtual && mg->mg_virtual->svt_dup) {
10130 CALL_FPTR(nmg->mg_virtual->svt_dup)(aTHX_ nmg, param);
10131 }
1d7c1841
GS
10132 mgprev = nmg;
10133 }
10134 return mgret;
10135}
10136
645c22ef
DM
10137/* create a new pointer-mapping table */
10138
1d7c1841
GS
10139PTR_TBL_t *
10140Perl_ptr_table_new(pTHX)
10141{
10142 PTR_TBL_t *tbl;
a02a5408 10143 Newxz(tbl, 1, PTR_TBL_t);
1d7c1841
GS
10144 tbl->tbl_max = 511;
10145 tbl->tbl_items = 0;
a02a5408 10146 Newxz(tbl->tbl_ary, tbl->tbl_max + 1, PTR_TBL_ENT_t*);
1d7c1841
GS
10147 return tbl;
10148}
10149
/* Hash a pointer for the ptr table by discarding its low-order bits:
 * three bits when pointers are 8 bytes wide, two bits otherwise. */
#if (PTRSIZE == 8)
#  define PTR_TABLE_HASH_SHIFT 3
#else
#  define PTR_TABLE_HASH_SHIFT 2
#endif
#define PTR_TABLE_HASH(ptr) (PTR2UV(ptr) >> PTR_TABLE_HASH_SHIFT)

/* Release one ptr-table entry via del_body_type(). */
#define del_pte(p)     del_body_type(p, struct ptr_tbl_ent, pte)
32e691d0 10157
645c22ef
DM
10158/* map an existing pointer using a table */
10159
1d7c1841 10160void *
53c1dcc0 10161Perl_ptr_table_fetch(pTHX_ PTR_TBL_t *tbl, const void *sv)
1d7c1841
GS
10162{
10163 PTR_TBL_ENT_t *tblent;
4373e329 10164 const UV hash = PTR_TABLE_HASH(sv);
1d7c1841
GS
10165 assert(tbl);
10166 tblent = tbl->tbl_ary[hash & tbl->tbl_max];
10167 for (; tblent; tblent = tblent->next) {
10168 if (tblent->oldval == sv)
10169 return tblent->newval;
10170 }
10171 return (void*)NULL;
10172}
10173
645c22ef
DM
10174/* add a new entry to a pointer-mapping table */
10175
1d7c1841 10176void
53c1dcc0 10177Perl_ptr_table_store(pTHX_ PTR_TBL_t *tbl, const void *oldv, void *newv)
1d7c1841
GS
10178{
10179 PTR_TBL_ENT_t *tblent, **otblent;
10180 /* XXX this may be pessimal on platforms where pointers aren't good
10181 * hash values e.g. if they grow faster in the most significant
10182 * bits */
4373e329 10183 const UV hash = PTR_TABLE_HASH(oldv);
14cade97 10184 bool empty = 1;
1d7c1841
GS
10185
10186 assert(tbl);
10187 otblent = &tbl->tbl_ary[hash & tbl->tbl_max];
14cade97 10188 for (tblent = *otblent; tblent; empty=0, tblent = tblent->next) {
1d7c1841
GS
10189 if (tblent->oldval == oldv) {
10190 tblent->newval = newv;
1d7c1841
GS
10191 return;
10192 }
10193 }
08742458
NC
10194 new_body_inline(tblent, (void**)&PL_pte_arenaroot, (void**)&PL_pte_root,
10195 sizeof(struct ptr_tbl_ent));
1d7c1841
GS
10196 tblent->oldval = oldv;
10197 tblent->newval = newv;
10198 tblent->next = *otblent;
10199 *otblent = tblent;
10200 tbl->tbl_items++;
14cade97 10201 if (!empty && tbl->tbl_items > tbl->tbl_max)
1d7c1841
GS
10202 ptr_table_split(tbl);
10203}
10204
645c22ef
DM
10205/* double the hash bucket size of an existing ptr table */
10206
1d7c1841
GS
10207void
10208Perl_ptr_table_split(pTHX_ PTR_TBL_t *tbl)
10209{
10210 PTR_TBL_ENT_t **ary = tbl->tbl_ary;
4373e329 10211 const UV oldsize = tbl->tbl_max + 1;
1d7c1841
GS
10212 UV newsize = oldsize * 2;
10213 UV i;
10214
10215 Renew(ary, newsize, PTR_TBL_ENT_t*);
10216 Zero(&ary[oldsize], newsize-oldsize, PTR_TBL_ENT_t*);
10217 tbl->tbl_max = --newsize;
10218 tbl->tbl_ary = ary;
10219 for (i=0; i < oldsize; i++, ary++) {
10220 PTR_TBL_ENT_t **curentp, **entp, *ent;
10221 if (!*ary)
10222 continue;
10223 curentp = ary + oldsize;
10224 for (entp = ary, ent = *ary; ent; ent = *entp) {
134ca3d6 10225 if ((newsize & PTR_TABLE_HASH(ent->oldval)) != i) {
1d7c1841
GS
10226 *entp = ent->next;
10227 ent->next = *curentp;
10228 *curentp = ent;
10229 continue;
10230 }
10231 else
10232 entp = &ent->next;
10233 }
10234 }
10235}
10236
645c22ef
DM
10237/* remove all the entries from a ptr table */
10238
a0739874
DM
10239void
10240Perl_ptr_table_clear(pTHX_ PTR_TBL_t *tbl)
10241{
10242 register PTR_TBL_ENT_t **array;
10243 register PTR_TBL_ENT_t *entry;
a0739874
DM
10244 UV riter = 0;
10245 UV max;
10246
10247 if (!tbl || !tbl->tbl_items) {
10248 return;
10249 }
10250
10251 array = tbl->tbl_ary;
10252 entry = array[0];
10253 max = tbl->tbl_max;
10254
10255 for (;;) {
10256 if (entry) {
4373e329 10257 PTR_TBL_ENT_t *oentry = entry;
a0739874 10258 entry = entry->next;
437a6bf1 10259 del_pte(oentry);
a0739874
DM
10260 }
10261 if (!entry) {
10262 if (++riter > max) {
10263 break;
10264 }
10265 entry = array[riter];
10266 }
10267 }
10268
10269 tbl->tbl_items = 0;
10270}
10271
645c22ef
DM
10272/* clear and free a ptr table */
10273
a0739874
DM
10274void
10275Perl_ptr_table_free(pTHX_ PTR_TBL_t *tbl)
10276{
10277 if (!tbl) {
10278 return;
10279 }
10280 ptr_table_clear(tbl);
10281 Safefree(tbl->tbl_ary);
10282 Safefree(tbl);
10283}
10284
5bd07a3d 10285
83841fad
NIS
10286void
10287Perl_rvpv_dup(pTHX_ SV *dstr, SV *sstr, CLONE_PARAMS* param)
10288{
10289 if (SvROK(sstr)) {
b162af07
SP
10290 SvRV_set(dstr, SvWEAKREF(sstr)
10291 ? sv_dup(SvRV(sstr), param)
10292 : sv_dup_inc(SvRV(sstr), param));
f880fe2f 10293
83841fad 10294 }
3f7c398e 10295 else if (SvPVX_const(sstr)) {
83841fad
NIS
10296 /* Has something there */
10297 if (SvLEN(sstr)) {
68795e93 10298 /* Normal PV - clone whole allocated space */
3f7c398e 10299 SvPV_set(dstr, SAVEPVN(SvPVX_const(sstr), SvLEN(sstr)-1));
d3d0e6f1
NC
10300 if (SvREADONLY(sstr) && SvFAKE(sstr)) {
10301 /* Not that normal - actually sstr is copy on write.
10302 But we are a true, independant SV, so: */
10303 SvREADONLY_off(dstr);
10304 SvFAKE_off(dstr);
10305 }
68795e93 10306 }
83841fad
NIS
10307 else {
10308 /* Special case - not normally malloced for some reason */
ef10be65
NC
10309 if ((SvREADONLY(sstr) && SvFAKE(sstr))) {
10310 /* A "shared" PV - clone it as "shared" PV */
10311 SvPV_set(dstr,
10312 HEK_KEY(hek_dup(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr)),
10313 param)));
83841fad
NIS
10314 }
10315 else {
10316 /* Some other special case - random pointer */
f880fe2f 10317 SvPV_set(dstr, SvPVX(sstr));
d3d0e6f1 10318 }
83841fad
NIS
10319 }
10320 }
10321 else {
10322 /* Copy the Null */
f880fe2f 10323 if (SvTYPE(dstr) == SVt_RV)
b162af07 10324 SvRV_set(dstr, NULL);
f880fe2f
SP
10325 else
10326 SvPV_set(dstr, 0);
83841fad
NIS
10327 }
10328}
10329
662fb8b2
NC
10330/* duplicate an SV of any type (including AV, HV etc) */
10331
/* Duplicate sstr and return the copy.
 *
 * Returns Nullsv when sstr is NULL or its type field equals SVTYPEMASK.
 * If PL_ptr_table already maps sstr, the mapped SV is returned unchanged.
 * When param->flags has CLONEf_JOIN_IN and sstr is a named hash, the result
 * of gv_stashpv() for that name is returned instead of a clone.
 *
 * Otherwise a new SV head is allocated and entered in PL_ptr_table before
 * any of its contents are duplicated, its flags are copied from sstr with
 * SVf_OOK removed, and its reference count is set to 0.  The body is then
 * built according to SvTYPE(sstr).  Objects whose stash lacks
 * SVphv_CLONEABLE are returned with the type bits and the object flag
 * cleared. */
1d7c1841 10332SV *
a8fc9800 10333Perl_sv_dup(pTHX_ SV *sstr, CLONE_PARAMS* param)
1d7c1841 10334{
27da23d5 10335 dVAR;
1d7c1841
GS
10336 SV *dstr;
10337
10338 if (!sstr || SvTYPE(sstr) == SVTYPEMASK)
10339 return Nullsv;
10340 /* look for it in the table first */
10341 dstr = (SV*)ptr_table_fetch(PL_ptr_table, sstr);
10342 if (dstr)
10343 return dstr;
10344
0405e91e
AB
10345 if(param->flags & CLONEf_JOIN_IN) {
10346 /** We are joining here so we don't want to clone
10347 something that is bad **/
bfcb3514 10348 const char *hvname;
0405e91e
AB
10349
10350 if(SvTYPE(sstr) == SVt_PVHV &&
bfcb3514 10351 (hvname = HvNAME_get(sstr))) {
0405e91e 10352 /** don't clone stashes if they already exist **/
bfcb3514 10353 HV* old_stash = gv_stashpv(hvname,0);
0405e91e
AB
10354 return (SV*) old_stash;
10355 }
10356 }
10357
1d7c1841
GS
10358 /* create anew and remember what it is */
10359 new_SV(dstr);
fd0854ff
DM
10360
10361#ifdef DEBUG_LEAKING_SCALARS
10362 dstr->sv_debug_optype = sstr->sv_debug_optype;
10363 dstr->sv_debug_line = sstr->sv_debug_line;
10364 dstr->sv_debug_inpad = sstr->sv_debug_inpad;
10365 dstr->sv_debug_cloned = 1;
10366# ifdef NETWARE
10367 dstr->sv_debug_file = savepv(sstr->sv_debug_file);
10368# else
10369 dstr->sv_debug_file = savesharedpv(sstr->sv_debug_file);
10370# endif
10371#endif
10372
/* register the mapping now, before any contents are duplicated
 * (presumably so that recursive sv_dup calls reaching sstr again find
 * dstr instead of cloning a second time) */
1d7c1841
GS
10373 ptr_table_store(PL_ptr_table, sstr, dstr);
10374
10375 /* clone */
10376 SvFLAGS(dstr) = SvFLAGS(sstr);
10377 SvFLAGS(dstr) &= ~SVf_OOK; /* don't propagate OOK hack */
10378 SvREFCNT(dstr) = 0; /* must be before any other dups! */
10379
10380#ifdef DEBUGGING
3f7c398e 10381 if (SvANY(sstr) && PL_watch_pvx && SvPVX_const(sstr) == PL_watch_pvx)
1d7c1841 10382 PerlIO_printf(Perl_debug_log, "watch at %p hit, found string \"%s\"\n",
3f7c398e 10383 PL_watch_pvx, SvPVX_const(sstr));
1d7c1841
GS
10384#endif
10385
9660f481
DM
10386 /* don't clone objects whose class has asked us not to */
10387 if (SvOBJECT(sstr) && ! (SvFLAGS(SvSTASH(sstr)) & SVphv_CLONEABLE)) {
10388 SvFLAGS(dstr) &= ~SVTYPEMASK;
10389 SvOBJECT_off(dstr);
10390 return dstr;
10391 }
10392
/* the four simplest types are handled directly; every other type goes
 * through the default branch, which allocates and copies a full body */
1d7c1841
GS
10393 switch (SvTYPE(sstr)) {
10394 case SVt_NULL:
10395 SvANY(dstr) = NULL;
10396 break;
10397 case SVt_IV:
339049b0 10398 SvANY(dstr) = (XPVIV*)((char*)&(dstr->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
45977657 10399 SvIV_set(dstr, SvIVX(sstr));
1d7c1841
GS
10400 break;
10401 case SVt_NV:
10402 SvANY(dstr) = new_XNV();
9d6ce603 10403 SvNV_set(dstr, SvNVX(sstr));
1d7c1841
GS
10404 break;
10405 case SVt_RV:
339049b0 10406 SvANY(dstr) = &(dstr->sv_u.svu_rv);
83841fad 10407 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
1d7c1841 10408 break;
662fb8b2
NC
10409 default:
10410 {
10411 /* These are all the types that need complex bodies allocating. */
10412 size_t new_body_length;
10413 size_t new_body_offset = 0;
10414 void **new_body_arena;
10415 void **new_body_arenaroot;
10416 void *new_body;
10417
/* first pass over the type: pick the arena, length and offset of the
 * body.  PVIO and PVFM allocate directly and break out; all other cases
 * jump to the shared new_body label below. */
10418 switch (SvTYPE(sstr)) {
10419 default:
10420 Perl_croak(aTHX_ "Bizarre SvTYPE [%" IVdf "]",
10421 (IV)SvTYPE(sstr));
10422 break;
10423
10424 case SVt_PVIO:
10425 new_body = new_XPVIO();
10426 new_body_length = sizeof(XPVIO);
10427 break;
10428 case SVt_PVFM:
10429 new_body = new_XPVFM();
10430 new_body_length = sizeof(XPVFM);
10431 break;
10432
10433 case SVt_PVHV:
10434 new_body_arena = (void **) &PL_xpvhv_root;
10435 new_body_arenaroot = (void **) &PL_xpvhv_arenaroot;
10436 new_body_offset = STRUCT_OFFSET(XPVHV, xhv_fill)
10437 - STRUCT_OFFSET(xpvhv_allocated, xhv_fill);
10438 new_body_length = STRUCT_OFFSET(XPVHV, xmg_stash)
10439 + sizeof (((XPVHV*)SvANY(sstr))->xmg_stash)
10440 - new_body_offset;
10441 goto new_body;
10442 case SVt_PVAV:
/* NOTE(review): the length below is derived from XPVHV's xmg_stash even
 * though this is the array case - presumably XPVAV and XPVHV place
 * xmg_stash identically; confirm against the struct definitions. */
10443 new_body_arena = (void **) &PL_xpvav_root;
10444 new_body_arenaroot = (void **) &PL_xpvav_arenaroot;
10445 new_body_offset = STRUCT_OFFSET(XPVAV, xav_fill)
10446 - STRUCT_OFFSET(xpvav_allocated, xav_fill);
10447 new_body_length = STRUCT_OFFSET(XPVHV, xmg_stash)
10448 + sizeof (((XPVHV*)SvANY(sstr))->xmg_stash)
10449 - new_body_offset;
10450 goto new_body;
10451 case SVt_PVBM:
10452 new_body_length = sizeof(XPVBM);
10453 new_body_arena = (void **) &PL_xpvbm_root;
10454 new_body_arenaroot = (void **) &PL_xpvbm_arenaroot;
10455 goto new_body;
10456 case SVt_PVGV:
10457 if (GvUNIQUE((GV*)sstr)) {
0abe3f7c 10458 /* Do sharing here. */
662fb8b2
NC
10459 }
10460 new_body_length = sizeof(XPVGV);
10461 new_body_arena = (void **) &PL_xpvgv_root;
10462 new_body_arenaroot = (void **) &PL_xpvgv_arenaroot;
10463 goto new_body;
10464 case SVt_PVCV:
10465 new_body_length = sizeof(XPVCV);
10466 new_body_arena = (void **) &PL_xpvcv_root;
10467 new_body_arenaroot = (void **) &PL_xpvcv_arenaroot;
10468 goto new_body;
10469 case SVt_PVLV:
10470 new_body_length = sizeof(XPVLV);
10471 new_body_arena = (void **) &PL_xpvlv_root;
10472 new_body_arenaroot = (void **) &PL_xpvlv_arenaroot;
10473 goto new_body;
10474 case SVt_PVMG:
10475 new_body_length = sizeof(XPVMG);
10476 new_body_arena = (void **) &PL_xpvmg_root;
10477 new_body_arenaroot = (void **) &PL_xpvmg_arenaroot;
10478 goto new_body;
10479 case SVt_PVNV:
10480 new_body_length = sizeof(XPVNV);
10481 new_body_arena = (void **) &PL_xpvnv_root;
10482 new_body_arenaroot = (void **) &PL_xpvnv_arenaroot;
10483 goto new_body;
10484 case SVt_PVIV:
10485 new_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur)
10486 - STRUCT_OFFSET(xpviv_allocated, xpv_cur);
10487 new_body_length = sizeof(XPVIV) - new_body_offset;
10488 new_body_arena = (void **) &PL_xpviv_root;
10489 new_body_arenaroot = (void **) &PL_xpviv_arenaroot;
10490 goto new_body;
10491 case SVt_PV:
10492 new_body_offset = STRUCT_OFFSET(XPV, xpv_cur)
10493 - STRUCT_OFFSET(xpv_allocated, xpv_cur);
10494 new_body_length = sizeof(XPV) - new_body_offset;
10495 new_body_arena = (void **) &PL_xpv_root;
10496 new_body_arenaroot = (void **) &PL_xpv_arenaroot;
10497 new_body:
10498 assert(new_body_length);
10499#ifndef PURIFY
08742458
NC
10500 new_body_inline(new_body, new_body_arenaroot, new_body_arena,
10501 new_body_length);
/* step the pointer back by the offset so that adding new_body_offset
 * again (as the Copy below does) lands on the allocated storage */
10502 new_body = (void*)((char*)new_body - new_body_offset);
662fb8b2
NC
10503#else
10504 /* We always allocated the full length item with PURIFY */
10505 new_body_length += new_body_offset;
10506 new_body_offset = 0;
10507 new_body = my_safemalloc(new_body_length);
5bd07a3d 10508#endif
1d7c1841 10509 }
662fb8b2
NC
10510 assert(new_body);
10511 SvANY(dstr) = new_body;
10512
10513 Copy(((char*)SvANY(sstr)) + new_body_offset,
10514 ((char*)SvANY(dstr)) + new_body_offset,
10515 new_body_length, char);
10516
10517 if (SvTYPE(sstr) != SVt_PVAV && SvTYPE(sstr) != SVt_PVHV)
10518 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
10519
10520 /* The Copy above means that all the source (unduplicated) pointers
10521 are now in the destination. We can check the flags and the
10522 pointers in either, but it's possible that there's less cache
10523 missing by always going for the destination.
10524 FIXME - instrument and check that assumption */
10525 if (SvTYPE(sstr) >= SVt_PVMG) {
10526 if (SvMAGIC(dstr))
10527 SvMAGIC_set(dstr, mg_dup(SvMAGIC(dstr), param));
10528 if (SvSTASH(dstr))
10529 SvSTASH_set(dstr, hv_dup_inc(SvSTASH(dstr), param));
1d7c1841 10530 }
662fb8b2
NC
10531
/* second pass over the type: replace the source pointers that the Copy
 * above left in the new body with their duplicates */
10532 switch (SvTYPE(sstr)) {
10533 case SVt_PV:
10534 break;
10535 case SVt_PVIV:
10536 break;
10537 case SVt_PVNV:
10538 break;
10539 case SVt_PVMG:
10540 break;
10541 case SVt_PVBM:
10542 break;
10543 case SVt_PVLV:
10544 /* XXX LvTARGOFF sometimes holds PMOP* when DEBUGGING */
10545 if (LvTYPE(dstr) == 't') /* for tie: unrefcnted fake (SV**) */
10546 LvTARG(dstr) = dstr;
10547 else if (LvTYPE(dstr) == 'T') /* for tie: fake HE */
10548 LvTARG(dstr) = (SV*)he_dup((HE*)LvTARG(dstr), 0, param);
10549 else
10550 LvTARG(dstr) = sv_dup_inc(LvTARG(dstr), param);
10551 break;
10552 case SVt_PVGV:
10553 GvNAME(dstr) = SAVEPVN(GvNAME(dstr), GvNAMELEN(dstr));
e15faf7d
NC
10554 GvSTASH(dstr) = hv_dup(GvSTASH(dstr), param);
10555 /* Don't call sv_add_backref here as it's going to be created
10556 as part of the magic cloning of the symbol table. */
662fb8b2
NC
10557 GvGP(dstr) = gp_dup(GvGP(dstr), param);
10558 (void)GpREFCNT_inc(GvGP(dstr));
10559 break;
10560 case SVt_PVIO:
10561 IoIFP(dstr) = fp_dup(IoIFP(dstr), IoTYPE(dstr), param);
/* IoOFP(dstr) still holds the source pointer here, so comparing it with
 * IoIFP(sstr) detects a handle whose input and output streams are the
 * same; in that case the already duplicated input stream is reused */
10562 if (IoOFP(dstr) == IoIFP(sstr))
10563 IoOFP(dstr) = IoIFP(dstr);
10564 else
10565 IoOFP(dstr) = fp_dup(IoOFP(dstr), IoTYPE(dstr), param);
10566 /* PL_rsfp_filters entries have fake IoDIRP() */
10567 if (IoDIRP(dstr) && !(IoFLAGS(dstr) & IOf_FAKE_DIRP))
10568 IoDIRP(dstr) = dirp_dup(IoDIRP(dstr));
10569 if(IoFLAGS(dstr) & IOf_FAKE_DIRP) {
10570 /* I have no idea why fake dirp (rsfps)
10571 should be treated differently but otherwise
10572 we end up with leaks -- sky*/
10573 IoTOP_GV(dstr) = gv_dup_inc(IoTOP_GV(dstr), param);
10574 IoFMT_GV(dstr) = gv_dup_inc(IoFMT_GV(dstr), param);
10575 IoBOTTOM_GV(dstr) = gv_dup_inc(IoBOTTOM_GV(dstr), param);
10576 } else {
10577 IoTOP_GV(dstr) = gv_dup(IoTOP_GV(dstr), param);
10578 IoFMT_GV(dstr) = gv_dup(IoFMT_GV(dstr), param);
10579 IoBOTTOM_GV(dstr) = gv_dup(IoBOTTOM_GV(dstr), param);
10580 }
10581 IoTOP_NAME(dstr) = SAVEPV(IoTOP_NAME(dstr));
10582 IoFMT_NAME(dstr) = SAVEPV(IoFMT_NAME(dstr));
10583 IoBOTTOM_NAME(dstr) = SAVEPV(IoBOTTOM_NAME(dstr));
10584 break;
10585 case SVt_PVAV:
10586 if (AvARRAY((AV*)sstr)) {
10587 SV **dst_ary, **src_ary;
10588 SSize_t items = AvFILLp((AV*)sstr) + 1;
10589
10590 src_ary = AvARRAY((AV*)sstr);
a02a5408 10591 Newxz(dst_ary, AvMAX((AV*)sstr)+1, SV*);
662fb8b2
NC
10592 ptr_table_store(PL_ptr_table, src_ary, dst_ary);
10593 SvPV_set(dstr, (char*)dst_ary);
10594 AvALLOC((AV*)dstr) = dst_ary;
/* elements of a "real" array are duplicated with a reference count
 * bump, elements of other arrays without one */
10595 if (AvREAL((AV*)sstr)) {
10596 while (items-- > 0)
10597 *dst_ary++ = sv_dup_inc(*src_ary++, param);
10598 }
10599 else {
10600 while (items-- > 0)
10601 *dst_ary++ = sv_dup(*src_ary++, param);
10602 }
/* slots past the fill pointer, up to AvMAX, are set to &PL_sv_undef */
10603 items = AvMAX((AV*)sstr) - AvFILLp((AV*)sstr);
10604 while (items-- > 0) {
10605 *dst_ary++ = &PL_sv_undef;
10606 }
bfcb3514 10607 }
662fb8b2
NC
10608 else {
10609 SvPV_set(dstr, Nullch);
10610 AvALLOC((AV*)dstr) = (SV**)NULL;
b79f7545 10611 }
662fb8b2
NC
10612 break;
10613 case SVt_PVHV:
10614 {
10615 HEK *hvname = 0;
10616
10617 if (HvARRAY((HV*)sstr)) {
10618 STRLEN i = 0;
10619 const bool sharekeys = !!HvSHAREKEYS(sstr);
10620 XPVHV * const dxhv = (XPVHV*)SvANY(dstr);
10621 XPVHV * const sxhv = (XPVHV*)SvANY(sstr);
10622 char *darray;
/* one allocation holds the bucket array and, when the source has the
 * OOK flag set, a struct xpvhv_aux after it */
a02a5408 10623 Newx(darray, PERL_HV_ARRAY_ALLOC_BYTES(dxhv->xhv_max+1)
662fb8b2
NC
10624 + (SvOOK(sstr) ? sizeof(struct xpvhv_aux) : 0),
10625 char);
10626 HvARRAY(dstr) = (HE**)darray;
10627 while (i <= sxhv->xhv_max) {
5c4138a0 10628 const HE *source = HvARRAY(sstr)[i];
662fb8b2
NC
10629 HvARRAY(dstr)[i] = source
10630 ? he_dup(source, sharekeys, param) : 0;
10631 ++i;
10632 }
10633 if (SvOOK(sstr)) {
10634 struct xpvhv_aux *saux = HvAUX(sstr);
10635 struct xpvhv_aux *daux = HvAUX(dstr);
10636 /* This flag isn't copied. */
10637 /* SvOOK_on(hv) attacks the IV flags. */
10638 SvFLAGS(dstr) |= SVf_OOK;
10639
10640 hvname = saux->xhv_name;
dd690478
NC
10641 daux->xhv_name
10642 = hvname ? hek_dup(hvname, param) : hvname;
662fb8b2
NC
10643
10644 daux->xhv_riter = saux->xhv_riter;
10645 daux->xhv_eiter = saux->xhv_eiter
dd690478
NC
10646 ? he_dup(saux->xhv_eiter,
10647 (bool)!!HvSHAREKEYS(sstr), param) : 0;
662fb8b2
NC
10648 }
10649 }
10650 else {
10651 SvPV_set(dstr, Nullch);
10652 }
10653 /* Record stashes for possible cloning in Perl_clone(). */
10654 if(hvname)
10655 av_push(param->stashes, dstr);
10656 }
10657 break;
10658 case SVt_PVFM:
10659 case SVt_PVCV:
10660 /* NOTE: not refcounted */
10661 CvSTASH(dstr) = hv_dup(CvSTASH(dstr), param);
10662 OP_REFCNT_LOCK;
10663 CvROOT(dstr) = OpREFCNT_inc(CvROOT(dstr));
10664 OP_REFCNT_UNLOCK;
10665 if (CvCONST(dstr)) {
10666 CvXSUBANY(dstr).any_ptr = GvUNIQUE(CvGV(dstr)) ?
10667 SvREFCNT_inc(CvXSUBANY(dstr).any_ptr) :
10668 sv_dup_inc((SV *)CvXSUBANY(dstr).any_ptr, param);
10669 }
10670 /* don't dup if copying back - CvGV isn't refcounted, so the
10671 * duped GV may never be freed. A bit of a hack! DAPM */
10672 CvGV(dstr) = (param->flags & CLONEf_JOIN_IN) ?
10673 Nullgv : gv_dup(CvGV(dstr), param) ;
10674 if (!(param->flags & CLONEf_COPY_STACKS)) {
10675 CvDEPTH(dstr) = 0;
10676 }
10677 PAD_DUP(CvPADLIST(dstr), CvPADLIST(sstr), param);
10678 CvOUTSIDE(dstr) =
10679 CvWEAKOUTSIDE(sstr)
10680 ? cv_dup( CvOUTSIDE(dstr), param)
10681 : cv_dup_inc(CvOUTSIDE(dstr), param);
10682 if (!CvXSUB(dstr))
10683 CvFILE(dstr) = SAVEPV(CvFILE(dstr));
10684 break;
bfcb3514 10685 }
1d7c1841 10686 }
1d7c1841
GS
10687 }
10688
/* count the clone as an object unless it is an IO handle */
10689 if (SvOBJECT(dstr) && SvTYPE(dstr) != SVt_PVIO)
10690 ++PL_sv_objcount;
10691
10692 return dstr;
d2d73c3e 10693 }
1d7c1841 10694
645c22ef
DM
10695/* duplicate a context */
10696
1d7c1841 10697PERL_CONTEXT *
a8fc9800 10698Perl_cx_dup(pTHX_ PERL_CONTEXT *cxs, I32 ix, I32 max, CLONE_PARAMS* param)
1d7c1841
GS
10699{
10700 PERL_CONTEXT *ncxs;
10701
10702 if (!cxs)
10703 return (PERL_CONTEXT*)NULL;
10704
10705 /* look for it in the table first */
10706 ncxs = (PERL_CONTEXT*)ptr_table_fetch(PL_ptr_table, cxs);
10707 if (ncxs)
10708 return ncxs;
10709
10710 /* create anew and remember what it is */
a02a5408 10711 Newxz(ncxs, max + 1, PERL_CONTEXT);
1d7c1841
GS
10712 ptr_table_store(PL_ptr_table, cxs, ncxs);
10713
10714 while (ix >= 0) {
10715 PERL_CONTEXT *cx = &cxs[ix];
10716 PERL_CONTEXT *ncx = &ncxs[ix];
10717 ncx->cx_type = cx->cx_type;
10718 if (CxTYPE(cx) == CXt_SUBST) {
10719 Perl_croak(aTHX_ "Cloning substitution context is unimplemented");
10720 }
10721 else {
10722 ncx->blk_oldsp = cx->blk_oldsp;
10723 ncx->blk_oldcop = cx->blk_oldcop;
1d7c1841
GS
10724 ncx->blk_oldmarksp = cx->blk_oldmarksp;
10725 ncx->blk_oldscopesp = cx->blk_oldscopesp;
10726 ncx->blk_oldpm = cx->blk_oldpm;
10727 ncx->blk_gimme = cx->blk_gimme;
10728 switch (CxTYPE(cx)) {
10729 case CXt_SUB:
10730 ncx->blk_sub.cv = (cx->blk_sub.olddepth == 0
d2d73c3e
AB
10731 ? cv_dup_inc(cx->blk_sub.cv, param)
10732 : cv_dup(cx->blk_sub.cv,param));
1d7c1841 10733 ncx->blk_sub.argarray = (cx->blk_sub.hasargs
d2d73c3e 10734 ? av_dup_inc(cx->blk_sub.argarray, param)
1d7c1841 10735 : Nullav);
d2d73c3e 10736 ncx->blk_sub.savearray = av_dup_inc(cx->blk_sub.savearray, param);
1d7c1841
GS
10737 ncx->blk_sub.olddepth = cx->blk_sub.olddepth;
10738 ncx->blk_sub.hasargs = cx->blk_sub.hasargs;
10739 ncx->blk_sub.lval = cx->blk_sub.lval;
f39bc417 10740 ncx->blk_sub.retop = cx->blk_sub.retop;
1d7c1841
GS
10741 break;
10742 case CXt_EVAL:
10743 ncx->blk_eval.old_in_eval = cx->blk_eval.old_in_eval;
10744 ncx->blk_eval.old_op_type = cx->blk_eval.old_op_type;
b47cad08 10745 ncx->blk_eval.old_namesv = sv_dup_inc(cx->blk_eval.old_namesv, param);
1d7c1841 10746 ncx->blk_eval.old_eval_root = cx->blk_eval.old_eval_root;
d2d73c3e 10747 ncx->blk_eval.cur_text = sv_dup(cx->blk_eval.cur_text, param);
f39bc417 10748 ncx->blk_eval.retop = cx->blk_eval.retop;
1d7c1841
GS
10749 break;
10750 case CXt_LOOP:
10751 ncx->blk_loop.label = cx->blk_loop.label;
10752 ncx->blk_loop.resetsp = cx->blk_loop.resetsp;
10753 ncx->blk_loop.redo_op = cx->blk_loop.redo_op;
10754 ncx->blk_loop.next_op = cx->blk_loop.next_op;
10755 ncx->blk_loop.last_op = cx->blk_loop.last_op;
10756 ncx->blk_loop.iterdata = (CxPADLOOP(cx)
10757 ? cx->blk_loop.iterdata
d2d73c3e 10758 : gv_dup((GV*)cx->blk_loop.iterdata, param));
f3548bdc
DM
10759 ncx->blk_loop.oldcomppad
10760 = (PAD*)ptr_table_fetch(PL_ptr_table,
10761 cx->blk_loop.oldcomppad);
d2d73c3e
AB
10762 ncx->blk_loop.itersave = sv_dup_inc(cx->blk_loop.itersave, param);
10763 ncx->blk_loop.iterlval = sv_dup_inc(cx->blk_loop.iterlval, param);
10764 ncx->blk_loop.iterary = av_dup_inc(cx->blk_loop.iterary, param);
1d7c1841
GS
10765 ncx->blk_loop.iterix = cx->blk_loop.iterix;
10766 ncx->blk_loop.itermax = cx->blk_loop.itermax;
10767 break;
10768 case CXt_FORMAT:
d2d73c3e
AB
10769 ncx->blk_sub.cv = cv_dup(cx->blk_sub.cv, param);
10770 ncx->blk_sub.gv = gv_dup(cx->blk_sub.gv, param);
10771 ncx->blk_sub.dfoutgv = gv_dup_inc(cx->blk_sub.dfoutgv, param);
1d7c1841 10772 ncx->blk_sub.hasargs = cx->blk_sub.hasargs;
f39bc417 10773 ncx->blk_sub.retop = cx->blk_sub.retop;
1d7c1841
GS
10774 break;
10775 case CXt_BLOCK:
10776 case CXt_NULL:
10777 break;
10778 }
10779 }
10780 --ix;
10781 }
10782 return ncxs;
10783}
10784
645c22ef
DM
10785/* duplicate a stack info structure */
10786
1d7c1841 10787PERL_SI *
a8fc9800 10788Perl_si_dup(pTHX_ PERL_SI *si, CLONE_PARAMS* param)
1d7c1841
GS
10789{
10790 PERL_SI *nsi;
10791
10792 if (!si)
10793 return (PERL_SI*)NULL;
10794
10795 /* look for it in the table first */
10796 nsi = (PERL_SI*)ptr_table_fetch(PL_ptr_table, si);
10797 if (nsi)
10798 return nsi;
10799
10800 /* create anew and remember what it is */
a02a5408 10801 Newxz(nsi, 1, PERL_SI);
1d7c1841
GS
10802 ptr_table_store(PL_ptr_table, si, nsi);
10803
d2d73c3e 10804 nsi->si_stack = av_dup_inc(si->si_stack, param);
1d7c1841
GS
10805 nsi->si_cxix = si->si_cxix;
10806 nsi->si_cxmax = si->si_cxmax;
d2d73c3e 10807 nsi->si_cxstack = cx_dup(si->si_cxstack, si->si_cxix, si->si_cxmax, param);
1d7c1841 10808 nsi->si_type = si->si_type;
d2d73c3e
AB
10809 nsi->si_prev = si_dup(si->si_prev, param);
10810 nsi->si_next = si_dup(si->si_next, param);
1d7c1841
GS
10811 nsi->si_markoff = si->si_markoff;
10812
10813 return nsi;
10814}
10815
/* Accessors for walking a save stack by index.  Every POPx macro first
 * decrements ix and then yields the named union member of slot ss[ix];
 * every TOPx macro yields the same member of ss[ix] without changing ix.
 * Because POPx modifies ix, its second argument must be an lvalue. */
10816#define POPINT(ss,ix) ((ss)[--(ix)].any_i32)
10817#define TOPINT(ss,ix) ((ss)[ix].any_i32)
10818#define POPLONG(ss,ix) ((ss)[--(ix)].any_long)
10819#define TOPLONG(ss,ix) ((ss)[ix].any_long)
10820#define POPIV(ss,ix) ((ss)[--(ix)].any_iv)
10821#define TOPIV(ss,ix) ((ss)[ix].any_iv)
38d8b13e
HS
10822#define POPBOOL(ss,ix) ((ss)[--(ix)].any_bool)
10823#define TOPBOOL(ss,ix) ((ss)[ix].any_bool)
1d7c1841
GS
10824#define POPPTR(ss,ix) ((ss)[--(ix)].any_ptr)
10825#define TOPPTR(ss,ix) ((ss)[ix].any_ptr)
10826#define POPDPTR(ss,ix) ((ss)[--(ix)].any_dptr)
10827#define TOPDPTR(ss,ix) ((ss)[ix].any_dptr)
10828#define POPDXPTR(ss,ix) ((ss)[--(ix)].any_dxptr)
10829#define TOPDXPTR(ss,ix) ((ss)[ix].any_dxptr)
10830
10831/* XXXXX todo */
/* For now pv_dup_inc and pv_dup are the same thing: both copy the string
 * with SAVEPV.  svp_dup_inc simply forwards to any_dup. */
10832#define pv_dup_inc(p) SAVEPV(p)
10833#define pv_dup(p) SAVEPV(p)
10834#define svp_dup_inc(p,pp) any_dup(p,pp)
10835
645c22ef
DM
10836/* map any object to the new equivalent - either something in the
10837 * ptr table, or something in the interpreter structure
10838 */
10839
1d7c1841 10840void *
53c1dcc0 10841Perl_any_dup(pTHX_ void *v, const PerlInterpreter *proto_perl)
1d7c1841
GS
10842{
10843 void *ret;
10844
10845 if (!v)
10846 return (void*)NULL;
10847
10848 /* look for it in the table first */
10849 ret = ptr_table_fetch(PL_ptr_table, v);
10850 if (ret)
10851 return ret;
10852
10853 /* see if it is part of the interpreter structure */
10854 if (v >= (void*)proto_perl && v < (void*)(proto_perl+1))
acfe0abc 10855 ret = (void*)(((char*)aTHX) + (((char*)v) - (char*)proto_perl));
05ec9bb3 10856 else {
1d7c1841 10857 ret = v;
05ec9bb3 10858 }
1d7c1841
GS
10859
10860 return ret;
10861}
10862
645c22ef
DM
10863/* duplicate the save stack */
10864
/* Duplicate the save stack of proto_perl and return the new array.
 *
 * The copy is allocated zero-filled with Tsavestack_max slots.  The source
 * is then walked from Tsavestack_ix downwards: each iteration pops a save
 * type code, writes it to the same index in the copy, and then pops that
 * type's operands in the order the switch below lists them, storing each
 * one (duplicated where it is an SV, GV, AV, HV, GP or string, mapped with
 * any_dup where it is a raw address, copied verbatim where it is a plain
 * integer) at the same index in the copy.  An unrecognised type code
 * croaks with "panic: ss_dup inconsistency". */
1d7c1841 10865ANY *
a8fc9800 10866Perl_ss_dup(pTHX_ PerlInterpreter *proto_perl, CLONE_PARAMS* param)
1d7c1841 10867{
53c1dcc0
AL
10868 ANY * const ss = proto_perl->Tsavestack;
10869 const I32 max = proto_perl->Tsavestack_max;
10870 I32 ix = proto_perl->Tsavestack_ix;
1d7c1841
GS
10871 ANY *nss;
10872 SV *sv;
10873 GV *gv;
10874 AV *av;
10875 HV *hv;
10876 void* ptr;
10877 int intval;
10878 long longval;
10879 GP *gp;
10880 IV iv;
c4e33207 10881 char *c = NULL;
1d7c1841 10882 void (*dptr) (void*);
acfe0abc 10883 void (*dxptr) (pTHX_ void*);
1d7c1841 10884
a02a5408 10885 Newxz(nss, max, ANY);
1d7c1841
GS
10886
10887 while (ix > 0) {
/* POPINT has already decremented ix, so TOPINT writes the type code at
 * the index it was just read from */
b464bac0 10888 I32 i = POPINT(ss,ix);
1d7c1841
GS
10889 TOPINT(nss,ix) = i;
10890 switch (i) {
10891 case SAVEt_ITEM: /* normal string */
10892 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10893 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10894 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10895 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10896 break;
10897 case SAVEt_SV: /* scalar reference */
10898 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10899 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10900 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10901 TOPPTR(nss,ix) = gv_dup_inc(gv, param);
1d7c1841 10902 break;
f4dd75d9
GS
10903 case SAVEt_GENERIC_PVREF: /* generic char* */
10904 c = (char*)POPPTR(ss,ix);
10905 TOPPTR(nss,ix) = pv_dup(c);
10906 ptr = POPPTR(ss,ix);
10907 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10908 break;
05ec9bb3
NIS
10909 case SAVEt_SHARED_PVREF: /* char* in shared space */
10910 c = (char*)POPPTR(ss,ix);
10911 TOPPTR(nss,ix) = savesharedpv(c);
10912 ptr = POPPTR(ss,ix);
10913 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10914 break;
1d7c1841
GS
10915 case SAVEt_GENERIC_SVREF: /* generic sv */
10916 case SAVEt_SVREF: /* scalar reference */
10917 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10918 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10919 ptr = POPPTR(ss,ix);
10920 TOPPTR(nss,ix) = svp_dup_inc((SV**)ptr, proto_perl);/* XXXXX */
10921 break;
10922 case SAVEt_AV: /* array reference */
10923 av = (AV*)POPPTR(ss,ix);
d2d73c3e 10924 TOPPTR(nss,ix) = av_dup_inc(av, param);
1d7c1841 10925 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10926 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10927 break;
10928 case SAVEt_HV: /* hash reference */
10929 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 10930 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841 10931 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10932 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10933 break;
10934 case SAVEt_INT: /* int reference */
10935 ptr = POPPTR(ss,ix);
10936 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10937 intval = (int)POPINT(ss,ix);
10938 TOPINT(nss,ix) = intval;
10939 break;
10940 case SAVEt_LONG: /* long reference */
10941 ptr = POPPTR(ss,ix);
10942 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10943 longval = (long)POPLONG(ss,ix);
10944 TOPLONG(nss,ix) = longval;
10945 break;
10946 case SAVEt_I32: /* I32 reference */
10947 case SAVEt_I16: /* I16 reference */
10948 case SAVEt_I8: /* I8 reference */
10949 ptr = POPPTR(ss,ix);
10950 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10951 i = POPINT(ss,ix);
10952 TOPINT(nss,ix) = i;
10953 break;
10954 case SAVEt_IV: /* IV reference */
10955 ptr = POPPTR(ss,ix);
10956 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10957 iv = POPIV(ss,ix);
10958 TOPIV(nss,ix) = iv;
10959 break;
10960 case SAVEt_SPTR: /* SV* reference */
10961 ptr = POPPTR(ss,ix);
10962 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10963 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10964 TOPPTR(nss,ix) = sv_dup(sv, param);
1d7c1841
GS
10965 break;
10966 case SAVEt_VPTR: /* random* reference */
10967 ptr = POPPTR(ss,ix);
10968 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10969 ptr = POPPTR(ss,ix);
10970 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10971 break;
10972 case SAVEt_PPTR: /* char* reference */
10973 ptr = POPPTR(ss,ix);
10974 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10975 c = (char*)POPPTR(ss,ix);
10976 TOPPTR(nss,ix) = pv_dup(c);
10977 break;
10978 case SAVEt_HPTR: /* HV* reference */
10979 ptr = POPPTR(ss,ix);
10980 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10981 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 10982 TOPPTR(nss,ix) = hv_dup(hv, param);
1d7c1841
GS
10983 break;
10984 case SAVEt_APTR: /* AV* reference */
10985 ptr = POPPTR(ss,ix);
10986 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10987 av = (AV*)POPPTR(ss,ix);
d2d73c3e 10988 TOPPTR(nss,ix) = av_dup(av, param);
1d7c1841
GS
10989 break;
10990 case SAVEt_NSTAB:
10991 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10992 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10993 break;
10994 case SAVEt_GP: /* scalar reference */
10995 gp = (GP*)POPPTR(ss,ix);
d2d73c3e 10996 TOPPTR(nss,ix) = gp = gp_dup(gp, param);
1d7c1841
GS
10997 (void)GpREFCNT_inc(gp);
10998 gv = (GV*)POPPTR(ss,ix);
2ed3c8fc 10999 TOPPTR(nss,ix) = gv_dup_inc(gv, param);
1d7c1841
GS
11000 c = (char*)POPPTR(ss,ix);
11001 TOPPTR(nss,ix) = pv_dup(c);
11002 iv = POPIV(ss,ix);
11003 TOPIV(nss,ix) = iv;
11004 iv = POPIV(ss,ix);
11005 TOPIV(nss,ix) = iv;
11006 break;
11007 case SAVEt_FREESV:
26d9b02f 11008 case SAVEt_MORTALIZESV:
1d7c1841 11009 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11010 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
11011 break;
11012 case SAVEt_FREEOP:
/* only refcounted ops of the listed leave/scope types are carried over
 * (same pointer, reference count incremented); every other op slot is
 * stored as Nullop in the copy */
11013 ptr = POPPTR(ss,ix);
11014 if (ptr && (((OP*)ptr)->op_private & OPpREFCOUNTED)) {
11015 /* these are assumed to be refcounted properly */
53c1dcc0 11016 OP *o;
1d7c1841
GS
11017 switch (((OP*)ptr)->op_type) {
11018 case OP_LEAVESUB:
11019 case OP_LEAVESUBLV:
11020 case OP_LEAVEEVAL:
11021 case OP_LEAVE:
11022 case OP_SCOPE:
11023 case OP_LEAVEWRITE:
e977893f
GS
11024 TOPPTR(nss,ix) = ptr;
11025 o = (OP*)ptr;
11026 OpREFCNT_inc(o);
1d7c1841
GS
11027 break;
11028 default:
11029 TOPPTR(nss,ix) = Nullop;
11030 break;
11031 }
11032 }
11033 else
11034 TOPPTR(nss,ix) = Nullop;
11035 break;
11036 case SAVEt_FREEPV:
11037 c = (char*)POPPTR(ss,ix);
11038 TOPPTR(nss,ix) = pv_dup_inc(c);
11039 break;
11040 case SAVEt_CLEARSV:
11041 longval = POPLONG(ss,ix);
11042 TOPLONG(nss,ix) = longval;
11043 break;
11044 case SAVEt_DELETE:
11045 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 11046 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841
GS
11047 c = (char*)POPPTR(ss,ix);
11048 TOPPTR(nss,ix) = pv_dup_inc(c);
11049 i = POPINT(ss,ix);
11050 TOPINT(nss,ix) = i;
11051 break;
11052 case SAVEt_DESTRUCTOR:
11053 ptr = POPPTR(ss,ix);
11054 TOPPTR(nss,ix) = any_dup(ptr, proto_perl); /* XXX quite arbitrary */
11055 dptr = POPDPTR(ss,ix);
8141890a
JH
11056 TOPDPTR(nss,ix) = DPTR2FPTR(void (*)(void*),
11057 any_dup(FPTR2DPTR(void *, dptr),
11058 proto_perl));
1d7c1841
GS
11059 break;
11060 case SAVEt_DESTRUCTOR_X:
11061 ptr = POPPTR(ss,ix);
11062 TOPPTR(nss,ix) = any_dup(ptr, proto_perl); /* XXX quite arbitrary */
11063 dxptr = POPDXPTR(ss,ix);
8141890a
JH
11064 TOPDXPTR(nss,ix) = DPTR2FPTR(void (*)(pTHX_ void*),
11065 any_dup(FPTR2DPTR(void *, dxptr),
11066 proto_perl));
1d7c1841
GS
11067 break;
11068 case SAVEt_REGCONTEXT:
11069 case SAVEt_ALLOC:
/* only the slot count is copied; the i slots themselves are skipped, so
 * they keep the zero fill that Newxz gave them in the copy */
11070 i = POPINT(ss,ix);
11071 TOPINT(nss,ix) = i;
11072 ix -= i;
11073 break;
11074 case SAVEt_STACK_POS: /* Position on Perl stack */
11075 i = POPINT(ss,ix);
11076 TOPINT(nss,ix) = i;
11077 break;
11078 case SAVEt_AELEM: /* array element */
11079 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11080 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
11081 i = POPINT(ss,ix);
11082 TOPINT(nss,ix) = i;
11083 av = (AV*)POPPTR(ss,ix);
d2d73c3e 11084 TOPPTR(nss,ix) = av_dup_inc(av, param);
1d7c1841
GS
11085 break;
11086 case SAVEt_HELEM: /* hash element */
11087 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11088 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 11089 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11090 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 11091 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 11092 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841
GS
11093 break;
11094 case SAVEt_OP:
11095 ptr = POPPTR(ss,ix);
11096 TOPPTR(nss,ix) = ptr;
11097 break;
11098 case SAVEt_HINTS:
11099 i = POPINT(ss,ix);
11100 TOPINT(nss,ix) = i;
11101 break;
c4410b1b
GS
11102 case SAVEt_COMPPAD:
11103 av = (AV*)POPPTR(ss,ix);
58ed4fbe 11104 TOPPTR(nss,ix) = av_dup(av, param);
c4410b1b 11105 break;
c3564e5c
GS
11106 case SAVEt_PADSV:
11107 longval = (long)POPLONG(ss,ix);
11108 TOPLONG(nss,ix) = longval;
11109 ptr = POPPTR(ss,ix);
11110 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
11111 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11112 TOPPTR(nss,ix) = sv_dup(sv, param);
c3564e5c 11113 break;
a1bb4754 11114 case SAVEt_BOOL:
38d8b13e 11115 ptr = POPPTR(ss,ix);
b9609c01 11116 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
38d8b13e 11117 longval = (long)POPBOOL(ss,ix);
b9609c01 11118 TOPBOOL(nss,ix) = (bool)longval;
a1bb4754 11119 break;
8bd2680e
MHM
11120 case SAVEt_SET_SVFLAGS:
11121 i = POPINT(ss,ix);
11122 TOPINT(nss,ix) = i;
11123 i = POPINT(ss,ix);
11124 TOPINT(nss,ix) = i;
11125 sv = (SV*)POPPTR(ss,ix);
11126 TOPPTR(nss,ix) = sv_dup(sv, param);
11127 break;
1d7c1841
GS
11128 default:
11129 Perl_croak(aTHX_ "panic: ss_dup inconsistency");
11130 }
11131 }
11132
11133 return nss;
11134}
11135
9660f481
DM
11136
11137/* if sv is a stash, call $class->CLONE_SKIP(), and set the SVphv_CLONEABLE
11138 * flag to the result. This is done for each stash before cloning starts,
11139 * so we know which stashes want their objects cloned */
11140
11141static void
11142do_mark_cloneable_stash(pTHX_ SV *sv)
11143{
53c1dcc0 11144 const HEK * const hvname = HvNAME_HEK((HV*)sv);
bfcb3514 11145 if (hvname) {
53c1dcc0 11146 GV* const cloner = gv_fetchmethod_autoload((HV*)sv, "CLONE_SKIP", 0);
9660f481
DM
11147 SvFLAGS(sv) |= SVphv_CLONEABLE; /* clone objects by default */
11148 if (cloner && GvCV(cloner)) {
11149 dSP;
11150 UV status;
11151
11152 ENTER;
11153 SAVETMPS;
11154 PUSHMARK(SP);
84bda14a 11155 XPUSHs(sv_2mortal(newSVhek(hvname)));
9660f481
DM
11156 PUTBACK;
11157 call_sv((SV*)GvCV(cloner), G_SCALAR);
11158 SPAGAIN;
11159 status = POPu;
11160 PUTBACK;
11161 FREETMPS;
11162 LEAVE;
11163 if (status)
11164 SvFLAGS(sv) &= ~SVphv_CLONEABLE;
11165 }
11166 }
11167}
11168
11169
11170
645c22ef
DM
11171/*
11172=for apidoc perl_clone
11173
11174Create and return a new interpreter by cloning the current one.
11175
4be49ee6 11176perl_clone takes these flags as parameters:
6a78b4db 11177
7a5fa8a2
NIS
CLONEf_COPY_STACKS - is used to copy the stacks as well.
Without it we only clone the data and zero the stacks;
with it we copy the stacks and the new perl interpreter is
ready to run at the exact same point as the previous one.
The pseudo-fork code uses COPY_STACKS while
threads->new doesn't.
11184
CLONEf_KEEP_PTR_TABLE
perl_clone keeps a ptr_table with the pointer of the old
variable as a key and the new variable as a value.
This allows it to check if something has been cloned and not
clone it again but rather just use the value and increase the
refcount. If KEEP_PTR_TABLE is not set then perl_clone will kill
the ptr_table using the function
C<ptr_table_free(PL_ptr_table); PL_ptr_table = NULL;>.
The reason to keep it around is if you want to dup some of your own
variables which are outside the graph perl scans; an example of this
code is in threads.xs create.
11196
CLONEf_CLONE_HOST
This is a win32 thing; it is ignored on unix. It tells perl's
win32host code (which is C++) to clone itself. This is needed on
win32 if you want to run two threads at the same time.
If you just want to do some stuff in a separate perl interpreter
and then throw it away and return to the original one,
you don't need to do anything.
11204
645c22ef
DM
11205=cut
11206*/
11207
11208/* XXX the above needs expanding by someone who actually understands it ! */
3fc56081
NK
11209EXTERN_C PerlInterpreter *
11210perl_clone_host(PerlInterpreter* proto_perl, UV flags);
645c22ef 11211
1d7c1841
GS
11212PerlInterpreter *
11213perl_clone(PerlInterpreter *proto_perl, UV flags)
11214{
27da23d5 11215 dVAR;
1d7c1841 11216#ifdef PERL_IMPLICIT_SYS
c43294b8
AB
11217
11218 /* perlhost.h so we need to call into it
11219 to clone the host, CPerlHost should have a c interface, sky */
11220
11221 if (flags & CLONEf_CLONE_HOST) {
11222 return perl_clone_host(proto_perl,flags);
11223 }
11224 return perl_clone_using(proto_perl, flags,
1d7c1841
GS
11225 proto_perl->IMem,
11226 proto_perl->IMemShared,
11227 proto_perl->IMemParse,
11228 proto_perl->IEnv,
11229 proto_perl->IStdIO,
11230 proto_perl->ILIO,
11231 proto_perl->IDir,
11232 proto_perl->ISock,
11233 proto_perl->IProc);
11234}
11235
11236PerlInterpreter *
11237perl_clone_using(PerlInterpreter *proto_perl, UV flags,
11238 struct IPerlMem* ipM, struct IPerlMem* ipMS,
11239 struct IPerlMem* ipMP, struct IPerlEnv* ipE,
11240 struct IPerlStdIO* ipStd, struct IPerlLIO* ipLIO,
11241 struct IPerlDir* ipD, struct IPerlSock* ipS,
11242 struct IPerlProc* ipP)
11243{
11244 /* XXX many of the string copies here can be optimized if they're
11245 * constants; they need to be allocated as common memory and just
11246 * their pointers copied. */
11247
8fc9efbd 11248 IV i;
64aa0685
GS
11249 CLONE_PARAMS clone_params;
11250 CLONE_PARAMS* param = &clone_params;
d2d73c3e 11251
1d7c1841 11252 PerlInterpreter *my_perl = (PerlInterpreter*)(*ipM->pMalloc)(ipM, sizeof(PerlInterpreter));
9660f481
DM
11253 /* for each stash, determine whether its objects should be cloned */
11254 S_visit(proto_perl, do_mark_cloneable_stash, SVt_PVHV, SVTYPEMASK);
ba869deb 11255 PERL_SET_THX(my_perl);
1d7c1841 11256
acfe0abc 11257# ifdef DEBUGGING
a4530404 11258 Poison(my_perl, 1, PerlInterpreter);
fd0854ff 11259 PL_op = Nullop;
c008732b 11260 PL_curcop = (COP *)Nullop;
1d7c1841
GS
11261 PL_markstack = 0;
11262 PL_scopestack = 0;
11263 PL_savestack = 0;
22f7c9c9
JH
11264 PL_savestack_ix = 0;
11265 PL_savestack_max = -1;
66fe0623 11266 PL_sig_pending = 0;
25596c82 11267 Zero(&PL_debug_pad, 1, struct perl_debug_pad);
acfe0abc 11268# else /* !DEBUGGING */
1d7c1841 11269 Zero(my_perl, 1, PerlInterpreter);
acfe0abc 11270# endif /* DEBUGGING */
1d7c1841
GS
11271
11272 /* host pointers */
11273 PL_Mem = ipM;
11274 PL_MemShared = ipMS;
11275 PL_MemParse = ipMP;
11276 PL_Env = ipE;
11277 PL_StdIO = ipStd;
11278 PL_LIO = ipLIO;
11279 PL_Dir = ipD;
11280 PL_Sock = ipS;
11281 PL_Proc = ipP;
1d7c1841
GS
11282#else /* !PERL_IMPLICIT_SYS */
11283 IV i;
64aa0685
GS
11284 CLONE_PARAMS clone_params;
11285 CLONE_PARAMS* param = &clone_params;
1d7c1841 11286 PerlInterpreter *my_perl = (PerlInterpreter*)PerlMem_malloc(sizeof(PerlInterpreter));
9660f481
DM
11287 /* for each stash, determine whether its objects should be cloned */
11288 S_visit(proto_perl, do_mark_cloneable_stash, SVt_PVHV, SVTYPEMASK);
ba869deb 11289 PERL_SET_THX(my_perl);
1d7c1841
GS
11290
11291# ifdef DEBUGGING
a4530404 11292 Poison(my_perl, 1, PerlInterpreter);
fd0854ff 11293 PL_op = Nullop;
c008732b 11294 PL_curcop = (COP *)Nullop;
1d7c1841
GS
11295 PL_markstack = 0;
11296 PL_scopestack = 0;
11297 PL_savestack = 0;
22f7c9c9
JH
11298 PL_savestack_ix = 0;
11299 PL_savestack_max = -1;
66fe0623 11300 PL_sig_pending = 0;
25596c82 11301 Zero(&PL_debug_pad, 1, struct perl_debug_pad);
1d7c1841
GS
11302# else /* !DEBUGGING */
11303 Zero(my_perl, 1, PerlInterpreter);
11304# endif /* DEBUGGING */
11305#endif /* PERL_IMPLICIT_SYS */
83236556 11306 param->flags = flags;
59b40662 11307 param->proto_perl = proto_perl;
1d7c1841
GS
11308
11309 /* arena roots */
612f20c3 11310 PL_xnv_arenaroot = NULL;
1d7c1841 11311 PL_xnv_root = NULL;
612f20c3 11312 PL_xpv_arenaroot = NULL;
1d7c1841 11313 PL_xpv_root = NULL;
612f20c3 11314 PL_xpviv_arenaroot = NULL;
1d7c1841 11315 PL_xpviv_root = NULL;
612f20c3 11316 PL_xpvnv_arenaroot = NULL;
1d7c1841 11317 PL_xpvnv_root = NULL;
612f20c3 11318 PL_xpvcv_arenaroot = NULL;
1d7c1841 11319 PL_xpvcv_root = NULL;
612f20c3 11320 PL_xpvav_arenaroot = NULL;
1d7c1841 11321 PL_xpvav_root = NULL;
612f20c3 11322 PL_xpvhv_arenaroot = NULL;
1d7c1841 11323 PL_xpvhv_root = NULL;
612f20c3 11324 PL_xpvmg_arenaroot = NULL;
1d7c1841 11325 PL_xpvmg_root = NULL;
7552b40b
DM
11326 PL_xpvgv_arenaroot = NULL;
11327 PL_xpvgv_root = NULL;
612f20c3 11328 PL_xpvlv_arenaroot = NULL;
1d7c1841 11329 PL_xpvlv_root = NULL;
612f20c3 11330 PL_xpvbm_arenaroot = NULL;
1d7c1841 11331 PL_xpvbm_root = NULL;
612f20c3 11332 PL_he_arenaroot = NULL;
1d7c1841 11333 PL_he_root = NULL;
892b45be 11334#if defined(USE_ITHREADS)
32e691d0
NC
11335 PL_pte_arenaroot = NULL;
11336 PL_pte_root = NULL;
892b45be 11337#endif
1d7c1841
GS
11338 PL_nice_chunk = NULL;
11339 PL_nice_chunk_size = 0;
11340 PL_sv_count = 0;
11341 PL_sv_objcount = 0;
11342 PL_sv_root = Nullsv;
11343 PL_sv_arenaroot = Nullsv;
11344
11345 PL_debug = proto_perl->Idebug;
11346
8df990a8
NC
11347 PL_hash_seed = proto_perl->Ihash_seed;
11348 PL_rehash_seed = proto_perl->Irehash_seed;
11349
e5dd39fc 11350#ifdef USE_REENTRANT_API
68853529
SB
11351 /* XXX: things like -Dm will segfault here in perlio, but doing
11352 * PERL_SET_CONTEXT(proto_perl);
11353 * breaks too many other things
11354 */
59bd0823 11355 Perl_reentrant_init(aTHX);
e5dd39fc
AB
11356#endif
11357
1d7c1841
GS
11358 /* create SV map for pointer relocation */
11359 PL_ptr_table = ptr_table_new();
11360
11361 /* initialize these special pointers as early as possible */
11362 SvANY(&PL_sv_undef) = NULL;
11363 SvREFCNT(&PL_sv_undef) = (~(U32)0)/2;
11364 SvFLAGS(&PL_sv_undef) = SVf_READONLY|SVt_NULL;
11365 ptr_table_store(PL_ptr_table, &proto_perl->Isv_undef, &PL_sv_undef);
11366
1d7c1841 11367 SvANY(&PL_sv_no) = new_XPVNV();
1d7c1841 11368 SvREFCNT(&PL_sv_no) = (~(U32)0)/2;
0309f36e
NC
11369 SvFLAGS(&PL_sv_no) = SVp_IOK|SVf_IOK|SVp_NOK|SVf_NOK
11370 |SVp_POK|SVf_POK|SVf_READONLY|SVt_PVNV;
f880fe2f 11371 SvPV_set(&PL_sv_no, SAVEPVN(PL_No, 0));
b162af07
SP
11372 SvCUR_set(&PL_sv_no, 0);
11373 SvLEN_set(&PL_sv_no, 1);
45977657 11374 SvIV_set(&PL_sv_no, 0);
9d6ce603 11375 SvNV_set(&PL_sv_no, 0);
1d7c1841
GS
11376 ptr_table_store(PL_ptr_table, &proto_perl->Isv_no, &PL_sv_no);
11377
1d7c1841 11378 SvANY(&PL_sv_yes) = new_XPVNV();
1d7c1841 11379 SvREFCNT(&PL_sv_yes) = (~(U32)0)/2;
0309f36e
NC
11380 SvFLAGS(&PL_sv_yes) = SVp_IOK|SVf_IOK|SVp_NOK|SVf_NOK
11381 |SVp_POK|SVf_POK|SVf_READONLY|SVt_PVNV;
f880fe2f 11382 SvPV_set(&PL_sv_yes, SAVEPVN(PL_Yes, 1));
b162af07
SP
11383 SvCUR_set(&PL_sv_yes, 1);
11384 SvLEN_set(&PL_sv_yes, 2);
45977657 11385 SvIV_set(&PL_sv_yes, 1);
9d6ce603 11386 SvNV_set(&PL_sv_yes, 1);
1d7c1841
GS
11387 ptr_table_store(PL_ptr_table, &proto_perl->Isv_yes, &PL_sv_yes);
11388
05ec9bb3 11389 /* create (a non-shared!) shared string table */
1d7c1841
GS
11390 PL_strtab = newHV();
11391 HvSHAREKEYS_off(PL_strtab);
c4a9c09d 11392 hv_ksplit(PL_strtab, HvTOTALKEYS(proto_perl->Istrtab));
1d7c1841
GS
11393 ptr_table_store(PL_ptr_table, proto_perl->Istrtab, PL_strtab);
11394
05ec9bb3
NIS
11395 PL_compiling = proto_perl->Icompiling;
11396
11397 /* These two PVs will be free'd special way so must set them same way op.c does */
11398 PL_compiling.cop_stashpv = savesharedpv(PL_compiling.cop_stashpv);
11399 ptr_table_store(PL_ptr_table, proto_perl->Icompiling.cop_stashpv, PL_compiling.cop_stashpv);
11400
11401 PL_compiling.cop_file = savesharedpv(PL_compiling.cop_file);
11402 ptr_table_store(PL_ptr_table, proto_perl->Icompiling.cop_file, PL_compiling.cop_file);
11403
1d7c1841
GS
11404 ptr_table_store(PL_ptr_table, &proto_perl->Icompiling, &PL_compiling);
11405 if (!specialWARN(PL_compiling.cop_warnings))
d2d73c3e 11406 PL_compiling.cop_warnings = sv_dup_inc(PL_compiling.cop_warnings, param);
ac27b0f5 11407 if (!specialCopIO(PL_compiling.cop_io))
d2d73c3e 11408 PL_compiling.cop_io = sv_dup_inc(PL_compiling.cop_io, param);
1d7c1841
GS
11409 PL_curcop = (COP*)any_dup(proto_perl->Tcurcop, proto_perl);
11410
11411 /* pseudo environmental stuff */
11412 PL_origargc = proto_perl->Iorigargc;
e2975953 11413 PL_origargv = proto_perl->Iorigargv;
d2d73c3e 11414
d2d73c3e
AB
11415 param->stashes = newAV(); /* Setup array of objects to call clone on */
11416
d419787a
SH
11417 /* Set tainting stuff before PerlIO_debug can possibly get called */
11418 PL_tainting = proto_perl->Itainting;
11419 PL_taint_warn = proto_perl->Itaint_warn;
11420
a1ea730d 11421#ifdef PERLIO_LAYERS
3a1ee7e8
NIS
11422 /* Clone PerlIO tables as soon as we can handle general xx_dup() */
11423 PerlIO_clone(aTHX_ proto_perl, param);
a1ea730d 11424#endif
d2d73c3e
AB
11425
11426 PL_envgv = gv_dup(proto_perl->Ienvgv, param);
11427 PL_incgv = gv_dup(proto_perl->Iincgv, param);
11428 PL_hintgv = gv_dup(proto_perl->Ihintgv, param);
1d7c1841 11429 PL_origfilename = SAVEPV(proto_perl->Iorigfilename);
d2d73c3e
AB
11430 PL_diehook = sv_dup_inc(proto_perl->Idiehook, param);
11431 PL_warnhook = sv_dup_inc(proto_perl->Iwarnhook, param);
1d7c1841
GS
11432
11433 /* switches */
11434 PL_minus_c = proto_perl->Iminus_c;
d2d73c3e 11435 PL_patchlevel = sv_dup_inc(proto_perl->Ipatchlevel, param);
1d7c1841
GS
11436 PL_localpatches = proto_perl->Ilocalpatches;
11437 PL_splitstr = proto_perl->Isplitstr;
11438 PL_preprocess = proto_perl->Ipreprocess;
11439 PL_minus_n = proto_perl->Iminus_n;
11440 PL_minus_p = proto_perl->Iminus_p;
11441 PL_minus_l = proto_perl->Iminus_l;
11442 PL_minus_a = proto_perl->Iminus_a;
11443 PL_minus_F = proto_perl->Iminus_F;
11444 PL_doswitches = proto_perl->Idoswitches;
11445 PL_dowarn = proto_perl->Idowarn;
11446 PL_doextract = proto_perl->Idoextract;
11447 PL_sawampersand = proto_perl->Isawampersand;
11448 PL_unsafe = proto_perl->Iunsafe;
11449 PL_inplace = SAVEPV(proto_perl->Iinplace);
d2d73c3e 11450 PL_e_script = sv_dup_inc(proto_perl->Ie_script, param);
1d7c1841
GS
11451 PL_perldb = proto_perl->Iperldb;
11452 PL_perl_destruct_level = proto_perl->Iperl_destruct_level;
1cbb0781 11453 PL_exit_flags = proto_perl->Iexit_flags;
1d7c1841
GS
11454
11455 /* magical thingies */
11456 /* XXX time(&PL_basetime) when asked for? */
11457 PL_basetime = proto_perl->Ibasetime;
d2d73c3e 11458 PL_formfeed = sv_dup(proto_perl->Iformfeed, param);
1d7c1841
GS
11459
11460 PL_maxsysfd = proto_perl->Imaxsysfd;
11461 PL_multiline = proto_perl->Imultiline;
11462 PL_statusvalue = proto_perl->Istatusvalue;
11463#ifdef VMS
11464 PL_statusvalue_vms = proto_perl->Istatusvalue_vms;
11465#endif
0a378802 11466 PL_encoding = sv_dup(proto_perl->Iencoding, param);
1d7c1841 11467
4a4c6fe3 11468 sv_setpvn(PERL_DEBUG_PAD(0), "", 0); /* For regex debugging. */
1f483ca1
JH
11469 sv_setpvn(PERL_DEBUG_PAD(1), "", 0); /* ext/re needs these */
11470 sv_setpvn(PERL_DEBUG_PAD(2), "", 0); /* even without DEBUGGING. */
4a4c6fe3 11471
d2f185dc
AMS
11472 /* Clone the regex array */
11473 PL_regex_padav = newAV();
11474 {
a3b680e6 11475 const I32 len = av_len((AV*)proto_perl->Iregex_padav);
53c1dcc0 11476 SV** const regexen = AvARRAY((AV*)proto_perl->Iregex_padav);
b464bac0 11477 IV i;
0f95fc41
AB
11478 av_push(PL_regex_padav,
11479 sv_dup_inc(regexen[0],param));
11480 for(i = 1; i <= len; i++) {
11481 if(SvREPADTMP(regexen[i])) {
11482 av_push(PL_regex_padav, sv_dup_inc(regexen[i], param));
8cf8f3d1 11483 } else {
0f95fc41
AB
11484 av_push(PL_regex_padav,
11485 SvREFCNT_inc(
8cf8f3d1 11486 newSViv(PTR2IV(re_dup(INT2PTR(REGEXP *,
cbfa9890 11487 SvIVX(regexen[i])), param)))
0f95fc41
AB
11488 ));
11489 }
d2f185dc
AMS
11490 }
11491 }
11492 PL_regex_pad = AvARRAY(PL_regex_padav);
1fcf4c12 11493
1d7c1841 11494 /* shortcuts to various I/O objects */
d2d73c3e
AB
11495 PL_stdingv = gv_dup(proto_perl->Istdingv, param);
11496 PL_stderrgv = gv_dup(proto_perl->Istderrgv, param);
11497 PL_defgv = gv_dup(proto_perl->Idefgv, param);
11498 PL_argvgv = gv_dup(proto_perl->Iargvgv, param);
11499 PL_argvoutgv = gv_dup(proto_perl->Iargvoutgv, param);
11500 PL_argvout_stack = av_dup_inc(proto_perl->Iargvout_stack, param);
1d7c1841
GS
11501
11502 /* shortcuts to regexp stuff */
d2d73c3e 11503 PL_replgv = gv_dup(proto_perl->Ireplgv, param);
1d7c1841
GS
11504
11505 /* shortcuts to misc objects */
d2d73c3e 11506 PL_errgv = gv_dup(proto_perl->Ierrgv, param);
1d7c1841
GS
11507
11508 /* shortcuts to debugging objects */
d2d73c3e
AB
11509 PL_DBgv = gv_dup(proto_perl->IDBgv, param);
11510 PL_DBline = gv_dup(proto_perl->IDBline, param);
11511 PL_DBsub = gv_dup(proto_perl->IDBsub, param);
11512 PL_DBsingle = sv_dup(proto_perl->IDBsingle, param);
11513 PL_DBtrace = sv_dup(proto_perl->IDBtrace, param);
11514 PL_DBsignal = sv_dup(proto_perl->IDBsignal, param);
06492da6 11515 PL_DBassertion = sv_dup(proto_perl->IDBassertion, param);
d2d73c3e
AB
11516 PL_lineary = av_dup(proto_perl->Ilineary, param);
11517 PL_dbargs = av_dup(proto_perl->Idbargs, param);
1d7c1841
GS
11518
11519 /* symbol tables */
d2d73c3e
AB
11520 PL_defstash = hv_dup_inc(proto_perl->Tdefstash, param);
11521 PL_curstash = hv_dup(proto_perl->Tcurstash, param);
d2d73c3e
AB
11522 PL_debstash = hv_dup(proto_perl->Idebstash, param);
11523 PL_globalstash = hv_dup(proto_perl->Iglobalstash, param);
11524 PL_curstname = sv_dup_inc(proto_perl->Icurstname, param);
11525
11526 PL_beginav = av_dup_inc(proto_perl->Ibeginav, param);
ee1c5a4e 11527 PL_beginav_save = av_dup_inc(proto_perl->Ibeginav_save, param);
ece599bd 11528 PL_checkav_save = av_dup_inc(proto_perl->Icheckav_save, param);
d2d73c3e
AB
11529 PL_endav = av_dup_inc(proto_perl->Iendav, param);
11530 PL_checkav = av_dup_inc(proto_perl->Icheckav, param);
11531 PL_initav = av_dup_inc(proto_perl->Iinitav, param);
1d7c1841
GS
11532
11533 PL_sub_generation = proto_perl->Isub_generation;
11534
11535 /* funky return mechanisms */
11536 PL_forkprocess = proto_perl->Iforkprocess;
11537
11538 /* subprocess state */
d2d73c3e 11539 PL_fdpid = av_dup_inc(proto_perl->Ifdpid, param);
1d7c1841
GS
11540
11541 /* internal state */
1d7c1841
GS
11542 PL_maxo = proto_perl->Imaxo;
11543 if (proto_perl->Iop_mask)
11544 PL_op_mask = SAVEPVN(proto_perl->Iop_mask, PL_maxo);
11545 else
11546 PL_op_mask = Nullch;
06492da6 11547 /* PL_asserting = proto_perl->Iasserting; */
1d7c1841
GS
11548
11549 /* current interpreter roots */
d2d73c3e 11550 PL_main_cv = cv_dup_inc(proto_perl->Imain_cv, param);
1d7c1841
GS
11551 PL_main_root = OpREFCNT_inc(proto_perl->Imain_root);
11552 PL_main_start = proto_perl->Imain_start;
e977893f 11553 PL_eval_root = proto_perl->Ieval_root;
1d7c1841
GS
11554 PL_eval_start = proto_perl->Ieval_start;
11555
11556 /* runtime control stuff */
11557 PL_curcopdb = (COP*)any_dup(proto_perl->Icurcopdb, proto_perl);
11558 PL_copline = proto_perl->Icopline;
11559
11560 PL_filemode = proto_perl->Ifilemode;
11561 PL_lastfd = proto_perl->Ilastfd;
11562 PL_oldname = proto_perl->Ioldname; /* XXX not quite right */
11563 PL_Argv = NULL;
11564 PL_Cmd = Nullch;
11565 PL_gensym = proto_perl->Igensym;
11566 PL_preambled = proto_perl->Ipreambled;
d2d73c3e 11567 PL_preambleav = av_dup_inc(proto_perl->Ipreambleav, param);
1d7c1841
GS
11568 PL_laststatval = proto_perl->Ilaststatval;
11569 PL_laststype = proto_perl->Ilaststype;
11570 PL_mess_sv = Nullsv;
11571
d2d73c3e 11572 PL_ors_sv = sv_dup_inc(proto_perl->Iors_sv, param);
1d7c1841
GS
11573
11574 /* interpreter atexit processing */
11575 PL_exitlistlen = proto_perl->Iexitlistlen;
11576 if (PL_exitlistlen) {
a02a5408 11577 Newx(PL_exitlist, PL_exitlistlen, PerlExitListEntry);
1d7c1841
GS
11578 Copy(proto_perl->Iexitlist, PL_exitlist, PL_exitlistlen, PerlExitListEntry);
11579 }
11580 else
11581 PL_exitlist = (PerlExitListEntry*)NULL;
d2d73c3e 11582 PL_modglobal = hv_dup_inc(proto_perl->Imodglobal, param);
19e8ce8e
AB
11583 PL_custom_op_names = hv_dup_inc(proto_perl->Icustom_op_names,param);
11584 PL_custom_op_descs = hv_dup_inc(proto_perl->Icustom_op_descs,param);
1d7c1841
GS
11585
11586 PL_profiledata = NULL;
a8fc9800 11587 PL_rsfp = fp_dup(proto_perl->Irsfp, '<', param);
1d7c1841 11588 /* PL_rsfp_filters entries have fake IoDIRP() */
d2d73c3e 11589 PL_rsfp_filters = av_dup_inc(proto_perl->Irsfp_filters, param);
1d7c1841 11590
d2d73c3e 11591 PL_compcv = cv_dup(proto_perl->Icompcv, param);
dd2155a4
DM
11592
11593 PAD_CLONE_VARS(proto_perl, param);
1d7c1841
GS
11594
11595#ifdef HAVE_INTERP_INTERN
11596 sys_intern_dup(&proto_perl->Isys_intern, &PL_sys_intern);
11597#endif
11598
11599 /* more statics moved here */
11600 PL_generation = proto_perl->Igeneration;
d2d73c3e 11601 PL_DBcv = cv_dup(proto_perl->IDBcv, param);
1d7c1841
GS
11602
11603 PL_in_clean_objs = proto_perl->Iin_clean_objs;
11604 PL_in_clean_all = proto_perl->Iin_clean_all;
11605
11606 PL_uid = proto_perl->Iuid;
11607 PL_euid = proto_perl->Ieuid;
11608 PL_gid = proto_perl->Igid;
11609 PL_egid = proto_perl->Iegid;
11610 PL_nomemok = proto_perl->Inomemok;
11611 PL_an = proto_perl->Ian;
1d7c1841
GS
11612 PL_evalseq = proto_perl->Ievalseq;
11613 PL_origenviron = proto_perl->Iorigenviron; /* XXX not quite right */
11614 PL_origalen = proto_perl->Iorigalen;
11615 PL_pidstatus = newHV(); /* XXX flag for cloning? */
11616 PL_osname = SAVEPV(proto_perl->Iosname);
1d7c1841
GS
11617 PL_sighandlerp = proto_perl->Isighandlerp;
11618
1d7c1841
GS
11619 PL_runops = proto_perl->Irunops;
11620
11621 Copy(proto_perl->Itokenbuf, PL_tokenbuf, 256, char);
11622
11623#ifdef CSH
11624 PL_cshlen = proto_perl->Icshlen;
74f1b2b8 11625 PL_cshname = proto_perl->Icshname; /* XXX never deallocated */
1d7c1841
GS
11626#endif
11627
11628 PL_lex_state = proto_perl->Ilex_state;
11629 PL_lex_defer = proto_perl->Ilex_defer;
11630 PL_lex_expect = proto_perl->Ilex_expect;
11631 PL_lex_formbrack = proto_perl->Ilex_formbrack;
11632 PL_lex_dojoin = proto_perl->Ilex_dojoin;
11633 PL_lex_starts = proto_perl->Ilex_starts;
d2d73c3e
AB
11634 PL_lex_stuff = sv_dup_inc(proto_perl->Ilex_stuff, param);
11635 PL_lex_repl = sv_dup_inc(proto_perl->Ilex_repl, param);
1d7c1841
GS
11636 PL_lex_op = proto_perl->Ilex_op;
11637 PL_lex_inpat = proto_perl->Ilex_inpat;
11638 PL_lex_inwhat = proto_perl->Ilex_inwhat;
11639 PL_lex_brackets = proto_perl->Ilex_brackets;
11640 i = (PL_lex_brackets < 120 ? 120 : PL_lex_brackets);
11641 PL_lex_brackstack = SAVEPVN(proto_perl->Ilex_brackstack,i);
11642 PL_lex_casemods = proto_perl->Ilex_casemods;
11643 i = (PL_lex_casemods < 12 ? 12 : PL_lex_casemods);
11644 PL_lex_casestack = SAVEPVN(proto_perl->Ilex_casestack,i);
11645
11646 Copy(proto_perl->Inextval, PL_nextval, 5, YYSTYPE);
11647 Copy(proto_perl->Inexttype, PL_nexttype, 5, I32);
11648 PL_nexttoke = proto_perl->Inexttoke;
11649
1d773130
TB
11650 /* XXX This is probably masking the deeper issue of why
11651 * SvANY(proto_perl->Ilinestr) can be NULL at this point. For test case:
11652 * http://archive.develooper.com/perl5-porters%40perl.org/msg83298.html
11653 * (A little debugging with a watchpoint on it may help.)
11654 */
389edf32
TB
11655 if (SvANY(proto_perl->Ilinestr)) {
11656 PL_linestr = sv_dup_inc(proto_perl->Ilinestr, param);
3f7c398e 11657 i = proto_perl->Ibufptr - SvPVX_const(proto_perl->Ilinestr);
389edf32 11658 PL_bufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11659 i = proto_perl->Ioldbufptr - SvPVX_const(proto_perl->Ilinestr);
389edf32 11660 PL_oldbufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11661 i = proto_perl->Ioldoldbufptr - SvPVX_const(proto_perl->Ilinestr);
389edf32 11662 PL_oldoldbufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11663 i = proto_perl->Ilinestart - SvPVX_const(proto_perl->Ilinestr);
389edf32
TB
11664 PL_linestart = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11665 }
11666 else {
11667 PL_linestr = NEWSV(65,79);
11668 sv_upgrade(PL_linestr,SVt_PVIV);
11669 sv_setpvn(PL_linestr,"",0);
11670 PL_bufptr = PL_oldbufptr = PL_oldoldbufptr = PL_linestart = SvPVX(PL_linestr);
11671 }
1d7c1841 11672 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
1d7c1841
GS
11673 PL_pending_ident = proto_perl->Ipending_ident;
11674 PL_sublex_info = proto_perl->Isublex_info; /* XXX not quite right */
11675
11676 PL_expect = proto_perl->Iexpect;
11677
11678 PL_multi_start = proto_perl->Imulti_start;
11679 PL_multi_end = proto_perl->Imulti_end;
11680 PL_multi_open = proto_perl->Imulti_open;
11681 PL_multi_close = proto_perl->Imulti_close;
11682
11683 PL_error_count = proto_perl->Ierror_count;
11684 PL_subline = proto_perl->Isubline;
d2d73c3e 11685 PL_subname = sv_dup_inc(proto_perl->Isubname, param);
1d7c1841 11686
1d773130 11687 /* XXX See comment on SvANY(proto_perl->Ilinestr) above */
389edf32 11688 if (SvANY(proto_perl->Ilinestr)) {
3f7c398e 11689 i = proto_perl->Ilast_uni - SvPVX_const(proto_perl->Ilinestr);
389edf32 11690 PL_last_uni = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11691 i = proto_perl->Ilast_lop - SvPVX_const(proto_perl->Ilinestr);
389edf32
TB
11692 PL_last_lop = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11693 PL_last_lop_op = proto_perl->Ilast_lop_op;
11694 }
11695 else {
11696 PL_last_uni = SvPVX(PL_linestr);
11697 PL_last_lop = SvPVX(PL_linestr);
11698 PL_last_lop_op = 0;
11699 }
1d7c1841 11700 PL_in_my = proto_perl->Iin_my;
d2d73c3e 11701 PL_in_my_stash = hv_dup(proto_perl->Iin_my_stash, param);
1d7c1841
GS
11702#ifdef FCRYPT
11703 PL_cryptseen = proto_perl->Icryptseen;
11704#endif
11705
11706 PL_hints = proto_perl->Ihints;
11707
11708 PL_amagic_generation = proto_perl->Iamagic_generation;
11709
11710#ifdef USE_LOCALE_COLLATE
11711 PL_collation_ix = proto_perl->Icollation_ix;
11712 PL_collation_name = SAVEPV(proto_perl->Icollation_name);
11713 PL_collation_standard = proto_perl->Icollation_standard;
11714 PL_collxfrm_base = proto_perl->Icollxfrm_base;
11715 PL_collxfrm_mult = proto_perl->Icollxfrm_mult;
11716#endif /* USE_LOCALE_COLLATE */
11717
11718#ifdef USE_LOCALE_NUMERIC
11719 PL_numeric_name = SAVEPV(proto_perl->Inumeric_name);
11720 PL_numeric_standard = proto_perl->Inumeric_standard;
11721 PL_numeric_local = proto_perl->Inumeric_local;
d2d73c3e 11722 PL_numeric_radix_sv = sv_dup_inc(proto_perl->Inumeric_radix_sv, param);
1d7c1841
GS
11723#endif /* !USE_LOCALE_NUMERIC */
11724
11725 /* utf8 character classes */
d2d73c3e
AB
11726 PL_utf8_alnum = sv_dup_inc(proto_perl->Iutf8_alnum, param);
11727 PL_utf8_alnumc = sv_dup_inc(proto_perl->Iutf8_alnumc, param);
11728 PL_utf8_ascii = sv_dup_inc(proto_perl->Iutf8_ascii, param);
11729 PL_utf8_alpha = sv_dup_inc(proto_perl->Iutf8_alpha, param);
11730 PL_utf8_space = sv_dup_inc(proto_perl->Iutf8_space, param);
11731 PL_utf8_cntrl = sv_dup_inc(proto_perl->Iutf8_cntrl, param);
11732 PL_utf8_graph = sv_dup_inc(proto_perl->Iutf8_graph, param);
11733 PL_utf8_digit = sv_dup_inc(proto_perl->Iutf8_digit, param);
11734 PL_utf8_upper = sv_dup_inc(proto_perl->Iutf8_upper, param);
11735 PL_utf8_lower = sv_dup_inc(proto_perl->Iutf8_lower, param);
11736 PL_utf8_print = sv_dup_inc(proto_perl->Iutf8_print, param);
11737 PL_utf8_punct = sv_dup_inc(proto_perl->Iutf8_punct, param);
11738 PL_utf8_xdigit = sv_dup_inc(proto_perl->Iutf8_xdigit, param);
11739 PL_utf8_mark = sv_dup_inc(proto_perl->Iutf8_mark, param);
11740 PL_utf8_toupper = sv_dup_inc(proto_perl->Iutf8_toupper, param);
11741 PL_utf8_totitle = sv_dup_inc(proto_perl->Iutf8_totitle, param);
11742 PL_utf8_tolower = sv_dup_inc(proto_perl->Iutf8_tolower, param);
b4e400f9 11743 PL_utf8_tofold = sv_dup_inc(proto_perl->Iutf8_tofold, param);
82686b01
JH
11744 PL_utf8_idstart = sv_dup_inc(proto_perl->Iutf8_idstart, param);
11745 PL_utf8_idcont = sv_dup_inc(proto_perl->Iutf8_idcont, param);
1d7c1841 11746
6c3182a5 11747 /* Did the locale setup indicate UTF-8? */
9769094f 11748 PL_utf8locale = proto_perl->Iutf8locale;
6c3182a5
JH
11749 /* Unicode features (see perlrun/-C) */
11750 PL_unicode = proto_perl->Iunicode;
11751
11752 /* Pre-5.8 signals control */
11753 PL_signals = proto_perl->Isignals;
11754
11755 /* times() ticks per second */
11756 PL_clocktick = proto_perl->Iclocktick;
11757
11758 /* Recursion stopper for PerlIO_find_layer */
11759 PL_in_load_module = proto_perl->Iin_load_module;
11760
11761 /* sort() routine */
11762 PL_sort_RealCmp = proto_perl->Isort_RealCmp;
11763
57c6e6d2
JH
11764 /* Not really needed/useful since the reenrant_retint is "volatile",
11765 * but do it for consistency's sake. */
11766 PL_reentrant_retint = proto_perl->Ireentrant_retint;
11767
15a5279a
JH
11768 /* Hooks to shared SVs and locks. */
11769 PL_sharehook = proto_perl->Isharehook;
11770 PL_lockhook = proto_perl->Ilockhook;
11771 PL_unlockhook = proto_perl->Iunlockhook;
11772 PL_threadhook = proto_perl->Ithreadhook;
11773
bce260cd
JH
11774 PL_runops_std = proto_perl->Irunops_std;
11775 PL_runops_dbg = proto_perl->Irunops_dbg;
11776
11777#ifdef THREADS_HAVE_PIDS
11778 PL_ppid = proto_perl->Ippid;
11779#endif
11780
1d7c1841
GS
11781 /* swatch cache */
11782 PL_last_swash_hv = Nullhv; /* reinits on demand */
11783 PL_last_swash_klen = 0;
11784 PL_last_swash_key[0]= '\0';
11785 PL_last_swash_tmps = (U8*)NULL;
11786 PL_last_swash_slen = 0;
11787
1d7c1841
GS
11788 PL_glob_index = proto_perl->Iglob_index;
11789 PL_srand_called = proto_perl->Isrand_called;
11790 PL_uudmap['M'] = 0; /* reinits on demand */
11791 PL_bitcount = Nullch; /* reinits on demand */
11792
66fe0623 11793 if (proto_perl->Ipsig_pend) {
a02a5408 11794 Newxz(PL_psig_pend, SIG_SIZE, int);
9dd79c3f 11795 }
66fe0623
NIS
11796 else {
11797 PL_psig_pend = (int*)NULL;
11798 }
11799
1d7c1841 11800 if (proto_perl->Ipsig_ptr) {
a02a5408
JC
11801 Newxz(PL_psig_ptr, SIG_SIZE, SV*);
11802 Newxz(PL_psig_name, SIG_SIZE, SV*);
76d3c696 11803 for (i = 1; i < SIG_SIZE; i++) {
d2d73c3e
AB
11804 PL_psig_ptr[i] = sv_dup_inc(proto_perl->Ipsig_ptr[i], param);
11805 PL_psig_name[i] = sv_dup_inc(proto_perl->Ipsig_name[i], param);
1d7c1841
GS
11806 }
11807 }
11808 else {
11809 PL_psig_ptr = (SV**)NULL;
11810 PL_psig_name = (SV**)NULL;
11811 }
11812
11813 /* thrdvar.h stuff */
11814
a0739874 11815 if (flags & CLONEf_COPY_STACKS) {
1d7c1841
GS
11816 /* next allocation will be PL_tmps_stack[PL_tmps_ix+1] */
11817 PL_tmps_ix = proto_perl->Ttmps_ix;
11818 PL_tmps_max = proto_perl->Ttmps_max;
11819 PL_tmps_floor = proto_perl->Ttmps_floor;
a02a5408 11820 Newxz(PL_tmps_stack, PL_tmps_max, SV*);
1d7c1841
GS
11821 i = 0;
11822 while (i <= PL_tmps_ix) {
d2d73c3e 11823 PL_tmps_stack[i] = sv_dup_inc(proto_perl->Ttmps_stack[i], param);
1d7c1841
GS
11824 ++i;
11825 }
11826
11827 /* next PUSHMARK() sets *(PL_markstack_ptr+1) */
11828 i = proto_perl->Tmarkstack_max - proto_perl->Tmarkstack;
a02a5408 11829 Newxz(PL_markstack, i, I32);
1d7c1841
GS
11830 PL_markstack_max = PL_markstack + (proto_perl->Tmarkstack_max
11831 - proto_perl->Tmarkstack);
11832 PL_markstack_ptr = PL_markstack + (proto_perl->Tmarkstack_ptr
11833 - proto_perl->Tmarkstack);
11834 Copy(proto_perl->Tmarkstack, PL_markstack,
11835 PL_markstack_ptr - PL_markstack + 1, I32);
11836
11837 /* next push_scope()/ENTER sets PL_scopestack[PL_scopestack_ix]
11838 * NOTE: unlike the others! */
11839 PL_scopestack_ix = proto_perl->Tscopestack_ix;
11840 PL_scopestack_max = proto_perl->Tscopestack_max;
a02a5408 11841 Newxz(PL_scopestack, PL_scopestack_max, I32);
1d7c1841
GS
11842 Copy(proto_perl->Tscopestack, PL_scopestack, PL_scopestack_ix, I32);
11843
1d7c1841 11844 /* NOTE: si_dup() looks at PL_markstack */
d2d73c3e 11845 PL_curstackinfo = si_dup(proto_perl->Tcurstackinfo, param);
1d7c1841
GS
11846
11847 /* PL_curstack = PL_curstackinfo->si_stack; */
d2d73c3e
AB
11848 PL_curstack = av_dup(proto_perl->Tcurstack, param);
11849 PL_mainstack = av_dup(proto_perl->Tmainstack, param);
1d7c1841
GS
11850
11851 /* next PUSHs() etc. set *(PL_stack_sp+1) */
11852 PL_stack_base = AvARRAY(PL_curstack);
11853 PL_stack_sp = PL_stack_base + (proto_perl->Tstack_sp
11854 - proto_perl->Tstack_base);
11855 PL_stack_max = PL_stack_base + AvMAX(PL_curstack);
11856
11857 /* next SSPUSHFOO() sets PL_savestack[PL_savestack_ix]
11858 * NOTE: unlike the others! */
11859 PL_savestack_ix = proto_perl->Tsavestack_ix;
11860 PL_savestack_max = proto_perl->Tsavestack_max;
a02a5408 11861 /*Newxz(PL_savestack, PL_savestack_max, ANY);*/
d2d73c3e 11862 PL_savestack = ss_dup(proto_perl, param);
1d7c1841
GS
11863 }
11864 else {
11865 init_stacks();
985e7056 11866 ENTER; /* perl_destruct() wants to LEAVE; */
1d7c1841
GS
11867 }
11868
11869 PL_start_env = proto_perl->Tstart_env; /* XXXXXX */
11870 PL_top_env = &PL_start_env;
11871
11872 PL_op = proto_perl->Top;
11873
11874 PL_Sv = Nullsv;
11875 PL_Xpv = (XPV*)NULL;
11876 PL_na = proto_perl->Tna;
11877
11878 PL_statbuf = proto_perl->Tstatbuf;
11879 PL_statcache = proto_perl->Tstatcache;
d2d73c3e
AB
11880 PL_statgv = gv_dup(proto_perl->Tstatgv, param);
11881 PL_statname = sv_dup_inc(proto_perl->Tstatname, param);
1d7c1841
GS
11882#ifdef HAS_TIMES
11883 PL_timesbuf = proto_perl->Ttimesbuf;
11884#endif
11885
11886 PL_tainted = proto_perl->Ttainted;
11887 PL_curpm = proto_perl->Tcurpm; /* XXX No PMOP ref count */
d2d73c3e
AB
11888 PL_rs = sv_dup_inc(proto_perl->Trs, param);
11889 PL_last_in_gv = gv_dup(proto_perl->Tlast_in_gv, param);
11890 PL_ofs_sv = sv_dup_inc(proto_perl->Tofs_sv, param);
11891 PL_defoutgv = gv_dup_inc(proto_perl->Tdefoutgv, param);
1d7c1841 11892 PL_chopset = proto_perl->Tchopset; /* XXX never deallocated */
d2d73c3e
AB
11893 PL_toptarget = sv_dup_inc(proto_perl->Ttoptarget, param);
11894 PL_bodytarget = sv_dup_inc(proto_perl->Tbodytarget, param);
11895 PL_formtarget = sv_dup(proto_perl->Tformtarget, param);
1d7c1841
GS
11896
11897 PL_restartop = proto_perl->Trestartop;
11898 PL_in_eval = proto_perl->Tin_eval;
11899 PL_delaymagic = proto_perl->Tdelaymagic;
11900 PL_dirty = proto_perl->Tdirty;
11901 PL_localizing = proto_perl->Tlocalizing;
11902
d2d73c3e 11903 PL_errors = sv_dup_inc(proto_perl->Terrors, param);
dd28f7bb 11904 PL_hv_fetch_ent_mh = Nullhe;
1d7c1841
GS
11905 PL_modcount = proto_perl->Tmodcount;
11906 PL_lastgotoprobe = Nullop;
11907 PL_dumpindent = proto_perl->Tdumpindent;
11908
11909 PL_sortcop = (OP*)any_dup(proto_perl->Tsortcop, proto_perl);
d2d73c3e
AB
11910 PL_sortstash = hv_dup(proto_perl->Tsortstash, param);
11911 PL_firstgv = gv_dup(proto_perl->Tfirstgv, param);
11912 PL_secondgv = gv_dup(proto_perl->Tsecondgv, param);
1d7c1841
GS
11913 PL_sortcxix = proto_perl->Tsortcxix;
11914 PL_efloatbuf = Nullch; /* reinits on demand */
11915 PL_efloatsize = 0; /* reinits on demand */
11916
11917 /* regex stuff */
11918
11919 PL_screamfirst = NULL;
11920 PL_screamnext = NULL;
11921 PL_maxscream = -1; /* reinits on demand */
11922 PL_lastscream = Nullsv;
11923
11924 PL_watchaddr = NULL;
11925 PL_watchok = Nullch;
11926
11927 PL_regdummy = proto_perl->Tregdummy;
1d7c1841
GS
11928 PL_regprecomp = Nullch;
11929 PL_regnpar = 0;
11930 PL_regsize = 0;
1d7c1841
GS
11931 PL_colorset = 0; /* reinits PL_colors[] */
11932 /*PL_colors[6] = {0,0,0,0,0,0};*/
1d7c1841
GS
11933 PL_reginput = Nullch;
11934 PL_regbol = Nullch;
11935 PL_regeol = Nullch;
11936 PL_regstartp = (I32*)NULL;
11937 PL_regendp = (I32*)NULL;
11938 PL_reglastparen = (U32*)NULL;
2d862feb 11939 PL_reglastcloseparen = (U32*)NULL;
1d7c1841 11940 PL_regtill = Nullch;
1d7c1841
GS
11941 PL_reg_start_tmp = (char**)NULL;
11942 PL_reg_start_tmpl = 0;
11943 PL_regdata = (struct reg_data*)NULL;
11944 PL_bostr = Nullch;
11945 PL_reg_flags = 0;
11946 PL_reg_eval_set = 0;
11947 PL_regnarrate = 0;
11948 PL_regprogram = (regnode*)NULL;
11949 PL_regindent = 0;
11950 PL_regcc = (CURCUR*)NULL;
11951 PL_reg_call_cc = (struct re_cc_state*)NULL;
11952 PL_reg_re = (regexp*)NULL;
11953 PL_reg_ganch = Nullch;
11954 PL_reg_sv = Nullsv;
53c4c00c 11955 PL_reg_match_utf8 = FALSE;
1d7c1841
GS
11956 PL_reg_magic = (MAGIC*)NULL;
11957 PL_reg_oldpos = 0;
11958 PL_reg_oldcurpm = (PMOP*)NULL;
11959 PL_reg_curpm = (PMOP*)NULL;
11960 PL_reg_oldsaved = Nullch;
11961 PL_reg_oldsavedlen = 0;
f8c7b90f 11962#ifdef PERL_OLD_COPY_ON_WRITE
504cff3b 11963 PL_nrs = Nullsv;
ed252734 11964#endif
1d7c1841
GS
11965 PL_reg_maxiter = 0;
11966 PL_reg_leftiter = 0;
11967 PL_reg_poscache = Nullch;
11968 PL_reg_poscache_size= 0;
11969
11970 /* RE engine - function pointers */
11971 PL_regcompp = proto_perl->Tregcompp;
11972 PL_regexecp = proto_perl->Tregexecp;
11973 PL_regint_start = proto_perl->Tregint_start;
11974 PL_regint_string = proto_perl->Tregint_string;
11975 PL_regfree = proto_perl->Tregfree;
11976
11977 PL_reginterp_cnt = 0;
11978 PL_reg_starttry = 0;
11979
a2efc822
SC
11980 /* Pluggable optimizer */
11981 PL_peepp = proto_perl->Tpeepp;
11982
081fc587
AB
11983 PL_stashcache = newHV();
11984
a0739874
DM
11985 if (!(flags & CLONEf_KEEP_PTR_TABLE)) {
11986 ptr_table_free(PL_ptr_table);
11987 PL_ptr_table = NULL;
11988 }
8cf8f3d1 11989
f284b03f
AMS
11990 /* Call the ->CLONE method, if it exists, for each of the stashes
11991 identified by sv_dup() above.
11992 */
d2d73c3e 11993 while(av_len(param->stashes) != -1) {
53c1dcc0
AL
11994 HV* const stash = (HV*) av_shift(param->stashes);
11995 GV* const cloner = gv_fetchmethod_autoload(stash, "CLONE", 0);
f284b03f
AMS
11996 if (cloner && GvCV(cloner)) {
11997 dSP;
11998 ENTER;
11999 SAVETMPS;
12000 PUSHMARK(SP);
84bda14a 12001 XPUSHs(sv_2mortal(newSVhek(HvNAME_HEK(stash))));
f284b03f
AMS
12002 PUTBACK;
12003 call_sv((SV*)GvCV(cloner), G_DISCARD);
12004 FREETMPS;
12005 LEAVE;
12006 }
4a09accc 12007 }
a0739874 12008
dc507217 12009 SvREFCNT_dec(param->stashes);
dc507217 12010
6d26897e
DM
12011 /* orphaned? eg threads->new inside BEGIN or use */
12012 if (PL_compcv && ! SvREFCNT(PL_compcv)) {
a3b680e6 12013 (void)SvREFCNT_inc(PL_compcv);
6d26897e
DM
12014 SAVEFREESV(PL_compcv);
12015 }
12016
1d7c1841 12017 return my_perl;
1d7c1841
GS
12018}
12019
1d7c1841 12020#endif /* USE_ITHREADS */
a0ae6670 12021
9f4817db 12022/*
ccfc67b7
JH
12023=head1 Unicode Support
12024
9f4817db
JH
12025=for apidoc sv_recode_to_utf8
12026
5d170f3a
JH
12027The encoding is assumed to be an Encode object, on entry the PV
12028of the sv is assumed to be octets in that encoding, and the sv
12029will be converted into Unicode (and UTF-8).
9f4817db 12030
5d170f3a
JH
12031If the sv already is UTF-8 (or if it is not POK), or if the encoding
12032is not a reference, nothing is done to the sv. If the encoding is not
1768d7eb
JH
12033an C<Encode::XS> Encoding object, bad things will happen.
12034(See F<lib/encoding.pm> and L<Encode>).
9f4817db 12035
5d170f3a 12036The PV of the sv is returned.
9f4817db 12037
5d170f3a
JH
12038=cut */
12039
12040char *
12041Perl_sv_recode_to_utf8(pTHX_ SV *sv, SV *encoding)
12042{
27da23d5 12043 dVAR;
220e2d4e 12044 if (SvPOK(sv) && !SvUTF8(sv) && !IN_BYTES && SvROK(encoding)) {
d0063567
DK
12045 SV *uni;
12046 STRLEN len;
93524f2b 12047 const char *s;
d0063567
DK
12048 dSP;
12049 ENTER;
12050 SAVETMPS;
220e2d4e 12051 save_re_context();
d0063567
DK
12052 PUSHMARK(sp);
12053 EXTEND(SP, 3);
12054 XPUSHs(encoding);
12055 XPUSHs(sv);
7a5fa8a2 12056/*
f9893866
NIS
12057 NI-S 2002/07/09
12058 Passing sv_yes is wrong - it needs to be or'ed set of constants
7a5fa8a2 12059 for Encode::XS, while UTf-8 decode (currently) assumes a true value means
f9893866
NIS
12060 remove converted chars from source.
12061
12062 Both will default the value - let them.
7a5fa8a2 12063
d0063567 12064 XPUSHs(&PL_sv_yes);
f9893866 12065*/
d0063567
DK
12066 PUTBACK;
12067 call_method("decode", G_SCALAR);
12068 SPAGAIN;
12069 uni = POPs;
12070 PUTBACK;
93524f2b 12071 s = SvPV_const(uni, len);
3f7c398e 12072 if (s != SvPVX_const(sv)) {
d0063567 12073 SvGROW(sv, len + 1);
93524f2b 12074 Move(s, SvPVX(sv), len + 1, char);
d0063567 12075 SvCUR_set(sv, len);
d0063567
DK
12076 }
12077 FREETMPS;
12078 LEAVE;
d0063567 12079 SvUTF8_on(sv);
95899a2a 12080 return SvPVX(sv);
f9893866 12081 }
95899a2a 12082 return SvPOKp(sv) ? SvPVX(sv) : NULL;
9f4817db
JH
12083}
12084
220e2d4e
IH
12085/*
12086=for apidoc sv_cat_decode
12087
12088The encoding is assumed to be an Encode object, the PV of the ssv is
12089assumed to be octets in that encoding and decoding the input starts
12090from the position which (PV + *offset) pointed to. The dsv will be
12091concatenated the decoded UTF-8 string from ssv. Decoding will terminate
12092when the string tstr appears in decoding output or the input ends on
12093the PV of the ssv. The value which the offset points will be modified
12094to the last input position on the ssv.
68795e93 12095
220e2d4e
IH
12096Returns TRUE if the terminator was found, else returns FALSE.
12097
12098=cut */
12099
12100bool
12101Perl_sv_cat_decode(pTHX_ SV *dsv, SV *encoding,
12102 SV *ssv, int *offset, char *tstr, int tlen)
12103{
27da23d5 12104 dVAR;
a73e8557 12105 bool ret = FALSE;
220e2d4e 12106 if (SvPOK(ssv) && SvPOK(dsv) && SvROK(encoding) && offset) {
220e2d4e
IH
12107 SV *offsv;
12108 dSP;
12109 ENTER;
12110 SAVETMPS;
12111 save_re_context();
12112 PUSHMARK(sp);
12113 EXTEND(SP, 6);
12114 XPUSHs(encoding);
12115 XPUSHs(dsv);
12116 XPUSHs(ssv);
12117 XPUSHs(offsv = sv_2mortal(newSViv(*offset)));
12118 XPUSHs(sv_2mortal(newSVpvn(tstr, tlen)));
12119 PUTBACK;
12120 call_method("cat_decode", G_SCALAR);
12121 SPAGAIN;
12122 ret = SvTRUE(TOPs);
12123 *offset = SvIV(offsv);
12124 PUTBACK;
12125 FREETMPS;
12126 LEAVE;
220e2d4e 12127 }
a73e8557
JH
12128 else
12129 Perl_croak(aTHX_ "Invalid argument to sv_cat_decode");
12130 return ret;
220e2d4e 12131}
f9893866 12132
241d1a3b
NC
12133/*
12134 * Local variables:
12135 * c-indentation-style: bsd
12136 * c-basic-offset: 4
12137 * indent-tabs-mode: t
12138 * End:
12139 *
37442d52
RGS
12140 * ex: set ts=8 sts=4 sw=4 noet:
12141 */