This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
Make -V "Compile-time options" list everything used in makedef.pl
[perl5.git] / sv.c
CommitLineData
a0d0e21e 1/* sv.c
79072805 2 *
4bb101f2 3 * Copyright (C) 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
241d1a3b 4 * 2000, 2001, 2002, 2003, 2004, 2005, by Larry Wall and others
79072805
LW
5 *
6 * You may distribute under the terms of either the GNU General Public
7 * License or the Artistic License, as specified in the README file.
8 *
a0d0e21e 9 * "I wonder what the Entish is for 'yes' and 'no'," he thought.
645c22ef
DM
10 *
11 *
5e045b90
AMS
12 * This file contains the code that creates, manipulates and destroys
13 * scalar values (SVs). The other types (AV, HV, GV, etc.) reuse the
14 * structure of an SV, so their creation and destruction is handled
15 * here; higher-level functions are in av.c, hv.c, and so on. Opcode
16 * level functions (eg. substr, split, join) for each of the types are
17 * in the pp*.c files.
79072805
LW
18 */
19
20#include "EXTERN.h"
864dbfa3 21#define PERL_IN_SV_C
79072805 22#include "perl.h"
d2f185dc 23#include "regcomp.h"
79072805 24
51371543 25#define FCALL *f
2c5424a7 26
2f8ed50e
OS
27#ifdef __Lynx__
28/* Missing proto on LynxOS */
29 char *gconvert(double, int, int, char *);
30#endif
31
e23c8137
JH
32#ifdef PERL_UTF8_CACHE_ASSERT
33/* The cache element 0 is the Unicode offset;
34 * the cache element 1 is the byte offset of the element 0;
35 * the cache element 2 is the Unicode length of the substring;
36 * the cache element 3 is the byte length of the substring;
37 * The checking of the substring side would be good
38 * but substr() has enough code paths to make my head spin;
39 * if adding more checks watch out for the following tests:
40 * t/op/index.t t/op/length.t t/op/pat.t t/op/substr.t
41 * lib/utf8.t lib/Unicode/Collate/t/index.t
42 * --jhi
43 */
44#define ASSERT_UTF8_CACHE(cache) \
45 STMT_START { if (cache) { assert((cache)[0] <= (cache)[1]); } } STMT_END
46#else
47#define ASSERT_UTF8_CACHE(cache) NOOP
48#endif
49
f8c7b90f 50#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 51#define SV_COW_NEXT_SV(sv) INT2PTR(SV *,SvUVX(sv))
607fa7f2 52#define SV_COW_NEXT_SV_SET(current,next) SvUV_set(current, PTR2UV(next))
b5ccf5f2 53/* This is a pessimistic view. Scalar must be purely a read-write PV to copy-
765f542d 54 on-write. */
765f542d 55#endif
645c22ef
DM
56
57/* ============================================================================
58
59=head1 Allocation and deallocation of SVs.
60
5e045b90
AMS
61An SV (or AV, HV, etc.) is allocated in two parts: the head (struct sv,
62av, hv...) contains type and reference count information, as well as a
63pointer to the body (struct xrv, xpv, xpviv...), which contains fields
64specific to each type.
65
4977e971
NC
66Normally, this allocation is done using arenas, which by default are
67approximately 4K chunks of memory parcelled up into N heads or bodies. The
68first slot in each arena is reserved, and is used to hold a link to the next
69arena. In the case of heads, the unused first slot also contains some flags
70and a note of the number of slots. Snaked through each arena chain is a
5e045b90 71linked list of free items; when this becomes empty, an extra arena is
4977e971 72allocated and divided up into N items which are threaded into the free list.
645c22ef
DM
73
74The following global variables are associated with arenas:
75
76 PL_sv_arenaroot pointer to list of SV arenas
77 PL_sv_root pointer to list of free SV structures
78
79 PL_foo_arenaroot pointer to list of foo arenas,
80 PL_foo_root pointer to list of free foo bodies
81 ... for foo in xiv, xnv, xrv, xpv etc.
82
83Note that some of the larger and more rarely used body types (eg xpvio)
84are not allocated using arenas, but are instead just malloc()/free()ed as
85required. Also, if PURIFY is defined, arenas are abandoned altogether,
86with all items individually malloc()ed. In addition, a few SV heads are
87not allocated from an arena, but are instead directly created as static
4977e971
NC
88or auto variables, eg PL_sv_undef. The size of arenas can be changed from
89the default by setting PERL_ARENA_SIZE appropriately at compile time.
645c22ef
DM
90
91The SV arena serves the secondary purpose of allowing still-live SVs
92to be located and destroyed during final cleanup.
93
94At the lowest level, the macros new_SV() and del_SV() grab and free
95an SV head. (If debugging with -DD, del_SV() calls the function S_del_sv()
96to return the SV to the free list with error checking.) new_SV() calls
97more_sv() / sv_add_arena() to add an extra arena if the free list is empty.
98SVs in the free list have their SvTYPE field set to all ones.
99
100Similarly, there are macros new_XIV()/del_XIV(), new_XNV()/del_XNV() etc
101that allocate and return individual body types. Normally these are mapped
ff276b08
RG
102to the arena-manipulating functions new_xiv()/del_xiv() etc, but may be
103instead mapped directly to malloc()/free() if PURIFY is defined. The
645c22ef
DM
104new/del functions remove from, or add to, the appropriate PL_foo_root
105list, and call more_xiv() etc to add a new arena if the list is empty.
106
ff276b08 107At the time of very final cleanup, sv_free_arenas() is called from
645c22ef
DM
108perl_destruct() to physically free all the arenas allocated since the
109start of the interpreter. Note that this also clears PL_he_arenaroot,
110which is otherwise dealt with in hv.c.
111
112Manipulation of any of the PL_*root pointers is protected by enclosing
113LOCK_SV_MUTEX; ... UNLOCK_SV_MUTEX calls which should Do the Right Thing
114if threads are enabled.
115
116The function visit() scans the SV arenas list, and calls a specified
117function for each SV it finds which is still live - ie which has an SvTYPE
118other than all 1's, and a non-zero SvREFCNT. visit() is used by the
119following functions (specified as [function that calls visit()] / [function
120called by visit() for each SV]):
121
122 sv_report_used() / do_report_used()
123 dump all remaining SVs (debugging aid)
124
125 sv_clean_objs() / do_clean_objs(),do_clean_named_objs()
126 Attempt to free all objects pointed to by RVs,
127 and, unless DISABLE_DESTRUCTOR_KLUDGE is defined,
128 try to do the same for all objects indirectly
129 referenced by typeglobs too. Called once from
130 perl_destruct(), prior to calling sv_clean_all()
131 below.
132
133 sv_clean_all() / do_clean_all()
134 SvREFCNT_dec(sv) each remaining SV, possibly
135 triggering an sv_free(). It also sets the
136 SVf_BREAK flag on the SV to indicate that the
137 refcnt has been artificially lowered, and thus
138 stopping sv_free() from giving spurious warnings
139 about SVs which unexpectedly have a refcnt
140 of zero. called repeatedly from perl_destruct()
141 until there are no SVs left.
142
143=head2 Summary
144
145Private API to rest of sv.c
146
147 new_SV(), del_SV(),
148
149 new_XIV(), del_XIV(),
150 new_XNV(), del_XNV(),
151 etc
152
153Public API:
154
8cf8f3d1 155 sv_report_used(), sv_clean_objs(), sv_clean_all(), sv_free_arenas()
645c22ef
DM
156
157
158=cut
159
160============================================================================ */
161
162
51371543 163
4561caa4
CS
164/*
165 * "A time to plant, and a time to uproot what was planted..."
166 */
167
77354fb4
NC
168/*
169 * PL_nice_chunk and PL_nice_chunk_size need to be set
170 * and queried under the protection of sv_mutex
171 */
172void
173Perl_offer_nice_chunk(pTHX_ void *chunk, U32 chunk_size)
174{
175 void *new_chunk;
176 U32 new_chunk_size;
177 LOCK_SV_MUTEX;
178 new_chunk = (void *)(chunk);
179 new_chunk_size = (chunk_size);
180 if (new_chunk_size > PL_nice_chunk_size) {
181 Safefree(PL_nice_chunk);
182 PL_nice_chunk = (char *) new_chunk;
183 PL_nice_chunk_size = new_chunk_size;
184 } else {
185 Safefree(chunk);
186 }
187 UNLOCK_SV_MUTEX;
188}
cac9b346 189
fd0854ff
DM
190#ifdef DEBUG_LEAKING_SCALARS
191# ifdef NETWARE
192# define FREE_SV_DEBUG_FILE(sv) PerlMemfree((sv)->sv_debug_file)
193# else
194# define FREE_SV_DEBUG_FILE(sv) PerlMemShared_free((sv)->sv_debug_file)
195# endif
196#else
197# define FREE_SV_DEBUG_FILE(sv)
198#endif
199
053fc874
GS
/* plant_SV(p): put SV head p at the front of the PL_sv_root free list.
 * The head's flags are set to SVTYPEMASK, its SvANY slot becomes the link
 * to the previous list head, and PL_sv_count is decremented. */
#define plant_SV(p) \
    STMT_START {                                        \
        FREE_SV_DEBUG_FILE(p);                          \
        SvFLAGS(p) = SVTYPEMASK;                        \
        SvANY(p) = (void *)PL_sv_root;                  \
        PL_sv_root = (p);                               \
        PL_sv_count--;                                  \
    } STMT_END
a0d0e21e 208
fba3b22e 209/* sv_mutex must be held while calling uproot_SV() */
053fc874
GS
/* uproot_SV(p): take the first head off the PL_sv_root free list, store it
 * in p, and increment PL_sv_count.  The list must not be empty. */
#define uproot_SV(p) \
    STMT_START {                                        \
        (p) = PL_sv_root;                               \
        PL_sv_count++;                                  \
        PL_sv_root = (SV*)SvANY(p);                     \
    } STMT_END
216
645c22ef 217
cac9b346
NC
218/* make some more SVs by adding another arena */
219
220/* sv_mutex must be held while calling more_sv() */
221STATIC SV*
222S_more_sv(pTHX)
223{
224 SV* sv;
225
226 if (PL_nice_chunk) {
227 sv_add_arena(PL_nice_chunk, PL_nice_chunk_size, 0);
228 PL_nice_chunk = Nullch;
229 PL_nice_chunk_size = 0;
230 }
231 else {
232 char *chunk; /* must use New here to match call to */
a02a5408 233 Newx(chunk,PERL_ARENA_SIZE,char); /* Safefree() in sv_free_arenas() */
2e7ed132 234 sv_add_arena(chunk, PERL_ARENA_SIZE, 0);
cac9b346
NC
235 }
236 uproot_SV(sv);
237 return sv;
238}
239
645c22ef
DM
240/* new_SV(): return a new, empty SV head */
241
eba0f806
DM
242#ifdef DEBUG_LEAKING_SCALARS
243/* provide a real function for a debugger to play with */
244STATIC SV*
245S_new_SV(pTHX)
246{
247 SV* sv;
248
249 LOCK_SV_MUTEX;
250 if (PL_sv_root)
251 uproot_SV(sv);
252 else
cac9b346 253 sv = S_more_sv(aTHX);
eba0f806
DM
254 UNLOCK_SV_MUTEX;
255 SvANY(sv) = 0;
256 SvREFCNT(sv) = 1;
257 SvFLAGS(sv) = 0;
fd0854ff
DM
258 sv->sv_debug_optype = PL_op ? PL_op->op_type : 0;
259 sv->sv_debug_line = (U16) ((PL_copline == NOLINE) ?
260 (PL_curcop ? CopLINE(PL_curcop) : 0) : PL_copline);
261 sv->sv_debug_inpad = 0;
262 sv->sv_debug_cloned = 0;
263# ifdef NETWARE
264 sv->sv_debug_file = PL_curcop ? savepv(CopFILE(PL_curcop)): NULL;
265# else
266 sv->sv_debug_file = PL_curcop ? savesharedpv(CopFILE(PL_curcop)): NULL;
267# endif
268
eba0f806
DM
269 return sv;
270}
271# define new_SV(p) (p)=S_new_SV(aTHX)
272
273#else
/* new_SV(p): store in p a head with SvANY and SvFLAGS zeroed and SvREFCNT
 * set to 1.  The head comes from the free list when that is non-empty,
 * otherwise from a newly added arena. */
# define new_SV(p) \
    STMT_START {                                        \
        LOCK_SV_MUTEX;                                  \
        if (!PL_sv_root)                                \
            (p) = S_more_sv(aTHX);                      \
        else                                            \
            uproot_SV(p);                               \
        UNLOCK_SV_MUTEX;                                \
        SvFLAGS(p) = 0;                                 \
        SvREFCNT(p) = 1;                                \
        SvANY(p) = 0;                                   \
    } STMT_END
eba0f806 286#endif
463ee0b2 287
645c22ef
DM
288
289/* del_SV(): return an empty SV head to the free list */
290
a0d0e21e 291#ifdef DEBUGGING
4561caa4 292
053fc874
GS
/* del_SV(p), DEBUGGING build: give head p back to the free list under the
 * SV mutex.  When the -DD debug flag is active the checking function
 * del_sv() is used instead of a plain plant_SV(). */
#define del_SV(p) \
    STMT_START {                                        \
        LOCK_SV_MUTEX;                                  \
        if (!(DEBUG_D_TEST))                            \
            plant_SV(p);                                \
        else                                            \
            del_sv(p);                                  \
        UNLOCK_SV_MUTEX;                                \
    } STMT_END
a0d0e21e 302
76e3520e 303STATIC void
cea2e8a9 304S_del_sv(pTHX_ SV *p)
463ee0b2 305{
aea4f609 306 if (DEBUG_D_TEST) {
4633a7c4 307 SV* sva;
a3b680e6 308 bool ok = 0;
3280af22 309 for (sva = PL_sv_arenaroot; sva; sva = (SV *) SvANY(sva)) {
53c1dcc0
AL
310 const SV * const sv = sva + 1;
311 const SV * const svend = &sva[SvREFCNT(sva)];
c0ff570e 312 if (p >= sv && p < svend) {
a0d0e21e 313 ok = 1;
c0ff570e
NC
314 break;
315 }
a0d0e21e
LW
316 }
317 if (!ok) {
0453d815 318 if (ckWARN_d(WARN_INTERNAL))
9014280d 319 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
472d47bc
SB
320 "Attempt to free non-arena SV: 0x%"UVxf
321 pTHX__FORMAT, PTR2UV(p) pTHX__VALUE);
a0d0e21e
LW
322 return;
323 }
324 }
4561caa4 325 plant_SV(p);
463ee0b2 326}
a0d0e21e 327
4561caa4
CS
328#else /* ! DEBUGGING */
329
330#define del_SV(p) plant_SV(p)
331
332#endif /* DEBUGGING */
463ee0b2 333
645c22ef
DM
334
335/*
ccfc67b7
JH
336=head1 SV Manipulation Functions
337
645c22ef
DM
338=for apidoc sv_add_arena
339
340Given a chunk of memory, link it to the head of the list of arenas,
341and split it into a list of free SVs.
342
343=cut
344*/
345
4633a7c4 346void
864dbfa3 347Perl_sv_add_arena(pTHX_ char *ptr, U32 size, U32 flags)
463ee0b2 348{
4633a7c4 349 SV* sva = (SV*)ptr;
463ee0b2
LW
350 register SV* sv;
351 register SV* svend;
4633a7c4
LW
352
353 /* The first SV in an arena isn't an SV. */
3280af22 354 SvANY(sva) = (void *) PL_sv_arenaroot; /* ptr to next arena */
4633a7c4
LW
355 SvREFCNT(sva) = size / sizeof(SV); /* number of SV slots */
356 SvFLAGS(sva) = flags; /* FAKE if not to be freed */
357
3280af22
NIS
358 PL_sv_arenaroot = sva;
359 PL_sv_root = sva + 1;
4633a7c4
LW
360
361 svend = &sva[SvREFCNT(sva) - 1];
362 sv = sva + 1;
463ee0b2 363 while (sv < svend) {
a0d0e21e 364 SvANY(sv) = (void *)(SV*)(sv + 1);
03e36789 365#ifdef DEBUGGING
978b032e 366 SvREFCNT(sv) = 0;
03e36789
NC
367#endif
368 /* Must always set typemask because it's awlays checked in on cleanup
369 when the arenas are walked looking for objects. */
8990e307 370 SvFLAGS(sv) = SVTYPEMASK;
463ee0b2
LW
371 sv++;
372 }
373 SvANY(sv) = 0;
03e36789
NC
374#ifdef DEBUGGING
375 SvREFCNT(sv) = 0;
376#endif
4633a7c4
LW
377 SvFLAGS(sv) = SVTYPEMASK;
378}
379
055972dc
DM
380/* visit(): call the named function for each non-free SV in the arenas
381 * whose flags field matches the flags/mask args. */
645c22ef 382
5226ed68 383STATIC I32
055972dc 384S_visit(pTHX_ SVFUNC_t f, U32 flags, U32 mask)
8990e307 385{
4633a7c4 386 SV* sva;
5226ed68 387 I32 visited = 0;
8990e307 388
3280af22 389 for (sva = PL_sv_arenaroot; sva; sva = (SV*)SvANY(sva)) {
53c1dcc0 390 register const SV * const svend = &sva[SvREFCNT(sva)];
a3b680e6 391 register SV* sv;
4561caa4 392 for (sv = sva + 1; sv < svend; ++sv) {
055972dc
DM
393 if (SvTYPE(sv) != SVTYPEMASK
394 && (sv->sv_flags & mask) == flags
395 && SvREFCNT(sv))
396 {
acfe0abc 397 (FCALL)(aTHX_ sv);
5226ed68
JH
398 ++visited;
399 }
8990e307
LW
400 }
401 }
5226ed68 402 return visited;
8990e307
LW
403}
404
758a08c3
JH
405#ifdef DEBUGGING
406
645c22ef
DM
407/* called by sv_report_used() for each live SV */
408
409static void
acfe0abc 410do_report_used(pTHX_ SV *sv)
645c22ef
DM
411{
412 if (SvTYPE(sv) != SVTYPEMASK) {
413 PerlIO_printf(Perl_debug_log, "****\n");
414 sv_dump(sv);
415 }
416}
758a08c3 417#endif
645c22ef
DM
418
419/*
420=for apidoc sv_report_used
421
422Dump the contents of all SVs not yet freed. (Debugging aid).
423
424=cut
425*/
426
void
Perl_sv_report_used(pTHX)
{
    /* Only DEBUGGING builds have do_report_used(); elsewhere this
     * function has an empty body. */
#ifdef DEBUGGING
    visit(do_report_used, 0, 0);
#endif
}
434
645c22ef
DM
435/* called by sv_clean_objs() for each live SV */
436
437static void
e15faf7d 438do_clean_objs(pTHX_ SV *ref)
645c22ef 439{
e15faf7d 440 SV* target;
645c22ef 441
e15faf7d
NC
442 if (SvROK(ref) && SvOBJECT(target = SvRV(ref))) {
443 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning object ref:\n "), sv_dump(ref)));
444 if (SvWEAKREF(ref)) {
445 sv_del_backref(target, ref);
446 SvWEAKREF_off(ref);
447 SvRV_set(ref, NULL);
645c22ef 448 } else {
e15faf7d
NC
449 SvROK_off(ref);
450 SvRV_set(ref, NULL);
451 SvREFCNT_dec(target);
645c22ef
DM
452 }
453 }
454
455 /* XXX Might want to check arrays, etc. */
456}
457
458/* called by sv_clean_objs() for each live SV */
459
460#ifndef DISABLE_DESTRUCTOR_KLUDGE
461static void
acfe0abc 462do_clean_named_objs(pTHX_ SV *sv)
645c22ef
DM
463{
464 if (SvTYPE(sv) == SVt_PVGV && GvGP(sv)) {
c69033f2
NC
465 if ((
466#ifdef PERL_DONT_CREATE_GVSV
467 GvSV(sv) &&
468#endif
469 SvOBJECT(GvSV(sv))) ||
645c22ef
DM
470 (GvAV(sv) && SvOBJECT(GvAV(sv))) ||
471 (GvHV(sv) && SvOBJECT(GvHV(sv))) ||
472 (GvIO(sv) && SvOBJECT(GvIO(sv))) ||
473 (GvCV(sv) && SvOBJECT(GvCV(sv))) )
474 {
475 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning named glob object:\n "), sv_dump(sv)));
ec5f3c78 476 SvFLAGS(sv) |= SVf_BREAK;
645c22ef
DM
477 SvREFCNT_dec(sv);
478 }
479 }
480}
481#endif
482
483/*
484=for apidoc sv_clean_objs
485
486Attempt to destroy all objects not yet freed
487
488=cut
489*/
490
4561caa4 491void
864dbfa3 492Perl_sv_clean_objs(pTHX)
4561caa4 493{
3280af22 494 PL_in_clean_objs = TRUE;
055972dc 495 visit(do_clean_objs, SVf_ROK, SVf_ROK);
4561caa4 496#ifndef DISABLE_DESTRUCTOR_KLUDGE
2d0f3c12 497 /* some barnacles may yet remain, clinging to typeglobs */
055972dc 498 visit(do_clean_named_objs, SVt_PVGV, SVTYPEMASK);
4561caa4 499#endif
3280af22 500 PL_in_clean_objs = FALSE;
4561caa4
CS
501}
502
645c22ef
DM
503/* called by sv_clean_all() for each live SV */
504
505static void
acfe0abc 506do_clean_all(pTHX_ SV *sv)
645c22ef
DM
507{
508 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning loops: SV at 0x%"UVxf"\n", PTR2UV(sv)) ));
509 SvFLAGS(sv) |= SVf_BREAK;
0e705b3b
DM
510 if (PL_comppad == (AV*)sv) {
511 PL_comppad = Nullav;
512 PL_curpad = Null(SV**);
513 }
645c22ef
DM
514 SvREFCNT_dec(sv);
515}
516
517/*
518=for apidoc sv_clean_all
519
520Decrement the refcnt of each remaining SV, possibly triggering a
521cleanup. This function may have to be called multiple times to free
ff276b08 522SVs which are in complex self-referential hierarchies.
645c22ef
DM
523
524=cut
525*/
526
5226ed68 527I32
864dbfa3 528Perl_sv_clean_all(pTHX)
8990e307 529{
5226ed68 530 I32 cleaned;
3280af22 531 PL_in_clean_all = TRUE;
055972dc 532 cleaned = visit(do_clean_all, 0,0);
3280af22 533 PL_in_clean_all = FALSE;
5226ed68 534 return cleaned;
8990e307 535}
463ee0b2 536
7cfef17e
NC
537static void
538S_free_arena(pTHX_ void **root) {
539 while (root) {
1b6737cc 540 void ** const next = *(void **)root;
7cfef17e
NC
541 Safefree(root);
542 root = next;
543 }
544}
545
645c22ef
DM
546/*
547=for apidoc sv_free_arenas
548
549Deallocate the memory used by all arenas. Note that all the individual SV
550heads and bodies within the arenas must already have been freed.
551
552=cut
553*/
554
7cfef17e
NC
/* free_arena(name): free every arena chained from PL_<name>_arenaroot,
 * then zero both PL_<name>_arenaroot and PL_<name>_root. */
#define free_arena(name)                                        \
    STMT_START {                                                \
        S_free_arena(aTHX_ (void**) PL_ ## name ## _arenaroot); \
        PL_ ## name ## _root = 0;                               \
        PL_ ## name ## _arenaroot = 0;                          \
    } STMT_END
561
4633a7c4 562void
864dbfa3 563Perl_sv_free_arenas(pTHX)
4633a7c4
LW
564{
565 SV* sva;
566 SV* svanext;
567
568 /* Free arenas here, but be careful about fake ones. (We assume
569 contiguity of the fake ones with the corresponding real ones.) */
570
3280af22 571 for (sva = PL_sv_arenaroot; sva; sva = svanext) {
4633a7c4
LW
572 svanext = (SV*) SvANY(sva);
573 while (svanext && SvFAKE(svanext))
574 svanext = (SV*) SvANY(svanext);
575
576 if (!SvFAKE(sva))
1df70142 577 Safefree(sva);
4633a7c4 578 }
8b4f5e17 579
7cfef17e
NC
580 free_arena(xnv);
581 free_arena(xpv);
582 free_arena(xpviv);
583 free_arena(xpvnv);
584 free_arena(xpvcv);
585 free_arena(xpvav);
586 free_arena(xpvhv);
587 free_arena(xpvmg);
588 free_arena(xpvgv);
589 free_arena(xpvlv);
590 free_arena(xpvbm);
591 free_arena(he);
592#if defined(USE_ITHREADS)
593 free_arena(pte);
594#endif
612f20c3 595
43c5f42d 596 Safefree(PL_nice_chunk);
3280af22
NIS
597 PL_nice_chunk = Nullch;
598 PL_nice_chunk_size = 0;
599 PL_sv_arenaroot = 0;
600 PL_sv_root = 0;
4633a7c4
LW
601}
602
29489e7c
DM
603/* ---------------------------------------------------------------------
604 *
605 * support functions for report_uninit()
606 */
607
608/* the maximum size of array or hash where we will scan looking
609 * for the undefined element that triggered the warning */
610
611#define FUV_MAX_SEARCH_SIZE 1000
612
613/* Look for an entry in the hash whose value has the same SV as val;
614 * If so, return a mortal copy of the key. */
615
616STATIC SV*
617S_find_hash_subscript(pTHX_ HV *hv, SV* val)
618{
27da23d5 619 dVAR;
29489e7c 620 register HE **array;
29489e7c
DM
621 I32 i;
622
623 if (!hv || SvMAGICAL(hv) || !HvARRAY(hv) ||
624 (HvTOTALKEYS(hv) > FUV_MAX_SEARCH_SIZE))
625 return Nullsv;
626
627 array = HvARRAY(hv);
628
629 for (i=HvMAX(hv); i>0; i--) {
f54cb97a 630 register HE *entry;
29489e7c
DM
631 for (entry = array[i]; entry; entry = HeNEXT(entry)) {
632 if (HeVAL(entry) != val)
633 continue;
634 if ( HeVAL(entry) == &PL_sv_undef ||
635 HeVAL(entry) == &PL_sv_placeholder)
636 continue;
637 if (!HeKEY(entry))
638 return Nullsv;
639 if (HeKLEN(entry) == HEf_SVKEY)
640 return sv_mortalcopy(HeKEY_sv(entry));
641 return sv_2mortal(newSVpvn(HeKEY(entry), HeKLEN(entry)));
642 }
643 }
644 return Nullsv;
645}
646
647/* Look for an entry in the array whose value has the same SV as val;
648 * If so, return the index, otherwise return -1. */
649
650STATIC I32
651S_find_array_subscript(pTHX_ AV *av, SV* val)
652{
653 SV** svp;
654 I32 i;
655 if (!av || SvMAGICAL(av) || !AvARRAY(av) ||
656 (AvFILLp(av) > FUV_MAX_SEARCH_SIZE))
657 return -1;
658
659 svp = AvARRAY(av);
660 for (i=AvFILLp(av); i>=0; i--) {
661 if (svp[i] == val && svp[i] != &PL_sv_undef)
662 return i;
663 }
664 return -1;
665}
666
667/* S_varname(): return the name of a variable, optionally with a subscript.
668 * If gv is non-zero, use the name of that global, along with gvtype (one
669 * of "$", "@", "%"); otherwise use the name of the lexical at pad offset
670 * targ. Depending on the value of the subscript_type flag, return:
671 */
672
673#define FUV_SUBSCRIPT_NONE 1 /* "@foo" */
674#define FUV_SUBSCRIPT_ARRAY 2 /* "$foo[aindex]" */
675#define FUV_SUBSCRIPT_HASH 3 /* "$foo{keyname}" */
676#define FUV_SUBSCRIPT_WITHIN 4 /* "within @foo" */
677
678STATIC SV*
be2ef075 679S_varname(pTHX_ GV *gv, const char gvtype, PADOFFSET targ,
29489e7c
DM
680 SV* keyname, I32 aindex, int subscript_type)
681{
29489e7c 682
a3b680e6 683 SV * const name = sv_newmortal();
29489e7c
DM
684 if (gv) {
685
686 /* simulate gv_fullname4(), but add literal '^' for $^FOO names
687 * XXX get rid of all this if gv_fullnameX() ever supports this
688 * directly */
689
bfed75c6 690 const char *p;
53c1dcc0 691 HV * const hv = GvSTASH(gv);
29489e7c
DM
692 if (!hv)
693 p = "???";
bfcb3514 694 else if (!(p=HvNAME_get(hv)))
29489e7c 695 p = "__ANON__";
be2ef075
NC
696 if (strEQ(p, "main"))
697 sv_setpvn(name, &gvtype, 1);
698 else
699 Perl_sv_setpvf(aTHX_ name, "%c%s::", gvtype, p);
700
29489e7c
DM
701 if (GvNAMELEN(gv)>= 1 &&
702 ((unsigned int)*GvNAME(gv)) <= 26)
703 { /* handle $^FOO */
704 Perl_sv_catpvf(aTHX_ name,"^%c", *GvNAME(gv) + 'A' - 1);
705 sv_catpvn(name,GvNAME(gv)+1,GvNAMELEN(gv)-1);
706 }
707 else
708 sv_catpvn(name,GvNAME(gv),GvNAMELEN(gv));
709 }
710 else {
53c1dcc0
AL
711 U32 unused;
712 CV * const cv = find_runcv(&unused);
713 SV *sv;
714 AV *av;
715
29489e7c 716 if (!cv || !CvPADLIST(cv))
1b6737cc 717 return Nullsv;
29489e7c
DM
718 av = (AV*)(*av_fetch(CvPADLIST(cv), 0, FALSE));
719 sv = *av_fetch(av, targ, FALSE);
720 /* SvLEN in a pad name is not to be trusted */
f9926b10 721 sv_setpv(name, SvPV_nolen_const(sv));
29489e7c
DM
722 }
723
724 if (subscript_type == FUV_SUBSCRIPT_HASH) {
1b6737cc 725 SV * const sv = NEWSV(0,0);
29489e7c 726 *SvPVX(name) = '$';
29489e7c 727 Perl_sv_catpvf(aTHX_ name, "{%s}",
3f7c398e 728 pv_display(sv,SvPVX_const(keyname), SvCUR(keyname), 0, 32));
29489e7c
DM
729 SvREFCNT_dec(sv);
730 }
731 else if (subscript_type == FUV_SUBSCRIPT_ARRAY) {
732 *SvPVX(name) = '$';
265a12b8 733 Perl_sv_catpvf(aTHX_ name, "[%"IVdf"]", (IV)aindex);
29489e7c
DM
734 }
735 else if (subscript_type == FUV_SUBSCRIPT_WITHIN)
736 sv_insert(name, 0, 0, "within ", 7);
737
738 return name;
739}
740
741
742/*
743=for apidoc find_uninit_var
744
745Find the name of the undefined variable (if any) that caused the operator o
746to issue a "Use of uninitialized value" warning.
747If match is true, only return a name if its value matches uninit_sv.
748So roughly speaking, if a unary operator (such as OP_COS) generates a
749warning, then following the direct child of the op may yield an
750OP_PADSV or OP_GV that gives the name of the undefined variable. On the
751other hand, with OP_ADD there are two branches to follow, so we only print
752the variable name if we get an exact match.
753
754The name is returned as a mortal SV.
755
756Assumes that PL_op is the op that originally triggered the error, and that
757PL_comppad/PL_curpad points to the currently executing pad.
758
759=cut
760*/
761
/* Search the op tree rooted at obase for the variable whose value is
 * uninit_sv and return its printable name as a mortal SV, or Nullsv when
 * no candidate is found.  When match is true a candidate is accepted only
 * if the SV it currently refers to is uninit_sv itself.  The function
 * recurses into child ops through find_uninit_var(). */
762STATIC SV *
763S_find_uninit_var(pTHX_ OP* obase, SV* uninit_sv, bool match)
764{
27da23d5 765 dVAR;
29489e7c
DM
766 SV *sv;
767 AV *av;
29489e7c
DM
768 GV *gv;
769 OP *o, *o2, *kid;
770
/* nothing to search, or an exact match was requested against no SV,
 * &PL_sv_undef or &PL_sv_placeholder */
771 if (!obase || (match && (!uninit_sv || uninit_sv == &PL_sv_undef ||
772 uninit_sv == &PL_sv_placeholder)))
773 return Nullsv;
774
775 switch (obase->op_type) {
776
/* whole-aggregate ops: try to name the individual element that holds
 * uninit_sv, otherwise report "within @foo" / "within %foo" */
777 case OP_RV2AV:
778 case OP_RV2HV:
779 case OP_PADAV:
780 case OP_PADHV:
781 {
f54cb97a
AL
782 const bool pad = (obase->op_type == OP_PADAV || obase->op_type == OP_PADHV);
783 const bool hash = (obase->op_type == OP_PADHV || obase->op_type == OP_RV2HV);
112dcc46
RGS
784 I32 index = 0;
785 SV *keysv = Nullsv;
29489e7c
DM
786 int subscript_type = FUV_SUBSCRIPT_WITHIN;
787
788 if (pad) { /* @lex, %lex */
789 sv = PAD_SVl(obase->op_targ);
790 gv = Nullgv;
791 }
792 else {
793 if (cUNOPx(obase)->op_first->op_type == OP_GV) {
794 /* @global, %global */
795 gv = cGVOPx_gv(cUNOPx(obase)->op_first);
796 if (!gv)
797 break;
798 sv = hash ? (SV*)GvHV(gv): (SV*)GvAV(gv);
799 }
800 else /* @{expr}, %{expr} */
801 return find_uninit_var(cUNOPx(obase)->op_first,
802 uninit_sv, match);
803 }
804
805 /* attempt to find a match within the aggregate */
806 if (hash) {
807 keysv = S_find_hash_subscript(aTHX_ (HV*)sv, uninit_sv);
808 if (keysv)
809 subscript_type = FUV_SUBSCRIPT_HASH;
810 }
811 else {
812 index = S_find_array_subscript(aTHX_ (AV*)sv, uninit_sv);
813 if (index >= 0)
814 subscript_type = FUV_SUBSCRIPT_ARRAY;
815 }
816
/* an exact match was required but no element was identified */
817 if (match && subscript_type == FUV_SUBSCRIPT_WITHIN)
818 break;
819
be2ef075 820 return varname(gv, hash ? '%' : '@', obase->op_targ,
29489e7c
DM
821 keysv, index, subscript_type);
822 }
823
824 case OP_PADSV:
825 if (match && PAD_SVl(obase->op_targ) != uninit_sv)
826 break;
be2ef075 827 return varname(Nullgv, '$', obase->op_targ,
29489e7c
DM
828 Nullsv, 0, FUV_SUBSCRIPT_NONE);
829
830 case OP_GVSV:
831 gv = cGVOPx_gv(obase);
832 if (!gv || (match && GvSV(gv) != uninit_sv))
833 break;
be2ef075 834 return varname(gv, '$', 0, Nullsv, 0, FUV_SUBSCRIPT_NONE);
29489e7c
DM
835
/* array element whose index is read from op_private; OPf_SPECIAL selects
 * a pad array, otherwise the array comes from the op's GV */
836 case OP_AELEMFAST:
837 if (obase->op_flags & OPf_SPECIAL) { /* lexical array */
838 if (match) {
1b6737cc 839 SV **svp;
29489e7c
DM
840 av = (AV*)PAD_SV(obase->op_targ);
841 if (!av || SvRMAGICAL(av))
842 break;
843 svp = av_fetch(av, (I32)obase->op_private, FALSE);
844 if (!svp || *svp != uninit_sv)
845 break;
846 }
be2ef075 847 return varname(Nullgv, '$', obase->op_targ,
29489e7c
DM
848 Nullsv, (I32)obase->op_private, FUV_SUBSCRIPT_ARRAY);
849 }
850 else {
851 gv = cGVOPx_gv(obase);
852 if (!gv)
853 break;
854 if (match) {
1b6737cc 855 SV **svp;
29489e7c
DM
856 av = GvAV(gv);
857 if (!av || SvRMAGICAL(av))
858 break;
859 svp = av_fetch(av, (I32)obase->op_private, FALSE);
860 if (!svp || *svp != uninit_sv)
861 break;
862 }
be2ef075 863 return varname(gv, '$', 0,
29489e7c
DM
864 Nullsv, (I32)obase->op_private, FUV_SUBSCRIPT_ARRAY);
865 }
866 break;
867
/* only handled when the first kid is an OP_NULL whose op_targ is OP_AELEM
 * or OP_HELEM; the search then continues in that kid's op_last */
868 case OP_EXISTS:
869 o = cUNOPx(obase)->op_first;
870 if (!o || o->op_type != OP_NULL ||
871 ! (o->op_targ == OP_AELEM || o->op_targ == OP_HELEM))
872 break;
873 return find_uninit_var(cBINOPo->op_last, uninit_sv, match);
874
875 case OP_AELEM:
876 case OP_HELEM:
877 if (PL_op == obase)
878 /* $a[uninit_expr] or $h{uninit_expr} */
879 return find_uninit_var(cBINOPx(obase)->op_last, uninit_sv, match);
880
881 gv = Nullgv;
882 o = cBINOPx(obase)->op_first;
883 kid = cBINOPx(obase)->op_last;
884
885 /* get the av or hv, and optionally the gv */
886 sv = Nullsv;
887 if (o->op_type == OP_PADAV || o->op_type == OP_PADHV) {
888 sv = PAD_SV(o->op_targ);
889 }
890 else if ((o->op_type == OP_RV2AV || o->op_type == OP_RV2HV)
891 && cUNOPo->op_first->op_type == OP_GV)
892 {
893 gv = cGVOPx_gv(cUNOPo->op_first);
894 if (!gv)
895 break;
896 sv = o->op_type == OP_RV2HV ? (SV*)GvHV(gv) : (SV*)GvAV(gv);
897 }
/* the aggregate could not be identified from the first kid */
898 if (!sv)
899 break;
900
901 if (kid && kid->op_type == OP_CONST && SvOK(cSVOPx_sv(kid))) {
902 /* index is constant */
903 if (match) {
904 if (SvMAGICAL(sv))
905 break;
906 if (obase->op_type == OP_HELEM) {
907 HE* he = hv_fetch_ent((HV*)sv, cSVOPx_sv(kid), 0, 0);
908 if (!he || HeVAL(he) != uninit_sv)
909 break;
910 }
911 else {
1b6737cc 912 SV ** const svp = av_fetch((AV*)sv, SvIV(cSVOPx_sv(kid)), FALSE);
29489e7c
DM
913 if (!svp || *svp != uninit_sv)
914 break;
915 }
916 }
917 if (obase->op_type == OP_HELEM)
be2ef075 918 return varname(gv, '%', o->op_targ,
29489e7c
DM
919 cSVOPx_sv(kid), 0, FUV_SUBSCRIPT_HASH);
920 else
be2ef075 921 return varname(gv, '@', o->op_targ, Nullsv,
29489e7c
DM
922 SvIV(cSVOPx_sv(kid)), FUV_SUBSCRIPT_ARRAY);
923 ;
924 }
925 else {
926 /* index is an expression;
927 * attempt to find a match within the aggregate */
928 if (obase->op_type == OP_HELEM) {
53c1dcc0 929 SV * const keysv = S_find_hash_subscript(aTHX_ (HV*)sv, uninit_sv);
29489e7c 930 if (keysv)
be2ef075 931 return varname(gv, '%', o->op_targ,
29489e7c
DM
932 keysv, 0, FUV_SUBSCRIPT_HASH);
933 }
934 else {
f54cb97a 935 const I32 index = S_find_array_subscript(aTHX_ (AV*)sv, uninit_sv);
29489e7c 936 if (index >= 0)
be2ef075 937 return varname(gv, '@', o->op_targ,
29489e7c
DM
938 Nullsv, index, FUV_SUBSCRIPT_ARRAY);
939 }
/* no element identified: give up if an exact match was required,
 * otherwise fall back to "within @foo" / "within %foo" */
940 if (match)
941 break;
1b6737cc 942 return varname(gv,
29489e7c 943 (o->op_type == OP_PADAV || o->op_type == OP_RV2AV)
be2ef075 944 ? '@' : '%',
29489e7c
DM
945 o->op_targ, Nullsv, 0, FUV_SUBSCRIPT_WITHIN);
946 }
947
948 break;
949
950 case OP_AASSIGN:
951 /* only examine RHS */
952 return find_uninit_var(cBINOPx(obase)->op_first, uninit_sv, match);
953
954 case OP_OPEN:
955 o = cUNOPx(obase)->op_first;
956 if (o->op_type == OP_PUSHMARK)
957 o = o->op_sibling;
958
959 if (!o->op_sibling) {
960 /* one-arg version of open is highly magical */
961
962 if (o->op_type == OP_GV) { /* open FOO; */
963 gv = cGVOPx_gv(o);
964 if (match && GvSV(gv) != uninit_sv)
965 break;
be2ef075 966 return varname(gv, '$', 0,
29489e7c
DM
967 Nullsv, 0, FUV_SUBSCRIPT_NONE);
968 }
969 /* other possibilities not handled are:
970 * open $x; or open my $x; should return '${*$x}'
971 * open expr; should return '$'.expr ideally
972 */
973 break;
974 }
975 goto do_op;
976
977 /* ops where $_ may be an implicit arg */
978 case OP_TRANS:
979 case OP_SUBST:
980 case OP_MATCH:
981 if ( !(obase->op_flags & OPf_STACKED)) {
982 if (uninit_sv == ((obase->op_private & OPpTARGET_MY)
983 ? PAD_SVl(obase->op_targ)
984 : DEFSV))
985 {
986 sv = sv_newmortal();
616d8c9c 987 sv_setpvn(sv, "$_", 2);
29489e7c
DM
988 return sv;
989 }
990 }
991 goto do_op;
992
993 case OP_PRTF:
994 case OP_PRINT:
995 /* skip filehandle as it can't produce 'undef' warning */
996 o = cUNOPx(obase)->op_first;
997 if ((obase->op_flags & OPf_STACKED) && o->op_type == OP_PUSHMARK)
998 o = o->op_sibling->op_sibling;
999 goto do_op2;
1000
1001
e21bd382 1002 case OP_RV2SV:
29489e7c
DM
1003 case OP_CUSTOM:
1004 case OP_ENTERSUB:
1005 match = 1; /* XS or custom code could trigger random warnings */
1006 goto do_op;
1007
1008 case OP_SCHOMP:
1009 case OP_CHOMP:
1010 if (SvROK(PL_rs) && uninit_sv == SvRV(PL_rs))
d0043bd1 1011 return sv_2mortal(newSVpvn("${$/}", 5));
29489e7c
DM
1012 /* FALL THROUGH */
1013
/* generic handling: examine the kids of obase (do_op), or the sibling
 * chain starting at an already chosen op o (do_op2) */
1014 default:
1015 do_op:
1016 if (!(obase->op_flags & OPf_KIDS))
1017 break;
1018 o = cUNOPx(obase)->op_first;
1019
1020 do_op2:
1021 if (!o)
1022 break;
1023
1024 /* if all except one arg are constant, or have no side-effects,
1025 * or are optimized away, then it's unambiguous */
1026 o2 = Nullop;
1027 for (kid=o; kid; kid = kid->op_sibling) {
1028 if (kid &&
1029 ( (kid->op_type == OP_CONST && SvOK(cSVOPx_sv(kid)))
1030 || (kid->op_type == OP_NULL && ! (kid->op_flags & OPf_KIDS))
1031 || (kid->op_type == OP_PUSHMARK)
1032 )
1033 )
1034 continue;
1035 if (o2) { /* more than one found */
1036 o2 = Nullop;
1037 break;
1038 }
1039 o2 = kid;
1040 }
/* exactly one candidate kid: recurse with the caller's match setting */
1041 if (o2)
1042 return find_uninit_var(o2, uninit_sv, match);
1043
/* otherwise try each op in turn, this time insisting on an exact match */
1044 /* scan all args */
1045 while (o) {
1046 sv = find_uninit_var(o, uninit_sv, 1);
1047 if (sv)
1048 return sv;
1049 o = o->op_sibling;
1050 }
1051 break;
1052 }
1053 return Nullsv;
1054}
1055
1056
645c22ef
DM
1057/*
1058=for apidoc report_uninit
1059
Print the appropriate "Use of uninitialized value" warning
1061
1062=cut
1063*/
1064
1d7c1841 1065void
29489e7c
DM
1066Perl_report_uninit(pTHX_ SV* uninit_sv)
1067{
1068 if (PL_op) {
112dcc46 1069 SV* varname = Nullsv;
29489e7c
DM
1070 if (uninit_sv) {
1071 varname = find_uninit_var(PL_op, uninit_sv,0);
1072 if (varname)
1073 sv_insert(varname, 0, 0, " ", 1);
1074 }
9014280d 1075 Perl_warner(aTHX_ packWARN(WARN_UNINITIALIZED), PL_warn_uninit,
93524f2b 1076 varname ? SvPV_nolen_const(varname) : "",
29489e7c
DM
1077 " in ", OP_DESC(PL_op));
1078 }
1d7c1841 1079 else
29489e7c
DM
1080 Perl_warner(aTHX_ packWARN(WARN_UNINITIALIZED), PL_warn_uninit,
1081 "", "", "");
1d7c1841
GS
1082}
1083
de042e1d 1084STATIC void *
e3bbdc67 1085S_more_bodies (pTHX_ void **arena_root, void **root, size_t size)
cac9b346 1086{
e3bbdc67
NC
1087 char *start;
1088 const char *end;
53c1dcc0 1089 const size_t count = PERL_ARENA_SIZE/size;
a02a5408 1090 Newx(start, count*size, char);
e3bbdc67
NC
1091 *((void **) start) = *arena_root;
1092 *arena_root = (void *)start;
cac9b346 1093
e3bbdc67 1094 end = start + (count-1) * size;
cac9b346 1095
e3bbdc67
NC
1096 /* The initial slot is used to link the arenas together, so it isn't to be
1097 linked into the list of ready-to-use bodies. */
cac9b346 1098
e3bbdc67 1099 start += size;
cac9b346 1100
e3bbdc67 1101 *root = (void *)start;
cac9b346 1102
e3bbdc67 1103 while (start < end) {
53c1dcc0 1104 char * const next = start + size;
e3bbdc67
NC
1105 *(void**) start = (void *)next;
1106 start = next;
cac9b346 1107 }
e3bbdc67 1108 *(void **)start = 0;
de042e1d
NC
1109
1110 return *root;
cac9b346
NC
1111}
1112
aeb18a1e 1113/* grab a new thing from the free list, allocating more if necessary */
645c22ef 1114
30f9da9e 1115/* 1st, the inline version */
08742458
NC
1116
/* Pop one body off the free list at *root into xpv, under the SV mutex.
 * When the list is empty, S_more_bodies() is called to allocate a new
 * arena and its return value (the head of the new list) is used instead.
 * Note that `root` is evaluated more than once. */
#define new_body_inline(xpv, arena_root, root, size) \
    STMT_START { \
	LOCK_SV_MUTEX; \
	xpv = *((void **)(root)) \
	  ? *((void **)(root)) : S_more_bodies(aTHX_ arena_root, root, size); \
	*(root) = *(void**)(xpv); \
	UNLOCK_SV_MUTEX; \
    } STMT_END
1125
30f9da9e
JC
1126/* now use the inline version in the proper function */
1127
1128STATIC void *
1129S_new_body(pTHX_ void **arena_root, void **root, size_t size)
1130{
1131 void *xpv;
1132 new_body_inline(xpv, arena_root, root, size);
1133 return xpv;
1134}
1135
aeb18a1e 1136/* return a thing to the free list */
645c22ef 1137
cb4415b8
NC
/* Push `thing` back onto the free list whose head pointer is at `root`,
 * under the SV mutex.  The first word of `thing` is overwritten with the
 * previous list head.  Both arguments are parenthesized in the expansion
 * so that expressions such as `p + 1` or `roots + i` are cast and
 * dereferenced as a whole; `root` is evaluated twice. */
#define del_body(thing, root)			\
    STMT_START {				\
	void **thing_copy = (void **)(thing);	\
	LOCK_SV_MUTEX;				\
	*thing_copy = *(root);			\
	*(root) = (void*)thing_copy;		\
	UNLOCK_SV_MUTEX;			\
    } STMT_END
932e9ff9 1146
aeb18a1e
NC
1147/* Conventionally we simply malloc() a big block of memory, then divide it
1148 up into lots of the thing that we're allocating.
645c22ef 1149
aeb18a1e
NC
   This macro will expand to a call to S_new_body. So for XPVBM (with ithreads),
   it would become

   S_new_body(my_perl, (void**)&(my_perl->Ixpvbm_arenaroot),
	      (void**)&(my_perl->Ixpvbm_root), sizeof(XPVBM))
1155*/
645c22ef 1156
/* Allocate one body of sizeof(TYPE) bytes via S_new_body().  `lctype` is
 * token-pasted to select the interpreter variables PL_<lctype>_arenaroot
 * and PL_<lctype>_root that hold the arena chain and the free list. */
#define new_body_type(TYPE,lctype)					\
    S_new_body(aTHX_ (void**)&PL_ ## lctype ## _arenaroot,		\
	       (void**)&PL_ ## lctype ## _root,				\
	       sizeof(TYPE))
1161
cb4415b8
NC
/* Return body `p` to the free list PL_<lctype>_root via del_body().
 * TYPE is accepted for symmetry with new_body_type() but is not used.
 * `p` is parenthesized so the cast applies to the whole argument
 * expression rather than to its first operand. */
#define del_body_type(p,TYPE,lctype)			\
    del_body((void*)(p), (void**)&PL_ ## lctype ## _root)
aeb18a1e
NC
1164
1165/* But for some types, we cheat. The type starts with some members that are
1166 never accessed. So we allocate the substructure, starting at the first used
1167 member, then adjust the pointer back in memory by the size of the bit not
1168 allocated, so it's as if we allocated the full structure.
1169 (But things will all go boom if you write to the part that is "not there",
1170 because you'll be overwriting the last members of the preceding structure
1171 in memory.)
1172
1173 We calculate the correction using the STRUCT_OFFSET macro. For example, if
1174 xpv_allocated is the same structure as XPV then the two OFFSETs sum to zero,
1175 and the pointer is unchanged. If the allocated structure is smaller (no
1176 initial NV actually allocated) then the net effect is to subtract the size
1177 of the NV from the pointer, to return a new pointer as if an initial NV were
1178 actually allocated.
1179
1180 This is the same trick as was used for NV and IV bodies. Ironically it
1181 doesn't need to be used for NV bodies any more, because NV is now at the
1182 start of the structure. IV bodies don't need it either, because they are
1183 no longer allocated. */
1184
/* Allocate sizeof(<lctype>_allocated) bytes via S_new_body() and return
 * a pointer adjusted so that `member` sits at the offset it has in the
 * full TYPE: the result is moved back by
 * STRUCT_OFFSET(TYPE, member) - STRUCT_OFFSET(<lctype>_allocated, member)
 * bytes.  The bytes before the allocation are therefore not owned by the
 * returned body and must never be written. */
#define new_body_allocated(TYPE,lctype,member)				\
    (void*)((char*)S_new_body(aTHX_ (void**)&PL_ ## lctype ## _arenaroot, \
			      (void**)&PL_ ## lctype ## _root,		\
			      sizeof(lctype ## _allocated)) -		\
			      STRUCT_OFFSET(TYPE, member)		\
	    + STRUCT_OFFSET(lctype ## _allocated, member))
aeb18a1e
NC
1191
1192
/* Inverse of new_body_allocated(): move `p` forward by
 * STRUCT_OFFSET(TYPE, member) - STRUCT_OFFSET(<lctype>_allocated, member)
 * bytes to recover the address that was really allocated, then hand it
 * to del_body() for the PL_<lctype>_root free list.  `p` is parenthesized
 * so that an argument such as `q + 1` is converted to char* as a whole
 * before the byte offsets are applied. */
#define del_body_allocated(p,TYPE,lctype,member)			\
    del_body((void*)((char*)(p) + STRUCT_OFFSET(TYPE, member)		\
		     - STRUCT_OFFSET(lctype ## _allocated, member)),	\
	     (void**)&PL_ ## lctype ## _root)
932e9ff9 1197
7bab3ede
MB
/* Thin casts around safemalloc()/safefree().  The expansions are fully
 * parenthesized so they behave like ordinary function calls: the result
 * of my_safemalloc() is a single primary expression, and my_safefree()
 * converts its whole argument (not just the first operand) to char*. */
#define my_safemalloc(s)	((void*)safemalloc(s))
#define my_safefree(p)	safefree((char*)(p))
463ee0b2 1200
/* Per-type body allocators.
 *
 * With PURIFY defined every body is obtained from my_safemalloc() and
 * released with my_safefree(), one allocation per body.  Note that in
 * this mode new_XNV() allocates a full XPVNV.
 *
 * Otherwise bodies come from the per-type free lists: new_body_type()
 * for types allocated at full size, new_body_allocated() for XPV, XPVIV,
 * XPVAV and XPVHV, which are allocated from their first used member
 * (xpv_cur, xav_fill, xhv_fill respectively). */
#ifdef PURIFY

#define new_XNV()	my_safemalloc(sizeof(XPVNV))
#define del_XNV(p)	my_safefree(p)

#define new_XPV()	my_safemalloc(sizeof(XPV))
#define del_XPV(p)	my_safefree(p)

#define new_XPVIV()	my_safemalloc(sizeof(XPVIV))
#define del_XPVIV(p)	my_safefree(p)

#define new_XPVNV()	my_safemalloc(sizeof(XPVNV))
#define del_XPVNV(p)	my_safefree(p)

#define new_XPVCV()	my_safemalloc(sizeof(XPVCV))
#define del_XPVCV(p)	my_safefree(p)

#define new_XPVAV()	my_safemalloc(sizeof(XPVAV))
#define del_XPVAV(p)	my_safefree(p)

#define new_XPVHV()	my_safemalloc(sizeof(XPVHV))
#define del_XPVHV(p)	my_safefree(p)

#define new_XPVMG()	my_safemalloc(sizeof(XPVMG))
#define del_XPVMG(p)	my_safefree(p)

#define new_XPVGV()	my_safemalloc(sizeof(XPVGV))
#define del_XPVGV(p)	my_safefree(p)

#define new_XPVLV()	my_safemalloc(sizeof(XPVLV))
#define del_XPVLV(p)	my_safefree(p)

#define new_XPVBM()	my_safemalloc(sizeof(XPVBM))
#define del_XPVBM(p)	my_safefree(p)

#else /* !PURIFY */

#define new_XNV()	new_body_type(NV, xnv)
#define del_XNV(p)	del_body_type(p, NV, xnv)

#define new_XPV()	new_body_allocated(XPV, xpv, xpv_cur)
#define del_XPV(p)	del_body_allocated(p, XPV, xpv, xpv_cur)

#define new_XPVIV()	new_body_allocated(XPVIV, xpviv, xpv_cur)
#define del_XPVIV(p)	del_body_allocated(p, XPVIV, xpviv, xpv_cur)

#define new_XPVNV()	new_body_type(XPVNV, xpvnv)
#define del_XPVNV(p)	del_body_type(p, XPVNV, xpvnv)

#define new_XPVCV()	new_body_type(XPVCV, xpvcv)
#define del_XPVCV(p)	del_body_type(p, XPVCV, xpvcv)

#define new_XPVAV()	new_body_allocated(XPVAV, xpvav, xav_fill)
#define del_XPVAV(p)	del_body_allocated(p, XPVAV, xpvav, xav_fill)

#define new_XPVHV()	new_body_allocated(XPVHV, xpvhv, xhv_fill)
#define del_XPVHV(p)	del_body_allocated(p, XPVHV, xpvhv, xhv_fill)

#define new_XPVMG()	new_body_type(XPVMG, xpvmg)
#define del_XPVMG(p)	del_body_type(p, XPVMG, xpvmg)

#define new_XPVGV()	new_body_type(XPVGV, xpvgv)
#define del_XPVGV(p)	del_body_type(p, XPVGV, xpvgv)

#define new_XPVLV()	new_body_type(XPVLV, xpvlv)
#define del_XPVLV(p)	del_body_type(p, XPVLV, xpvlv)

#define new_XPVBM()	new_body_type(XPVBM, xpvbm)
#define del_XPVBM(p)	del_body_type(p, XPVBM, xpvbm)

#endif /* PURIFY */

/* XPVFM and XPVIO bodies are always malloc()ed individually, whether or
   not PURIFY is defined. */
#define new_XPVFM()	my_safemalloc(sizeof(XPVFM))
#define del_XPVFM(p)	my_safefree(p)

#define new_XPVIO()	my_safemalloc(sizeof(XPVIO))
#define del_XPVIO(p)	my_safefree(p)
8990e307 1278
954c1994
GS
1279/*
1280=for apidoc sv_upgrade
1281
ff276b08 1282Upgrade an SV to a more complex form. Generally adds a new body type to the
645c22ef 1283SV, then copies across as much information as possible from the old body.
ff276b08 1284You generally want to use the C<SvUPGRADE> macro wrapper. See also C<svtype>.
954c1994
GS
1285
1286=cut
1287*/
1288
63f97190 1289void
864dbfa3 1290Perl_sv_upgrade(pTHX_ register SV *sv, U32 mt)
79072805 1291{
9a085840 1292 void** old_body_arena;
878cc751 1293 size_t old_body_offset;
4cbc76b1 1294 size_t old_body_length; /* Well, the length to copy. */
878cc751 1295 void* old_body;
16b305e3
NC
1296#ifndef NV_ZERO_IS_ALLBITS_ZERO
1297 /* If NV 0.0 is store as all bits 0 then Zero() already creates a correct
1298 0.0 for us. */
4cbc76b1 1299 bool zero_nv = TRUE;
16b305e3 1300#endif
403d36eb
NC
1301 void* new_body;
1302 size_t new_body_length;
1303 size_t new_body_offset;
1304 void** new_body_arena;
1305 void** new_body_arenaroot;
53c1dcc0 1306 const U32 old_type = SvTYPE(sv);
79072805 1307
765f542d
NC
1308 if (mt != SVt_PV && SvIsCOW(sv)) {
1309 sv_force_normal_flags(sv, 0);
f130fd45
NIS
1310 }
1311
79072805 1312 if (SvTYPE(sv) == mt)
63f97190 1313 return;
79072805 1314
f5282e15 1315 if (SvTYPE(sv) > mt)
921edb34
RGS
1316 Perl_croak(aTHX_ "sv_upgrade from type %d down to type %d",
1317 (int)SvTYPE(sv), (int)mt);
f5282e15 1318
d2e56290 1319
878cc751
NC
1320 old_body = SvANY(sv);
1321 old_body_arena = 0;
1322 old_body_offset = 0;
4cbc76b1 1323 old_body_length = 0;
403d36eb
NC
1324 new_body_offset = 0;
1325 new_body_length = ~0;
1326
1327 /* Copying structures onto other structures that have been neatly zeroed
1328 has a subtle gotcha. Consider XPVMG
1329
1330 +------+------+------+------+------+-------+-------+
1331 | NV | CUR | LEN | IV | MAGIC | STASH |
1332 +------+------+------+------+------+-------+-------+
1333 0 4 8 12 16 20 24 28
1334
1335 where NVs are aligned to 8 bytes, so that sizeof that structure is
1336 actually 32 bytes long, with 4 bytes of padding at the end:
1337
1338 +------+------+------+------+------+-------+-------+------+
1339 | NV | CUR | LEN | IV | MAGIC | STASH | ??? |
1340 +------+------+------+------+------+-------+-------+------+
1341 0 4 8 12 16 20 24 28 32
1342
1343 so what happens if you allocate memory for this structure:
1344
1345 +------+------+------+------+------+-------+-------+------+------+...
1346 | NV | CUR | LEN | IV | MAGIC | STASH | GP | NAME |
1347 +------+------+------+------+------+-------+-------+------+------+...
1348 0 4 8 12 16 20 24 28 32 36
1349
1350 zero it, then copy sizeof(XPVMG) bytes on top of it? Not quite what you
1351 expect, because you copy the area marked ??? onto GP. Now, ??? may have
1352 started out as zero once, but it's quite possible that it isn't. So now,
1353 rather than a nicely zeroed GP, you have it pointing somewhere random.
1354 Bugs ensue.
1355
1356 (In fact, GP ends up pointing at a previous GP structure, because the
1357 principle cause of the padding in XPVMG getting garbage is a copy of
1358 sizeof(XPVMG) bytes from a XPVGV structure in sv_unglob)
1359
1360 So we are careful and work out the size of used parts of all the
1361 structures. */
878cc751 1362
79072805
LW
1363 switch (SvTYPE(sv)) {
1364 case SVt_NULL:
79072805 1365 break;
79072805 1366 case SVt_IV:
ed6116ce 1367 if (mt == SVt_NV)
463ee0b2 1368 mt = SVt_PVNV;
ed6116ce
LW
1369 else if (mt < SVt_PVIV)
1370 mt = SVt_PVIV;
4cbc76b1
NC
1371 old_body_offset = STRUCT_OFFSET(XPVIV, xiv_iv);
1372 old_body_length = sizeof(IV);
79072805
LW
1373 break;
1374 case SVt_NV:
9a085840 1375 old_body_arena = (void **) &PL_xnv_root;
4cbc76b1 1376 old_body_length = sizeof(NV);
16b305e3 1377#ifndef NV_ZERO_IS_ALLBITS_ZERO
4cbc76b1 1378 zero_nv = FALSE;
16b305e3 1379#endif
ed6116ce 1380 if (mt < SVt_PVNV)
79072805
LW
1381 mt = SVt_PVNV;
1382 break;
ed6116ce 1383 case SVt_RV:
ed6116ce 1384 break;
79072805 1385 case SVt_PV:
9a085840 1386 old_body_arena = (void **) &PL_xpv_root;
878cc751
NC
1387 old_body_offset = STRUCT_OFFSET(XPV, xpv_cur)
1388 - STRUCT_OFFSET(xpv_allocated, xpv_cur);
403d36eb
NC
1389 old_body_length = STRUCT_OFFSET(XPV, xpv_len)
1390 + sizeof (((XPV*)SvANY(sv))->xpv_len)
1391 - old_body_offset;
748a9306
LW
1392 if (mt <= SVt_IV)
1393 mt = SVt_PVIV;
1394 else if (mt == SVt_NV)
1395 mt = SVt_PVNV;
79072805
LW
1396 break;
1397 case SVt_PVIV:
9a085840 1398 old_body_arena = (void **) &PL_xpviv_root;
878cc751
NC
1399 old_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur)
1400 - STRUCT_OFFSET(xpviv_allocated, xpv_cur);
403d36eb
NC
1401 old_body_length = STRUCT_OFFSET(XPVIV, xiv_u)
1402 + sizeof (((XPVIV*)SvANY(sv))->xiv_u)
1403 - old_body_offset;
79072805
LW
1404 break;
1405 case SVt_PVNV:
9a085840 1406 old_body_arena = (void **) &PL_xpvnv_root;
403d36eb
NC
1407 old_body_length = STRUCT_OFFSET(XPVNV, xiv_u)
1408 + sizeof (((XPVNV*)SvANY(sv))->xiv_u);
16b305e3 1409#ifndef NV_ZERO_IS_ALLBITS_ZERO
4cbc76b1 1410 zero_nv = FALSE;
16b305e3 1411#endif
79072805
LW
1412 break;
1413 case SVt_PVMG:
0ec50a73
NC
1414 /* Because the XPVMG of PL_mess_sv isn't allocated from the arena,
1415 there's no way that it can be safely upgraded, because perl.c
1416 expects to Safefree(SvANY(PL_mess_sv)) */
1417 assert(sv != PL_mess_sv);
bce8f412
NC
1418 /* This flag bit is used to mean other things in other scalar types.
1419 Given that it only has meaning inside the pad, it shouldn't be set
1420 on anything that can get upgraded. */
1421 assert((SvFLAGS(sv) & SVpad_TYPED) == 0);
9a085840 1422 old_body_arena = (void **) &PL_xpvmg_root;
403d36eb
NC
1423 old_body_length = STRUCT_OFFSET(XPVMG, xmg_stash)
1424 + sizeof (((XPVMG*)SvANY(sv))->xmg_stash);
16b305e3 1425#ifndef NV_ZERO_IS_ALLBITS_ZERO
4cbc76b1 1426 zero_nv = FALSE;
16b305e3 1427#endif
79072805
LW
1428 break;
1429 default:
cea2e8a9 1430 Perl_croak(aTHX_ "Can't upgrade that kind of scalar");
79072805
LW
1431 }
1432
ffb05e06
NC
1433 SvFLAGS(sv) &= ~SVTYPEMASK;
1434 SvFLAGS(sv) |= mt;
1435
79072805
LW
1436 switch (mt) {
1437 case SVt_NULL:
cea2e8a9 1438 Perl_croak(aTHX_ "Can't upgrade to undef");
79072805 1439 case SVt_IV:
4cbc76b1 1440 assert(old_type == SVt_NULL);
339049b0 1441 SvANY(sv) = (XPVIV*)((char*)&(sv->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
403d36eb 1442 SvIV_set(sv, 0);
85274cbc 1443 return;
79072805 1444 case SVt_NV:
4cbc76b1 1445 assert(old_type == SVt_NULL);
79072805 1446 SvANY(sv) = new_XNV();
403d36eb 1447 SvNV_set(sv, 0);
85274cbc 1448 return;
ed6116ce 1449 case SVt_RV:
4cbc76b1 1450 assert(old_type == SVt_NULL);
339049b0 1451 SvANY(sv) = &sv->sv_u.svu_rv;
403d36eb 1452 SvRV_set(sv, 0);
85274cbc 1453 return;
79072805
LW
1454 case SVt_PVHV:
1455 SvANY(sv) = new_XPVHV();
463ee0b2
LW
1456 HvFILL(sv) = 0;
1457 HvMAX(sv) = 0;
8aacddc1 1458 HvTOTALKEYS(sv) = 0;
bd4b1eb5 1459
2068cd4d
NC
1460 goto hv_av_common;
1461
1462 case SVt_PVAV:
1463 SvANY(sv) = new_XPVAV();
1464 AvMAX(sv) = -1;
1465 AvFILLp(sv) = -1;
1466 AvALLOC(sv) = 0;
1467 AvREAL_only(sv);
1468
1469 hv_av_common:
1470 /* SVt_NULL isn't the only thing upgraded to AV or HV.
1471 The target created by newSVrv also is, and it can have magic.
1472 However, it never has SvPVX set.
1473 */
1474 if (old_type >= SVt_RV) {
1475 assert(SvPVX_const(sv) == 0);
8bd4d4c5 1476 }
2068cd4d
NC
1477
1478 /* Could put this in the else clause below, as PVMG must have SvPVX
1479 0 already (the assertion above) */
bd4b1eb5 1480 SvPV_set(sv, (char*)0);
2068cd4d
NC
1481
1482 if (old_type >= SVt_PVMG) {
1483 SvMAGIC_set(sv, ((XPVMG*)old_body)->xmg_magic);
1484 SvSTASH_set(sv, ((XPVMG*)old_body)->xmg_stash);
1485 } else {
1486 SvMAGIC_set(sv, 0);
1487 SvSTASH_set(sv, 0);
1488 }
79072805 1489 break;
bd4b1eb5
NC
1490
1491 case SVt_PVIO:
403d36eb
NC
1492 new_body = new_XPVIO();
1493 new_body_length = sizeof(XPVIO);
1494 goto zero;
bd4b1eb5 1495 case SVt_PVFM:
403d36eb
NC
1496 new_body = new_XPVFM();
1497 new_body_length = sizeof(XPVFM);
1498 goto zero;
1499
bd4b1eb5 1500 case SVt_PVBM:
403d36eb
NC
1501 new_body_length = sizeof(XPVBM);
1502 new_body_arena = (void **) &PL_xpvbm_root;
1503 new_body_arenaroot = (void **) &PL_xpvbm_arenaroot;
1504 goto new_body;
bd4b1eb5 1505 case SVt_PVGV:
403d36eb
NC
1506 new_body_length = sizeof(XPVGV);
1507 new_body_arena = (void **) &PL_xpvgv_root;
1508 new_body_arenaroot = (void **) &PL_xpvgv_arenaroot;
1509 goto new_body;
79072805 1510 case SVt_PVCV:
403d36eb
NC
1511 new_body_length = sizeof(XPVCV);
1512 new_body_arena = (void **) &PL_xpvcv_root;
1513 new_body_arenaroot = (void **) &PL_xpvcv_arenaroot;
1514 goto new_body;
bd4b1eb5 1515 case SVt_PVLV:
403d36eb
NC
1516 new_body_length = sizeof(XPVLV);
1517 new_body_arena = (void **) &PL_xpvlv_root;
1518 new_body_arenaroot = (void **) &PL_xpvlv_arenaroot;
1519 goto new_body;
1520 case SVt_PVMG:
1521 new_body_length = sizeof(XPVMG);
1522 new_body_arena = (void **) &PL_xpvmg_root;
1523 new_body_arenaroot = (void **) &PL_xpvmg_arenaroot;
1524 goto new_body;
1525 case SVt_PVNV:
1526 new_body_length = sizeof(XPVNV);
1527 new_body_arena = (void **) &PL_xpvnv_root;
1528 new_body_arenaroot = (void **) &PL_xpvnv_arenaroot;
1529 goto new_body;
1530 case SVt_PVIV:
1531 new_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur)
1532 - STRUCT_OFFSET(xpviv_allocated, xpv_cur);
1533 new_body_length = sizeof(XPVIV) - new_body_offset;
1534 new_body_arena = (void **) &PL_xpviv_root;
1535 new_body_arenaroot = (void **) &PL_xpviv_arenaroot;
1536 /* XXX Is this still needed? Was it ever needed? Surely as there is
1537 no route from NV to PVIV, NOK can never be true */
1538 if (SvNIOK(sv))
1539 (void)SvIOK_on(sv);
1540 SvNOK_off(sv);
1541 goto new_body_no_NV;
1542 case SVt_PV:
1543 new_body_offset = STRUCT_OFFSET(XPV, xpv_cur)
1544 - STRUCT_OFFSET(xpv_allocated, xpv_cur);
1545 new_body_length = sizeof(XPV) - new_body_offset;
1546 new_body_arena = (void **) &PL_xpv_root;
1547 new_body_arenaroot = (void **) &PL_xpv_arenaroot;
1548 new_body_no_NV:
1549 /* PV and PVIV don't have an NV slot. */
16b305e3 1550#ifndef NV_ZERO_IS_ALLBITS_ZERO
403d36eb 1551 zero_nv = FALSE;
16b305e3 1552#endif
403d36eb 1553
16b305e3
NC
1554 new_body:
1555 assert(new_body_length);
403d36eb 1556#ifndef PURIFY
16b305e3 1557 /* This points to the start of the allocated area. */
08742458
NC
1558 new_body_inline(new_body, new_body_arenaroot, new_body_arena,
1559 new_body_length);
403d36eb 1560#else
16b305e3
NC
1561 /* We always allocated the full length item with PURIFY */
1562 new_body_length += new_body_offset;
1563 new_body_offset = 0;
1564 new_body = my_safemalloc(new_body_length);
403d36eb
NC
1565
1566#endif
16b305e3
NC
1567 zero:
1568 Zero(new_body, new_body_length, char);
1569 new_body = ((char *)new_body) - new_body_offset;
1570 SvANY(sv) = new_body;
1571
1572 if (old_body_length) {
1573 Copy((char *)old_body + old_body_offset,
1574 (char *)new_body + old_body_offset,
1575 old_body_length, char);
1576 }
403d36eb 1577
16b305e3
NC
1578#ifndef NV_ZERO_IS_ALLBITS_ZERO
1579 if (zero_nv)
1580 SvNV_set(sv, 0);
1581#endif
403d36eb 1582
16b305e3
NC
1583 if (mt == SVt_PVIO)
1584 IoPAGE_LEN(sv) = 60;
1585 if (old_type < SVt_RV)
1586 SvPV_set(sv, 0);
8990e307 1587 break;
403d36eb
NC
1588 default:
1589 Perl_croak(aTHX_ "panic: sv_upgrade to unknown type %lu", mt);
8990e307 1590 }
878cc751
NC
1591
1592
1593 if (old_body_arena) {
1594#ifdef PURIFY
ee6954bb 1595 my_safefree(old_body);
878cc751 1596#else
cb4415b8
NC
1597 del_body((void*)((char*)old_body + old_body_offset),
1598 old_body_arena);
878cc751 1599#endif
2068cd4d 1600 }
79072805
LW
1601}
1602
645c22ef
DM
1603/*
1604=for apidoc sv_backoff
1605
1606Remove any string offset. You should normally use the C<SvOOK_off> macro
1607wrapper instead.
1608
1609=cut
1610*/
1611
79072805 1612int
864dbfa3 1613Perl_sv_backoff(pTHX_ register SV *sv)
79072805
LW
1614{
1615 assert(SvOOK(sv));
b79f7545
NC
1616 assert(SvTYPE(sv) != SVt_PVHV);
1617 assert(SvTYPE(sv) != SVt_PVAV);
463ee0b2 1618 if (SvIVX(sv)) {
53c1dcc0 1619 const char * const s = SvPVX_const(sv);
b162af07 1620 SvLEN_set(sv, SvLEN(sv) + SvIVX(sv));
f880fe2f 1621 SvPV_set(sv, SvPVX(sv) - SvIVX(sv));
79072805 1622 SvIV_set(sv, 0);
463ee0b2 1623 Move(s, SvPVX(sv), SvCUR(sv)+1, char);
79072805
LW
1624 }
1625 SvFLAGS(sv) &= ~SVf_OOK;
a0d0e21e 1626 return 0;
79072805
LW
1627}
1628
954c1994
GS
1629/*
1630=for apidoc sv_grow
1631
645c22ef
DM
1632Expands the character buffer in the SV. If necessary, uses C<sv_unref> and
1633upgrades the SV to C<SVt_PV>. Returns a pointer to the character buffer.
1634Use the C<SvGROW> wrapper instead.
954c1994
GS
1635
1636=cut
1637*/
1638
79072805 1639char *
864dbfa3 1640Perl_sv_grow(pTHX_ register SV *sv, register STRLEN newlen)
79072805
LW
1641{
1642 register char *s;
1643
55497cff 1644#ifdef HAS_64K_LIMIT
79072805 1645 if (newlen >= 0x10000) {
1d7c1841
GS
1646 PerlIO_printf(Perl_debug_log,
1647 "Allocation too large: %"UVxf"\n", (UV)newlen);
79072805
LW
1648 my_exit(1);
1649 }
55497cff 1650#endif /* HAS_64K_LIMIT */
a0d0e21e
LW
1651 if (SvROK(sv))
1652 sv_unref(sv);
79072805
LW
1653 if (SvTYPE(sv) < SVt_PV) {
1654 sv_upgrade(sv, SVt_PV);
93524f2b 1655 s = SvPVX_mutable(sv);
79072805
LW
1656 }
1657 else if (SvOOK(sv)) { /* pv is offset? */
1658 sv_backoff(sv);
93524f2b 1659 s = SvPVX_mutable(sv);
79072805
LW
1660 if (newlen > SvLEN(sv))
1661 newlen += 10 * (newlen - SvCUR(sv)); /* avoid copy each time */
c6f8c383
GA
1662#ifdef HAS_64K_LIMIT
1663 if (newlen >= 0x10000)
1664 newlen = 0xFFFF;
1665#endif
79072805 1666 }
bc44a8a2 1667 else
4d84ee25 1668 s = SvPVX_mutable(sv);
54f0641b 1669
79072805 1670 if (newlen > SvLEN(sv)) { /* need more room? */
7a9b70e9 1671 newlen = PERL_STRLEN_ROUNDUP(newlen);
8d6dde3e 1672 if (SvLEN(sv) && s) {
7bab3ede 1673#ifdef MYMALLOC
93524f2b 1674 const STRLEN l = malloced_size((void*)SvPVX_const(sv));
8d6dde3e
IZ
1675 if (newlen <= l) {
1676 SvLEN_set(sv, l);
1677 return s;
1678 } else
c70c8a0a 1679#endif
1936d2a7 1680 s = saferealloc(s, newlen);
8d6dde3e 1681 }
bfed75c6 1682 else {
1936d2a7 1683 s = safemalloc(newlen);
3f7c398e
SP
1684 if (SvPVX_const(sv) && SvCUR(sv)) {
1685 Move(SvPVX_const(sv), s, (newlen < SvCUR(sv)) ? newlen : SvCUR(sv), char);
40565179 1686 }
4e83176d 1687 }
79072805 1688 SvPV_set(sv, s);
e1ec3a88 1689 SvLEN_set(sv, newlen);
79072805
LW
1690 }
1691 return s;
1692}
1693
954c1994
GS
1694/*
1695=for apidoc sv_setiv
1696
645c22ef
DM
1697Copies an integer into the given SV, upgrading first if necessary.
1698Does not handle 'set' magic. See also C<sv_setiv_mg>.
954c1994
GS
1699
1700=cut
1701*/
1702
79072805 1703void
864dbfa3 1704Perl_sv_setiv(pTHX_ register SV *sv, IV i)
79072805 1705{
765f542d 1706 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2
LW
1707 switch (SvTYPE(sv)) {
1708 case SVt_NULL:
79072805 1709 sv_upgrade(sv, SVt_IV);
463ee0b2
LW
1710 break;
1711 case SVt_NV:
1712 sv_upgrade(sv, SVt_PVNV);
1713 break;
ed6116ce 1714 case SVt_RV:
463ee0b2 1715 case SVt_PV:
79072805 1716 sv_upgrade(sv, SVt_PVIV);
463ee0b2 1717 break;
a0d0e21e
LW
1718
1719 case SVt_PVGV:
a0d0e21e
LW
1720 case SVt_PVAV:
1721 case SVt_PVHV:
1722 case SVt_PVCV:
1723 case SVt_PVFM:
1724 case SVt_PVIO:
411caa50 1725 Perl_croak(aTHX_ "Can't coerce %s to integer in %s", sv_reftype(sv,0),
53e06cf0 1726 OP_DESC(PL_op));
463ee0b2 1727 }
a0d0e21e 1728 (void)SvIOK_only(sv); /* validate number */
45977657 1729 SvIV_set(sv, i);
463ee0b2 1730 SvTAINT(sv);
79072805
LW
1731}
1732
954c1994
GS
1733/*
1734=for apidoc sv_setiv_mg
1735
1736Like C<sv_setiv>, but also handles 'set' magic.
1737
1738=cut
1739*/
1740
void
Perl_sv_setiv_mg(pTHX_ register SV *sv, IV i)
{
    /* Store the value first, then trigger 'set' magic on the result. */
    sv_setiv(sv,i);
    SvSETMAGIC(sv);
}
1747
954c1994
GS
1748/*
1749=for apidoc sv_setuv
1750
645c22ef
DM
1751Copies an unsigned integer into the given SV, upgrading first if necessary.
1752Does not handle 'set' magic. See also C<sv_setuv_mg>.
954c1994
GS
1753
1754=cut
1755*/
1756
ef50df4b 1757void
864dbfa3 1758Perl_sv_setuv(pTHX_ register SV *sv, UV u)
55497cff 1759{
55ada374
NC
1760 /* With these two if statements:
1761 u=1.49 s=0.52 cu=72.49 cs=10.64 scripts=270 tests=20865
d460ef45 1762
55ada374
NC
1763 without
1764 u=1.35 s=0.47 cu=73.45 cs=11.43 scripts=270 tests=20865
d460ef45 1765
55ada374
NC
1766 If you wish to remove them, please benchmark to see what the effect is
1767 */
28e5dec8
JH
1768 if (u <= (UV)IV_MAX) {
1769 sv_setiv(sv, (IV)u);
1770 return;
1771 }
25da4f38
IZ
1772 sv_setiv(sv, 0);
1773 SvIsUV_on(sv);
607fa7f2 1774 SvUV_set(sv, u);
55497cff 1775}
1776
954c1994
GS
1777/*
1778=for apidoc sv_setuv_mg
1779
1780Like C<sv_setuv>, but also handles 'set' magic.
1781
1782=cut
1783*/
1784
55497cff 1785void
864dbfa3 1786Perl_sv_setuv_mg(pTHX_ register SV *sv, UV u)
ef50df4b 1787{
aa0f650e
NC
1788 sv_setiv(sv, 0);
1789 SvIsUV_on(sv);
1790 sv_setuv(sv,u);
ef50df4b
GS
1791 SvSETMAGIC(sv);
1792}
1793
954c1994
GS
1794/*
1795=for apidoc sv_setnv
1796
645c22ef
DM
1797Copies a double into the given SV, upgrading first if necessary.
1798Does not handle 'set' magic. See also C<sv_setnv_mg>.
954c1994
GS
1799
1800=cut
1801*/
1802
ef50df4b 1803void
65202027 1804Perl_sv_setnv(pTHX_ register SV *sv, NV num)
79072805 1805{
765f542d 1806 SV_CHECK_THINKFIRST_COW_DROP(sv);
a0d0e21e
LW
1807 switch (SvTYPE(sv)) {
1808 case SVt_NULL:
1809 case SVt_IV:
79072805 1810 sv_upgrade(sv, SVt_NV);
a0d0e21e 1811 break;
a0d0e21e
LW
1812 case SVt_RV:
1813 case SVt_PV:
1814 case SVt_PVIV:
79072805 1815 sv_upgrade(sv, SVt_PVNV);
a0d0e21e 1816 break;
827b7e14 1817
a0d0e21e 1818 case SVt_PVGV:
a0d0e21e
LW
1819 case SVt_PVAV:
1820 case SVt_PVHV:
1821 case SVt_PVCV:
1822 case SVt_PVFM:
1823 case SVt_PVIO:
411caa50 1824 Perl_croak(aTHX_ "Can't coerce %s to number in %s", sv_reftype(sv,0),
53e06cf0 1825 OP_NAME(PL_op));
79072805 1826 }
9d6ce603 1827 SvNV_set(sv, num);
a0d0e21e 1828 (void)SvNOK_only(sv); /* validate number */
463ee0b2 1829 SvTAINT(sv);
79072805
LW
1830}
1831
954c1994
GS
1832/*
1833=for apidoc sv_setnv_mg
1834
1835Like C<sv_setnv>, but also handles 'set' magic.
1836
1837=cut
1838*/
1839
void
Perl_sv_setnv_mg(pTHX_ register SV *sv, NV num)
{
    /* Store the value first, then trigger 'set' magic on the result. */
    sv_setnv(sv,num);
    SvSETMAGIC(sv);
}
1846
645c22ef
DM
1847/* Print an "isn't numeric" warning, using a cleaned-up,
1848 * printable version of the offending string
1849 */
1850
76e3520e 1851STATIC void
cea2e8a9 1852S_not_a_number(pTHX_ SV *sv)
a0d0e21e 1853{
94463019
JH
1854 SV *dsv;
1855 char tmpbuf[64];
1b6737cc 1856 const char *pv;
94463019
JH
1857
1858 if (DO_UTF8(sv)) {
d0043bd1 1859 dsv = sv_2mortal(newSVpvn("", 0));
94463019
JH
1860 pv = sv_uni_display(dsv, sv, 10, 0);
1861 } else {
1862 char *d = tmpbuf;
1863 char *limit = tmpbuf + sizeof(tmpbuf) - 8;
1864 /* each *s can expand to 4 chars + "...\0",
1865 i.e. need room for 8 chars */
ecdeb87c 1866
e62f0680
NC
1867 const char *s, *end;
1868 for (s = SvPVX_const(sv), end = s + SvCUR(sv); s < end && d < limit;
1869 s++) {
94463019
JH
1870 int ch = *s & 0xFF;
1871 if (ch & 128 && !isPRINT_LC(ch)) {
1872 *d++ = 'M';
1873 *d++ = '-';
1874 ch &= 127;
1875 }
1876 if (ch == '\n') {
1877 *d++ = '\\';
1878 *d++ = 'n';
1879 }
1880 else if (ch == '\r') {
1881 *d++ = '\\';
1882 *d++ = 'r';
1883 }
1884 else if (ch == '\f') {
1885 *d++ = '\\';
1886 *d++ = 'f';
1887 }
1888 else if (ch == '\\') {
1889 *d++ = '\\';
1890 *d++ = '\\';
1891 }
1892 else if (ch == '\0') {
1893 *d++ = '\\';
1894 *d++ = '0';
1895 }
1896 else if (isPRINT_LC(ch))
1897 *d++ = ch;
1898 else {
1899 *d++ = '^';
1900 *d++ = toCTRL(ch);
1901 }
1902 }
1903 if (s < end) {
1904 *d++ = '.';
1905 *d++ = '.';
1906 *d++ = '.';
1907 }
1908 *d = '\0';
1909 pv = tmpbuf;
a0d0e21e 1910 }
a0d0e21e 1911
533c011a 1912 if (PL_op)
9014280d 1913 Perl_warner(aTHX_ packWARN(WARN_NUMERIC),
94463019
JH
1914 "Argument \"%s\" isn't numeric in %s", pv,
1915 OP_DESC(PL_op));
a0d0e21e 1916 else
9014280d 1917 Perl_warner(aTHX_ packWARN(WARN_NUMERIC),
94463019 1918 "Argument \"%s\" isn't numeric", pv);
a0d0e21e
LW
1919}
1920
c2988b20
NC
1921/*
1922=for apidoc looks_like_number
1923
645c22ef
DM
1924Test if the content of an SV looks like a number (or is a number).
1925C<Inf> and C<Infinity> are treated as numbers (so will not issue a
1926non-numeric warning), even if your atof() doesn't grok them.
c2988b20
NC
1927
1928=cut
1929*/
1930
1931I32
1932Perl_looks_like_number(pTHX_ SV *sv)
1933{
a3b680e6 1934 register const char *sbegin;
c2988b20
NC
1935 STRLEN len;
1936
1937 if (SvPOK(sv)) {
3f7c398e 1938 sbegin = SvPVX_const(sv);
c2988b20
NC
1939 len = SvCUR(sv);
1940 }
1941 else if (SvPOKp(sv))
83003860 1942 sbegin = SvPV_const(sv, len);
c2988b20 1943 else
e0ab1c0e 1944 return SvFLAGS(sv) & (SVf_NOK|SVp_NOK|SVf_IOK|SVp_IOK);
c2988b20
NC
1945 return grok_number(sbegin, len, NULL);
1946}
25da4f38
IZ
1947
1948/* Actually, ISO C leaves conversion of UV to IV undefined, but
1949 until proven guilty, assume that things are not that bad... */
1950
645c22ef
DM
1951/*
1952 NV_PRESERVES_UV:
1953
1954 As 64 bit platforms often have an NV that doesn't preserve all bits of
28e5dec8
JH
1955 an IV (an assumption perl has been based on to date) it becomes necessary
1956 to remove the assumption that the NV always carries enough precision to
1957 recreate the IV whenever needed, and that the NV is the canonical form.
1958 Instead, IV/UV and NV need to be given equal rights. So as to not lose
645c22ef 1959 precision as a side effect of conversion (which would lead to insanity
28e5dec8
JH
1960 and the dragon(s) in t/op/numconvert.t getting very angry) the intent is
1961 1) to distinguish between IV/UV/NV slots that have cached a valid
1962 conversion where precision was lost and IV/UV/NV slots that have a
1963 valid conversion which has lost no precision
645c22ef 1964 2) to ensure that if a numeric conversion to one form is requested that
28e5dec8
JH
1965 would lose precision, the precise conversion (or differently
1966 imprecise conversion) is also performed and cached, to prevent
1967 requests for different numeric formats on the same SV causing
1968 lossy conversion chains. (lossless conversion chains are perfectly
1969 acceptable (still))
1970
1971
1972 flags are used:
1973 SvIOKp is true if the IV slot contains a valid value
1974 SvIOK is true only if the IV value is accurate (UV if SvIOK_UV true)
1975 SvNOKp is true if the NV slot contains a valid value
1976 SvNOK is true only if the NV value is accurate
1977
1978 so
645c22ef 1979 while converting from PV to NV, check to see if converting that NV to an
28e5dec8
JH
1980 IV(or UV) would lose accuracy over a direct conversion from PV to
1981 IV(or UV). If it would, cache both conversions, return NV, but mark
1982 SV as IOK NOKp (ie not NOK).
1983
645c22ef 1984 While converting from PV to IV, check to see if converting that IV to an
28e5dec8
JH
1985 NV would lose accuracy over a direct conversion from PV to NV. If it
1986 would, cache both conversions, flag similarly.
1987
1988 Before, the SV value "3.2" could become NV=3.2 IV=3 NOK, IOK quite
1989 correctly because if IV & NV were set NV *always* overruled.
645c22ef
DM
1990 Now, "3.2" will become NV=3.2 IV=3 NOK, IOKp, because the flag's meaning
1991 changes - now IV and NV together means that the two are interchangeable:
28e5dec8 1992 SvIVX == (IV) SvNVX && SvNVX == (NV) SvIVX;
d460ef45 1993
645c22ef
DM
1994 The benefit of this is that operations such as pp_add know that if
1995 SvIOK is true for both left and right operands, then integer addition
1996 can be used instead of floating point (for cases where the result won't
1997 overflow). Before, floating point was always used, which could lead to
28e5dec8
JH
1998 loss of precision compared with integer addition.
1999
2000 * making IV and NV equal status should make maths accurate on 64 bit
2001 platforms
2002 * may speed up maths somewhat if pp_add and friends start to use
645c22ef 2003 integers when possible instead of fp. (Hopefully the overhead in
28e5dec8
JH
2004 looking for SvIOK and checking for overflow will not outweigh the
2005 fp to integer speedup)
2006 * will slow down integer operations (callers of SvIV) on "inaccurate"
2007 values, as the change from SvIOK to SvIOKp will cause a call into
2008 sv_2iv each time rather than a macro access direct to the IV slot
2009 * should speed up number->string conversion on integers as IV is
645c22ef 2010 favoured when IV and NV are equally accurate
28e5dec8
JH
2011
2012 ####################################################################
645c22ef
DM
2013 You had better be using SvIOK_notUV if you want an IV for arithmetic:
2014 SvIOK is true if (IV or UV), so you might be getting (IV)SvUV.
2015 On the other hand, SvUOK is true iff UV.
28e5dec8
JH
2016 ####################################################################
2017
645c22ef 2018 Your mileage will vary depending on your CPU's relative fp to integer
28e5dec8
JH
2019 performance ratio.
2020*/
2021
2022#ifndef NV_PRESERVES_UV
645c22ef
DM
2023# define IS_NUMBER_UNDERFLOW_IV 1
2024# define IS_NUMBER_UNDERFLOW_UV 2
2025# define IS_NUMBER_IV_AND_UV 2
2026# define IS_NUMBER_OVERFLOW_IV 4
2027# define IS_NUMBER_OVERFLOW_UV 5
2028
2029/* sv_2iuv_non_preserve(): private routine for use by sv_2iv() and sv_2uv() */
28e5dec8
JH
2030
2031/* For sv_2nv these three cases are "SvNOK and don't bother casting" */
2032STATIC int
645c22ef 2033S_sv_2iuv_non_preserve(pTHX_ register SV *sv, I32 numtype)
28e5dec8 2034{
3f7c398e 2035 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_2iuv_non '%s', IV=0x%"UVxf" NV=%"NVgf" inttype=%"UVXf"\n", SvPVX_const(sv), SvIVX(sv), SvNVX(sv), (UV)numtype));
28e5dec8
JH
2036 if (SvNVX(sv) < (NV)IV_MIN) {
2037 (void)SvIOKp_on(sv);
2038 (void)SvNOK_on(sv);
45977657 2039 SvIV_set(sv, IV_MIN);
28e5dec8
JH
2040 return IS_NUMBER_UNDERFLOW_IV;
2041 }
2042 if (SvNVX(sv) > (NV)UV_MAX) {
2043 (void)SvIOKp_on(sv);
2044 (void)SvNOK_on(sv);
2045 SvIsUV_on(sv);
607fa7f2 2046 SvUV_set(sv, UV_MAX);
28e5dec8
JH
2047 return IS_NUMBER_OVERFLOW_UV;
2048 }
c2988b20
NC
2049 (void)SvIOKp_on(sv);
2050 (void)SvNOK_on(sv);
2051 /* Can't use strtol etc to convert this string. (See truth table in
2052 sv_2iv */
2053 if (SvNVX(sv) <= (UV)IV_MAX) {
45977657 2054 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2055 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2056 SvIOK_on(sv); /* Integer is precise. NOK, IOK */
2057 } else {
2058 /* Integer is imprecise. NOK, IOKp */
2059 }
2060 return SvNVX(sv) < 0 ? IS_NUMBER_UNDERFLOW_UV : IS_NUMBER_IV_AND_UV;
2061 }
2062 SvIsUV_on(sv);
607fa7f2 2063 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
2064 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2065 if (SvUVX(sv) == UV_MAX) {
2066 /* As we know that NVs don't preserve UVs, UV_MAX cannot
2067 possibly be preserved by NV. Hence, it must be overflow.
2068 NOK, IOKp */
2069 return IS_NUMBER_OVERFLOW_UV;
2070 }
2071 SvIOK_on(sv); /* Integer is precise. NOK, UOK */
2072 } else {
2073 /* Integer is imprecise. NOK, IOKp */
28e5dec8 2074 }
c2988b20 2075 return IS_NUMBER_OVERFLOW_IV;
28e5dec8 2076}
645c22ef
DM
2077#endif /* !NV_PRESERVES_UV*/
2078
891f9566
YST
2079/* sv_2iv() is now a macro using Perl_sv_2iv_flags();
2080 * this function provided for binary compatibility only
2081 */
2082
2083IV
2084Perl_sv_2iv(pTHX_ register SV *sv)
2085{
2086 return sv_2iv_flags(sv, SV_GMAGIC);
2087}
2088
645c22ef 2089/*
891f9566 2090=for apidoc sv_2iv_flags
645c22ef 2091
891f9566
YST
2092Return the integer value of an SV, doing any necessary string
2093conversion. If flags includes SV_GMAGIC, does an mg_get() first.
2094Normally used via the C<SvIV(sv)> and C<SvIVx(sv)> macros.
645c22ef
DM
2095
2096=cut
2097*/
28e5dec8 2098
a0d0e21e 2099IV
891f9566 2100Perl_sv_2iv_flags(pTHX_ register SV *sv, I32 flags)
79072805
LW
2101{
2102 if (!sv)
2103 return 0;
8990e307 2104 if (SvGMAGICAL(sv)) {
891f9566
YST
2105 if (flags & SV_GMAGIC)
2106 mg_get(sv);
463ee0b2
LW
2107 if (SvIOKp(sv))
2108 return SvIVX(sv);
748a9306 2109 if (SvNOKp(sv)) {
25da4f38 2110 return I_V(SvNVX(sv));
748a9306 2111 }
36477c24 2112 if (SvPOKp(sv) && SvLEN(sv))
2113 return asIV(sv);
3fe9a6f1 2114 if (!SvROK(sv)) {
d008e5eb 2115 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2116 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2117 report_uninit(sv);
c6ee37c5 2118 }
36477c24 2119 return 0;
3fe9a6f1 2120 }
463ee0b2 2121 }
ed6116ce 2122 if (SvTHINKFIRST(sv)) {
a0d0e21e 2123 if (SvROK(sv)) {
a0d0e21e 2124 SV* tmpstr;
1554e226 2125 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,numer)) &&
b4b9a328 2126 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv))))
9e7bc3e8 2127 return SvIV(tmpstr);
56431972 2128 return PTR2IV(SvRV(sv));
a0d0e21e 2129 }
765f542d
NC
2130 if (SvIsCOW(sv)) {
2131 sv_force_normal_flags(sv, 0);
47deb5e7 2132 }
0336b60e 2133 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 2134 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2135 report_uninit(sv);
ed6116ce
LW
2136 return 0;
2137 }
79072805 2138 }
25da4f38
IZ
2139 if (SvIOKp(sv)) {
2140 if (SvIsUV(sv)) {
2141 return (IV)(SvUVX(sv));
2142 }
2143 else {
2144 return SvIVX(sv);
2145 }
463ee0b2 2146 }
748a9306 2147 if (SvNOKp(sv)) {
28e5dec8
JH
2148 /* erm. not sure. *should* never get NOKp (without NOK) from sv_2nv
2149 * without also getting a cached IV/UV from it at the same time
2150 * (ie PV->NV conversion should detect loss of accuracy and cache
2151 * IV or UV at same time to avoid this. NWC */
25da4f38
IZ
2152
2153 if (SvTYPE(sv) == SVt_NV)
2154 sv_upgrade(sv, SVt_PVNV);
2155
28e5dec8
JH
2156 (void)SvIOKp_on(sv); /* Must do this first, to clear any SvOOK */
2157 /* < not <= as for NV doesn't preserve UV, ((NV)IV_MAX+1) will almost
2158 certainly cast into the IV range at IV_MAX, whereas the correct
2159 answer is the UV IV_MAX +1. Hence < ensures that dodgy boundary
2160 cases go to UV */
2161 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2162 SvIV_set(sv, I_V(SvNVX(sv)));
28e5dec8
JH
2163 if (SvNVX(sv) == (NV) SvIVX(sv)
2164#ifndef NV_PRESERVES_UV
2165 && (((UV)1 << NV_PRESERVES_UV_BITS) >
2166 (UV)(SvIVX(sv) > 0 ? SvIVX(sv) : -SvIVX(sv)))
2167 /* Don't flag it as "accurately an integer" if the number
2168 came from a (by definition imprecise) NV operation, and
2169 we're outside the range of NV integer precision */
2170#endif
2171 ) {
2172 SvIOK_on(sv); /* Can this go wrong with rounding? NWC */
2173 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2174 "0x%"UVxf" iv(%"NVgf" => %"IVdf") (precise)\n",
28e5dec8
JH
2175 PTR2UV(sv),
2176 SvNVX(sv),
2177 SvIVX(sv)));
2178
2179 } else {
2180 /* IV not precise. No need to convert from PV, as NV
2181 conversion would already have cached IV if it detected
2182 that PV->IV would be better than PV->NV->IV
2183 flags already correct - don't set public IOK. */
2184 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2185 "0x%"UVxf" iv(%"NVgf" => %"IVdf") (imprecise)\n",
28e5dec8
JH
2186 PTR2UV(sv),
2187 SvNVX(sv),
2188 SvIVX(sv)));
2189 }
2190 /* Can the above go wrong if SvIVX == IV_MIN and SvNVX < IV_MIN,
2191 but the cast (NV)IV_MIN rounds to a the value less (more
2192 negative) than IV_MIN which happens to be equal to SvNVX ??
2193 Analogous to 0xFFFFFFFFFFFFFFFF rounding up to NV (2**64) and
2194 NV rounding back to 0xFFFFFFFFFFFFFFFF, so UVX == UV(NVX) and
2195 (NV)UVX == NVX are both true, but the values differ. :-(
2196 Hopefully for 2s complement IV_MIN is something like
2197 0x8000000000000000 which will be exact. NWC */
d460ef45 2198 }
25da4f38 2199 else {
607fa7f2 2200 SvUV_set(sv, U_V(SvNVX(sv)));
28e5dec8
JH
2201 if (
2202 (SvNVX(sv) == (NV) SvUVX(sv))
2203#ifndef NV_PRESERVES_UV
2204 /* Make sure it's not 0xFFFFFFFFFFFFFFFF */
2205 /*&& (SvUVX(sv) != UV_MAX) irrelevant with code below */
2206 && (((UV)1 << NV_PRESERVES_UV_BITS) > SvUVX(sv))
2207 /* Don't flag it as "accurately an integer" if the number
2208 came from a (by definition imprecise) NV operation, and
2209 we're outside the range of NV integer precision */
2210#endif
2211 )
2212 SvIOK_on(sv);
25da4f38
IZ
2213 SvIsUV_on(sv);
2214 ret_iv_max:
1c846c1f 2215 DEBUG_c(PerlIO_printf(Perl_debug_log,
57def98f 2216 "0x%"UVxf" 2iv(%"UVuf" => %"IVdf") (as unsigned)\n",
56431972 2217 PTR2UV(sv),
57def98f
JH
2218 SvUVX(sv),
2219 SvUVX(sv)));
25da4f38
IZ
2220 return (IV)SvUVX(sv);
2221 }
748a9306
LW
2222 }
2223 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2224 UV value;
504618e9 2225 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
25da4f38
IZ
2226 /* We want to avoid a possible problem when we cache an IV which
2227 may be later translated to an NV, and the resulting NV is not
c2988b20
NC
2228 the same as the direct translation of the initial string
2229 (eg 123.456 can shortcut to the IV 123 with atol(), but we must
2230 be careful to ensure that the value with the .456 is around if the
2231 NV value is requested in the future).
1c846c1f 2232
25da4f38
IZ
2233 This means that if we cache such an IV, we need to cache the
2234 NV as well. Moreover, we trade speed for space, and do not
28e5dec8 2235 cache the NV if we are sure it's not needed.
25da4f38 2236 */
16b7a9a4 2237
c2988b20
NC
2238 /* SVt_PVNV is one higher than SVt_PVIV, hence this order */
2239 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2240 == IS_NUMBER_IN_UV) {
5e045b90 2241 /* It's definitely an integer, only upgrade to PVIV */
28e5dec8
JH
2242 if (SvTYPE(sv) < SVt_PVIV)
2243 sv_upgrade(sv, SVt_PVIV);
f7bbb42a 2244 (void)SvIOK_on(sv);
c2988b20
NC
2245 } else if (SvTYPE(sv) < SVt_PVNV)
2246 sv_upgrade(sv, SVt_PVNV);
28e5dec8 2247
c2988b20
NC
2248 /* If NV preserves UV then we only use the UV value if we know that
2249 we aren't going to call atof() below. If NVs don't preserve UVs
2250 then the value returned may have more precision than atof() will
2251 return, even though value isn't perfectly accurate. */
2252 if ((numtype & (IS_NUMBER_IN_UV
2253#ifdef NV_PRESERVES_UV
2254 | IS_NUMBER_NOT_INT
2255#endif
2256 )) == IS_NUMBER_IN_UV) {
2257 /* This won't turn off the public IOK flag if it was set above */
2258 (void)SvIOKp_on(sv);
2259
2260 if (!(numtype & IS_NUMBER_NEG)) {
2261 /* positive */;
2262 if (value <= (UV)IV_MAX) {
45977657 2263 SvIV_set(sv, (IV)value);
c2988b20 2264 } else {
607fa7f2 2265 SvUV_set(sv, value);
c2988b20
NC
2266 SvIsUV_on(sv);
2267 }
2268 } else {
2269 /* 2s complement assumption */
2270 if (value <= (UV)IV_MIN) {
45977657 2271 SvIV_set(sv, -(IV)value);
c2988b20
NC
2272 } else {
2273 /* Too negative for an IV. This is a double upgrade, but
d1be9408 2274 I'm assuming it will be rare. */
c2988b20
NC
2275 if (SvTYPE(sv) < SVt_PVNV)
2276 sv_upgrade(sv, SVt_PVNV);
2277 SvNOK_on(sv);
2278 SvIOK_off(sv);
2279 SvIOKp_on(sv);
9d6ce603 2280 SvNV_set(sv, -(NV)value);
45977657 2281 SvIV_set(sv, IV_MIN);
c2988b20
NC
2282 }
2283 }
2284 }
2285 /* For !NV_PRESERVES_UV and IS_NUMBER_IN_UV and IS_NUMBER_NOT_INT we
2286 will be in the previous block to set the IV slot, and the next
2287 block to set the NV slot. So no else here. */
2288
2289 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2290 != IS_NUMBER_IN_UV) {
2291 /* It wasn't an (integer that doesn't overflow the UV). */
3f7c398e 2292 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8 2293
c2988b20
NC
2294 if (! numtype && ckWARN(WARN_NUMERIC))
2295 not_a_number(sv);
28e5dec8 2296
65202027 2297#if defined(USE_LONG_DOUBLE)
c2988b20
NC
2298 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%" PERL_PRIgldbl ")\n",
2299 PTR2UV(sv), SvNVX(sv)));
65202027 2300#else
1779d84d 2301 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"NVgf")\n",
c2988b20 2302 PTR2UV(sv), SvNVX(sv)));
65202027 2303#endif
28e5dec8
JH
2304
2305
2306#ifdef NV_PRESERVES_UV
c2988b20
NC
2307 (void)SvIOKp_on(sv);
2308 (void)SvNOK_on(sv);
2309 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2310 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2311 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2312 SvIOK_on(sv);
28e5dec8 2313 } else {
c2988b20
NC
2314 /* Integer is imprecise. NOK, IOKp */
2315 }
2316 /* UV will not work better than IV */
2317 } else {
2318 if (SvNVX(sv) > (NV)UV_MAX) {
2319 SvIsUV_on(sv);
2320 /* Integer is inaccurate. NOK, IOKp, is UV */
607fa7f2 2321 SvUV_set(sv, UV_MAX);
c2988b20
NC
2322 SvIsUV_on(sv);
2323 } else {
607fa7f2 2324 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
2325 /* 0xFFFFFFFFFFFFFFFF not an issue in here */
2326 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2327 SvIOK_on(sv);
28e5dec8
JH
2328 SvIsUV_on(sv);
2329 } else {
c2988b20
NC
2330 /* Integer is imprecise. NOK, IOKp, is UV */
2331 SvIsUV_on(sv);
28e5dec8 2332 }
28e5dec8 2333 }
c2988b20
NC
2334 goto ret_iv_max;
2335 }
28e5dec8 2336#else /* NV_PRESERVES_UV */
c2988b20
NC
2337 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2338 == (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT)) {
2339 /* The IV slot will have been set from value returned by
2340 grok_number above. The NV slot has just been set using
2341 Atof. */
560b0c46 2342 SvNOK_on(sv);
c2988b20
NC
2343 assert (SvIOKp(sv));
2344 } else {
2345 if (((UV)1 << NV_PRESERVES_UV_BITS) >
2346 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
2347 /* Small enough to preserve all bits. */
2348 (void)SvIOKp_on(sv);
2349 SvNOK_on(sv);
45977657 2350 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2351 if ((NV)(SvIVX(sv)) == SvNVX(sv))
2352 SvIOK_on(sv);
2353 /* Assumption: first non-preserved integer is < IV_MAX,
2354 this NV is in the preserved range, therefore: */
2355 if (!(U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))
2356 < (UV)IV_MAX)) {
32fdb065 2357 Perl_croak(aTHX_ "sv_2iv assumed (U_V(fabs((double)SvNVX(sv))) < (UV)IV_MAX) but SvNVX(sv)=%"NVgf" U_V is 0x%"UVxf", IV_MAX is 0x%"UVxf"\n", SvNVX(sv), U_V(SvNVX(sv)), (UV)IV_MAX);
c2988b20
NC
2358 }
2359 } else {
2360 /* IN_UV NOT_INT
2361 0 0 already failed to read UV.
2362 0 1 already failed to read UV.
2363 1 0 you won't get here in this case. IV/UV
2364 slot set, public IOK, Atof() unneeded.
2365 1 1 already read UV.
2366 so there's no point in sv_2iuv_non_preserve() attempting
2367 to use atol, strtol, strtoul etc. */
2368 if (sv_2iuv_non_preserve (sv, numtype)
2369 >= IS_NUMBER_OVERFLOW_IV)
2370 goto ret_iv_max;
2371 }
2372 }
28e5dec8 2373#endif /* NV_PRESERVES_UV */
25da4f38 2374 }
28e5dec8 2375 } else {
041457d9 2376 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 2377 report_uninit(sv);
25da4f38
IZ
2378 if (SvTYPE(sv) < SVt_IV)
2379 /* Typically the caller expects that sv_any is not NULL now. */
2380 sv_upgrade(sv, SVt_IV);
a0d0e21e 2381 return 0;
79072805 2382 }
1d7c1841
GS
2383 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"IVdf")\n",
2384 PTR2UV(sv),SvIVX(sv)));
25da4f38 2385 return SvIsUV(sv) ? (IV)SvUVX(sv) : SvIVX(sv);
79072805
LW
2386}
2387
891f9566
YST
2388/* sv_2uv() is now a macro using Perl_sv_2uv_flags();
2389 * this function provided for binary compatibility only
2390 */
2391
2392UV
2393Perl_sv_2uv(pTHX_ register SV *sv)
2394{
2395 return sv_2uv_flags(sv, SV_GMAGIC);
2396}
2397
645c22ef 2398/*
891f9566 2399=for apidoc sv_2uv_flags
645c22ef
DM
2400
2401Return the unsigned integer value of an SV, doing any necessary string
891f9566
YST
2402conversion. If flags includes SV_GMAGIC, does an mg_get() first.
2403Normally used via the C<SvUV(sv)> and C<SvUVx(sv)> macros.
645c22ef
DM
2404
2405=cut
2406*/
2407
ff68c719 2408UV
891f9566 2409Perl_sv_2uv_flags(pTHX_ register SV *sv, I32 flags)
ff68c719 2410{
2411 if (!sv)
2412 return 0;
2413 if (SvGMAGICAL(sv)) {
891f9566
YST
2414 if (flags & SV_GMAGIC)
2415 mg_get(sv);
ff68c719 2416 if (SvIOKp(sv))
2417 return SvUVX(sv);
2418 if (SvNOKp(sv))
2419 return U_V(SvNVX(sv));
36477c24 2420 if (SvPOKp(sv) && SvLEN(sv))
2421 return asUV(sv);
3fe9a6f1 2422 if (!SvROK(sv)) {
d008e5eb 2423 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2424 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2425 report_uninit(sv);
c6ee37c5 2426 }
36477c24 2427 return 0;
3fe9a6f1 2428 }
ff68c719 2429 }
2430 if (SvTHINKFIRST(sv)) {
2431 if (SvROK(sv)) {
ff68c719 2432 SV* tmpstr;
1554e226 2433 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,numer)) &&
b4b9a328 2434 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv))))
9e7bc3e8 2435 return SvUV(tmpstr);
56431972 2436 return PTR2UV(SvRV(sv));
ff68c719 2437 }
765f542d
NC
2438 if (SvIsCOW(sv)) {
2439 sv_force_normal_flags(sv, 0);
8a818333 2440 }
0336b60e 2441 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 2442 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2443 report_uninit(sv);
ff68c719 2444 return 0;
2445 }
2446 }
25da4f38
IZ
2447 if (SvIOKp(sv)) {
2448 if (SvIsUV(sv)) {
2449 return SvUVX(sv);
2450 }
2451 else {
2452 return (UV)SvIVX(sv);
2453 }
ff68c719 2454 }
2455 if (SvNOKp(sv)) {
28e5dec8
JH
2456 /* erm. not sure. *should* never get NOKp (without NOK) from sv_2nv
2457 * without also getting a cached IV/UV from it at the same time
2458 * (ie PV->NV conversion should detect loss of accuracy and cache
2459 * IV or UV at same time to avoid this. */
2460 /* IV-over-UV optimisation - choose to cache IV if possible */
2461
25da4f38
IZ
2462 if (SvTYPE(sv) == SVt_NV)
2463 sv_upgrade(sv, SVt_PVNV);
28e5dec8
JH
2464
2465 (void)SvIOKp_on(sv); /* Must do this first, to clear any SvOOK */
2466 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2467 SvIV_set(sv, I_V(SvNVX(sv)));
28e5dec8
JH
2468 if (SvNVX(sv) == (NV) SvIVX(sv)
2469#ifndef NV_PRESERVES_UV
2470 && (((UV)1 << NV_PRESERVES_UV_BITS) >
2471 (UV)(SvIVX(sv) > 0 ? SvIVX(sv) : -SvIVX(sv)))
2472 /* Don't flag it as "accurately an integer" if the number
2473 came from a (by definition imprecise) NV operation, and
2474 we're outside the range of NV integer precision */
2475#endif
2476 ) {
2477 SvIOK_on(sv); /* Can this go wrong with rounding? NWC */
2478 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2479 "0x%"UVxf" uv(%"NVgf" => %"IVdf") (precise)\n",
28e5dec8
JH
2480 PTR2UV(sv),
2481 SvNVX(sv),
2482 SvIVX(sv)));
2483
2484 } else {
2485 /* IV not precise. No need to convert from PV, as NV
2486 conversion would already have cached IV if it detected
2487 that PV->IV would be better than PV->NV->IV
2488 flags already correct - don't set public IOK. */
2489 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 2490 "0x%"UVxf" uv(%"NVgf" => %"IVdf") (imprecise)\n",
28e5dec8
JH
2491 PTR2UV(sv),
2492 SvNVX(sv),
2493 SvIVX(sv)));
2494 }
2495 /* Can the above go wrong if SvIVX == IV_MIN and SvNVX < IV_MIN,
2496 but the cast (NV)IV_MIN rounds to a the value less (more
2497 negative) than IV_MIN which happens to be equal to SvNVX ??
2498 Analogous to 0xFFFFFFFFFFFFFFFF rounding up to NV (2**64) and
2499 NV rounding back to 0xFFFFFFFFFFFFFFFF, so UVX == UV(NVX) and
2500 (NV)UVX == NVX are both true, but the values differ. :-(
2501 Hopefully for 2s complement IV_MIN is something like
2502 0x8000000000000000 which will be exact. NWC */
d460ef45 2503 }
28e5dec8 2504 else {
607fa7f2 2505 SvUV_set(sv, U_V(SvNVX(sv)));
28e5dec8
JH
2506 if (
2507 (SvNVX(sv) == (NV) SvUVX(sv))
2508#ifndef NV_PRESERVES_UV
2509 /* Make sure it's not 0xFFFFFFFFFFFFFFFF */
2510 /*&& (SvUVX(sv) != UV_MAX) irrelevant with code below */
2511 && (((UV)1 << NV_PRESERVES_UV_BITS) > SvUVX(sv))
2512 /* Don't flag it as "accurately an integer" if the number
2513 came from a (by definition imprecise) NV operation, and
2514 we're outside the range of NV integer precision */
2515#endif
2516 )
2517 SvIOK_on(sv);
2518 SvIsUV_on(sv);
1c846c1f 2519 DEBUG_c(PerlIO_printf(Perl_debug_log,
28e5dec8 2520 "0x%"UVxf" 2uv(%"UVuf" => %"IVdf") (as unsigned)\n",
57def98f 2521 PTR2UV(sv),
28e5dec8
JH
2522 SvUVX(sv),
2523 SvUVX(sv)));
25da4f38 2524 }
ff68c719 2525 }
2526 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2527 UV value;
504618e9 2528 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
25da4f38
IZ
2529
2530 /* We want to avoid a possible problem when we cache a UV which
2531 may be later translated to an NV, and the resulting NV is not
2532 the translation of the initial data.
1c846c1f 2533
25da4f38
IZ
2534 This means that if we cache such a UV, we need to cache the
2535 NV as well. Moreover, we trade speed for space, and do not
2536 cache the NV if not needed.
2537 */
16b7a9a4 2538
c2988b20
NC
2539 /* SVt_PVNV is one higher than SVt_PVIV, hence this order */
2540 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2541 == IS_NUMBER_IN_UV) {
5e045b90 2542 /* It's definitely an integer, only upgrade to PVIV */
28e5dec8 2543 if (SvTYPE(sv) < SVt_PVIV)
f7bbb42a
JH
2544 sv_upgrade(sv, SVt_PVIV);
2545 (void)SvIOK_on(sv);
c2988b20
NC
2546 } else if (SvTYPE(sv) < SVt_PVNV)
2547 sv_upgrade(sv, SVt_PVNV);
d460ef45 2548
c2988b20
NC
2549 /* If NV preserves UV then we only use the UV value if we know that
2550 we aren't going to call atof() below. If NVs don't preserve UVs
2551 then the value returned may have more precision than atof() will
2552 return, even though it isn't accurate. */
2553 if ((numtype & (IS_NUMBER_IN_UV
2554#ifdef NV_PRESERVES_UV
2555 | IS_NUMBER_NOT_INT
2556#endif
2557 )) == IS_NUMBER_IN_UV) {
2558 /* This won't turn off the public IOK flag if it was set above */
2559 (void)SvIOKp_on(sv);
2560
2561 if (!(numtype & IS_NUMBER_NEG)) {
2562 /* positive */;
2563 if (value <= (UV)IV_MAX) {
45977657 2564 SvIV_set(sv, (IV)value);
28e5dec8
JH
2565 } else {
2566 /* it didn't overflow, and it was positive. */
607fa7f2 2567 SvUV_set(sv, value);
28e5dec8
JH
2568 SvIsUV_on(sv);
2569 }
c2988b20
NC
2570 } else {
2571 /* 2s complement assumption */
2572 if (value <= (UV)IV_MIN) {
45977657 2573 SvIV_set(sv, -(IV)value);
c2988b20
NC
2574 } else {
2575 /* Too negative for an IV. This is a double upgrade, but
d1be9408 2576 I'm assuming it will be rare. */
c2988b20
NC
2577 if (SvTYPE(sv) < SVt_PVNV)
2578 sv_upgrade(sv, SVt_PVNV);
2579 SvNOK_on(sv);
2580 SvIOK_off(sv);
2581 SvIOKp_on(sv);
9d6ce603 2582 SvNV_set(sv, -(NV)value);
45977657 2583 SvIV_set(sv, IV_MIN);
c2988b20
NC
2584 }
2585 }
2586 }
2587
2588 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2589 != IS_NUMBER_IN_UV) {
2590 /* It wasn't an integer, or it overflowed the UV. */
3f7c398e 2591 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8 2592
c2988b20 2593 if (! numtype && ckWARN(WARN_NUMERIC))
28e5dec8
JH
2594 not_a_number(sv);
2595
2596#if defined(USE_LONG_DOUBLE)
c2988b20
NC
2597 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%" PERL_PRIgldbl ")\n",
2598 PTR2UV(sv), SvNVX(sv)));
28e5dec8 2599#else
1779d84d 2600 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%"NVgf")\n",
c2988b20 2601 PTR2UV(sv), SvNVX(sv)));
28e5dec8
JH
2602#endif
2603
2604#ifdef NV_PRESERVES_UV
c2988b20
NC
2605 (void)SvIOKp_on(sv);
2606 (void)SvNOK_on(sv);
2607 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 2608 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2609 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2610 SvIOK_on(sv);
2611 } else {
2612 /* Integer is imprecise. NOK, IOKp */
2613 }
2614 /* UV will not work better than IV */
2615 } else {
2616 if (SvNVX(sv) > (NV)UV_MAX) {
2617 SvIsUV_on(sv);
2618 /* Integer is inaccurate. NOK, IOKp, is UV */
607fa7f2 2619 SvUV_set(sv, UV_MAX);
c2988b20
NC
2620 SvIsUV_on(sv);
2621 } else {
607fa7f2 2622 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
2623 /* 0xFFFFFFFFFFFFFFFF not an issue in here, NVs
2624 NV preservse UV so can do correct comparison. */
2625 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2626 SvIOK_on(sv);
2627 SvIsUV_on(sv);
2628 } else {
2629 /* Integer is imprecise. NOK, IOKp, is UV */
2630 SvIsUV_on(sv);
2631 }
2632 }
2633 }
28e5dec8 2634#else /* NV_PRESERVES_UV */
c2988b20
NC
2635 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2636 == (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT)) {
2637 /* The UV slot will have been set from value returned by
2638 grok_number above. The NV slot has just been set using
2639 Atof. */
560b0c46 2640 SvNOK_on(sv);
c2988b20
NC
2641 assert (SvIOKp(sv));
2642 } else {
2643 if (((UV)1 << NV_PRESERVES_UV_BITS) >
2644 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
2645 /* Small enough to preserve all bits. */
2646 (void)SvIOKp_on(sv);
2647 SvNOK_on(sv);
45977657 2648 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2649 if ((NV)(SvIVX(sv)) == SvNVX(sv))
2650 SvIOK_on(sv);
2651 /* Assumption: first non-preserved integer is < IV_MAX,
2652 this NV is in the preserved range, therefore: */
2653 if (!(U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))
2654 < (UV)IV_MAX)) {
32fdb065 2655 Perl_croak(aTHX_ "sv_2uv assumed (U_V(fabs((double)SvNVX(sv))) < (UV)IV_MAX) but SvNVX(sv)=%"NVgf" U_V is 0x%"UVxf", IV_MAX is 0x%"UVxf"\n", SvNVX(sv), U_V(SvNVX(sv)), (UV)IV_MAX);
c2988b20
NC
2656 }
2657 } else
2658 sv_2iuv_non_preserve (sv, numtype);
2659 }
28e5dec8 2660#endif /* NV_PRESERVES_UV */
f7bbb42a 2661 }
ff68c719 2662 }
2663 else {
d008e5eb 2664 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2665 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2666 report_uninit(sv);
c6ee37c5 2667 }
25da4f38
IZ
2668 if (SvTYPE(sv) < SVt_IV)
2669 /* Typically the caller expects that sv_any is not NULL now. */
2670 sv_upgrade(sv, SVt_IV);
ff68c719 2671 return 0;
2672 }
25da4f38 2673
1d7c1841
GS
2674 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%"UVuf")\n",
2675 PTR2UV(sv),SvUVX(sv)));
25da4f38 2676 return SvIsUV(sv) ? SvUVX(sv) : (UV)SvIVX(sv);
ff68c719 2677}
2678
645c22ef
DM
2679/*
2680=for apidoc sv_2nv
2681
2682Return the num value of an SV, doing any necessary string or integer
2683conversion, magic etc. Normally used via the C<SvNV(sv)> and C<SvNVx(sv)>
2684macros.
2685
2686=cut
2687*/
2688
65202027 2689NV
864dbfa3 2690Perl_sv_2nv(pTHX_ register SV *sv)
79072805
LW
2691{
2692 if (!sv)
2693 return 0.0;
8990e307 2694 if (SvGMAGICAL(sv)) {
463ee0b2
LW
2695 mg_get(sv);
2696 if (SvNOKp(sv))
2697 return SvNVX(sv);
a0d0e21e 2698 if (SvPOKp(sv) && SvLEN(sv)) {
041457d9 2699 if (!SvIOKp(sv) && ckWARN(WARN_NUMERIC) &&
504618e9 2700 !grok_number(SvPVX_const(sv), SvCUR(sv), NULL))
a0d0e21e 2701 not_a_number(sv);
3f7c398e 2702 return Atof(SvPVX_const(sv));
a0d0e21e 2703 }
25da4f38 2704 if (SvIOKp(sv)) {
1c846c1f 2705 if (SvIsUV(sv))
65202027 2706 return (NV)SvUVX(sv);
25da4f38 2707 else
65202027 2708 return (NV)SvIVX(sv);
25da4f38 2709 }
16d20bd9 2710 if (!SvROK(sv)) {
d008e5eb 2711 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
041457d9 2712 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
29489e7c 2713 report_uninit(sv);
c6ee37c5 2714 }
66a1b24b 2715 return (NV)0;
16d20bd9 2716 }
463ee0b2 2717 }
ed6116ce 2718 if (SvTHINKFIRST(sv)) {
a0d0e21e 2719 if (SvROK(sv)) {
a0d0e21e 2720 SV* tmpstr;
1554e226 2721 if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,numer)) &&
b4b9a328 2722 (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv))))
9e7bc3e8 2723 return SvNV(tmpstr);
56431972 2724 return PTR2NV(SvRV(sv));
a0d0e21e 2725 }
765f542d
NC
2726 if (SvIsCOW(sv)) {
2727 sv_force_normal_flags(sv, 0);
8a818333 2728 }
0336b60e 2729 if (SvREADONLY(sv) && !SvOK(sv)) {
599cee73 2730 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2731 report_uninit(sv);
ed6116ce
LW
2732 return 0.0;
2733 }
79072805
LW
2734 }
2735 if (SvTYPE(sv) < SVt_NV) {
463ee0b2
LW
2736 if (SvTYPE(sv) == SVt_IV)
2737 sv_upgrade(sv, SVt_PVNV);
2738 else
2739 sv_upgrade(sv, SVt_NV);
906f284f 2740#ifdef USE_LONG_DOUBLE
097ee67d 2741 DEBUG_c({
f93f4e46 2742 STORE_NUMERIC_LOCAL_SET_STANDARD();
1d7c1841
GS
2743 PerlIO_printf(Perl_debug_log,
2744 "0x%"UVxf" num(%" PERL_PRIgldbl ")\n",
2745 PTR2UV(sv), SvNVX(sv));
572bbb43
GS
2746 RESTORE_NUMERIC_LOCAL();
2747 });
65202027 2748#else
572bbb43 2749 DEBUG_c({
f93f4e46 2750 STORE_NUMERIC_LOCAL_SET_STANDARD();
1779d84d 2751 PerlIO_printf(Perl_debug_log, "0x%"UVxf" num(%"NVgf")\n",
1d7c1841 2752 PTR2UV(sv), SvNVX(sv));
097ee67d
JH
2753 RESTORE_NUMERIC_LOCAL();
2754 });
572bbb43 2755#endif
79072805
LW
2756 }
2757 else if (SvTYPE(sv) < SVt_PVNV)
2758 sv_upgrade(sv, SVt_PVNV);
59d8ce62
NC
2759 if (SvNOKp(sv)) {
2760 return SvNVX(sv);
61604483 2761 }
59d8ce62 2762 if (SvIOKp(sv)) {
9d6ce603 2763 SvNV_set(sv, SvIsUV(sv) ? (NV)SvUVX(sv) : (NV)SvIVX(sv));
28e5dec8
JH
2764#ifdef NV_PRESERVES_UV
2765 SvNOK_on(sv);
2766#else
2767 /* Only set the public NV OK flag if this NV preserves the IV */
2768 /* Check it's not 0xFFFFFFFFFFFFFFFF */
2769 if (SvIsUV(sv) ? ((SvUVX(sv) != UV_MAX)&&(SvUVX(sv) == U_V(SvNVX(sv))))
2770 : (SvIVX(sv) == I_V(SvNVX(sv))))
2771 SvNOK_on(sv);
2772 else
2773 SvNOKp_on(sv);
2774#endif
93a17b20 2775 }
748a9306 2776 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2777 UV value;
3f7c398e 2778 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
041457d9 2779 if (!SvIOKp(sv) && !numtype && ckWARN(WARN_NUMERIC))
a0d0e21e 2780 not_a_number(sv);
28e5dec8 2781#ifdef NV_PRESERVES_UV
c2988b20
NC
2782 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2783 == IS_NUMBER_IN_UV) {
5e045b90 2784 /* It's definitely an integer */
9d6ce603 2785 SvNV_set(sv, (numtype & IS_NUMBER_NEG) ? -(NV)value : (NV)value);
c2988b20 2786 } else
3f7c398e 2787 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8
JH
2788 SvNOK_on(sv);
2789#else
3f7c398e 2790 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8
JH
2791 /* Only set the public NV OK flag if this NV preserves the value in
2792 the PV at least as well as an IV/UV would.
2793 Not sure how to do this 100% reliably. */
2794 /* if that shift count is out of range then Configure's test is
2795 wonky. We shouldn't be in here with NV_PRESERVES_UV_BITS ==
2796 UV_BITS */
2797 if (((UV)1 << NV_PRESERVES_UV_BITS) >
c2988b20 2798 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
28e5dec8 2799 SvNOK_on(sv); /* Definitely small enough to preserve all bits */
c2988b20
NC
2800 } else if (!(numtype & IS_NUMBER_IN_UV)) {
2801 /* Can't use strtol etc to convert this string, so don't try.
2802 sv_2iv and sv_2uv will use the NV to convert, not the PV. */
2803 SvNOK_on(sv);
2804 } else {
2805 /* value has been set. It may not be precise. */
2806 if ((numtype & IS_NUMBER_NEG) && (value > (UV)IV_MIN)) {
2807 /* 2s complement assumption for (UV)IV_MIN */
2808 SvNOK_on(sv); /* Integer is too negative. */
2809 } else {
2810 SvNOKp_on(sv);
2811 SvIOKp_on(sv);
6fa402ec 2812
c2988b20 2813 if (numtype & IS_NUMBER_NEG) {
45977657 2814 SvIV_set(sv, -(IV)value);
c2988b20 2815 } else if (value <= (UV)IV_MAX) {
45977657 2816 SvIV_set(sv, (IV)value);
c2988b20 2817 } else {
607fa7f2 2818 SvUV_set(sv, value);
c2988b20
NC
2819 SvIsUV_on(sv);
2820 }
2821
2822 if (numtype & IS_NUMBER_NOT_INT) {
2823 /* I believe that even if the original PV had decimals,
2824 they are lost beyond the limit of the FP precision.
2825 However, neither is canonical, so both only get p
2826 flags. NWC, 2000/11/25 */
2827 /* Both already have p flags, so do nothing */
2828 } else {
66a1b24b 2829 const NV nv = SvNVX(sv);
c2988b20
NC
2830 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
2831 if (SvIVX(sv) == I_V(nv)) {
2832 SvNOK_on(sv);
2833 SvIOK_on(sv);
2834 } else {
2835 SvIOK_on(sv);
2836 /* It had no "." so it must be integer. */
2837 }
2838 } else {
2839 /* between IV_MAX and NV(UV_MAX).
2840 Could be slightly > UV_MAX */
6fa402ec 2841
c2988b20
NC
2842 if (numtype & IS_NUMBER_NOT_INT) {
2843 /* UV and NV both imprecise. */
2844 } else {
66a1b24b 2845 const UV nv_as_uv = U_V(nv);
c2988b20
NC
2846
2847 if (value == nv_as_uv && SvUVX(sv) != UV_MAX) {
2848 SvNOK_on(sv);
2849 SvIOK_on(sv);
2850 } else {
2851 SvIOK_on(sv);
2852 }
2853 }
2854 }
2855 }
2856 }
2857 }
28e5dec8 2858#endif /* NV_PRESERVES_UV */
93a17b20 2859 }
79072805 2860 else {
041457d9 2861 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 2862 report_uninit(sv);
25da4f38
IZ
2863 if (SvTYPE(sv) < SVt_NV)
2864 /* Typically the caller expects that sv_any is not NULL now. */
28e5dec8
JH
2865 /* XXX Ilya implies that this is a bug in callers that assume this
2866 and ideally should be fixed. */
25da4f38 2867 sv_upgrade(sv, SVt_NV);
a0d0e21e 2868 return 0.0;
79072805 2869 }
572bbb43 2870#if defined(USE_LONG_DOUBLE)
097ee67d 2871 DEBUG_c({
f93f4e46 2872 STORE_NUMERIC_LOCAL_SET_STANDARD();
1d7c1841
GS
2873 PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2nv(%" PERL_PRIgldbl ")\n",
2874 PTR2UV(sv), SvNVX(sv));
572bbb43
GS
2875 RESTORE_NUMERIC_LOCAL();
2876 });
65202027 2877#else
572bbb43 2878 DEBUG_c({
f93f4e46 2879 STORE_NUMERIC_LOCAL_SET_STANDARD();
1779d84d 2880 PerlIO_printf(Perl_debug_log, "0x%"UVxf" 1nv(%"NVgf")\n",
1d7c1841 2881 PTR2UV(sv), SvNVX(sv));
097ee67d
JH
2882 RESTORE_NUMERIC_LOCAL();
2883 });
572bbb43 2884#endif
463ee0b2 2885 return SvNVX(sv);
79072805
LW
2886}
2887
645c22ef
DM
2888/* asIV(): extract an integer from the string value of an SV.
2889 * Caller must validate PVX */
2890
76e3520e 2891STATIC IV
cea2e8a9 2892S_asIV(pTHX_ SV *sv)
36477c24 2893{
c2988b20 2894 UV value;
66a1b24b 2895 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
c2988b20
NC
2896
2897 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2898 == IS_NUMBER_IN_UV) {
645c22ef 2899 /* It's definitely an integer */
c2988b20
NC
2900 if (numtype & IS_NUMBER_NEG) {
2901 if (value < (UV)IV_MIN)
2902 return -(IV)value;
2903 } else {
2904 if (value < (UV)IV_MAX)
2905 return (IV)value;
2906 }
2907 }
d008e5eb 2908 if (!numtype) {
d008e5eb
GS
2909 if (ckWARN(WARN_NUMERIC))
2910 not_a_number(sv);
2911 }
3f7c398e 2912 return I_V(Atof(SvPVX_const(sv)));
36477c24 2913}
2914
645c22ef
DM
2915/* asUV(): extract an unsigned integer from the string value of an SV
2916 * Caller must validate PVX */
2917
76e3520e 2918STATIC UV
cea2e8a9 2919S_asUV(pTHX_ SV *sv)
36477c24 2920{
c2988b20 2921 UV value;
504618e9 2922 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
36477c24 2923
c2988b20
NC
2924 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2925 == IS_NUMBER_IN_UV) {
645c22ef 2926 /* It's definitely an integer */
6fa402ec 2927 if (!(numtype & IS_NUMBER_NEG))
c2988b20
NC
2928 return value;
2929 }
d008e5eb 2930 if (!numtype) {
d008e5eb
GS
2931 if (ckWARN(WARN_NUMERIC))
2932 not_a_number(sv);
2933 }
3f7c398e 2934 return U_V(Atof(SvPVX_const(sv)));
36477c24 2935}
2936
645c22ef
DM
2937/*
2938=for apidoc sv_2pv_nolen
2939
2940Like C<sv_2pv()>, but doesn't return the length too. You should usually
2941use the macro wrapper C<SvPV_nolen(sv)> instead.
2942=cut
2943*/
2944
79072805 2945char *
864dbfa3 2946Perl_sv_2pv_nolen(pTHX_ register SV *sv)
1fa8b10d 2947{
dafda6d1 2948 return sv_2pv(sv, 0);
1fa8b10d
JD
2949}
2950
645c22ef
DM
2951/* uiv_2buf(): private routine for use by sv_2pv_flags(): print an IV or
2952 * UV as a string towards the end of buf, and return pointers to start and
2953 * end of it.
2954 *
2955 * We assume that buf is at least TYPE_CHARS(UV) long.
2956 */
2957
864dbfa3 2958static char *
25da4f38
IZ
2959uiv_2buf(char *buf, IV iv, UV uv, int is_uv, char **peob)
2960{
25da4f38
IZ
2961 char *ptr = buf + TYPE_CHARS(UV);
2962 char *ebuf = ptr;
2963 int sign;
25da4f38
IZ
2964
2965 if (is_uv)
2966 sign = 0;
2967 else if (iv >= 0) {
2968 uv = iv;
2969 sign = 0;
2970 } else {
2971 uv = -iv;
2972 sign = 1;
2973 }
2974 do {
eb160463 2975 *--ptr = '0' + (char)(uv % 10);
25da4f38
IZ
2976 } while (uv /= 10);
2977 if (sign)
2978 *--ptr = '-';
2979 *peob = ebuf;
2980 return ptr;
2981}
2982
09540bc3
JH
2983/* sv_2pv() is now a macro using Perl_sv_2pv_flags();
2984 * this function provided for binary compatibility only
2985 */
2986
2987char *
2988Perl_sv_2pv(pTHX_ register SV *sv, STRLEN *lp)
2989{
2990 return sv_2pv_flags(sv, lp, SV_GMAGIC);
2991}
2992
/*
=for apidoc sv_2pv_flags

Returns a pointer to the string value of an SV, and sets *lp to its length.
If flags includes SV_GMAGIC, does an mg_get() first. Coerces sv to a string
if necessary.
Normally invoked via the C<SvPV_flags> macro. C<sv_2pv()> and C<sv_2pv_nomg>
usually end up here too.

=cut
*/

/* Implementation overview (lp may be NULL throughout; it is only written
 * when non-NULL):
 *   - a NULL sv yields "" with length 0;
 *   - get-magical SVs: an existing private string is returned as is,
 *     private numeric values are formatted into a local buffer and
 *     finished at the 'tokensave' label;
 *   - references: overloaded stringification, the cached "(?flags:...)"
 *     form of a qr// object, or "TYPE(0xADDR)" / "Class=TYPE(0xADDR)";
 *   - ordinary IV/UV and NV values are formatted into the SV's own buffer
 *     and the SV is marked POK;
 *   - anything else is treated as undefined: optional warning, "" returned.
 */
char *
Perl_sv_2pv_flags(pTHX_ register SV *sv, STRLEN *lp, I32 flags)
{
    register char *s;
    int olderrno;
    SV *tsv, *origsv;
    char tbuf[64];      /* Must fit sprintf/Gconvert of longest IV/NV */
    char *tmpbuf = tbuf;

    if (!sv) {
        if (lp)
            *lp = 0;
        return (char *)"";
    }
    if (SvGMAGICAL(sv)) {
        /* Only fetch the magical value when the caller asked for it */
        if (flags & SV_GMAGIC)
            mg_get(sv);
        if (SvPOKp(sv)) {
            /* A (private) string is already there: hand it back */
            if (lp)
                *lp = SvCUR(sv);
            if (flags & SV_MUTABLE_RETURN)
                return SvPVX_mutable(sv);
            if (flags & SV_CONST_RETURN)
                return (char *)SvPVX_const(sv);
            return SvPVX(sv);
        }
        if (SvIOKp(sv)) {
            /* Format the integer into the stack buffer; tsv == Nullsv
             * tells the tokensave code to read from tmpbuf */
            if (SvIsUV(sv))
                (void)sprintf(tmpbuf,"%"UVuf, (UV)SvUVX(sv));
            else
                (void)sprintf(tmpbuf,"%"IVdf, (IV)SvIVX(sv));
            tsv = Nullsv;
            goto tokensave;
        }
        if (SvNOKp(sv)) {
            Gconvert(SvNVX(sv), NV_DIG, 0, tmpbuf);
            tsv = Nullsv;
            goto tokensave;
        }
        if (!SvROK(sv)) {
            /* No string, number or reference: undefined.  Pad temporaries
             * never warn. */
            if (!(SvFLAGS(sv) & SVs_PADTMP)) {
                if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
                    report_uninit(sv);
            }
            if (lp)
                *lp = 0;
            return (char *)"";
        }
    }
    if (SvTHINKFIRST(sv)) {
        if (SvROK(sv)) {
            SV* tmpstr;
            register const char *typestr;
            /* Overloaded stringification: use its result unless it is a
             * reference to the very same referent */
            if (SvAMAGIC(sv) && (tmpstr=AMG_CALLun(sv,string)) &&
                (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv)))) {
                /* Unwrap this:  */
                /* char *pv = lp ? SvPV(tmpstr, *lp) : SvPV_nolen(tmpstr); */

                char *pv;
                if ((SvFLAGS(tmpstr) & (SVf_POK)) == SVf_POK) {
                    if (flags & SV_CONST_RETURN) {
                        pv = (char *) SvPVX_const(tmpstr);
                    } else {
                        pv = (flags & SV_MUTABLE_RETURN)
                            ? SvPVX_mutable(tmpstr) : SvPVX(tmpstr);
                    }
                    if (lp)
                        *lp = SvCUR(tmpstr);
                } else {
                    pv = sv_2pv_flags(tmpstr, lp, flags);
                }
                /* Mirror the UTF-8 flag of the result onto the reference
                 * itself so that callers testing SvUTF8(sv) see it */
                if (SvUTF8(tmpstr))
                    SvUTF8_on(sv);
                else
                    SvUTF8_off(sv);
                return pv;
            }
            /* From here on 'sv' is the referent; origsv is the reference */
            origsv = sv;
            sv = (SV*)SvRV(sv);
            if (!sv)
                typestr = "NULLREF";
            else {
                MAGIC *mg;

                switch (SvTYPE(sv)) {
                case SVt_PVMG:
                    /* An object carrying qr magic stringifies as a
                     * "(?flags:pattern)" group, built once and cached in
                     * mg->mg_ptr / mg->mg_len */
                    if ( ((SvFLAGS(sv) &
                           (SVs_OBJECT|SVf_OK|SVs_GMG|SVs_SMG|SVs_RMG))
                          == (SVs_OBJECT|SVs_SMG))
                         && (mg = mg_find(sv, PERL_MAGIC_qr))) {
                        const regexp *re = (regexp *)mg->mg_obj;

                        if (!mg->mg_ptr) {
                            const char *fptr = "msix";
                            char reflags[6];
                            char ch;
                            int left = 0;
                            int right = 4;
                            char need_newline = 0;
                            U16 reganch = (U16)((re->reganch & PMf_COMPILETIME) >> 12);

                            /* Flags whose bit is set are collected from
                             * the left of reflags[], the others from the
                             * right (slot 4 downwards) */
                            while((ch = *fptr++)) {
                                if(reganch & 1) {
                                    reflags[left++] = ch;
                                }
                                else {
                                    reflags[right--] = ch;
                                }
                                reganch >>= 1;
                            }
                            /* Not all four set: a '-' separates the set
                             * flags from the unset ones, and all five
                             * characters are emitted */
                            if(left != 4) {
                                reflags[left] = '-';
                                left = 5;
                            }

                            /* "(?" + flags + ":" + pattern + ")" */
                            mg->mg_len = re->prelen + 4 + left;
                            /*
                             * If /x was used, we have to worry about a regex
                             * ending with a comment later being embedded
                             * within another regex. If so, we don't want this
                             * regex's "commentization" to leak out to the
                             * right part of the enclosing regex, we must cap
                             * it with a newline.
                             *
                             * So, if /x was used, we scan backwards from the
                             * end of the regex. If we find a '#' before we
                             * find a newline, we need to add a newline
                             * ourself. If we find a '\n' first (or if we
                             * don't find '#' or '\n'), we don't need to add
                             * anything.  -jfriedl
                             */
                            if (PMf_EXTENDED & re->reganch)
                            {
                                /* NOTE(review): the scan starts on the byte
                                 * at precomp[prelen] and, if neither '\n'
                                 * nor '#' is found, leaves endptr one below
                                 * re->precomp before the loop test fails --
                                 * confirm this is acceptable on all
                                 * platforms. */
                                const char *endptr = re->precomp + re->prelen;
                                while (endptr >= re->precomp)
                                {
                                    const char c = *(endptr--);
                                    if (c == '\n')
                                        break; /* don't need another */
                                    if (c == '#') {
                                        /* we end while in a comment, so we
                                           need a newline */
                                        mg->mg_len++; /* save space for it */
                                        need_newline = 1; /* note to add it */
                                        break;
                                    }
                                }
                            }

                            Newx(mg->mg_ptr, mg->mg_len + 1 + left, char);
                            Copy("(?", mg->mg_ptr, 2, char);
                            Copy(reflags, mg->mg_ptr+2, left, char);
                            Copy(":", mg->mg_ptr+left+2, 1, char);
                            Copy(re->precomp, mg->mg_ptr+3+left, re->prelen, char);
                            if (need_newline)
                                mg->mg_ptr[mg->mg_len - 2] = '\n';
                            mg->mg_ptr[mg->mg_len - 1] = ')';
                            mg->mg_ptr[mg->mg_len] = 0;
                        }
                        PL_reginterp_cnt += re->program[0].next_off;

                        /* The UTF-8 flag goes on the reference the caller
                         * passed in, not on the referent */
                        if (re->reganch & ROPT_UTF8)
                            SvUTF8_on(origsv);
                        else
                            SvUTF8_off(origsv);
                        if (lp)
                            *lp = mg->mg_len;
                        return mg->mg_ptr;
                    }
                                        /* Fall through */
                case SVt_NULL:
                case SVt_IV:
                case SVt_NV:
                case SVt_RV:
                case SVt_PV:
                case SVt_PVIV:
                case SVt_PVNV:
                case SVt_PVBM:  typestr = SvROK(sv) ? "REF" : "SCALAR"; break;
                case SVt_PVLV:  typestr = SvROK(sv) ? "REF"
                                /* tied lvalues should appear to be
                                 * scalars for backwards compatibility */
                                : (LvTYPE(sv) == 't' || LvTYPE(sv) == 'T')
                                    ? "SCALAR" : "LVALUE";      break;
                case SVt_PVAV:  typestr = "ARRAY";      break;
                case SVt_PVHV:  typestr = "HASH";       break;
                case SVt_PVCV:  typestr = "CODE";       break;
                case SVt_PVGV:  typestr = "GLOB";       break;
                case SVt_PVFM:  typestr = "FORMAT";     break;
                case SVt_PVIO:  typestr = "IO";         break;
                default:        typestr = "UNKNOWN";    break;
                }
                /* Build "TYPE(0xADDR)", prefixed with "Class=" for blessed
                 * referents, in a fresh SV; tokensaveref mortalizes it */
                tsv = NEWSV(0,0);
                if (SvOBJECT(sv)) {
                    const char *name = HvNAME_get(SvSTASH(sv));
                    Perl_sv_setpvf(aTHX_ tsv, "%s=%s(0x%"UVxf")",
                                   name ? name : "__ANON__" , typestr, PTR2UV(sv));
                }
                else
                    Perl_sv_setpvf(aTHX_ tsv, "%s(0x%"UVxf")", typestr, PTR2UV(sv));
                goto tokensaveref;
            }
            /* Only reached for a NULL referent ("NULLREF") */
            if (lp)
                *lp = strlen(typestr);
            return (char *)typestr;
        }
        if (SvREADONLY(sv) && !SvOK(sv)) {
            /* Read-only undefined value: cannot be upgraded in place */
            if (ckWARN(WARN_UNINITIALIZED))
                report_uninit(sv);
            if (lp)
                *lp = 0;
            return (char *)"";
        }
    }
    if (SvIOK(sv) || ((SvIOKp(sv) && !SvNOKp(sv)))) {
        /* I'm assuming that if both IV and NV are equally valid then
           converting the IV is going to be more efficient */
        /* The integer flags are sampled first and re-applied after the
         * string has been stored */
        const U32 isIOK = SvIOK(sv);
        const U32 isUIOK = SvIsUV(sv);
        char buf[TYPE_CHARS(UV)];
        char *ebuf, *ptr;

        if (SvTYPE(sv) < SVt_PVIV)
            sv_upgrade(sv, SVt_PVIV);
        if (isUIOK)
            ptr = uiv_2buf(buf, 0, SvUVX(sv), 1, &ebuf);
        else
            ptr = uiv_2buf(buf, SvIVX(sv), 0, 0, &ebuf);
        /* inlined from sv_setpvn */
        SvGROW_mutable(sv, (STRLEN)(ebuf - ptr + 1));
        Move(ptr,SvPVX_mutable(sv),ebuf - ptr,char);
        SvCUR_set(sv, ebuf - ptr);
        s = SvEND(sv);
        *s = '\0';
        if (isIOK)
            SvIOK_on(sv);
        else
            SvIOKp_on(sv);
        if (isUIOK)
            SvIsUV_on(sv);
    }
    else if (SvNOKp(sv)) {
        if (SvTYPE(sv) < SVt_PVNV)
            sv_upgrade(sv, SVt_PVNV);
        /* The +20 is pure guesswork.  Configure test needed. --jhi */
        s = SvGROW_mutable(sv, NV_DIG + 20);
        olderrno = errno;       /* some Xenix systems wipe out errno here */
#ifdef apollo
        if (SvNVX(sv) == 0.0)
            (void)strcpy(s,"0");
        else
#endif /*apollo*/
        {
            Gconvert(SvNVX(sv), NV_DIG, 0, s);
        }
        errno = olderrno;
#ifdef FIXNEGATIVEZERO
        if (*s == '-' && s[1] == '0' && !s[2])
            strcpy(s,"0");
#endif
        /* Advance s to the terminating NUL so the length can be computed */
        while (*s) s++;
#ifdef hcx
        if (s[-1] == '.')
            *--s = '\0';
#endif
    }
    else {
        if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
            report_uninit(sv);
        if (lp)
            *lp = 0;
        if (SvTYPE(sv) < SVt_PV)
            /* Typically the caller expects that sv_any is not NULL now.  */
            sv_upgrade(sv, SVt_PV);
        return (char *)"";
    }
    {
        /* s points at the terminating NUL written by either branch above */
        STRLEN len = s - SvPVX_const(sv);
        if (lp)
            *lp = len;
        SvCUR_set(sv, len);
    }
    SvPOK_on(sv);
    DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2pv(%s)\n",
                          PTR2UV(sv),SvPVX_const(sv)));
    if (flags & SV_CONST_RETURN)
        return (char *)SvPVX_const(sv);
    if (flags & SV_MUTABLE_RETURN)
        return SvPVX_mutable(sv);
    return SvPVX(sv);

  tokensave:
    if (SvROK(sv)) {    /* XXX Skip this when sv_pvn_force calls */
        /* Sneaky stuff here */

      tokensaveref:
        /* The string lives in a mortal SV, not in sv itself */
        if (!tsv)
            tsv = newSVpv(tmpbuf, 0);
        sv_2mortal(tsv);
        if (lp)
            *lp = SvCUR(tsv);
        return SvPVX(tsv);
    }
    else {
        dVAR;
        STRLEN len;
        const char *t;

        if (tsv) {
            sv_2mortal(tsv);
            t = SvPVX_const(tsv);
            len = SvCUR(tsv);
        }
        else {
            t = tmpbuf;
            len = strlen(tmpbuf);
        }
#ifdef FIXNEGATIVEZERO
        if (len == 2 && t[0] == '-' && t[1] == '0') {
            t = "0";
            len = 1;
        }
#endif
        /* Copy the text (including its NUL) into sv's own buffer; only
         * the private POK flag is set */
        SvUPGRADE(sv, SVt_PV);
        if (lp)
            *lp = len;
        s = SvGROW_mutable(sv, len + 1);
        SvCUR_set(sv, len);
        SvPOKp_on(sv);
        return memcpy(s, t, len + 1);
    }
}
3336
645c22ef 3337/*
6050d10e
JP
3338=for apidoc sv_copypv
3339
3340Copies a stringified representation of the source SV into the
3341destination SV. Automatically performs any necessary mg_get and
54f0641b 3342coercion of numeric values into strings. Guaranteed to preserve
6050d10e 3343UTF-8 flag even from overloaded objects. Similar in nature to
54f0641b
NIS
3344sv_2pv[_flags] but operates directly on an SV instead of just the
3345string. Mostly uses sv_2pv_flags to do its work, except when that
6050d10e
JP
3346would lose the UTF-8'ness of the PV.
3347
3348=cut
3349*/
3350
3351void
3352Perl_sv_copypv(pTHX_ SV *dsv, register SV *ssv)
3353{
446eaa42 3354 STRLEN len;
53c1dcc0 3355 const char * const s = SvPV_const(ssv,len);
cb50f42d 3356 sv_setpvn(dsv,s,len);
446eaa42 3357 if (SvUTF8(ssv))
cb50f42d 3358 SvUTF8_on(dsv);
446eaa42 3359 else
cb50f42d 3360 SvUTF8_off(dsv);
6050d10e
JP
3361}
3362
3363/*
645c22ef
DM
3364=for apidoc sv_2pvbyte_nolen
3365
3366Return a pointer to the byte-encoded representation of the SV.
1e54db1a 3367May cause the SV to be downgraded from UTF-8 as a side-effect.
645c22ef
DM
3368
3369Usually accessed via the C<SvPVbyte_nolen> macro.
3370
3371=cut
3372*/
3373
7340a771
GS
3374char *
3375Perl_sv_2pvbyte_nolen(pTHX_ register SV *sv)
3376{
dafda6d1 3377 return sv_2pvbyte(sv, 0);
7340a771
GS
3378}
3379
645c22ef
DM
3380/*
3381=for apidoc sv_2pvbyte
3382
3383Return a pointer to the byte-encoded representation of the SV, and set *lp
1e54db1a 3384to its length. May cause the SV to be downgraded from UTF-8 as a
645c22ef
DM
3385side-effect.
3386
3387Usually accessed via the C<SvPVbyte> macro.
3388
3389=cut
3390*/
3391
7340a771
GS
3392char *
3393Perl_sv_2pvbyte(pTHX_ register SV *sv, STRLEN *lp)
3394{
0875d2fe 3395 sv_utf8_downgrade(sv,0);
97972285 3396 return lp ? SvPV(sv,*lp) : SvPV_nolen(sv);
7340a771
GS
3397}
3398
645c22ef
DM
3399/*
3400=for apidoc sv_2pvutf8_nolen
3401
1e54db1a
JH
3402Return a pointer to the UTF-8-encoded representation of the SV.
3403May cause the SV to be upgraded to UTF-8 as a side-effect.
645c22ef
DM
3404
3405Usually accessed via the C<SvPVutf8_nolen> macro.
3406
3407=cut
3408*/
3409
7340a771
GS
3410char *
3411Perl_sv_2pvutf8_nolen(pTHX_ register SV *sv)
3412{
dafda6d1 3413 return sv_2pvutf8(sv, 0);
7340a771
GS
3414}
3415
645c22ef
DM
3416/*
3417=for apidoc sv_2pvutf8
3418
1e54db1a
JH
3419Return a pointer to the UTF-8-encoded representation of the SV, and set *lp
3420to its length. May cause the SV to be upgraded to UTF-8 as a side-effect.
645c22ef
DM
3421
3422Usually accessed via the C<SvPVutf8> macro.
3423
3424=cut
3425*/
3426
7340a771
GS
3427char *
3428Perl_sv_2pvutf8(pTHX_ register SV *sv, STRLEN *lp)
3429{
560a288e 3430 sv_utf8_upgrade(sv);
7d59b7e4 3431 return SvPV(sv,*lp);
7340a771 3432}
1c846c1f 3433
645c22ef
DM
3434/*
3435=for apidoc sv_2bool
3436
3437This function is only called on magical items, and is only used by
8cf8f3d1 3438sv_true() or its macro equivalent.
645c22ef
DM
3439
3440=cut
3441*/
3442
463ee0b2 3443bool
864dbfa3 3444Perl_sv_2bool(pTHX_ register SV *sv)
463ee0b2 3445{
8990e307 3446 if (SvGMAGICAL(sv))
463ee0b2
LW
3447 mg_get(sv);
3448
a0d0e21e
LW
3449 if (!SvOK(sv))
3450 return 0;
3451 if (SvROK(sv)) {
a0d0e21e 3452 SV* tmpsv;
1554e226 3453 if (SvAMAGIC(sv) && (tmpsv=AMG_CALLun(sv,bool_)) &&
9e3013b1 3454 (!SvROK(tmpsv) || (SvRV(tmpsv) != SvRV(sv))))
8a31060d 3455 return (bool)SvTRUE(tmpsv);
a0d0e21e
LW
3456 return SvRV(sv) != 0;
3457 }
463ee0b2 3458 if (SvPOKp(sv)) {
53c1dcc0
AL
3459 register XPV* const Xpvtmp = (XPV*)SvANY(sv);
3460 if (Xpvtmp &&
339049b0 3461 (*sv->sv_u.svu_pv > '0' ||
11343788 3462 Xpvtmp->xpv_cur > 1 ||
339049b0 3463 (Xpvtmp->xpv_cur && *sv->sv_u.svu_pv != '0')))
463ee0b2
LW
3464 return 1;
3465 else
3466 return 0;
3467 }
3468 else {
3469 if (SvIOKp(sv))
3470 return SvIVX(sv) != 0;
3471 else {
3472 if (SvNOKp(sv))
3473 return SvNVX(sv) != 0.0;
3474 else
3475 return FALSE;
3476 }
3477 }
79072805
LW
3478}
3479
09540bc3
JH
3480/* sv_utf8_upgrade() is now a macro using sv_utf8_upgrade_flags();
3481 * this function provided for binary compatibility only
3482 */
3483
3484
3485STRLEN
3486Perl_sv_utf8_upgrade(pTHX_ register SV *sv)
3487{
3488 return sv_utf8_upgrade_flags(sv, SV_GMAGIC);
3489}
3490
c461cf8f
JH
3491/*
3492=for apidoc sv_utf8_upgrade
3493
78ea37eb 3494Converts the PV of an SV to its UTF-8-encoded form.
645c22ef 3495Forces the SV to string form if it is not already.
4411f3b6
NIS
3496Always sets the SvUTF8 flag to avoid future validity checks even
3497if all the bytes have hibit clear.
c461cf8f 3498
13a6c0e0
JH
3499This is not as a general purpose byte encoding to Unicode interface:
3500use the Encode extension for that.
3501
8d6d96c1
HS
3502=for apidoc sv_utf8_upgrade_flags
3503
78ea37eb 3504Converts the PV of an SV to its UTF-8-encoded form.
645c22ef 3505Forces the SV to string form if it is not already.
8d6d96c1
HS
3506Always sets the SvUTF8 flag to avoid future validity checks even
3507if all the bytes have hibit clear. If C<flags> has C<SV_GMAGIC> bit set,
3508will C<mg_get> on C<sv> if appropriate, else not. C<sv_utf8_upgrade> and
3509C<sv_utf8_upgrade_nomg> are implemented in terms of this function.
3510
13a6c0e0
JH
3511This is not as a general purpose byte encoding to Unicode interface:
3512use the Encode extension for that.
3513
8d6d96c1
HS
3514=cut
3515*/
3516
3517STRLEN
3518Perl_sv_utf8_upgrade_flags(pTHX_ register SV *sv, I32 flags)
3519{
808c356f
RGS
3520 if (sv == &PL_sv_undef)
3521 return 0;
e0e62c2a
NIS
3522 if (!SvPOK(sv)) {
3523 STRLEN len = 0;
d52b7888
NC
3524 if (SvREADONLY(sv) && (SvPOKp(sv) || SvIOKp(sv) || SvNOKp(sv))) {
3525 (void) sv_2pv_flags(sv,&len, flags);
3526 if (SvUTF8(sv))
3527 return len;
3528 } else {
3529 (void) SvPV_force(sv,len);
3530 }
e0e62c2a 3531 }
4411f3b6 3532
f5cee72b 3533 if (SvUTF8(sv)) {
5fec3b1d 3534 return SvCUR(sv);
f5cee72b 3535 }
5fec3b1d 3536
765f542d
NC
3537 if (SvIsCOW(sv)) {
3538 sv_force_normal_flags(sv, 0);
db42d148
NIS
3539 }
3540
88632417 3541 if (PL_encoding && !(flags & SV_UTF8_NO_ENCODING))
799ef3cb 3542 sv_recode_to_utf8(sv, PL_encoding);
9f4817db 3543 else { /* Assume Latin-1/EBCDIC */
c4e7c712
NC
3544 /* This function could be much more efficient if we
3545 * had a FLAG in SVs to signal if there are any hibit
3546 * chars in the PV. Given that there isn't such a flag
3547 * make the loop as fast as possible. */
93524f2b
NC
3548 const U8 *s = (U8 *) SvPVX_const(sv);
3549 const U8 *e = (U8 *) SvEND(sv);
3550 const U8 *t = s;
c4e7c712
NC
3551 int hibit = 0;
3552
3553 while (t < e) {
53c1dcc0 3554 const U8 ch = *t++;
c4e7c712
NC
3555 if ((hibit = !NATIVE_IS_INVARIANT(ch)))
3556 break;
3557 }
3558 if (hibit) {
3559 STRLEN len = SvCUR(sv) + 1; /* Plus the \0 */
53c1dcc0 3560 U8 * const recoded = bytes_to_utf8((U8*)s, &len);
c4e7c712
NC
3561
3562 SvPV_free(sv); /* No longer using what was there before. */
3563
1e2ebb21 3564 SvPV_set(sv, (char*)recoded);
c4e7c712
NC
3565 SvCUR_set(sv, len - 1);
3566 SvLEN_set(sv, len); /* No longer know the real size. */
3567 }
3568 /* Mark as UTF-8 even if no hibit - saves scanning loop */
3569 SvUTF8_on(sv);
560a288e 3570 }
4411f3b6 3571 return SvCUR(sv);
560a288e
GS
3572}
3573
c461cf8f
JH
3574/*
3575=for apidoc sv_utf8_downgrade
3576
78ea37eb
TS
3577Attempts to convert the PV of an SV from characters to bytes.
3578If the PV contains a character beyond byte, this conversion will fail;
3579in this case, either returns false or, if C<fail_ok> is not
c461cf8f
JH
3580true, croaks.
3581
13a6c0e0
JH
3582This is not as a general purpose Unicode to byte encoding interface:
3583use the Encode extension for that.
3584
c461cf8f
JH
3585=cut
3586*/
3587
560a288e
GS
3588bool
3589Perl_sv_utf8_downgrade(pTHX_ register SV* sv, bool fail_ok)
3590{
78ea37eb 3591 if (SvPOKp(sv) && SvUTF8(sv)) {
fa301091 3592 if (SvCUR(sv)) {
03cfe0ae 3593 U8 *s;
652088fc 3594 STRLEN len;
fa301091 3595
765f542d
NC
3596 if (SvIsCOW(sv)) {
3597 sv_force_normal_flags(sv, 0);
3598 }
03cfe0ae
NIS
3599 s = (U8 *) SvPV(sv, len);
3600 if (!utf8_to_bytes(s, &len)) {
fa301091
JH
3601 if (fail_ok)
3602 return FALSE;
3603 else {
3604 if (PL_op)
3605 Perl_croak(aTHX_ "Wide character in %s",
53e06cf0 3606 OP_DESC(PL_op));
fa301091
JH
3607 else
3608 Perl_croak(aTHX_ "Wide character");
3609 }
4b3603a4 3610 }
b162af07 3611 SvCUR_set(sv, len);
67e989fb 3612 }
560a288e 3613 }
ffebcc3e 3614 SvUTF8_off(sv);
560a288e
GS
3615 return TRUE;
3616}
3617
c461cf8f
JH
3618/*
3619=for apidoc sv_utf8_encode
3620
78ea37eb
TS
3621Converts the PV of an SV to UTF-8, but then turns the C<SvUTF8>
3622flag off so that it looks like octets again.
c461cf8f
JH
3623
3624=cut
3625*/
3626
560a288e
GS
3627void
3628Perl_sv_utf8_encode(pTHX_ register SV *sv)
3629{
4411f3b6 3630 (void) sv_utf8_upgrade(sv);
4c94c214
NC
3631 if (SvIsCOW(sv)) {
3632 sv_force_normal_flags(sv, 0);
3633 }
3634 if (SvREADONLY(sv)) {
3635 Perl_croak(aTHX_ PL_no_modify);
3636 }
560a288e
GS
3637 SvUTF8_off(sv);
3638}
3639
4411f3b6
NIS
3640/*
3641=for apidoc sv_utf8_decode
3642
78ea37eb
TS
3643If the PV of the SV is an octet sequence in UTF-8
3644and contains a multiple-byte character, the C<SvUTF8> flag is turned on
3645so that it looks like a character. If the PV contains only single-byte
3646characters, the C<SvUTF8> flag stays being off.
3647Scans PV for validity and returns false if the PV is invalid UTF-8.
4411f3b6
NIS
3648
3649=cut
3650*/
3651
560a288e
GS
3652bool
3653Perl_sv_utf8_decode(pTHX_ register SV *sv)
3654{
78ea37eb 3655 if (SvPOKp(sv)) {
93524f2b
NC
3656 const U8 *c;
3657 const U8 *e;
9cbac4c7 3658
645c22ef
DM
3659 /* The octets may have got themselves encoded - get them back as
3660 * bytes
3661 */
3662 if (!sv_utf8_downgrade(sv, TRUE))
560a288e
GS
3663 return FALSE;
3664
3665 /* it is actually just a matter of turning the utf8 flag on, but
3666 * we want to make sure everything inside is valid utf8 first.
3667 */
93524f2b 3668 c = (const U8 *) SvPVX_const(sv);
63cd0674 3669 if (!is_utf8_string(c, SvCUR(sv)+1))
67e989fb 3670 return FALSE;
93524f2b 3671 e = (const U8 *) SvEND(sv);
511c2ff0 3672 while (c < e) {
b64e5050 3673 const U8 ch = *c++;
c4d5f83a 3674 if (!UTF8_IS_INVARIANT(ch)) {
67e989fb
JH
3675 SvUTF8_on(sv);
3676 break;
3677 }
560a288e 3678 }
560a288e
GS
3679 }
3680 return TRUE;
3681}
3682
09540bc3
JH
3683/* sv_setsv() is now a macro using Perl_sv_setsv_flags();
3684 * this function provided for binary compatibility only
3685 */
3686
3687void
3688Perl_sv_setsv(pTHX_ SV *dstr, register SV *sstr)
3689{
3690 sv_setsv_flags(dstr, sstr, SV_GMAGIC);
3691}
3692
954c1994
GS
3693/*
3694=for apidoc sv_setsv
3695
645c22ef
DM
3696Copies the contents of the source SV C<ssv> into the destination SV
3697C<dsv>. The source SV may be destroyed if it is mortal, so don't use this
3698function if the source SV needs to be reused. Does not handle 'set' magic.
3699Loosely speaking, it performs a copy-by-value, obliterating any previous
3700content of the destination.
3701
3702You probably want to use one of the assortment of wrappers, such as
3703C<SvSetSV>, C<SvSetSV_nosteal>, C<SvSetMagicSV> and
3704C<SvSetMagicSV_nosteal>.
3705
8d6d96c1
HS
3706=for apidoc sv_setsv_flags
3707
645c22ef
DM
3708Copies the contents of the source SV C<ssv> into the destination SV
3709C<dsv>. The source SV may be destroyed if it is mortal, so don't use this
3710function if the source SV needs to be reused. Does not handle 'set' magic.
3711Loosely speaking, it performs a copy-by-value, obliterating any previous
3712content of the destination.
3713If the C<flags> parameter has the C<SV_GMAGIC> bit set, will C<mg_get> on
5fcdf167
NC
3714C<ssv> if appropriate, else not. If the C<flags> parameter has the
3715C<NOSTEAL> bit set then the buffers of temps will not be stolen. <sv_setsv>
3716and C<sv_setsv_nomg> are implemented in terms of this function.
645c22ef
DM
3717
3718You probably want to use one of the assortment of wrappers, such as
3719C<SvSetSV>, C<SvSetSV_nosteal>, C<SvSetMagicSV> and
3720C<SvSetMagicSV_nosteal>.
3721
3722This is the primary function for copying scalars, and most other
3723copy-ish functions and macros use this underneath.
8d6d96c1
HS
3724
3725=cut
3726*/
3727
3728void
3729Perl_sv_setsv_flags(pTHX_ SV *dstr, register SV *sstr, I32 flags)
3730{
8990e307
LW
3731 register U32 sflags;
3732 register int dtype;
3733 register int stype;
463ee0b2 3734
79072805
LW
3735 if (sstr == dstr)
3736 return;
765f542d 3737 SV_CHECK_THINKFIRST_COW_DROP(dstr);
79072805 3738 if (!sstr)
3280af22 3739 sstr = &PL_sv_undef;
8990e307
LW
3740 stype = SvTYPE(sstr);
3741 dtype = SvTYPE(dstr);
79072805 3742
a0d0e21e 3743 SvAMAGIC_off(dstr);
7a5fa8a2 3744 if ( SvVOK(dstr) )
ece467f9
JP
3745 {
3746 /* need to nuke the magic */
3747 mg_free(dstr);
3748 SvRMAGICAL_off(dstr);
3749 }
9e7bc3e8 3750
463ee0b2 3751 /* There's a lot of redundancy below but we're going for speed here */
79072805 3752
8990e307 3753 switch (stype) {
79072805 3754 case SVt_NULL:
aece5585 3755 undef_sstr:
20408e3c
GS
3756 if (dtype != SVt_PVGV) {
3757 (void)SvOK_off(dstr);
3758 return;
3759 }
3760 break;
463ee0b2 3761 case SVt_IV:
aece5585
GA
3762 if (SvIOK(sstr)) {
3763 switch (dtype) {
3764 case SVt_NULL:
8990e307 3765 sv_upgrade(dstr, SVt_IV);
aece5585
GA
3766 break;
3767 case SVt_NV:
8990e307 3768 sv_upgrade(dstr, SVt_PVNV);
aece5585
GA
3769 break;
3770 case SVt_RV:
3771 case SVt_PV:
a0d0e21e 3772 sv_upgrade(dstr, SVt_PVIV);
aece5585
GA
3773 break;
3774 }
3775 (void)SvIOK_only(dstr);
45977657 3776 SvIV_set(dstr, SvIVX(sstr));
25da4f38
IZ
3777 if (SvIsUV(sstr))
3778 SvIsUV_on(dstr);
27c9684d
AP
3779 if (SvTAINTED(sstr))
3780 SvTAINT(dstr);
aece5585 3781 return;
8990e307 3782 }
aece5585
GA
3783 goto undef_sstr;
3784
463ee0b2 3785 case SVt_NV:
aece5585
GA
3786 if (SvNOK(sstr)) {
3787 switch (dtype) {
3788 case SVt_NULL:
3789 case SVt_IV:
8990e307 3790 sv_upgrade(dstr, SVt_NV);
aece5585
GA
3791 break;
3792 case SVt_RV:
3793 case SVt_PV:
3794 case SVt_PVIV:
a0d0e21e 3795 sv_upgrade(dstr, SVt_PVNV);
aece5585
GA
3796 break;
3797 }
9d6ce603 3798 SvNV_set(dstr, SvNVX(sstr));
aece5585 3799 (void)SvNOK_only(dstr);
27c9684d
AP
3800 if (SvTAINTED(sstr))
3801 SvTAINT(dstr);
aece5585 3802 return;
8990e307 3803 }
aece5585
GA
3804 goto undef_sstr;
3805
ed6116ce 3806 case SVt_RV:
8990e307 3807 if (dtype < SVt_RV)
ed6116ce 3808 sv_upgrade(dstr, SVt_RV);
c07a80fd 3809 else if (dtype == SVt_PVGV &&
23bb1b96 3810 SvROK(sstr) && SvTYPE(SvRV(sstr)) == SVt_PVGV) {
c07a80fd 3811 sstr = SvRV(sstr);
a5f75d66 3812 if (sstr == dstr) {
1d7c1841
GS
3813 if (GvIMPORTED(dstr) != GVf_IMPORTED
3814 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3815 {
a5f75d66 3816 GvIMPORTED_on(dstr);
1d7c1841 3817 }
a5f75d66
AD
3818 GvMULTI_on(dstr);
3819 return;
3820 }
c07a80fd 3821 goto glob_assign;
3822 }
ed6116ce 3823 break;
fc36a67e 3824 case SVt_PVFM:
f8c7b90f 3825#ifdef PERL_OLD_COPY_ON_WRITE
d89fc664
NC
3826 if ((SvFLAGS(sstr) & CAN_COW_MASK) == CAN_COW_FLAGS) {
3827 if (dtype < SVt_PVIV)
3828 sv_upgrade(dstr, SVt_PVIV);
3829 break;
3830 }
3831 /* Fall through */
3832#endif
3833 case SVt_PV:
8990e307 3834 if (dtype < SVt_PV)
463ee0b2 3835 sv_upgrade(dstr, SVt_PV);
463ee0b2
LW
3836 break;
3837 case SVt_PVIV:
8990e307 3838 if (dtype < SVt_PVIV)
463ee0b2 3839 sv_upgrade(dstr, SVt_PVIV);
463ee0b2
LW
3840 break;
3841 case SVt_PVNV:
8990e307 3842 if (dtype < SVt_PVNV)
463ee0b2 3843 sv_upgrade(dstr, SVt_PVNV);
463ee0b2 3844 break;
4633a7c4
LW
3845 case SVt_PVAV:
3846 case SVt_PVHV:
3847 case SVt_PVCV:
4633a7c4 3848 case SVt_PVIO:
a3b680e6
AL
3849 {
3850 const char * const type = sv_reftype(sstr,0);
533c011a 3851 if (PL_op)
a3b680e6 3852 Perl_croak(aTHX_ "Bizarre copy of %s in %s", type, OP_NAME(PL_op));
4633a7c4 3853 else
a3b680e6
AL
3854 Perl_croak(aTHX_ "Bizarre copy of %s", type);
3855 }
4633a7c4
LW
3856 break;
3857
79072805 3858 case SVt_PVGV:
8990e307 3859 if (dtype <= SVt_PVGV) {
c07a80fd 3860 glob_assign:
a5f75d66 3861 if (dtype != SVt_PVGV) {
a3b680e6
AL
3862 const char * const name = GvNAME(sstr);
3863 const STRLEN len = GvNAMELEN(sstr);
b76195c2
DM
3864 /* don't upgrade SVt_PVLV: it can hold a glob */
3865 if (dtype != SVt_PVLV)
3866 sv_upgrade(dstr, SVt_PVGV);
14befaf4 3867 sv_magic(dstr, dstr, PERL_MAGIC_glob, Nullch, 0);
e15faf7d
NC
3868 GvSTASH(dstr) = GvSTASH(sstr);
3869 if (GvSTASH(dstr))
3870 Perl_sv_add_backref(aTHX_ (SV*)GvSTASH(dstr), dstr);
a0d0e21e
LW
3871 GvNAME(dstr) = savepvn(name, len);
3872 GvNAMELEN(dstr) = len;
3873 SvFAKE_on(dstr); /* can coerce to non-glob */
3874 }
7bac28a0 3875 /* ahem, death to those who redefine active sort subs */
3280af22
NIS
3876 else if (PL_curstackinfo->si_type == PERLSI_SORT
3877 && GvCV(dstr) && PL_sortcop == CvSTART(GvCV(dstr)))
cea2e8a9 3878 Perl_croak(aTHX_ "Can't redefine active sort subroutine %s",
7bac28a0 3879 GvNAME(dstr));
5bd07a3d 3880
7fb37951
AMS
3881#ifdef GV_UNIQUE_CHECK
3882 if (GvUNIQUE((GV*)dstr)) {
5bd07a3d
DM
3883 Perl_croak(aTHX_ PL_no_modify);
3884 }
3885#endif
3886
a0d0e21e 3887 (void)SvOK_off(dstr);
a5f75d66 3888 GvINTRO_off(dstr); /* one-shot flag */
1edc1566 3889 gp_free((GV*)dstr);
79072805 3890 GvGP(dstr) = gp_ref(GvGP(sstr));
27c9684d
AP
3891 if (SvTAINTED(sstr))
3892 SvTAINT(dstr);
1d7c1841
GS
3893 if (GvIMPORTED(dstr) != GVf_IMPORTED
3894 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3895 {
a5f75d66 3896 GvIMPORTED_on(dstr);
1d7c1841 3897 }
a5f75d66 3898 GvMULTI_on(dstr);
79072805
LW
3899 return;
3900 }
3901 /* FALL THROUGH */
3902
3903 default:
8d6d96c1 3904 if (SvGMAGICAL(sstr) && (flags & SV_GMAGIC)) {
973f89ab 3905 mg_get(sstr);
eb160463 3906 if ((int)SvTYPE(sstr) != stype) {
973f89ab
CS
3907 stype = SvTYPE(sstr);
3908 if (stype == SVt_PVGV && dtype <= SVt_PVGV)
3909 goto glob_assign;
3910 }
3911 }
ded42b9f 3912 if (stype == SVt_PVLV)
862a34c6 3913 SvUPGRADE(dstr, SVt_PVNV);
ded42b9f 3914 else
862a34c6 3915 SvUPGRADE(dstr, (U32)stype);
79072805
LW
3916 }
3917
8990e307
LW
3918 sflags = SvFLAGS(sstr);
3919
3920 if (sflags & SVf_ROK) {
3921 if (dtype >= SVt_PV) {
3922 if (dtype == SVt_PVGV) {
3923 SV *sref = SvREFCNT_inc(SvRV(sstr));
3924 SV *dref = 0;
a3b680e6 3925 const int intro = GvINTRO(dstr);
a0d0e21e 3926
7fb37951
AMS
3927#ifdef GV_UNIQUE_CHECK
3928 if (GvUNIQUE((GV*)dstr)) {
5bd07a3d
DM
3929 Perl_croak(aTHX_ PL_no_modify);
3930 }
3931#endif
3932
a0d0e21e 3933 if (intro) {
a5f75d66 3934 GvINTRO_off(dstr); /* one-shot flag */
1d7c1841 3935 GvLINE(dstr) = CopLINE(PL_curcop);
1edc1566 3936 GvEGV(dstr) = (GV*)dstr;
a0d0e21e 3937 }
a5f75d66 3938 GvMULTI_on(dstr);
8990e307
LW
3939 switch (SvTYPE(sref)) {
3940 case SVt_PVAV:
a0d0e21e 3941 if (intro)
890ed176 3942 SAVEGENERICSV(GvAV(dstr));
a0d0e21e
LW
3943 else
3944 dref = (SV*)GvAV(dstr);
8990e307 3945 GvAV(dstr) = (AV*)sref;
39bac7f7 3946 if (!GvIMPORTED_AV(dstr)
1d7c1841
GS
3947 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3948 {
a5f75d66 3949 GvIMPORTED_AV_on(dstr);
1d7c1841 3950 }
8990e307
LW
3951 break;
3952 case SVt_PVHV:
a0d0e21e 3953 if (intro)
890ed176 3954 SAVEGENERICSV(GvHV(dstr));
a0d0e21e
LW
3955 else
3956 dref = (SV*)GvHV(dstr);
8990e307 3957 GvHV(dstr) = (HV*)sref;
39bac7f7 3958 if (!GvIMPORTED_HV(dstr)
1d7c1841
GS
3959 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3960 {
a5f75d66 3961 GvIMPORTED_HV_on(dstr);
1d7c1841 3962 }
8990e307
LW
3963 break;
3964 case SVt_PVCV:
8ebc5c01 3965 if (intro) {
3966 if (GvCVGEN(dstr) && GvCV(dstr) != (CV*)sref) {
3967 SvREFCNT_dec(GvCV(dstr));
3968 GvCV(dstr) = Nullcv;
68dc0745 3969 GvCVGEN(dstr) = 0; /* Switch off cacheness. */
3280af22 3970 PL_sub_generation++;
8ebc5c01 3971 }
890ed176 3972 SAVEGENERICSV(GvCV(dstr));
8ebc5c01 3973 }
68dc0745 3974 else
3975 dref = (SV*)GvCV(dstr);
3976 if (GvCV(dstr) != (CV*)sref) {
748a9306 3977 CV* cv = GvCV(dstr);
4633a7c4 3978 if (cv) {
68dc0745 3979 if (!GvCVGEN((GV*)dstr) &&
3980 (CvROOT(cv) || CvXSUB(cv)))
3981 {
7bac28a0 3982 /* ahem, death to those who redefine
3983 * active sort subs */
3280af22
NIS
3984 if (PL_curstackinfo->si_type == PERLSI_SORT &&
3985 PL_sortcop == CvSTART(cv))
1c846c1f 3986 Perl_croak(aTHX_
7bac28a0 3987 "Can't redefine active sort subroutine %s",
3988 GvENAME((GV*)dstr));
beab0874
JT
3989 /* Redefining a sub - warning is mandatory if
3990 it was a const and its value changed. */
3991 if (ckWARN(WARN_REDEFINE)
3992 || (CvCONST(cv)
3993 && (!CvCONST((CV*)sref)
3994 || sv_cmp(cv_const_sv(cv),
3995 cv_const_sv((CV*)sref)))))
3996 {
9014280d 3997 Perl_warner(aTHX_ packWARN(WARN_REDEFINE),
beab0874 3998 CvCONST(cv)
910764e6
RGS
3999 ? "Constant subroutine %s::%s redefined"
4000 : "Subroutine %s::%s redefined",
bfcb3514 4001 HvNAME_get(GvSTASH((GV*)dstr)),
beab0874
JT
4002 GvENAME((GV*)dstr));
4003 }
9607fc9c 4004 }
fb24441d
RGS
4005 if (!intro)
4006 cv_ckproto(cv, (GV*)dstr,
93524f2b
NC
4007 SvPOK(sref)
4008 ? SvPVX_const(sref) : Nullch);
4633a7c4 4009 }
a5f75d66 4010 GvCV(dstr) = (CV*)sref;
7a4c00b4 4011 GvCVGEN(dstr) = 0; /* Switch off cacheness. */
a5f75d66 4012 GvASSUMECV_on(dstr);
3280af22 4013 PL_sub_generation++;
a5f75d66 4014 }
39bac7f7 4015 if (!GvIMPORTED_CV(dstr)
1d7c1841
GS
4016 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
4017 {
a5f75d66 4018 GvIMPORTED_CV_on(dstr);
1d7c1841 4019 }
8990e307 4020 break;
91bba347
LW
4021 case SVt_PVIO:
4022 if (intro)
890ed176 4023 SAVEGENERICSV(GvIOp(dstr));
91bba347
LW
4024 else
4025 dref = (SV*)GvIOp(dstr);
4026 GvIOp(dstr) = (IO*)sref;
4027 break;
f4d13ee9
JH
4028 case SVt_PVFM:
4029 if (intro)
890ed176 4030 SAVEGENERICSV(GvFORM(dstr));
f4d13ee9
JH
4031 else
4032 dref = (SV*)GvFORM(dstr);
4033 GvFORM(dstr) = (CV*)sref;
4034 break;
8990e307 4035 default:
a0d0e21e 4036 if (intro)
890ed176 4037 SAVEGENERICSV(GvSV(dstr));
a0d0e21e
LW
4038 else
4039 dref = (SV*)GvSV(dstr);
8990e307 4040 GvSV(dstr) = sref;
39bac7f7 4041 if (!GvIMPORTED_SV(dstr)
1d7c1841
GS
4042 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
4043 {
a5f75d66 4044 GvIMPORTED_SV_on(dstr);
1d7c1841 4045 }
8990e307
LW
4046 break;
4047 }
4048 if (dref)
4049 SvREFCNT_dec(dref);
27c9684d
AP
4050 if (SvTAINTED(sstr))
4051 SvTAINT(dstr);
8990e307
LW
4052 return;
4053 }
3f7c398e 4054 if (SvPVX_const(dstr)) {
8bd4d4c5 4055 SvPV_free(dstr);
b162af07
SP
4056 SvLEN_set(dstr, 0);
4057 SvCUR_set(dstr, 0);
a0d0e21e 4058 }
8990e307 4059 }
a0d0e21e 4060 (void)SvOK_off(dstr);
b162af07 4061 SvRV_set(dstr, SvREFCNT_inc(SvRV(sstr)));
ed6116ce 4062 SvROK_on(dstr);
8990e307 4063 if (sflags & SVp_NOK) {
3332b3c1
JH
4064 SvNOKp_on(dstr);
4065 /* Only set the public OK flag if the source has public OK. */
4066 if (sflags & SVf_NOK)
4067 SvFLAGS(dstr) |= SVf_NOK;
9d6ce603 4068 SvNV_set(dstr, SvNVX(sstr));
ed6116ce 4069 }
8990e307 4070 if (sflags & SVp_IOK) {
3332b3c1
JH
4071 (void)SvIOKp_on(dstr);
4072 if (sflags & SVf_IOK)
4073 SvFLAGS(dstr) |= SVf_IOK;
2b1c7e3e 4074 if (sflags & SVf_IVisUV)
25da4f38 4075 SvIsUV_on(dstr);
45977657 4076 SvIV_set(dstr, SvIVX(sstr));
ed6116ce 4077 }
a0d0e21e
LW
4078 if (SvAMAGIC(sstr)) {
4079 SvAMAGIC_on(dstr);
4080 }
ed6116ce 4081 }
8990e307 4082 else if (sflags & SVp_POK) {
765f542d 4083 bool isSwipe = 0;
79072805
LW
4084
4085 /*
4086 * Check to see if we can just swipe the string. If so, it's a
4087 * possible small lose on short strings, but a big win on long ones.
3f7c398e
SP
4088 * It might even be a win on short strings if SvPVX_const(dstr)
4089 * has to be allocated and SvPVX_const(sstr) has to be freed.
79072805
LW
4090 */
4091
120fac95
NC
4092 /* Whichever path we take through the next code, we want this true,
4093 and doing it now facilitates the COW check. */
4094 (void)SvPOK_only(dstr);
4095
765f542d 4096 if (
b8f9541a
NC
4097 /* We're not already COW */
4098 ((sflags & (SVf_FAKE | SVf_READONLY)) != (SVf_FAKE | SVf_READONLY)
f8c7b90f 4099#ifndef PERL_OLD_COPY_ON_WRITE
b8f9541a
NC
4100 /* or we are, but dstr isn't a suitable target. */
4101 || (SvFLAGS(dstr) & CAN_COW_MASK) != CAN_COW_FLAGS
4102#endif
4103 )
765f542d 4104 &&
765f542d
NC
4105 !(isSwipe =
4106 (sflags & SVs_TEMP) && /* slated for free anyway? */
4107 !(sflags & SVf_OOK) && /* and not involved in OOK hack? */
5fcdf167
NC
4108 (!(flags & SV_NOSTEAL)) &&
4109 /* and we're allowed to steal temps */
765f542d
NC
4110 SvREFCNT(sstr) == 1 && /* and no other references to it? */
4111 SvLEN(sstr) && /* and really is a string */
645c22ef 4112 /* and won't be needed again, potentially */
765f542d 4113 !(PL_op && PL_op->op_type == OP_AASSIGN))
f8c7b90f 4114#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 4115 && !((sflags & CAN_COW_MASK) == CAN_COW_FLAGS
120fac95 4116 && (SvFLAGS(dstr) & CAN_COW_MASK) == CAN_COW_FLAGS
765f542d
NC
4117 && SvTYPE(sstr) >= SVt_PVIV)
4118#endif
4119 ) {
4120 /* Failed the swipe test, and it's not a shared hash key either.
4121 Have to copy the string. */
4122 STRLEN len = SvCUR(sstr);
4123 SvGROW(dstr, len + 1); /* inlined from sv_setpvn */
3f7c398e 4124 Move(SvPVX_const(sstr),SvPVX(dstr),len,char);
765f542d
NC
4125 SvCUR_set(dstr, len);
4126 *SvEND(dstr) = '\0';
765f542d 4127 } else {
f8c7b90f 4128 /* If PERL_OLD_COPY_ON_WRITE is not defined, then isSwipe will always
765f542d 4129 be true in here. */
765f542d
NC
4130 /* Either it's a shared hash key, or it's suitable for
4131 copy-on-write or we can swipe the string. */
46187eeb 4132 if (DEBUG_C_TEST) {
ed252734 4133 PerlIO_printf(Perl_debug_log, "Copy on write: sstr --> dstr\n");
e419cbc5
NC
4134 sv_dump(sstr);
4135 sv_dump(dstr);
46187eeb 4136 }
f8c7b90f 4137#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4138 if (!isSwipe) {
4139 /* I believe I should acquire a global SV mutex if
4140 it's a COW sv (not a shared hash key) to stop
4141 it going un copy-on-write.
4142 If the source SV has gone un copy on write between up there
4143 and down here, then (assert() that) it is of the correct
4144 form to make it copy on write again */
4145 if ((sflags & (SVf_FAKE | SVf_READONLY))
4146 != (SVf_FAKE | SVf_READONLY)) {
4147 SvREADONLY_on(sstr);
4148 SvFAKE_on(sstr);
4149 /* Make the source SV into a loop of 1.
4150 (about to become 2) */
a29f6d03 4151 SV_COW_NEXT_SV_SET(sstr, sstr);
765f542d
NC
4152 }
4153 }
4154#endif
4155 /* Initial code is common. */
94010e71
NC
4156 if (SvPVX_const(dstr)) { /* we know that dtype >= SVt_PV */
4157 SvPV_free(dstr);
79072805 4158 }
765f542d 4159
765f542d
NC
4160 if (!isSwipe) {
4161 /* making another shared SV. */
4162 STRLEN cur = SvCUR(sstr);
4163 STRLEN len = SvLEN(sstr);
f8c7b90f 4164#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 4165 if (len) {
b8f9541a 4166 assert (SvTYPE(dstr) >= SVt_PVIV);
765f542d
NC
4167 /* SvIsCOW_normal */
4168 /* splice us in between source and next-after-source. */
a29f6d03
NC
4169 SV_COW_NEXT_SV_SET(dstr, SV_COW_NEXT_SV(sstr));
4170 SV_COW_NEXT_SV_SET(sstr, dstr);
940132f3 4171 SvPV_set(dstr, SvPVX_mutable(sstr));
a604c751
NC
4172 } else
4173#endif
4174 {
765f542d 4175 /* SvIsCOW_shared_hash */
46187eeb
NC
4176 DEBUG_C(PerlIO_printf(Perl_debug_log,
4177 "Copy on write: Sharing hash\n"));
b8f9541a 4178
bdd68bc3 4179 assert (SvTYPE(dstr) >= SVt_PV);
765f542d 4180 SvPV_set(dstr,
d1db91c6 4181 HEK_KEY(share_hek_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr)))));
bdd68bc3 4182 }
87a1ef3d
SP
4183 SvLEN_set(dstr, len);
4184 SvCUR_set(dstr, cur);
765f542d
NC
4185 SvREADONLY_on(dstr);
4186 SvFAKE_on(dstr);
4187 /* Release a global SV mutex. */
4188 }
4189 else
765f542d 4190 { /* Passes the swipe test. */
78d1e721 4191 SvPV_set(dstr, SvPVX_mutable(sstr));
765f542d
NC
4192 SvLEN_set(dstr, SvLEN(sstr));
4193 SvCUR_set(dstr, SvCUR(sstr));
4194
4195 SvTEMP_off(dstr);
4196 (void)SvOK_off(sstr); /* NOTE: nukes most SvFLAGS on sstr */
4197 SvPV_set(sstr, Nullch);
4198 SvLEN_set(sstr, 0);
4199 SvCUR_set(sstr, 0);
4200 SvTEMP_off(sstr);
4201 }
4202 }
9aa983d2 4203 if (sflags & SVf_UTF8)
a7cb1f99 4204 SvUTF8_on(dstr);
8990e307 4205 if (sflags & SVp_NOK) {
3332b3c1
JH
4206 SvNOKp_on(dstr);
4207 if (sflags & SVf_NOK)
4208 SvFLAGS(dstr) |= SVf_NOK;
9d6ce603 4209 SvNV_set(dstr, SvNVX(sstr));
79072805 4210 }
8990e307 4211 if (sflags & SVp_IOK) {
3332b3c1
JH
4212 (void)SvIOKp_on(dstr);
4213 if (sflags & SVf_IOK)
4214 SvFLAGS(dstr) |= SVf_IOK;
2b1c7e3e 4215 if (sflags & SVf_IVisUV)
25da4f38 4216 SvIsUV_on(dstr);
45977657 4217 SvIV_set(dstr, SvIVX(sstr));
79072805 4218 }
92f0c265 4219 if (SvVOK(sstr)) {
7a5fa8a2 4220 MAGIC *smg = mg_find(sstr,PERL_MAGIC_vstring);
ece467f9
JP
4221 sv_magic(dstr, NULL, PERL_MAGIC_vstring,
4222 smg->mg_ptr, smg->mg_len);
439cb1c4 4223 SvRMAGICAL_on(dstr);
7a5fa8a2 4224 }
79072805 4225 }
8990e307 4226 else if (sflags & SVp_IOK) {
3332b3c1
JH
4227 if (sflags & SVf_IOK)
4228 (void)SvIOK_only(dstr);
4229 else {
9cbac4c7
DM
4230 (void)SvOK_off(dstr);
4231 (void)SvIOKp_on(dstr);
3332b3c1
JH
4232 }
4233 /* XXXX Do we want to set IsUV for IV(ROK)? Be extra safe... */
2b1c7e3e 4234 if (sflags & SVf_IVisUV)
25da4f38 4235 SvIsUV_on(dstr);
45977657 4236 SvIV_set(dstr, SvIVX(sstr));
3332b3c1
JH
4237 if (sflags & SVp_NOK) {
4238 if (sflags & SVf_NOK)
4239 (void)SvNOK_on(dstr);
4240 else
4241 (void)SvNOKp_on(dstr);
9d6ce603 4242 SvNV_set(dstr, SvNVX(sstr));
3332b3c1
JH
4243 }
4244 }
4245 else if (sflags & SVp_NOK) {
4246 if (sflags & SVf_NOK)
4247 (void)SvNOK_only(dstr);
4248 else {
9cbac4c7 4249 (void)SvOK_off(dstr);
3332b3c1
JH
4250 SvNOKp_on(dstr);
4251 }
9d6ce603 4252 SvNV_set(dstr, SvNVX(sstr));
79072805
LW
4253 }
4254 else {
20408e3c 4255 if (dtype == SVt_PVGV) {
e476b1b5 4256 if (ckWARN(WARN_MISC))
9014280d 4257 Perl_warner(aTHX_ packWARN(WARN_MISC), "Undefined value assigned to typeglob");
20408e3c
GS
4258 }
4259 else
4260 (void)SvOK_off(dstr);
a0d0e21e 4261 }
27c9684d
AP
4262 if (SvTAINTED(sstr))
4263 SvTAINT(dstr);
79072805
LW
4264}
4265
954c1994
GS
4266/*
4267=for apidoc sv_setsv_mg
4268
4269Like C<sv_setsv>, but also handles 'set' magic.
4270
4271=cut
4272*/
4273
79072805 4274void
864dbfa3 4275Perl_sv_setsv_mg(pTHX_ SV *dstr, register SV *sstr)
ef50df4b
GS
4276{
4277 sv_setsv(dstr,sstr);
4278 SvSETMAGIC(dstr);
4279}
4280
f8c7b90f 4281#ifdef PERL_OLD_COPY_ON_WRITE
ed252734
NC
4282SV *
4283Perl_sv_setsv_cow(pTHX_ SV *dstr, SV *sstr)
4284{
4285 STRLEN cur = SvCUR(sstr);
4286 STRLEN len = SvLEN(sstr);
4287 register char *new_pv;
4288
4289 if (DEBUG_C_TEST) {
4290 PerlIO_printf(Perl_debug_log, "Fast copy on write: %p -> %p\n",
4291 sstr, dstr);
4292 sv_dump(sstr);
4293 if (dstr)
4294 sv_dump(dstr);
4295 }
4296
4297 if (dstr) {
4298 if (SvTHINKFIRST(dstr))
4299 sv_force_normal_flags(dstr, SV_COW_DROP_PV);
3f7c398e
SP
4300 else if (SvPVX_const(dstr))
4301 Safefree(SvPVX_const(dstr));
ed252734
NC
4302 }
4303 else
4304 new_SV(dstr);
862a34c6 4305 SvUPGRADE(dstr, SVt_PVIV);
ed252734
NC
4306
4307 assert (SvPOK(sstr));
4308 assert (SvPOKp(sstr));
4309 assert (!SvIOK(sstr));
4310 assert (!SvIOKp(sstr));
4311 assert (!SvNOK(sstr));
4312 assert (!SvNOKp(sstr));
4313
4314 if (SvIsCOW(sstr)) {
4315
4316 if (SvLEN(sstr) == 0) {
4317 /* source is a COW shared hash key. */
ed252734
NC
4318 DEBUG_C(PerlIO_printf(Perl_debug_log,
4319 "Fast copy on write: Sharing hash\n"));
d1db91c6 4320 new_pv = HEK_KEY(share_hek_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr))));
ed252734
NC
4321 goto common_exit;
4322 }
4323 SV_COW_NEXT_SV_SET(dstr, SV_COW_NEXT_SV(sstr));
4324 } else {
4325 assert ((SvFLAGS(sstr) & CAN_COW_MASK) == CAN_COW_FLAGS);
862a34c6 4326 SvUPGRADE(sstr, SVt_PVIV);
ed252734
NC
4327 SvREADONLY_on(sstr);
4328 SvFAKE_on(sstr);
4329 DEBUG_C(PerlIO_printf(Perl_debug_log,
4330 "Fast copy on write: Converting sstr to COW\n"));
4331 SV_COW_NEXT_SV_SET(dstr, sstr);
4332 }
4333 SV_COW_NEXT_SV_SET(sstr, dstr);
940132f3 4334 new_pv = SvPVX_mutable(sstr);
ed252734
NC
4335
4336 common_exit:
4337 SvPV_set(dstr, new_pv);
4338 SvFLAGS(dstr) = (SVt_PVIV|SVf_POK|SVp_POK|SVf_FAKE|SVf_READONLY);
4339 if (SvUTF8(sstr))
4340 SvUTF8_on(dstr);
87a1ef3d
SP
4341 SvLEN_set(dstr, len);
4342 SvCUR_set(dstr, cur);
ed252734
NC
4343 if (DEBUG_C_TEST) {
4344 sv_dump(dstr);
4345 }
4346 return dstr;
4347}
4348#endif
4349
954c1994
GS
4350/*
4351=for apidoc sv_setpvn
4352
4353Copies a string into an SV. The C<len> parameter indicates the number of
9e09f5f2
MHM
4354bytes to be copied. If the C<ptr> argument is NULL the SV will become
4355undefined. Does not handle 'set' magic. See C<sv_setpvn_mg>.
954c1994
GS
4356
4357=cut
4358*/
4359
ef50df4b 4360void
864dbfa3 4361Perl_sv_setpvn(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
79072805 4362{
c6f8c383 4363 register char *dptr;
22c522df 4364
765f542d 4365 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2 4366 if (!ptr) {
a0d0e21e 4367 (void)SvOK_off(sv);
463ee0b2
LW
4368 return;
4369 }
22c522df
JH
4370 else {
4371 /* len is STRLEN which is unsigned, need to copy to signed */
a3b680e6 4372 const IV iv = len;
9c5ffd7c
JH
4373 if (iv < 0)
4374 Perl_croak(aTHX_ "panic: sv_setpvn called with negative strlen");
22c522df 4375 }
862a34c6 4376 SvUPGRADE(sv, SVt_PV);
c6f8c383 4377
5902b6a9 4378 dptr = SvGROW(sv, len + 1);
c6f8c383
GA
4379 Move(ptr,dptr,len,char);
4380 dptr[len] = '\0';
79072805 4381 SvCUR_set(sv, len);
1aa99e6b 4382 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4383 SvTAINT(sv);
79072805
LW
4384}
4385
954c1994
GS
4386/*
4387=for apidoc sv_setpvn_mg
4388
4389Like C<sv_setpvn>, but also handles 'set' magic.
4390
4391=cut
4392*/
4393
79072805 4394void
864dbfa3 4395Perl_sv_setpvn_mg(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
ef50df4b
GS
4396{
4397 sv_setpvn(sv,ptr,len);
4398 SvSETMAGIC(sv);
4399}
4400
954c1994
GS
4401/*
4402=for apidoc sv_setpv
4403
4404Copies a string into an SV. The string must be null-terminated. Does not
4405handle 'set' magic. See C<sv_setpv_mg>.
4406
4407=cut
4408*/
4409
ef50df4b 4410void
864dbfa3 4411Perl_sv_setpv(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4412{
4413 register STRLEN len;
4414
765f542d 4415 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2 4416 if (!ptr) {
a0d0e21e 4417 (void)SvOK_off(sv);
463ee0b2
LW
4418 return;
4419 }
79072805 4420 len = strlen(ptr);
862a34c6 4421 SvUPGRADE(sv, SVt_PV);
c6f8c383 4422
79072805 4423 SvGROW(sv, len + 1);
463ee0b2 4424 Move(ptr,SvPVX(sv),len+1,char);
79072805 4425 SvCUR_set(sv, len);
1aa99e6b 4426 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2
LW
4427 SvTAINT(sv);
4428}
4429
954c1994
GS
4430/*
4431=for apidoc sv_setpv_mg
4432
4433Like C<sv_setpv>, but also handles 'set' magic.
4434
4435=cut
4436*/
4437
463ee0b2 4438void
864dbfa3 4439Perl_sv_setpv_mg(pTHX_ register SV *sv, register const char *ptr)
ef50df4b
GS
4440{
4441 sv_setpv(sv,ptr);
4442 SvSETMAGIC(sv);
4443}
4444
954c1994
GS
4445/*
4446=for apidoc sv_usepvn
4447
4448Tells an SV to use C<ptr> to find its string value. Normally the string is
1c846c1f 4449stored inside the SV but sv_usepvn allows the SV to use an outside string.
954c1994
GS
4450The C<ptr> should point to memory that was allocated by C<malloc>. The
4451string length, C<len>, must be supplied. This function will realloc the
4452memory pointed to by C<ptr>, so that pointer should not be freed or used by
4453the programmer after giving it to sv_usepvn. Does not handle 'set' magic.
4454See C<sv_usepvn_mg>.
4455
4456=cut
4457*/
4458
ef50df4b 4459void
864dbfa3 4460Perl_sv_usepvn(pTHX_ register SV *sv, register char *ptr, register STRLEN len)
463ee0b2 4461{
1936d2a7 4462 STRLEN allocate;
765f542d 4463 SV_CHECK_THINKFIRST_COW_DROP(sv);
862a34c6 4464 SvUPGRADE(sv, SVt_PV);
463ee0b2 4465 if (!ptr) {
a0d0e21e 4466 (void)SvOK_off(sv);
463ee0b2
LW
4467 return;
4468 }
3f7c398e 4469 if (SvPVX_const(sv))
8bd4d4c5 4470 SvPV_free(sv);
1936d2a7
NC
4471
4472 allocate = PERL_STRLEN_ROUNDUP(len + 1);
7a9b70e9 4473 ptr = saferealloc (ptr, allocate);
f880fe2f 4474 SvPV_set(sv, ptr);
463ee0b2 4475 SvCUR_set(sv, len);
1936d2a7 4476 SvLEN_set(sv, allocate);
463ee0b2 4477 *SvEND(sv) = '\0';
1aa99e6b 4478 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4479 SvTAINT(sv);
79072805
LW
4480}
4481
954c1994
GS
4482/*
4483=for apidoc sv_usepvn_mg
4484
4485Like C<sv_usepvn>, but also handles 'set' magic.
4486
4487=cut
4488*/
4489
ef50df4b 4490void
864dbfa3 4491Perl_sv_usepvn_mg(pTHX_ register SV *sv, register char *ptr, register STRLEN len)
ef50df4b 4492{
51c1089b 4493 sv_usepvn(sv,ptr,len);
ef50df4b
GS
4494 SvSETMAGIC(sv);
4495}
4496
f8c7b90f 4497#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4498/* Need to do this *after* making the SV normal, as we need the buffer
4499 pointer to remain valid until after we've copied it. If we let go too early,
4500 another thread could invalidate it by unsharing last of the same hash key
4501 (which it can do by means other than releasing copy-on-write Svs)
4502 or by changing the other copy-on-write SVs in the loop. */
4503STATIC void
bdd68bc3 4504S_sv_release_COW(pTHX_ register SV *sv, const char *pvx, STRLEN len, SV *after)
765f542d
NC
4505{
4506 if (len) { /* this SV was SvIsCOW_normal(sv) */
4507 /* we need to find the SV pointing to us. */
4508 SV *current = SV_COW_NEXT_SV(after);
7a5fa8a2 4509
765f542d
NC
4510 if (current == sv) {
4511 /* The SV we point to points back to us (there were only two of us
4512 in the loop.)
4513 Hence other SV is no longer copy on write either. */
4514 SvFAKE_off(after);
4515 SvREADONLY_off(after);
4516 } else {
4517 /* We need to follow the pointers around the loop. */
4518 SV *next;
4519 while ((next = SV_COW_NEXT_SV(current)) != sv) {
4520 assert (next);
4521 current = next;
4522 /* don't loop forever if the structure is bust, and we have
4523 a pointer into a closed loop. */
4524 assert (current != after);
3f7c398e 4525 assert (SvPVX_const(current) == pvx);
765f542d
NC
4526 }
4527 /* Make the SV before us point to the SV after us. */
a29f6d03 4528 SV_COW_NEXT_SV_SET(current, after);
765f542d
NC
4529 }
4530 } else {
bdd68bc3 4531 unshare_hek(SvSHARED_HEK_FROM_PV(pvx));
765f542d
NC
4532 }
4533}
4534
4535int
4536Perl_sv_release_IVX(pTHX_ register SV *sv)
4537{
4538 if (SvIsCOW(sv))
4539 sv_force_normal_flags(sv, 0);
0c34ef67
MHM
4540 SvOOK_off(sv);
4541 return 0;
765f542d
NC
4542}
4543#endif
645c22ef
DM
4544/*
4545=for apidoc sv_force_normal_flags
4546
4547Undo various types of fakery on an SV: if the PV is a shared string, make
4548a private copy; if we're a ref, stop refing; if we're a glob, downgrade to
765f542d
NC
4549an xpvmg; if we're a copy-on-write scalar, this is the on-write time when
4550we do the copy, and is also used locally. If C<SV_COW_DROP_PV> is set
4551then a copy-on-write scalar drops its PV buffer (if any) and becomes
4552SvPOK_off rather than making a copy. (Used where this scalar is about to be
d3050d9d 4553set to some other value.) In addition, the C<flags> parameter gets passed to
765f542d
NC
4554C<sv_unref_flags()> when unrefing. C<sv_force_normal> calls this function
4555with flags set to 0.
645c22ef
DM
4556
4557=cut
4558*/
4559
6fc92669 4560void
840a7b70 4561Perl_sv_force_normal_flags(pTHX_ register SV *sv, U32 flags)
0f15f207 4562{
f8c7b90f 4563#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4564 if (SvREADONLY(sv)) {
4565 /* At this point I believe I should acquire a global SV mutex. */
4566 if (SvFAKE(sv)) {
b64e5050 4567 const char * const pvx = SvPVX_const(sv);
a28509cc
AL
4568 const STRLEN len = SvLEN(sv);
4569 const STRLEN cur = SvCUR(sv);
a28509cc 4570 SV * const next = SV_COW_NEXT_SV(sv); /* next COW sv in the loop. */
46187eeb
NC
4571 if (DEBUG_C_TEST) {
4572 PerlIO_printf(Perl_debug_log,
4573 "Copy on write: Force normal %ld\n",
4574 (long) flags);
e419cbc5 4575 sv_dump(sv);
46187eeb 4576 }
765f542d
NC
4577 SvFAKE_off(sv);
4578 SvREADONLY_off(sv);
9f653bb5 4579 /* This SV doesn't own the buffer, so need to Newx() a new one: */
f880fe2f 4580 SvPV_set(sv, (char*)0);
87a1ef3d 4581 SvLEN_set(sv, 0);
765f542d
NC
4582 if (flags & SV_COW_DROP_PV) {
4583 /* OK, so we don't need to copy our buffer. */
4584 SvPOK_off(sv);
4585 } else {
4586 SvGROW(sv, cur + 1);
4587 Move(pvx,SvPVX(sv),cur,char);
87a1ef3d 4588 SvCUR_set(sv, cur);
765f542d
NC
4589 *SvEND(sv) = '\0';
4590 }
bdd68bc3 4591 sv_release_COW(sv, pvx, len, next);
46187eeb 4592 if (DEBUG_C_TEST) {
e419cbc5 4593 sv_dump(sv);
46187eeb 4594 }
765f542d 4595 }
923e4eb5 4596 else if (IN_PERL_RUNTIME)
765f542d
NC
4597 Perl_croak(aTHX_ PL_no_modify);
4598 /* At this point I believe that I can drop the global SV mutex. */
4599 }
4600#else
2213622d 4601 if (SvREADONLY(sv)) {
1c846c1f 4602 if (SvFAKE(sv)) {
b64e5050 4603 const char * const pvx = SvPVX_const(sv);
66a1b24b 4604 const STRLEN len = SvCUR(sv);
10bcdfd6
NC
4605 SvFAKE_off(sv);
4606 SvREADONLY_off(sv);
66a1b24b
AL
4607 SvPV_set(sv, Nullch);
4608 SvLEN_set(sv, 0);
1c846c1f 4609 SvGROW(sv, len + 1);
3f7c398e 4610 Move(pvx,SvPVX_const(sv),len,char);
1c846c1f 4611 *SvEND(sv) = '\0';
bdd68bc3 4612 unshare_hek(SvSHARED_HEK_FROM_PV(pvx));
1c846c1f 4613 }
923e4eb5 4614 else if (IN_PERL_RUNTIME)
cea2e8a9 4615 Perl_croak(aTHX_ PL_no_modify);
0f15f207 4616 }
765f542d 4617#endif
2213622d 4618 if (SvROK(sv))
840a7b70 4619 sv_unref_flags(sv, flags);
6fc92669
GS
4620 else if (SvFAKE(sv) && SvTYPE(sv) == SVt_PVGV)
4621 sv_unglob(sv);
0f15f207 4622}
1c846c1f 4623
645c22ef
DM
4624/*
4625=for apidoc sv_force_normal
4626
4627Undo various types of fakery on an SV: if the PV is a shared string, make
4628a private copy; if we're a ref, stop refing; if we're a glob, downgrade to
4629an xpvmg. See also C<sv_force_normal_flags>.
4630
4631=cut
4632*/
4633
840a7b70
IZ
4634void
4635Perl_sv_force_normal(pTHX_ register SV *sv)
4636{
4637 sv_force_normal_flags(sv, 0);
4638}
4639
954c1994
GS
4640/*
4641=for apidoc sv_chop
4642
1c846c1f 4643Efficient removal of characters from the beginning of the string buffer.
954c1994
GS
4644SvPOK(sv) must be true and the C<ptr> must be a pointer to somewhere inside
4645the string buffer. The C<ptr> becomes the first character of the adjusted
645c22ef 4646string. Uses the "OOK hack".
3f7c398e 4647Beware: after this function returns, C<ptr> and SvPVX_const(sv) may no longer
31869a79 4648refer to the same chunk of data.
954c1994
GS
4649
4650=cut
4651*/
4652
79072805 4653void
f54cb97a 4654Perl_sv_chop(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4655{
4656 register STRLEN delta;
a0d0e21e 4657 if (!ptr || !SvPOKp(sv))
79072805 4658 return;
3f7c398e 4659 delta = ptr - SvPVX_const(sv);
2213622d 4660 SV_CHECK_THINKFIRST(sv);
79072805
LW
4661 if (SvTYPE(sv) < SVt_PVIV)
4662 sv_upgrade(sv,SVt_PVIV);
4663
4664 if (!SvOOK(sv)) {
50483b2c 4665 if (!SvLEN(sv)) { /* make copy of shared string */
3f7c398e 4666 const char *pvx = SvPVX_const(sv);
a28509cc 4667 const STRLEN len = SvCUR(sv);
50483b2c 4668 SvGROW(sv, len + 1);
3f7c398e 4669 Move(pvx,SvPVX_const(sv),len,char);
50483b2c
JD
4670 *SvEND(sv) = '\0';
4671 }
45977657 4672 SvIV_set(sv, 0);
a4bfb290
AB
4673 /* Same SvOOK_on but SvOOK_on does a SvIOK_off
4674 and we do that anyway inside the SvNIOK_off
4675 */
7a5fa8a2 4676 SvFLAGS(sv) |= SVf_OOK;
79072805 4677 }
a4bfb290 4678 SvNIOK_off(sv);
b162af07
SP
4679 SvLEN_set(sv, SvLEN(sv) - delta);
4680 SvCUR_set(sv, SvCUR(sv) - delta);
f880fe2f 4681 SvPV_set(sv, SvPVX(sv) + delta);
45977657 4682 SvIV_set(sv, SvIVX(sv) + delta);
79072805
LW
4683}
4684
09540bc3
JH
4685/* sv_catpvn() is now a macro using Perl_sv_catpvn_flags();
4686 * this function provided for binary compatibility only
4687 */
4688
4689void
4690Perl_sv_catpvn(pTHX_ SV *dsv, const char* sstr, STRLEN slen)
4691{
4692 sv_catpvn_flags(dsv, sstr, slen, SV_GMAGIC);
4693}
4694
954c1994
GS
4695/*
4696=for apidoc sv_catpvn
4697
4698Concatenates the string onto the end of the string which is in the SV. The
1e54db1a
JH
4699C<len> indicates number of bytes to copy. If the SV has the UTF-8
4700status set, then the bytes appended should be valid UTF-8.
d5ce4a7c 4701Handles 'get' magic, but not 'set' magic. See C<sv_catpvn_mg>.
954c1994 4702
8d6d96c1
HS
4703=for apidoc sv_catpvn_flags
4704
4705Concatenates the string onto the end of the string which is in the SV. The
1e54db1a
JH
4706C<len> indicates number of bytes to copy. If the SV has the UTF-8
4707status set, then the bytes appended should be valid UTF-8.
8d6d96c1
HS
4708If C<flags> has C<SV_GMAGIC> bit set, will C<mg_get> on C<dsv> if
4709appropriate, else not. C<sv_catpvn> and C<sv_catpvn_nomg> are implemented
4710in terms of this function.
4711
4712=cut
4713*/
4714
4715void
4716Perl_sv_catpvn_flags(pTHX_ register SV *dsv, register const char *sstr, register STRLEN slen, I32 flags)
4717{
4718 STRLEN dlen;
f54cb97a 4719 const char *dstr = SvPV_force_flags(dsv, dlen, flags);
8d6d96c1 4720
8d6d96c1
HS
4721 SvGROW(dsv, dlen + slen + 1);
4722 if (sstr == dstr)
3f7c398e 4723 sstr = SvPVX_const(dsv);
8d6d96c1 4724 Move(sstr, SvPVX(dsv) + dlen, slen, char);
b162af07 4725 SvCUR_set(dsv, SvCUR(dsv) + slen);
8d6d96c1
HS
4726 *SvEND(dsv) = '\0';
4727 (void)SvPOK_only_UTF8(dsv); /* validate pointer */
4728 SvTAINT(dsv);
79072805
LW
4729}
4730
954c1994
GS
4731/*
4732=for apidoc sv_catpvn_mg
4733
4734Like C<sv_catpvn>, but also handles 'set' magic.
4735
4736=cut
4737*/
4738
79072805 4739void
864dbfa3 4740Perl_sv_catpvn_mg(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
ef50df4b
GS
4741{
4742 sv_catpvn(sv,ptr,len);
4743 SvSETMAGIC(sv);
4744}
4745
09540bc3
JH
4746/* sv_catsv() is now a macro using Perl_sv_catsv_flags();
4747 * this function provided for binary compatibility only
4748 */
4749
4750void
4751Perl_sv_catsv(pTHX_ SV *dstr, register SV *sstr)
4752{
4753 sv_catsv_flags(dstr, sstr, SV_GMAGIC);
4754}
4755
954c1994
GS
4756/*
4757=for apidoc sv_catsv
4758
13e8c8e3
JH
4759Concatenates the string from SV C<ssv> onto the end of the string in
4760SV C<dsv>. Modifies C<dsv> but not C<ssv>. Handles 'get' magic, but
4761not 'set' magic. See C<sv_catsv_mg>.
954c1994 4762
8d6d96c1
HS
4763=for apidoc sv_catsv_flags
4764
4765Concatenates the string from SV C<ssv> onto the end of the string in
4766SV C<dsv>. Modifies C<dsv> but not C<ssv>. If C<flags> has C<SV_GMAGIC>
4767bit set, will C<mg_get> on the SVs if appropriate, else not. C<sv_catsv>
4768and C<sv_catsv_nomg> are implemented in terms of this function.
4769
4770=cut */
4771
ef50df4b 4772void
8d6d96c1 4773Perl_sv_catsv_flags(pTHX_ SV *dsv, register SV *ssv, I32 flags)
79072805 4774{
4d84ee25 4775 const char *spv;
13e8c8e3 4776 STRLEN slen;
46199a12 4777 if (!ssv)
79072805 4778 return;
4d84ee25 4779 if ((spv = SvPV_const(ssv, slen))) {
4fd84b44
AD
4780 /* sutf8 and dutf8 were type bool, but under USE_ITHREADS,
4781 gcc version 2.95.2 20000220 (Debian GNU/Linux) for
8cf8f3d1
NIS
4782 Linux xxx 2.2.17 on sparc64 with gcc -O2, we erroneously
4783 get dutf8 = 0x20000000, (i.e. SVf_UTF8) even though
4fd84b44
AD
4784 dsv->sv_flags doesn't have that bit set.
4785 Andy Dougherty 12 Oct 2001
4786 */
b464bac0 4787 const I32 sutf8 = DO_UTF8(ssv);
4fd84b44 4788 I32 dutf8;
13e8c8e3 4789
8d6d96c1
HS
4790 if (SvGMAGICAL(dsv) && (flags & SV_GMAGIC))
4791 mg_get(dsv);
4792 dutf8 = DO_UTF8(dsv);
4793
4794 if (dutf8 != sutf8) {
13e8c8e3 4795 if (dutf8) {
46199a12 4796 /* Not modifying source SV, so taking a temporary copy. */
8d6d96c1 4797 SV* csv = sv_2mortal(newSVpvn(spv, slen));
13e8c8e3 4798
46199a12 4799 sv_utf8_upgrade(csv);
93524f2b 4800 spv = SvPV_const(csv, slen);
13e8c8e3 4801 }
8d6d96c1
HS
4802 else
4803 sv_utf8_upgrade_nomg(dsv);
e84ff256 4804 }
8d6d96c1 4805 sv_catpvn_nomg(dsv, spv, slen);
560a288e 4806 }
79072805
LW
4807}
4808
954c1994
GS
4809/*
4810=for apidoc sv_catsv_mg
4811
4812Like C<sv_catsv>, but also handles 'set' magic.
4813
4814=cut
4815*/
4816
79072805 4817void
46199a12 4818Perl_sv_catsv_mg(pTHX_ SV *dsv, register SV *ssv)
ef50df4b 4819{
46199a12
JH
4820 sv_catsv(dsv,ssv);
4821 SvSETMAGIC(dsv);
ef50df4b
GS
4822}
4823
954c1994
GS
4824/*
4825=for apidoc sv_catpv
4826
4827Concatenates the string onto the end of the string which is in the SV.
1e54db1a
JH
4828If the SV has the UTF-8 status set, then the bytes appended should be
4829valid UTF-8. Handles 'get' magic, but not 'set' magic. See C<sv_catpv_mg>.
954c1994 4830
d5ce4a7c 4831=cut */
954c1994 4832
ef50df4b 4833void
0c981600 4834Perl_sv_catpv(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4835{
4836 register STRLEN len;
463ee0b2 4837 STRLEN tlen;
748a9306 4838 char *junk;
79072805 4839
0c981600 4840 if (!ptr)
79072805 4841 return;
748a9306 4842 junk = SvPV_force(sv, tlen);
0c981600 4843 len = strlen(ptr);
463ee0b2 4844 SvGROW(sv, tlen + len + 1);
0c981600 4845 if (ptr == junk)
3f7c398e 4846 ptr = SvPVX_const(sv);
0c981600 4847 Move(ptr,SvPVX(sv)+tlen,len+1,char);
b162af07 4848 SvCUR_set(sv, SvCUR(sv) + len);
d41ff1b8 4849 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4850 SvTAINT(sv);
79072805
LW
4851}
4852
954c1994
GS
4853/*
4854=for apidoc sv_catpv_mg
4855
4856Like C<sv_catpv>, but also handles 'set' magic.
4857
4858=cut
4859*/
4860
ef50df4b 4861void
0c981600 4862Perl_sv_catpv_mg(pTHX_ register SV *sv, register const char *ptr)
ef50df4b 4863{
0c981600 4864 sv_catpv(sv,ptr);
ef50df4b
GS
4865 SvSETMAGIC(sv);
4866}
4867
645c22ef
DM
4868/*
4869=for apidoc newSV
4870
4871Create a new null SV, or if len > 0, create a new empty SVt_PV type SV
4872with an initial PV allocation of len+1. Normally accessed via the C<NEWSV>
4873macro.
4874
4875=cut
4876*/
4877
79072805 4878SV *
864dbfa3 4879Perl_newSV(pTHX_ STRLEN len)
79072805
LW
4880{
4881 register SV *sv;
1c846c1f 4882
4561caa4 4883 new_SV(sv);
79072805
LW
4884 if (len) {
4885 sv_upgrade(sv, SVt_PV);
4886 SvGROW(sv, len + 1);
4887 }
4888 return sv;
4889}
954c1994 4890/*
92110913 4891=for apidoc sv_magicext
954c1994 4892
68795e93 4893Adds magic to an SV, upgrading it if necessary. Applies the
2d8d5d5a 4894supplied vtable and returns a pointer to the magic added.
92110913 4895
2d8d5d5a
SH
4896Note that C<sv_magicext> will allow things that C<sv_magic> will not.
4897In particular, you can add magic to SvREADONLY SVs, and add more than
4898one instance of the same 'how'.
645c22ef 4899
2d8d5d5a
SH
4900If C<namlen> is greater than zero then a C<savepvn> I<copy> of C<name> is
4901stored, if C<namlen> is zero then C<name> is stored as-is and - as another
4902special case - if C<(name && namlen == HEf_SVKEY)> then C<name> is assumed
4903to contain an C<SV*> and is stored as-is with its REFCNT incremented.
92110913 4904
2d8d5d5a 4905(This is now used as a subroutine by C<sv_magic>.)
954c1994
GS
4906
4907=cut
4908*/
92110913 4909MAGIC *
e1ec3a88 4910Perl_sv_magicext(pTHX_ SV* sv, SV* obj, int how, const MGVTBL *vtable,
92110913 4911 const char* name, I32 namlen)
79072805
LW
4912{
4913 MAGIC* mg;
68795e93 4914
92110913 4915 if (SvTYPE(sv) < SVt_PVMG) {
862a34c6 4916 SvUPGRADE(sv, SVt_PVMG);
463ee0b2 4917 }
a02a5408 4918 Newxz(mg, 1, MAGIC);
79072805 4919 mg->mg_moremagic = SvMAGIC(sv);
b162af07 4920 SvMAGIC_set(sv, mg);
75f9d97a 4921
05f95b08
SB
4922 /* Sometimes a magic contains a reference loop, where the sv and
4923 object refer to each other. To prevent a reference loop that
4924 would prevent such objects being freed, we look for such loops
4925 and if we find one we avoid incrementing the object refcount.
87f0b213
JH
4926
4927 Note we cannot do this to avoid self-tie loops as intervening RV must
b5ccf5f2 4928 have its REFCNT incremented to keep it in existence.
87f0b213
JH
4929
4930 */
14befaf4
DM
4931 if (!obj || obj == sv ||
4932 how == PERL_MAGIC_arylen ||
4933 how == PERL_MAGIC_qr ||
8d2f4536 4934 how == PERL_MAGIC_symtab ||
75f9d97a
JH
4935 (SvTYPE(obj) == SVt_PVGV &&
4936 (GvSV(obj) == sv || GvHV(obj) == (HV*)sv || GvAV(obj) == (AV*)sv ||
4937 GvCV(obj) == (CV*)sv || GvIOp(obj) == (IO*)sv ||
2628be26 4938 GvFORM(obj) == (CV*)sv)))
75f9d97a 4939 {
8990e307 4940 mg->mg_obj = obj;
75f9d97a 4941 }
85e6fe83 4942 else {
8990e307 4943 mg->mg_obj = SvREFCNT_inc(obj);
85e6fe83
LW
4944 mg->mg_flags |= MGf_REFCOUNTED;
4945 }
b5ccf5f2
YST
4946
4947 /* Normal self-ties simply pass a null object, and instead of
4948 using mg_obj directly, use the SvTIED_obj macro to produce a
4949 new RV as needed. For glob "self-ties", we are tieing the PVIO
4950 with an RV obj pointing to the glob containing the PVIO. In
4951 this case, to avoid a reference loop, we need to weaken the
4952 reference.
4953 */
4954
4955 if (how == PERL_MAGIC_tiedscalar && SvTYPE(sv) == SVt_PVIO &&
4956 obj && SvROK(obj) && GvIO(SvRV(obj)) == (IO*)sv)
4957 {
4958 sv_rvweaken(obj);
4959 }
4960
79072805 4961 mg->mg_type = how;
565764a8 4962 mg->mg_len = namlen;
9cbac4c7 4963 if (name) {
92110913 4964 if (namlen > 0)
1edc1566 4965 mg->mg_ptr = savepvn(name, namlen);
c6ee37c5 4966 else if (namlen == HEf_SVKEY)
1edc1566 4967 mg->mg_ptr = (char*)SvREFCNT_inc((SV*)name);
68795e93 4968 else
92110913 4969 mg->mg_ptr = (char *) name;
9cbac4c7 4970 }
92110913 4971 mg->mg_virtual = vtable;
68795e93 4972
92110913
NIS
4973 mg_magical(sv);
4974 if (SvGMAGICAL(sv))
4975 SvFLAGS(sv) &= ~(SVf_IOK|SVf_NOK|SVf_POK);
4976 return mg;
4977}
4978
4979/*
4980=for apidoc sv_magic
1c846c1f 4981
92110913
NIS
4982Adds magic to an SV. First upgrades C<sv> to type C<SVt_PVMG> if necessary,
4983then adds a new magic item of type C<how> to the head of the magic list.
4984
2d8d5d5a
SH
4985See C<sv_magicext> (which C<sv_magic> now calls) for a description of the
4986handling of the C<name> and C<namlen> arguments.
4987
4509d3fb
SB
4988You need to use C<sv_magicext> to add magic to SvREADONLY SVs and also
4989to add more than one instance of the same 'how'.
4990
92110913
NIS
4991=cut
4992*/
4993
4994void
4995Perl_sv_magic(pTHX_ register SV *sv, SV *obj, int how, const char *name, I32 namlen)
68795e93 4996{
e1ec3a88 4997 const MGVTBL *vtable = 0;
92110913 4998 MAGIC* mg;
92110913 4999
f8c7b90f 5000#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
5001 if (SvIsCOW(sv))
5002 sv_force_normal_flags(sv, 0);
5003#endif
92110913 5004 if (SvREADONLY(sv)) {
d8084ca5
DM
5005 if (
5006 /* its okay to attach magic to shared strings; the subsequent
5007 * upgrade to PVMG will unshare the string */
5008 !(SvFAKE(sv) && SvTYPE(sv) < SVt_PVMG)
5009
5010 && IN_PERL_RUNTIME
92110913
NIS
5011 && how != PERL_MAGIC_regex_global
5012 && how != PERL_MAGIC_bm
5013 && how != PERL_MAGIC_fm
5014 && how != PERL_MAGIC_sv
e6469971 5015 && how != PERL_MAGIC_backref
92110913
NIS
5016 )
5017 {
5018 Perl_croak(aTHX_ PL_no_modify);
5019 }
5020 }
5021 if (SvMAGICAL(sv) || (how == PERL_MAGIC_taint && SvTYPE(sv) >= SVt_PVMG)) {
5022 if (SvMAGIC(sv) && (mg = mg_find(sv, how))) {
68795e93
NIS
5023 /* sv_magic() refuses to add a magic of the same 'how' as an
5024 existing one
92110913
NIS
5025 */
5026 if (how == PERL_MAGIC_taint)
5027 mg->mg_len |= 1;
5028 return;
5029 }
5030 }
68795e93 5031
79072805 5032 switch (how) {
14befaf4 5033 case PERL_MAGIC_sv:
92110913 5034 vtable = &PL_vtbl_sv;
79072805 5035 break;
14befaf4 5036 case PERL_MAGIC_overload:
92110913 5037 vtable = &PL_vtbl_amagic;
a0d0e21e 5038 break;
14befaf4 5039 case PERL_MAGIC_overload_elem:
92110913 5040 vtable = &PL_vtbl_amagicelem;
a0d0e21e 5041 break;
14befaf4 5042 case PERL_MAGIC_overload_table:
92110913 5043 vtable = &PL_vtbl_ovrld;
a0d0e21e 5044 break;
14befaf4 5045 case PERL_MAGIC_bm:
92110913 5046 vtable = &PL_vtbl_bm;
79072805 5047 break;
14befaf4 5048 case PERL_MAGIC_regdata:
92110913 5049 vtable = &PL_vtbl_regdata;
6cef1e77 5050 break;
14befaf4 5051 case PERL_MAGIC_regdatum:
92110913 5052 vtable = &PL_vtbl_regdatum;
6cef1e77 5053 break;
14befaf4 5054 case PERL_MAGIC_env:
92110913 5055 vtable = &PL_vtbl_env;
79072805 5056 break;
14befaf4 5057 case PERL_MAGIC_fm:
92110913 5058 vtable = &PL_vtbl_fm;
55497cff 5059 break;
14befaf4 5060 case PERL_MAGIC_envelem:
92110913 5061 vtable = &PL_vtbl_envelem;
79072805 5062 break;
14befaf4 5063 case PERL_MAGIC_regex_global:
92110913 5064 vtable = &PL_vtbl_mglob;
93a17b20 5065 break;
14befaf4 5066 case PERL_MAGIC_isa:
92110913 5067 vtable = &PL_vtbl_isa;
463ee0b2 5068 break;
14befaf4 5069 case PERL_MAGIC_isaelem:
92110913 5070 vtable = &PL_vtbl_isaelem;
463ee0b2 5071 break;
14befaf4 5072 case PERL_MAGIC_nkeys:
92110913 5073 vtable = &PL_vtbl_nkeys;
16660edb 5074 break;
14befaf4 5075 case PERL_MAGIC_dbfile:
92110913 5076 vtable = 0;
93a17b20 5077 break;
14befaf4 5078 case PERL_MAGIC_dbline:
92110913 5079 vtable = &PL_vtbl_dbline;
79072805 5080 break;
36477c24 5081#ifdef USE_LOCALE_COLLATE
14befaf4 5082 case PERL_MAGIC_collxfrm:
92110913 5083 vtable = &PL_vtbl_collxfrm;
bbce6d69 5084 break;
36477c24 5085#endif /* USE_LOCALE_COLLATE */
14befaf4 5086 case PERL_MAGIC_tied:
92110913 5087 vtable = &PL_vtbl_pack;
463ee0b2 5088 break;
14befaf4
DM
5089 case PERL_MAGIC_tiedelem:
5090 case PERL_MAGIC_tiedscalar:
92110913 5091 vtable = &PL_vtbl_packelem;
463ee0b2 5092 break;
14befaf4 5093 case PERL_MAGIC_qr:
92110913 5094 vtable = &PL_vtbl_regexp;
c277df42 5095 break;
14befaf4 5096 case PERL_MAGIC_sig:
92110913 5097 vtable = &PL_vtbl_sig;
79072805 5098 break;
14befaf4 5099 case PERL_MAGIC_sigelem:
92110913 5100 vtable = &PL_vtbl_sigelem;
79072805 5101 break;
14befaf4 5102 case PERL_MAGIC_taint:
92110913 5103 vtable = &PL_vtbl_taint;
463ee0b2 5104 break;
14befaf4 5105 case PERL_MAGIC_uvar:
92110913 5106 vtable = &PL_vtbl_uvar;
79072805 5107 break;
14befaf4 5108 case PERL_MAGIC_vec:
92110913 5109 vtable = &PL_vtbl_vec;
79072805 5110 break;
a3874608 5111 case PERL_MAGIC_arylen_p:
bfcb3514 5112 case PERL_MAGIC_rhash:
8d2f4536 5113 case PERL_MAGIC_symtab:
ece467f9
JP
5114 case PERL_MAGIC_vstring:
5115 vtable = 0;
5116 break;
7e8c5dac
HS
5117 case PERL_MAGIC_utf8:
5118 vtable = &PL_vtbl_utf8;
5119 break;
14befaf4 5120 case PERL_MAGIC_substr:
92110913 5121 vtable = &PL_vtbl_substr;
79072805 5122 break;
14befaf4 5123 case PERL_MAGIC_defelem:
92110913 5124 vtable = &PL_vtbl_defelem;
5f05dabc 5125 break;
14befaf4 5126 case PERL_MAGIC_glob:
92110913 5127 vtable = &PL_vtbl_glob;
79072805 5128 break;
14befaf4 5129 case PERL_MAGIC_arylen:
92110913 5130 vtable = &PL_vtbl_arylen;
79072805 5131 break;
14befaf4 5132 case PERL_MAGIC_pos:
92110913 5133 vtable = &PL_vtbl_pos;
a0d0e21e 5134 break;
14befaf4 5135 case PERL_MAGIC_backref:
92110913 5136 vtable = &PL_vtbl_backref;
810b8aa5 5137 break;
14befaf4
DM
5138 case PERL_MAGIC_ext:
5139 /* Reserved for use by extensions not perl internals. */
4633a7c4
LW
5140 /* Useful for attaching extension internal data to perl vars. */
5141 /* Note that multiple extensions may clash if magical scalars */
5142 /* etc holding private data from one are passed to another. */
a0d0e21e 5143 break;
79072805 5144 default:
14befaf4 5145 Perl_croak(aTHX_ "Don't know how to handle magic of type \\%o", how);
463ee0b2 5146 }
68795e93 5147
92110913 5148 /* Rest of work is done else where */
27da23d5 5149 mg = sv_magicext(sv,obj,how,(MGVTBL*)vtable,name,namlen);
68795e93 5150
92110913
NIS
5151 switch (how) {
5152 case PERL_MAGIC_taint:
5153 mg->mg_len = 1;
5154 break;
5155 case PERL_MAGIC_ext:
5156 case PERL_MAGIC_dbfile:
5157 SvRMAGICAL_on(sv);
5158 break;
5159 }
463ee0b2
LW
5160}
5161
c461cf8f
JH
5162/*
5163=for apidoc sv_unmagic
5164
645c22ef 5165Removes all magic of type C<type> from an SV.
c461cf8f
JH
5166
5167=cut
5168*/
5169
463ee0b2 5170int
864dbfa3 5171Perl_sv_unmagic(pTHX_ SV *sv, int type)
463ee0b2
LW
5172{
5173 MAGIC* mg;
5174 MAGIC** mgp;
91bba347 5175 if (SvTYPE(sv) < SVt_PVMG || !SvMAGIC(sv))
463ee0b2
LW
5176 return 0;
5177 mgp = &SvMAGIC(sv);
5178 for (mg = *mgp; mg; mg = *mgp) {
5179 if (mg->mg_type == type) {
e1ec3a88 5180 const MGVTBL* const vtbl = mg->mg_virtual;
463ee0b2 5181 *mgp = mg->mg_moremagic;
1d7c1841 5182 if (vtbl && vtbl->svt_free)
fc0dc3b3 5183 CALL_FPTR(vtbl->svt_free)(aTHX_ sv, mg);
14befaf4 5184 if (mg->mg_ptr && mg->mg_type != PERL_MAGIC_regex_global) {
92110913 5185 if (mg->mg_len > 0)
1edc1566 5186 Safefree(mg->mg_ptr);
565764a8 5187 else if (mg->mg_len == HEf_SVKEY)
1edc1566 5188 SvREFCNT_dec((SV*)mg->mg_ptr);
7e8c5dac
HS
5189 else if (mg->mg_type == PERL_MAGIC_utf8 && mg->mg_ptr)
5190 Safefree(mg->mg_ptr);
9cbac4c7 5191 }
a0d0e21e
LW
5192 if (mg->mg_flags & MGf_REFCOUNTED)
5193 SvREFCNT_dec(mg->mg_obj);
463ee0b2
LW
5194 Safefree(mg);
5195 }
5196 else
5197 mgp = &mg->mg_moremagic;
79072805 5198 }
91bba347 5199 if (!SvMAGIC(sv)) {
463ee0b2 5200 SvMAGICAL_off(sv);
06759ea0 5201 SvFLAGS(sv) |= (SvFLAGS(sv) & (SVp_NOK|SVp_POK)) >> PRIVSHIFT;
463ee0b2
LW
5202 }
5203
5204 return 0;
79072805
LW
5205}
5206
c461cf8f
JH
5207/*
5208=for apidoc sv_rvweaken
5209
645c22ef
DM
5210Weaken a reference: set the C<SvWEAKREF> flag on this RV; give the
5211referred-to SV C<PERL_MAGIC_backref> magic if it hasn't already; and
5212push a back-reference to this RV onto the array of backreferences
5213associated with that magic.
c461cf8f
JH
5214
5215=cut
5216*/
5217
810b8aa5 5218SV *
864dbfa3 5219Perl_sv_rvweaken(pTHX_ SV *sv)
810b8aa5
GS
5220{
5221 SV *tsv;
5222 if (!SvOK(sv)) /* let undefs pass */
5223 return sv;
5224 if (!SvROK(sv))
cea2e8a9 5225 Perl_croak(aTHX_ "Can't weaken a nonreference");
810b8aa5 5226 else if (SvWEAKREF(sv)) {
810b8aa5 5227 if (ckWARN(WARN_MISC))
9014280d 5228 Perl_warner(aTHX_ packWARN(WARN_MISC), "Reference is already weak");
810b8aa5
GS
5229 return sv;
5230 }
5231 tsv = SvRV(sv);
e15faf7d 5232 Perl_sv_add_backref(aTHX_ tsv, sv);
810b8aa5 5233 SvWEAKREF_on(sv);
1c846c1f 5234 SvREFCNT_dec(tsv);
810b8aa5
GS
5235 return sv;
5236}
5237
645c22ef
DM
5238/* Give tsv backref magic if it hasn't already got it, then push a
5239 * back-reference to sv onto the array associated with the backref magic.
5240 */
5241
e15faf7d
NC
5242void
5243Perl_sv_add_backref(pTHX_ SV *tsv, SV *sv)
810b8aa5
GS
5244{
5245 AV *av;
5246 MAGIC *mg;
14befaf4 5247 if (SvMAGICAL(tsv) && (mg = mg_find(tsv, PERL_MAGIC_backref)))
810b8aa5
GS
5248 av = (AV*)mg->mg_obj;
5249 else {
5250 av = newAV();
14befaf4 5251 sv_magic(tsv, (SV*)av, PERL_MAGIC_backref, NULL, 0);
d99b02a1
DM
5252 /* av now has a refcnt of 2, which avoids it getting freed
5253 * before us during global cleanup. The extra ref is removed
5254 * by magic_killbackrefs() when tsv is being freed */
810b8aa5 5255 }
d91d49e8 5256 if (AvFILLp(av) >= AvMAX(av)) {
d91d49e8
MM
5257 av_extend(av, AvFILLp(av)+1);
5258 }
5259 AvARRAY(av)[++AvFILLp(av)] = sv; /* av_push() */
810b8aa5
GS
5260}
5261
645c22ef
DM
5262/* delete a back-reference to ourselves from the backref magic associated
5263 * with the SV we point to.
5264 */
5265
1c846c1f 5266STATIC void
e15faf7d 5267S_sv_del_backref(pTHX_ SV *tsv, SV *sv)
810b8aa5
GS
5268{
5269 AV *av;
5270 SV **svp;
5271 I32 i;
c04a4dfe 5272 MAGIC *mg = NULL;
e15faf7d
NC
5273 if (!SvMAGICAL(tsv) || !(mg = mg_find(tsv, PERL_MAGIC_backref))) {
5274 if (PL_in_clean_all)
5275 return;
5276 }
14befaf4 5277 if (!SvMAGICAL(tsv) || !(mg = mg_find(tsv, PERL_MAGIC_backref)))
cea2e8a9 5278 Perl_croak(aTHX_ "panic: del_backref");
810b8aa5
GS
5279 av = (AV *)mg->mg_obj;
5280 svp = AvARRAY(av);
6a76db8b
NC
5281 /* We shouldn't be in here more than once, but for paranoia reasons lets
5282 not assume this. */
5283 for (i = AvFILLp(av); i >= 0; i--) {
5284 if (svp[i] == sv) {
5285 const SSize_t fill = AvFILLp(av);
5286 if (i != fill) {
5287 /* We weren't the last entry.
5288 An unordered list has this property that you can take the
5289 last element off the end to fill the hole, and it's still
5290 an unordered list :-)
5291 */
5292 svp[i] = svp[fill];
5293 }
5294 svp[fill] = Nullsv;
5295 AvFILLp(av) = fill - 1;
5296 }
5297 }
810b8aa5
GS
5298}
5299
954c1994
GS
5300/*
5301=for apidoc sv_insert
5302
5303Inserts a string at the specified offset/length within the SV. Similar to
5304the Perl substr() function.
5305
5306=cut
5307*/
5308
79072805 5309void
e1ec3a88 5310Perl_sv_insert(pTHX_ SV *bigstr, STRLEN offset, STRLEN len, const char *little, STRLEN littlelen)
79072805
LW
5311{
/* Replaces the len bytes starting at offset in bigstr with the littlelen
 * bytes at little.  Three cases are handled separately below: the string
 * grows (littlelen > len), keeps its size, or shrinks.  Every normal exit
 * path runs SvSETMAGIC() on bigstr. */
5312 register char *big;
5313 register char *mid;
5314 register char *midend;
5315 register char *bigend;
5316 register I32 i;
6ff81951 5317 STRLEN curlen;
1c846c1f 5318
79072805 5319
8990e307 5320 if (!bigstr)
cea2e8a9 5321 Perl_croak(aTHX_ "Can't modify non-existent substring");
6ff81951 5322 SvPV_force(bigstr, curlen);
60fa28ff 5323 (void)SvPOK_only_UTF8(bigstr);
6ff81951
GS
/* The region to replace reaches past the current end of the string:
 * grow the buffer, zero-fill the gap and extend the length so that the
 * region exists before it is replaced. */
5324 if (offset + len > curlen) {
5325 SvGROW(bigstr, offset+len+1);
93524f2b 5326 Zero(SvPVX(bigstr)+curlen, offset+len-curlen, char);
6ff81951
GS
5327 SvCUR_set(bigstr, offset+len);
5328 }
79072805 5329
69b47968 5330 SvTAINT(bigstr);
79072805
LW
/* i is the net change in length.
 * NOTE(review): i is an I32 while both operands are STRLEN; presumably the
 * difference is assumed to fit -- confirm for very long strings. */
5331 i = littlelen - len;
5332 if (i > 0) { /* string might grow */
a0d0e21e 5333 big = SvGROW(bigstr, SvCUR(bigstr) + i + 1);
79072805
LW
5334 mid = big + offset + len;
5335 midend = bigend = big + SvCUR(bigstr);
5336 bigend += i;
5337 *bigend = '\0';
/* Copy the tail towards the end of the buffer, last byte first, so that
 * overlapping source and destination do not clobber each other. */
5338 while (midend > mid) /* shove everything down */
5339 *--bigend = *--midend;
5340 Move(little,big+offset,littlelen,char);
b162af07 5341 SvCUR_set(bigstr, SvCUR(bigstr) + i);
79072805
LW
5342 SvSETMAGIC(bigstr);
5343 return;
5344 }
/* Same size: overwrite the region in place (len == littlelen here). */
5345 else if (i == 0) {
463ee0b2 5346 Move(little,SvPVX(bigstr)+offset,len,char);
79072805
LW
5347 SvSETMAGIC(bigstr);
5348 return;
5349 }
5350
/* From here on the replacement is shorter than the region it replaces.
 * mid..midend delimits the region being replaced. */
463ee0b2 5351 big = SvPVX(bigstr);
79072805
LW
5352 mid = big + offset;
5353 midend = mid + len;
5354 bigend = big + SvCUR(bigstr);
5355
5356 if (midend > bigend)
cea2e8a9 5357 Perl_croak(aTHX_ "panic: sv_insert");
79072805
LW
5358
/* The part before the region is longer than the part after it: write the
 * replacement at mid, pull the tail down behind it and re-terminate. */
5359 if (mid - big > bigend - midend) { /* faster to shorten from end */
5360 if (littlelen) {
5361 Move(little, mid, littlelen,char);
5362 mid += littlelen;
5363 }
5364 i = bigend - midend;
5365 if (i > 0) {
5366 Move(midend, mid, i,char);
5367 mid += i;
5368 }
5369 *mid = '\0';
5370 SvCUR_set(bigstr, mid - big);
5371 }
/* Otherwise move the (shorter) leading part instead: sv_chop() advances
 * the start of the string, then the i leading bytes are copied, last byte
 * first, to sit directly before the replacement. */
155aba94 5372 else if ((i = mid - big)) { /* faster from front */
79072805
LW
5373 midend -= littlelen;
5374 mid = midend;
5375 sv_chop(bigstr,midend-i);
5376 big += i;
5377 while (i--)
5378 *--midend = *--big;
5379 if (littlelen)
5380 Move(little, mid, littlelen,char);
5381 }
/* offset is 0 and there is replacement text: chop the front off so the
 * replacement ends exactly where the old region ended. */
5382 else if (littlelen) {
5383 midend -= littlelen;
5384 sv_chop(bigstr,midend);
5385 Move(little,midend,littlelen,char);
5386 }
/* offset is 0 and nothing to insert: simply chop off the first len bytes. */
5387 else {
5388 sv_chop(bigstr,midend);
5389 }
5390 SvSETMAGIC(bigstr);
5391}
5392
c461cf8f
JH
5393/*
5394=for apidoc sv_replace
5395
5396Make the first argument a copy of the second, then delete the original.
645c22ef
DM
5397The target SV physically takes over ownership of the body of the source SV
5398and inherits its flags; however, the target keeps any magic it owns,
5399and any magic in the source is discarded.
ff276b08 5400Note that this is a rather specialist SV copying operation; most of the
645c22ef 5401time you'll want to use C<sv_setsv> or one of its many macro front-ends.
c461cf8f
JH
5402
5403=cut
5404*/
79072805
LW
5405
5406void
864dbfa3 5407Perl_sv_replace(pTHX_ register SV *sv, register SV *nsv)
79072805 5408{
/* Remember sv's reference count: it is restored at the very end, after
 * nsv's head has been copied over sv's. */
a3b680e6 5409 const U32 refcnt = SvREFCNT(sv);
765f542d 5410 SV_CHECK_THINKFIRST_COW_DROP(sv);
/* nsv is expected to have exactly one reference; anything else is only
 * warned about, not treated as fatal. */
0453d815 5411 if (SvREFCNT(nsv) != 1 && ckWARN_d(WARN_INTERNAL))
9014280d 5412 Perl_warner(aTHX_ packWARN(WARN_INTERNAL), "Reference miscount in sv_replace()");
/* Preserve sv's magic by moving its magic chain (and magical flags) onto
 * nsv: nsv's own magic is freed first, or nsv is upgraded to PVMG if it
 * had none.  sv is then left with no magic so sv_clear() below will not
 * free the chain. */
93a17b20 5413 if (SvMAGICAL(sv)) {
a0d0e21e
LW
5414 if (SvMAGICAL(nsv))
5415 mg_free(nsv);
5416 else
5417 sv_upgrade(nsv, SVt_PVMG);
b162af07 5418 SvMAGIC_set(nsv, SvMAGIC(sv));
a0d0e21e 5419 SvFLAGS(nsv) |= SvMAGICAL(sv);
93a17b20 5420 SvMAGICAL_off(sv);
b162af07 5421 SvMAGIC_set(sv, NULL);
93a17b20 5422 }
79072805
LW
/* sv_clear() asserts a zero reference count, so force it before clearing
 * sv's old contents. */
5423 SvREFCNT(sv) = 0;
5424 sv_clear(sv);
477f5d66 5425 assert(!SvREFCNT(sv));
fd0854ff
DM
/* Copy nsv's head into sv: field by field under DEBUG_LEAKING_SCALARS,
 * otherwise as one structure copy. */
5426#ifdef DEBUG_LEAKING_SCALARS
5427 sv->sv_flags = nsv->sv_flags;
5428 sv->sv_any = nsv->sv_any;
5429 sv->sv_refcnt = nsv->sv_refcnt;
f34d0642 5430 sv->sv_u = nsv->sv_u;
fd0854ff 5431#else
79072805 5432 StructCopy(nsv,sv,SV);
fd0854ff 5433#endif
7b2c381c
NC
5434 /* Currently could join these into one piece of pointer arithmetic, but
5435 it would be unclear. */
/* For SVt_IV and SVt_RV the copied SvANY still refers to nsv's head;
 * recompute it so that it refers to sv's own sv_u field instead. */
5436 if(SvTYPE(sv) == SVt_IV)
5437 SvANY(sv)
339049b0 5438 = (XPVIV*)((char*)&(sv->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
7b2c381c 5439 else if (SvTYPE(sv) == SVt_RV) {
339049b0 5440 SvANY(sv) = &sv->sv_u.svu_rv;
7b2c381c
NC
5441 }
5442
fd0854ff 5443
f8c7b90f 5444#ifdef PERL_OLD_COPY_ON_WRITE
d3d0e6f1
NC
5445 if (SvIsCOW_normal(nsv)) {
5446 /* We need to follow the pointers around the loop to make the
5447 previous SV point to sv, rather than nsv. */
5448 SV *next;
5449 SV *current = nsv;
5450 while ((next = SV_COW_NEXT_SV(current)) != nsv) {
5451 assert(next);
5452 current = next;
3f7c398e 5453 assert(SvPVX_const(current) == SvPVX_const(nsv));
d3d0e6f1
NC
5454 }
5455 /* Make the SV before us point to the SV after us. */
5456 if (DEBUG_C_TEST) {
5457 PerlIO_printf(Perl_debug_log, "previous is\n");
5458 sv_dump(current);
a29f6d03
NC
5459 PerlIO_printf(Perl_debug_log,
5460 "move it from 0x%"UVxf" to 0x%"UVxf"\n",
d3d0e6f1
NC
5461 (UV) SV_COW_NEXT_SV(current), (UV) sv);
5462 }
a29f6d03 5463 SV_COW_NEXT_SV_SET(current, sv);
d3d0e6f1
NC
5464 }
5465#endif
/* Restore sv's original reference count, then dispose of nsv's now-empty
 * head. */
79072805 5466 SvREFCNT(sv) = refcnt;
1edc1566 5467 SvFLAGS(nsv) |= SVTYPEMASK; /* Mark as freed */
39cf41c2 5468 SvREFCNT(nsv) = 0;
463ee0b2 5469 del_SV(nsv);
79072805
LW
5470}
5471
c461cf8f
JH
5472/*
5473=for apidoc sv_clear
5474
645c22ef
DM
5475Clear an SV: call any destructors, free up any memory used by the body,
5476and free the body itself. The SV's head is I<not> freed, although
5477its type is set to all 1's so that it won't inadvertently be assumed
5478to be live during global destruction etc.
5479This function should only be called when REFCNT is zero. Most of the time
5480you'll want to call C<sv_free()> (or its macro wrapper C<SvREFCNT_dec>)
5481instead.
c461cf8f
JH
5482
5483=cut
5484*/
5485
79072805 5486void
864dbfa3 5487Perl_sv_clear(pTHX_ register SV *sv)
79072805 5488{
27da23d5 5489 dVAR;
82bb6deb
NC
/* old_body_arena / old_body_offset are filled in by the type switch below
 * and passed to del_body() at the end; when old_body_arena stays NULL and
 * the type is above SVt_RV the body is released with my_safefree()
 * instead.
 * NOTE(review): SvTYPE(sv) is read in the initializer below, before the
 * assert(sv) that follows it. */
5490 void** old_body_arena;
5491 size_t old_body_offset;
5492 const U32 type = SvTYPE(sv);
5493
79072805
LW
5494 assert(sv);
5495 assert(SvREFCNT(sv) == 0);
5496
82bb6deb
NC
/* Types up to and including SVt_IV need no work here. */
5497 if (type <= SVt_IV)
5498 return;
5499
5500 old_body_arena = 0;
5501 old_body_offset = 0;
5502
/* Blessed SV: run its DESTROY method (if the stash provides one) before
 * anything is torn down. */
ed6116ce 5503 if (SvOBJECT(sv)) {
3280af22 5504 if (PL_defstash) { /* Still have a symbol table? */
39644a26 5505 dSP;
893645bd 5506 HV* stash;
/* The loop repeats when, after the call, sv is still an object but
 * belongs to a different stash than the one whose DESTROY just ran. */
d460ef45 5507 do {
b464bac0 5508 CV* destructor;
4e8e7886 5509 stash = SvSTASH(sv);
32251b26 5510 destructor = StashHANDLER(stash,DESTROY);
4e8e7886 5511 if (destructor) {
/* The destructor receives a temporary, read-only RV to sv as its only
 * argument. */
1b6737cc 5512 SV* const tmpref = newRV(sv);
5cc433a6 5513 SvREADONLY_on(tmpref); /* DESTROY() could be naughty */
4e8e7886 5514 ENTER;
e788e7d3 5515 PUSHSTACKi(PERLSI_DESTROY);
4e8e7886
GS
5516 EXTEND(SP, 2);
5517 PUSHMARK(SP);
5cc433a6 5518 PUSHs(tmpref);
4e8e7886 5519 PUTBACK;
44389ee9 5520 call_sv((SV*)destructor, G_DISCARD|G_EVAL|G_KEEPERR|G_VOID);
7a5fa8a2
NIS
5521
5522
d3acc0f7 5523 POPSTACK;
3095d977 5524 SPAGAIN;
4e8e7886 5525 LEAVE;
5cc433a6
AB
/* Nobody else kept tmpref: detach it from sv by hand (presumably undoing
 * the reference newRV() took on sv -- confirm) so that freeing tmpref
 * below does not act on sv again. */
5526 if(SvREFCNT(tmpref) < 2) {
5527 /* tmpref is not kept alive! */
5528 SvREFCNT(sv)--;
b162af07 5529 SvRV_set(tmpref, NULL);
5cc433a6
AB
5530 SvROK_off(tmpref);
5531 }
5532 SvREFCNT_dec(tmpref);
4e8e7886
GS
5533 }
5534 } while (SvOBJECT(sv) && SvSTASH(sv) != stash);
8ebc5c01 5535
6f44e0a4
JP
5536
/* A non-zero reference count at this point means something took a new
 * reference to sv during DESTROY: fatal while PL_in_clean_objs is set,
 * otherwise sv is simply left alive. */
5537 if (SvREFCNT(sv)) {
5538 if (PL_in_clean_objs)
cea2e8a9 5539 Perl_croak(aTHX_ "DESTROY created new reference to dead object '%s'",
bfcb3514 5540 HvNAME_get(stash));
6f44e0a4
JP
5541 /* DESTROY gave object new lease on life */
5542 return;
5543 }
a0d0e21e 5544 }
4e8e7886 5545
a0d0e21e 5546 if (SvOBJECT(sv)) {
4e8e7886 5547 SvREFCNT_dec(SvSTASH(sv)); /* possibly of changed persuasion */
a0d0e21e 5548 SvOBJECT_off(sv); /* Curse the object. */
82bb6deb 5549 if (type != SVt_PVIO)
3280af22 5550 --PL_sv_objcount; /* XXX Might want something more general */
a0d0e21e 5551 }
463ee0b2 5552 }
/* Free any magic chain; a PVMG carrying SVpad_TYPED also drops the
 * reference it holds on its stash. */
82bb6deb 5553 if (type >= SVt_PVMG) {
524189f1
JH
5554 if (SvMAGIC(sv))
5555 mg_free(sv);
82bb6deb 5556 if (type == SVt_PVMG && SvFLAGS(sv) & SVpad_TYPED)
524189f1
JH
5557 SvREFCNT_dec(SvSTASH(sv));
5558 }
/* Type-specific teardown.  Most scalar-like cases record where their body
 * came from and then jump to the shared 'freescalar' / 'pvrv_common'
 * tails further down. */
82bb6deb 5559 switch (type) {
8990e307 5560 case SVt_PVIO:
/* Close the file handle unless it is one of the three standard streams. */
df0bd2f4
GS
5561 if (IoIFP(sv) &&
5562 IoIFP(sv) != PerlIO_stdin() &&
5f05dabc 5563 IoIFP(sv) != PerlIO_stdout() &&
5564 IoIFP(sv) != PerlIO_stderr())
93578b34 5565 {
f2b5be74 5566 io_close((IO*)sv, FALSE);
93578b34 5567 }
1d7c1841 5568 if (IoDIRP(sv) && !(IoFLAGS(sv) & IOf_FAKE_DIRP))
1236053a 5569 PerlDir_close(IoDIRP(sv));
1d7c1841 5570 IoDIRP(sv) = (DIR*)NULL;
8990e307
LW
5571 Safefree(IoTOP_NAME(sv));
5572 Safefree(IoFMT_NAME(sv));
5573 Safefree(IoBOTTOM_NAME(sv));
82bb6deb
NC
5574 /* PVIOs aren't from arenas */
5575 goto freescalar;
79072805 5576 case SVt_PVBM:
82bb6deb 5577 old_body_arena = (void **) &PL_xpvbm_root;
a0d0e21e 5578 goto freescalar;
79072805 5579 case SVt_PVCV:
82bb6deb 5580 old_body_arena = (void **) &PL_xpvcv_root;
/* No break above: SVt_PVCV falls through into SVt_PVFM so that both run
 * cv_undef(); only the PVCV path has set an arena. */
748a9306 5581 case SVt_PVFM:
82bb6deb 5582 /* PVFMs aren't from arenas */
85e6fe83 5583 cv_undef((CV*)sv);
a0d0e21e 5584 goto freescalar;
79072805 5585 case SVt_PVHV:
85e6fe83 5586 hv_undef((HV*)sv);
82bb6deb
NC
5587 old_body_arena = (void **) &PL_xpvhv_root;
5588 old_body_offset = STRUCT_OFFSET(XPVHV, xhv_fill);
a0d0e21e 5589 break;
79072805 5590 case SVt_PVAV:
85e6fe83 5591 av_undef((AV*)sv);
82bb6deb
NC
5592 old_body_arena = (void **) &PL_xpvav_root;
5593 old_body_offset = STRUCT_OFFSET(XPVAV, xav_fill);
a0d0e21e 5594 break;
02270b4e 5595 case SVt_PVLV:
dd28f7bb
DM
5596 if (LvTYPE(sv) == 'T') { /* for tie: return HE to pool */
5597 SvREFCNT_dec(HeKEY_sv((HE*)LvTARG(sv)));
5598 HeNEXT((HE*)LvTARG(sv)) = PL_hv_fetch_ent_mh;
5599 PL_hv_fetch_ent_mh = (HE*)LvTARG(sv);
5600 }
5601 else if (LvTYPE(sv) != 't') /* unless tie: unrefcnted fake SV** */
5602 SvREFCNT_dec(LvTARG(sv));
82bb6deb 5603 old_body_arena = (void **) &PL_xpvlv_root;
02270b4e 5604 goto freescalar;
a0d0e21e 5605 case SVt_PVGV:
1edc1566 5606 gp_free((GV*)sv);
a0d0e21e 5607 Safefree(GvNAME(sv));
893645bd
NC
5608 /* If we're in a stash, we don't own a reference to it. However it does
5609 have a back reference to us, which needs to be cleared. */
5610 if (GvSTASH(sv))
5611 sv_del_backref((SV*)GvSTASH(sv), sv);
82bb6deb
NC
5612 old_body_arena = (void **) &PL_xpvgv_root;
5613 goto freescalar;
79072805 5614 case SVt_PVMG:
82bb6deb
NC
5615 old_body_arena = (void **) &PL_xpvmg_root;
5616 goto freescalar;
79072805 5617 case SVt_PVNV:
82bb6deb
NC
5618 old_body_arena = (void **) &PL_xpvnv_root;
5619 goto freescalar;
79072805 5620 case SVt_PVIV:
82bb6deb
NC
5621 old_body_arena = (void **) &PL_xpviv_root;
5622 old_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur);
/* Shared tail for the types that jump here: if the OOK flag is set, move
 * the string pointer back by SvIVX(sv) (presumably the OOK offset, so the
 * pointer again addresses the start of the allocation -- confirm) before
 * the buffer is freed below. */
a0d0e21e 5623 freescalar:
5228ca4e
NC
5624 /* Don't bother with SvOOK_off(sv); as we're only going to free it. */
5625 if (SvOOK(sv)) {
93524f2b 5626 SvPV_set(sv, SvPVX_mutable(sv) - SvIVX(sv));
5228ca4e
NC
5627 /* Don't even bother with turning off the OOK flag. */
5628 }
82bb6deb 5629 goto pvrv_common;
79072805 5630 case SVt_PV:
82bb6deb
NC
5631 old_body_arena = (void **) &PL_xpv_root;
5632 old_body_offset = STRUCT_OFFSET(XPV, xpv_cur);
/* No break above: SVt_PV falls through into SVt_RV / pvrv_common. */
a0d0e21e 5633 case SVt_RV:
82bb6deb 5634 pvrv_common:
/* A reference releases its target: a weak reference removes itself from
 * the target's backref list, a strong one drops its reference count. */
810b8aa5 5635 if (SvROK(sv)) {
e15faf7d 5636 SV *target = SvRV(sv);
810b8aa5 5637 if (SvWEAKREF(sv))
e15faf7d 5638 sv_del_backref(target, sv);
810b8aa5 5639 else
e15faf7d 5640 SvREFCNT_dec(target);
810b8aa5 5641 }
f8c7b90f 5642#ifdef PERL_OLD_COPY_ON_WRITE
3f7c398e 5643 else if (SvPVX_const(sv)) {
765f542d
NC
5644 if (SvIsCOW(sv)) {
5645 /* I believe I need to grab the global SV mutex here and
5646 then recheck the COW status. */
46187eeb
NC
5647 if (DEBUG_C_TEST) {
5648 PerlIO_printf(Perl_debug_log, "Copy on write: clear\n");
e419cbc5 5649 sv_dump(sv);
46187eeb 5650 }
bdd68bc3
NC
5651 sv_release_COW(sv, SvPVX_const(sv), SvLEN(sv),
5652 SV_COW_NEXT_SV(sv));
765f542d
NC
5653 /* And drop it here. */
5654 SvFAKE_off(sv);
5655 } else if (SvLEN(sv)) {
3f7c398e 5656 Safefree(SvPVX_const(sv));
765f542d
NC
5657 }
5658 }
5659#else
/* Without PERL_OLD_COPY_ON_WRITE: a buffer with a non-zero SvLEN is freed
 * directly; a READONLY+FAKE string is released through unshare_hek()
 * instead. */
3f7c398e 5660 else if (SvPVX_const(sv) && SvLEN(sv))
94010e71 5661 Safefree(SvPVX_mutable(sv));
3f7c398e 5662 else if (SvPVX_const(sv) && SvREADONLY(sv) && SvFAKE(sv)) {
bdd68bc3 5663 unshare_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sv)));
1c846c1f
NIS
5664 SvFAKE_off(sv);
5665 }
765f542d 5666#endif
79072805
LW
5667 break;
5668 case SVt_NV:
82bb6deb 5669 old_body_arena = (void **) &PL_xnv_root;
79072805
LW
5670 break;
5671 }
5672
893645bd
NC
/* Drop every flag except SVf_BREAK, then set all the type bits to mark
 * the head as no longer live. */
5673 SvFLAGS(sv) &= SVf_BREAK;
5674 SvFLAGS(sv) |= SVTYPEMASK;
5675
82bb6deb
NC
/* Release the body: via del_body() on the recorded arena root (not under
 * PURIFY), otherwise with my_safefree() for types above SVt_RV. */
5676#ifndef PURIFY
5677 if (old_body_arena) {
5678 del_body(((char *)SvANY(sv) + old_body_offset), old_body_arena);
79072805 5679 }
82bb6deb
NC
5680 else
5681#endif
5682 if (type > SVt_RV) {
5683 my_safefree(SvANY(sv));
5684 }
79072805
LW
5685}
5686
645c22ef
DM
5687/*
5688=for apidoc sv_newref
5689
5690Increment an SV's reference count. Use the C<SvREFCNT_inc()> wrapper
5691instead.
5692
5693=cut
5694*/
5695
79072805 5696SV *
864dbfa3 5697Perl_sv_newref(pTHX_ SV *sv)
79072805 5698{
463ee0b2 5699 if (sv)
4db098f4 5700 (SvREFCNT(sv))++;
79072805
LW
5701 return sv;
5702}
5703
c461cf8f
JH
5704/*
5705=for apidoc sv_free
5706
645c22ef
DM
5707Decrement an SV's reference count, and if it drops to zero, call
5708C<sv_clear> to invoke destructors and free up any memory used by
5709the body; finally, deallocate the SV's head itself.
5710Normally called via a wrapper macro C<SvREFCNT_dec>.
c461cf8f
JH
5711
5712=cut
5713*/
5714
79072805 5715void
864dbfa3 5716Perl_sv_free(pTHX_ SV *sv)
79072805 5717{
27da23d5 5718 dVAR;
79072805
LW
5719 if (!sv)
5720 return;
a0d0e21e
LW
5721 if (SvREFCNT(sv) == 0) {
5722 if (SvFLAGS(sv) & SVf_BREAK)
645c22ef
DM
5723 /* this SV's refcnt has been artificially decremented to
5724 * trigger cleanup */
a0d0e21e 5725 return;
3280af22 5726 if (PL_in_clean_all) /* All is fair */
1edc1566 5727 return;
d689ffdd
JP
5728 if (SvREADONLY(sv) && SvIMMORTAL(sv)) {
5729 /* make sure SvREFCNT(sv)==0 happens very seldom */
5730 SvREFCNT(sv) = (~(U32)0)/2;
5731 return;
5732 }
41e4abd8 5733 if (ckWARN_d(WARN_INTERNAL)) {
d5dede04 5734 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
472d47bc
SB
5735 "Attempt to free unreferenced scalar: SV 0x%"UVxf
5736 pTHX__FORMAT, PTR2UV(sv) pTHX__VALUE);
41e4abd8
NC
5737#ifdef DEBUG_LEAKING_SCALARS_FORK_DUMP
5738 Perl_dump_sv_child(aTHX_ sv);
5739#endif
5740 }
79072805
LW
5741 return;
5742 }
4db098f4 5743 if (--(SvREFCNT(sv)) > 0)
8990e307 5744 return;
8c4d3c90
NC
5745 Perl_sv_free2(aTHX_ sv);
5746}
5747
5748void
5749Perl_sv_free2(pTHX_ SV *sv)
5750{
27da23d5 5751 dVAR;
463ee0b2
LW
5752#ifdef DEBUGGING
5753 if (SvTEMP(sv)) {
0453d815 5754 if (ckWARN_d(WARN_DEBUGGING))
9014280d 5755 Perl_warner(aTHX_ packWARN(WARN_DEBUGGING),
472d47bc
SB
5756 "Attempt to free temp prematurely: SV 0x%"UVxf
5757 pTHX__FORMAT, PTR2UV(sv) pTHX__VALUE);
79072805 5758 return;
79072805 5759 }
463ee0b2 5760#endif
d689ffdd
JP
5761 if (SvREADONLY(sv) && SvIMMORTAL(sv)) {
5762 /* make sure SvREFCNT(sv)==0 happens very seldom */
5763 SvREFCNT(sv) = (~(U32)0)/2;
5764 return;
5765 }
79072805 5766 sv_clear(sv);
477f5d66
CS
5767 if (! SvREFCNT(sv))
5768 del_SV(sv);
79072805
LW
5769}
5770
954c1994
GS
5771/*
5772=for apidoc sv_len
5773
645c22ef
DM
5774Returns the length of the string in the SV. Handles magic and type
5775coercion. See also C<SvCUR>, which gives raw access to the xpv_cur slot.
954c1994
GS
5776
5777=cut
5778*/
5779
79072805 5780STRLEN
864dbfa3 5781Perl_sv_len(pTHX_ register SV *sv)
79072805 5782{
463ee0b2 5783 STRLEN len;
79072805
LW
5784
5785 if (!sv)
5786 return 0;
5787
8990e307 5788 if (SvGMAGICAL(sv))
565764a8 5789 len = mg_length(sv);
8990e307 5790 else
4d84ee25 5791 (void)SvPV_const(sv, len);
463ee0b2 5792 return len;
79072805
LW
5793}
5794
c461cf8f
JH
5795/*
5796=for apidoc sv_len_utf8
5797
5798Returns the number of characters in the string in an SV, counting wide
1e54db1a 5799UTF-8 bytes as a single character. Handles magic and type coercion.
c461cf8f
JH
5800
5801=cut
5802*/
5803
7e8c5dac
HS
5804/*
5805 * The length is cached in PERL_UTF8_magic, in the mg_len field. Also the
5806 * mg_ptr is used, by sv_pos_u2b(), see the comments of S_utf8_mg_pos_init().
5807 * (Note that the mg_len is not the length of the mg_ptr field.)
7a5fa8a2 5808 *
7e8c5dac
HS
5809 */
5810
a0ed51b3 5811STRLEN
864dbfa3 5812Perl_sv_len_utf8(pTHX_ register SV *sv)
a0ed51b3 5813{
a0ed51b3
LW
5814 if (!sv)
5815 return 0;
5816
a0ed51b3 5817 if (SvGMAGICAL(sv))
b76347f2 5818 return mg_length(sv);
a0ed51b3 5819 else
b76347f2 5820 {
7e8c5dac 5821 STRLEN len, ulen;
e62f0680 5822 const U8 *s = (U8*)SvPV_const(sv, len);
7e8c5dac
HS
5823 MAGIC *mg = SvMAGICAL(sv) ? mg_find(sv, PERL_MAGIC_utf8) : 0;
5824
e23c8137 5825 if (mg && mg->mg_len != -1 && (mg->mg_len > 0 || len == 0)) {
7e8c5dac 5826 ulen = mg->mg_len;
e23c8137
JH
5827#ifdef PERL_UTF8_CACHE_ASSERT
5828 assert(ulen == Perl_utf8_length(aTHX_ s, s + len));
5829#endif
5830 }
7e8c5dac
HS
5831 else {
5832 ulen = Perl_utf8_length(aTHX_ s, s + len);
5833 if (!mg && !SvREADONLY(sv)) {
5834 sv_magic(sv, 0, PERL_MAGIC_utf8, 0, 0);
5835 mg = mg_find(sv, PERL_MAGIC_utf8);
5836 assert(mg);
5837 }
5838 if (mg)
5839 mg->mg_len = ulen;
5840 }
5841 return ulen;
5842 }
5843}
5844
5845/* S_utf8_mg_pos_init() is used to initialize the mg_ptr field of
5846 * a PERL_UTF8_magic. The mg_ptr is used to store the mapping
5847 * between UTF-8 and byte offsets. There are two (substr offset and substr
5848 * length, the i offset, PERL_MAGIC_UTF8_CACHESIZE) times two (UTF-8 offset
5849 * and byte offset) cache positions.
5850 *
5851 * The mg_len field is used by sv_len_utf8(), see its comments.
5852 * Note that the mg_len is not the length of the mg_ptr field.
5853 *
5854 */
5855STATIC bool
245d4a47
NC
5856S_utf8_mg_pos_init(pTHX_ SV *sv, MAGIC **mgp, STRLEN **cachep, I32 i,
5857 I32 offsetp, const U8 *s, const U8 *start)
7e8c5dac 5858{
7a5fa8a2 5859 bool found = FALSE;
7e8c5dac
HS
5860
5861 if (SvMAGICAL(sv) && !SvREADONLY(sv)) {
8f78557a 5862 if (!*mgp)
27da23d5 5863 *mgp = sv_magicext(sv, 0, PERL_MAGIC_utf8, (MGVTBL*)&PL_vtbl_utf8, 0, 0);
7e8c5dac 5864 assert(*mgp);
b76347f2 5865
7e8c5dac
HS
5866 if ((*mgp)->mg_ptr)
5867 *cachep = (STRLEN *) (*mgp)->mg_ptr;
5868 else {
a02a5408 5869 Newxz(*cachep, PERL_MAGIC_UTF8_CACHESIZE * 2, STRLEN);
7e8c5dac
HS
5870 (*mgp)->mg_ptr = (char *) *cachep;
5871 }
5872 assert(*cachep);
5873
a3b680e6 5874 (*cachep)[i] = offsetp;
7e8c5dac
HS
5875 (*cachep)[i+1] = s - start;
5876 found = TRUE;
a0ed51b3 5877 }
7e8c5dac
HS
5878
5879 return found;
a0ed51b3
LW
5880}
5881
645c22ef 5882/*
7e8c5dac
HS
5883 * S_utf8_mg_pos() is used to query and update mg_ptr field of
5884 * a PERL_UTF8_magic. The mg_ptr is used to store the mapping
5885 * between UTF-8 and byte offsets. See also the comments of
5886 * S_utf8_mg_pos_init().
5887 *
5888 */
5889STATIC bool
245d4a47 5890S_utf8_mg_pos(pTHX_ SV *sv, MAGIC **mgp, STRLEN **cachep, I32 i, I32 *offsetp, I32 uoff, const U8 **sp, const U8 *start, const U8 *send)
7e8c5dac
HS
5891{
5892 bool found = FALSE;
5893
5894 if (SvMAGICAL(sv) && !SvREADONLY(sv)) {
5895 if (!*mgp)
5896 *mgp = mg_find(sv, PERL_MAGIC_utf8);
5897 if (*mgp && (*mgp)->mg_ptr) {
5898 *cachep = (STRLEN *) (*mgp)->mg_ptr;
e23c8137 5899 ASSERT_UTF8_CACHE(*cachep);
667208dd 5900 if ((*cachep)[i] == (STRLEN)uoff) /* An exact match. */
7a5fa8a2 5901 found = TRUE;
7e8c5dac
HS
5902 else { /* We will skip to the right spot. */
5903 STRLEN forw = 0;
5904 STRLEN backw = 0;
a3b680e6 5905 const U8* p = NULL;
7e8c5dac
HS
5906
5907 /* The assumption is that going backward is half
5908 * the speed of going forward (that's where the
5909 * 2 * backw in the below comes from). (The real
5910 * figure of course depends on the UTF-8 data.) */
5911
667208dd 5912 if ((*cachep)[i] > (STRLEN)uoff) {
7e8c5dac 5913 forw = uoff;
667208dd 5914 backw = (*cachep)[i] - (STRLEN)uoff;
7e8c5dac
HS
5915
5916 if (forw < 2 * backw)
5917 p = start;
5918 else
5919 p = start + (*cachep)[i+1];
5920 }
5921 /* Try this only for the substr offset (i == 0),
5922 * not for the substr length (i == 2). */
5923 else if (i == 0) { /* (*cachep)[i] < uoff */
a3b680e6 5924 const STRLEN ulen = sv_len_utf8(sv);
7e8c5dac 5925
667208dd
JH
5926 if ((STRLEN)uoff < ulen) {
5927 forw = (STRLEN)uoff - (*cachep)[i];
5928 backw = ulen - (STRLEN)uoff;
7e8c5dac
HS
5929
5930 if (forw < 2 * backw)
5931 p = start + (*cachep)[i+1];
5932 else
5933 p = send;
5934 }
5935
5936 /* If the string is not long enough for uoff,
5937 * we could extend it, but not at this low a level. */
5938 }
5939
5940 if (p) {
5941 if (forw < 2 * backw) {
5942 while (forw--)
5943 p += UTF8SKIP(p);
5944 }
5945 else {
5946 while (backw--) {
5947 p--;
5948 while (UTF8_IS_CONTINUATION(*p))
5949 p--;
5950 }
5951 }
5952
5953 /* Update the cache. */
667208dd 5954 (*cachep)[i] = (STRLEN)uoff;
7e8c5dac 5955 (*cachep)[i+1] = p - start;
8f78557a
AE
5956
5957 /* Drop the stale "length" cache */
5958 if (i == 0) {
5959 (*cachep)[2] = 0;
5960 (*cachep)[3] = 0;
5961 }
7a5fa8a2 5962
7e8c5dac
HS
5963 found = TRUE;
5964 }
5965 }
5966 if (found) { /* Setup the return values. */
5967 *offsetp = (*cachep)[i+1];
5968 *sp = start + *offsetp;
5969 if (*sp >= send) {
5970 *sp = send;
5971 *offsetp = send - start;
5972 }
5973 else if (*sp < start) {
5974 *sp = start;
5975 *offsetp = 0;
5976 }
5977 }
5978 }
e23c8137
JH
5979#ifdef PERL_UTF8_CACHE_ASSERT
5980 if (found) {
5981 U8 *s = start;
5982 I32 n = uoff;
5983
5984 while (n-- && s < send)
5985 s += UTF8SKIP(s);
5986
5987 if (i == 0) {
5988 assert(*offsetp == s - start);
5989 assert((*cachep)[0] == (STRLEN)uoff);
5990 assert((*cachep)[1] == *offsetp);
5991 }
5992 ASSERT_UTF8_CACHE(*cachep);
5993 }
5994#endif
7e8c5dac 5995 }
e23c8137 5996
7e8c5dac
HS
5997 return found;
5998}
7a5fa8a2 5999
7e8c5dac 6000/*
645c22ef
DM
6001=for apidoc sv_pos_u2b
6002
1e54db1a 6003Converts the value pointed to by offsetp from a count of UTF-8 chars from
645c22ef
DM
6004the start of the string, to a count of the equivalent number of bytes; if
6005lenp is non-zero, it does the same to lenp, but this time starting from
6006the offset, rather than from the start of the string. Handles magic and
6007type coercion.
6008
6009=cut
6010*/
6011
7e8c5dac
HS
6012/*
6013 * sv_pos_u2b() uses, like sv_pos_b2u(), the mg_ptr of the potential
6014 * PERL_UTF8_magic of the sv to store the mapping between UTF-8 and
6015 * byte offsets. See also the comments of S_utf8_mg_pos().
6016 *
6017 */
6018
a0ed51b3 6019void
864dbfa3 6020Perl_sv_pos_u2b(pTHX_ register SV *sv, I32* offsetp, I32* lenp)
a0ed51b3 6021{
245d4a47 6022 const U8 *start;
a0ed51b3
LW
6023 STRLEN len;
6024
6025 if (!sv)
6026 return;
6027
245d4a47 6028 start = (U8*)SvPV_const(sv, len);
7e8c5dac 6029 if (len) {
b464bac0
AL
6030 STRLEN boffset = 0;
6031 STRLEN *cache = 0;
245d4a47
NC
6032 const U8 *s = start;
6033 I32 uoffset = *offsetp;
9d4ba2ae 6034 const U8 * const send = s + len;
245d4a47
NC
6035 MAGIC *mg = 0;
6036 bool found = FALSE;
7e8c5dac 6037
bdf77a2a 6038 if (utf8_mg_pos(sv, &mg, &cache, 0, offsetp, *offsetp, &s, start, send))
7e8c5dac
HS
6039 found = TRUE;
6040 if (!found && uoffset > 0) {
6041 while (s < send && uoffset--)
6042 s += UTF8SKIP(s);
6043 if (s >= send)
6044 s = send;
a3b680e6 6045 if (utf8_mg_pos_init(sv, &mg, &cache, 0, *offsetp, s, start))
7e8c5dac
HS
6046 boffset = cache[1];
6047 *offsetp = s - start;
6048 }
6049 if (lenp) {
6050 found = FALSE;
6051 start = s;
ec062429 6052 if (utf8_mg_pos(sv, &mg, &cache, 2, lenp, *lenp, &s, start, send)) {
7e8c5dac
HS
6053 *lenp -= boffset;
6054 found = TRUE;
6055 }
6056 if (!found && *lenp > 0) {
6057 I32 ulen = *lenp;
6058 if (ulen > 0)
6059 while (s < send && ulen--)
6060 s += UTF8SKIP(s);
6061 if (s >= send)
6062 s = send;
a3b680e6 6063 utf8_mg_pos_init(sv, &mg, &cache, 2, *lenp, s, start);
7e8c5dac
HS
6064 }
6065 *lenp = s - start;
6066 }
e23c8137 6067 ASSERT_UTF8_CACHE(cache);
7e8c5dac
HS
6068 }
6069 else {
6070 *offsetp = 0;
6071 if (lenp)
6072 *lenp = 0;
a0ed51b3 6073 }
e23c8137 6074
a0ed51b3
LW
6075 return;
6076}
6077
645c22ef
DM
6078/*
6079=for apidoc sv_pos_b2u
6080
6081Converts the value pointed to by offsetp from a count of bytes from the
1e54db1a 6082start of the string, to a count of the equivalent number of UTF-8 chars.
645c22ef
DM
6083Handles magic and type coercion.
6084
6085=cut
6086*/
6087
7e8c5dac
HS
6088/*
6089 * sv_pos_b2u() uses, like sv_pos_u2b(), the mg_ptr of the potential
6090 * PERL_UTF8_magic of the sv to store the mapping between UTF-8 and
6091 * byte offsets. See also the comments of S_utf8_mg_pos().
6092 *
6093 */
6094
a0ed51b3 6095void
7e8c5dac 6096Perl_sv_pos_b2u(pTHX_ register SV* sv, I32* offsetp)
a0ed51b3 6097{
83003860 6098 const U8* s;
a0ed51b3
LW
6099 STRLEN len;
6100
6101 if (!sv)
6102 return;
6103
83003860 6104 s = (const U8*)SvPV_const(sv, len);
eb160463 6105 if ((I32)len < *offsetp)
a0dbb045 6106 Perl_croak(aTHX_ "panic: sv_pos_b2u: bad byte offset");
7e8c5dac 6107 else {
83003860 6108 const U8* send = s + *offsetp;
7e8c5dac
HS
6109 MAGIC* mg = NULL;
6110 STRLEN *cache = NULL;
6111
6112 len = 0;
6113
6114 if (SvMAGICAL(sv) && !SvREADONLY(sv)) {
6115 mg = mg_find(sv, PERL_MAGIC_utf8);
6116 if (mg && mg->mg_ptr) {
6117 cache = (STRLEN *) mg->mg_ptr;
c5661c80 6118 if (cache[1] == (STRLEN)*offsetp) {
7e8c5dac
HS
6119 /* An exact match. */
6120 *offsetp = cache[0];
6121
6122 return;
6123 }
c5661c80 6124 else if (cache[1] < (STRLEN)*offsetp) {
7e8c5dac
HS
6125 /* We already know part of the way. */
6126 len = cache[0];
6127 s += cache[1];
7a5fa8a2 6128 /* Let the below loop do the rest. */
7e8c5dac
HS
6129 }
6130 else { /* cache[1] > *offsetp */
6131 /* We already know all of the way, now we may
6132 * be able to walk back. The same assumption
6133 * is made as in S_utf8_mg_pos(), namely that
6134 * walking backward is twice slower than
6135 * walking forward. */
9d4ba2ae 6136 const STRLEN forw = *offsetp;
7e8c5dac
HS
6137 STRLEN backw = cache[1] - *offsetp;
6138
6139 if (!(forw < 2 * backw)) {
83003860 6140 const U8 *p = s + cache[1];
7e8c5dac 6141 STRLEN ubackw = 0;
7a5fa8a2 6142
a5b510f2
AE
6143 cache[1] -= backw;
6144
7e8c5dac
HS
6145 while (backw--) {
6146 p--;
0aeb64d0 6147 while (UTF8_IS_CONTINUATION(*p)) {
7e8c5dac 6148 p--;
0aeb64d0
JH
6149 backw--;
6150 }
7e8c5dac
HS
6151 ubackw++;
6152 }
6153
6154 cache[0] -= ubackw;
0aeb64d0 6155 *offsetp = cache[0];
a67d7df9
TS
6156
6157 /* Drop the stale "length" cache */
6158 cache[2] = 0;
6159 cache[3] = 0;
6160
0aeb64d0 6161 return;
7e8c5dac
HS
6162 }
6163 }
6164 }
e23c8137 6165 ASSERT_UTF8_CACHE(cache);
a0dbb045 6166 }
7e8c5dac
HS
6167
6168 while (s < send) {
6169 STRLEN n = 1;
6170
6171 /* Call utf8n_to_uvchr() to validate the sequence
6172 * (unless a simple non-UTF character) */
6173 if (!UTF8_IS_INVARIANT(*s))
6174 utf8n_to_uvchr(s, UTF8SKIP(s), &n, 0);
6175 if (n > 0) {
6176 s += n;
6177 len++;
6178 }
6179 else
6180 break;
6181 }
6182
6183 if (!SvREADONLY(sv)) {
6184 if (!mg) {
6185 sv_magic(sv, 0, PERL_MAGIC_utf8, 0, 0);
6186 mg = mg_find(sv, PERL_MAGIC_utf8);
6187 }
6188 assert(mg);
6189
6190 if (!mg->mg_ptr) {
a02a5408 6191 Newxz(cache, PERL_MAGIC_UTF8_CACHESIZE * 2, STRLEN);
7e8c5dac
HS
6192 mg->mg_ptr = (char *) cache;
6193 }
6194 assert(cache);
6195
6196 cache[0] = len;
6197 cache[1] = *offsetp;
a67d7df9
TS
6198 /* Drop the stale "length" cache */
6199 cache[2] = 0;
6200 cache[3] = 0;
7e8c5dac
HS
6201 }
6202
6203 *offsetp = len;
a0ed51b3 6204 }
a0ed51b3
LW
6205 return;
6206}
6207
954c1994
GS
6208/*
6209=for apidoc sv_eq
6210
6211Returns a boolean indicating whether the strings in the two SVs are
645c22ef
DM
6212identical. Is UTF-8 and 'use bytes' aware, handles get magic, and will
6213coerce its args to strings if necessary.
954c1994
GS
6214
6215=cut
6216*/
6217
79072805 6218I32
e01b9e88 6219Perl_sv_eq(pTHX_ register SV *sv1, register SV *sv2)
79072805 6220{
e1ec3a88 6221 const char *pv1;
463ee0b2 6222 STRLEN cur1;
e1ec3a88 6223 const char *pv2;
463ee0b2 6224 STRLEN cur2;
e01b9e88 6225 I32 eq = 0;
553e1bcc
AT
6226 char *tpv = Nullch;
6227 SV* svrecode = Nullsv;
79072805 6228
e01b9e88 6229 if (!sv1) {
79072805
LW
6230 pv1 = "";
6231 cur1 = 0;
6232 }
463ee0b2 6233 else
4d84ee25 6234 pv1 = SvPV_const(sv1, cur1);
79072805 6235
e01b9e88
SC
6236 if (!sv2){
6237 pv2 = "";
6238 cur2 = 0;
92d29cee 6239 }
e01b9e88 6240 else
4d84ee25 6241 pv2 = SvPV_const(sv2, cur2);
79072805 6242
cf48d248 6243 if (cur1 && cur2 && SvUTF8(sv1) != SvUTF8(sv2) && !IN_BYTES) {
799ef3cb
JH
6244 /* Differing utf8ness.
6245 * Do not UTF8size the comparands as a side-effect. */
6246 if (PL_encoding) {
6247 if (SvUTF8(sv1)) {
553e1bcc
AT
6248 svrecode = newSVpvn(pv2, cur2);
6249 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6250 pv2 = SvPV_const(svrecode, cur2);
799ef3cb
JH
6251 }
6252 else {
553e1bcc
AT
6253 svrecode = newSVpvn(pv1, cur1);
6254 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6255 pv1 = SvPV_const(svrecode, cur1);
799ef3cb
JH
6256 }
6257 /* Now both are in UTF-8. */
0a1bd7ac
DM
6258 if (cur1 != cur2) {
6259 SvREFCNT_dec(svrecode);
799ef3cb 6260 return FALSE;
0a1bd7ac 6261 }
799ef3cb
JH
6262 }
6263 else {
6264 bool is_utf8 = TRUE;
6265
6266 if (SvUTF8(sv1)) {
6267 /* sv1 is the UTF-8 one,
6268 * if is equal it must be downgrade-able */
9d4ba2ae 6269 char * const pv = (char*)bytes_from_utf8((const U8*)pv1,
799ef3cb
JH
6270 &cur1, &is_utf8);
6271 if (pv != pv1)
553e1bcc 6272 pv1 = tpv = pv;
799ef3cb
JH
6273 }
6274 else {
6275 /* sv2 is the UTF-8 one,
6276 * if is equal it must be downgrade-able */
9d4ba2ae 6277 char * const pv = (char *)bytes_from_utf8((const U8*)pv2,
799ef3cb
JH
6278 &cur2, &is_utf8);
6279 if (pv != pv2)
553e1bcc 6280 pv2 = tpv = pv;
799ef3cb
JH
6281 }
6282 if (is_utf8) {
6283 /* Downgrade not possible - cannot be eq */
bf694877 6284 assert (tpv == 0);
799ef3cb
JH
6285 return FALSE;
6286 }
6287 }
cf48d248
JH
6288 }
6289
6290 if (cur1 == cur2)
765f542d 6291 eq = (pv1 == pv2) || memEQ(pv1, pv2, cur1);
e01b9e88 6292
553e1bcc
AT
6293 if (svrecode)
6294 SvREFCNT_dec(svrecode);
799ef3cb 6295
553e1bcc
AT
6296 if (tpv)
6297 Safefree(tpv);
cf48d248 6298
e01b9e88 6299 return eq;
79072805
LW
6300}
6301
954c1994
GS
6302/*
6303=for apidoc sv_cmp
6304
6305Compares the strings in two SVs. Returns -1, 0, or 1 indicating whether the
6306string in C<sv1> is less than, equal to, or greater than the string in
645c22ef
DM
6307C<sv2>. Is UTF-8 and 'use bytes' aware, handles get magic, and will
6308coerce its args to strings if necessary. See also C<sv_cmp_locale>.
954c1994
GS
6309
6310=cut
6311*/
6312
79072805 6313I32
e01b9e88 6314Perl_sv_cmp(pTHX_ register SV *sv1, register SV *sv2)
79072805 6315{
560a288e 6316 STRLEN cur1, cur2;
e1ec3a88
AL
6317 const char *pv1, *pv2;
6318 char *tpv = Nullch;
cf48d248 6319 I32 cmp;
553e1bcc 6320 SV *svrecode = Nullsv;
560a288e 6321
e01b9e88
SC
6322 if (!sv1) {
6323 pv1 = "";
560a288e
GS
6324 cur1 = 0;
6325 }
e01b9e88 6326 else
4d84ee25 6327 pv1 = SvPV_const(sv1, cur1);
560a288e 6328
553e1bcc 6329 if (!sv2) {
e01b9e88 6330 pv2 = "";
560a288e
GS
6331 cur2 = 0;
6332 }
e01b9e88 6333 else
4d84ee25 6334 pv2 = SvPV_const(sv2, cur2);
79072805 6335
cf48d248 6336 if (cur1 && cur2 && SvUTF8(sv1) != SvUTF8(sv2) && !IN_BYTES) {
799ef3cb
JH
6337 /* Differing utf8ness.
6338 * Do not UTF8size the comparands as a side-effect. */
cf48d248 6339 if (SvUTF8(sv1)) {
799ef3cb 6340 if (PL_encoding) {
553e1bcc
AT
6341 svrecode = newSVpvn(pv2, cur2);
6342 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6343 pv2 = SvPV_const(svrecode, cur2);
799ef3cb
JH
6344 }
6345 else {
e1ec3a88 6346 pv2 = tpv = (char*)bytes_to_utf8((const U8*)pv2, &cur2);
799ef3cb 6347 }
cf48d248
JH
6348 }
6349 else {
799ef3cb 6350 if (PL_encoding) {
553e1bcc
AT
6351 svrecode = newSVpvn(pv1, cur1);
6352 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6353 pv1 = SvPV_const(svrecode, cur1);
799ef3cb
JH
6354 }
6355 else {
e1ec3a88 6356 pv1 = tpv = (char*)bytes_to_utf8((const U8*)pv1, &cur1);
799ef3cb 6357 }
cf48d248
JH
6358 }
6359 }
6360
e01b9e88 6361 if (!cur1) {
cf48d248 6362 cmp = cur2 ? -1 : 0;
e01b9e88 6363 } else if (!cur2) {
cf48d248
JH
6364 cmp = 1;
6365 } else {
e1ec3a88 6366 const I32 retval = memcmp((const void*)pv1, (const void*)pv2, cur1 < cur2 ? cur1 : cur2);
e01b9e88
SC
6367
6368 if (retval) {
cf48d248 6369 cmp = retval < 0 ? -1 : 1;
e01b9e88 6370 } else if (cur1 == cur2) {
cf48d248
JH
6371 cmp = 0;
6372 } else {
6373 cmp = cur1 < cur2 ? -1 : 1;
e01b9e88 6374 }
cf48d248 6375 }
16660edb 6376
553e1bcc
AT
6377 if (svrecode)
6378 SvREFCNT_dec(svrecode);
799ef3cb 6379
553e1bcc
AT
6380 if (tpv)
6381 Safefree(tpv);
cf48d248
JH
6382
6383 return cmp;
bbce6d69 6384}
16660edb 6385
c461cf8f
JH
6386/*
6387=for apidoc sv_cmp_locale
6388
645c22ef
DM
6389Compares the strings in two SVs in a locale-aware manner. Is UTF-8 and
6390'use bytes' aware, handles get magic, and will coerce its args to strings
6391if necessary. See also C<sv_cmp>.
c461cf8f
JH
6392
6393=cut
6394*/
6395
bbce6d69 6396I32
864dbfa3 6397Perl_sv_cmp_locale(pTHX_ register SV *sv1, register SV *sv2)
bbce6d69 6398{
36477c24 6399#ifdef USE_LOCALE_COLLATE
16660edb 6400
bbce6d69 6401 char *pv1, *pv2;
6402 STRLEN len1, len2;
6403 I32 retval;
16660edb 6404
3280af22 6405 if (PL_collation_standard)
bbce6d69 6406 goto raw_compare;
16660edb 6407
bbce6d69 6408 len1 = 0;
8ac85365 6409 pv1 = sv1 ? sv_collxfrm(sv1, &len1) : (char *) NULL;
bbce6d69 6410 len2 = 0;
8ac85365 6411 pv2 = sv2 ? sv_collxfrm(sv2, &len2) : (char *) NULL;
16660edb 6412
bbce6d69 6413 if (!pv1 || !len1) {
6414 if (pv2 && len2)
6415 return -1;
6416 else
6417 goto raw_compare;
6418 }
6419 else {
6420 if (!pv2 || !len2)
6421 return 1;
6422 }
16660edb 6423
bbce6d69 6424 retval = memcmp((void*)pv1, (void*)pv2, len1 < len2 ? len1 : len2);
16660edb 6425
bbce6d69 6426 if (retval)
16660edb 6427 return retval < 0 ? -1 : 1;
6428
bbce6d69 6429 /*
6430 * When the result of collation is equality, that doesn't mean
6431 * that there are no differences -- some locales exclude some
6432 * characters from consideration. So to avoid false equalities,
6433 * we use the raw string as a tiebreaker.
6434 */
16660edb 6435
bbce6d69 6436 raw_compare:
6437 /* FALL THROUGH */
16660edb 6438
36477c24 6439#endif /* USE_LOCALE_COLLATE */
16660edb 6440
bbce6d69 6441 return sv_cmp(sv1, sv2);
6442}
79072805 6443
645c22ef 6444
36477c24 6445#ifdef USE_LOCALE_COLLATE
645c22ef 6446
7a4c00b4 6447/*
645c22ef
DM
6448=for apidoc sv_collxfrm
6449
6450Add Collate Transform magic to an SV if it doesn't already have it.
6451
6452Any scalar variable may carry PERL_MAGIC_collxfrm magic that contains the
6453scalar data of the variable, but transformed to such a format that a normal
6454memory comparison can be used to compare the data according to the locale
6455settings.
6456
6457=cut
6458*/
6459
bbce6d69 6460char *
864dbfa3 6461Perl_sv_collxfrm(pTHX_ SV *sv, STRLEN *nxp)
bbce6d69 6462{
7a4c00b4 6463 MAGIC *mg;
16660edb 6464
14befaf4 6465 mg = SvMAGICAL(sv) ? mg_find(sv, PERL_MAGIC_collxfrm) : (MAGIC *) NULL;
3280af22 6466 if (!mg || !mg->mg_ptr || *(U32*)mg->mg_ptr != PL_collation_ix) {
93524f2b
NC
6467 const char *s;
6468 char *xf;
bbce6d69 6469 STRLEN len, xlen;
6470
7a4c00b4 6471 if (mg)
6472 Safefree(mg->mg_ptr);
93524f2b 6473 s = SvPV_const(sv, len);
bbce6d69 6474 if ((xf = mem_collxfrm(s, len, &xlen))) {
ff0cee69 6475 if (SvREADONLY(sv)) {
6476 SAVEFREEPV(xf);
6477 *nxp = xlen;
3280af22 6478 return xf + sizeof(PL_collation_ix);
ff0cee69 6479 }
7a4c00b4 6480 if (! mg) {
14befaf4
DM
6481 sv_magic(sv, 0, PERL_MAGIC_collxfrm, 0, 0);
6482 mg = mg_find(sv, PERL_MAGIC_collxfrm);
7a4c00b4 6483 assert(mg);
bbce6d69 6484 }
7a4c00b4 6485 mg->mg_ptr = xf;
565764a8 6486 mg->mg_len = xlen;
7a4c00b4 6487 }
6488 else {
ff0cee69 6489 if (mg) {
6490 mg->mg_ptr = NULL;
565764a8 6491 mg->mg_len = -1;
ff0cee69 6492 }
bbce6d69 6493 }
6494 }
7a4c00b4 6495 if (mg && mg->mg_ptr) {
565764a8 6496 *nxp = mg->mg_len;
3280af22 6497 return mg->mg_ptr + sizeof(PL_collation_ix);
bbce6d69 6498 }
6499 else {
6500 *nxp = 0;
6501 return NULL;
16660edb 6502 }
79072805
LW
6503}
6504
36477c24 6505#endif /* USE_LOCALE_COLLATE */
bbce6d69 6506
c461cf8f
JH
6507/*
6508=for apidoc sv_gets
6509
6510Get a line from the filehandle and store it into the SV, optionally
6511appending to the currently-stored string.
6512
6513=cut
6514*/
6515
79072805 6516char *
864dbfa3 6517Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append)
79072805 6518{
e1ec3a88 6519 const char *rsptr;
c07a80fd 6520 STRLEN rslen;
6521 register STDCHAR rslast;
6522 register STDCHAR *bp;
6523 register I32 cnt;
9c5ffd7c 6524 I32 i = 0;
8bfdd7d9 6525 I32 rspara = 0;
e311fd51 6526 I32 recsize;
c07a80fd 6527
bc44a8a2
NC
6528 if (SvTHINKFIRST(sv))
6529 sv_force_normal_flags(sv, append ? 0 : SV_COW_DROP_PV);
765f542d
NC
6530 /* XXX. If you make this PVIV, then copy on write can copy scalars read
6531 from <>.
6532 However, perlbench says it's slower, because the existing swipe code
6533 is faster than copy on write.
6534 Swings and roundabouts. */
862a34c6 6535 SvUPGRADE(sv, SVt_PV);
99491443 6536
ff68c719 6537 SvSCREAM_off(sv);
efd8b2ba
AE
6538
6539 if (append) {
6540 if (PerlIO_isutf8(fp)) {
6541 if (!SvUTF8(sv)) {
6542 sv_utf8_upgrade_nomg(sv);
6543 sv_pos_u2b(sv,&append,0);
6544 }
6545 } else if (SvUTF8(sv)) {
1b6737cc 6546 SV * const tsv = NEWSV(0,0);
efd8b2ba
AE
6547 sv_gets(tsv, fp, 0);
6548 sv_utf8_upgrade_nomg(tsv);
6549 SvCUR_set(sv,append);
6550 sv_catsv(sv,tsv);
6551 sv_free(tsv);
6552 goto return_string_or_null;
6553 }
6554 }
6555
6556 SvPOK_only(sv);
6557 if (PerlIO_isutf8(fp))
6558 SvUTF8_on(sv);
c07a80fd 6559
923e4eb5 6560 if (IN_PERL_COMPILETIME) {
8bfdd7d9
HS
6561 /* we always read code in line mode */
6562 rsptr = "\n";
6563 rslen = 1;
6564 }
6565 else if (RsSNARF(PL_rs)) {
7a5fa8a2
NIS
6566 /* If it is a regular disk file use size from stat() as estimate
6567 of amount we are going to read - may result in malloc-ing
6568 more memory than we realy need if layers bellow reduce
e468d35b
NIS
6569 size we read (e.g. CRLF or a gzip layer)
6570 */
e311fd51 6571 Stat_t st;
e468d35b 6572 if (!PerlLIO_fstat(PerlIO_fileno(fp), &st) && S_ISREG(st.st_mode)) {
f54cb97a 6573 const Off_t offset = PerlIO_tell(fp);
58f1856e 6574 if (offset != (Off_t) -1 && st.st_size + append > offset) {
e468d35b
NIS
6575 (void) SvGROW(sv, (STRLEN)((st.st_size - offset) + append + 1));
6576 }
6577 }
c07a80fd 6578 rsptr = NULL;
6579 rslen = 0;
6580 }
3280af22 6581 else if (RsRECORD(PL_rs)) {
e311fd51 6582 I32 bytesread;
5b2b9c68
HM
6583 char *buffer;
6584
6585 /* Grab the size of the record we're getting */
3280af22 6586 recsize = SvIV(SvRV(PL_rs));
e311fd51 6587 buffer = SvGROW(sv, (STRLEN)(recsize + append + 1)) + append;
5b2b9c68
HM
6588 /* Go yank in */
6589#ifdef VMS
6590 /* VMS wants read instead of fread, because fread doesn't respect */
6591 /* RMS record boundaries. This is not necessarily a good thing to be */
e468d35b
NIS
6592 /* doing, but we've got no other real choice - except avoid stdio
6593 as implementation - perhaps write a :vms layer ?
6594 */
5b2b9c68
HM
6595 bytesread = PerlLIO_read(PerlIO_fileno(fp), buffer, recsize);
6596#else
6597 bytesread = PerlIO_read(fp, buffer, recsize);
6598#endif
27e6ca2d
AE
6599 if (bytesread < 0)
6600 bytesread = 0;
e311fd51 6601 SvCUR_set(sv, bytesread += append);
e670df4e 6602 buffer[bytesread] = '\0';
efd8b2ba 6603 goto return_string_or_null;
5b2b9c68 6604 }
3280af22 6605 else if (RsPARA(PL_rs)) {
c07a80fd 6606 rsptr = "\n\n";
6607 rslen = 2;
8bfdd7d9 6608 rspara = 1;
c07a80fd 6609 }
7d59b7e4
NIS
6610 else {
6611 /* Get $/ i.e. PL_rs into same encoding as stream wants */
6612 if (PerlIO_isutf8(fp)) {
6613 rsptr = SvPVutf8(PL_rs, rslen);
6614 }
6615 else {
6616 if (SvUTF8(PL_rs)) {
6617 if (!sv_utf8_downgrade(PL_rs, TRUE)) {
6618 Perl_croak(aTHX_ "Wide character in $/");
6619 }
6620 }
93524f2b 6621 rsptr = SvPV_const(PL_rs, rslen);
7d59b7e4
NIS
6622 }
6623 }
6624
c07a80fd 6625 rslast = rslen ? rsptr[rslen - 1] : '\0';
6626
8bfdd7d9 6627 if (rspara) { /* have to do this both before and after */
79072805 6628 do { /* to make sure file boundaries work right */
760ac839 6629 if (PerlIO_eof(fp))
a0d0e21e 6630 return 0;
760ac839 6631 i = PerlIO_getc(fp);
79072805 6632 if (i != '\n') {
a0d0e21e
LW
6633 if (i == -1)
6634 return 0;
760ac839 6635 PerlIO_ungetc(fp,i);
79072805
LW
6636 break;
6637 }
6638 } while (i != EOF);
6639 }
c07a80fd 6640
760ac839
LW
6641 /* See if we know enough about I/O mechanism to cheat it ! */
6642
6643 /* This used to be #ifdef test - it is made run-time test for ease
1c846c1f 6644 of abstracting out stdio interface. One call should be cheap
760ac839
LW
6645 enough here - and may even be a macro allowing compile
6646 time optimization.
6647 */
6648
6649 if (PerlIO_fast_gets(fp)) {
6650
6651 /*
6652 * We're going to steal some values from the stdio struct
6653 * and put EVERYTHING in the innermost loop into registers.
6654 */
6655 register STDCHAR *ptr;
6656 STRLEN bpx;
6657 I32 shortbuffered;
6658
16660edb 6659#if defined(VMS) && defined(PERLIO_IS_STDIO)
6660 /* An ungetc()d char is handled separately from the regular
6661 * buffer, so we getc() it back out and stuff it in the buffer.
6662 */
6663 i = PerlIO_getc(fp);
6664 if (i == EOF) return 0;
6665 *(--((*fp)->_ptr)) = (unsigned char) i;
6666 (*fp)->_cnt++;
6667#endif
c07a80fd 6668
c2960299 6669 /* Here is some breathtakingly efficient cheating */
c07a80fd 6670
a20bf0c3 6671 cnt = PerlIO_get_cnt(fp); /* get count into register */
e468d35b 6672 /* make sure we have the room */
7a5fa8a2 6673 if ((I32)(SvLEN(sv) - append) <= cnt + 1) {
e468d35b 6674 /* Not room for all of it
7a5fa8a2 6675 if we are looking for a separator and room for some
e468d35b
NIS
6676 */
6677 if (rslen && cnt > 80 && (I32)SvLEN(sv) > append) {
7a5fa8a2 6678 /* just process what we have room for */
79072805
LW
6679 shortbuffered = cnt - SvLEN(sv) + append + 1;
6680 cnt -= shortbuffered;
6681 }
6682 else {
6683 shortbuffered = 0;
bbce6d69 6684 /* remember that cnt can be negative */
eb160463 6685 SvGROW(sv, (STRLEN)(append + (cnt <= 0 ? 2 : (cnt + 1))));
79072805
LW
6686 }
6687 }
7a5fa8a2 6688 else
79072805 6689 shortbuffered = 0;
3f7c398e 6690 bp = (STDCHAR*)SvPVX_const(sv) + append; /* move these two too to registers */
a20bf0c3 6691 ptr = (STDCHAR*)PerlIO_get_ptr(fp);
16660edb 6692 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6693 "Screamer: entering, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
16660edb 6694 DEBUG_P(PerlIO_printf(Perl_debug_log,
ba7abf9d 6695 "Screamer: entering: PerlIO * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6696 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6697 PTR2UV(PerlIO_has_base(fp) ? PerlIO_get_base(fp) : 0)));
79072805
LW
6698 for (;;) {
6699 screamer:
93a17b20 6700 if (cnt > 0) {
c07a80fd 6701 if (rslen) {
760ac839
LW
6702 while (cnt > 0) { /* this | eat */
6703 cnt--;
c07a80fd 6704 if ((*bp++ = *ptr++) == rslast) /* really | dust */
6705 goto thats_all_folks; /* screams | sed :-) */
6706 }
6707 }
6708 else {
1c846c1f
NIS
6709 Copy(ptr, bp, cnt, char); /* this | eat */
6710 bp += cnt; /* screams | dust */
c07a80fd 6711 ptr += cnt; /* louder | sed :-) */
a5f75d66 6712 cnt = 0;
93a17b20 6713 }
79072805
LW
6714 }
6715
748a9306 6716 if (shortbuffered) { /* oh well, must extend */
79072805
LW
6717 cnt = shortbuffered;
6718 shortbuffered = 0;
3f7c398e 6719 bpx = bp - (STDCHAR*)SvPVX_const(sv); /* box up before relocation */
79072805
LW
6720 SvCUR_set(sv, bpx);
6721 SvGROW(sv, SvLEN(sv) + append + cnt + 2);
3f7c398e 6722 bp = (STDCHAR*)SvPVX_const(sv) + bpx; /* unbox after relocation */
79072805
LW
6723 continue;
6724 }
6725
16660edb 6726 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841
GS
6727 "Screamer: going to getc, ptr=%"UVuf", cnt=%ld\n",
6728 PTR2UV(ptr),(long)cnt));
cc00df79 6729 PerlIO_set_ptrcnt(fp, (STDCHAR*)ptr, cnt); /* deregisterize cnt and ptr */
ba7abf9d 6730#if 0
16660edb 6731 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6732 "Screamer: pre: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6733 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6734 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
ba7abf9d 6735#endif
1c846c1f 6736 /* This used to call 'filbuf' in stdio form, but as that behaves like
774d564b 6737 getc when cnt <= 0 we use PerlIO_getc here to avoid introducing
6738 another abstraction. */
760ac839 6739 i = PerlIO_getc(fp); /* get more characters */
ba7abf9d 6740#if 0
16660edb 6741 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6742 "Screamer: post: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6743 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6744 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
ba7abf9d 6745#endif
a20bf0c3
JH
6746 cnt = PerlIO_get_cnt(fp);
6747 ptr = (STDCHAR*)PerlIO_get_ptr(fp); /* reregisterize cnt and ptr */
16660edb 6748 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6749 "Screamer: after getc, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
79072805 6750
748a9306
LW
6751 if (i == EOF) /* all done for ever? */
6752 goto thats_really_all_folks;
6753
3f7c398e 6754 bpx = bp - (STDCHAR*)SvPVX_const(sv); /* box up before relocation */
79072805
LW
6755 SvCUR_set(sv, bpx);
6756 SvGROW(sv, bpx + cnt + 2);
3f7c398e 6757 bp = (STDCHAR*)SvPVX_const(sv) + bpx; /* unbox after relocation */
c07a80fd 6758
eb160463 6759 *bp++ = (STDCHAR)i; /* store character from PerlIO_getc */
79072805 6760
c07a80fd 6761 if (rslen && (STDCHAR)i == rslast) /* all done for now? */
79072805 6762 goto thats_all_folks;
79072805
LW
6763 }
6764
6765thats_all_folks:
3f7c398e 6766 if ((rslen > 1 && (STRLEN)(bp - (STDCHAR*)SvPVX_const(sv)) < rslen) ||
36477c24 6767 memNE((char*)bp - rslen, rsptr, rslen))
760ac839 6768 goto screamer; /* go back to the fray */
79072805
LW
6769thats_really_all_folks:
6770 if (shortbuffered)
6771 cnt += shortbuffered;
16660edb 6772 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6773 "Screamer: quitting, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
cc00df79 6774 PerlIO_set_ptrcnt(fp, (STDCHAR*)ptr, cnt); /* put these back or we're in trouble */
16660edb 6775 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6776 "Screamer: end: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6777 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6778 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
79072805 6779 *bp = '\0';
3f7c398e 6780 SvCUR_set(sv, bp - (STDCHAR*)SvPVX_const(sv)); /* set length */
16660edb 6781 DEBUG_P(PerlIO_printf(Perl_debug_log,
fb73857a 6782 "Screamer: done, len=%ld, string=|%.*s|\n",
3f7c398e 6783 (long)SvCUR(sv),(int)SvCUR(sv),SvPVX_const(sv)));
760ac839
LW
6784 }
6785 else
79072805 6786 {
6edd2cd5 6787 /*The big, slow, and stupid way. */
27da23d5 6788#ifdef USE_HEAP_INSTEAD_OF_STACK /* Even slower way. */
6edd2cd5 6789 STDCHAR *buf = 0;
a02a5408 6790 Newx(buf, 8192, STDCHAR);
6edd2cd5 6791 assert(buf);
4d2c4e07 6792#else
6edd2cd5 6793 STDCHAR buf[8192];
4d2c4e07 6794#endif
79072805 6795
760ac839 6796screamer2:
c07a80fd 6797 if (rslen) {
6867be6d 6798 const register STDCHAR *bpe = buf + sizeof(buf);
760ac839 6799 bp = buf;
eb160463 6800 while ((i = PerlIO_getc(fp)) != EOF && (*bp++ = (STDCHAR)i) != rslast && bp < bpe)
760ac839
LW
6801 ; /* keep reading */
6802 cnt = bp - buf;
c07a80fd 6803 }
6804 else {
760ac839 6805 cnt = PerlIO_read(fp,(char*)buf, sizeof(buf));
16660edb 6806 /* Accomodate broken VAXC compiler, which applies U8 cast to
6807 * both args of ?: operator, causing EOF to change into 255
6808 */
37be0adf 6809 if (cnt > 0)
cbe9e203
JH
6810 i = (U8)buf[cnt - 1];
6811 else
37be0adf 6812 i = EOF;
c07a80fd 6813 }
79072805 6814
cbe9e203
JH
6815 if (cnt < 0)
6816 cnt = 0; /* we do need to re-set the sv even when cnt <= 0 */
6817 if (append)
6818 sv_catpvn(sv, (char *) buf, cnt);
6819 else
6820 sv_setpvn(sv, (char *) buf, cnt);
c07a80fd 6821
6822 if (i != EOF && /* joy */
6823 (!rslen ||
6824 SvCUR(sv) < rslen ||
3f7c398e 6825 memNE(SvPVX_const(sv) + SvCUR(sv) - rslen, rsptr, rslen)))
79072805
LW
6826 {
6827 append = -1;
63e4d877
CS
6828 /*
6829 * If we're reading from a TTY and we get a short read,
6830 * indicating that the user hit his EOF character, we need
6831 * to notice it now, because if we try to read from the TTY
6832 * again, the EOF condition will disappear.
6833 *
6834 * The comparison of cnt to sizeof(buf) is an optimization
6835 * that prevents unnecessary calls to feof().
6836 *
6837 * - jik 9/25/96
6838 */
6839 if (!(cnt < sizeof(buf) && PerlIO_eof(fp)))
6840 goto screamer2;
79072805 6841 }
6edd2cd5 6842
27da23d5 6843#ifdef USE_HEAP_INSTEAD_OF_STACK
6edd2cd5
JH
6844 Safefree(buf);
6845#endif
79072805
LW
6846 }
6847
8bfdd7d9 6848 if (rspara) { /* have to do this both before and after */
c07a80fd 6849 while (i != EOF) { /* to make sure file boundaries work right */
760ac839 6850 i = PerlIO_getc(fp);
79072805 6851 if (i != '\n') {
760ac839 6852 PerlIO_ungetc(fp,i);
79072805
LW
6853 break;
6854 }
6855 }
6856 }
c07a80fd 6857
efd8b2ba 6858return_string_or_null:
c07a80fd 6859 return (SvCUR(sv) - append) ? SvPVX(sv) : Nullch;
79072805
LW
6860}
6861
954c1994
GS
6862/*
6863=for apidoc sv_inc
6864
645c22ef
DM
6865Auto-increment of the value in the SV, doing string to numeric conversion
6866if necessary. Handles 'get' magic.
954c1994
GS
6867
6868=cut
6869*/
6870
79072805 6871void
864dbfa3 6872Perl_sv_inc(pTHX_ register SV *sv)
79072805
LW
6873{
6874 register char *d;
463ee0b2 6875 int flags;
79072805
LW
6876
6877 if (!sv)
6878 return;
b23a5f78
GB
6879 if (SvGMAGICAL(sv))
6880 mg_get(sv);
ed6116ce 6881 if (SvTHINKFIRST(sv)) {
765f542d
NC
6882 if (SvIsCOW(sv))
6883 sv_force_normal_flags(sv, 0);
0f15f207 6884 if (SvREADONLY(sv)) {
923e4eb5 6885 if (IN_PERL_RUNTIME)
cea2e8a9 6886 Perl_croak(aTHX_ PL_no_modify);
0f15f207 6887 }
a0d0e21e 6888 if (SvROK(sv)) {
b5be31e9 6889 IV i;
9e7bc3e8
JD
6890 if (SvAMAGIC(sv) && AMG_CALLun(sv,inc))
6891 return;
56431972 6892 i = PTR2IV(SvRV(sv));
b5be31e9
SM
6893 sv_unref(sv);
6894 sv_setiv(sv, i);
a0d0e21e 6895 }
ed6116ce 6896 }
8990e307 6897 flags = SvFLAGS(sv);
28e5dec8
JH
6898 if ((flags & (SVp_NOK|SVp_IOK)) == SVp_NOK) {
6899 /* It's (privately or publicly) a float, but not tested as an
6900 integer, so test it to see. */
d460ef45 6901 (void) SvIV(sv);
28e5dec8
JH
6902 flags = SvFLAGS(sv);
6903 }
6904 if ((flags & SVf_IOK) || ((flags & (SVp_IOK | SVp_NOK)) == SVp_IOK)) {
6905 /* It's publicly an integer, or privately an integer-not-float */
59d8ce62 6906#ifdef PERL_PRESERVE_IVUV
28e5dec8 6907 oops_its_int:
59d8ce62 6908#endif
25da4f38
IZ
6909 if (SvIsUV(sv)) {
6910 if (SvUVX(sv) == UV_MAX)
a1e868e7 6911 sv_setnv(sv, UV_MAX_P1);
25da4f38
IZ
6912 else
6913 (void)SvIOK_only_UV(sv);
607fa7f2 6914 SvUV_set(sv, SvUVX(sv) + 1);
25da4f38
IZ
6915 } else {
6916 if (SvIVX(sv) == IV_MAX)
28e5dec8 6917 sv_setuv(sv, (UV)IV_MAX + 1);
25da4f38
IZ
6918 else {
6919 (void)SvIOK_only(sv);
45977657 6920 SvIV_set(sv, SvIVX(sv) + 1);
1c846c1f 6921 }
55497cff 6922 }
79072805
LW
6923 return;
6924 }
28e5dec8
JH
6925 if (flags & SVp_NOK) {
6926 (void)SvNOK_only(sv);
9d6ce603 6927 SvNV_set(sv, SvNVX(sv) + 1.0);
28e5dec8
JH
6928 return;
6929 }
6930
3f7c398e 6931 if (!(flags & SVp_POK) || !*SvPVX_const(sv)) {
28e5dec8 6932 if ((flags & SVTYPEMASK) < SVt_PVIV)
f5282e15 6933 sv_upgrade(sv, ((flags & SVTYPEMASK) > SVt_IV ? SVt_PVIV : SVt_IV));
28e5dec8 6934 (void)SvIOK_only(sv);
45977657 6935 SvIV_set(sv, 1);
79072805
LW
6936 return;
6937 }
463ee0b2 6938 d = SvPVX(sv);
79072805
LW
6939 while (isALPHA(*d)) d++;
6940 while (isDIGIT(*d)) d++;
6941 if (*d) {
28e5dec8 6942#ifdef PERL_PRESERVE_IVUV
d1be9408 6943 /* Got to punt this as an integer if needs be, but we don't issue
28e5dec8
JH
6944 warnings. Probably ought to make the sv_iv_please() that does
6945 the conversion if possible, and silently. */
504618e9 6946 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), NULL);
28e5dec8
JH
6947 if (numtype && !(numtype & IS_NUMBER_INFINITY)) {
6948 /* Need to try really hard to see if it's an integer.
6949 9.22337203685478e+18 is an integer.
6950 but "9.22337203685478e+18" + 0 is UV=9223372036854779904
6951 so $a="9.22337203685478e+18"; $a+0; $a++
6952 needs to be the same as $a="9.22337203685478e+18"; $a++
6953 or we go insane. */
d460ef45 6954
28e5dec8
JH
6955 (void) sv_2iv(sv);
6956 if (SvIOK(sv))
6957 goto oops_its_int;
6958
6959 /* sv_2iv *should* have made this an NV */
6960 if (flags & SVp_NOK) {
6961 (void)SvNOK_only(sv);
9d6ce603 6962 SvNV_set(sv, SvNVX(sv) + 1.0);
28e5dec8
JH
6963 return;
6964 }
6965 /* I don't think we can get here. Maybe I should assert this
6966 And if we do get here I suspect that sv_setnv will croak. NWC
6967 Fall through. */
6968#if defined(USE_LONG_DOUBLE)
6969 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_inc punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"PERL_PRIgldbl"\n",
3f7c398e 6970 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8 6971#else
1779d84d 6972 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_inc punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"NVgf"\n",
3f7c398e 6973 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8
JH
6974#endif
6975 }
6976#endif /* PERL_PRESERVE_IVUV */
3f7c398e 6977 sv_setnv(sv,Atof(SvPVX_const(sv)) + 1.0);
79072805
LW
6978 return;
6979 }
6980 d--;
3f7c398e 6981 while (d >= SvPVX_const(sv)) {
79072805
LW
6982 if (isDIGIT(*d)) {
6983 if (++*d <= '9')
6984 return;
6985 *(d--) = '0';
6986 }
6987 else {
9d116dd7
JH
6988#ifdef EBCDIC
6989 /* MKS: The original code here died if letters weren't consecutive.
6990 * at least it didn't have to worry about non-C locales. The
6991 * new code assumes that ('z'-'a')==('Z'-'A'), letters are
1c846c1f 6992 * arranged in order (although not consecutively) and that only
9d116dd7
JH
6993 * [A-Za-z] are accepted by isALPHA in the C locale.
6994 */
6995 if (*d != 'z' && *d != 'Z') {
6996 do { ++*d; } while (!isALPHA(*d));
6997 return;
6998 }
6999 *(d--) -= 'z' - 'a';
7000#else
79072805
LW
7001 ++*d;
7002 if (isALPHA(*d))
7003 return;
7004 *(d--) -= 'z' - 'a' + 1;
9d116dd7 7005#endif
79072805
LW
7006 }
7007 }
7008 /* oh,oh, the number grew */
7009 SvGROW(sv, SvCUR(sv) + 2);
b162af07 7010 SvCUR_set(sv, SvCUR(sv) + 1);
3f7c398e 7011 for (d = SvPVX(sv) + SvCUR(sv); d > SvPVX_const(sv); d--)
79072805
LW
7012 *d = d[-1];
7013 if (isDIGIT(d[1]))
7014 *d = '1';
7015 else
7016 *d = d[1];
7017}
7018
954c1994
GS
7019/*
7020=for apidoc sv_dec
7021
645c22ef
DM
7022Auto-decrement of the value in the SV, doing string to numeric conversion
7023if necessary. Handles 'get' magic.
954c1994
GS
7024
7025=cut
7026*/
7027
/*
 * Perl_sv_dec - implementation of auto-decrement on an SV.
 *
 * A NULL sv is ignored.  'get' magic is run first; THINKFIRST SVs are
 * normalised the same way as in sv_inc (COW unshared, read-only croaks
 * at run time, references go to overloaded "dec" or become the integer
 * value of the pointer).  The value is then decremented as an IV/UV,
 * as an NV, or -- for anything else with a string value -- by
 * converting the string to a number.
 */
79072805 7028void
864dbfa3 7029Perl_sv_dec(pTHX_ register SV *sv)
79072805 7030{
463ee0b2
LW
7031 int flags;
7032
79072805
LW
7033 if (!sv)
7034 return;
b23a5f78
GB
7035 if (SvGMAGICAL(sv))
7036 mg_get(sv);
ed6116ce 7037 if (SvTHINKFIRST(sv)) {
765f542d
NC
7038 if (SvIsCOW(sv))
7039 sv_force_normal_flags(sv, 0);
0f15f207 7040 if (SvREADONLY(sv)) {
923e4eb5 7041 if (IN_PERL_RUNTIME)
cea2e8a9 7042 Perl_croak(aTHX_ PL_no_modify);
0f15f207 7043 }
a0d0e21e 7044 if (SvROK(sv)) {
b5be31e9 7045 IV i;
9e7bc3e8
JD
/* Overloaded -- gets the first chance at a reference. */
7046 if (SvAMAGIC(sv) && AMG_CALLun(sv,dec))
7047 return;
56431972 7048 i = PTR2IV(SvRV(sv));
b5be31e9
SM
7049 sv_unref(sv);
7050 sv_setiv(sv, i);
a0d0e21e 7051 }
ed6116ce 7052 }
28e5dec8
JH
7053 /* Unlike sv_inc we don't have to worry about string-never-numbers
7054 and keeping them magic. But we mustn't warn on punting */
8990e307 7055 flags = SvFLAGS(sv);
28e5dec8
JH
7056 if ((flags & SVf_IOK) || ((flags & (SVp_IOK | SVp_NOK)) == SVp_IOK)) {
7057 /* It's publicly an integer, or privately an integer-not-float */
59d8ce62 7058#ifdef PERL_PRESERVE_IVUV
28e5dec8 7059 oops_its_int:
59d8ce62 7060#endif
25da4f38
IZ
7061 if (SvIsUV(sv)) {
/* An unsigned zero steps down to the signed value -1. */
7062 if (SvUVX(sv) == 0) {
7063 (void)SvIOK_only(sv);
45977657 7064 SvIV_set(sv, -1);
25da4f38
IZ
7065 }
7066 else {
7067 (void)SvIOK_only_UV(sv);
f4eee32f 7068 SvUV_set(sv, SvUVX(sv) - 1);
1c846c1f 7069 }
25da4f38
IZ
7070 } else {
/* Below IV_MIN the value no longer fits an IV, so it becomes an NV. */
7071 if (SvIVX(sv) == IV_MIN)
65202027 7072 sv_setnv(sv, (NV)IV_MIN - 1.0);
25da4f38
IZ
7073 else {
7074 (void)SvIOK_only(sv);
45977657 7075 SvIV_set(sv, SvIVX(sv) - 1);
1c846c1f 7076 }
55497cff 7077 }
7078 return;
7079 }
28e5dec8 7080 if (flags & SVp_NOK) {
9d6ce603 7081 SvNV_set(sv, SvNVX(sv) - 1.0);
28e5dec8
JH
7082 (void)SvNOK_only(sv);
7083 return;
7084 }
/* No string value either: the result is the integer -1. */
8990e307 7085 if (!(flags & SVp_POK)) {
ef088171
NC
7086 if ((flags & SVTYPEMASK) < SVt_PVIV)
7087 sv_upgrade(sv, ((flags & SVTYPEMASK) > SVt_IV) ? SVt_PVIV : SVt_IV);
7088 SvIV_set(sv, -1);
7089 (void)SvIOK_only(sv);
79072805
LW
7090 return;
7091 }
28e5dec8
JH
7092#ifdef PERL_PRESERVE_IVUV
7093 {
504618e9 7094 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), NULL);
28e5dec8
JH
7095 if (numtype && !(numtype & IS_NUMBER_INFINITY)) {
7096 /* Need to try really hard to see if it's an integer.
7097 9.22337203685478e+18 is an integer.
7098 but "9.22337203685478e+18" + 0 is UV=9223372036854779904
7099 so $a="9.22337203685478e+18"; $a+0; $a--
7100 needs to be the same as $a="9.22337203685478e+18"; $a--
7101 or we go insane. */
d460ef45 7102
28e5dec8
JH
7103 (void) sv_2iv(sv);
7104 if (SvIOK(sv))
7105 goto oops_its_int;
7106
7107 /* sv_2iv *should* have made this an NV */
/* NOTE(review): 'flags' was sampled before sv_2iv() and the SVp_NOK
   case has already returned above, so this test cannot be true as
   written; the sv_setnv() fallback at the end is what actually runs. */
7108 if (flags & SVp_NOK) {
7109 (void)SvNOK_only(sv);
9d6ce603 7110 SvNV_set(sv, SvNVX(sv) - 1.0);
28e5dec8
JH
7111 return;
7112 }
7113 /* I don't think we can get here. Maybe I should assert this
7114 And if we do get here I suspect that sv_setnv will croak. NWC
7115 Fall through. */
7116#if defined(USE_LONG_DOUBLE)
7117 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_dec punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"PERL_PRIgldbl"\n",
3f7c398e 7118 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8 7119#else
1779d84d 7120 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_dec punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"NVgf"\n",
3f7c398e 7121 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8
JH
7122#endif
7123 }
7124 }
7125#endif /* PERL_PRESERVE_IVUV */
3f7c398e 7126 sv_setnv(sv,Atof(SvPVX_const(sv)) - 1.0); /* punt */
79072805
LW
7127}
7128
954c1994
GS
7129/*
7130=for apidoc sv_mortalcopy
7131
645c22ef 7132Creates a new SV which is a copy of the original SV (using C<sv_setsv>).
d4236ebc
DM
7133The new SV is marked as mortal. It will be destroyed "soon", either by an
7134explicit call to FREETMPS, or by an implicit call at places such as
7135statement boundaries. See also C<sv_newmortal> and C<sv_2mortal>.
954c1994
GS
7136
7137=cut
7138*/
7139
79072805
LW
7140/* Make a string that will exist for the duration of the expression
7141 * evaluation. Actually, it may have to last longer than that, but
7142 * hopefully we won't free it until it has been assigned to a
7143 * permanent location. */
7144
7145SV *
864dbfa3 7146Perl_sv_mortalcopy(pTHX_ SV *oldstr)
79072805 7147{
463ee0b2 7148 register SV *sv;
b881518d 7149
4561caa4 7150 new_SV(sv);
79072805 7151 sv_setsv(sv,oldstr);
677b06e3
GS
7152 EXTEND_MORTAL(1);
7153 PL_tmps_stack[++PL_tmps_ix] = sv;
8990e307
LW
7154 SvTEMP_on(sv);
7155 return sv;
7156}
7157
954c1994
GS
7158/*
7159=for apidoc sv_newmortal
7160
645c22ef 7161Creates a new null SV which is mortal. The reference count of the SV is
d4236ebc
DM
7162set to 1. It will be destroyed "soon", either by an explicit call to
7163FREETMPS, or by an implicit call at places such as statement boundaries.
7164See also C<sv_mortalcopy> and C<sv_2mortal>.
954c1994
GS
7165
7166=cut
7167*/
7168
8990e307 7169SV *
864dbfa3 7170Perl_sv_newmortal(pTHX)
8990e307
LW
7171{
7172 register SV *sv;
7173
4561caa4 7174 new_SV(sv);
8990e307 7175 SvFLAGS(sv) = SVs_TEMP;
677b06e3
GS
7176 EXTEND_MORTAL(1);
7177 PL_tmps_stack[++PL_tmps_ix] = sv;
79072805
LW
7178 return sv;
7179}
7180
954c1994
GS
7181/*
7182=for apidoc sv_2mortal
7183
d4236ebc
DM
7184Marks an existing SV as mortal. The SV will be destroyed "soon", either
7185by an explicit call to FREETMPS, or by an implicit call at places such as
37d2ac18
NC
7186statement boundaries. SvTEMP() is turned on which means that the SV's
7187string buffer can be "stolen" if this SV is copied. See also C<sv_newmortal>
7188and C<sv_mortalcopy>.
954c1994
GS
7189
7190=cut
7191*/
7192
79072805 7193SV *
864dbfa3 7194Perl_sv_2mortal(pTHX_ register SV *sv)
79072805 7195{
27da23d5 7196 dVAR;
79072805
LW
7197 if (!sv)
7198 return sv;
d689ffdd 7199 if (SvREADONLY(sv) && SvIMMORTAL(sv))
11162842 7200 return sv;
677b06e3
GS
7201 EXTEND_MORTAL(1);
7202 PL_tmps_stack[++PL_tmps_ix] = sv;
8990e307 7203 SvTEMP_on(sv);
79072805
LW
7204 return sv;
7205}
7206
954c1994
GS
7207/*
7208=for apidoc newSVpv
7209
7210Creates a new SV and copies a string into it. The reference count for the
7211SV is set to 1. If C<len> is zero, Perl will compute the length using
7212strlen(). For efficiency, consider using C<newSVpvn> instead.
7213
7214=cut
7215*/
7216
79072805 7217SV *
864dbfa3 7218Perl_newSVpv(pTHX_ const char *s, STRLEN len)
79072805 7219{
463ee0b2 7220 register SV *sv;
79072805 7221
4561caa4 7222 new_SV(sv);
616d8c9c 7223 sv_setpvn(sv,s,len ? len : strlen(s));
79072805
LW
7224 return sv;
7225}
7226
954c1994
GS
7227/*
7228=for apidoc newSVpvn
7229
7230Creates a new SV and copies a string into it. The reference count for the
1c846c1f 7231SV is set to 1. Note that if C<len> is zero, Perl will create a zero length
954c1994 7232string. You are responsible for ensuring that the source string is at least
9e09f5f2 7233C<len> bytes long. If the C<s> argument is NULL the new SV will be undefined.
954c1994
GS
7234
7235=cut
7236*/
7237
9da1e3b5 7238SV *
864dbfa3 7239Perl_newSVpvn(pTHX_ const char *s, STRLEN len)
9da1e3b5
MUN
7240{
7241 register SV *sv;
7242
7243 new_SV(sv);
9da1e3b5
MUN
7244 sv_setpvn(sv,s,len);
7245 return sv;
7246}
7247
bd08039b
NC
7248
7249/*
926f8064 7250=for apidoc newSVhek
bd08039b
NC
7251
7252Creates a new SV from the hash key structure. It will generate scalars that
5aaec2b4
NC
7253point to the shared string table where possible. Returns a new (undefined)
7254SV if the hek is NULL.
bd08039b
NC
7255
7256=cut
7257*/
7258
7259SV *
c1b02ed8 7260Perl_newSVhek(pTHX_ const HEK *hek)
bd08039b 7261{
5aaec2b4
NC
7262 if (!hek) {
7263 SV *sv;
7264
7265 new_SV(sv);
7266 return sv;
7267 }
7268
bd08039b
NC
7269 if (HEK_LEN(hek) == HEf_SVKEY) {
7270 return newSVsv(*(SV**)HEK_KEY(hek));
7271 } else {
7272 const int flags = HEK_FLAGS(hek);
7273 if (flags & HVhek_WASUTF8) {
7274 /* Trouble :-)
7275 Andreas would like keys he put in as utf8 to come back as utf8
7276 */
7277 STRLEN utf8_len = HEK_LEN(hek);
b64e5050
AL
7278 const U8 *as_utf8 = bytes_to_utf8 ((U8*)HEK_KEY(hek), &utf8_len);
7279 SV * const sv = newSVpvn ((const char*)as_utf8, utf8_len);
bd08039b
NC
7280
7281 SvUTF8_on (sv);
7282 Safefree (as_utf8); /* bytes_to_utf8() allocates a new string */
7283 return sv;
7284 } else if (flags & HVhek_REHASH) {
7285 /* We don't have a pointer to the hv, so we have to replicate the
7286 flag into every HEK. This hv is using custom a hasing
7287 algorithm. Hence we can't return a shared string scalar, as
7288 that would contain the (wrong) hash value, and might get passed
7289 into an hv routine with a regular hash */
7290
b64e5050 7291 SV * const sv = newSVpvn (HEK_KEY(hek), HEK_LEN(hek));
bd08039b
NC
7292 if (HEK_UTF8(hek))
7293 SvUTF8_on (sv);
7294 return sv;
7295 }
7296 /* This will be overwhelminly the most common case. */
7297 return newSVpvn_share(HEK_KEY(hek),
7298 (HEK_UTF8(hek) ? -HEK_LEN(hek) : HEK_LEN(hek)),
7299 HEK_HASH(hek));
7300 }
7301}
7302
1c846c1f
NIS
7303/*
7304=for apidoc newSVpvn_share
7305
3f7c398e 7306Creates a new SV with its SvPVX_const pointing to a shared string in the string
645c22ef
DM
7307table. If the string does not already exist in the table, it is created
7308first. Turns on READONLY and FAKE. The string's hash is stored in the UV
7309slot of the SV; if the C<hash> parameter is non-zero, that value is used;
7310otherwise the hash is computed. The idea here is that as the string table
3f7c398e 7311is used for shared hash keys these strings will have SvPVX_const == HeKEY and
645c22ef 7312hash lookup will avoid string compare.
1c846c1f
NIS
7313
7314=cut
7315*/
7316
7317SV *
c3654f1a 7318Perl_newSVpvn_share(pTHX_ const char *src, I32 len, U32 hash)
1c846c1f
NIS
7319{
7320 register SV *sv;
c3654f1a
IH
7321 bool is_utf8 = FALSE;
7322 if (len < 0) {
77caf834 7323 STRLEN tmplen = -len;
c3654f1a 7324 is_utf8 = TRUE;
75a54232 7325 /* See the note in hv.c:hv_fetch() --jhi */
e1ec3a88 7326 src = (char*)bytes_from_utf8((const U8*)src, &tmplen, &is_utf8);
75a54232
JH
7327 len = tmplen;
7328 }
1c846c1f 7329 if (!hash)
5afd6d42 7330 PERL_HASH(hash, src, len);
1c846c1f 7331 new_SV(sv);
bdd68bc3 7332 sv_upgrade(sv, SVt_PV);
f880fe2f 7333 SvPV_set(sv, sharepvn(src, is_utf8?-len:len, hash));
b162af07 7334 SvCUR_set(sv, len);
b162af07 7335 SvLEN_set(sv, 0);
1c846c1f
NIS
7336 SvREADONLY_on(sv);
7337 SvFAKE_on(sv);
7338 SvPOK_on(sv);
c3654f1a
IH
7339 if (is_utf8)
7340 SvUTF8_on(sv);
1c846c1f
NIS
7341 return sv;
7342}
7343
645c22ef 7344
cea2e8a9 7345#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
7346
7347/* pTHX_ magic can't cope with varargs, so this is a no-context
7348 * version of the main function, (which may itself be aliased to us).
7349 * Don't access this version directly.
7350 */
7351
46fc3d4c 7352SV *
cea2e8a9 7353Perl_newSVpvf_nocontext(const char* pat, ...)
46fc3d4c 7354{
cea2e8a9 7355 dTHX;
46fc3d4c 7356 register SV *sv;
7357 va_list args;
46fc3d4c 7358 va_start(args, pat);
c5be433b 7359 sv = vnewSVpvf(pat, &args);
46fc3d4c 7360 va_end(args);
7361 return sv;
7362}
cea2e8a9 7363#endif
46fc3d4c 7364
954c1994
GS
7365/*
7366=for apidoc newSVpvf
7367
645c22ef 7368Creates a new SV and initializes it with the string formatted like
954c1994
GS
7369C<sprintf>.
7370
7371=cut
7372*/
7373
cea2e8a9
GS
7374SV *
7375Perl_newSVpvf(pTHX_ const char* pat, ...)
7376{
7377 register SV *sv;
7378 va_list args;
cea2e8a9 7379 va_start(args, pat);
c5be433b 7380 sv = vnewSVpvf(pat, &args);
cea2e8a9
GS
7381 va_end(args);
7382 return sv;
7383}
46fc3d4c 7384
645c22ef
DM
7385/* backend for newSVpvf() and newSVpvf_nocontext() */
7386
79072805 7387SV *
c5be433b
GS
7388Perl_vnewSVpvf(pTHX_ const char* pat, va_list* args)
7389{
7390 register SV *sv;
7391 new_SV(sv);
7392 sv_vsetpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
7393 return sv;
7394}
7395
954c1994
GS
7396/*
7397=for apidoc newSVnv
7398
7399Creates a new SV and copies a floating point value into it.
7400The reference count for the SV is set to 1.
7401
7402=cut
7403*/
7404
c5be433b 7405SV *
65202027 7406Perl_newSVnv(pTHX_ NV n)
79072805 7407{
463ee0b2 7408 register SV *sv;
79072805 7409
4561caa4 7410 new_SV(sv);
79072805
LW
7411 sv_setnv(sv,n);
7412 return sv;
7413}
7414
954c1994
GS
7415/*
7416=for apidoc newSViv
7417
7418Creates a new SV and copies an integer into it. The reference count for the
7419SV is set to 1.
7420
7421=cut
7422*/
7423
79072805 7424SV *
864dbfa3 7425Perl_newSViv(pTHX_ IV i)
79072805 7426{
463ee0b2 7427 register SV *sv;
79072805 7428
4561caa4 7429 new_SV(sv);
79072805
LW
7430 sv_setiv(sv,i);
7431 return sv;
7432}
7433
954c1994 7434/*
1a3327fb
JH
7435=for apidoc newSVuv
7436
7437Creates a new SV and copies an unsigned integer into it.
7438The reference count for the SV is set to 1.
7439
7440=cut
7441*/
7442
7443SV *
7444Perl_newSVuv(pTHX_ UV u)
7445{
7446 register SV *sv;
7447
7448 new_SV(sv);
7449 sv_setuv(sv,u);
7450 return sv;
7451}
7452
7453/*
954c1994
GS
7454=for apidoc newRV_noinc
7455
7456Creates an RV wrapper for an SV. The reference count for the original
7457SV is B<not> incremented.
7458
7459=cut
7460*/
7461
2304df62 7462SV *
864dbfa3 7463Perl_newRV_noinc(pTHX_ SV *tmpRef)
2304df62
AD
7464{
7465 register SV *sv;
7466
4561caa4 7467 new_SV(sv);
2304df62 7468 sv_upgrade(sv, SVt_RV);
76e3520e 7469 SvTEMP_off(tmpRef);
b162af07 7470 SvRV_set(sv, tmpRef);
2304df62 7471 SvROK_on(sv);
2304df62
AD
7472 return sv;
7473}
7474
ff276b08 7475/* newRV_inc is the official function name to use now.
645c22ef
DM
7476 * newRV_inc is in fact #defined to newRV in sv.h
7477 */
7478
5f05dabc 7479SV *
864dbfa3 7480Perl_newRV(pTHX_ SV *tmpRef)
5f05dabc 7481{
5f6447b6 7482 return newRV_noinc(SvREFCNT_inc(tmpRef));
5f05dabc 7483}
5f05dabc 7484
954c1994
GS
7485/*
7486=for apidoc newSVsv
7487
7488Creates a new SV which is an exact duplicate of the original SV.
645c22ef 7489(Uses C<sv_setsv>).
954c1994
GS
7490
7491=cut
7492*/
7493
79072805 7494SV *
864dbfa3 7495Perl_newSVsv(pTHX_ register SV *old)
79072805 7496{
463ee0b2 7497 register SV *sv;
79072805
LW
7498
7499 if (!old)
7500 return Nullsv;
8990e307 7501 if (SvTYPE(old) == SVTYPEMASK) {
0453d815 7502 if (ckWARN_d(WARN_INTERNAL))
9014280d 7503 Perl_warner(aTHX_ packWARN(WARN_INTERNAL), "semi-panic: attempt to dup freed string");
79072805
LW
7504 return Nullsv;
7505 }
4561caa4 7506 new_SV(sv);
e90aabeb
NC
7507 /* SV_GMAGIC is the default for sv_setv()
7508 SV_NOSTEAL prevents TEMP buffers being, well, stolen, and saves games
7509 with SvTEMP_off and SvTEMP_on round a call to sv_setsv. */
7510 sv_setsv_flags(sv, old, SV_GMAGIC | SV_NOSTEAL);
463ee0b2 7511 return sv;
79072805
LW
7512}
7513
645c22ef
DM
7514/*
7515=for apidoc sv_reset
7516
7517Underlying implementation for the C<reset> Perl function.
7518Note that the perl-level function is vaguely deprecated.
7519
7520=cut
7521*/
7522
79072805 7523void
e1ec3a88 7524Perl_sv_reset(pTHX_ register const char *s, HV *stash)
79072805 7525{
27da23d5 7526 dVAR;
4802d5d7 7527 char todo[PERL_UCHAR_MAX+1];
79072805 7528
49d8d3a1
MB
7529 if (!stash)
7530 return;
7531
79072805 7532 if (!*s) { /* reset ?? searches */
8d2f4536
NC
7533 MAGIC *mg = mg_find((SV *)stash, PERL_MAGIC_symtab);
7534 if (mg) {
7535 PMOP *pm = (PMOP *) mg->mg_obj;
7536 while (pm) {
7537 pm->op_pmdynflags &= ~PMdf_USED;
7538 pm = pm->op_pmnext;
7539 }
79072805
LW
7540 }
7541 return;
7542 }
7543
7544 /* reset variables */
7545
7546 if (!HvARRAY(stash))
7547 return;
463ee0b2
LW
7548
7549 Zero(todo, 256, char);
79072805 7550 while (*s) {
b464bac0
AL
7551 I32 max;
7552 I32 i = (unsigned char)*s;
79072805
LW
7553 if (s[1] == '-') {
7554 s += 2;
7555 }
4802d5d7 7556 max = (unsigned char)*s++;
79072805 7557 for ( ; i <= max; i++) {
463ee0b2
LW
7558 todo[i] = 1;
7559 }
a0d0e21e 7560 for (i = 0; i <= (I32) HvMAX(stash); i++) {
b464bac0 7561 HE *entry;
79072805 7562 for (entry = HvARRAY(stash)[i];
9e35f4b3
GS
7563 entry;
7564 entry = HeNEXT(entry))
7565 {
b464bac0
AL
7566 register GV *gv;
7567 register SV *sv;
7568
1edc1566 7569 if (!todo[(U8)*HeKEY(entry)])
463ee0b2 7570 continue;
1edc1566 7571 gv = (GV*)HeVAL(entry);
79072805 7572 sv = GvSV(gv);
e203899d
NC
7573 if (sv) {
7574 if (SvTHINKFIRST(sv)) {
7575 if (!SvREADONLY(sv) && SvROK(sv))
7576 sv_unref(sv);
7577 /* XXX Is this continue a bug? Why should THINKFIRST
7578 exempt us from resetting arrays and hashes? */
7579 continue;
7580 }
7581 SvOK_off(sv);
7582 if (SvTYPE(sv) >= SVt_PV) {
7583 SvCUR_set(sv, 0);
7584 if (SvPVX_const(sv) != Nullch)
7585 *SvPVX(sv) = '\0';
7586 SvTAINT(sv);
7587 }
79072805
LW
7588 }
7589 if (GvAV(gv)) {
7590 av_clear(GvAV(gv));
7591 }
bfcb3514 7592 if (GvHV(gv) && !HvNAME_get(GvHV(gv))) {
463ee0b2 7593 hv_clear(GvHV(gv));
2f42fcb0 7594#ifndef PERL_MICRO
fa6a1c44 7595#ifdef USE_ENVIRON_ARRAY
4efc5df6
GS
7596 if (gv == PL_envgv
7597# ifdef USE_ITHREADS
7598 && PL_curinterp == aTHX
7599# endif
7600 )
7601 {
79072805 7602 environ[0] = Nullch;
4efc5df6 7603 }
a0d0e21e 7604#endif
2f42fcb0 7605#endif /* !PERL_MICRO */
79072805
LW
7606 }
7607 }
7608 }
7609 }
7610}
7611
645c22ef
DM
7612/*
7613=for apidoc sv_2io
7614
7615Using various gambits, try to get an IO from an SV: the IO slot if it's a
7616GV; or the recursive result if we're an RV; or the IO slot of the symbol
7617named after the PV if we're a string.
7618
7619=cut
7620*/
7621
46fc3d4c 7622IO*
864dbfa3 7623Perl_sv_2io(pTHX_ SV *sv)
46fc3d4c 7624{
7625 IO* io;
7626 GV* gv;
7627
7628 switch (SvTYPE(sv)) {
7629 case SVt_PVIO:
7630 io = (IO*)sv;
7631 break;
7632 case SVt_PVGV:
7633 gv = (GV*)sv;
7634 io = GvIO(gv);
7635 if (!io)
cea2e8a9 7636 Perl_croak(aTHX_ "Bad filehandle: %s", GvNAME(gv));
46fc3d4c 7637 break;
7638 default:
7639 if (!SvOK(sv))
cea2e8a9 7640 Perl_croak(aTHX_ PL_no_usym, "filehandle");
46fc3d4c 7641 if (SvROK(sv))
7642 return sv_2io(SvRV(sv));
7a5fd60d 7643 gv = gv_fetchsv(sv, FALSE, SVt_PVIO);
46fc3d4c 7644 if (gv)
7645 io = GvIO(gv);
7646 else
7647 io = 0;
7648 if (!io)
35c1215d 7649 Perl_croak(aTHX_ "Bad filehandle: %"SVf, sv);
46fc3d4c 7650 break;
7651 }
7652 return io;
7653}
7654
645c22ef
DM
7655/*
7656=for apidoc sv_2cv
7657
7658Using various gambits, try to get a CV from an SV; in addition, try if
7659possible to set C<*st> and C<*gvp> to the stash and GV associated with it.
7660
7661=cut
7662*/
7663
/*
 * Perl_sv_2cv - obtain a CV from an SV.
 *
 * sv   - a CV, a glob, a reference to either, or a value that
 *        gv_fetchsv() can resolve to a glob.  NULL yields Nullcv.
 * st   - out: stash of the CV or glob that was found.  Not written
 *        when sv is NULL, an array or a hash, or when no glob is found.
 * gvp  - out: the glob involved, or Nullgv.  Written on every return
 *        path visible in this function.
 * lref - passed to gv_fetchsv(); when non-zero and the glob has no CV,
 *        a sub is declared for it via newSUB() (see the XXX note below).
 *
 * Croaks with "Not a subroutine reference" for a reference to anything
 * other than a CV or glob.
 */
79072805 7664CV *
864dbfa3 7665Perl_sv_2cv(pTHX_ SV *sv, HV **st, GV **gvp, I32 lref)
79072805 7666{
27da23d5 7667 dVAR;
c04a4dfe
JH
7668 GV *gv = Nullgv;
7669 CV *cv = Nullcv;
79072805
LW
7670
7671 if (!sv)
93a17b20 7672 return *gvp = Nullgv, Nullcv;
79072805 7673 switch (SvTYPE(sv)) {
79072805
LW
7674 case SVt_PVCV:
7675 *st = CvSTASH(sv);
7676 *gvp = Nullgv;
7677 return (CV*)sv;
7678 case SVt_PVHV:
7679 case SVt_PVAV:
7680 *gvp = Nullgv;
7681 return Nullcv;
8990e307
LW
7682 case SVt_PVGV:
7683 gv = (GV*)sv;
a0d0e21e 7684 *gvp = gv;
8990e307
LW
7685 *st = GvESTASH(gv);
/* Jumps into the default case below, past the glob lookup. */
7686 goto fix_gv;
7687
79072805 7688 default:
a0d0e21e
LW
7689 if (SvGMAGICAL(sv))
7690 mg_get(sv);
7691 if (SvROK(sv)) {
f5284f61
IZ
7692 SV **sp = &sv; /* Used in tryAMAGICunDEREF macro. */
7693 tryAMAGICunDEREF(to_cv);
7694
62f274bf
GS
7695 sv = SvRV(sv);
7696 if (SvTYPE(sv) == SVt_PVCV) {
7697 cv = (CV*)sv;
7698 *gvp = Nullgv;
7699 *st = CvSTASH(cv);
7700 return cv;
7701 }
7702 else if(isGV(sv))
7703 gv = (GV*)sv;
7704 else
cea2e8a9 7705 Perl_croak(aTHX_ "Not a subroutine reference");
a0d0e21e 7706 }
62f274bf 7707 else if (isGV(sv))
79072805
LW
7708 gv = (GV*)sv;
7709 else
7a5fd60d 7710 gv = gv_fetchsv(sv, lref, SVt_PVCV);
79072805
LW
7711 *gvp = gv;
7712 if (!gv)
7713 return Nullcv;
7714 *st = GvESTASH(gv);
8990e307 7715 fix_gv:
8ebc5c01 7716 if (lref && !GvCVu(gv)) {
4633a7c4 7717 SV *tmpsv;
748a9306 7718 ENTER;
4633a7c4 7719 tmpsv = NEWSV(704,0);
16660edb 7720 gv_efullname3(tmpsv, gv, Nullch);
f6ec51f7
GS
7721 /* XXX this is probably not what they think they're getting.
7722 * It has the same effect as "sub name;", i.e. just a forward
7723 * declaration! */
774d564b 7724 newSUB(start_subparse(FALSE, 0),
4633a7c4
LW
7725 newSVOP(OP_CONST, 0, tmpsv),
7726 Nullop,
8990e307 7727 Nullop);
748a9306 7728 LEAVE;
8ebc5c01 7729 if (!GvCVu(gv))
35c1215d
NC
7730 Perl_croak(aTHX_ "Unable to create sub named \"%"SVf"\"",
7731 sv);
8990e307 7732 }
8ebc5c01 7733 return GvCVu(gv);
79072805
LW
7734 }
7735}
7736
c461cf8f
JH
7737/*
7738=for apidoc sv_true
7739
7740Returns true if the SV has a true value by Perl's rules.
645c22ef
DM
7741Use the C<SvTRUE> macro instead, which may call C<sv_true()> or may
7742instead use an in-line version.
c461cf8f
JH
7743
7744=cut
7745*/
7746
79072805 7747I32
864dbfa3 7748Perl_sv_true(pTHX_ register SV *sv)
79072805 7749{
8990e307
LW
7750 if (!sv)
7751 return 0;
79072805 7752 if (SvPOK(sv)) {
e1ec3a88 7753 const register XPV* tXpv;
4e35701f 7754 if ((tXpv = (XPV*)SvANY(sv)) &&
c2f1de04 7755 (tXpv->xpv_cur > 1 ||
339049b0 7756 (tXpv->xpv_cur && *sv->sv_u.svu_pv != '0')))
79072805
LW
7757 return 1;
7758 else
7759 return 0;
7760 }
7761 else {
7762 if (SvIOK(sv))
463ee0b2 7763 return SvIVX(sv) != 0;
79072805
LW
7764 else {
7765 if (SvNOK(sv))
463ee0b2 7766 return SvNVX(sv) != 0.0;
79072805 7767 else
463ee0b2 7768 return sv_2bool(sv);
79072805
LW
7769 }
7770 }
7771}
79072805 7772
645c22ef
DM
7773/*
7774=for apidoc sv_iv
7775
7776A private implementation of the C<SvIVx> macro for compilers which can't
7777cope with complex macro expressions. Always use the macro instead.
7778
7779=cut
7780*/
7781
ff68c719 7782IV
864dbfa3 7783Perl_sv_iv(pTHX_ register SV *sv)
85e6fe83 7784{
25da4f38
IZ
7785 if (SvIOK(sv)) {
7786 if (SvIsUV(sv))
7787 return (IV)SvUVX(sv);
ff68c719 7788 return SvIVX(sv);
25da4f38 7789 }
ff68c719 7790 return sv_2iv(sv);
85e6fe83 7791}
85e6fe83 7792
645c22ef
DM
7793/*
7794=for apidoc sv_uv
7795
7796A private implementation of the C<SvUVx> macro for compilers which can't
7797cope with complex macro expressions. Always use the macro instead.
7798
7799=cut
7800*/
7801
ff68c719 7802UV
864dbfa3 7803Perl_sv_uv(pTHX_ register SV *sv)
ff68c719 7804{
25da4f38
IZ
7805 if (SvIOK(sv)) {
7806 if (SvIsUV(sv))
7807 return SvUVX(sv);
7808 return (UV)SvIVX(sv);
7809 }
ff68c719 7810 return sv_2uv(sv);
7811}
85e6fe83 7812
645c22ef
DM
7813/*
7814=for apidoc sv_nv
7815
7816A private implementation of the C<SvNVx> macro for compilers which can't
7817cope with complex macro expressions. Always use the macro instead.
7818
7819=cut
7820*/
7821
65202027 7822NV
864dbfa3 7823Perl_sv_nv(pTHX_ register SV *sv)
79072805 7824{
ff68c719 7825 if (SvNOK(sv))
7826 return SvNVX(sv);
7827 return sv_2nv(sv);
79072805 7828}
79072805 7829
09540bc3
JH
7830/* sv_pv() is now a macro using SvPV_nolen();
7831 * this function provided for binary compatibility only
7832 */
7833
7834char *
7835Perl_sv_pv(pTHX_ SV *sv)
7836{
09540bc3
JH
7837 if (SvPOK(sv))
7838 return SvPVX(sv);
7839
93524f2b 7840 return sv_2pv(sv, 0);
09540bc3
JH
7841}
7842
645c22ef
DM
7843/*
7844=for apidoc sv_pv
7845
baca2b92 7846Use the C<SvPV_nolen> macro instead
645c22ef 7847
645c22ef
DM
7848=for apidoc sv_pvn
7849
7850A private implementation of the C<SvPV> macro for compilers which can't
7851cope with complex macro expressions. Always use the macro instead.
7852
7853=cut
7854*/
7855
1fa8b10d 7856char *
864dbfa3 7857Perl_sv_pvn(pTHX_ SV *sv, STRLEN *lp)
79072805 7858{
85e6fe83
LW
7859 if (SvPOK(sv)) {
7860 *lp = SvCUR(sv);
a0d0e21e 7861 return SvPVX(sv);
85e6fe83 7862 }
463ee0b2 7863 return sv_2pv(sv, lp);
79072805 7864}
79072805 7865
6e9d1081
NC
7866
7867char *
7868Perl_sv_pvn_nomg(pTHX_ register SV *sv, STRLEN *lp)
7869{
7870 if (SvPOK(sv)) {
7871 *lp = SvCUR(sv);
7872 return SvPVX(sv);
7873 }
7874 return sv_2pv_flags(sv, lp, 0);
7875}
7876
09540bc3
JH
7877/* sv_pvn_force() is now a macro using Perl_sv_pvn_force_flags();
7878 * this function provided for binary compatibility only
7879 */
7880
7881char *
7882Perl_sv_pvn_force(pTHX_ SV *sv, STRLEN *lp)
7883{
7884 return sv_pvn_force_flags(sv, lp, SV_GMAGIC);
7885}
7886
c461cf8f
JH
7887/*
7888=for apidoc sv_pvn_force
7889
7890Get a sensible string out of the SV somehow.
645c22ef
DM
7891A private implementation of the C<SvPV_force> macro for compilers which
7892can't cope with complex macro expressions. Always use the macro instead.
c461cf8f 7893
8d6d96c1
HS
7894=for apidoc sv_pvn_force_flags
7895
7896Get a sensible string out of the SV somehow.
7897If C<flags> has C<SV_GMAGIC> bit set, will C<mg_get> on C<sv> if
7898appropriate, else not. C<sv_pvn_force> and C<sv_pvn_force_nomg> are
7899implemented in terms of this function.
645c22ef
DM
7900You normally want to use the various wrapper macros instead: see
7901C<SvPV_force> and C<SvPV_force_nomg>
8d6d96c1
HS
7902
7903=cut
7904*/
7905
7906char *
7907Perl_sv_pvn_force_flags(pTHX_ SV *sv, STRLEN *lp, I32 flags)
7908{
a0d0e21e 7909
6fc92669 7910 if (SvTHINKFIRST(sv) && !SvROK(sv))
765f542d 7911 sv_force_normal_flags(sv, 0);
1c846c1f 7912
a0d0e21e 7913 if (SvPOK(sv)) {
13c5b33c
NC
7914 if (lp)
7915 *lp = SvCUR(sv);
a0d0e21e
LW
7916 }
7917 else {
a3b680e6 7918 char *s;
13c5b33c
NC
7919 STRLEN len;
7920
4d84ee25 7921 if (SvREADONLY(sv) && !(flags & SV_MUTABLE_RETURN)) {
b64e5050 7922 const char * const ref = sv_reftype(sv,0);
4d84ee25
NC
7923 if (PL_op)
7924 Perl_croak(aTHX_ "Can't coerce readonly %s to string in %s",
b64e5050 7925 ref, OP_NAME(PL_op));
4d84ee25 7926 else
b64e5050 7927 Perl_croak(aTHX_ "Can't coerce readonly %s to string", ref);
4d84ee25 7928 }
b64e5050 7929 if (SvTYPE(sv) > SVt_PVLV && SvTYPE(sv) != SVt_PVFM)
cea2e8a9 7930 Perl_croak(aTHX_ "Can't coerce %s to string in %s", sv_reftype(sv,0),
53e06cf0 7931 OP_NAME(PL_op));
b64e5050 7932 s = sv_2pv_flags(sv, &len, flags);
13c5b33c
NC
7933 if (lp)
7934 *lp = len;
7935
3f7c398e 7936 if (s != SvPVX_const(sv)) { /* Almost, but not quite, sv_setpvn() */
a0d0e21e
LW
7937 if (SvROK(sv))
7938 sv_unref(sv);
862a34c6 7939 SvUPGRADE(sv, SVt_PV); /* Never FALSE */
a0d0e21e 7940 SvGROW(sv, len + 1);
3f7c398e 7941 Move(s,SvPVX_const(sv),len,char);
a0d0e21e
LW
7942 SvCUR_set(sv, len);
7943 *SvEND(sv) = '\0';
7944 }
7945 if (!SvPOK(sv)) {
7946 SvPOK_on(sv); /* validate pointer */
7947 SvTAINT(sv);
1d7c1841 7948 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2pv(%s)\n",
3f7c398e 7949 PTR2UV(sv),SvPVX_const(sv)));
a0d0e21e
LW
7950 }
7951 }
4d84ee25 7952 return SvPVX_mutable(sv);
a0d0e21e
LW
7953}
7954
09540bc3
JH
7955/* sv_pvbyte () is now a macro using Perl_sv_2pv_flags();
7956 * this function provided for binary compatibility only
7957 */
7958
7959char *
7960Perl_sv_pvbyte(pTHX_ SV *sv)
7961{
7962 sv_utf8_downgrade(sv,0);
7963 return sv_pv(sv);
7964}
7965
645c22ef
DM
7966/*
7967=for apidoc sv_pvbyte
7968
baca2b92 7969Use C<SvPVbyte_nolen> instead.
645c22ef 7970
645c22ef
DM
7971=for apidoc sv_pvbyten
7972
7973A private implementation of the C<SvPVbyte> macro for compilers
7974which can't cope with complex macro expressions. Always use the macro
7975instead.
7976
7977=cut
7978*/
7979
7340a771
GS
7980char *
7981Perl_sv_pvbyten(pTHX_ SV *sv, STRLEN *lp)
7982{
ffebcc3e 7983 sv_utf8_downgrade(sv,0);
7340a771
GS
7984 return sv_pvn(sv,lp);
7985}
7986
645c22ef
DM
7987/*
7988=for apidoc sv_pvbyten_force
7989
7990A private implementation of the C<SvPVbytex_force> macro for compilers
7991which can't cope with complex macro expressions. Always use the macro
7992instead.
7993
7994=cut
7995*/
7996
7340a771
GS
7997char *
7998Perl_sv_pvbyten_force(pTHX_ SV *sv, STRLEN *lp)
7999{
46ec2f14 8000 sv_pvn_force(sv,lp);
ffebcc3e 8001 sv_utf8_downgrade(sv,0);
46ec2f14
TS
8002 *lp = SvCUR(sv);
8003 return SvPVX(sv);
7340a771
GS
8004}
8005
09540bc3
JH
8006/* sv_pvutf8 () is now a macro using Perl_sv_2pv_flags();
8007 * this function provided for binary compatibility only
8008 */
8009
8010char *
8011Perl_sv_pvutf8(pTHX_ SV *sv)
8012{
8013 sv_utf8_upgrade(sv);
8014 return sv_pv(sv);
8015}
8016
645c22ef
DM
8017/*
8018=for apidoc sv_pvutf8
8019
baca2b92 8020Use the C<SvPVutf8_nolen> macro instead
645c22ef 8021
645c22ef
DM
8022=for apidoc sv_pvutf8n
8023
8024A private implementation of the C<SvPVutf8> macro for compilers
8025which can't cope with complex macro expressions. Always use the macro
8026instead.
8027
8028=cut
8029*/
8030
7340a771
GS
8031char *
8032Perl_sv_pvutf8n(pTHX_ SV *sv, STRLEN *lp)
8033{
560a288e 8034 sv_utf8_upgrade(sv);
7340a771
GS
8035 return sv_pvn(sv,lp);
8036}
8037
c461cf8f
JH
8038/*
8039=for apidoc sv_pvutf8n_force
8040
645c22ef
DM
8041A private implementation of the C<SvPVutf8_force> macro for compilers
8042which can't cope with complex macro expressions. Always use the macro
8043instead.
c461cf8f
JH
8044
8045=cut
8046*/
8047
7340a771
GS
8048char *
8049Perl_sv_pvutf8n_force(pTHX_ SV *sv, STRLEN *lp)
8050{
46ec2f14 8051 sv_pvn_force(sv,lp);
560a288e 8052 sv_utf8_upgrade(sv);
46ec2f14
TS
8053 *lp = SvCUR(sv);
8054 return SvPVX(sv);
7340a771
GS
8055}
8056
c461cf8f
JH
8057/*
8058=for apidoc sv_reftype
8059
8060Returns a string describing what the SV is a reference to.
8061
8062=cut
8063*/
8064
1cb0ed9b 8065char *
bfed75c6 8066Perl_sv_reftype(pTHX_ const SV *sv, int ob)
a0d0e21e 8067{
07409e01
NC
8068 /* The fact that I don't need to downcast to char * everywhere, only in ?:
8069 inside return suggests a const propagation bug in g++. */
c86bf373 8070 if (ob && SvOBJECT(sv)) {
1b6737cc 8071 char * const name = HvNAME_get(SvSTASH(sv));
07409e01 8072 return name ? name : (char *) "__ANON__";
c86bf373 8073 }
a0d0e21e
LW
8074 else {
8075 switch (SvTYPE(sv)) {
8076 case SVt_NULL:
8077 case SVt_IV:
8078 case SVt_NV:
8079 case SVt_RV:
8080 case SVt_PV:
8081 case SVt_PVIV:
8082 case SVt_PVNV:
8083 case SVt_PVMG:
8084 case SVt_PVBM:
1cb0ed9b 8085 if (SvVOK(sv))
439cb1c4 8086 return "VSTRING";
a0d0e21e
LW
8087 if (SvROK(sv))
8088 return "REF";
8089 else
8090 return "SCALAR";
1cb0ed9b 8091
07409e01 8092 case SVt_PVLV: return (char *) (SvROK(sv) ? "REF"
be65207d
DM
8093 /* tied lvalues should appear to be
8094 * scalars for backwards compatitbility */
8095 : (LvTYPE(sv) == 't' || LvTYPE(sv) == 'T')
07409e01 8096 ? "SCALAR" : "LVALUE");
a0d0e21e
LW
8097 case SVt_PVAV: return "ARRAY";
8098 case SVt_PVHV: return "HASH";
8099 case SVt_PVCV: return "CODE";
8100 case SVt_PVGV: return "GLOB";
1d2dff63 8101 case SVt_PVFM: return "FORMAT";
27f9d8f3 8102 case SVt_PVIO: return "IO";
a0d0e21e
LW
8103 default: return "UNKNOWN";
8104 }
8105 }
8106}
8107
954c1994
GS
8108/*
8109=for apidoc sv_isobject
8110
8111Returns a boolean indicating whether the SV is an RV pointing to a blessed
8112object. If the SV is not an RV, or if the object is not blessed, then this
8113will return false.
8114
8115=cut
8116*/
8117
463ee0b2 8118int
864dbfa3 8119Perl_sv_isobject(pTHX_ SV *sv)
85e6fe83 8120{
68dc0745 8121 if (!sv)
8122 return 0;
8123 if (SvGMAGICAL(sv))
8124 mg_get(sv);
85e6fe83
LW
8125 if (!SvROK(sv))
8126 return 0;
8127 sv = (SV*)SvRV(sv);
8128 if (!SvOBJECT(sv))
8129 return 0;
8130 return 1;
8131}
8132
954c1994
GS
8133/*
8134=for apidoc sv_isa
8135
8136Returns a boolean indicating whether the SV is blessed into the specified
8137class. This does not check for subtypes; use C<sv_derived_from> to verify
8138an inheritance relationship.
8139
8140=cut
8141*/
8142
85e6fe83 8143int
864dbfa3 8144Perl_sv_isa(pTHX_ SV *sv, const char *name)
463ee0b2 8145{
bfcb3514 8146 const char *hvname;
68dc0745 8147 if (!sv)
8148 return 0;
8149 if (SvGMAGICAL(sv))
8150 mg_get(sv);
ed6116ce 8151 if (!SvROK(sv))
463ee0b2 8152 return 0;
ed6116ce
LW
8153 sv = (SV*)SvRV(sv);
8154 if (!SvOBJECT(sv))
463ee0b2 8155 return 0;
bfcb3514
NC
8156 hvname = HvNAME_get(SvSTASH(sv));
8157 if (!hvname)
e27ad1f2 8158 return 0;
463ee0b2 8159
bfcb3514 8160 return strEQ(hvname, name);
463ee0b2
LW
8161}
8162
954c1994
GS
8163/*
8164=for apidoc newSVrv
8165
8166Creates a new SV for the RV, C<rv>, to point to. If C<rv> is not an RV then
8167it will be upgraded to one. If C<classname> is non-null then the new SV will
8168be blessed in the specified package. The new SV is returned and its
8169reference count is 1.
8170
8171=cut
8172*/
8173
463ee0b2 8174SV*
864dbfa3 8175Perl_newSVrv(pTHX_ SV *rv, const char *classname)
463ee0b2 8176{
463ee0b2
LW
8177 SV *sv;
8178
4561caa4 8179 new_SV(sv);
51cf62d8 8180
765f542d 8181 SV_CHECK_THINKFIRST_COW_DROP(rv);
51cf62d8 8182 SvAMAGIC_off(rv);
51cf62d8 8183
0199fce9 8184 if (SvTYPE(rv) >= SVt_PVMG) {
a3b680e6 8185 const U32 refcnt = SvREFCNT(rv);
0199fce9
JD
8186 SvREFCNT(rv) = 0;
8187 sv_clear(rv);
8188 SvFLAGS(rv) = 0;
8189 SvREFCNT(rv) = refcnt;
8190 }
8191
51cf62d8 8192 if (SvTYPE(rv) < SVt_RV)
0199fce9
JD
8193 sv_upgrade(rv, SVt_RV);
8194 else if (SvTYPE(rv) > SVt_RV) {
8bd4d4c5 8195 SvPV_free(rv);
0199fce9
JD
8196 SvCUR_set(rv, 0);
8197 SvLEN_set(rv, 0);
8198 }
51cf62d8 8199
0c34ef67 8200 SvOK_off(rv);
b162af07 8201 SvRV_set(rv, sv);
ed6116ce 8202 SvROK_on(rv);
463ee0b2 8203
a0d0e21e 8204 if (classname) {
1b6737cc 8205 HV* const stash = gv_stashpv(classname, TRUE);
a0d0e21e
LW
8206 (void)sv_bless(rv, stash);
8207 }
8208 return sv;
8209}
8210
954c1994
GS
8211/*
8212=for apidoc sv_setref_pv
8213
8214Copies a pointer into a new SV, optionally blessing the SV. The C<rv>
8215argument will be upgraded to an RV. That RV will be modified to point to
8216the new SV. If the C<pv> argument is NULL then C<PL_sv_undef> will be placed
8217into the SV. The C<classname> argument indicates the package for the
8218blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8219will have a reference count of 1, and the RV will be returned.
954c1994
GS
8220
8221Do not use with other Perl types such as HV, AV, SV, CV, because those
8222objects will become corrupted by the pointer copy process.
8223
8224Note that C<sv_setref_pvn> copies the string while this copies the pointer.
8225
8226=cut
8227*/
8228
a0d0e21e 8229SV*
864dbfa3 8230Perl_sv_setref_pv(pTHX_ SV *rv, const char *classname, void *pv)
a0d0e21e 8231{
189b2af5 8232 if (!pv) {
3280af22 8233 sv_setsv(rv, &PL_sv_undef);
189b2af5
GS
8234 SvSETMAGIC(rv);
8235 }
a0d0e21e 8236 else
56431972 8237 sv_setiv(newSVrv(rv,classname), PTR2IV(pv));
a0d0e21e
LW
8238 return rv;
8239}
8240
954c1994
GS
8241/*
8242=for apidoc sv_setref_iv
8243
8244Copies an integer into a new SV, optionally blessing the SV. The C<rv>
8245argument will be upgraded to an RV. That RV will be modified to point to
8246the new SV. The C<classname> argument indicates the package for the
8247blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8248will have a reference count of 1, and the RV will be returned.
954c1994
GS
8249
8250=cut
8251*/
8252
a0d0e21e 8253SV*
864dbfa3 8254Perl_sv_setref_iv(pTHX_ SV *rv, const char *classname, IV iv)
a0d0e21e
LW
8255{
8256 sv_setiv(newSVrv(rv,classname), iv);
8257 return rv;
8258}
8259
954c1994 8260/*
e1c57cef
JH
8261=for apidoc sv_setref_uv
8262
8263Copies an unsigned integer into a new SV, optionally blessing the SV. The C<rv>
8264argument will be upgraded to an RV. That RV will be modified to point to
8265the new SV. The C<classname> argument indicates the package for the
8266blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8267will have a reference count of 1, and the RV will be returned.
e1c57cef
JH
8268
8269=cut
8270*/
8271
8272SV*
8273Perl_sv_setref_uv(pTHX_ SV *rv, const char *classname, UV uv)
8274{
8275 sv_setuv(newSVrv(rv,classname), uv);
8276 return rv;
8277}
8278
8279/*
954c1994
GS
8280=for apidoc sv_setref_nv
8281
8282Copies a double into a new SV, optionally blessing the SV. The C<rv>
8283argument will be upgraded to an RV. That RV will be modified to point to
8284the new SV. The C<classname> argument indicates the package for the
8285blessing. Set C<classname> to C<Nullch> to avoid the blessing. The new SV
d34c2299 8286will have a reference count of 1, and the RV will be returned.
954c1994
GS
8287
8288=cut
8289*/
8290
a0d0e21e 8291SV*
65202027 8292Perl_sv_setref_nv(pTHX_ SV *rv, const char *classname, NV nv)
a0d0e21e
LW
8293{
8294 sv_setnv(newSVrv(rv,classname), nv);
8295 return rv;
8296}
463ee0b2 8297
954c1994
GS
8298/*
8299=for apidoc sv_setref_pvn
8300
8301Copies a string into a new SV, optionally blessing the SV. The length of the
8302string must be specified with C<n>. The C<rv> argument will be upgraded to
8303an RV. That RV will be modified to point to the new SV. The C<classname>
8304argument indicates the package for the blessing. Set C<classname> to
7a5fa8a2 8305C<Nullch> to avoid the blessing. The new SV will have a reference count
d34c2299 8306of 1, and the RV will be returned.
954c1994
GS
8307
8308Note that C<sv_setref_pv> copies the pointer while this copies the string.
8309
8310=cut
8311*/
8312
a0d0e21e 8313SV*
1b6737cc 8314Perl_sv_setref_pvn(pTHX_ SV *rv, const char *classname, const char *pv, STRLEN n)
a0d0e21e
LW
8315{
8316 sv_setpvn(newSVrv(rv,classname), pv, n);
463ee0b2
LW
8317 return rv;
8318}
8319
954c1994
GS
8320/*
8321=for apidoc sv_bless
8322
8323Blesses an SV into a specified package. The SV must be an RV. The package
8324must be designated by its stash (see C<gv_stashpv()>). The reference count
8325of the SV is unaffected.
8326
8327=cut
8328*/
8329
a0d0e21e 8330SV*
864dbfa3 8331Perl_sv_bless(pTHX_ SV *sv, HV *stash)
a0d0e21e 8332{
76e3520e 8333 SV *tmpRef;
a0d0e21e 8334 if (!SvROK(sv))
cea2e8a9 8335 Perl_croak(aTHX_ "Can't bless non-reference value");
76e3520e
GS
8336 tmpRef = SvRV(sv);
8337 if (SvFLAGS(tmpRef) & (SVs_OBJECT|SVf_READONLY)) {
8338 if (SvREADONLY(tmpRef))
cea2e8a9 8339 Perl_croak(aTHX_ PL_no_modify);
76e3520e
GS
8340 if (SvOBJECT(tmpRef)) {
8341 if (SvTYPE(tmpRef) != SVt_PVIO)
3280af22 8342 --PL_sv_objcount;
76e3520e 8343 SvREFCNT_dec(SvSTASH(tmpRef));
2e3febc6 8344 }
a0d0e21e 8345 }
76e3520e
GS
8346 SvOBJECT_on(tmpRef);
8347 if (SvTYPE(tmpRef) != SVt_PVIO)
3280af22 8348 ++PL_sv_objcount;
862a34c6 8349 SvUPGRADE(tmpRef, SVt_PVMG);
b162af07 8350 SvSTASH_set(tmpRef, (HV*)SvREFCNT_inc(stash));
a0d0e21e 8351
2e3febc6
CS
8352 if (Gv_AMG(stash))
8353 SvAMAGIC_on(sv);
8354 else
8355 SvAMAGIC_off(sv);
a0d0e21e 8356
1edbfb88
AB
8357 if(SvSMAGICAL(tmpRef))
8358 if(mg_find(tmpRef, PERL_MAGIC_ext) || mg_find(tmpRef, PERL_MAGIC_uvar))
8359 mg_set(tmpRef);
8360
8361
ecdeb87c 8362
a0d0e21e
LW
8363 return sv;
8364}
8365
645c22ef 8366/* Downgrades a PVGV to a PVMG.
645c22ef
DM
8367 */
8368
76e3520e 8369STATIC void
cea2e8a9 8370S_sv_unglob(pTHX_ SV *sv)
a0d0e21e 8371{
850fabdf
GS
8372 void *xpvmg;
8373
a0d0e21e
LW
8374 assert(SvTYPE(sv) == SVt_PVGV);
8375 SvFAKE_off(sv);
8376 if (GvGP(sv))
1edc1566 8377 gp_free((GV*)sv);
e826b3c7 8378 if (GvSTASH(sv)) {
e15faf7d 8379 sv_del_backref((SV*)GvSTASH(sv), sv);
e826b3c7
GS
8380 GvSTASH(sv) = Nullhv;
8381 }
14befaf4 8382 sv_unmagic(sv, PERL_MAGIC_glob);
a0d0e21e 8383 Safefree(GvNAME(sv));
a5f75d66 8384 GvMULTI_off(sv);
850fabdf
GS
8385
8386 /* need to keep SvANY(sv) in the right arena */
8387 xpvmg = new_XPVMG();
8388 StructCopy(SvANY(sv), xpvmg, XPVMG);
8389 del_XPVGV(SvANY(sv));
8390 SvANY(sv) = xpvmg;
8391
a0d0e21e
LW
8392 SvFLAGS(sv) &= ~SVTYPEMASK;
8393 SvFLAGS(sv) |= SVt_PVMG;
8394}
8395
954c1994 8396/*
840a7b70 8397=for apidoc sv_unref_flags
954c1994
GS
8398
8399Unsets the RV status of the SV, and decrements the reference count of
8400whatever was being referenced by the RV. This can almost be thought of
840a7b70
IZ
8401as a reversal of C<newSVrv>. The C<flags> argument can contain
8402C<SV_IMMEDIATE_UNREF> to force the reference count to be decremented
8403(otherwise the decrementing is conditional on the reference count being
8404different from one or the reference being a readonly SV).
7889fe52 8405See C<SvROK_off>.
954c1994
GS
8406
8407=cut
8408*/
8409
ed6116ce 8410void
e15faf7d 8411Perl_sv_unref_flags(pTHX_ SV *ref, U32 flags)
ed6116ce 8412{
b64e5050 8413 SV* const target = SvRV(ref);
810b8aa5 8414
e15faf7d
NC
8415 if (SvWEAKREF(ref)) {
8416 sv_del_backref(target, ref);
8417 SvWEAKREF_off(ref);
8418 SvRV_set(ref, NULL);
810b8aa5
GS
8419 return;
8420 }
e15faf7d
NC
8421 SvRV_set(ref, NULL);
8422 SvROK_off(ref);
8423 /* You can't have a || SvREADONLY(target) here, as $a = $$a, where $a was
04ca4930 8424 assigned to as BEGIN {$a = \"Foo"} will fail. */
e15faf7d
NC
8425 if (SvREFCNT(target) != 1 || (flags & SV_IMMEDIATE_UNREF))
8426 SvREFCNT_dec(target);
840a7b70 8427 else /* XXX Hack, but hard to make $a=$a->[1] work otherwise */
e15faf7d 8428 sv_2mortal(target); /* Schedule for freeing later */
ed6116ce 8429}
8990e307 8430
840a7b70
IZ
8431/*
8432=for apidoc sv_unref
8433
8434Unsets the RV status of the SV, and decrements the reference count of
8435whatever was being referenced by the RV. This can almost be thought of
8436as a reversal of C<newSVrv>. This is C<sv_unref_flags> with the C<flags>
7889fe52 8437being zero. See C<SvROK_off>.
840a7b70
IZ
8438
8439=cut
8440*/
8441
8442void
8443Perl_sv_unref(pTHX_ SV *sv)
8444{
8445 sv_unref_flags(sv, 0);
8446}
8447
645c22ef
DM
8448/*
8449=for apidoc sv_taint
8450
8451Taint an SV. Use C<SvTAINTED_on> instead.
8452=cut
8453*/
8454
bbce6d69 8455void
864dbfa3 8456Perl_sv_taint(pTHX_ SV *sv)
bbce6d69 8457{
14befaf4 8458 sv_magic((sv), Nullsv, PERL_MAGIC_taint, Nullch, 0);
bbce6d69 8459}
8460
645c22ef
DM
8461/*
8462=for apidoc sv_untaint
8463
8464Untaint an SV. Use C<SvTAINTED_off> instead.
8465=cut
8466*/
8467
bbce6d69 8468void
864dbfa3 8469Perl_sv_untaint(pTHX_ SV *sv)
bbce6d69 8470{
13f57bf8 8471 if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
b64e5050 8472 MAGIC * const mg = mg_find(sv, PERL_MAGIC_taint);
36477c24 8473 if (mg)
565764a8 8474 mg->mg_len &= ~1;
36477c24 8475 }
bbce6d69 8476}
8477
645c22ef
DM
8478/*
8479=for apidoc sv_tainted
8480
8481Test an SV for taintedness. Use C<SvTAINTED> instead.
8482=cut
8483*/
8484
bbce6d69 8485bool
864dbfa3 8486Perl_sv_tainted(pTHX_ SV *sv)
bbce6d69 8487{
13f57bf8 8488 if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
a28509cc 8489 MAGIC * const mg = mg_find(sv, PERL_MAGIC_taint);
2ddb8a4f 8490 if (mg && (mg->mg_len & 1) )
36477c24 8491 return TRUE;
8492 }
8493 return FALSE;
bbce6d69 8494}
8495
09540bc3
JH
8496/*
8497=for apidoc sv_setpviv
8498
8499Copies an integer into the given SV, also updating its string value.
8500Does not handle 'set' magic. See C<sv_setpviv_mg>.
8501
8502=cut
8503*/
8504
8505void
8506Perl_sv_setpviv(pTHX_ SV *sv, IV iv)
8507{
8508 char buf[TYPE_CHARS(UV)];
8509 char *ebuf;
b64e5050 8510 char * const ptr = uiv_2buf(buf, iv, 0, 0, &ebuf);
09540bc3
JH
8511
8512 sv_setpvn(sv, ptr, ebuf - ptr);
8513}
8514
8515/*
8516=for apidoc sv_setpviv_mg
8517
8518Like C<sv_setpviv>, but also handles 'set' magic.
8519
8520=cut
8521*/
8522
8523void
8524Perl_sv_setpviv_mg(pTHX_ SV *sv, IV iv)
8525{
8526 char buf[TYPE_CHARS(UV)];
8527 char *ebuf;
b64e5050 8528 char * const ptr = uiv_2buf(buf, iv, 0, 0, &ebuf);
09540bc3
JH
8529
8530 sv_setpvn(sv, ptr, ebuf - ptr);
8531 SvSETMAGIC(sv);
8532}
8533
cea2e8a9 8534#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
8535
8536/* pTHX_ magic can't cope with varargs, so this is a no-context
8537 * version of the main function, (which may itself be aliased to us).
8538 * Don't access this version directly.
8539 */
8540
cea2e8a9
GS
8541void
8542Perl_sv_setpvf_nocontext(SV *sv, const char* pat, ...)
8543{
8544 dTHX;
8545 va_list args;
8546 va_start(args, pat);
c5be433b 8547 sv_vsetpvf(sv, pat, &args);
cea2e8a9
GS
8548 va_end(args);
8549}
8550
645c22ef
DM
8551/* pTHX_ magic can't cope with varargs, so this is a no-context
8552 * version of the main function, (which may itself be aliased to us).
8553 * Don't access this version directly.
8554 */
cea2e8a9
GS
8555
8556void
8557Perl_sv_setpvf_mg_nocontext(SV *sv, const char* pat, ...)
8558{
8559 dTHX;
8560 va_list args;
8561 va_start(args, pat);
c5be433b 8562 sv_vsetpvf_mg(sv, pat, &args);
cea2e8a9 8563 va_end(args);
cea2e8a9
GS
8564}
8565#endif
8566
954c1994
GS
8567/*
8568=for apidoc sv_setpvf
8569
bffc3d17
SH
8570Works like C<sv_catpvf> but copies the text into the SV instead of
8571appending it. Does not handle 'set' magic. See C<sv_setpvf_mg>.
954c1994
GS
8572
8573=cut
8574*/
8575
46fc3d4c 8576void
864dbfa3 8577Perl_sv_setpvf(pTHX_ SV *sv, const char* pat, ...)
46fc3d4c 8578{
8579 va_list args;
46fc3d4c 8580 va_start(args, pat);
c5be433b 8581 sv_vsetpvf(sv, pat, &args);
46fc3d4c 8582 va_end(args);
8583}
8584
bffc3d17
SH
8585/*
8586=for apidoc sv_vsetpvf
8587
8588Works like C<sv_vcatpvf> but copies the text into the SV instead of
8589appending it. Does not handle 'set' magic. See C<sv_vsetpvf_mg>.
8590
8591Usually used via its frontend C<sv_setpvf>.
8592
8593=cut
8594*/
645c22ef 8595
c5be433b
GS
8596void
8597Perl_sv_vsetpvf(pTHX_ SV *sv, const char* pat, va_list* args)
8598{
8599 sv_vsetpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
8600}
ef50df4b 8601
954c1994
GS
8602/*
8603=for apidoc sv_setpvf_mg
8604
8605Like C<sv_setpvf>, but also handles 'set' magic.
8606
8607=cut
8608*/
8609
ef50df4b 8610void
864dbfa3 8611Perl_sv_setpvf_mg(pTHX_ SV *sv, const char* pat, ...)
ef50df4b
GS
8612{
8613 va_list args;
ef50df4b 8614 va_start(args, pat);
c5be433b 8615 sv_vsetpvf_mg(sv, pat, &args);
ef50df4b 8616 va_end(args);
c5be433b
GS
8617}
8618
bffc3d17
SH
8619/*
8620=for apidoc sv_vsetpvf_mg
8621
8622Like C<sv_vsetpvf>, but also handles 'set' magic.
8623
8624Usually used via its frontend C<sv_setpvf_mg>.
8625
8626=cut
8627*/
645c22ef 8628
c5be433b
GS
8629void
8630Perl_sv_vsetpvf_mg(pTHX_ SV *sv, const char* pat, va_list* args)
8631{
8632 sv_vsetpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
ef50df4b
GS
8633 SvSETMAGIC(sv);
8634}
8635
cea2e8a9 8636#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
8637
8638/* pTHX_ magic can't cope with varargs, so this is a no-context
8639 * version of the main function, (which may itself be aliased to us).
8640 * Don't access this version directly.
8641 */
8642
cea2e8a9
GS
8643void
8644Perl_sv_catpvf_nocontext(SV *sv, const char* pat, ...)
8645{
8646 dTHX;
8647 va_list args;
8648 va_start(args, pat);
c5be433b 8649 sv_vcatpvf(sv, pat, &args);
cea2e8a9
GS
8650 va_end(args);
8651}
8652
645c22ef
DM
8653/* pTHX_ magic can't cope with varargs, so this is a no-context
8654 * version of the main function, (which may itself be aliased to us).
8655 * Don't access this version directly.
8656 */
8657
cea2e8a9
GS
8658void
8659Perl_sv_catpvf_mg_nocontext(SV *sv, const char* pat, ...)
8660{
8661 dTHX;
8662 va_list args;
8663 va_start(args, pat);
c5be433b 8664 sv_vcatpvf_mg(sv, pat, &args);
cea2e8a9 8665 va_end(args);
cea2e8a9
GS
8666}
8667#endif
8668
954c1994
GS
8669/*
8670=for apidoc sv_catpvf
8671
d5ce4a7c
GA
8672Processes its arguments like C<sprintf> and appends the formatted
8673output to an SV. If the appended data contains "wide" characters
8674(including, but not limited to, SVs with a UTF-8 PV formatted with %s,
8675and characters >255 formatted with %c), the original SV might get
bffc3d17 8676upgraded to UTF-8. Handles 'get' magic, but not 'set' magic. See
cdd94ca7
NC
8677C<sv_catpvf_mg>. If the original SV was UTF-8, the pattern should be
8678valid UTF-8; if the original SV was bytes, the pattern should be too.
954c1994 8679
d5ce4a7c 8680=cut */
954c1994 8681
46fc3d4c 8682void
864dbfa3 8683Perl_sv_catpvf(pTHX_ SV *sv, const char* pat, ...)
46fc3d4c 8684{
8685 va_list args;
46fc3d4c 8686 va_start(args, pat);
c5be433b 8687 sv_vcatpvf(sv, pat, &args);
46fc3d4c 8688 va_end(args);
8689}
8690
bffc3d17
SH
8691/*
8692=for apidoc sv_vcatpvf
8693
8694Processes its arguments like C<vsprintf> and appends the formatted output
8695to an SV. Does not handle 'set' magic. See C<sv_vcatpvf_mg>.
8696
8697Usually used via its frontend C<sv_catpvf>.
8698
8699=cut
8700*/
645c22ef 8701
ef50df4b 8702void
c5be433b
GS
8703Perl_sv_vcatpvf(pTHX_ SV *sv, const char* pat, va_list* args)
8704{
8705 sv_vcatpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
8706}
8707
954c1994
GS
8708/*
8709=for apidoc sv_catpvf_mg
8710
8711Like C<sv_catpvf>, but also handles 'set' magic.
8712
8713=cut
8714*/
8715
c5be433b 8716void
864dbfa3 8717Perl_sv_catpvf_mg(pTHX_ SV *sv, const char* pat, ...)
ef50df4b
GS
8718{
8719 va_list args;
ef50df4b 8720 va_start(args, pat);
c5be433b 8721 sv_vcatpvf_mg(sv, pat, &args);
ef50df4b 8722 va_end(args);
c5be433b
GS
8723}
8724
bffc3d17
SH
8725/*
8726=for apidoc sv_vcatpvf_mg
8727
8728Like C<sv_vcatpvf>, but also handles 'set' magic.
8729
8730Usually used via its frontend C<sv_catpvf_mg>.
8731
8732=cut
8733*/
645c22ef 8734
c5be433b
GS
8735void
8736Perl_sv_vcatpvf_mg(pTHX_ SV *sv, const char* pat, va_list* args)
8737{
8738 sv_vcatpvfn(sv, pat, strlen(pat), args, Null(SV**), 0, Null(bool*));
ef50df4b
GS
8739 SvSETMAGIC(sv);
8740}
8741
954c1994
GS
8742/*
8743=for apidoc sv_vsetpvfn
8744
bffc3d17 8745Works like C<sv_vcatpvfn> but copies the text into the SV instead of
954c1994
GS
8746appending it.
8747
bffc3d17 8748Usually used via one of its frontends C<sv_vsetpvf> and C<sv_vsetpvf_mg>.
645c22ef 8749
954c1994
GS
8750=cut
8751*/
8752
46fc3d4c 8753void
7d5ea4e7 8754Perl_sv_vsetpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV **svargs, I32 svmax, bool *maybe_tainted)
46fc3d4c 8755{
8756 sv_setpvn(sv, "", 0);
7d5ea4e7 8757 sv_vcatpvfn(sv, pat, patlen, args, svargs, svmax, maybe_tainted);
46fc3d4c 8758}
8759
645c22ef
DM
8760/* private function for use in sv_vcatpvfn via the EXPECT_NUMBER macro */
8761
2d00ba3b 8762STATIC I32
9dd79c3f 8763S_expect_number(pTHX_ char** pattern)
211dfcf1
HS
8764{
8765 I32 var = 0;
8766 switch (**pattern) {
8767 case '1': case '2': case '3':
8768 case '4': case '5': case '6':
8769 case '7': case '8': case '9':
8770 while (isDIGIT(**pattern))
8771 var = var * 10 + (*(*pattern)++ - '0');
8772 }
8773 return var;
8774}
9dd79c3f 8775#define EXPECT_NUMBER(pattern, var) (var = S_expect_number(aTHX_ &pattern))
211dfcf1 8776
4151a5fe
IZ
8777static char *
8778F0convert(NV nv, char *endbuf, STRLEN *len)
8779{
a3b680e6 8780 const int neg = nv < 0;
4151a5fe 8781 UV uv;
4151a5fe
IZ
8782
8783 if (neg)
8784 nv = -nv;
8785 if (nv < UV_MAX) {
b464bac0 8786 char *p = endbuf;
4151a5fe 8787 nv += 0.5;
028f8eaa 8788 uv = (UV)nv;
4151a5fe
IZ
8789 if (uv & 1 && uv == nv)
8790 uv--; /* Round to even */
8791 do {
a3b680e6 8792 const unsigned dig = uv % 10;
4151a5fe
IZ
8793 *--p = '0' + dig;
8794 } while (uv /= 10);
8795 if (neg)
8796 *--p = '-';
8797 *len = endbuf - p;
8798 return p;
8799 }
8800 return Nullch;
8801}
8802
8803
954c1994
GS
8804/*
8805=for apidoc sv_vcatpvfn
8806
8807Processes its arguments like C<vsprintf> and appends the formatted output
8808to an SV. Uses an array of SVs if the C style variable argument list is
8809missing (NULL). When running with taint checks enabled, indicates via
8810C<maybe_tainted> if results are untrustworthy (often due to the use of
8811locales).
8812
bffc3d17 8813Usually used via one of its frontends C<sv_vcatpvf> and C<sv_vcatpvf_mg>.
645c22ef 8814
954c1994
GS
8815=cut
8816*/
8817
1ef29b0e
RGS
8818/* XXX maybe_tainted is never assigned to, so the doc above is lying. */
8819
46fc3d4c 8820void
7d5ea4e7 8821Perl_sv_vcatpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV **svargs, I32 svmax, bool *maybe_tainted)
46fc3d4c 8822{
8823 char *p;
8824 char *q;
a3b680e6 8825 const char *patend;
fc36a67e 8826 STRLEN origlen;
46fc3d4c 8827 I32 svix = 0;
27da23d5 8828 static const char nullstr[] = "(null)";
9c5ffd7c 8829 SV *argsv = Nullsv;
b464bac0
AL
8830 bool has_utf8 = DO_UTF8(sv); /* has the result utf8? */
8831 const bool pat_utf8 = has_utf8; /* the pattern is in utf8? */
db79b45b 8832 SV *nsv = Nullsv;
4151a5fe
IZ
8833 /* Times 4: a decimal digit takes more than 3 binary digits.
8834 * NV_DIG: mantissa takes than many decimal digits.
8835 * Plus 32: Playing safe. */
8836 char ebuf[IV_DIG * 4 + NV_DIG + 32];
8837 /* large enough for "%#.#f" --chip */
8838 /* what about long double NVs? --jhi */
db79b45b 8839
53c1dcc0
AL
8840 PERL_UNUSED_ARG(maybe_tainted);
8841
46fc3d4c 8842 /* no matter what, this is a string now */
fc36a67e 8843 (void)SvPV_force(sv, origlen);
46fc3d4c 8844
0dbb1585 8845 /* special-case "", "%s", and "%-p" (SVf) */
46fc3d4c 8846 if (patlen == 0)
8847 return;
0dbb1585 8848 if (patlen == 2 && pat[0] == '%' && pat[1] == 's') {
c635e13b 8849 if (args) {
53c1dcc0 8850 const char * const s = va_arg(*args, char*);
c635e13b 8851 sv_catpv(sv, s ? s : nullstr);
8852 }
7e2040f0 8853 else if (svix < svmax) {
fc36a67e 8854 sv_catsv(sv, *svargs);
7e2040f0
GS
8855 if (DO_UTF8(*svargs))
8856 SvUTF8_on(sv);
8857 }
fc36a67e 8858 return;
0dbb1585
AL
8859 }
8860 if (patlen == 3 && pat[0] == '%' &&
8861 pat[1] == '-' && pat[2] == 'p') {
fc36a67e 8862 if (args) {
7e2040f0
GS
8863 argsv = va_arg(*args, SV*);
8864 sv_catsv(sv, argsv);
8865 if (DO_UTF8(argsv))
8866 SvUTF8_on(sv);
fc36a67e 8867 return;
8868 }
46fc3d4c 8869 }
8870
1d917b39 8871#ifndef USE_LONG_DOUBLE
4151a5fe 8872 /* special-case "%.<number>[gf]" */
7af36d83 8873 if ( !args && patlen <= 5 && pat[0] == '%' && pat[1] == '.'
4151a5fe
IZ
8874 && (pat[patlen-1] == 'g' || pat[patlen-1] == 'f') ) {
8875 unsigned digits = 0;
8876 const char *pp;
8877
8878 pp = pat + 2;
8879 while (*pp >= '0' && *pp <= '9')
8880 digits = 10 * digits + (*pp++ - '0');
028f8eaa 8881 if (pp - pat == (int)patlen - 1) {
4151a5fe
IZ
8882 NV nv;
8883
7af36d83 8884 if (svix < svmax)
4151a5fe
IZ
8885 nv = SvNV(*svargs);
8886 else
8887 return;
8888 if (*pp == 'g') {
2873255c
NC
8889 /* Add check for digits != 0 because it seems that some
8890 gconverts are buggy in this case, and we don't yet have
8891 a Configure test for this. */
8892 if (digits && digits < sizeof(ebuf) - NV_DIG - 10) {
8893 /* 0, point, slack */
2e59c212 8894 Gconvert(nv, (int)digits, 0, ebuf);
4151a5fe
IZ
8895 sv_catpv(sv, ebuf);
8896 if (*ebuf) /* May return an empty string for digits==0 */
8897 return;
8898 }
8899 } else if (!digits) {
8900 STRLEN l;
8901
8902 if ((p = F0convert(nv, ebuf + sizeof ebuf, &l))) {
8903 sv_catpvn(sv, p, l);
8904 return;
8905 }
8906 }
8907 }
8908 }
1d917b39 8909#endif /* !USE_LONG_DOUBLE */
4151a5fe 8910
2cf2cfc6 8911 if (!args && svix < svmax && DO_UTF8(*svargs))
205f51d8 8912 has_utf8 = TRUE;
2cf2cfc6 8913
46fc3d4c 8914 patend = (char*)pat + patlen;
8915 for (p = (char*)pat; p < patend; p = q) {
8916 bool alt = FALSE;
8917 bool left = FALSE;
b22c7a20 8918 bool vectorize = FALSE;
211dfcf1 8919 bool vectorarg = FALSE;
2cf2cfc6 8920 bool vec_utf8 = FALSE;
46fc3d4c 8921 char fill = ' ';
8922 char plus = 0;
8923 char intsize = 0;
8924 STRLEN width = 0;
fc36a67e 8925 STRLEN zeros = 0;
46fc3d4c 8926 bool has_precis = FALSE;
8927 STRLEN precis = 0;
58e33a90 8928 I32 osvix = svix;
2cf2cfc6 8929 bool is_utf8 = FALSE; /* is this item utf8? */
20f6aaab
AS
8930#ifdef HAS_LDBL_SPRINTF_BUG
8931 /* This is to try to fix a bug with irix/nonstop-ux/powerux and
205f51d8 8932 with sfio - Allen <allens@cpan.org> */
20f6aaab
AS
8933 bool fix_ldbl_sprintf_bug = FALSE;
8934#endif
205f51d8 8935
46fc3d4c 8936 char esignbuf[4];
89ebb4a3 8937 U8 utf8buf[UTF8_MAXBYTES+1];
46fc3d4c 8938 STRLEN esignlen = 0;
8939
4d84ee25 8940 const char *eptr = Nullch;
fc36a67e 8941 STRLEN elen = 0;
81f715da 8942 SV *vecsv = Nullsv;
245d4a47 8943 const U8 *vecstr = Null(U8*);
b22c7a20 8944 STRLEN veclen = 0;
934abaf1 8945 char c = 0;
46fc3d4c 8946 int i;
9c5ffd7c 8947 unsigned base = 0;
8c8eb53c
RB
8948 IV iv = 0;
8949 UV uv = 0;
9e5b023a
JH
8950 /* we need a long double target in case HAS_LONG_DOUBLE but
8951 not USE_LONG_DOUBLE
8952 */
35fff930 8953#if defined(HAS_LONG_DOUBLE) && LONG_DOUBLESIZE > DOUBLESIZE
9e5b023a
JH
8954 long double nv;
8955#else
65202027 8956 NV nv;
9e5b023a 8957#endif
46fc3d4c 8958 STRLEN have;
8959 STRLEN need;
8960 STRLEN gap;
7af36d83 8961 const char *dotstr = ".";
b22c7a20 8962 STRLEN dotstrlen = 1;
211dfcf1 8963 I32 efix = 0; /* explicit format parameter index */
eb3fce90 8964 I32 ewix = 0; /* explicit width index */
211dfcf1
HS
8965 I32 epix = 0; /* explicit precision index */
8966 I32 evix = 0; /* explicit vector index */
eb3fce90 8967 bool asterisk = FALSE;
46fc3d4c 8968
211dfcf1 8969 /* echo everything up to the next format specification */
46fc3d4c 8970 for (q = p; q < patend && *q != '%'; ++q) ;
8971 if (q > p) {
db79b45b
JH
8972 if (has_utf8 && !pat_utf8)
8973 sv_catpvn_utf8_upgrade(sv, p, q - p, nsv);
8974 else
8975 sv_catpvn(sv, p, q - p);
46fc3d4c 8976 p = q;
8977 }
8978 if (q++ >= patend)
8979 break;
8980
211dfcf1
HS
8981/*
8982 We allow format specification elements in this order:
8983 \d+\$ explicit format parameter index
8984 [-+ 0#]+ flags
a472f209 8985 v|\*(\d+\$)?v vector with optional (optionally specified) arg
f3583277 8986 0 flag (as above): repeated to allow "v02"
211dfcf1
HS
8987 \d+|\*(\d+\$)? width using optional (optionally specified) arg
8988 \.(\d*|\*(\d+\$)?) precision using optional (optionally specified) arg
8989 [hlqLV] size
8990 [%bcdefginopsux_DFOUX] format (mandatory)
8991*/
8992 if (EXPECT_NUMBER(q, width)) {
8993 if (*q == '$') {
8994 ++q;
8995 efix = width;
8996 } else {
8997 goto gotwidth;
8998 }
8999 }
9000
fc36a67e 9001 /* FLAGS */
9002
46fc3d4c 9003 while (*q) {
9004 switch (*q) {
9005 case ' ':
9006 case '+':
9007 plus = *q++;
9008 continue;
9009
9010 case '-':
9011 left = TRUE;
9012 q++;
9013 continue;
9014
9015 case '0':
9016 fill = *q++;
9017 continue;
9018
9019 case '#':
9020 alt = TRUE;
9021 q++;
9022 continue;
9023
fc36a67e 9024 default:
9025 break;
9026 }
9027 break;
9028 }
46fc3d4c 9029
211dfcf1 9030 tryasterisk:
eb3fce90 9031 if (*q == '*') {
211dfcf1
HS
9032 q++;
9033 if (EXPECT_NUMBER(q, ewix))
9034 if (*q++ != '$')
9035 goto unknown;
eb3fce90 9036 asterisk = TRUE;
211dfcf1
HS
9037 }
9038 if (*q == 'v') {
eb3fce90 9039 q++;
211dfcf1
HS
9040 if (vectorize)
9041 goto unknown;
9cbac4c7 9042 if ((vectorarg = asterisk)) {
211dfcf1
HS
9043 evix = ewix;
9044 ewix = 0;
9045 asterisk = FALSE;
9046 }
9047 vectorize = TRUE;
9048 goto tryasterisk;
eb3fce90
JH
9049 }
9050
211dfcf1 9051 if (!asterisk)
7a5fa8a2 9052 if( *q == '0' )
f3583277 9053 fill = *q++;
211dfcf1
HS
9054 EXPECT_NUMBER(q, width);
9055
9056 if (vectorize) {
9057 if (vectorarg) {
9058 if (args)
9059 vecsv = va_arg(*args, SV*);
9060 else
9061 vecsv = (evix ? evix <= svmax : svix < svmax) ?
3a7a539e 9062 svargs[evix ? evix-1 : svix++] : &PL_sv_undef;
245d4a47 9063 dotstr = SvPV_const(vecsv, dotstrlen);
211dfcf1 9064 if (DO_UTF8(vecsv))
2cf2cfc6 9065 is_utf8 = TRUE;
211dfcf1
HS
9066 }
9067 if (args) {
9068 vecsv = va_arg(*args, SV*);
245d4a47 9069 vecstr = (U8*)SvPV_const(vecsv,veclen);
2cf2cfc6 9070 vec_utf8 = DO_UTF8(vecsv);
eb3fce90 9071 }
211dfcf1
HS
9072 else if (efix ? efix <= svmax : svix < svmax) {
9073 vecsv = svargs[efix ? efix-1 : svix++];
245d4a47 9074 vecstr = (U8*)SvPV_const(vecsv,veclen);
2cf2cfc6 9075 vec_utf8 = DO_UTF8(vecsv);
d7aa5382 9076 /* if this is a version object, we need to return the
3f7c398e 9077 * stringified representation (which the SvPVX_const has
d7aa5382
JP
9078 * already done for us), but not vectorize the args
9079 */
9080 if ( *q == 'd' && sv_derived_from(vecsv,"version") )
9081 {
9082 q++; /* skip past the rest of the %vd format */
245d4a47 9083 eptr = (const char *) vecstr;
d7aa5382
JP
9084 elen = strlen(eptr);
9085 vectorize=FALSE;
9086 goto string;
9087 }
211dfcf1
HS
9088 }
9089 else {
9090 vecstr = (U8*)"";
9091 veclen = 0;
9092 }
eb3fce90 9093 }
fc36a67e 9094
eb3fce90 9095 if (asterisk) {
fc36a67e 9096 if (args)
9097 i = va_arg(*args, int);
9098 else
eb3fce90
JH
9099 i = (ewix ? ewix <= svmax : svix < svmax) ?
9100 SvIVx(svargs[ewix ? ewix-1 : svix++]) : 0;
fc36a67e 9101 left |= (i < 0);
9102 width = (i < 0) ? -i : i;
fc36a67e 9103 }
211dfcf1 9104 gotwidth:
fc36a67e 9105
9106 /* PRECISION */
46fc3d4c 9107
fc36a67e 9108 if (*q == '.') {
9109 q++;
9110 if (*q == '*') {
211dfcf1 9111 q++;
7b8dd722
HS
9112 if (EXPECT_NUMBER(q, epix) && *q++ != '$')
9113 goto unknown;
9114 /* XXX: todo, support specified precision parameter */
9115 if (epix)
211dfcf1 9116 goto unknown;
46fc3d4c 9117 if (args)
9118 i = va_arg(*args, int);
9119 else
eb3fce90
JH
9120 i = (ewix ? ewix <= svmax : svix < svmax)
9121 ? SvIVx(svargs[ewix ? ewix-1 : svix++]) : 0;
fc36a67e 9122 precis = (i < 0) ? 0 : i;
fc36a67e 9123 }
9124 else {
9125 precis = 0;
9126 while (isDIGIT(*q))
9127 precis = precis * 10 + (*q++ - '0');
9128 }
9129 has_precis = TRUE;
9130 }
46fc3d4c 9131
fc36a67e 9132 /* SIZE */
46fc3d4c 9133
fc36a67e 9134 switch (*q) {
c623ac67
GS
9135#ifdef WIN32
9136 case 'I': /* Ix, I32x, and I64x */
9137# ifdef WIN64
9138 if (q[1] == '6' && q[2] == '4') {
9139 q += 3;
9140 intsize = 'q';
9141 break;
9142 }
9143# endif
9144 if (q[1] == '3' && q[2] == '2') {
9145 q += 3;
9146 break;
9147 }
9148# ifdef WIN64
9149 intsize = 'q';
9150# endif
9151 q++;
9152 break;
9153#endif
9e5b023a 9154#if defined(HAS_QUAD) || defined(HAS_LONG_DOUBLE)
6f9bb7fd 9155 case 'L': /* Ld */
e5c81feb 9156 /* FALL THROUGH */
e5c81feb 9157#ifdef HAS_QUAD
6f9bb7fd 9158 case 'q': /* qd */
9e5b023a 9159#endif
6f9bb7fd
GS
9160 intsize = 'q';
9161 q++;
9162 break;
9163#endif
fc36a67e 9164 case 'l':
9e5b023a 9165#if defined(HAS_QUAD) || defined(HAS_LONG_DOUBLE)
205f51d8 9166 if (*(q + 1) == 'l') { /* lld, llf */
fc36a67e 9167 intsize = 'q';
9168 q += 2;
46fc3d4c 9169 break;
cf2093f6 9170 }
fc36a67e 9171#endif
6f9bb7fd 9172 /* FALL THROUGH */
fc36a67e 9173 case 'h':
cf2093f6 9174 /* FALL THROUGH */
fc36a67e 9175 case 'V':
9176 intsize = *q++;
46fc3d4c 9177 break;
9178 }
9179
fc36a67e 9180 /* CONVERSION */
9181
211dfcf1
HS
9182 if (*q == '%') {
9183 eptr = q++;
9184 elen = 1;
9185 goto string;
9186 }
9187
be75b157
HS
9188 if (vectorize)
9189 argsv = vecsv;
9190 else if (!args)
211dfcf1
HS
9191 argsv = (efix ? efix <= svmax : svix < svmax) ?
9192 svargs[efix ? efix-1 : svix++] : &PL_sv_undef;
9193
46fc3d4c 9194 switch (c = *q++) {
9195
9196 /* STRINGS */
9197
46fc3d4c 9198 case 'c':
be75b157 9199 uv = (args && !vectorize) ? va_arg(*args, int) : SvIVx(argsv);
1bd104fb
JH
9200 if ((uv > 255 ||
9201 (!UNI_IS_INVARIANT(uv) && SvUTF8(sv)))
0064a8a9 9202 && !IN_BYTES) {
dfe13c55 9203 eptr = (char*)utf8buf;
9041c2e3 9204 elen = uvchr_to_utf8((U8*)eptr, uv) - utf8buf;
2cf2cfc6 9205 is_utf8 = TRUE;
7e2040f0
GS
9206 }
9207 else {
9208 c = (char)uv;
9209 eptr = &c;
9210 elen = 1;
a0ed51b3 9211 }
46fc3d4c 9212 goto string;
9213
46fc3d4c 9214 case 's':
be75b157 9215 if (args && !vectorize) {
fc36a67e 9216 eptr = va_arg(*args, char*);
c635e13b 9217 if (eptr)
1d7c1841
GS
9218#ifdef MACOS_TRADITIONAL
9219 /* On MacOS, %#s format is used for Pascal strings */
9220 if (alt)
9221 elen = *eptr++;
9222 else
9223#endif
c635e13b 9224 elen = strlen(eptr);
9225 else {
27da23d5 9226 eptr = (char *)nullstr;
c635e13b 9227 elen = sizeof nullstr - 1;
9228 }
46fc3d4c 9229 }
211dfcf1 9230 else {
4d84ee25 9231 eptr = SvPVx_const(argsv, elen);
7e2040f0 9232 if (DO_UTF8(argsv)) {
a0ed51b3
LW
9233 if (has_precis && precis < elen) {
9234 I32 p = precis;
7e2040f0 9235 sv_pos_u2b(argsv, &p, 0); /* sticks at end */
a0ed51b3
LW
9236 precis = p;
9237 }
9238 if (width) { /* fudge width (can't fudge elen) */
7e2040f0 9239 width += elen - sv_len_utf8(argsv);
a0ed51b3 9240 }
2cf2cfc6 9241 is_utf8 = TRUE;
a0ed51b3
LW
9242 }
9243 }
fc36a67e 9244
46fc3d4c 9245 string:
b22c7a20 9246 vectorize = FALSE;
46fc3d4c 9247 if (has_precis && elen > precis)
9248 elen = precis;
9249 break;
9250
9251 /* INTEGERS */
9252
fc36a67e 9253 case 'p':
0dbb1585 9254 if (left && args) { /* SVf */
5df617be 9255 left = FALSE;
0dbb1585
AL
9256 if (width) {
9257 precis = width;
9258 has_precis = TRUE;
9259 width = 0;
9260 }
9261 if (vectorize)
9262 goto unknown;
9263 argsv = va_arg(*args, SV*);
4d84ee25 9264 eptr = SvPVx_const(argsv, elen);
0dbb1585
AL
9265 if (DO_UTF8(argsv))
9266 is_utf8 = TRUE;
9267 goto string;
5df617be 9268 }
be75b157 9269 if (alt || vectorize)
c2e66d9e 9270 goto unknown;
211dfcf1 9271 uv = PTR2UV(args ? va_arg(*args, void*) : argsv);
fc36a67e 9272 base = 16;
9273 goto integer;
9274
46fc3d4c 9275 case 'D':
29fe7a80 9276#ifdef IV_IS_QUAD
22f3ae8c 9277 intsize = 'q';
29fe7a80 9278#else
46fc3d4c 9279 intsize = 'l';
29fe7a80 9280#endif
46fc3d4c 9281 /* FALL THROUGH */
9282 case 'd':
9283 case 'i':
b22c7a20 9284 if (vectorize) {
ba210ebe 9285 STRLEN ulen;
211dfcf1
HS
9286 if (!veclen)
9287 continue;
2cf2cfc6
A
9288 if (vec_utf8)
9289 uv = utf8n_to_uvchr(vecstr, veclen, &ulen,
9290 UTF8_ALLOW_ANYUV);
b22c7a20 9291 else {
e83d50c9 9292 uv = *vecstr;
b22c7a20
GS
9293 ulen = 1;
9294 }
9295 vecstr += ulen;
9296 veclen -= ulen;
e83d50c9
JP
9297 if (plus)
9298 esignbuf[esignlen++] = plus;
b22c7a20
GS
9299 }
9300 else if (args) {
46fc3d4c 9301 switch (intsize) {
9302 case 'h': iv = (short)va_arg(*args, int); break;
46fc3d4c 9303 case 'l': iv = va_arg(*args, long); break;
fc36a67e 9304 case 'V': iv = va_arg(*args, IV); break;
b10c0dba 9305 default: iv = va_arg(*args, int); break;
cf2093f6
JH
9306#ifdef HAS_QUAD
9307 case 'q': iv = va_arg(*args, Quad_t); break;
9308#endif
46fc3d4c 9309 }
9310 }
9311 else {
b10c0dba 9312 IV tiv = SvIVx(argsv); /* work around GCC bug #13488 */
46fc3d4c 9313 switch (intsize) {
b10c0dba
MHM
9314 case 'h': iv = (short)tiv; break;
9315 case 'l': iv = (long)tiv; break;
9316 case 'V':
9317 default: iv = tiv; break;
cf2093f6 9318#ifdef HAS_QUAD
b10c0dba 9319 case 'q': iv = (Quad_t)tiv; break;
cf2093f6 9320#endif
46fc3d4c 9321 }
9322 }
e83d50c9
JP
9323 if ( !vectorize ) /* we already set uv above */
9324 {
9325 if (iv >= 0) {
9326 uv = iv;
9327 if (plus)
9328 esignbuf[esignlen++] = plus;
9329 }
9330 else {
9331 uv = -iv;
9332 esignbuf[esignlen++] = '-';
9333 }
46fc3d4c 9334 }
9335 base = 10;
9336 goto integer;
9337
fc36a67e 9338 case 'U':
29fe7a80 9339#ifdef IV_IS_QUAD
22f3ae8c 9340 intsize = 'q';
29fe7a80 9341#else
fc36a67e 9342 intsize = 'l';
29fe7a80 9343#endif
fc36a67e 9344 /* FALL THROUGH */
9345 case 'u':
9346 base = 10;
9347 goto uns_integer;
9348
4f19785b
WSI
9349 case 'b':
9350 base = 2;
9351 goto uns_integer;
9352
46fc3d4c 9353 case 'O':
29fe7a80 9354#ifdef IV_IS_QUAD
22f3ae8c 9355 intsize = 'q';
29fe7a80 9356#else
46fc3d4c 9357 intsize = 'l';
29fe7a80 9358#endif
46fc3d4c 9359 /* FALL THROUGH */
9360 case 'o':
9361 base = 8;
9362 goto uns_integer;
9363
9364 case 'X':
46fc3d4c 9365 case 'x':
9366 base = 16;
46fc3d4c 9367
9368 uns_integer:
b22c7a20 9369 if (vectorize) {
ba210ebe 9370 STRLEN ulen;
b22c7a20 9371 vector:
211dfcf1
HS
9372 if (!veclen)
9373 continue;
2cf2cfc6
A
9374 if (vec_utf8)
9375 uv = utf8n_to_uvchr(vecstr, veclen, &ulen,
9376 UTF8_ALLOW_ANYUV);
b22c7a20 9377 else {
a05b299f 9378 uv = *vecstr;
b22c7a20
GS
9379 ulen = 1;
9380 }
9381 vecstr += ulen;
9382 veclen -= ulen;
9383 }
9384 else if (args) {
46fc3d4c 9385 switch (intsize) {
9386 case 'h': uv = (unsigned short)va_arg(*args, unsigned); break;
46fc3d4c 9387 case 'l': uv = va_arg(*args, unsigned long); break;
fc36a67e 9388 case 'V': uv = va_arg(*args, UV); break;
b10c0dba 9389 default: uv = va_arg(*args, unsigned); break;
cf2093f6 9390#ifdef HAS_QUAD
9e3321a5 9391 case 'q': uv = va_arg(*args, Uquad_t); break;
cf2093f6 9392#endif
46fc3d4c 9393 }
9394 }
9395 else {
b10c0dba 9396 UV tuv = SvUVx(argsv); /* work around GCC bug #13488 */
46fc3d4c 9397 switch (intsize) {
b10c0dba
MHM
9398 case 'h': uv = (unsigned short)tuv; break;
9399 case 'l': uv = (unsigned long)tuv; break;
9400 case 'V':
9401 default: uv = tuv; break;
cf2093f6 9402#ifdef HAS_QUAD
b10c0dba 9403 case 'q': uv = (Uquad_t)tuv; break;
cf2093f6 9404#endif
46fc3d4c 9405 }
9406 }
9407
9408 integer:
4d84ee25
NC
9409 {
9410 char *ptr = ebuf + sizeof ebuf;
9411 switch (base) {
9412 unsigned dig;
9413 case 16:
9414 if (!uv)
9415 alt = FALSE;
9416 p = (char*)((c == 'X')
9417 ? "0123456789ABCDEF" : "0123456789abcdef");
9418 do {
9419 dig = uv & 15;
9420 *--ptr = p[dig];
9421 } while (uv >>= 4);
9422 if (alt) {
9423 esignbuf[esignlen++] = '0';
9424 esignbuf[esignlen++] = c; /* 'x' or 'X' */
9425 }
9426 break;
9427 case 8:
9428 do {
9429 dig = uv & 7;
9430 *--ptr = '0' + dig;
9431 } while (uv >>= 3);
9432 if (alt && *ptr != '0')
9433 *--ptr = '0';
9434 break;
9435 case 2:
9436 do {
9437 dig = uv & 1;
9438 *--ptr = '0' + dig;
9439 } while (uv >>= 1);
9440 if (alt) {
9441 esignbuf[esignlen++] = '0';
9442 esignbuf[esignlen++] = 'b';
9443 }
9444 break;
9445 default: /* it had better be ten or less */
9446 do {
9447 dig = uv % base;
9448 *--ptr = '0' + dig;
9449 } while (uv /= base);
9450 break;
46fc3d4c 9451 }
4d84ee25
NC
9452 elen = (ebuf + sizeof ebuf) - ptr;
9453 eptr = ptr;
9454 if (has_precis) {
9455 if (precis > elen)
9456 zeros = precis - elen;
9457 else if (precis == 0 && elen == 1 && *eptr == '0')
9458 elen = 0;
eda88b6d 9459 }
c10ed8b9 9460 }
46fc3d4c 9461 break;
9462
9463 /* FLOATING POINT */
9464
fc36a67e 9465 case 'F':
9466 c = 'f'; /* maybe %F isn't supported here */
9467 /* FALL THROUGH */
46fc3d4c 9468 case 'e': case 'E':
fc36a67e 9469 case 'f':
46fc3d4c 9470 case 'g': case 'G':
9471
9472 /* This is evil, but floating point is even more evil */
9473
9e5b023a
JH
9474 /* for SV-style calling, we can only get NV
9475 for C-style calling, we assume %f is double;
9476 for simplicity we allow any of %Lf, %llf, %qf for long double
9477 */
9478 switch (intsize) {
9479 case 'V':
9480#if defined(USE_LONG_DOUBLE)
9481 intsize = 'q';
9482#endif
9483 break;
8a2e3f14 9484/* [perl #20339] - we should accept and ignore %lf rather than die */
00e17364
HS
9485 case 'l':
9486 /* FALL THROUGH */
9e5b023a
JH
9487 default:
9488#if defined(USE_LONG_DOUBLE)
9489 intsize = args ? 0 : 'q';
9490#endif
9491 break;
9492 case 'q':
9493#if defined(HAS_LONG_DOUBLE)
9494 break;
9495#else
9496 /* FALL THROUGH */
9497#endif
9498 case 'h':
9e5b023a
JH
9499 goto unknown;
9500 }
9501
9502 /* now we need (long double) if intsize == 'q', else (double) */
be75b157 9503 nv = (args && !vectorize) ?
35fff930
JH
9504#if LONG_DOUBLESIZE > DOUBLESIZE
9505 intsize == 'q' ?
205f51d8
AS
9506 va_arg(*args, long double) :
9507 va_arg(*args, double)
35fff930 9508#else
205f51d8 9509 va_arg(*args, double)
35fff930 9510#endif
9e5b023a 9511 : SvNVx(argsv);
fc36a67e 9512
9513 need = 0;
be75b157 9514 vectorize = FALSE;
fc36a67e 9515 if (c != 'e' && c != 'E') {
9516 i = PERL_INT_MIN;
9e5b023a
JH
9517 /* FIXME: if HAS_LONG_DOUBLE but not USE_LONG_DOUBLE this
9518 will cast our (long double) to (double) */
73b309ea 9519 (void)Perl_frexp(nv, &i);
fc36a67e 9520 if (i == PERL_INT_MIN)
cea2e8a9 9521 Perl_die(aTHX_ "panic: frexp");
c635e13b 9522 if (i > 0)
fc36a67e 9523 need = BIT_DIGITS(i);
9524 }
9525 need += has_precis ? precis : 6; /* known default */
20f6aaab 9526
fc36a67e 9527 if (need < width)
9528 need = width;
9529
20f6aaab
AS
9530#ifdef HAS_LDBL_SPRINTF_BUG
9531 /* This is to try to fix a bug with irix/nonstop-ux/powerux and
205f51d8
AS
9532 with sfio - Allen <allens@cpan.org> */
9533
9534# ifdef DBL_MAX
9535# define MY_DBL_MAX DBL_MAX
9536# else /* XXX guessing! HUGE_VAL may be defined as infinity, so not using */
9537# if DOUBLESIZE >= 8
9538# define MY_DBL_MAX 1.7976931348623157E+308L
9539# else
9540# define MY_DBL_MAX 3.40282347E+38L
9541# endif
9542# endif
9543
9544# ifdef HAS_LDBL_SPRINTF_BUG_LESS1 /* only between -1L & 1L - Allen */
9545# define MY_DBL_MAX_BUG 1L
20f6aaab 9546# else
205f51d8 9547# define MY_DBL_MAX_BUG MY_DBL_MAX
20f6aaab 9548# endif
20f6aaab 9549
205f51d8
AS
9550# ifdef DBL_MIN
9551# define MY_DBL_MIN DBL_MIN
9552# else /* XXX guessing! -Allen */
9553# if DOUBLESIZE >= 8
9554# define MY_DBL_MIN 2.2250738585072014E-308L
9555# else
9556# define MY_DBL_MIN 1.17549435E-38L
9557# endif
9558# endif
20f6aaab 9559
205f51d8
AS
9560 if ((intsize == 'q') && (c == 'f') &&
9561 ((nv < MY_DBL_MAX_BUG) && (nv > -MY_DBL_MAX_BUG)) &&
9562 (need < DBL_DIG)) {
9563 /* it's going to be short enough that
9564 * long double precision is not needed */
9565
9566 if ((nv <= 0L) && (nv >= -0L))
9567 fix_ldbl_sprintf_bug = TRUE; /* 0 is 0 - easiest */
9568 else {
9569 /* would use Perl_fp_class as a double-check but not
9570 * functional on IRIX - see perl.h comments */
9571
9572 if ((nv >= MY_DBL_MIN) || (nv <= -MY_DBL_MIN)) {
9573 /* It's within the range that a double can represent */
9574#if defined(DBL_MAX) && !defined(DBL_MIN)
9575 if ((nv >= ((long double)1/DBL_MAX)) ||
9576 (nv <= (-(long double)1/DBL_MAX)))
20f6aaab 9577#endif
205f51d8 9578 fix_ldbl_sprintf_bug = TRUE;
20f6aaab 9579 }
205f51d8
AS
9580 }
9581 if (fix_ldbl_sprintf_bug == TRUE) {
9582 double temp;
9583
9584 intsize = 0;
9585 temp = (double)nv;
9586 nv = (NV)temp;
9587 }
20f6aaab 9588 }
205f51d8
AS
9589
9590# undef MY_DBL_MAX
9591# undef MY_DBL_MAX_BUG
9592# undef MY_DBL_MIN
9593
20f6aaab
AS
9594#endif /* HAS_LDBL_SPRINTF_BUG */
9595
46fc3d4c 9596 need += 20; /* fudge factor */
80252599
GS
9597 if (PL_efloatsize < need) {
9598 Safefree(PL_efloatbuf);
9599 PL_efloatsize = need + 20; /* more fudge */
a02a5408 9600 Newx(PL_efloatbuf, PL_efloatsize, char);
7d5ea4e7 9601 PL_efloatbuf[0] = '\0';
46fc3d4c 9602 }
9603
4151a5fe
IZ
9604 if ( !(width || left || plus || alt) && fill != '0'
9605 && has_precis && intsize != 'q' ) { /* Shortcuts */
2873255c
NC
9606 /* See earlier comment about buggy Gconvert when digits,
9607 aka precis is 0 */
9608 if ( c == 'g' && precis) {
2e59c212 9609 Gconvert((NV)nv, (int)precis, 0, PL_efloatbuf);
4151a5fe
IZ
9610 if (*PL_efloatbuf) /* May return an empty string for digits==0 */
9611 goto float_converted;
9612 } else if ( c == 'f' && !precis) {
9613 if ((eptr = F0convert(nv, ebuf + sizeof ebuf, &elen)))
9614 break;
9615 }
9616 }
4d84ee25
NC
9617 {
9618 char *ptr = ebuf + sizeof ebuf;
9619 *--ptr = '\0';
9620 *--ptr = c;
9621 /* FIXME: what to do if HAS_LONG_DOUBLE but not PERL_PRIfldbl? */
9e5b023a 9622#if defined(HAS_LONG_DOUBLE) && defined(PERL_PRIfldbl)
4d84ee25
NC
9623 if (intsize == 'q') {
9624 /* Copy the one or more characters in a long double
9625 * format before the 'base' ([efgEFG]) character to
9626 * the format string. */
9627 static char const prifldbl[] = PERL_PRIfldbl;
9628 char const *p = prifldbl + sizeof(prifldbl) - 3;
9629 while (p >= prifldbl) { *--ptr = *p--; }
9630 }
65202027 9631#endif
4d84ee25
NC
9632 if (has_precis) {
9633 base = precis;
9634 do { *--ptr = '0' + (base % 10); } while (base /= 10);
9635 *--ptr = '.';
9636 }
9637 if (width) {
9638 base = width;
9639 do { *--ptr = '0' + (base % 10); } while (base /= 10);
9640 }
9641 if (fill == '0')
9642 *--ptr = fill;
9643 if (left)
9644 *--ptr = '-';
9645 if (plus)
9646 *--ptr = plus;
9647 if (alt)
9648 *--ptr = '#';
9649 *--ptr = '%';
9650
9651 /* No taint. Otherwise we are in the strange situation
9652 * where printf() taints but print($float) doesn't.
9653 * --jhi */
9e5b023a 9654#if defined(HAS_LONG_DOUBLE)
4d84ee25
NC
9655 if (intsize == 'q')
9656 (void)sprintf(PL_efloatbuf, ptr, nv);
9657 else
9658 (void)sprintf(PL_efloatbuf, ptr, (double)nv);
9e5b023a 9659#else
4d84ee25 9660 (void)sprintf(PL_efloatbuf, ptr, nv);
9e5b023a 9661#endif
4d84ee25 9662 }
4151a5fe 9663 float_converted:
80252599
GS
9664 eptr = PL_efloatbuf;
9665 elen = strlen(PL_efloatbuf);
46fc3d4c 9666 break;
9667
fc36a67e 9668 /* SPECIAL */
9669
9670 case 'n':
9671 i = SvCUR(sv) - origlen;
be75b157 9672 if (args && !vectorize) {
c635e13b 9673 switch (intsize) {
9674 case 'h': *(va_arg(*args, short*)) = i; break;
9675 default: *(va_arg(*args, int*)) = i; break;
9676 case 'l': *(va_arg(*args, long*)) = i; break;
9677 case 'V': *(va_arg(*args, IV*)) = i; break;
cf2093f6
JH
9678#ifdef HAS_QUAD
9679 case 'q': *(va_arg(*args, Quad_t*)) = i; break;
9680#endif
c635e13b 9681 }
fc36a67e 9682 }
9dd79c3f 9683 else
211dfcf1 9684 sv_setuv_mg(argsv, (UV)i);
be75b157 9685 vectorize = FALSE;
fc36a67e 9686 continue; /* not "break" */
9687
9688 /* UNKNOWN */
9689
46fc3d4c 9690 default:
fc36a67e 9691 unknown:
041457d9
DM
9692 if (!args
9693 && (PL_op->op_type == OP_PRTF || PL_op->op_type == OP_SPRINTF)
9694 && ckWARN(WARN_PRINTF))
9695 {
c635e13b 9696 SV *msg = sv_newmortal();
35c1215d
NC
9697 Perl_sv_setpvf(aTHX_ msg, "Invalid conversion in %sprintf: ",
9698 (PL_op->op_type == OP_PRTF) ? "" : "s");
0f4b6630 9699 if (c) {
0f4b6630 9700 if (isPRINT(c))
1c846c1f 9701 Perl_sv_catpvf(aTHX_ msg,
0f4b6630
JH
9702 "\"%%%c\"", c & 0xFF);
9703 else
9704 Perl_sv_catpvf(aTHX_ msg,
57def98f 9705 "\"%%\\%03"UVof"\"",
0f4b6630 9706 (UV)c & 0xFF);
0f4b6630 9707 } else
c635e13b 9708 sv_catpv(msg, "end of string");
9014280d 9709 Perl_warner(aTHX_ packWARN(WARN_PRINTF), "%"SVf, msg); /* yes, this is reentrant */
c635e13b 9710 }
fb73857a 9711
9712 /* output mangled stuff ... */
9713 if (c == '\0')
9714 --q;
46fc3d4c 9715 eptr = p;
9716 elen = q - p;
fb73857a 9717
9718 /* ... right here, because formatting flags should not apply */
9719 SvGROW(sv, SvCUR(sv) + elen + 1);
9720 p = SvEND(sv);
4459522c 9721 Copy(eptr, p, elen, char);
fb73857a 9722 p += elen;
9723 *p = '\0';
3f7c398e 9724 SvCUR_set(sv, p - SvPVX_const(sv));
58e33a90 9725 svix = osvix;
fb73857a 9726 continue; /* not "break" */
46fc3d4c 9727 }
9728
6c94ec8b
HS
9729 /* calculate width before utf8_upgrade changes it */
9730 have = esignlen + zeros + elen;
9731
d2876be5
JH
9732 if (is_utf8 != has_utf8) {
9733 if (is_utf8) {
9734 if (SvCUR(sv))
9735 sv_utf8_upgrade(sv);
9736 }
9737 else {
53c1dcc0 9738 SV * const nsv = sv_2mortal(newSVpvn(eptr, elen));
d2876be5 9739 sv_utf8_upgrade(nsv);
93524f2b 9740 eptr = SvPVX_const(nsv);
d2876be5
JH
9741 elen = SvCUR(nsv);
9742 }
9743 SvGROW(sv, SvCUR(sv) + elen + 1);
9744 p = SvEND(sv);
9745 *p = '\0';
9746 }
6af65485 9747
46fc3d4c 9748 need = (have > width ? have : width);
9749 gap = need - have;
9750
b22c7a20 9751 SvGROW(sv, SvCUR(sv) + need + dotstrlen + 1);
46fc3d4c 9752 p = SvEND(sv);
9753 if (esignlen && fill == '0') {
53c1dcc0 9754 int i;
eb160463 9755 for (i = 0; i < (int)esignlen; i++)
46fc3d4c 9756 *p++ = esignbuf[i];
9757 }
9758 if (gap && !left) {
9759 memset(p, fill, gap);
9760 p += gap;
9761 }
9762 if (esignlen && fill != '0') {
53c1dcc0 9763 int i;
eb160463 9764 for (i = 0; i < (int)esignlen; i++)
46fc3d4c 9765 *p++ = esignbuf[i];
9766 }
fc36a67e 9767 if (zeros) {
53c1dcc0 9768 int i;
fc36a67e 9769 for (i = zeros; i; i--)
9770 *p++ = '0';
9771 }
46fc3d4c 9772 if (elen) {
4459522c 9773 Copy(eptr, p, elen, char);
46fc3d4c 9774 p += elen;
9775 }
9776 if (gap && left) {
9777 memset(p, ' ', gap);
9778 p += gap;
9779 }
b22c7a20
GS
9780 if (vectorize) {
9781 if (veclen) {
4459522c 9782 Copy(dotstr, p, dotstrlen, char);
b22c7a20
GS
9783 p += dotstrlen;
9784 }
9785 else
9786 vectorize = FALSE; /* done iterating over vecstr */
9787 }
2cf2cfc6
A
9788 if (is_utf8)
9789 has_utf8 = TRUE;
9790 if (has_utf8)
7e2040f0 9791 SvUTF8_on(sv);
46fc3d4c 9792 *p = '\0';
3f7c398e 9793 SvCUR_set(sv, p - SvPVX_const(sv));
b22c7a20
GS
9794 if (vectorize) {
9795 esignlen = 0;
9796 goto vector;
9797 }
46fc3d4c 9798 }
9799}
51371543 9800
645c22ef
DM
9801/* =========================================================================
9802
9803=head1 Cloning an interpreter
9804
9805All the macros and functions in this section are for the private use of
9806the main function, perl_clone().
9807
9808The foo_dup() functions make an exact copy of an existing foo thingy.
9809During the course of a cloning, a hash table is used to map old addresses
9810to new addresses. The table is created and manipulated with the
9811ptr_table_* functions.
9812
9813=cut
9814
9815============================================================================*/
9816
9817
1d7c1841
GS
9818#if defined(USE_ITHREADS)
9819
1d7c1841
GS
/* Bump a GP's reference count and yield the GP; a NULL gp yields NULL. */
#ifndef GpREFCNT_inc
#  define GpREFCNT_inc(gp)	((gp) ? (++(gp)->gp_refcnt, (gp)) : (GP*)NULL)
#endif

/*
 * Typed wrappers around sv_dup().  The plain foo_dup() forms cast the
 * argument to SV* and the result back to the wanted type; the
 * foo_dup_inc() forms additionally pass the clone through SvREFCNT_inc().
 *
 * Every macro argument is parenthesized, and every cast-style expansion is
 * wrapped as a whole, so that an expression argument (e.g. "a ? b : c")
 * or a trailing operator at the call site cannot change what gets cast.
 */
#define sv_dup_inc(s,t)	SvREFCNT_inc(sv_dup((s),(t)))
#define av_dup(s,t)	((AV*)sv_dup((SV*)(s),(t)))
#define av_dup_inc(s,t)	((AV*)SvREFCNT_inc(sv_dup((SV*)(s),(t))))
#define hv_dup(s,t)	((HV*)sv_dup((SV*)(s),(t)))
#define hv_dup_inc(s,t)	((HV*)SvREFCNT_inc(sv_dup((SV*)(s),(t))))
#define cv_dup(s,t)	((CV*)sv_dup((SV*)(s),(t)))
#define cv_dup_inc(s,t)	((CV*)SvREFCNT_inc(sv_dup((SV*)(s),(t))))
#define io_dup(s,t)	((IO*)sv_dup((SV*)(s),(t)))
#define io_dup_inc(s,t)	((IO*)SvREFCNT_inc(sv_dup((SV*)(s),(t))))
#define gv_dup(s,t)	((GV*)sv_dup((SV*)(s),(t)))
#define gv_dup_inc(s,t)	((GV*)SvREFCNT_inc(sv_dup((SV*)(s),(t))))

/* NULL-tolerant string copies: a NULL pointer yields Nullch instead of
 * being handed to savepv()/savepvn().  Note that p is evaluated twice. */
#define SAVEPV(p)	((p) ? savepv(p) : Nullch)
#define SAVEPVN(p,n)	((p) ? savepvn((p),(n)) : Nullch)
8cf8f3d1 9838
d2d73c3e 9839
d2f185dc
AMS
9840/* Duplicate a regexp. Required reading: pregcomp() and pregfree() in
9841 regcomp.c. AMS 20010712 */
645c22ef 9842
1d7c1841 9843REGEXP *
53c1dcc0 9844Perl_re_dup(pTHX_ const REGEXP *r, CLONE_PARAMS *param)
1d7c1841 9845{
27da23d5 9846 dVAR;
d2f185dc
AMS
9847 REGEXP *ret;
9848 int i, len, npar;
9849 struct reg_substr_datum *s;
9850
9851 if (!r)
9852 return (REGEXP *)NULL;
9853
9854 if ((ret = (REGEXP *)ptr_table_fetch(PL_ptr_table, r)))
9855 return ret;
9856
9857 len = r->offsets[0];
9858 npar = r->nparens+1;
9859
a02a5408 9860 Newxc(ret, sizeof(regexp) + (len+1)*sizeof(regnode), char, regexp);
d2f185dc
AMS
9861 Copy(r->program, ret->program, len+1, regnode);
9862
a02a5408 9863 Newx(ret->startp, npar, I32);
d2f185dc 9864 Copy(r->startp, ret->startp, npar, I32);
a02a5408 9865 Newx(ret->endp, npar, I32);
d2f185dc
AMS
9866 Copy(r->startp, ret->startp, npar, I32);
9867
a02a5408 9868 Newx(ret->substrs, 1, struct reg_substr_data);
d2f185dc
AMS
9869 for (s = ret->substrs->data, i = 0; i < 3; i++, s++) {
9870 s->min_offset = r->substrs->data[i].min_offset;
9871 s->max_offset = r->substrs->data[i].max_offset;
9872 s->substr = sv_dup_inc(r->substrs->data[i].substr, param);
33b8afdf 9873 s->utf8_substr = sv_dup_inc(r->substrs->data[i].utf8_substr, param);
d2f185dc
AMS
9874 }
9875
70612e96 9876 ret->regstclass = NULL;
d2f185dc
AMS
9877 if (r->data) {
9878 struct reg_data *d;
e1ec3a88 9879 const int count = r->data->count;
53c1dcc0 9880 int i;
d2f185dc 9881
a02a5408 9882 Newxc(d, sizeof(struct reg_data) + count*sizeof(void *),
d2f185dc 9883 char, struct reg_data);
a02a5408 9884 Newx(d->what, count, U8);
d2f185dc
AMS
9885
9886 d->count = count;
9887 for (i = 0; i < count; i++) {
9888 d->what[i] = r->data->what[i];
9889 switch (d->what[i]) {
a3621e74
YO
9890 /* legal options are one of: sfpont
9891 see also regcomp.h and pregfree() */
d2f185dc
AMS
9892 case 's':
9893 d->data[i] = sv_dup_inc((SV *)r->data->data[i], param);
9894 break;
9895 case 'p':
9896 d->data[i] = av_dup_inc((AV *)r->data->data[i], param);
9897 break;
9898 case 'f':
9899 /* This is cheating. */
a02a5408 9900 Newx(d->data[i], 1, struct regnode_charclass_class);
d2f185dc
AMS
9901 StructCopy(r->data->data[i], d->data[i],
9902 struct regnode_charclass_class);
70612e96 9903 ret->regstclass = (regnode*)d->data[i];
d2f185dc
AMS
9904 break;
9905 case 'o':
33773810
AMS
9906 /* Compiled op trees are readonly, and can thus be
9907 shared without duplication. */
b34c0dd4 9908 OP_REFCNT_LOCK;
9b978d73 9909 d->data[i] = (void*)OpREFCNT_inc((OP*)r->data->data[i]);
b34c0dd4 9910 OP_REFCNT_UNLOCK;
9b978d73 9911 break;
d2f185dc
AMS
9912 case 'n':
9913 d->data[i] = r->data->data[i];
9914 break;
a3621e74
YO
9915 case 't':
9916 d->data[i] = r->data->data[i];
9917 OP_REFCNT_LOCK;
9918 ((reg_trie_data*)d->data[i])->refcount++;
9919 OP_REFCNT_UNLOCK;
9920 break;
9921 default:
9922 Perl_croak(aTHX_ "panic: re_dup unknown data code '%c'", r->data->what[i]);
d2f185dc
AMS
9923 }
9924 }
9925
9926 ret->data = d;
9927 }
9928 else
9929 ret->data = NULL;
9930
a02a5408 9931 Newx(ret->offsets, 2*len+1, U32);
d2f185dc
AMS
9932 Copy(r->offsets, ret->offsets, 2*len+1, U32);
9933
e01c5899 9934 ret->precomp = SAVEPVN(r->precomp, r->prelen);
d2f185dc
AMS
9935 ret->refcnt = r->refcnt;
9936 ret->minlen = r->minlen;
9937 ret->prelen = r->prelen;
9938 ret->nparens = r->nparens;
9939 ret->lastparen = r->lastparen;
9940 ret->lastcloseparen = r->lastcloseparen;
9941 ret->reganch = r->reganch;
9942
70612e96
RG
9943 ret->sublen = r->sublen;
9944
9945 if (RX_MATCH_COPIED(ret))
e01c5899 9946 ret->subbeg = SAVEPVN(r->subbeg, r->sublen);
70612e96
RG
9947 else
9948 ret->subbeg = Nullch;
f8c7b90f 9949#ifdef PERL_OLD_COPY_ON_WRITE
9a26048b
NC
9950 ret->saved_copy = Nullsv;
9951#endif
70612e96 9952
d2f185dc
AMS
9953 ptr_table_store(PL_ptr_table, r, ret);
9954 return ret;
1d7c1841
GS
9955}
9956
d2d73c3e 9957/* duplicate a file handle */
645c22ef 9958
1d7c1841 9959PerlIO *
a8fc9800 9960Perl_fp_dup(pTHX_ PerlIO *fp, char type, CLONE_PARAMS *param)
1d7c1841
GS
9961{
9962 PerlIO *ret;
53c1dcc0
AL
9963
9964 PERL_UNUSED_ARG(type);
73d840c0 9965
1d7c1841
GS
9966 if (!fp)
9967 return (PerlIO*)NULL;
9968
9969 /* look for it in the table first */
9970 ret = (PerlIO*)ptr_table_fetch(PL_ptr_table, fp);
9971 if (ret)
9972 return ret;
9973
9974 /* create anew and remember what it is */
ecdeb87c 9975 ret = PerlIO_fdupopen(aTHX_ fp, param, PERLIO_DUP_CLONE);
1d7c1841
GS
9976 ptr_table_store(PL_ptr_table, fp, ret);
9977 return ret;
9978}
9979
645c22ef
DM
9980/* duplicate a directory handle */
9981
1d7c1841
GS
9982DIR *
9983Perl_dirp_dup(pTHX_ DIR *dp)
9984{
9985 if (!dp)
9986 return (DIR*)NULL;
9987 /* XXX TODO */
9988 return dp;
9989}
9990
ff276b08 9991/* duplicate a typeglob */
645c22ef 9992
1d7c1841 9993GP *
a8fc9800 9994Perl_gp_dup(pTHX_ GP *gp, CLONE_PARAMS* param)
1d7c1841
GS
9995{
9996 GP *ret;
9997 if (!gp)
9998 return (GP*)NULL;
9999 /* look for it in the table first */
10000 ret = (GP*)ptr_table_fetch(PL_ptr_table, gp);
10001 if (ret)
10002 return ret;
10003
10004 /* create anew and remember what it is */
a02a5408 10005 Newxz(ret, 1, GP);
1d7c1841
GS
10006 ptr_table_store(PL_ptr_table, gp, ret);
10007
10008 /* clone */
10009 ret->gp_refcnt = 0; /* must be before any other dups! */
d2d73c3e
AB
10010 ret->gp_sv = sv_dup_inc(gp->gp_sv, param);
10011 ret->gp_io = io_dup_inc(gp->gp_io, param);
10012 ret->gp_form = cv_dup_inc(gp->gp_form, param);
10013 ret->gp_av = av_dup_inc(gp->gp_av, param);
10014 ret->gp_hv = hv_dup_inc(gp->gp_hv, param);
10015 ret->gp_egv = gv_dup(gp->gp_egv, param);/* GvEGV is not refcounted */
10016 ret->gp_cv = cv_dup_inc(gp->gp_cv, param);
1d7c1841 10017 ret->gp_cvgen = gp->gp_cvgen;
1d7c1841
GS
10018 ret->gp_line = gp->gp_line;
10019 ret->gp_file = gp->gp_file; /* points to COP.cop_file */
10020 return ret;
10021}
10022
645c22ef
DM
10023/* duplicate a chain of magic */
10024
1d7c1841 10025MAGIC *
a8fc9800 10026Perl_mg_dup(pTHX_ MAGIC *mg, CLONE_PARAMS* param)
1d7c1841 10027{
cb359b41
JH
10028 MAGIC *mgprev = (MAGIC*)NULL;
10029 MAGIC *mgret;
1d7c1841
GS
10030 if (!mg)
10031 return (MAGIC*)NULL;
10032 /* look for it in the table first */
10033 mgret = (MAGIC*)ptr_table_fetch(PL_ptr_table, mg);
10034 if (mgret)
10035 return mgret;
10036
10037 for (; mg; mg = mg->mg_moremagic) {
10038 MAGIC *nmg;
a02a5408 10039 Newxz(nmg, 1, MAGIC);
cb359b41 10040 if (mgprev)
1d7c1841 10041 mgprev->mg_moremagic = nmg;
cb359b41
JH
10042 else
10043 mgret = nmg;
1d7c1841
GS
10044 nmg->mg_virtual = mg->mg_virtual; /* XXX copy dynamic vtable? */
10045 nmg->mg_private = mg->mg_private;
10046 nmg->mg_type = mg->mg_type;
10047 nmg->mg_flags = mg->mg_flags;
14befaf4 10048 if (mg->mg_type == PERL_MAGIC_qr) {
d2f185dc 10049 nmg->mg_obj = (SV*)re_dup((REGEXP*)mg->mg_obj, param);
1d7c1841 10050 }
05bd4103 10051 else if(mg->mg_type == PERL_MAGIC_backref) {
7fc63493 10052 const AV * const av = (AV*) mg->mg_obj;
fdc9a813
AE
10053 SV **svp;
10054 I32 i;
7fc63493 10055 (void)SvREFCNT_inc(nmg->mg_obj = (SV*)newAV());
fdc9a813
AE
10056 svp = AvARRAY(av);
10057 for (i = AvFILLp(av); i >= 0; i--) {
3a81978b 10058 if (!svp[i]) continue;
fdc9a813
AE
10059 av_push((AV*)nmg->mg_obj,sv_dup(svp[i],param));
10060 }
05bd4103 10061 }
8d2f4536
NC
10062 else if (mg->mg_type == PERL_MAGIC_symtab) {
10063 nmg->mg_obj = mg->mg_obj;
10064 }
1d7c1841
GS
10065 else {
10066 nmg->mg_obj = (mg->mg_flags & MGf_REFCOUNTED)
d2d73c3e
AB
10067 ? sv_dup_inc(mg->mg_obj, param)
10068 : sv_dup(mg->mg_obj, param);
1d7c1841
GS
10069 }
10070 nmg->mg_len = mg->mg_len;
10071 nmg->mg_ptr = mg->mg_ptr; /* XXX random ptr? */
14befaf4 10072 if (mg->mg_ptr && mg->mg_type != PERL_MAGIC_regex_global) {
68795e93 10073 if (mg->mg_len > 0) {
1d7c1841 10074 nmg->mg_ptr = SAVEPVN(mg->mg_ptr, mg->mg_len);
14befaf4
DM
10075 if (mg->mg_type == PERL_MAGIC_overload_table &&
10076 AMT_AMAGIC((AMT*)mg->mg_ptr))
10077 {
1d7c1841
GS
10078 AMT *amtp = (AMT*)mg->mg_ptr;
10079 AMT *namtp = (AMT*)nmg->mg_ptr;
10080 I32 i;
10081 for (i = 1; i < NofAMmeth; i++) {
d2d73c3e 10082 namtp->table[i] = cv_dup_inc(amtp->table[i], param);
1d7c1841
GS
10083 }
10084 }
10085 }
10086 else if (mg->mg_len == HEf_SVKEY)
d2d73c3e 10087 nmg->mg_ptr = (char*)sv_dup_inc((SV*)mg->mg_ptr, param);
1d7c1841 10088 }
68795e93
NIS
10089 if ((mg->mg_flags & MGf_DUP) && mg->mg_virtual && mg->mg_virtual->svt_dup) {
10090 CALL_FPTR(nmg->mg_virtual->svt_dup)(aTHX_ nmg, param);
10091 }
1d7c1841
GS
10092 mgprev = nmg;
10093 }
10094 return mgret;
10095}
10096
645c22ef
DM
10097/* create a new pointer-mapping table */
10098
1d7c1841
GS
10099PTR_TBL_t *
10100Perl_ptr_table_new(pTHX)
10101{
10102 PTR_TBL_t *tbl;
a02a5408 10103 Newxz(tbl, 1, PTR_TBL_t);
1d7c1841
GS
10104 tbl->tbl_max = 511;
10105 tbl->tbl_items = 0;
a02a5408 10106 Newxz(tbl->tbl_ary, tbl->tbl_max + 1, PTR_TBL_ENT_t*);
1d7c1841
GS
10107 return tbl;
10108}
10109
134ca3d6
DM
/* PTR_TABLE_HASH(ptr): hash value for a pointer key -- the pointer's integer
 * value (PTR2UV) shifted right by 3 bits when PTRSIZE is 8, and by 2 bits
 * otherwise.  NOTE(review): presumably the dropped low bits are always zero
 * because of allocation alignment -- confirm. */
10110#if (PTRSIZE == 8)
10111# define PTR_TABLE_HASH(ptr) (PTR2UV(ptr) >> 3)
10112#else
10113# define PTR_TABLE_HASH(ptr) (PTR2UV(ptr) >> 2)
10114#endif
10115
/* del_pte(p): release one table entry via del_body_type(), passing the
 * entry type (struct ptr_tbl_ent) and the "pte" tag. */
cb4415b8 10116#define del_pte(p) del_body_type(p, struct ptr_tbl_ent, pte)
32e691d0 10117
645c22ef
DM
10118/* map an existing pointer using a table */
10119
1d7c1841 10120void *
53c1dcc0 10121Perl_ptr_table_fetch(pTHX_ PTR_TBL_t *tbl, const void *sv)
1d7c1841
GS
10122{
10123 PTR_TBL_ENT_t *tblent;
4373e329 10124 const UV hash = PTR_TABLE_HASH(sv);
1d7c1841
GS
10125 assert(tbl);
10126 tblent = tbl->tbl_ary[hash & tbl->tbl_max];
10127 for (; tblent; tblent = tblent->next) {
10128 if (tblent->oldval == sv)
10129 return tblent->newval;
10130 }
10131 return (void*)NULL;
10132}
10133
645c22ef
DM
10134/* add a new entry to a pointer-mapping table */
10135
1d7c1841 10136void
53c1dcc0 10137Perl_ptr_table_store(pTHX_ PTR_TBL_t *tbl, const void *oldv, void *newv)
1d7c1841
GS
10138{
10139 PTR_TBL_ENT_t *tblent, **otblent;
10140 /* XXX this may be pessimal on platforms where pointers aren't good
10141 * hash values e.g. if they grow faster in the most significant
10142 * bits */
4373e329 10143 const UV hash = PTR_TABLE_HASH(oldv);
14cade97 10144 bool empty = 1;
1d7c1841
GS
10145
10146 assert(tbl);
10147 otblent = &tbl->tbl_ary[hash & tbl->tbl_max];
14cade97 10148 for (tblent = *otblent; tblent; empty=0, tblent = tblent->next) {
1d7c1841
GS
10149 if (tblent->oldval == oldv) {
10150 tblent->newval = newv;
1d7c1841
GS
10151 return;
10152 }
10153 }
08742458
NC
10154 new_body_inline(tblent, (void**)&PL_pte_arenaroot, (void**)&PL_pte_root,
10155 sizeof(struct ptr_tbl_ent));
1d7c1841
GS
10156 tblent->oldval = oldv;
10157 tblent->newval = newv;
10158 tblent->next = *otblent;
10159 *otblent = tblent;
10160 tbl->tbl_items++;
14cade97 10161 if (!empty && tbl->tbl_items > tbl->tbl_max)
1d7c1841
GS
10162 ptr_table_split(tbl);
10163}
10164
645c22ef
DM
10165/* double the hash bucket size of an existing ptr table */
10166
1d7c1841
GS
10167void
10168Perl_ptr_table_split(pTHX_ PTR_TBL_t *tbl)
10169{
10170 PTR_TBL_ENT_t **ary = tbl->tbl_ary;
4373e329 10171 const UV oldsize = tbl->tbl_max + 1;
1d7c1841
GS
10172 UV newsize = oldsize * 2;
10173 UV i;
10174
10175 Renew(ary, newsize, PTR_TBL_ENT_t*);
10176 Zero(&ary[oldsize], newsize-oldsize, PTR_TBL_ENT_t*);
10177 tbl->tbl_max = --newsize;
10178 tbl->tbl_ary = ary;
10179 for (i=0; i < oldsize; i++, ary++) {
10180 PTR_TBL_ENT_t **curentp, **entp, *ent;
10181 if (!*ary)
10182 continue;
10183 curentp = ary + oldsize;
10184 for (entp = ary, ent = *ary; ent; ent = *entp) {
134ca3d6 10185 if ((newsize & PTR_TABLE_HASH(ent->oldval)) != i) {
1d7c1841
GS
10186 *entp = ent->next;
10187 ent->next = *curentp;
10188 *curentp = ent;
10189 continue;
10190 }
10191 else
10192 entp = &ent->next;
10193 }
10194 }
10195}
10196
645c22ef
DM
10197/* remove all the entries from a ptr table */
10198
a0739874
DM
10199void
10200Perl_ptr_table_clear(pTHX_ PTR_TBL_t *tbl)
10201{
10202 register PTR_TBL_ENT_t **array;
10203 register PTR_TBL_ENT_t *entry;
a0739874
DM
10204 UV riter = 0;
10205 UV max;
10206
10207 if (!tbl || !tbl->tbl_items) {
10208 return;
10209 }
10210
10211 array = tbl->tbl_ary;
10212 entry = array[0];
10213 max = tbl->tbl_max;
10214
10215 for (;;) {
10216 if (entry) {
4373e329 10217 PTR_TBL_ENT_t *oentry = entry;
a0739874 10218 entry = entry->next;
437a6bf1 10219 del_pte(oentry);
a0739874
DM
10220 }
10221 if (!entry) {
10222 if (++riter > max) {
10223 break;
10224 }
10225 entry = array[riter];
10226 }
10227 }
10228
10229 tbl->tbl_items = 0;
10230}
10231
645c22ef
DM
10232/* clear and free a ptr table */
10233
a0739874
DM
10234void
10235Perl_ptr_table_free(pTHX_ PTR_TBL_t *tbl)
10236{
10237 if (!tbl) {
10238 return;
10239 }
10240 ptr_table_clear(tbl);
10241 Safefree(tbl->tbl_ary);
10242 Safefree(tbl);
10243}
10244
5bd07a3d 10245
83841fad
NIS
10246void
10247Perl_rvpv_dup(pTHX_ SV *dstr, SV *sstr, CLONE_PARAMS* param)
10248{
10249 if (SvROK(sstr)) {
b162af07
SP
10250 SvRV_set(dstr, SvWEAKREF(sstr)
10251 ? sv_dup(SvRV(sstr), param)
10252 : sv_dup_inc(SvRV(sstr), param));
f880fe2f 10253
83841fad 10254 }
3f7c398e 10255 else if (SvPVX_const(sstr)) {
83841fad
NIS
10256 /* Has something there */
10257 if (SvLEN(sstr)) {
68795e93 10258 /* Normal PV - clone whole allocated space */
3f7c398e 10259 SvPV_set(dstr, SAVEPVN(SvPVX_const(sstr), SvLEN(sstr)-1));
d3d0e6f1
NC
10260 if (SvREADONLY(sstr) && SvFAKE(sstr)) {
10261 /* Not that normal - actually sstr is copy on write.
10262 But we are a true, independant SV, so: */
10263 SvREADONLY_off(dstr);
10264 SvFAKE_off(dstr);
10265 }
68795e93 10266 }
83841fad
NIS
10267 else {
10268 /* Special case - not normally malloced for some reason */
ef10be65
NC
10269 if ((SvREADONLY(sstr) && SvFAKE(sstr))) {
10270 /* A "shared" PV - clone it as "shared" PV */
10271 SvPV_set(dstr,
10272 HEK_KEY(hek_dup(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr)),
10273 param)));
83841fad
NIS
10274 }
10275 else {
10276 /* Some other special case - random pointer */
f880fe2f 10277 SvPV_set(dstr, SvPVX(sstr));
d3d0e6f1 10278 }
83841fad
NIS
10279 }
10280 }
10281 else {
10282 /* Copy the Null */
f880fe2f 10283 if (SvTYPE(dstr) == SVt_RV)
b162af07 10284 SvRV_set(dstr, NULL);
f880fe2f
SP
10285 else
10286 SvPV_set(dstr, 0);
83841fad
NIS
10287 }
10288}
10289
662fb8b2
NC
10290/* duplicate an SV of any type (including AV, HV etc) */
10291
1d7c1841 10292SV *
a8fc9800 10293Perl_sv_dup(pTHX_ SV *sstr, CLONE_PARAMS* param)
1d7c1841 10294{
27da23d5 10295 dVAR;
1d7c1841
GS
10296 SV *dstr;
10297
10298 if (!sstr || SvTYPE(sstr) == SVTYPEMASK)
10299 return Nullsv;
10300 /* look for it in the table first */
10301 dstr = (SV*)ptr_table_fetch(PL_ptr_table, sstr);
10302 if (dstr)
10303 return dstr;
10304
0405e91e
AB
10305 if(param->flags & CLONEf_JOIN_IN) {
10306 /** We are joining here so we don't want do clone
10307 something that is bad **/
bfcb3514 10308 const char *hvname;
0405e91e
AB
10309
10310 if(SvTYPE(sstr) == SVt_PVHV &&
bfcb3514 10311 (hvname = HvNAME_get(sstr))) {
0405e91e 10312 /** don't clone stashes if they already exist **/
bfcb3514 10313 HV* old_stash = gv_stashpv(hvname,0);
0405e91e
AB
10314 return (SV*) old_stash;
10315 }
10316 }
10317
1d7c1841
GS
10318 /* create anew and remember what it is */
10319 new_SV(dstr);
fd0854ff
DM
10320
10321#ifdef DEBUG_LEAKING_SCALARS
10322 dstr->sv_debug_optype = sstr->sv_debug_optype;
10323 dstr->sv_debug_line = sstr->sv_debug_line;
10324 dstr->sv_debug_inpad = sstr->sv_debug_inpad;
10325 dstr->sv_debug_cloned = 1;
10326# ifdef NETWARE
10327 dstr->sv_debug_file = savepv(sstr->sv_debug_file);
10328# else
10329 dstr->sv_debug_file = savesharedpv(sstr->sv_debug_file);
10330# endif
10331#endif
10332
1d7c1841
GS
10333 ptr_table_store(PL_ptr_table, sstr, dstr);
10334
10335 /* clone */
10336 SvFLAGS(dstr) = SvFLAGS(sstr);
10337 SvFLAGS(dstr) &= ~SVf_OOK; /* don't propagate OOK hack */
10338 SvREFCNT(dstr) = 0; /* must be before any other dups! */
10339
10340#ifdef DEBUGGING
3f7c398e 10341 if (SvANY(sstr) && PL_watch_pvx && SvPVX_const(sstr) == PL_watch_pvx)
1d7c1841 10342 PerlIO_printf(Perl_debug_log, "watch at %p hit, found string \"%s\"\n",
3f7c398e 10343 PL_watch_pvx, SvPVX_const(sstr));
1d7c1841
GS
10344#endif
10345
9660f481
DM
10346 /* don't clone objects whose class has asked us not to */
10347 if (SvOBJECT(sstr) && ! (SvFLAGS(SvSTASH(sstr)) & SVphv_CLONEABLE)) {
10348 SvFLAGS(dstr) &= ~SVTYPEMASK;
10349 SvOBJECT_off(dstr);
10350 return dstr;
10351 }
10352
1d7c1841
GS
10353 switch (SvTYPE(sstr)) {
10354 case SVt_NULL:
10355 SvANY(dstr) = NULL;
10356 break;
10357 case SVt_IV:
339049b0 10358 SvANY(dstr) = (XPVIV*)((char*)&(dstr->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
45977657 10359 SvIV_set(dstr, SvIVX(sstr));
1d7c1841
GS
10360 break;
10361 case SVt_NV:
10362 SvANY(dstr) = new_XNV();
9d6ce603 10363 SvNV_set(dstr, SvNVX(sstr));
1d7c1841
GS
10364 break;
10365 case SVt_RV:
339049b0 10366 SvANY(dstr) = &(dstr->sv_u.svu_rv);
83841fad 10367 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
1d7c1841 10368 break;
662fb8b2
NC
10369 default:
10370 {
10371 /* These are all the types that need complex bodies allocating. */
10372 size_t new_body_length;
10373 size_t new_body_offset = 0;
10374 void **new_body_arena;
10375 void **new_body_arenaroot;
10376 void *new_body;
10377
10378 switch (SvTYPE(sstr)) {
10379 default:
10380 Perl_croak(aTHX_ "Bizarre SvTYPE [%" IVdf "]",
10381 (IV)SvTYPE(sstr));
10382 break;
10383
10384 case SVt_PVIO:
10385 new_body = new_XPVIO();
10386 new_body_length = sizeof(XPVIO);
10387 break;
10388 case SVt_PVFM:
10389 new_body = new_XPVFM();
10390 new_body_length = sizeof(XPVFM);
10391 break;
10392
10393 case SVt_PVHV:
10394 new_body_arena = (void **) &PL_xpvhv_root;
10395 new_body_arenaroot = (void **) &PL_xpvhv_arenaroot;
10396 new_body_offset = STRUCT_OFFSET(XPVHV, xhv_fill)
10397 - STRUCT_OFFSET(xpvhv_allocated, xhv_fill);
10398 new_body_length = STRUCT_OFFSET(XPVHV, xmg_stash)
10399 + sizeof (((XPVHV*)SvANY(sstr))->xmg_stash)
10400 - new_body_offset;
10401 goto new_body;
10402 case SVt_PVAV:
10403 new_body_arena = (void **) &PL_xpvav_root;
10404 new_body_arenaroot = (void **) &PL_xpvav_arenaroot;
10405 new_body_offset = STRUCT_OFFSET(XPVAV, xav_fill)
10406 - STRUCT_OFFSET(xpvav_allocated, xav_fill);
10407 new_body_length = STRUCT_OFFSET(XPVHV, xmg_stash)
10408 + sizeof (((XPVHV*)SvANY(sstr))->xmg_stash)
10409 - new_body_offset;
10410 goto new_body;
10411 case SVt_PVBM:
10412 new_body_length = sizeof(XPVBM);
10413 new_body_arena = (void **) &PL_xpvbm_root;
10414 new_body_arenaroot = (void **) &PL_xpvbm_arenaroot;
10415 goto new_body;
10416 case SVt_PVGV:
10417 if (GvUNIQUE((GV*)sstr)) {
0abe3f7c 10418 /* Do sharing here. */
662fb8b2
NC
10419 }
10420 new_body_length = sizeof(XPVGV);
10421 new_body_arena = (void **) &PL_xpvgv_root;
10422 new_body_arenaroot = (void **) &PL_xpvgv_arenaroot;
10423 goto new_body;
10424 case SVt_PVCV:
10425 new_body_length = sizeof(XPVCV);
10426 new_body_arena = (void **) &PL_xpvcv_root;
10427 new_body_arenaroot = (void **) &PL_xpvcv_arenaroot;
10428 goto new_body;
10429 case SVt_PVLV:
10430 new_body_length = sizeof(XPVLV);
10431 new_body_arena = (void **) &PL_xpvlv_root;
10432 new_body_arenaroot = (void **) &PL_xpvlv_arenaroot;
10433 goto new_body;
10434 case SVt_PVMG:
10435 new_body_length = sizeof(XPVMG);
10436 new_body_arena = (void **) &PL_xpvmg_root;
10437 new_body_arenaroot = (void **) &PL_xpvmg_arenaroot;
10438 goto new_body;
10439 case SVt_PVNV:
10440 new_body_length = sizeof(XPVNV);
10441 new_body_arena = (void **) &PL_xpvnv_root;
10442 new_body_arenaroot = (void **) &PL_xpvnv_arenaroot;
10443 goto new_body;
10444 case SVt_PVIV:
10445 new_body_offset = STRUCT_OFFSET(XPVIV, xpv_cur)
10446 - STRUCT_OFFSET(xpviv_allocated, xpv_cur);
10447 new_body_length = sizeof(XPVIV) - new_body_offset;
10448 new_body_arena = (void **) &PL_xpviv_root;
10449 new_body_arenaroot = (void **) &PL_xpviv_arenaroot;
10450 goto new_body;
10451 case SVt_PV:
10452 new_body_offset = STRUCT_OFFSET(XPV, xpv_cur)
10453 - STRUCT_OFFSET(xpv_allocated, xpv_cur);
10454 new_body_length = sizeof(XPV) - new_body_offset;
10455 new_body_arena = (void **) &PL_xpv_root;
10456 new_body_arenaroot = (void **) &PL_xpv_arenaroot;
10457 new_body:
10458 assert(new_body_length);
10459#ifndef PURIFY
08742458
NC
10460 new_body_inline(new_body, new_body_arenaroot, new_body_arena,
10461 new_body_length);
10462 new_body = (void*)((char*)new_body - new_body_offset);
662fb8b2
NC
10463#else
10464 /* We always allocated the full length item with PURIFY */
10465 new_body_length += new_body_offset;
10466 new_body_offset = 0;
10467 new_body = my_safemalloc(new_body_length);
5bd07a3d 10468#endif
1d7c1841 10469 }
662fb8b2
NC
10470 assert(new_body);
10471 SvANY(dstr) = new_body;
10472
10473 Copy(((char*)SvANY(sstr)) + new_body_offset,
10474 ((char*)SvANY(dstr)) + new_body_offset,
10475 new_body_length, char);
10476
10477 if (SvTYPE(sstr) != SVt_PVAV && SvTYPE(sstr) != SVt_PVHV)
10478 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
10479
10480 /* The Copy above means that all the source (unduplicated) pointers
10481 are now in the destination. We can check the flags and the
10482 pointers in either, but it's possible that there's less cache
10483 missing by always going for the destination.
10484 FIXME - instrument and check that assumption */
10485 if (SvTYPE(sstr) >= SVt_PVMG) {
10486 if (SvMAGIC(dstr))
10487 SvMAGIC_set(dstr, mg_dup(SvMAGIC(dstr), param));
10488 if (SvSTASH(dstr))
10489 SvSTASH_set(dstr, hv_dup_inc(SvSTASH(dstr), param));
1d7c1841 10490 }
662fb8b2
NC
10491
10492 switch (SvTYPE(sstr)) {
10493 case SVt_PV:
10494 break;
10495 case SVt_PVIV:
10496 break;
10497 case SVt_PVNV:
10498 break;
10499 case SVt_PVMG:
10500 break;
10501 case SVt_PVBM:
10502 break;
10503 case SVt_PVLV:
10504 /* XXX LvTARGOFF sometimes holds PMOP* when DEBUGGING */
10505 if (LvTYPE(dstr) == 't') /* for tie: unrefcnted fake (SV**) */
10506 LvTARG(dstr) = dstr;
10507 else if (LvTYPE(dstr) == 'T') /* for tie: fake HE */
10508 LvTARG(dstr) = (SV*)he_dup((HE*)LvTARG(dstr), 0, param);
10509 else
10510 LvTARG(dstr) = sv_dup_inc(LvTARG(dstr), param);
10511 break;
10512 case SVt_PVGV:
10513 GvNAME(dstr) = SAVEPVN(GvNAME(dstr), GvNAMELEN(dstr));
e15faf7d
NC
10514 GvSTASH(dstr) = hv_dup(GvSTASH(dstr), param);
10515 /* Don't call sv_add_backref here as it's going to be created
10516 as part of the magic cloning of the symbol table. */
662fb8b2
NC
10517 GvGP(dstr) = gp_dup(GvGP(dstr), param);
10518 (void)GpREFCNT_inc(GvGP(dstr));
10519 break;
10520 case SVt_PVIO:
10521 IoIFP(dstr) = fp_dup(IoIFP(dstr), IoTYPE(dstr), param);
10522 if (IoOFP(dstr) == IoIFP(sstr))
10523 IoOFP(dstr) = IoIFP(dstr);
10524 else
10525 IoOFP(dstr) = fp_dup(IoOFP(dstr), IoTYPE(dstr), param);
10526 /* PL_rsfp_filters entries have fake IoDIRP() */
10527 if (IoDIRP(dstr) && !(IoFLAGS(dstr) & IOf_FAKE_DIRP))
10528 IoDIRP(dstr) = dirp_dup(IoDIRP(dstr));
10529 if(IoFLAGS(dstr) & IOf_FAKE_DIRP) {
10530 /* I have no idea why fake dirp (rsfps)
10531 should be treated differently but otherwise
10532 we end up with leaks -- sky*/
10533 IoTOP_GV(dstr) = gv_dup_inc(IoTOP_GV(dstr), param);
10534 IoFMT_GV(dstr) = gv_dup_inc(IoFMT_GV(dstr), param);
10535 IoBOTTOM_GV(dstr) = gv_dup_inc(IoBOTTOM_GV(dstr), param);
10536 } else {
10537 IoTOP_GV(dstr) = gv_dup(IoTOP_GV(dstr), param);
10538 IoFMT_GV(dstr) = gv_dup(IoFMT_GV(dstr), param);
10539 IoBOTTOM_GV(dstr) = gv_dup(IoBOTTOM_GV(dstr), param);
10540 }
10541 IoTOP_NAME(dstr) = SAVEPV(IoTOP_NAME(dstr));
10542 IoFMT_NAME(dstr) = SAVEPV(IoFMT_NAME(dstr));
10543 IoBOTTOM_NAME(dstr) = SAVEPV(IoBOTTOM_NAME(dstr));
10544 break;
10545 case SVt_PVAV:
10546 if (AvARRAY((AV*)sstr)) {
10547 SV **dst_ary, **src_ary;
10548 SSize_t items = AvFILLp((AV*)sstr) + 1;
10549
10550 src_ary = AvARRAY((AV*)sstr);
a02a5408 10551 Newxz(dst_ary, AvMAX((AV*)sstr)+1, SV*);
662fb8b2
NC
10552 ptr_table_store(PL_ptr_table, src_ary, dst_ary);
10553 SvPV_set(dstr, (char*)dst_ary);
10554 AvALLOC((AV*)dstr) = dst_ary;
10555 if (AvREAL((AV*)sstr)) {
10556 while (items-- > 0)
10557 *dst_ary++ = sv_dup_inc(*src_ary++, param);
10558 }
10559 else {
10560 while (items-- > 0)
10561 *dst_ary++ = sv_dup(*src_ary++, param);
10562 }
10563 items = AvMAX((AV*)sstr) - AvFILLp((AV*)sstr);
10564 while (items-- > 0) {
10565 *dst_ary++ = &PL_sv_undef;
10566 }
bfcb3514 10567 }
662fb8b2
NC
10568 else {
10569 SvPV_set(dstr, Nullch);
10570 AvALLOC((AV*)dstr) = (SV**)NULL;
b79f7545 10571 }
662fb8b2
NC
10572 break;
10573 case SVt_PVHV:
10574 {
10575 HEK *hvname = 0;
10576
10577 if (HvARRAY((HV*)sstr)) {
10578 STRLEN i = 0;
10579 const bool sharekeys = !!HvSHAREKEYS(sstr);
10580 XPVHV * const dxhv = (XPVHV*)SvANY(dstr);
10581 XPVHV * const sxhv = (XPVHV*)SvANY(sstr);
10582 char *darray;
a02a5408 10583 Newx(darray, PERL_HV_ARRAY_ALLOC_BYTES(dxhv->xhv_max+1)
662fb8b2
NC
10584 + (SvOOK(sstr) ? sizeof(struct xpvhv_aux) : 0),
10585 char);
10586 HvARRAY(dstr) = (HE**)darray;
10587 while (i <= sxhv->xhv_max) {
10588 HE *source = HvARRAY(sstr)[i];
10589 HvARRAY(dstr)[i] = source
10590 ? he_dup(source, sharekeys, param) : 0;
10591 ++i;
10592 }
10593 if (SvOOK(sstr)) {
10594 struct xpvhv_aux *saux = HvAUX(sstr);
10595 struct xpvhv_aux *daux = HvAUX(dstr);
10596 /* This flag isn't copied. */
10597 /* SvOOK_on(hv) attacks the IV flags. */
10598 SvFLAGS(dstr) |= SVf_OOK;
10599
10600 hvname = saux->xhv_name;
dd690478
NC
10601 daux->xhv_name
10602 = hvname ? hek_dup(hvname, param) : hvname;
662fb8b2
NC
10603
10604 daux->xhv_riter = saux->xhv_riter;
10605 daux->xhv_eiter = saux->xhv_eiter
dd690478
NC
10606 ? he_dup(saux->xhv_eiter,
10607 (bool)!!HvSHAREKEYS(sstr), param) : 0;
662fb8b2
NC
10608 }
10609 }
10610 else {
10611 SvPV_set(dstr, Nullch);
10612 }
10613 /* Record stashes for possible cloning in Perl_clone(). */
10614 if(hvname)
10615 av_push(param->stashes, dstr);
10616 }
10617 break;
10618 case SVt_PVFM:
10619 case SVt_PVCV:
10620 /* NOTE: not refcounted */
10621 CvSTASH(dstr) = hv_dup(CvSTASH(dstr), param);
10622 OP_REFCNT_LOCK;
10623 CvROOT(dstr) = OpREFCNT_inc(CvROOT(dstr));
10624 OP_REFCNT_UNLOCK;
10625 if (CvCONST(dstr)) {
10626 CvXSUBANY(dstr).any_ptr = GvUNIQUE(CvGV(dstr)) ?
10627 SvREFCNT_inc(CvXSUBANY(dstr).any_ptr) :
10628 sv_dup_inc((SV *)CvXSUBANY(dstr).any_ptr, param);
10629 }
10630 /* don't dup if copying back - CvGV isn't refcounted, so the
10631 * duped GV may never be freed. A bit of a hack! DAPM */
10632 CvGV(dstr) = (param->flags & CLONEf_JOIN_IN) ?
10633 Nullgv : gv_dup(CvGV(dstr), param) ;
10634 if (!(param->flags & CLONEf_COPY_STACKS)) {
10635 CvDEPTH(dstr) = 0;
10636 }
10637 PAD_DUP(CvPADLIST(dstr), CvPADLIST(sstr), param);
10638 CvOUTSIDE(dstr) =
10639 CvWEAKOUTSIDE(sstr)
10640 ? cv_dup( CvOUTSIDE(dstr), param)
10641 : cv_dup_inc(CvOUTSIDE(dstr), param);
10642 if (!CvXSUB(dstr))
10643 CvFILE(dstr) = SAVEPV(CvFILE(dstr));
10644 break;
bfcb3514 10645 }
1d7c1841 10646 }
1d7c1841
GS
10647 }
10648
10649 if (SvOBJECT(dstr) && SvTYPE(dstr) != SVt_PVIO)
10650 ++PL_sv_objcount;
10651
10652 return dstr;
d2d73c3e 10653 }
1d7c1841 10654
645c22ef
DM
10655/* duplicate a context */
10656
1d7c1841 10657PERL_CONTEXT *
a8fc9800 10658Perl_cx_dup(pTHX_ PERL_CONTEXT *cxs, I32 ix, I32 max, CLONE_PARAMS* param)
1d7c1841
GS
10659{
10660 PERL_CONTEXT *ncxs;
10661
10662 if (!cxs)
10663 return (PERL_CONTEXT*)NULL;
10664
10665 /* look for it in the table first */
10666 ncxs = (PERL_CONTEXT*)ptr_table_fetch(PL_ptr_table, cxs);
10667 if (ncxs)
10668 return ncxs;
10669
10670 /* create anew and remember what it is */
a02a5408 10671 Newxz(ncxs, max + 1, PERL_CONTEXT);
1d7c1841
GS
10672 ptr_table_store(PL_ptr_table, cxs, ncxs);
10673
10674 while (ix >= 0) {
10675 PERL_CONTEXT *cx = &cxs[ix];
10676 PERL_CONTEXT *ncx = &ncxs[ix];
10677 ncx->cx_type = cx->cx_type;
10678 if (CxTYPE(cx) == CXt_SUBST) {
10679 Perl_croak(aTHX_ "Cloning substitution context is unimplemented");
10680 }
10681 else {
10682 ncx->blk_oldsp = cx->blk_oldsp;
10683 ncx->blk_oldcop = cx->blk_oldcop;
1d7c1841
GS
10684 ncx->blk_oldmarksp = cx->blk_oldmarksp;
10685 ncx->blk_oldscopesp = cx->blk_oldscopesp;
10686 ncx->blk_oldpm = cx->blk_oldpm;
10687 ncx->blk_gimme = cx->blk_gimme;
10688 switch (CxTYPE(cx)) {
10689 case CXt_SUB:
10690 ncx->blk_sub.cv = (cx->blk_sub.olddepth == 0
d2d73c3e
AB
10691 ? cv_dup_inc(cx->blk_sub.cv, param)
10692 : cv_dup(cx->blk_sub.cv,param));
1d7c1841 10693 ncx->blk_sub.argarray = (cx->blk_sub.hasargs
d2d73c3e 10694 ? av_dup_inc(cx->blk_sub.argarray, param)
1d7c1841 10695 : Nullav);
d2d73c3e 10696 ncx->blk_sub.savearray = av_dup_inc(cx->blk_sub.savearray, param);
1d7c1841
GS
10697 ncx->blk_sub.olddepth = cx->blk_sub.olddepth;
10698 ncx->blk_sub.hasargs = cx->blk_sub.hasargs;
10699 ncx->blk_sub.lval = cx->blk_sub.lval;
f39bc417 10700 ncx->blk_sub.retop = cx->blk_sub.retop;
1d7c1841
GS
10701 break;
10702 case CXt_EVAL:
10703 ncx->blk_eval.old_in_eval = cx->blk_eval.old_in_eval;
10704 ncx->blk_eval.old_op_type = cx->blk_eval.old_op_type;
b47cad08 10705 ncx->blk_eval.old_namesv = sv_dup_inc(cx->blk_eval.old_namesv, param);
1d7c1841 10706 ncx->blk_eval.old_eval_root = cx->blk_eval.old_eval_root;
d2d73c3e 10707 ncx->blk_eval.cur_text = sv_dup(cx->blk_eval.cur_text, param);
f39bc417 10708 ncx->blk_eval.retop = cx->blk_eval.retop;
1d7c1841
GS
10709 break;
10710 case CXt_LOOP:
10711 ncx->blk_loop.label = cx->blk_loop.label;
10712 ncx->blk_loop.resetsp = cx->blk_loop.resetsp;
10713 ncx->blk_loop.redo_op = cx->blk_loop.redo_op;
10714 ncx->blk_loop.next_op = cx->blk_loop.next_op;
10715 ncx->blk_loop.last_op = cx->blk_loop.last_op;
10716 ncx->blk_loop.iterdata = (CxPADLOOP(cx)
10717 ? cx->blk_loop.iterdata
d2d73c3e 10718 : gv_dup((GV*)cx->blk_loop.iterdata, param));
f3548bdc
DM
10719 ncx->blk_loop.oldcomppad
10720 = (PAD*)ptr_table_fetch(PL_ptr_table,
10721 cx->blk_loop.oldcomppad);
d2d73c3e
AB
10722 ncx->blk_loop.itersave = sv_dup_inc(cx->blk_loop.itersave, param);
10723 ncx->blk_loop.iterlval = sv_dup_inc(cx->blk_loop.iterlval, param);
10724 ncx->blk_loop.iterary = av_dup_inc(cx->blk_loop.iterary, param);
1d7c1841
GS
10725 ncx->blk_loop.iterix = cx->blk_loop.iterix;
10726 ncx->blk_loop.itermax = cx->blk_loop.itermax;
10727 break;
10728 case CXt_FORMAT:
d2d73c3e
AB
10729 ncx->blk_sub.cv = cv_dup(cx->blk_sub.cv, param);
10730 ncx->blk_sub.gv = gv_dup(cx->blk_sub.gv, param);
10731 ncx->blk_sub.dfoutgv = gv_dup_inc(cx->blk_sub.dfoutgv, param);
1d7c1841 10732 ncx->blk_sub.hasargs = cx->blk_sub.hasargs;
f39bc417 10733 ncx->blk_sub.retop = cx->blk_sub.retop;
1d7c1841
GS
10734 break;
10735 case CXt_BLOCK:
10736 case CXt_NULL:
10737 break;
10738 }
10739 }
10740 --ix;
10741 }
10742 return ncxs;
10743}
10744
645c22ef
DM
10745/* duplicate a stack info structure */
10746
1d7c1841 10747PERL_SI *
a8fc9800 10748Perl_si_dup(pTHX_ PERL_SI *si, CLONE_PARAMS* param)
1d7c1841
GS
10749{
10750 PERL_SI *nsi;
10751
10752 if (!si)
10753 return (PERL_SI*)NULL;
10754
10755 /* look for it in the table first */
10756 nsi = (PERL_SI*)ptr_table_fetch(PL_ptr_table, si);
10757 if (nsi)
10758 return nsi;
10759
10760 /* create anew and remember what it is */
a02a5408 10761 Newxz(nsi, 1, PERL_SI);
1d7c1841
GS
10762 ptr_table_store(PL_ptr_table, si, nsi);
10763
d2d73c3e 10764 nsi->si_stack = av_dup_inc(si->si_stack, param);
1d7c1841
GS
10765 nsi->si_cxix = si->si_cxix;
10766 nsi->si_cxmax = si->si_cxmax;
d2d73c3e 10767 nsi->si_cxstack = cx_dup(si->si_cxstack, si->si_cxix, si->si_cxmax, param);
1d7c1841 10768 nsi->si_type = si->si_type;
d2d73c3e
AB
10769 nsi->si_prev = si_dup(si->si_prev, param);
10770 nsi->si_next = si_dup(si->si_next, param);
1d7c1841
GS
10771 nsi->si_markoff = si->si_markoff;
10772
10773 return nsi;
10774}
10775
/* Save-stack slot accessors.  ss is an array of ANY and ix an index
 * lvalue.  The POP* forms pre-decrement ix and yield the slot it then
 * designates; the TOP* forms yield the slot at the current ix without
 * changing it. */
#define POPINT(ss,ix)   ((ss)[--(ix)].any_i32)
#define POPLONG(ss,ix)  ((ss)[--(ix)].any_long)
#define POPIV(ss,ix)    ((ss)[--(ix)].any_iv)
#define POPBOOL(ss,ix)  ((ss)[--(ix)].any_bool)
#define POPPTR(ss,ix)   ((ss)[--(ix)].any_ptr)
#define POPDPTR(ss,ix)  ((ss)[--(ix)].any_dptr)
#define POPDXPTR(ss,ix) ((ss)[--(ix)].any_dxptr)

#define TOPINT(ss,ix)   ((ss)[ix].any_i32)
#define TOPLONG(ss,ix)  ((ss)[ix].any_long)
#define TOPIV(ss,ix)    ((ss)[ix].any_iv)
#define TOPBOOL(ss,ix)  ((ss)[ix].any_bool)
#define TOPPTR(ss,ix)   ((ss)[ix].any_ptr)
#define TOPDPTR(ss,ix)  ((ss)[ix].any_dptr)
#define TOPDXPTR(ss,ix) ((ss)[ix].any_dxptr)

/* XXXXX todo */
/* strings are simply copied; SV* slots are mapped with any_dup() */
#define pv_dup_inc(p)   SAVEPV(p)
#define pv_dup(p)       SAVEPV(p)
#define svp_dup_inc(p,pp)       any_dup(p,pp)
645c22ef
DM
10796/* map any object to the new equivent - either something in the
10797 * ptr table, or something in the interpreter structure
10798 */
10799
1d7c1841 10800void *
53c1dcc0 10801Perl_any_dup(pTHX_ void *v, const PerlInterpreter *proto_perl)
1d7c1841
GS
10802{
10803 void *ret;
10804
10805 if (!v)
10806 return (void*)NULL;
10807
10808 /* look for it in the table first */
10809 ret = ptr_table_fetch(PL_ptr_table, v);
10810 if (ret)
10811 return ret;
10812
10813 /* see if it is part of the interpreter structure */
10814 if (v >= (void*)proto_perl && v < (void*)(proto_perl+1))
acfe0abc 10815 ret = (void*)(((char*)aTHX) + (((char*)v) - (char*)proto_perl));
05ec9bb3 10816 else {
1d7c1841 10817 ret = v;
05ec9bb3 10818 }
1d7c1841
GS
10819
10820 return ret;
10821}
10822
645c22ef
DM
10823/* duplicate the save stack */
10824
1d7c1841 10825ANY *
a8fc9800 10826Perl_ss_dup(pTHX_ PerlInterpreter *proto_perl, CLONE_PARAMS* param)
1d7c1841 10827{
53c1dcc0
AL
10828 ANY * const ss = proto_perl->Tsavestack;
10829 const I32 max = proto_perl->Tsavestack_max;
10830 I32 ix = proto_perl->Tsavestack_ix;
1d7c1841
GS
10831 ANY *nss;
10832 SV *sv;
10833 GV *gv;
10834 AV *av;
10835 HV *hv;
10836 void* ptr;
10837 int intval;
10838 long longval;
10839 GP *gp;
10840 IV iv;
c4e33207 10841 char *c = NULL;
1d7c1841 10842 void (*dptr) (void*);
acfe0abc 10843 void (*dxptr) (pTHX_ void*);
1d7c1841 10844
a02a5408 10845 Newxz(nss, max, ANY);
1d7c1841
GS
10846
10847 while (ix > 0) {
b464bac0 10848 I32 i = POPINT(ss,ix);
1d7c1841
GS
10849 TOPINT(nss,ix) = i;
10850 switch (i) {
10851 case SAVEt_ITEM: /* normal string */
10852 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10853 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10854 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10855 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10856 break;
10857 case SAVEt_SV: /* scalar reference */
10858 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10859 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10860 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10861 TOPPTR(nss,ix) = gv_dup_inc(gv, param);
1d7c1841 10862 break;
f4dd75d9
GS
10863 case SAVEt_GENERIC_PVREF: /* generic char* */
10864 c = (char*)POPPTR(ss,ix);
10865 TOPPTR(nss,ix) = pv_dup(c);
10866 ptr = POPPTR(ss,ix);
10867 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10868 break;
05ec9bb3
NIS
10869 case SAVEt_SHARED_PVREF: /* char* in shared space */
10870 c = (char*)POPPTR(ss,ix);
10871 TOPPTR(nss,ix) = savesharedpv(c);
10872 ptr = POPPTR(ss,ix);
10873 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10874 break;
1d7c1841
GS
10875 case SAVEt_GENERIC_SVREF: /* generic sv */
10876 case SAVEt_SVREF: /* scalar reference */
10877 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10878 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10879 ptr = POPPTR(ss,ix);
10880 TOPPTR(nss,ix) = svp_dup_inc((SV**)ptr, proto_perl);/* XXXXX */
10881 break;
10882 case SAVEt_AV: /* array reference */
10883 av = (AV*)POPPTR(ss,ix);
d2d73c3e 10884 TOPPTR(nss,ix) = av_dup_inc(av, param);
1d7c1841 10885 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10886 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10887 break;
10888 case SAVEt_HV: /* hash reference */
10889 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 10890 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841 10891 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10892 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10893 break;
10894 case SAVEt_INT: /* int reference */
10895 ptr = POPPTR(ss,ix);
10896 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10897 intval = (int)POPINT(ss,ix);
10898 TOPINT(nss,ix) = intval;
10899 break;
10900 case SAVEt_LONG: /* long reference */
10901 ptr = POPPTR(ss,ix);
10902 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10903 longval = (long)POPLONG(ss,ix);
10904 TOPLONG(nss,ix) = longval;
10905 break;
10906 case SAVEt_I32: /* I32 reference */
10907 case SAVEt_I16: /* I16 reference */
10908 case SAVEt_I8: /* I8 reference */
10909 ptr = POPPTR(ss,ix);
10910 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10911 i = POPINT(ss,ix);
10912 TOPINT(nss,ix) = i;
10913 break;
10914 case SAVEt_IV: /* IV reference */
10915 ptr = POPPTR(ss,ix);
10916 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10917 iv = POPIV(ss,ix);
10918 TOPIV(nss,ix) = iv;
10919 break;
10920 case SAVEt_SPTR: /* SV* reference */
10921 ptr = POPPTR(ss,ix);
10922 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10923 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10924 TOPPTR(nss,ix) = sv_dup(sv, param);
1d7c1841
GS
10925 break;
10926 case SAVEt_VPTR: /* random* reference */
10927 ptr = POPPTR(ss,ix);
10928 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10929 ptr = POPPTR(ss,ix);
10930 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10931 break;
10932 case SAVEt_PPTR: /* char* reference */
10933 ptr = POPPTR(ss,ix);
10934 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10935 c = (char*)POPPTR(ss,ix);
10936 TOPPTR(nss,ix) = pv_dup(c);
10937 break;
10938 case SAVEt_HPTR: /* HV* reference */
10939 ptr = POPPTR(ss,ix);
10940 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10941 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 10942 TOPPTR(nss,ix) = hv_dup(hv, param);
1d7c1841
GS
10943 break;
10944 case SAVEt_APTR: /* AV* reference */
10945 ptr = POPPTR(ss,ix);
10946 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10947 av = (AV*)POPPTR(ss,ix);
d2d73c3e 10948 TOPPTR(nss,ix) = av_dup(av, param);
1d7c1841
GS
10949 break;
10950 case SAVEt_NSTAB:
10951 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10952 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10953 break;
10954 case SAVEt_GP: /* scalar reference */
10955 gp = (GP*)POPPTR(ss,ix);
d2d73c3e 10956 TOPPTR(nss,ix) = gp = gp_dup(gp, param);
1d7c1841
GS
10957 (void)GpREFCNT_inc(gp);
10958 gv = (GV*)POPPTR(ss,ix);
2ed3c8fc 10959 TOPPTR(nss,ix) = gv_dup_inc(gv, param);
1d7c1841
GS
10960 c = (char*)POPPTR(ss,ix);
10961 TOPPTR(nss,ix) = pv_dup(c);
10962 iv = POPIV(ss,ix);
10963 TOPIV(nss,ix) = iv;
10964 iv = POPIV(ss,ix);
10965 TOPIV(nss,ix) = iv;
10966 break;
10967 case SAVEt_FREESV:
26d9b02f 10968 case SAVEt_MORTALIZESV:
1d7c1841 10969 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10970 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10971 break;
10972 case SAVEt_FREEOP:
10973 ptr = POPPTR(ss,ix);
10974 if (ptr && (((OP*)ptr)->op_private & OPpREFCOUNTED)) {
10975 /* these are assumed to be refcounted properly */
53c1dcc0 10976 OP *o;
1d7c1841
GS
10977 switch (((OP*)ptr)->op_type) {
10978 case OP_LEAVESUB:
10979 case OP_LEAVESUBLV:
10980 case OP_LEAVEEVAL:
10981 case OP_LEAVE:
10982 case OP_SCOPE:
10983 case OP_LEAVEWRITE:
e977893f
GS
10984 TOPPTR(nss,ix) = ptr;
10985 o = (OP*)ptr;
10986 OpREFCNT_inc(o);
1d7c1841
GS
10987 break;
10988 default:
10989 TOPPTR(nss,ix) = Nullop;
10990 break;
10991 }
10992 }
10993 else
10994 TOPPTR(nss,ix) = Nullop;
10995 break;
10996 case SAVEt_FREEPV:
10997 c = (char*)POPPTR(ss,ix);
10998 TOPPTR(nss,ix) = pv_dup_inc(c);
10999 break;
11000 case SAVEt_CLEARSV:
11001 longval = POPLONG(ss,ix);
11002 TOPLONG(nss,ix) = longval;
11003 break;
11004 case SAVEt_DELETE:
11005 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 11006 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841
GS
11007 c = (char*)POPPTR(ss,ix);
11008 TOPPTR(nss,ix) = pv_dup_inc(c);
11009 i = POPINT(ss,ix);
11010 TOPINT(nss,ix) = i;
11011 break;
11012 case SAVEt_DESTRUCTOR:
11013 ptr = POPPTR(ss,ix);
11014 TOPPTR(nss,ix) = any_dup(ptr, proto_perl); /* XXX quite arbitrary */
11015 dptr = POPDPTR(ss,ix);
8141890a
JH
11016 TOPDPTR(nss,ix) = DPTR2FPTR(void (*)(void*),
11017 any_dup(FPTR2DPTR(void *, dptr),
11018 proto_perl));
1d7c1841
GS
11019 break;
11020 case SAVEt_DESTRUCTOR_X:
11021 ptr = POPPTR(ss,ix);
11022 TOPPTR(nss,ix) = any_dup(ptr, proto_perl); /* XXX quite arbitrary */
11023 dxptr = POPDXPTR(ss,ix);
8141890a
JH
11024 TOPDXPTR(nss,ix) = DPTR2FPTR(void (*)(pTHX_ void*),
11025 any_dup(FPTR2DPTR(void *, dxptr),
11026 proto_perl));
1d7c1841
GS
11027 break;
11028 case SAVEt_REGCONTEXT:
11029 case SAVEt_ALLOC:
11030 i = POPINT(ss,ix);
11031 TOPINT(nss,ix) = i;
11032 ix -= i;
11033 break;
11034 case SAVEt_STACK_POS: /* Position on Perl stack */
11035 i = POPINT(ss,ix);
11036 TOPINT(nss,ix) = i;
11037 break;
11038 case SAVEt_AELEM: /* array element */
11039 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11040 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
11041 i = POPINT(ss,ix);
11042 TOPINT(nss,ix) = i;
11043 av = (AV*)POPPTR(ss,ix);
d2d73c3e 11044 TOPPTR(nss,ix) = av_dup_inc(av, param);
1d7c1841
GS
11045 break;
11046 case SAVEt_HELEM: /* hash element */
11047 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11048 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 11049 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11050 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 11051 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 11052 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841
GS
11053 break;
11054 case SAVEt_OP:
11055 ptr = POPPTR(ss,ix);
11056 TOPPTR(nss,ix) = ptr;
11057 break;
11058 case SAVEt_HINTS:
11059 i = POPINT(ss,ix);
11060 TOPINT(nss,ix) = i;
11061 break;
c4410b1b
GS
11062 case SAVEt_COMPPAD:
11063 av = (AV*)POPPTR(ss,ix);
58ed4fbe 11064 TOPPTR(nss,ix) = av_dup(av, param);
c4410b1b 11065 break;
c3564e5c
GS
11066 case SAVEt_PADSV:
11067 longval = (long)POPLONG(ss,ix);
11068 TOPLONG(nss,ix) = longval;
11069 ptr = POPPTR(ss,ix);
11070 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
11071 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 11072 TOPPTR(nss,ix) = sv_dup(sv, param);
c3564e5c 11073 break;
a1bb4754 11074 case SAVEt_BOOL:
38d8b13e 11075 ptr = POPPTR(ss,ix);
b9609c01 11076 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
38d8b13e 11077 longval = (long)POPBOOL(ss,ix);
b9609c01 11078 TOPBOOL(nss,ix) = (bool)longval;
a1bb4754 11079 break;
8bd2680e
MHM
11080 case SAVEt_SET_SVFLAGS:
11081 i = POPINT(ss,ix);
11082 TOPINT(nss,ix) = i;
11083 i = POPINT(ss,ix);
11084 TOPINT(nss,ix) = i;
11085 sv = (SV*)POPPTR(ss,ix);
11086 TOPPTR(nss,ix) = sv_dup(sv, param);
11087 break;
1d7c1841
GS
11088 default:
11089 Perl_croak(aTHX_ "panic: ss_dup inconsistency");
11090 }
11091 }
11092
11093 return nss;
11094}
11095
9660f481
DM
11096
11097/* if sv is a stash, call $class->CLONE_SKIP(), and set the SVphv_CLONEABLE
11098 * flag to the result. This is done for each stash before cloning starts,
11099 * so we know which stashes want their objects cloned */
11100
11101static void
11102do_mark_cloneable_stash(pTHX_ SV *sv)
11103{
53c1dcc0 11104 const HEK * const hvname = HvNAME_HEK((HV*)sv);
bfcb3514 11105 if (hvname) {
53c1dcc0 11106 GV* const cloner = gv_fetchmethod_autoload((HV*)sv, "CLONE_SKIP", 0);
9660f481
DM
11107 SvFLAGS(sv) |= SVphv_CLONEABLE; /* clone objects by default */
11108 if (cloner && GvCV(cloner)) {
11109 dSP;
11110 UV status;
11111
11112 ENTER;
11113 SAVETMPS;
11114 PUSHMARK(SP);
84bda14a 11115 XPUSHs(sv_2mortal(newSVhek(hvname)));
9660f481
DM
11116 PUTBACK;
11117 call_sv((SV*)GvCV(cloner), G_SCALAR);
11118 SPAGAIN;
11119 status = POPu;
11120 PUTBACK;
11121 FREETMPS;
11122 LEAVE;
11123 if (status)
11124 SvFLAGS(sv) &= ~SVphv_CLONEABLE;
11125 }
11126 }
11127}
11128
11129
11130
645c22ef
DM
11131/*
11132=for apidoc perl_clone
11133
11134Create and return a new interpreter by cloning the current one.
11135
4be49ee6 11136perl_clone takes these flags as parameters:
6a78b4db 11137
7a5fa8a2
NIS
CLONEf_COPY_STACKS - is used to copy the stacks as well. Without it
we only clone the data and zero the stacks; with it we copy the stacks
and the new perl interpreter is ready to run at the exact same point
as the previous one. The pseudo-fork code uses COPY_STACKS while
threads->new doesn't.
11144
11145CLONEf_KEEP_PTR_TABLE
7a5fa8a2
NIS
11146perl_clone keeps a ptr_table with the pointer of the old
11147variable as a key and the new variable as a value,
11148this allows it to check if something has been cloned and not
11149clone it again but rather just use the value and increase the
11150refcount. If KEEP_PTR_TABLE is not set then perl_clone will kill
11151the ptr_table using the function
11152C<ptr_table_free(PL_ptr_table); PL_ptr_table = NULL;>.
11153A reason to keep it around is if you want to dup some of your own
11154variables that are outside the graph perl scans; an example of this
6a78b4db
AB
11155code is in threads.xs create
11156
11157CLONEf_CLONE_HOST
7a5fa8a2
NIS
11158This is a win32 thing, it is ignored on unix, it tells perl's
11159win32host code (which is c++) to clone itself, this is needed on
11160win32 if you want to run two threads at the same time,
11161if you just want to do some stuff in a separate perl interpreter
11162and then throw it away and return to the original one,
6a78b4db
AB
11163you don't need to do anything.
11164
645c22ef
DM
11165=cut
11166*/
11167
11168/* XXX the above needs expanding by someone who actually understands it ! */
3fc56081
NK
/* Forward declaration of the host-cloning entry point.  perl_clone() below
 * hands off to it when CLONEf_CLONE_HOST is set in flags and
 * PERL_IMPLICIT_SYS is defined; its definition is not in this part of the
 * file. */
11169EXTERN_C PerlInterpreter *
11170perl_clone_host(PerlInterpreter* proto_perl, UV flags);
645c22ef 11171
1d7c1841
GS
11172PerlInterpreter *
11173perl_clone(PerlInterpreter *proto_perl, UV flags)
11174{
27da23d5 11175 dVAR;
1d7c1841 11176#ifdef PERL_IMPLICIT_SYS
c43294b8
AB
11177
11178 /* perlhost.h so we need to call into it
11179 to clone the host, CPerlHost should have a c interface, sky */
11180
11181 if (flags & CLONEf_CLONE_HOST) {
11182 return perl_clone_host(proto_perl,flags);
11183 }
11184 return perl_clone_using(proto_perl, flags,
1d7c1841
GS
11185 proto_perl->IMem,
11186 proto_perl->IMemShared,
11187 proto_perl->IMemParse,
11188 proto_perl->IEnv,
11189 proto_perl->IStdIO,
11190 proto_perl->ILIO,
11191 proto_perl->IDir,
11192 proto_perl->ISock,
11193 proto_perl->IProc);
11194}
11195
11196PerlInterpreter *
11197perl_clone_using(PerlInterpreter *proto_perl, UV flags,
11198 struct IPerlMem* ipM, struct IPerlMem* ipMS,
11199 struct IPerlMem* ipMP, struct IPerlEnv* ipE,
11200 struct IPerlStdIO* ipStd, struct IPerlLIO* ipLIO,
11201 struct IPerlDir* ipD, struct IPerlSock* ipS,
11202 struct IPerlProc* ipP)
11203{
11204 /* XXX many of the string copies here can be optimized if they're
11205 * constants; they need to be allocated as common memory and just
11206 * their pointers copied. */
11207
8fc9efbd 11208 IV i;
64aa0685
GS
11209 CLONE_PARAMS clone_params;
11210 CLONE_PARAMS* param = &clone_params;
d2d73c3e 11211
1d7c1841 11212 PerlInterpreter *my_perl = (PerlInterpreter*)(*ipM->pMalloc)(ipM, sizeof(PerlInterpreter));
9660f481
DM
11213 /* for each stash, determine whether its objects should be cloned */
11214 S_visit(proto_perl, do_mark_cloneable_stash, SVt_PVHV, SVTYPEMASK);
ba869deb 11215 PERL_SET_THX(my_perl);
1d7c1841 11216
acfe0abc 11217# ifdef DEBUGGING
a4530404 11218 Poison(my_perl, 1, PerlInterpreter);
fd0854ff 11219 PL_op = Nullop;
c008732b 11220 PL_curcop = (COP *)Nullop;
1d7c1841
GS
11221 PL_markstack = 0;
11222 PL_scopestack = 0;
11223 PL_savestack = 0;
22f7c9c9
JH
11224 PL_savestack_ix = 0;
11225 PL_savestack_max = -1;
66fe0623 11226 PL_sig_pending = 0;
25596c82 11227 Zero(&PL_debug_pad, 1, struct perl_debug_pad);
acfe0abc 11228# else /* !DEBUGGING */
1d7c1841 11229 Zero(my_perl, 1, PerlInterpreter);
acfe0abc 11230# endif /* DEBUGGING */
1d7c1841
GS
11231
11232 /* host pointers */
11233 PL_Mem = ipM;
11234 PL_MemShared = ipMS;
11235 PL_MemParse = ipMP;
11236 PL_Env = ipE;
11237 PL_StdIO = ipStd;
11238 PL_LIO = ipLIO;
11239 PL_Dir = ipD;
11240 PL_Sock = ipS;
11241 PL_Proc = ipP;
1d7c1841
GS
11242#else /* !PERL_IMPLICIT_SYS */
11243 IV i;
64aa0685
GS
11244 CLONE_PARAMS clone_params;
11245 CLONE_PARAMS* param = &clone_params;
1d7c1841 11246 PerlInterpreter *my_perl = (PerlInterpreter*)PerlMem_malloc(sizeof(PerlInterpreter));
9660f481
DM
11247 /* for each stash, determine whether its objects should be cloned */
11248 S_visit(proto_perl, do_mark_cloneable_stash, SVt_PVHV, SVTYPEMASK);
ba869deb 11249 PERL_SET_THX(my_perl);
1d7c1841
GS
11250
11251# ifdef DEBUGGING
a4530404 11252 Poison(my_perl, 1, PerlInterpreter);
fd0854ff 11253 PL_op = Nullop;
c008732b 11254 PL_curcop = (COP *)Nullop;
1d7c1841
GS
11255 PL_markstack = 0;
11256 PL_scopestack = 0;
11257 PL_savestack = 0;
22f7c9c9
JH
11258 PL_savestack_ix = 0;
11259 PL_savestack_max = -1;
66fe0623 11260 PL_sig_pending = 0;
25596c82 11261 Zero(&PL_debug_pad, 1, struct perl_debug_pad);
1d7c1841
GS
11262# else /* !DEBUGGING */
11263 Zero(my_perl, 1, PerlInterpreter);
11264# endif /* DEBUGGING */
11265#endif /* PERL_IMPLICIT_SYS */
83236556 11266 param->flags = flags;
59b40662 11267 param->proto_perl = proto_perl;
1d7c1841
GS
11268
11269 /* arena roots */
612f20c3 11270 PL_xnv_arenaroot = NULL;
1d7c1841 11271 PL_xnv_root = NULL;
612f20c3 11272 PL_xpv_arenaroot = NULL;
1d7c1841 11273 PL_xpv_root = NULL;
612f20c3 11274 PL_xpviv_arenaroot = NULL;
1d7c1841 11275 PL_xpviv_root = NULL;
612f20c3 11276 PL_xpvnv_arenaroot = NULL;
1d7c1841 11277 PL_xpvnv_root = NULL;
612f20c3 11278 PL_xpvcv_arenaroot = NULL;
1d7c1841 11279 PL_xpvcv_root = NULL;
612f20c3 11280 PL_xpvav_arenaroot = NULL;
1d7c1841 11281 PL_xpvav_root = NULL;
612f20c3 11282 PL_xpvhv_arenaroot = NULL;
1d7c1841 11283 PL_xpvhv_root = NULL;
612f20c3 11284 PL_xpvmg_arenaroot = NULL;
1d7c1841 11285 PL_xpvmg_root = NULL;
7552b40b
DM
11286 PL_xpvgv_arenaroot = NULL;
11287 PL_xpvgv_root = NULL;
612f20c3 11288 PL_xpvlv_arenaroot = NULL;
1d7c1841 11289 PL_xpvlv_root = NULL;
612f20c3 11290 PL_xpvbm_arenaroot = NULL;
1d7c1841 11291 PL_xpvbm_root = NULL;
612f20c3 11292 PL_he_arenaroot = NULL;
1d7c1841 11293 PL_he_root = NULL;
892b45be 11294#if defined(USE_ITHREADS)
32e691d0
NC
11295 PL_pte_arenaroot = NULL;
11296 PL_pte_root = NULL;
892b45be 11297#endif
1d7c1841
GS
11298 PL_nice_chunk = NULL;
11299 PL_nice_chunk_size = 0;
11300 PL_sv_count = 0;
11301 PL_sv_objcount = 0;
11302 PL_sv_root = Nullsv;
11303 PL_sv_arenaroot = Nullsv;
11304
11305 PL_debug = proto_perl->Idebug;
11306
8df990a8
NC
11307 PL_hash_seed = proto_perl->Ihash_seed;
11308 PL_rehash_seed = proto_perl->Irehash_seed;
11309
e5dd39fc 11310#ifdef USE_REENTRANT_API
68853529
SB
11311 /* XXX: things like -Dm will segfault here in perlio, but doing
11312 * PERL_SET_CONTEXT(proto_perl);
11313 * breaks too many other things
11314 */
59bd0823 11315 Perl_reentrant_init(aTHX);
e5dd39fc
AB
11316#endif
11317
1d7c1841
GS
11318 /* create SV map for pointer relocation */
11319 PL_ptr_table = ptr_table_new();
11320
11321 /* initialize these special pointers as early as possible */
11322 SvANY(&PL_sv_undef) = NULL;
11323 SvREFCNT(&PL_sv_undef) = (~(U32)0)/2;
11324 SvFLAGS(&PL_sv_undef) = SVf_READONLY|SVt_NULL;
11325 ptr_table_store(PL_ptr_table, &proto_perl->Isv_undef, &PL_sv_undef);
11326
1d7c1841 11327 SvANY(&PL_sv_no) = new_XPVNV();
1d7c1841 11328 SvREFCNT(&PL_sv_no) = (~(U32)0)/2;
0309f36e
NC
11329 SvFLAGS(&PL_sv_no) = SVp_IOK|SVf_IOK|SVp_NOK|SVf_NOK
11330 |SVp_POK|SVf_POK|SVf_READONLY|SVt_PVNV;
f880fe2f 11331 SvPV_set(&PL_sv_no, SAVEPVN(PL_No, 0));
b162af07
SP
11332 SvCUR_set(&PL_sv_no, 0);
11333 SvLEN_set(&PL_sv_no, 1);
45977657 11334 SvIV_set(&PL_sv_no, 0);
9d6ce603 11335 SvNV_set(&PL_sv_no, 0);
1d7c1841
GS
11336 ptr_table_store(PL_ptr_table, &proto_perl->Isv_no, &PL_sv_no);
11337
1d7c1841 11338 SvANY(&PL_sv_yes) = new_XPVNV();
1d7c1841 11339 SvREFCNT(&PL_sv_yes) = (~(U32)0)/2;
0309f36e
NC
11340 SvFLAGS(&PL_sv_yes) = SVp_IOK|SVf_IOK|SVp_NOK|SVf_NOK
11341 |SVp_POK|SVf_POK|SVf_READONLY|SVt_PVNV;
f880fe2f 11342 SvPV_set(&PL_sv_yes, SAVEPVN(PL_Yes, 1));
b162af07
SP
11343 SvCUR_set(&PL_sv_yes, 1);
11344 SvLEN_set(&PL_sv_yes, 2);
45977657 11345 SvIV_set(&PL_sv_yes, 1);
9d6ce603 11346 SvNV_set(&PL_sv_yes, 1);
1d7c1841
GS
11347 ptr_table_store(PL_ptr_table, &proto_perl->Isv_yes, &PL_sv_yes);
11348
05ec9bb3 11349 /* create (a non-shared!) shared string table */
1d7c1841
GS
11350 PL_strtab = newHV();
11351 HvSHAREKEYS_off(PL_strtab);
c4a9c09d 11352 hv_ksplit(PL_strtab, HvTOTALKEYS(proto_perl->Istrtab));
1d7c1841
GS
11353 ptr_table_store(PL_ptr_table, proto_perl->Istrtab, PL_strtab);
11354
05ec9bb3
NIS
11355 PL_compiling = proto_perl->Icompiling;
11356
11357 /* These two PVs will be free'd special way so must set them same way op.c does */
11358 PL_compiling.cop_stashpv = savesharedpv(PL_compiling.cop_stashpv);
11359 ptr_table_store(PL_ptr_table, proto_perl->Icompiling.cop_stashpv, PL_compiling.cop_stashpv);
11360
11361 PL_compiling.cop_file = savesharedpv(PL_compiling.cop_file);
11362 ptr_table_store(PL_ptr_table, proto_perl->Icompiling.cop_file, PL_compiling.cop_file);
11363
1d7c1841
GS
11364 ptr_table_store(PL_ptr_table, &proto_perl->Icompiling, &PL_compiling);
11365 if (!specialWARN(PL_compiling.cop_warnings))
d2d73c3e 11366 PL_compiling.cop_warnings = sv_dup_inc(PL_compiling.cop_warnings, param);
ac27b0f5 11367 if (!specialCopIO(PL_compiling.cop_io))
d2d73c3e 11368 PL_compiling.cop_io = sv_dup_inc(PL_compiling.cop_io, param);
1d7c1841
GS
11369 PL_curcop = (COP*)any_dup(proto_perl->Tcurcop, proto_perl);
11370
11371 /* pseudo environmental stuff */
11372 PL_origargc = proto_perl->Iorigargc;
e2975953 11373 PL_origargv = proto_perl->Iorigargv;
d2d73c3e 11374
d2d73c3e
AB
11375 param->stashes = newAV(); /* Setup array of objects to call clone on */
11376
d419787a
SH
11377 /* Set tainting stuff before PerlIO_debug can possibly get called */
11378 PL_tainting = proto_perl->Itainting;
11379 PL_taint_warn = proto_perl->Itaint_warn;
11380
a1ea730d 11381#ifdef PERLIO_LAYERS
3a1ee7e8
NIS
11382 /* Clone PerlIO tables as soon as we can handle general xx_dup() */
11383 PerlIO_clone(aTHX_ proto_perl, param);
a1ea730d 11384#endif
d2d73c3e
AB
11385
11386 PL_envgv = gv_dup(proto_perl->Ienvgv, param);
11387 PL_incgv = gv_dup(proto_perl->Iincgv, param);
11388 PL_hintgv = gv_dup(proto_perl->Ihintgv, param);
1d7c1841 11389 PL_origfilename = SAVEPV(proto_perl->Iorigfilename);
d2d73c3e
AB
11390 PL_diehook = sv_dup_inc(proto_perl->Idiehook, param);
11391 PL_warnhook = sv_dup_inc(proto_perl->Iwarnhook, param);
1d7c1841
GS
11392
11393 /* switches */
11394 PL_minus_c = proto_perl->Iminus_c;
d2d73c3e 11395 PL_patchlevel = sv_dup_inc(proto_perl->Ipatchlevel, param);
1d7c1841
GS
11396 PL_localpatches = proto_perl->Ilocalpatches;
11397 PL_splitstr = proto_perl->Isplitstr;
11398 PL_preprocess = proto_perl->Ipreprocess;
11399 PL_minus_n = proto_perl->Iminus_n;
11400 PL_minus_p = proto_perl->Iminus_p;
11401 PL_minus_l = proto_perl->Iminus_l;
11402 PL_minus_a = proto_perl->Iminus_a;
11403 PL_minus_F = proto_perl->Iminus_F;
11404 PL_doswitches = proto_perl->Idoswitches;
11405 PL_dowarn = proto_perl->Idowarn;
11406 PL_doextract = proto_perl->Idoextract;
11407 PL_sawampersand = proto_perl->Isawampersand;
11408 PL_unsafe = proto_perl->Iunsafe;
11409 PL_inplace = SAVEPV(proto_perl->Iinplace);
d2d73c3e 11410 PL_e_script = sv_dup_inc(proto_perl->Ie_script, param);
1d7c1841
GS
11411 PL_perldb = proto_perl->Iperldb;
11412 PL_perl_destruct_level = proto_perl->Iperl_destruct_level;
1cbb0781 11413 PL_exit_flags = proto_perl->Iexit_flags;
1d7c1841
GS
11414
11415 /* magical thingies */
11416 /* XXX time(&PL_basetime) when asked for? */
11417 PL_basetime = proto_perl->Ibasetime;
d2d73c3e 11418 PL_formfeed = sv_dup(proto_perl->Iformfeed, param);
1d7c1841
GS
11419
11420 PL_maxsysfd = proto_perl->Imaxsysfd;
11421 PL_multiline = proto_perl->Imultiline;
11422 PL_statusvalue = proto_perl->Istatusvalue;
11423#ifdef VMS
11424 PL_statusvalue_vms = proto_perl->Istatusvalue_vms;
11425#endif
0a378802 11426 PL_encoding = sv_dup(proto_perl->Iencoding, param);
1d7c1841 11427
4a4c6fe3 11428 sv_setpvn(PERL_DEBUG_PAD(0), "", 0); /* For regex debugging. */
1f483ca1
JH
11429 sv_setpvn(PERL_DEBUG_PAD(1), "", 0); /* ext/re needs these */
11430 sv_setpvn(PERL_DEBUG_PAD(2), "", 0); /* even without DEBUGGING. */
4a4c6fe3 11431
d2f185dc
AMS
11432 /* Clone the regex array */
11433 PL_regex_padav = newAV();
11434 {
a3b680e6 11435 const I32 len = av_len((AV*)proto_perl->Iregex_padav);
53c1dcc0 11436 SV** const regexen = AvARRAY((AV*)proto_perl->Iregex_padav);
b464bac0 11437 IV i;
0f95fc41
AB
11438 av_push(PL_regex_padav,
11439 sv_dup_inc(regexen[0],param));
11440 for(i = 1; i <= len; i++) {
11441 if(SvREPADTMP(regexen[i])) {
11442 av_push(PL_regex_padav, sv_dup_inc(regexen[i], param));
8cf8f3d1 11443 } else {
0f95fc41
AB
11444 av_push(PL_regex_padav,
11445 SvREFCNT_inc(
8cf8f3d1 11446 newSViv(PTR2IV(re_dup(INT2PTR(REGEXP *,
cbfa9890 11447 SvIVX(regexen[i])), param)))
0f95fc41
AB
11448 ));
11449 }
d2f185dc
AMS
11450 }
11451 }
11452 PL_regex_pad = AvARRAY(PL_regex_padav);
1fcf4c12 11453
1d7c1841 11454 /* shortcuts to various I/O objects */
d2d73c3e
AB
11455 PL_stdingv = gv_dup(proto_perl->Istdingv, param);
11456 PL_stderrgv = gv_dup(proto_perl->Istderrgv, param);
11457 PL_defgv = gv_dup(proto_perl->Idefgv, param);
11458 PL_argvgv = gv_dup(proto_perl->Iargvgv, param);
11459 PL_argvoutgv = gv_dup(proto_perl->Iargvoutgv, param);
11460 PL_argvout_stack = av_dup_inc(proto_perl->Iargvout_stack, param);
1d7c1841
GS
11461
11462 /* shortcuts to regexp stuff */
d2d73c3e 11463 PL_replgv = gv_dup(proto_perl->Ireplgv, param);
1d7c1841
GS
11464
11465 /* shortcuts to misc objects */
d2d73c3e 11466 PL_errgv = gv_dup(proto_perl->Ierrgv, param);
1d7c1841
GS
11467
11468 /* shortcuts to debugging objects */
d2d73c3e
AB
11469 PL_DBgv = gv_dup(proto_perl->IDBgv, param);
11470 PL_DBline = gv_dup(proto_perl->IDBline, param);
11471 PL_DBsub = gv_dup(proto_perl->IDBsub, param);
11472 PL_DBsingle = sv_dup(proto_perl->IDBsingle, param);
11473 PL_DBtrace = sv_dup(proto_perl->IDBtrace, param);
11474 PL_DBsignal = sv_dup(proto_perl->IDBsignal, param);
06492da6 11475 PL_DBassertion = sv_dup(proto_perl->IDBassertion, param);
d2d73c3e
AB
11476 PL_lineary = av_dup(proto_perl->Ilineary, param);
11477 PL_dbargs = av_dup(proto_perl->Idbargs, param);
1d7c1841
GS
11478
11479 /* symbol tables */
d2d73c3e
AB
11480 PL_defstash = hv_dup_inc(proto_perl->Tdefstash, param);
11481 PL_curstash = hv_dup(proto_perl->Tcurstash, param);
d2d73c3e
AB
11482 PL_debstash = hv_dup(proto_perl->Idebstash, param);
11483 PL_globalstash = hv_dup(proto_perl->Iglobalstash, param);
11484 PL_curstname = sv_dup_inc(proto_perl->Icurstname, param);
11485
11486 PL_beginav = av_dup_inc(proto_perl->Ibeginav, param);
ee1c5a4e 11487 PL_beginav_save = av_dup_inc(proto_perl->Ibeginav_save, param);
ece599bd 11488 PL_checkav_save = av_dup_inc(proto_perl->Icheckav_save, param);
d2d73c3e
AB
11489 PL_endav = av_dup_inc(proto_perl->Iendav, param);
11490 PL_checkav = av_dup_inc(proto_perl->Icheckav, param);
11491 PL_initav = av_dup_inc(proto_perl->Iinitav, param);
1d7c1841
GS
11492
11493 PL_sub_generation = proto_perl->Isub_generation;
11494
11495 /* funky return mechanisms */
11496 PL_forkprocess = proto_perl->Iforkprocess;
11497
11498 /* subprocess state */
d2d73c3e 11499 PL_fdpid = av_dup_inc(proto_perl->Ifdpid, param);
1d7c1841
GS
11500
11501 /* internal state */
1d7c1841
GS
11502 PL_maxo = proto_perl->Imaxo;
11503 if (proto_perl->Iop_mask)
11504 PL_op_mask = SAVEPVN(proto_perl->Iop_mask, PL_maxo);
11505 else
11506 PL_op_mask = Nullch;
06492da6 11507 /* PL_asserting = proto_perl->Iasserting; */
1d7c1841
GS
11508
11509 /* current interpreter roots */
d2d73c3e 11510 PL_main_cv = cv_dup_inc(proto_perl->Imain_cv, param);
1d7c1841
GS
11511 PL_main_root = OpREFCNT_inc(proto_perl->Imain_root);
11512 PL_main_start = proto_perl->Imain_start;
e977893f 11513 PL_eval_root = proto_perl->Ieval_root;
1d7c1841
GS
11514 PL_eval_start = proto_perl->Ieval_start;
11515
11516 /* runtime control stuff */
11517 PL_curcopdb = (COP*)any_dup(proto_perl->Icurcopdb, proto_perl);
11518 PL_copline = proto_perl->Icopline;
11519
11520 PL_filemode = proto_perl->Ifilemode;
11521 PL_lastfd = proto_perl->Ilastfd;
11522 PL_oldname = proto_perl->Ioldname; /* XXX not quite right */
11523 PL_Argv = NULL;
11524 PL_Cmd = Nullch;
11525 PL_gensym = proto_perl->Igensym;
11526 PL_preambled = proto_perl->Ipreambled;
d2d73c3e 11527 PL_preambleav = av_dup_inc(proto_perl->Ipreambleav, param);
1d7c1841
GS
11528 PL_laststatval = proto_perl->Ilaststatval;
11529 PL_laststype = proto_perl->Ilaststype;
11530 PL_mess_sv = Nullsv;
11531
d2d73c3e 11532 PL_ors_sv = sv_dup_inc(proto_perl->Iors_sv, param);
1d7c1841
GS
11533
11534 /* interpreter atexit processing */
11535 PL_exitlistlen = proto_perl->Iexitlistlen;
11536 if (PL_exitlistlen) {
a02a5408 11537 Newx(PL_exitlist, PL_exitlistlen, PerlExitListEntry);
1d7c1841
GS
11538 Copy(proto_perl->Iexitlist, PL_exitlist, PL_exitlistlen, PerlExitListEntry);
11539 }
11540 else
11541 PL_exitlist = (PerlExitListEntry*)NULL;
d2d73c3e 11542 PL_modglobal = hv_dup_inc(proto_perl->Imodglobal, param);
19e8ce8e
AB
11543 PL_custom_op_names = hv_dup_inc(proto_perl->Icustom_op_names,param);
11544 PL_custom_op_descs = hv_dup_inc(proto_perl->Icustom_op_descs,param);
1d7c1841
GS
11545
11546 PL_profiledata = NULL;
a8fc9800 11547 PL_rsfp = fp_dup(proto_perl->Irsfp, '<', param);
1d7c1841 11548 /* PL_rsfp_filters entries have fake IoDIRP() */
d2d73c3e 11549 PL_rsfp_filters = av_dup_inc(proto_perl->Irsfp_filters, param);
1d7c1841 11550
d2d73c3e 11551 PL_compcv = cv_dup(proto_perl->Icompcv, param);
dd2155a4
DM
11552
11553 PAD_CLONE_VARS(proto_perl, param);
1d7c1841
GS
11554
11555#ifdef HAVE_INTERP_INTERN
11556 sys_intern_dup(&proto_perl->Isys_intern, &PL_sys_intern);
11557#endif
11558
11559 /* more statics moved here */
11560 PL_generation = proto_perl->Igeneration;
d2d73c3e 11561 PL_DBcv = cv_dup(proto_perl->IDBcv, param);
1d7c1841
GS
11562
11563 PL_in_clean_objs = proto_perl->Iin_clean_objs;
11564 PL_in_clean_all = proto_perl->Iin_clean_all;
11565
11566 PL_uid = proto_perl->Iuid;
11567 PL_euid = proto_perl->Ieuid;
11568 PL_gid = proto_perl->Igid;
11569 PL_egid = proto_perl->Iegid;
11570 PL_nomemok = proto_perl->Inomemok;
11571 PL_an = proto_perl->Ian;
1d7c1841
GS
11572 PL_evalseq = proto_perl->Ievalseq;
11573 PL_origenviron = proto_perl->Iorigenviron; /* XXX not quite right */
11574 PL_origalen = proto_perl->Iorigalen;
11575 PL_pidstatus = newHV(); /* XXX flag for cloning? */
11576 PL_osname = SAVEPV(proto_perl->Iosname);
1d7c1841
GS
11577 PL_sighandlerp = proto_perl->Isighandlerp;
11578
1d7c1841
GS
11579 PL_runops = proto_perl->Irunops;
11580
11581 Copy(proto_perl->Itokenbuf, PL_tokenbuf, 256, char);
11582
11583#ifdef CSH
11584 PL_cshlen = proto_perl->Icshlen;
74f1b2b8 11585 PL_cshname = proto_perl->Icshname; /* XXX never deallocated */
1d7c1841
GS
11586#endif
11587
11588 PL_lex_state = proto_perl->Ilex_state;
11589 PL_lex_defer = proto_perl->Ilex_defer;
11590 PL_lex_expect = proto_perl->Ilex_expect;
11591 PL_lex_formbrack = proto_perl->Ilex_formbrack;
11592 PL_lex_dojoin = proto_perl->Ilex_dojoin;
11593 PL_lex_starts = proto_perl->Ilex_starts;
d2d73c3e
AB
11594 PL_lex_stuff = sv_dup_inc(proto_perl->Ilex_stuff, param);
11595 PL_lex_repl = sv_dup_inc(proto_perl->Ilex_repl, param);
1d7c1841
GS
11596 PL_lex_op = proto_perl->Ilex_op;
11597 PL_lex_inpat = proto_perl->Ilex_inpat;
11598 PL_lex_inwhat = proto_perl->Ilex_inwhat;
11599 PL_lex_brackets = proto_perl->Ilex_brackets;
11600 i = (PL_lex_brackets < 120 ? 120 : PL_lex_brackets);
11601 PL_lex_brackstack = SAVEPVN(proto_perl->Ilex_brackstack,i);
11602 PL_lex_casemods = proto_perl->Ilex_casemods;
11603 i = (PL_lex_casemods < 12 ? 12 : PL_lex_casemods);
11604 PL_lex_casestack = SAVEPVN(proto_perl->Ilex_casestack,i);
11605
11606 Copy(proto_perl->Inextval, PL_nextval, 5, YYSTYPE);
11607 Copy(proto_perl->Inexttype, PL_nexttype, 5, I32);
11608 PL_nexttoke = proto_perl->Inexttoke;
11609
1d773130
TB
11610 /* XXX This is probably masking the deeper issue of why
11611 * SvANY(proto_perl->Ilinestr) can be NULL at this point. For test case:
11612 * http://archive.develooper.com/perl5-porters%40perl.org/msg83298.html
11613 * (A little debugging with a watchpoint on it may help.)
11614 */
389edf32
TB
11615 if (SvANY(proto_perl->Ilinestr)) {
11616 PL_linestr = sv_dup_inc(proto_perl->Ilinestr, param);
3f7c398e 11617 i = proto_perl->Ibufptr - SvPVX_const(proto_perl->Ilinestr);
389edf32 11618 PL_bufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11619 i = proto_perl->Ioldbufptr - SvPVX_const(proto_perl->Ilinestr);
389edf32 11620 PL_oldbufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11621 i = proto_perl->Ioldoldbufptr - SvPVX_const(proto_perl->Ilinestr);
389edf32 11622 PL_oldoldbufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11623 i = proto_perl->Ilinestart - SvPVX_const(proto_perl->Ilinestr);
389edf32
TB
11624 PL_linestart = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11625 }
11626 else {
11627 PL_linestr = NEWSV(65,79);
11628 sv_upgrade(PL_linestr,SVt_PVIV);
11629 sv_setpvn(PL_linestr,"",0);
11630 PL_bufptr = PL_oldbufptr = PL_oldoldbufptr = PL_linestart = SvPVX(PL_linestr);
11631 }
1d7c1841 11632 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
1d7c1841
GS
11633 PL_pending_ident = proto_perl->Ipending_ident;
11634 PL_sublex_info = proto_perl->Isublex_info; /* XXX not quite right */
11635
11636 PL_expect = proto_perl->Iexpect;
11637
11638 PL_multi_start = proto_perl->Imulti_start;
11639 PL_multi_end = proto_perl->Imulti_end;
11640 PL_multi_open = proto_perl->Imulti_open;
11641 PL_multi_close = proto_perl->Imulti_close;
11642
11643 PL_error_count = proto_perl->Ierror_count;
11644 PL_subline = proto_perl->Isubline;
d2d73c3e 11645 PL_subname = sv_dup_inc(proto_perl->Isubname, param);
1d7c1841 11646
1d773130 11647 /* XXX See comment on SvANY(proto_perl->Ilinestr) above */
389edf32 11648 if (SvANY(proto_perl->Ilinestr)) {
3f7c398e 11649 i = proto_perl->Ilast_uni - SvPVX_const(proto_perl->Ilinestr);
389edf32 11650 PL_last_uni = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
3f7c398e 11651 i = proto_perl->Ilast_lop - SvPVX_const(proto_perl->Ilinestr);
389edf32
TB
11652 PL_last_lop = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11653 PL_last_lop_op = proto_perl->Ilast_lop_op;
11654 }
11655 else {
11656 PL_last_uni = SvPVX(PL_linestr);
11657 PL_last_lop = SvPVX(PL_linestr);
11658 PL_last_lop_op = 0;
11659 }
1d7c1841 11660 PL_in_my = proto_perl->Iin_my;
d2d73c3e 11661 PL_in_my_stash = hv_dup(proto_perl->Iin_my_stash, param);
1d7c1841
GS
11662#ifdef FCRYPT
11663 PL_cryptseen = proto_perl->Icryptseen;
11664#endif
11665
11666 PL_hints = proto_perl->Ihints;
11667
11668 PL_amagic_generation = proto_perl->Iamagic_generation;
11669
11670#ifdef USE_LOCALE_COLLATE
11671 PL_collation_ix = proto_perl->Icollation_ix;
11672 PL_collation_name = SAVEPV(proto_perl->Icollation_name);
11673 PL_collation_standard = proto_perl->Icollation_standard;
11674 PL_collxfrm_base = proto_perl->Icollxfrm_base;
11675 PL_collxfrm_mult = proto_perl->Icollxfrm_mult;
11676#endif /* USE_LOCALE_COLLATE */
11677
11678#ifdef USE_LOCALE_NUMERIC
11679 PL_numeric_name = SAVEPV(proto_perl->Inumeric_name);
11680 PL_numeric_standard = proto_perl->Inumeric_standard;
11681 PL_numeric_local = proto_perl->Inumeric_local;
d2d73c3e 11682 PL_numeric_radix_sv = sv_dup_inc(proto_perl->Inumeric_radix_sv, param);
1d7c1841
GS
11683#endif /* !USE_LOCALE_NUMERIC */
11684
11685 /* utf8 character classes */
d2d73c3e
AB
11686 PL_utf8_alnum = sv_dup_inc(proto_perl->Iutf8_alnum, param);
11687 PL_utf8_alnumc = sv_dup_inc(proto_perl->Iutf8_alnumc, param);
11688 PL_utf8_ascii = sv_dup_inc(proto_perl->Iutf8_ascii, param);
11689 PL_utf8_alpha = sv_dup_inc(proto_perl->Iutf8_alpha, param);
11690 PL_utf8_space = sv_dup_inc(proto_perl->Iutf8_space, param);
11691 PL_utf8_cntrl = sv_dup_inc(proto_perl->Iutf8_cntrl, param);
11692 PL_utf8_graph = sv_dup_inc(proto_perl->Iutf8_graph, param);
11693 PL_utf8_digit = sv_dup_inc(proto_perl->Iutf8_digit, param);
11694 PL_utf8_upper = sv_dup_inc(proto_perl->Iutf8_upper, param);
11695 PL_utf8_lower = sv_dup_inc(proto_perl->Iutf8_lower, param);
11696 PL_utf8_print = sv_dup_inc(proto_perl->Iutf8_print, param);
11697 PL_utf8_punct = sv_dup_inc(proto_perl->Iutf8_punct, param);
11698 PL_utf8_xdigit = sv_dup_inc(proto_perl->Iutf8_xdigit, param);
11699 PL_utf8_mark = sv_dup_inc(proto_perl->Iutf8_mark, param);
11700 PL_utf8_toupper = sv_dup_inc(proto_perl->Iutf8_toupper, param);
11701 PL_utf8_totitle = sv_dup_inc(proto_perl->Iutf8_totitle, param);
11702 PL_utf8_tolower = sv_dup_inc(proto_perl->Iutf8_tolower, param);
b4e400f9 11703 PL_utf8_tofold = sv_dup_inc(proto_perl->Iutf8_tofold, param);
82686b01
JH
11704 PL_utf8_idstart = sv_dup_inc(proto_perl->Iutf8_idstart, param);
11705 PL_utf8_idcont = sv_dup_inc(proto_perl->Iutf8_idcont, param);
1d7c1841 11706
6c3182a5 11707 /* Did the locale setup indicate UTF-8? */
9769094f 11708 PL_utf8locale = proto_perl->Iutf8locale;
6c3182a5
JH
11709 /* Unicode features (see perlrun/-C) */
11710 PL_unicode = proto_perl->Iunicode;
11711
11712 /* Pre-5.8 signals control */
11713 PL_signals = proto_perl->Isignals;
11714
11715 /* times() ticks per second */
11716 PL_clocktick = proto_perl->Iclocktick;
11717
11718 /* Recursion stopper for PerlIO_find_layer */
11719 PL_in_load_module = proto_perl->Iin_load_module;
11720
11721 /* sort() routine */
11722 PL_sort_RealCmp = proto_perl->Isort_RealCmp;
11723
57c6e6d2
JH
11724 /* Not really needed/useful since the reentrant_retint is "volatile",
11725 * but do it for consistency's sake. */
11726 PL_reentrant_retint = proto_perl->Ireentrant_retint;
11727
15a5279a
JH
11728 /* Hooks to shared SVs and locks. */
11729 PL_sharehook = proto_perl->Isharehook;
11730 PL_lockhook = proto_perl->Ilockhook;
11731 PL_unlockhook = proto_perl->Iunlockhook;
11732 PL_threadhook = proto_perl->Ithreadhook;
11733
bce260cd
JH
11734 PL_runops_std = proto_perl->Irunops_std;
11735 PL_runops_dbg = proto_perl->Irunops_dbg;
11736
11737#ifdef THREADS_HAVE_PIDS
11738 PL_ppid = proto_perl->Ippid;
11739#endif
11740
1d7c1841
GS
11741 /* swatch cache */
11742 PL_last_swash_hv = Nullhv; /* reinits on demand */
11743 PL_last_swash_klen = 0;
11744 PL_last_swash_key[0]= '\0';
11745 PL_last_swash_tmps = (U8*)NULL;
11746 PL_last_swash_slen = 0;
11747
1d7c1841
GS
11748 PL_glob_index = proto_perl->Iglob_index;
11749 PL_srand_called = proto_perl->Isrand_called;
11750 PL_uudmap['M'] = 0; /* reinits on demand */
11751 PL_bitcount = Nullch; /* reinits on demand */
11752
66fe0623 11753 if (proto_perl->Ipsig_pend) {
a02a5408 11754 Newxz(PL_psig_pend, SIG_SIZE, int);
9dd79c3f 11755 }
66fe0623
NIS
11756 else {
11757 PL_psig_pend = (int*)NULL;
11758 }
11759
1d7c1841 11760 if (proto_perl->Ipsig_ptr) {
a02a5408
JC
11761 Newxz(PL_psig_ptr, SIG_SIZE, SV*);
11762 Newxz(PL_psig_name, SIG_SIZE, SV*);
76d3c696 11763 for (i = 1; i < SIG_SIZE; i++) {
d2d73c3e
AB
11764 PL_psig_ptr[i] = sv_dup_inc(proto_perl->Ipsig_ptr[i], param);
11765 PL_psig_name[i] = sv_dup_inc(proto_perl->Ipsig_name[i], param);
1d7c1841
GS
11766 }
11767 }
11768 else {
11769 PL_psig_ptr = (SV**)NULL;
11770 PL_psig_name = (SV**)NULL;
11771 }
11772
11773 /* thrdvar.h stuff */
11774
a0739874 11775 if (flags & CLONEf_COPY_STACKS) {
1d7c1841
GS
11776 /* next allocation will be PL_tmps_stack[PL_tmps_ix+1] */
11777 PL_tmps_ix = proto_perl->Ttmps_ix;
11778 PL_tmps_max = proto_perl->Ttmps_max;
11779 PL_tmps_floor = proto_perl->Ttmps_floor;
a02a5408 11780 Newxz(PL_tmps_stack, PL_tmps_max, SV*);
1d7c1841
GS
11781 i = 0;
11782 while (i <= PL_tmps_ix) {
d2d73c3e 11783 PL_tmps_stack[i] = sv_dup_inc(proto_perl->Ttmps_stack[i], param);
1d7c1841
GS
11784 ++i;
11785 }
11786
11787 /* next PUSHMARK() sets *(PL_markstack_ptr+1) */
11788 i = proto_perl->Tmarkstack_max - proto_perl->Tmarkstack;
a02a5408 11789 Newxz(PL_markstack, i, I32);
1d7c1841
GS
11790 PL_markstack_max = PL_markstack + (proto_perl->Tmarkstack_max
11791 - proto_perl->Tmarkstack);
11792 PL_markstack_ptr = PL_markstack + (proto_perl->Tmarkstack_ptr
11793 - proto_perl->Tmarkstack);
11794 Copy(proto_perl->Tmarkstack, PL_markstack,
11795 PL_markstack_ptr - PL_markstack + 1, I32);
11796
11797 /* next push_scope()/ENTER sets PL_scopestack[PL_scopestack_ix]
11798 * NOTE: unlike the others! */
11799 PL_scopestack_ix = proto_perl->Tscopestack_ix;
11800 PL_scopestack_max = proto_perl->Tscopestack_max;
a02a5408 11801 Newxz(PL_scopestack, PL_scopestack_max, I32);
1d7c1841
GS
11802 Copy(proto_perl->Tscopestack, PL_scopestack, PL_scopestack_ix, I32);
11803
1d7c1841 11804 /* NOTE: si_dup() looks at PL_markstack */
d2d73c3e 11805 PL_curstackinfo = si_dup(proto_perl->Tcurstackinfo, param);
1d7c1841
GS
11806
11807 /* PL_curstack = PL_curstackinfo->si_stack; */
d2d73c3e
AB
11808 PL_curstack = av_dup(proto_perl->Tcurstack, param);
11809 PL_mainstack = av_dup(proto_perl->Tmainstack, param);
1d7c1841
GS
11810
11811 /* next PUSHs() etc. set *(PL_stack_sp+1) */
11812 PL_stack_base = AvARRAY(PL_curstack);
11813 PL_stack_sp = PL_stack_base + (proto_perl->Tstack_sp
11814 - proto_perl->Tstack_base);
11815 PL_stack_max = PL_stack_base + AvMAX(PL_curstack);
11816
11817 /* next SSPUSHFOO() sets PL_savestack[PL_savestack_ix]
11818 * NOTE: unlike the others! */
11819 PL_savestack_ix = proto_perl->Tsavestack_ix;
11820 PL_savestack_max = proto_perl->Tsavestack_max;
a02a5408 11821 /*Newxz(PL_savestack, PL_savestack_max, ANY);*/
d2d73c3e 11822 PL_savestack = ss_dup(proto_perl, param);
1d7c1841
GS
11823 }
11824 else {
11825 init_stacks();
985e7056 11826 ENTER; /* perl_destruct() wants to LEAVE; */
1d7c1841
GS
11827 }
11828
11829 PL_start_env = proto_perl->Tstart_env; /* XXXXXX */
11830 PL_top_env = &PL_start_env;
11831
11832 PL_op = proto_perl->Top;
11833
11834 PL_Sv = Nullsv;
11835 PL_Xpv = (XPV*)NULL;
11836 PL_na = proto_perl->Tna;
11837
11838 PL_statbuf = proto_perl->Tstatbuf;
11839 PL_statcache = proto_perl->Tstatcache;
d2d73c3e
AB
11840 PL_statgv = gv_dup(proto_perl->Tstatgv, param);
11841 PL_statname = sv_dup_inc(proto_perl->Tstatname, param);
1d7c1841
GS
11842#ifdef HAS_TIMES
11843 PL_timesbuf = proto_perl->Ttimesbuf;
11844#endif
11845
11846 PL_tainted = proto_perl->Ttainted;
11847 PL_curpm = proto_perl->Tcurpm; /* XXX No PMOP ref count */
d2d73c3e
AB
11848 PL_rs = sv_dup_inc(proto_perl->Trs, param);
11849 PL_last_in_gv = gv_dup(proto_perl->Tlast_in_gv, param);
11850 PL_ofs_sv = sv_dup_inc(proto_perl->Tofs_sv, param);
11851 PL_defoutgv = gv_dup_inc(proto_perl->Tdefoutgv, param);
1d7c1841 11852 PL_chopset = proto_perl->Tchopset; /* XXX never deallocated */
d2d73c3e
AB
11853 PL_toptarget = sv_dup_inc(proto_perl->Ttoptarget, param);
11854 PL_bodytarget = sv_dup_inc(proto_perl->Tbodytarget, param);
11855 PL_formtarget = sv_dup(proto_perl->Tformtarget, param);
1d7c1841
GS
11856
11857 PL_restartop = proto_perl->Trestartop;
11858 PL_in_eval = proto_perl->Tin_eval;
11859 PL_delaymagic = proto_perl->Tdelaymagic;
11860 PL_dirty = proto_perl->Tdirty;
11861 PL_localizing = proto_perl->Tlocalizing;
11862
d2d73c3e 11863 PL_errors = sv_dup_inc(proto_perl->Terrors, param);
dd28f7bb 11864 PL_hv_fetch_ent_mh = Nullhe;
1d7c1841
GS
11865 PL_modcount = proto_perl->Tmodcount;
11866 PL_lastgotoprobe = Nullop;
11867 PL_dumpindent = proto_perl->Tdumpindent;
11868
11869 PL_sortcop = (OP*)any_dup(proto_perl->Tsortcop, proto_perl);
d2d73c3e
AB
11870 PL_sortstash = hv_dup(proto_perl->Tsortstash, param);
11871 PL_firstgv = gv_dup(proto_perl->Tfirstgv, param);
11872 PL_secondgv = gv_dup(proto_perl->Tsecondgv, param);
1d7c1841
GS
11873 PL_sortcxix = proto_perl->Tsortcxix;
11874 PL_efloatbuf = Nullch; /* reinits on demand */
11875 PL_efloatsize = 0; /* reinits on demand */
11876
11877 /* regex stuff */
11878
11879 PL_screamfirst = NULL;
11880 PL_screamnext = NULL;
11881 PL_maxscream = -1; /* reinits on demand */
11882 PL_lastscream = Nullsv;
11883
11884 PL_watchaddr = NULL;
11885 PL_watchok = Nullch;
11886
11887 PL_regdummy = proto_perl->Tregdummy;
1d7c1841
GS
11888 PL_regprecomp = Nullch;
11889 PL_regnpar = 0;
11890 PL_regsize = 0;
1d7c1841
GS
11891 PL_colorset = 0; /* reinits PL_colors[] */
11892 /*PL_colors[6] = {0,0,0,0,0,0};*/
1d7c1841
GS
11893 PL_reginput = Nullch;
11894 PL_regbol = Nullch;
11895 PL_regeol = Nullch;
11896 PL_regstartp = (I32*)NULL;
11897 PL_regendp = (I32*)NULL;
11898 PL_reglastparen = (U32*)NULL;
2d862feb 11899 PL_reglastcloseparen = (U32*)NULL;
1d7c1841 11900 PL_regtill = Nullch;
1d7c1841
GS
11901 PL_reg_start_tmp = (char**)NULL;
11902 PL_reg_start_tmpl = 0;
11903 PL_regdata = (struct reg_data*)NULL;
11904 PL_bostr = Nullch;
11905 PL_reg_flags = 0;
11906 PL_reg_eval_set = 0;
11907 PL_regnarrate = 0;
11908 PL_regprogram = (regnode*)NULL;
11909 PL_regindent = 0;
11910 PL_regcc = (CURCUR*)NULL;
11911 PL_reg_call_cc = (struct re_cc_state*)NULL;
11912 PL_reg_re = (regexp*)NULL;
11913 PL_reg_ganch = Nullch;
11914 PL_reg_sv = Nullsv;
53c4c00c 11915 PL_reg_match_utf8 = FALSE;
1d7c1841
GS
11916 PL_reg_magic = (MAGIC*)NULL;
11917 PL_reg_oldpos = 0;
11918 PL_reg_oldcurpm = (PMOP*)NULL;
11919 PL_reg_curpm = (PMOP*)NULL;
11920 PL_reg_oldsaved = Nullch;
11921 PL_reg_oldsavedlen = 0;
f8c7b90f 11922#ifdef PERL_OLD_COPY_ON_WRITE
504cff3b 11923 PL_nrs = Nullsv;
ed252734 11924#endif
1d7c1841
GS
11925 PL_reg_maxiter = 0;
11926 PL_reg_leftiter = 0;
11927 PL_reg_poscache = Nullch;
11928 PL_reg_poscache_size= 0;
11929
11930 /* RE engine - function pointers */
11931 PL_regcompp = proto_perl->Tregcompp;
11932 PL_regexecp = proto_perl->Tregexecp;
11933 PL_regint_start = proto_perl->Tregint_start;
11934 PL_regint_string = proto_perl->Tregint_string;
11935 PL_regfree = proto_perl->Tregfree;
11936
11937 PL_reginterp_cnt = 0;
11938 PL_reg_starttry = 0;
11939
a2efc822
SC
11940 /* Pluggable optimizer */
11941 PL_peepp = proto_perl->Tpeepp;
11942
081fc587
AB
11943 PL_stashcache = newHV();
11944
a0739874
DM
11945 if (!(flags & CLONEf_KEEP_PTR_TABLE)) {
11946 ptr_table_free(PL_ptr_table);
11947 PL_ptr_table = NULL;
11948 }
8cf8f3d1 11949
f284b03f
AMS
11950 /* Call the ->CLONE method, if it exists, for each of the stashes
11951 identified by sv_dup() above.
11952 */
d2d73c3e 11953 while(av_len(param->stashes) != -1) {
53c1dcc0
AL
11954 HV* const stash = (HV*) av_shift(param->stashes);
11955 GV* const cloner = gv_fetchmethod_autoload(stash, "CLONE", 0);
f284b03f
AMS
11956 if (cloner && GvCV(cloner)) {
11957 dSP;
11958 ENTER;
11959 SAVETMPS;
11960 PUSHMARK(SP);
84bda14a 11961 XPUSHs(sv_2mortal(newSVhek(HvNAME_HEK(stash))));
f284b03f
AMS
11962 PUTBACK;
11963 call_sv((SV*)GvCV(cloner), G_DISCARD);
11964 FREETMPS;
11965 LEAVE;
11966 }
4a09accc 11967 }
a0739874 11968
dc507217 11969 SvREFCNT_dec(param->stashes);
dc507217 11970
6d26897e
DM
11971 /* orphaned? eg threads->new inside BEGIN or use */
11972 if (PL_compcv && ! SvREFCNT(PL_compcv)) {
a3b680e6 11973 (void)SvREFCNT_inc(PL_compcv);
6d26897e
DM
11974 SAVEFREESV(PL_compcv);
11975 }
11976
1d7c1841 11977 return my_perl;
1d7c1841
GS
11978}
11979
1d7c1841 11980#endif /* USE_ITHREADS */
a0ae6670 11981
/*
=head1 Unicode Support

=for apidoc sv_recode_to_utf8

The encoding is assumed to be an Encode object.  On entry the PV
of the sv is assumed to be octets in that encoding, and the sv
will be converted into Unicode (and UTF-8).

If the sv already is UTF-8 (or if it is not POK), or if byte semantics
(C<use bytes>) are in effect, or if the encoding is not a reference,
nothing is done to the sv.  If the encoding is not
an C<Encode::XS> Encoding object, bad things will happen.
(See F<lib/encoding.pm> and L<Encode>).

The PV of the sv is returned, or NULL if the sv has no string value.

=cut */
11999
12000char *
12001Perl_sv_recode_to_utf8(pTHX_ SV *sv, SV *encoding)
12002{
27da23d5 12003 dVAR;
220e2d4e 12004 if (SvPOK(sv) && !SvUTF8(sv) && !IN_BYTES && SvROK(encoding)) {
d0063567
DK
12005 SV *uni;
12006 STRLEN len;
93524f2b 12007 const char *s;
d0063567
DK
12008 dSP;
12009 ENTER;
12010 SAVETMPS;
220e2d4e 12011 save_re_context();
d0063567
DK
12012 PUSHMARK(sp);
12013 EXTEND(SP, 3);
12014 XPUSHs(encoding);
12015 XPUSHs(sv);
7a5fa8a2 12016/*
f9893866
NIS
12017 NI-S 2002/07/09
12018 Passing sv_yes is wrong - it needs to be or'ed set of constants
7a5fa8a2 12019 for Encode::XS, while UTf-8 decode (currently) assumes a true value means
f9893866
NIS
12020 remove converted chars from source.
12021
12022 Both will default the value - let them.
7a5fa8a2 12023
d0063567 12024 XPUSHs(&PL_sv_yes);
f9893866 12025*/
d0063567
DK
12026 PUTBACK;
12027 call_method("decode", G_SCALAR);
12028 SPAGAIN;
12029 uni = POPs;
12030 PUTBACK;
93524f2b 12031 s = SvPV_const(uni, len);
3f7c398e 12032 if (s != SvPVX_const(sv)) {
d0063567 12033 SvGROW(sv, len + 1);
93524f2b 12034 Move(s, SvPVX(sv), len + 1, char);
d0063567 12035 SvCUR_set(sv, len);
d0063567
DK
12036 }
12037 FREETMPS;
12038 LEAVE;
d0063567 12039 SvUTF8_on(sv);
95899a2a 12040 return SvPVX(sv);
f9893866 12041 }
95899a2a 12042 return SvPOKp(sv) ? SvPVX(sv) : NULL;
9f4817db
JH
12043}
12044
220e2d4e
IH
/*
=for apidoc sv_cat_decode

The encoding is assumed to be an Encode object, the PV of the ssv is
assumed to be octets in that encoding, and decoding of the input starts
from the position which (PV + *offset) points to.  The decoded UTF-8
string from ssv is concatenated onto the dsv.  Decoding terminates
when the string tstr appears in the decoded output or when the input in
the PV of the ssv ends.  The value which offset points to is updated
to the last input position in the ssv.

Returns TRUE if the terminator was found, else returns FALSE.
Croaks if ssv or dsv is not POK, if the encoding is not a reference,
or if offset is NULL.

=cut */
12059
12060bool
12061Perl_sv_cat_decode(pTHX_ SV *dsv, SV *encoding,
12062 SV *ssv, int *offset, char *tstr, int tlen)
12063{
27da23d5 12064 dVAR;
a73e8557 12065 bool ret = FALSE;
220e2d4e 12066 if (SvPOK(ssv) && SvPOK(dsv) && SvROK(encoding) && offset) {
220e2d4e
IH
12067 SV *offsv;
12068 dSP;
12069 ENTER;
12070 SAVETMPS;
12071 save_re_context();
12072 PUSHMARK(sp);
12073 EXTEND(SP, 6);
12074 XPUSHs(encoding);
12075 XPUSHs(dsv);
12076 XPUSHs(ssv);
12077 XPUSHs(offsv = sv_2mortal(newSViv(*offset)));
12078 XPUSHs(sv_2mortal(newSVpvn(tstr, tlen)));
12079 PUTBACK;
12080 call_method("cat_decode", G_SCALAR);
12081 SPAGAIN;
12082 ret = SvTRUE(TOPs);
12083 *offset = SvIV(offsv);
12084 PUTBACK;
12085 FREETMPS;
12086 LEAVE;
220e2d4e 12087 }
a73e8557
JH
12088 else
12089 Perl_croak(aTHX_ "Invalid argument to sv_cat_decode");
12090 return ret;
220e2d4e 12091}
f9893866 12092
241d1a3b
NC
12093/*
12094 * Local variables:
12095 * c-indentation-style: bsd
12096 * c-basic-offset: 4
12097 * indent-tabs-mode: t
12098 * End:
12099 *
37442d52
RGS
12100 * ex: set ts=8 sts=4 sw=4 noet:
12101 */