This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
utf8.h: Add macro TWO_BYTE_UTF8_TO_UNI()
[perl5.git] / hv.c
CommitLineData
a0d0e21e 1/* hv.c
79072805 2 *
1129b882
NC
3 * Copyright (C) 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999, 2000,
4 * 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008 by Larry Wall and others
79072805
LW
5 *
6 * You may distribute under the terms of either the GNU General Public
7 * License or the Artistic License, as specified in the README file.
8 *
a0d0e21e
LW
9 */
10
11/*
4ac71550
TC
12 * I sit beside the fire and think
13 * of all that I have seen.
14 * --Bilbo
15 *
16 * [p.278 of _The Lord of the Rings_, II/iii: "The Ring Goes South"]
79072805
LW
17 */
18
d5afce77
RB
19/*
20=head1 Hash Manipulation Functions
166f8a29
DM
21
22A HV structure represents a Perl hash. It consists mainly of an array
23of pointers, each of which points to a linked list of HE structures. The
24array is indexed by the hash function of the key, so each linked list
25represents all the hash entries with the same hash value. Each HE contains
26a pointer to the actual value, plus a pointer to a HEK structure which
27holds the key and hash value.
28
29=cut
30
d5afce77
RB
31*/
32
79072805 33#include "EXTERN.h"
864dbfa3 34#define PERL_IN_HV_C
3d78eb94 35#define PERL_HASH_INTERNAL_ACCESS
79072805
LW
36#include "perl.h"
37
d8012aaf 38#define HV_MAX_LENGTH_BEFORE_SPLIT 14
fdcd69b6 39
d75ce684 40static const char S_strtab_error[]
5d2b1485
NC
41 = "Cannot modify shared string table in hv_%s";
42
c941fb51
NC
43#ifdef PURIFY
44
/* Variants used when PURIFY is defined: new_HE() obtains an HE directly
 * from safemalloc() and del_HE() hands it back to safefree().  The
 * expansion and the argument are parenthesized so the macros stay safe
 * inside larger expressions. */
#define new_HE() ((HE*)safemalloc(sizeof(HE)))
#define del_HE(p) safefree((char*)(p))
47
48#else
49
76e3520e 50STATIC HE*
cea2e8a9 51S_new_he(pTHX)
4633a7c4 52{
97aff369 53 dVAR;
4633a7c4 54 HE* he;
0bd48802 55 void ** const root = &PL_body_roots[HE_SVSLOT];
6a93a7e5 56
6a93a7e5 57 if (!*root)
1e30fcd5 58 Perl_more_bodies(aTHX_ HE_SVSLOT, sizeof(HE), PERL_ARENA_SIZE);
10edeb5d 59 he = (HE*) *root;
ce3e5c45 60 assert(he);
6a93a7e5 61 *root = HeNEXT(he);
333f433b 62 return he;
4633a7c4
LW
63}
64
c941fb51
NC
/* new_HE(): obtain an HE through new_he().
 * del_HE(p): push the HE 'p' back onto the head of the
 * PL_body_roots[HE_SVSLOT] list.  'p' is expanded twice, so callers must
 * pass an expression without side effects; it is parenthesized where it is
 * used as a plain operand. */
#define new_HE() new_he()
#define del_HE(p) \
    STMT_START { \
        HeNEXT(p) = (HE*)(PL_body_roots[HE_SVSLOT]); \
        PL_body_roots[HE_SVSLOT] = (p); \
    } STMT_END
d33b2eba 71
d33b2eba 72
d33b2eba
GS
73
74#endif
75
76e3520e 76STATIC HEK *
5f66b61c 77S_save_hek_flags(const char *str, I32 len, U32 hash, int flags)
bbce6d69 78{
35a4481c 79 const int flags_masked = flags & HVhek_MASK;
bbce6d69 80 char *k;
81 register HEK *hek;
1c846c1f 82
7918f24d
NC
83 PERL_ARGS_ASSERT_SAVE_HEK_FLAGS;
84
a02a5408 85 Newx(k, HEK_BASESIZE + len + 2, char);
bbce6d69 86 hek = (HEK*)k;
ff68c719 87 Copy(str, HEK_KEY(hek), len, char);
e05949c7 88 HEK_KEY(hek)[len] = 0;
ff68c719 89 HEK_LEN(hek) = len;
90 HEK_HASH(hek) = hash;
45e34800 91 HEK_FLAGS(hek) = (unsigned char)flags_masked | HVhek_UNSHARED;
dcf933a4
NC
92
93 if (flags & HVhek_FREEKEY)
94 Safefree(str);
bbce6d69 95 return hek;
96}
97
4a31713e 98/* free the pool of temporary HE/HEK pairs returned by hv_fetch_ent
dd28f7bb
DM
99 * for tied hashes */
100
101void
102Perl_free_tied_hv_pool(pTHX)
103{
97aff369 104 dVAR;
dd28f7bb
DM
105 HE *he = PL_hv_fetch_ent_mh;
106 while (he) {
9d4ba2ae 107 HE * const ohe = he;
dd28f7bb 108 Safefree(HeKEY_hek(he));
dd28f7bb
DM
109 he = HeNEXT(he);
110 del_HE(ohe);
111 }
4608196e 112 PL_hv_fetch_ent_mh = NULL;
dd28f7bb
DM
113}
114
d18c6117 115#if defined(USE_ITHREADS)
0bff533c
NC
116HEK *
117Perl_hek_dup(pTHX_ HEK *source, CLONE_PARAMS* param)
118{
566771cc 119 HEK *shared;
9d4ba2ae 120
7918f24d 121 PERL_ARGS_ASSERT_HEK_DUP;
9d4ba2ae 122 PERL_UNUSED_ARG(param);
0bff533c 123
566771cc
NC
124 if (!source)
125 return NULL;
126
127 shared = (HEK*)ptr_table_fetch(PL_ptr_table, source);
0bff533c
NC
128 if (shared) {
129 /* We already shared this hash key. */
454f1e26 130 (void)share_hek_hek(shared);
0bff533c
NC
131 }
132 else {
658b4a4a 133 shared
6e838c70
NC
134 = share_hek_flags(HEK_KEY(source), HEK_LEN(source),
135 HEK_HASH(source), HEK_FLAGS(source));
658b4a4a 136 ptr_table_store(PL_ptr_table, source, shared);
0bff533c 137 }
658b4a4a 138 return shared;
0bff533c
NC
139}
140
d18c6117 141HE *
5c4138a0 142Perl_he_dup(pTHX_ const HE *e, bool shared, CLONE_PARAMS* param)
d18c6117
GS
143{
144 HE *ret;
145
7918f24d
NC
146 PERL_ARGS_ASSERT_HE_DUP;
147
d18c6117 148 if (!e)
4608196e 149 return NULL;
7766f137
GS
150 /* look for it in the table first */
151 ret = (HE*)ptr_table_fetch(PL_ptr_table, e);
152 if (ret)
153 return ret;
154
155 /* create anew and remember what it is */
d33b2eba 156 ret = new_HE();
7766f137
GS
157 ptr_table_store(PL_ptr_table, e, ret);
158
d2d73c3e 159 HeNEXT(ret) = he_dup(HeNEXT(e),shared, param);
dd28f7bb
DM
160 if (HeKLEN(e) == HEf_SVKEY) {
161 char *k;
ad64d0ec 162 Newx(k, HEK_BASESIZE + sizeof(const SV *), char);
dd28f7bb 163 HeKEY_hek(ret) = (HEK*)k;
a09252eb 164 HeKEY_sv(ret) = sv_dup_inc(HeKEY_sv(e), param);
dd28f7bb 165 }
c21d1a0f 166 else if (shared) {
0bff533c
NC
167 /* This is hek_dup inlined, which seems to be important for speed
168 reasons. */
1b6737cc 169 HEK * const source = HeKEY_hek(e);
658b4a4a 170 HEK *shared = (HEK*)ptr_table_fetch(PL_ptr_table, source);
c21d1a0f
NC
171
172 if (shared) {
173 /* We already shared this hash key. */
454f1e26 174 (void)share_hek_hek(shared);
c21d1a0f
NC
175 }
176 else {
658b4a4a 177 shared
6e838c70
NC
178 = share_hek_flags(HEK_KEY(source), HEK_LEN(source),
179 HEK_HASH(source), HEK_FLAGS(source));
658b4a4a 180 ptr_table_store(PL_ptr_table, source, shared);
c21d1a0f 181 }
658b4a4a 182 HeKEY_hek(ret) = shared;
c21d1a0f 183 }
d18c6117 184 else
19692e8d
NC
185 HeKEY_hek(ret) = save_hek_flags(HeKEY(e), HeKLEN(e), HeHASH(e),
186 HeKFLAGS(e));
a09252eb 187 HeVAL(ret) = sv_dup_inc(HeVAL(e), param);
d18c6117
GS
188 return ret;
189}
190#endif /* USE_ITHREADS */
191
1b1f1335 192static void
2393f1b9
JH
193S_hv_notallowed(pTHX_ int flags, const char *key, I32 klen,
194 const char *msg)
1b1f1335 195{
1b6737cc 196 SV * const sv = sv_newmortal();
7918f24d
NC
197
198 PERL_ARGS_ASSERT_HV_NOTALLOWED;
199
19692e8d 200 if (!(flags & HVhek_FREEKEY)) {
1b1f1335
NIS
201 sv_setpvn(sv, key, klen);
202 }
203 else {
204 /* Need to free saved eventually assign to mortal SV */
34c3c4e3 205 /* XXX is this line an error ???: SV *sv = sv_newmortal(); */
1b1f1335
NIS
206 sv_usepvn(sv, (char *) key, klen);
207 }
19692e8d 208 if (flags & HVhek_UTF8) {
1b1f1335
NIS
209 SvUTF8_on(sv);
210 }
be2597df 211 Perl_croak(aTHX_ msg, SVfARG(sv));
1b1f1335
NIS
212}
213
fde52b5c 214/* (klen == HEf_SVKEY) is special for MAGICAL hv entries, meaning key slot
215 * contains an SV* */
216
34a6f7b4
NC
217/*
218=for apidoc hv_store
219
220Stores an SV in a hash. The hash key is specified as C<key> and C<klen> is
221the length of the key. The C<hash> parameter is the precomputed hash
222value; if it is zero then Perl will compute it. The return value will be
223NULL if the operation failed or if the value did not need to be actually
224stored within the hash (as in the case of tied hashes). Otherwise it can
225be dereferenced to get the original C<SV*>. Note that the caller is
226responsible for suitably incrementing the reference count of C<val> before
227the call, and decrementing it if the function returned NULL. Effectively
228a successful hv_store takes ownership of one reference to C<val>. This is
229usually what you want; a newly created SV has a reference count of one, so
230if all your code does is create SVs then store them in a hash, hv_store
231will own the only reference to the new SV, and your code doesn't need to do
232anything further to tidy up. hv_store is not implemented as a call to
233hv_store_ent, and does not create a temporary SV for the key, so if your
234key data is not already in SV form then use hv_store in preference to
235hv_store_ent.
236
237See L<perlguts/"Understanding the Magic of Tied Hashes and Arrays"> for more
238information on how to use this function on tied hashes.
239
34a6f7b4
NC
240=for apidoc hv_store_ent
241
242Stores C<val> in a hash. The hash key is specified as C<key>. The C<hash>
243parameter is the precomputed hash value; if it is zero then Perl will
244compute it. The return value is the new hash entry so created. It will be
245NULL if the operation failed or if the value did not need to be actually
246stored within the hash (as in the case of tied hashes). Otherwise the
247contents of the return value can be accessed using the C<He?> macros
248described here. Note that the caller is responsible for suitably
249incrementing the reference count of C<val> before the call, and
250decrementing it if the function returned NULL. Effectively a successful
251hv_store_ent takes ownership of one reference to C<val>. This is
252usually what you want; a newly created SV has a reference count of one, so
253if all your code does is create SVs then store them in a hash, hv_store
254will own the only reference to the new SV, and your code doesn't need to do
255anything further to tidy up. Note that hv_store_ent only reads the C<key>;
256unlike C<val> it does not take ownership of it, so maintaining the correct
257reference count on C<key> is entirely the caller's responsibility. hv_store
258is not implemented as a call to hv_store_ent, and does not create a temporary
259SV for the key, so if your key data is not already in SV form then use
260hv_store in preference to hv_store_ent.
261
262See L<perlguts/"Understanding the Magic of Tied Hashes and Arrays"> for more
263information on how to use this function on tied hashes.
264
34a6f7b4
NC
265=for apidoc hv_exists
266
267Returns a boolean indicating whether the specified hash key exists. The
268C<klen> is the length of the key.
269
954c1994
GS
270=for apidoc hv_fetch
271
272Returns the SV which corresponds to the specified key in the hash. The
273C<klen> is the length of the key. If C<lval> is set then the fetch will be
274part of a store. Check that the return value is non-null before
d1be9408 275dereferencing it to an C<SV*>.
954c1994 276
96f1132b 277See L<perlguts/"Understanding the Magic of Tied Hashes and Arrays"> for more
954c1994
GS
278information on how to use this function on tied hashes.
279
34a6f7b4
NC
280=for apidoc hv_exists_ent
281
282Returns a boolean indicating whether the specified hash key exists. C<hash>
283can be a valid precomputed hash value, or 0 to ask for it to be
284computed.
285
286=cut
287*/
288
d1be9408 289/* returns an HE * structure with all the fields set */
fde52b5c 290/* note that hent_val will be a mortal sv for MAGICAL hashes */
954c1994
GS
291/*
292=for apidoc hv_fetch_ent
293
294Returns the hash entry which corresponds to the specified key in the hash.
295C<hash> must be a valid precomputed hash number for the given C<key>, or 0
296if you want the function to compute it. If C<lval> is set then the fetch
297will be part of a store. Make sure the return value is non-null before
b24b84ef 298accessing it. The return value when C<hv> is a tied hash is a pointer to a
954c1994 299static location, so be sure to make a copy of the structure if you need to
1c846c1f 300store it somewhere.
954c1994 301
96f1132b 302See L<perlguts/"Understanding the Magic of Tied Hashes and Arrays"> for more
954c1994
GS
303information on how to use this function on tied hashes.
304
305=cut
306*/
307
a038e571
NC
308/* Common code for hv_delete()/hv_exists()/hv_fetch()/hv_store() */
309void *
310Perl_hv_common_key_len(pTHX_ HV *hv, const char *key, I32 klen_i32,
311 const int action, SV *val, const U32 hash)
312{
313 STRLEN klen;
314 int flags;
315
7918f24d
NC
316 PERL_ARGS_ASSERT_HV_COMMON_KEY_LEN;
317
a038e571
NC
318 if (klen_i32 < 0) {
319 klen = -klen_i32;
320 flags = HVhek_UTF8;
321 } else {
322 klen = klen_i32;
323 flags = 0;
324 }
325 return hv_common(hv, NULL, key, klen, flags, action, val, hash);
326}
327
63c89345 328void *
d3ba3f5c
NC
329Perl_hv_common(pTHX_ HV *hv, SV *keysv, const char *key, STRLEN klen,
330 int flags, int action, SV *val, register U32 hash)
113738bb 331{
27da23d5 332 dVAR;
b2c64049 333 XPVHV* xhv;
b2c64049
NC
334 HE *entry;
335 HE **oentry;
fde52b5c 336 SV *sv;
da58a35d 337 bool is_utf8;
113738bb 338 int masked_flags;
3c84c864 339 const int return_svp = action & HV_FETCH_JUST_SV;
fde52b5c 340
341 if (!hv)
a4fc7abc 342 return NULL;
8265e3d1
NC
343 if (SvTYPE(hv) == SVTYPEMASK)
344 return NULL;
345
346 assert(SvTYPE(hv) == SVt_PVHV);
fde52b5c 347
bdee33e4 348 if (SvSMAGICAL(hv) && SvGMAGICAL(hv) && !(action & HV_DISABLE_UVAR_XKEY)) {
fda2d18a 349 MAGIC* mg;
ad64d0ec 350 if ((mg = mg_find((const SV *)hv, PERL_MAGIC_uvar))) {
fda2d18a
NC
351 struct ufuncs * const uf = (struct ufuncs *)mg->mg_ptr;
352 if (uf->uf_set == NULL) {
353 SV* obj = mg->mg_obj;
354
355 if (!keysv) {
59cd0e26
NC
356 keysv = newSVpvn_flags(key, klen, SVs_TEMP |
357 ((flags & HVhek_UTF8)
358 ? SVf_UTF8 : 0));
fda2d18a
NC
359 }
360
361 mg->mg_obj = keysv; /* pass key */
362 uf->uf_index = action; /* pass action */
ad64d0ec 363 magic_getuvar(MUTABLE_SV(hv), mg);
fda2d18a
NC
364 keysv = mg->mg_obj; /* may have changed */
365 mg->mg_obj = obj;
366
367 /* If the key may have changed, then we need to invalidate
368 any passed-in computed hash value. */
369 hash = 0;
370 }
371 }
bdee33e4 372 }
113738bb 373 if (keysv) {
e593d2fe
AE
374 if (flags & HVhek_FREEKEY)
375 Safefree(key);
5c144d81 376 key = SvPV_const(keysv, klen);
113738bb 377 is_utf8 = (SvUTF8(keysv) != 0);
44b87b50
NC
378 if (SvIsCOW_shared_hash(keysv)) {
379 flags = HVhek_KEYCANONICAL | (is_utf8 ? HVhek_UTF8 : 0);
380 } else {
381 flags = 0;
382 }
113738bb 383 } else {
c1fe5510 384 is_utf8 = ((flags & HVhek_UTF8) ? TRUE : FALSE);
113738bb 385 }
113738bb 386
9dbc5603 387 if (action & HV_DELETE) {
3c84c864
NC
388 return (void *) hv_delete_common(hv, keysv, key, klen,
389 flags | (is_utf8 ? HVhek_UTF8 : 0),
390 action, hash);
9dbc5603
NC
391 }
392
b2c64049 393 xhv = (XPVHV*)SvANY(hv);
7f66fda2 394 if (SvMAGICAL(hv)) {
6136c704 395 if (SvRMAGICAL(hv) && !(action & (HV_FETCH_ISSTORE|HV_FETCH_ISEXISTS))) {
ad64d0ec
NC
396 if (mg_find((const SV *)hv, PERL_MAGIC_tied)
397 || SvGMAGICAL((const SV *)hv))
e62cc96a 398 {
3c84c864 399 /* FIXME should be able to skimp on the HE/HEK here when
7f66fda2 400 HV_FETCH_JUST_SV is true. */
7f66fda2 401 if (!keysv) {
740cce10
NC
402 keysv = newSVpvn_utf8(key, klen, is_utf8);
403 } else {
7f66fda2 404 keysv = newSVsv(keysv);
113738bb 405 }
44a2ac75 406 sv = sv_newmortal();
ad64d0ec 407 mg_copy(MUTABLE_SV(hv), sv, (char *)keysv, HEf_SVKEY);
7f66fda2
NC
408
409 /* grab a fake HE/HEK pair from the pool or make a new one */
410 entry = PL_hv_fetch_ent_mh;
411 if (entry)
412 PL_hv_fetch_ent_mh = HeNEXT(entry);
413 else {
414 char *k;
415 entry = new_HE();
ad64d0ec 416 Newx(k, HEK_BASESIZE + sizeof(const SV *), char);
7f66fda2
NC
417 HeKEY_hek(entry) = (HEK*)k;
418 }
4608196e 419 HeNEXT(entry) = NULL;
7f66fda2
NC
420 HeSVKEY_set(entry, keysv);
421 HeVAL(entry) = sv;
422 sv_upgrade(sv, SVt_PVLV);
423 LvTYPE(sv) = 'T';
424 /* so we can free entry when freeing sv */
ad64d0ec 425 LvTARG(sv) = MUTABLE_SV(entry);
7f66fda2
NC
426
427 /* XXX remove at some point? */
428 if (flags & HVhek_FREEKEY)
429 Safefree(key);
430
3c84c864
NC
431 if (return_svp) {
432 return entry ? (void *) &HeVAL(entry) : NULL;
433 }
434 return (void *) entry;
113738bb 435 }
7f66fda2 436#ifdef ENV_IS_CASELESS
ad64d0ec 437 else if (mg_find((const SV *)hv, PERL_MAGIC_env)) {
7f66fda2
NC
438 U32 i;
439 for (i = 0; i < klen; ++i)
440 if (isLOWER(key[i])) {
086cb327
NC
441 /* Would be nice if we had a routine to do the
442 copy and upercase in a single pass through. */
0bd48802 443 const char * const nkey = strupr(savepvn(key,klen));
086cb327
NC
444 /* Note that this fetch is for nkey (the uppercased
445 key) whereas the store is for key (the original) */
63c89345
NC
446 void *result = hv_common(hv, NULL, nkey, klen,
447 HVhek_FREEKEY, /* free nkey */
448 0 /* non-LVAL fetch */
3c84c864
NC
449 | HV_DISABLE_UVAR_XKEY
450 | return_svp,
63c89345
NC
451 NULL /* no value */,
452 0 /* compute hash */);
26488bcf 453 if (!result && (action & HV_FETCH_LVALUE)) {
086cb327
NC
454 /* This call will free key if necessary.
455 Do it this way to encourage compiler to tail
456 call optimise. */
63c89345
NC
457 result = hv_common(hv, keysv, key, klen, flags,
458 HV_FETCH_ISSTORE
3c84c864
NC
459 | HV_DISABLE_UVAR_XKEY
460 | return_svp,
63c89345 461 newSV(0), hash);
086cb327
NC
462 } else {
463 if (flags & HVhek_FREEKEY)
464 Safefree(key);
465 }
63c89345 466 return result;
7f66fda2 467 }
902173a3 468 }
7f66fda2
NC
469#endif
470 } /* ISFETCH */
471 else if (SvRMAGICAL(hv) && (action & HV_FETCH_ISEXISTS)) {
ad64d0ec
NC
472 if (mg_find((const SV *)hv, PERL_MAGIC_tied)
473 || SvGMAGICAL((const SV *)hv)) {
b2c64049
NC
474 /* I don't understand why hv_exists_ent has svret and sv,
475 whereas hv_exists only had one. */
9d4ba2ae 476 SV * const svret = sv_newmortal();
b2c64049 477 sv = sv_newmortal();
7f66fda2
NC
478
479 if (keysv || is_utf8) {
480 if (!keysv) {
740cce10 481 keysv = newSVpvn_utf8(key, klen, TRUE);
7f66fda2
NC
482 } else {
483 keysv = newSVsv(keysv);
484 }
ad64d0ec 485 mg_copy(MUTABLE_SV(hv), sv, (char *)sv_2mortal(keysv), HEf_SVKEY);
b2c64049 486 } else {
ad64d0ec 487 mg_copy(MUTABLE_SV(hv), sv, key, klen);
7f66fda2 488 }
b2c64049
NC
489 if (flags & HVhek_FREEKEY)
490 Safefree(key);
7f66fda2
NC
491 magic_existspack(svret, mg_find(sv, PERL_MAGIC_tiedelem));
492 /* This cast somewhat evil, but I'm merely using NULL/
493 not NULL to return the boolean exists.
494 And I know hv is not NULL. */
3c84c864 495 return SvTRUE(svret) ? (void *)hv : NULL;
e7152ba2 496 }
7f66fda2 497#ifdef ENV_IS_CASELESS
ad64d0ec 498 else if (mg_find((const SV *)hv, PERL_MAGIC_env)) {
7f66fda2 499 /* XXX This code isn't UTF8 clean. */
a15d23f8 500 char * const keysave = (char * const)key;
b2c64049
NC
501 /* Will need to free this, so set FREEKEY flag. */
502 key = savepvn(key,klen);
503 key = (const char*)strupr((char*)key);
6136c704 504 is_utf8 = FALSE;
7f66fda2 505 hash = 0;
8b4f7dd5 506 keysv = 0;
b2c64049
NC
507
508 if (flags & HVhek_FREEKEY) {
509 Safefree(keysave);
510 }
511 flags |= HVhek_FREEKEY;
7f66fda2 512 }
902173a3 513#endif
7f66fda2 514 } /* ISEXISTS */
b2c64049
NC
515 else if (action & HV_FETCH_ISSTORE) {
516 bool needs_copy;
517 bool needs_store;
518 hv_magic_check (hv, &needs_copy, &needs_store);
519 if (needs_copy) {
a3b680e6 520 const bool save_taint = PL_tainted;
b2c64049
NC
521 if (keysv || is_utf8) {
522 if (!keysv) {
740cce10 523 keysv = newSVpvn_utf8(key, klen, TRUE);
b2c64049
NC
524 }
525 if (PL_tainting)
526 PL_tainted = SvTAINTED(keysv);
527 keysv = sv_2mortal(newSVsv(keysv));
ad64d0ec 528 mg_copy(MUTABLE_SV(hv), val, (char*)keysv, HEf_SVKEY);
b2c64049 529 } else {
ad64d0ec 530 mg_copy(MUTABLE_SV(hv), val, key, klen);
b2c64049
NC
531 }
532
533 TAINT_IF(save_taint);
1baaf5d7 534 if (!needs_store) {
b2c64049
NC
535 if (flags & HVhek_FREEKEY)
536 Safefree(key);
4608196e 537 return NULL;
b2c64049
NC
538 }
539#ifdef ENV_IS_CASELESS
ad64d0ec 540 else if (mg_find((const SV *)hv, PERL_MAGIC_env)) {
b2c64049
NC
541 /* XXX This code isn't UTF8 clean. */
542 const char *keysave = key;
543 /* Will need to free this, so set FREEKEY flag. */
544 key = savepvn(key,klen);
545 key = (const char*)strupr((char*)key);
6136c704 546 is_utf8 = FALSE;
b2c64049 547 hash = 0;
8b4f7dd5 548 keysv = 0;
b2c64049
NC
549
550 if (flags & HVhek_FREEKEY) {
551 Safefree(keysave);
552 }
553 flags |= HVhek_FREEKEY;
554 }
555#endif
556 }
557 } /* ISSTORE */
7f66fda2 558 } /* SvMAGICAL */
fde52b5c 559
7b2c381c 560 if (!HvARRAY(hv)) {
b2c64049 561 if ((action & (HV_FETCH_LVALUE | HV_FETCH_ISSTORE))
fde52b5c 562#ifdef DYNAMIC_ENV_FETCH /* if it's an %ENV lookup, we may get it on the fly */
ad64d0ec
NC
563 || (SvRMAGICAL((const SV *)hv)
564 && mg_find((const SV *)hv, PERL_MAGIC_env))
fde52b5c 565#endif
d58e6666
NC
566 ) {
567 char *array;
a02a5408 568 Newxz(array,
cbec9347 569 PERL_HV_ARRAY_ALLOC_BYTES(xhv->xhv_max+1 /* HvMAX(hv)+1 */),
d58e6666
NC
570 char);
571 HvARRAY(hv) = (HE**)array;
572 }
7f66fda2
NC
573#ifdef DYNAMIC_ENV_FETCH
574 else if (action & HV_FETCH_ISEXISTS) {
575 /* for an %ENV exists, if we do an insert it's by a recursive
576 store call, so avoid creating HvARRAY(hv) right now. */
577 }
578#endif
113738bb
NC
579 else {
580 /* XXX remove at some point? */
581 if (flags & HVhek_FREEKEY)
582 Safefree(key);
583
3c84c864 584 return NULL;
113738bb 585 }
fde52b5c 586 }
587
44b87b50 588 if (is_utf8 & !(flags & HVhek_KEYCANONICAL)) {
41d88b63 589 char * const keysave = (char *)key;
f9a63242 590 key = (char*)bytes_from_utf8((U8*)key, &klen, &is_utf8);
19692e8d 591 if (is_utf8)
c1fe5510
NC
592 flags |= HVhek_UTF8;
593 else
594 flags &= ~HVhek_UTF8;
7f66fda2
NC
595 if (key != keysave) {
596 if (flags & HVhek_FREEKEY)
597 Safefree(keysave);
19692e8d 598 flags |= HVhek_WASUTF8 | HVhek_FREEKEY;
527df579
NC
599 /* If the caller calculated a hash, it was on the sequence of
600 octets that are the UTF-8 form. We've now changed the sequence
601 of octets stored to that of the equivalent byte representation,
602 so the hash we need is different. */
603 hash = 0;
7f66fda2 604 }
19692e8d 605 }
f9a63242 606
4b5190b5
NC
607 if (HvREHASH(hv)) {
608 PERL_HASH_INTERNAL(hash, key, klen);
b2c64049
NC
609 /* We don't have a pointer to the hv, so we have to replicate the
610 flag into every HEK, so that hv_iterkeysv can see it. */
611 /* And yes, you do need this even though you are not "storing" because
fdcd69b6
NC
612 you can flip the flags below if doing an lval lookup. (And that
613 was put in to give the semantics Andreas was expecting.) */
614 flags |= HVhek_REHASH;
4b5190b5 615 } else if (!hash) {
113738bb 616 if (keysv && (SvIsCOW_shared_hash(keysv))) {
c158a4fd 617 hash = SvSHARED_HASH(keysv);
46187eeb
NC
618 } else {
619 PERL_HASH(hash, key, klen);
620 }
621 }
effa1e2d 622
113738bb
NC
623 masked_flags = (flags & HVhek_MASK);
624
7f66fda2 625#ifdef DYNAMIC_ENV_FETCH
4608196e 626 if (!HvARRAY(hv)) entry = NULL;
7f66fda2
NC
627 else
628#endif
b2c64049 629 {
7b2c381c 630 entry = (HvARRAY(hv))[hash & (I32) HvMAX(hv)];
b2c64049 631 }
0298d7b9 632 for (; entry; entry = HeNEXT(entry)) {
fde52b5c 633 if (HeHASH(entry) != hash) /* strings can't be equal */
634 continue;
eb160463 635 if (HeKLEN(entry) != (I32)klen)
fde52b5c 636 continue;
1c846c1f 637 if (HeKEY(entry) != key && memNE(HeKEY(entry),key,klen)) /* is this it? */
fde52b5c 638 continue;
113738bb 639 if ((HeKFLAGS(entry) ^ masked_flags) & HVhek_UTF8)
c3654f1a 640 continue;
b2c64049
NC
641
642 if (action & (HV_FETCH_LVALUE|HV_FETCH_ISSTORE)) {
643 if (HeKFLAGS(entry) != masked_flags) {
644 /* We match if HVhek_UTF8 bit in our flags and hash key's
645 match. But if entry was set previously with HVhek_WASUTF8
646 and key now doesn't (or vice versa) then we should change
647 the key's flag, as this is assignment. */
648 if (HvSHAREKEYS(hv)) {
649 /* Need to swap the key we have for a key with the flags we
650 need. As keys are shared we can't just write to the
651 flag, so we share the new one, unshare the old one. */
6136c704 652 HEK * const new_hek = share_hek_flags(key, klen, hash,
6e838c70 653 masked_flags);
b2c64049
NC
654 unshare_hek (HeKEY_hek(entry));
655 HeKEY_hek(entry) = new_hek;
656 }
5d2b1485
NC
657 else if (hv == PL_strtab) {
658 /* PL_strtab is usually the only hash without HvSHAREKEYS,
659 so putting this test here is cheap */
660 if (flags & HVhek_FREEKEY)
661 Safefree(key);
662 Perl_croak(aTHX_ S_strtab_error,
663 action & HV_FETCH_LVALUE ? "fetch" : "store");
664 }
b2c64049
NC
665 else
666 HeKFLAGS(entry) = masked_flags;
667 if (masked_flags & HVhek_ENABLEHVKFLAGS)
668 HvHASKFLAGS_on(hv);
669 }
670 if (HeVAL(entry) == &PL_sv_placeholder) {
671 /* yes, can store into placeholder slot */
672 if (action & HV_FETCH_LVALUE) {
673 if (SvMAGICAL(hv)) {
674 /* This preserves behaviour with the old hv_fetch
675 implementation which at this point would bail out
676 with a break; (at "if we find a placeholder, we
677 pretend we haven't found anything")
678
679 That break mean that if a placeholder were found, it
680 caused a call into hv_store, which in turn would
681 check magic, and if there is no magic end up pretty
682 much back at this point (in hv_store's code). */
683 break;
684 }
685 /* LVAL fetch which actaully needs a store. */
561b68a9 686 val = newSV(0);
ca732855 687 HvPLACEHOLDERS(hv)--;
b2c64049
NC
688 } else {
689 /* store */
690 if (val != &PL_sv_placeholder)
ca732855 691 HvPLACEHOLDERS(hv)--;
b2c64049
NC
692 }
693 HeVAL(entry) = val;
694 } else if (action & HV_FETCH_ISSTORE) {
cefd5c7c 695 SvREFCNT_dec(HeVAL(entry));
b2c64049
NC
696 HeVAL(entry) = val;
697 }
27bcc0a7 698 } else if (HeVAL(entry) == &PL_sv_placeholder) {
b2c64049
NC
699 /* if we find a placeholder, we pretend we haven't found
700 anything */
8aacddc1 701 break;
b2c64049 702 }
113738bb
NC
703 if (flags & HVhek_FREEKEY)
704 Safefree(key);
3c84c864
NC
705 if (return_svp) {
706 return entry ? (void *) &HeVAL(entry) : NULL;
707 }
fde52b5c 708 return entry;
709 }
710#ifdef DYNAMIC_ENV_FETCH /* %ENV lookup? If so, try to fetch the value now */
0ed29950 711 if (!(action & HV_FETCH_ISSTORE)
ad64d0ec
NC
712 && SvRMAGICAL((const SV *)hv)
713 && mg_find((const SV *)hv, PERL_MAGIC_env)) {
a6c40364 714 unsigned long len;
9d4ba2ae 715 const char * const env = PerlEnv_ENVgetenv_len(key,&len);
a6c40364
GS
716 if (env) {
717 sv = newSVpvn(env,len);
718 SvTAINTED_on(sv);
d3ba3f5c 719 return hv_common(hv, keysv, key, klen, flags,
3c84c864
NC
720 HV_FETCH_ISSTORE|HV_DISABLE_UVAR_XKEY|return_svp,
721 sv, hash);
a6c40364 722 }
fde52b5c 723 }
724#endif
7f66fda2
NC
725
726 if (!entry && SvREADONLY(hv) && !(action & HV_FETCH_ISEXISTS)) {
c445ea15 727 hv_notallowed(flags, key, klen,
c8cd6465
NC
728 "Attempt to access disallowed key '%"SVf"' in"
729 " a restricted hash");
1b1f1335 730 }
b2c64049
NC
731 if (!(action & (HV_FETCH_LVALUE|HV_FETCH_ISSTORE))) {
732 /* Not doing some form of store, so return failure. */
733 if (flags & HVhek_FREEKEY)
734 Safefree(key);
3c84c864 735 return NULL;
b2c64049 736 }
113738bb 737 if (action & HV_FETCH_LVALUE) {
df5f182b 738 val = action & HV_FETCH_EMPTY_HE ? NULL : newSV(0);
b2c64049
NC
739 if (SvMAGICAL(hv)) {
740 /* At this point the old hv_fetch code would call to hv_store,
741 which in turn might do some tied magic. So we need to make that
742 magic check happen. */
743 /* gonna assign to this, so it better be there */
fda2d18a
NC
744 /* If a fetch-as-store fails on the fetch, then the action is to
745 recurse once into "hv_store". If we didn't do this, then that
746 recursive call would call the key conversion routine again.
747 However, as we replace the original key with the converted
748 key, this would result in a double conversion, which would show
749 up as a bug if the conversion routine is not idempotent. */
d3ba3f5c 750 return hv_common(hv, keysv, key, klen, flags,
3c84c864
NC
751 HV_FETCH_ISSTORE|HV_DISABLE_UVAR_XKEY|return_svp,
752 val, hash);
b2c64049
NC
753 /* XXX Surely that could leak if the fetch-was-store fails?
754 Just like the hv_fetch. */
113738bb
NC
755 }
756 }
757
b2c64049
NC
758 /* Welcome to hv_store... */
759
7b2c381c 760 if (!HvARRAY(hv)) {
b2c64049
NC
761 /* Not sure if we can get here. I think the only case of oentry being
762 NULL is for %ENV with dynamic env fetch. But that should disappear
763 with magic in the previous code. */
d58e6666 764 char *array;
a02a5408 765 Newxz(array,
b2c64049 766 PERL_HV_ARRAY_ALLOC_BYTES(xhv->xhv_max+1 /* HvMAX(hv)+1 */),
d58e6666
NC
767 char);
768 HvARRAY(hv) = (HE**)array;
b2c64049
NC
769 }
770
7b2c381c 771 oentry = &(HvARRAY(hv))[hash & (I32) xhv->xhv_max];
ab4af705 772
b2c64049
NC
773 entry = new_HE();
774 /* share_hek_flags will do the free for us. This might be considered
775 bad API design. */
776 if (HvSHAREKEYS(hv))
6e838c70 777 HeKEY_hek(entry) = share_hek_flags(key, klen, hash, flags);
5d2b1485
NC
778 else if (hv == PL_strtab) {
779 /* PL_strtab is usually the only hash without HvSHAREKEYS, so putting
780 this test here is cheap */
781 if (flags & HVhek_FREEKEY)
782 Safefree(key);
783 Perl_croak(aTHX_ S_strtab_error,
784 action & HV_FETCH_LVALUE ? "fetch" : "store");
785 }
b2c64049
NC
786 else /* gotta do the real thing */
787 HeKEY_hek(entry) = save_hek_flags(key, klen, hash, flags);
788 HeVAL(entry) = val;
789 HeNEXT(entry) = *oentry;
790 *oentry = entry;
791
792 if (val == &PL_sv_placeholder)
ca732855 793 HvPLACEHOLDERS(hv)++;
b2c64049
NC
794 if (masked_flags & HVhek_ENABLEHVKFLAGS)
795 HvHASKFLAGS_on(hv);
796
0298d7b9
NC
797 {
798 const HE *counter = HeNEXT(entry);
799
4c7185a0 800 xhv->xhv_keys++; /* HvTOTALKEYS(hv)++ */
0298d7b9 801 if (!counter) { /* initial entry? */
5ac36297 802 } else if (xhv->xhv_keys > xhv->xhv_max) {
0298d7b9
NC
803 hsplit(hv);
804 } else if(!HvREHASH(hv)) {
805 U32 n_links = 1;
806
807 while ((counter = HeNEXT(counter)))
808 n_links++;
809
810 if (n_links > HV_MAX_LENGTH_BEFORE_SPLIT) {
811 /* Use only the old HvKEYS(hv) > HvMAX(hv) condition to limit
812 bucket splits on a rehashed hash, as we're not going to
813 split it again, and if someone is lucky (evil) enough to
814 get all the keys in one list they could exhaust our memory
815 as we repeatedly double the number of buckets on every
816 entry. Linear search feels a less worse thing to do. */
817 hsplit(hv);
818 }
819 }
fde52b5c 820 }
b2c64049 821
3c84c864
NC
822 if (return_svp) {
823 return entry ? (void *) &HeVAL(entry) : NULL;
824 }
825 return (void *) entry;
fde52b5c 826}
827
864dbfa3 828STATIC void
b0e6ae5b 829S_hv_magic_check(HV *hv, bool *needs_copy, bool *needs_store)
d0066dc7 830{
a3b680e6 831 const MAGIC *mg = SvMAGIC(hv);
7918f24d
NC
832
833 PERL_ARGS_ASSERT_HV_MAGIC_CHECK;
834
d0066dc7
OT
835 *needs_copy = FALSE;
836 *needs_store = TRUE;
837 while (mg) {
838 if (isUPPER(mg->mg_type)) {
839 *needs_copy = TRUE;
d60c5a05 840 if (mg->mg_type == PERL_MAGIC_tied) {
d0066dc7 841 *needs_store = FALSE;
4ab2a30b 842 return; /* We've set all there is to set. */
d0066dc7
OT
843 }
844 }
845 mg = mg->mg_moremagic;
846 }
847}
848
954c1994 849/*
a3bcc51e
TP
850=for apidoc hv_scalar
851
852Evaluates the hash in scalar context and returns the result. Handles magic when the hash is tied.
853
854=cut
855*/
856
857SV *
858Perl_hv_scalar(pTHX_ HV *hv)
859{
a3bcc51e 860 SV *sv;
823a54a3 861
7918f24d
NC
862 PERL_ARGS_ASSERT_HV_SCALAR;
863
823a54a3 864 if (SvRMAGICAL(hv)) {
ad64d0ec 865 MAGIC * const mg = mg_find((const SV *)hv, PERL_MAGIC_tied);
823a54a3
AL
866 if (mg)
867 return magic_scalarpack(hv, mg);
868 }
a3bcc51e
TP
869
870 sv = sv_newmortal();
f4431c56 871 if (HvTOTALKEYS((const HV *)hv))
a3bcc51e
TP
872 Perl_sv_setpvf(aTHX_ sv, "%ld/%ld",
873 (long)HvFILL(hv), (long)HvMAX(hv) + 1);
874 else
875 sv_setiv(sv, 0);
876
877 return sv;
878}
879
880/*
954c1994
GS
881=for apidoc hv_delete
882
3025a2e4
CS
883Deletes a key/value pair in the hash. The value's SV is removed from the
884hash, made mortal, and returned to the caller. The C<klen> is the length of
885the key. The C<flags> value will normally be zero; if set to G_DISCARD then
886NULL will be returned. NULL will also be returned if the key is not found.
954c1994 887
954c1994
GS
888=for apidoc hv_delete_ent
889
3025a2e4
CS
890Deletes a key/value pair in the hash. The value SV is removed from the hash,
891made mortal, and returned to the caller. The C<flags> value will normally be
892zero; if set to G_DISCARD then NULL will be returned. NULL will also be
893returned if the key is not found. C<hash> can be a valid precomputed hash
894value, or 0 to ask for it to be computed.
954c1994
GS
895
896=cut
897*/
898
8f8d40ab 899STATIC SV *
cd6d36ac
NC
900S_hv_delete_common(pTHX_ HV *hv, SV *keysv, const char *key, STRLEN klen,
901 int k_flags, I32 d_flags, U32 hash)
f1317c8d 902{
27da23d5 903 dVAR;
cbec9347 904 register XPVHV* xhv;
fde52b5c 905 register HE *entry;
906 register HE **oentry;
9e720f71 907 HE *const *first_entry;
9dbc5603 908 bool is_utf8 = (k_flags & HVhek_UTF8) ? TRUE : FALSE;
7a9669ca 909 int masked_flags;
1c846c1f 910
fde52b5c 911 if (SvRMAGICAL(hv)) {
0a0bb7c7
OT
912 bool needs_copy;
913 bool needs_store;
914 hv_magic_check (hv, &needs_copy, &needs_store);
915
f1317c8d 916 if (needs_copy) {
6136c704 917 SV *sv;
63c89345
NC
918 entry = (HE *) hv_common(hv, keysv, key, klen,
919 k_flags & ~HVhek_FREEKEY,
920 HV_FETCH_LVALUE|HV_DISABLE_UVAR_XKEY,
921 NULL, hash);
7a9669ca 922 sv = entry ? HeVAL(entry) : NULL;
f1317c8d
NC
923 if (sv) {
924 if (SvMAGICAL(sv)) {
925 mg_clear(sv);
926 }
927 if (!needs_store) {
928 if (mg_find(sv, PERL_MAGIC_tiedelem)) {
929 /* No longer an element */
930 sv_unmagic(sv, PERL_MAGIC_tiedelem);
931 return sv;
932 }
a0714e2c 933 return NULL; /* element cannot be deleted */
f1317c8d 934 }
902173a3 935#ifdef ENV_IS_CASELESS
ad64d0ec 936 else if (mg_find((const SV *)hv, PERL_MAGIC_env)) {
8167a60a 937 /* XXX This code isn't UTF8 clean. */
59cd0e26 938 keysv = newSVpvn_flags(key, klen, SVs_TEMP);
8167a60a
NC
939 if (k_flags & HVhek_FREEKEY) {
940 Safefree(key);
941 }
942 key = strupr(SvPVX(keysv));
943 is_utf8 = 0;
944 k_flags = 0;
945 hash = 0;
7f66fda2 946 }
510ac311 947#endif
2fd1c6b8 948 }
2fd1c6b8 949 }
fde52b5c 950 }
cbec9347 951 xhv = (XPVHV*)SvANY(hv);
7b2c381c 952 if (!HvARRAY(hv))
a0714e2c 953 return NULL;
fde52b5c 954
19692e8d 955 if (is_utf8) {
c445ea15 956 const char * const keysave = key;
b464bac0 957 key = (char*)bytes_from_utf8((U8*)key, &klen, &is_utf8);
cd6d36ac 958
19692e8d 959 if (is_utf8)
cd6d36ac
NC
960 k_flags |= HVhek_UTF8;
961 else
962 k_flags &= ~HVhek_UTF8;
7f66fda2
NC
963 if (key != keysave) {
964 if (k_flags & HVhek_FREEKEY) {
965 /* This shouldn't happen if our caller does what we expect,
966 but strictly the API allows it. */
967 Safefree(keysave);
968 }
969 k_flags |= HVhek_WASUTF8 | HVhek_FREEKEY;
970 }
ad64d0ec 971 HvHASKFLAGS_on(MUTABLE_SV(hv));
19692e8d 972 }
f9a63242 973
4b5190b5
NC
974 if (HvREHASH(hv)) {
975 PERL_HASH_INTERNAL(hash, key, klen);
976 } else if (!hash) {
7a9669ca 977 if (keysv && (SvIsCOW_shared_hash(keysv))) {
c158a4fd 978 hash = SvSHARED_HASH(keysv);
7a9669ca
NC
979 } else {
980 PERL_HASH(hash, key, klen);
981 }
4b5190b5 982 }
fde52b5c 983
7a9669ca
NC
984 masked_flags = (k_flags & HVhek_MASK);
985
9e720f71 986 first_entry = oentry = &(HvARRAY(hv))[hash & (I32) HvMAX(hv)];
fde52b5c 987 entry = *oentry;
9e720f71 988 for (; entry; oentry = &HeNEXT(entry), entry = *oentry) {
6136c704 989 SV *sv;
f3d2f32d 990 U8 mro_changes = 0; /* 1 = isa; 2 = package moved */
0290c710 991 GV *gv = NULL;
0c3bb3c2
FC
992 HV *stash = NULL;
993
fde52b5c 994 if (HeHASH(entry) != hash) /* strings can't be equal */
995 continue;
eb160463 996 if (HeKLEN(entry) != (I32)klen)
fde52b5c 997 continue;
1c846c1f 998 if (HeKEY(entry) != key && memNE(HeKEY(entry),key,klen)) /* is this it? */
fde52b5c 999 continue;
7a9669ca 1000 if ((HeKFLAGS(entry) ^ masked_flags) & HVhek_UTF8)
c3654f1a 1001 continue;
8aacddc1 1002
5d2b1485
NC
1003 if (hv == PL_strtab) {
1004 if (k_flags & HVhek_FREEKEY)
1005 Safefree(key);
1006 Perl_croak(aTHX_ S_strtab_error, "delete");
1007 }
1008
8aacddc1 1009 /* if placeholder is here, it's already been deleted.... */
6136c704
AL
1010 if (HeVAL(entry) == &PL_sv_placeholder) {
1011 if (k_flags & HVhek_FREEKEY)
1012 Safefree(key);
1013 return NULL;
8aacddc1 1014 }
6136c704 1015 if (SvREADONLY(hv) && HeVAL(entry) && SvREADONLY(HeVAL(entry))) {
d4c19fe8 1016 hv_notallowed(k_flags, key, klen,
c8cd6465
NC
1017 "Attempt to delete readonly key '%"SVf"' from"
1018 " a restricted hash");
8aacddc1 1019 }
b84d0860
NC
1020 if (k_flags & HVhek_FREEKEY)
1021 Safefree(key);
8aacddc1 1022
35759254 1023 /* If this is a stash and the key ends with ::, then someone is
0c3bb3c2 1024 * deleting a package.
0c3bb3c2 1025 */
78b79c77 1026 if (HeVAL(entry) && HvENAME_get(hv)) {
0290c710 1027 gv = (GV *)HeVAL(entry);
35759254
FC
1028 if (keysv) key = SvPV(keysv, klen);
1029 if (klen > 1 && key[klen-2] == ':' && key[klen-1] == ':'
e0a52395 1030 && (klen != 6 || hv!=PL_defstash || memNE(key,"main::",6))
0290c710 1031 && SvTYPE(gv) == SVt_PVGV && (stash = GvHV((GV *)gv))
0c3bb3c2 1032 && HvENAME_get(stash)) {
0290c710
FC
1033 /* A previous version of this code checked that the
1034 * GV was still in the symbol table by fetching the
1035 * GV with its name. That is not necessary (and
1036 * sometimes incorrect), as HvENAME cannot be set
1037 * on hv if it is not in the symtab. */
f3d2f32d 1038 mro_changes = 2;
0c3bb3c2
FC
1039 /* Hang on to it for a bit. */
1040 SvREFCNT_inc_simple_void_NN(
0290c710 1041 sv_2mortal((SV *)gv)
35759254
FC
1042 );
1043 }
f3d2f32d
FC
1044 else if (klen == 3 && strnEQ(key, "ISA", 3))
1045 mro_changes = 1;
35759254
FC
1046 }
1047
cd6d36ac 1048 if (d_flags & G_DISCARD)
a0714e2c 1049 sv = NULL;
94f7643d 1050 else {
79d01fbf 1051 sv = sv_2mortal(HeVAL(entry));
7996736c 1052 HeVAL(entry) = &PL_sv_placeholder;
94f7643d 1053 }
8aacddc1
NIS
1054
1055 /*
1056 * If a restricted hash, rather than really deleting the entry, put
1057 * a placeholder there. This marks the key as being "approved", so
1058 * we can still access via not-really-existing key without raising
1059 * an error.
1060 */
1061 if (SvREADONLY(hv)) {
754604c4 1062 SvREFCNT_dec(HeVAL(entry));
7996736c 1063 HeVAL(entry) = &PL_sv_placeholder;
8aacddc1
NIS
1064 /* We'll be saving this slot, so the number of allocated keys
1065 * doesn't go down, but the number placeholders goes up */
ca732855 1066 HvPLACEHOLDERS(hv)++;
8aacddc1 1067 } else {
a26e96df 1068 *oentry = HeNEXT(entry);
b79f7545 1069 if (SvOOK(hv) && entry == HvAUX(hv)->xhv_eiter /* HvEITER(hv) */)
8aacddc1
NIS
1070 HvLAZYDEL_on(hv);
1071 else
1072 hv_free_ent(hv, entry);
4c7185a0 1073 xhv->xhv_keys--; /* HvTOTALKEYS(hv)-- */
574c8022 1074 if (xhv->xhv_keys == 0)
19692e8d 1075 HvHASKFLAGS_off(hv);
8aacddc1 1076 }
0c3bb3c2 1077
f3d2f32d
FC
1078 if (mro_changes == 1) mro_isa_changed_in(hv);
1079 else if (mro_changes == 2)
afdbe55d 1080 mro_package_moved(NULL, stash, gv, 1);
0c3bb3c2 1081
79072805
LW
1082 return sv;
1083 }
8aacddc1 1084 if (SvREADONLY(hv)) {
d4c19fe8 1085 hv_notallowed(k_flags, key, klen,
c8cd6465
NC
1086 "Attempt to delete disallowed key '%"SVf"' from"
1087 " a restricted hash");
8aacddc1
NIS
1088 }
1089
19692e8d 1090 if (k_flags & HVhek_FREEKEY)
f9a63242 1091 Safefree(key);
a0714e2c 1092 return NULL;
79072805
LW
1093}
1094
76e3520e 1095STATIC void
cea2e8a9 1096S_hsplit(pTHX_ HV *hv)
79072805 1097{
97aff369 1098 dVAR;
1e05feb3 1099 register XPVHV* const xhv = (XPVHV*)SvANY(hv);
a3b680e6 1100 const I32 oldsize = (I32) xhv->xhv_max+1; /* HvMAX(hv)+1 (sick) */
79072805
LW
1101 register I32 newsize = oldsize * 2;
1102 register I32 i;
7b2c381c 1103 char *a = (char*) HvARRAY(hv);
72311751 1104 register HE **aep;
4b5190b5
NC
1105 int longest_chain = 0;
1106 int was_shared;
79072805 1107
7918f24d
NC
1108 PERL_ARGS_ASSERT_HSPLIT;
1109
18026298 1110 /*PerlIO_printf(PerlIO_stderr(), "hsplit called for %p which had %d\n",
6c9570dc 1111 (void*)hv, (int) oldsize);*/
18026298 1112
5d88ecd7 1113 if (HvPLACEHOLDERS_get(hv) && !SvREADONLY(hv)) {
18026298
NC
1114 /* Can make this clear any placeholders first for non-restricted hashes,
1115 even though Storable rebuilds restricted hashes by putting in all the
1116 placeholders (first) before turning on the readonly flag, because
1117 Storable always pre-splits the hash. */
1118 hv_clear_placeholders(hv);
1119 }
1120
3280af22 1121 PL_nomemok = TRUE;
8d6dde3e 1122#if defined(STRANGE_MALLOC) || defined(MYMALLOC)
b79f7545
NC
1123 Renew(a, PERL_HV_ARRAY_ALLOC_BYTES(newsize)
1124 + (SvOOK(hv) ? sizeof(struct xpvhv_aux) : 0), char);
422a93e5 1125 if (!a) {
4a33f861 1126 PL_nomemok = FALSE;
422a93e5
GA
1127 return;
1128 }
b79f7545 1129 if (SvOOK(hv)) {
31f0e52e 1130 Move(&a[oldsize * sizeof(HE*)], &a[newsize * sizeof(HE*)], 1, struct xpvhv_aux);
b79f7545 1131 }
4633a7c4 1132#else
a02a5408 1133 Newx(a, PERL_HV_ARRAY_ALLOC_BYTES(newsize)
b79f7545 1134 + (SvOOK(hv) ? sizeof(struct xpvhv_aux) : 0), char);
422a93e5 1135 if (!a) {
3280af22 1136 PL_nomemok = FALSE;
422a93e5
GA
1137 return;
1138 }
7b2c381c 1139 Copy(HvARRAY(hv), a, oldsize * sizeof(HE*), char);
b79f7545
NC
1140 if (SvOOK(hv)) {
1141 Copy(HvAUX(hv), &a[newsize * sizeof(HE*)], 1, struct xpvhv_aux);
1142 }
9a87bd09 1143 Safefree(HvARRAY(hv));
4633a7c4
LW
1144#endif
1145
3280af22 1146 PL_nomemok = FALSE;
72311751 1147 Zero(&a[oldsize * sizeof(HE*)], (newsize-oldsize) * sizeof(HE*), char); /* zero 2nd half*/
cbec9347 1148 xhv->xhv_max = --newsize; /* HvMAX(hv) = --newsize */
7b2c381c 1149 HvARRAY(hv) = (HE**) a;
72311751 1150 aep = (HE**)a;
79072805 1151
72311751 1152 for (i=0; i<oldsize; i++,aep++) {
4b5190b5
NC
1153 int left_length = 0;
1154 int right_length = 0;
a50a3493
NC
1155 HE **oentry = aep;
1156 HE *entry = *aep;
a3b680e6 1157 register HE **bep;
4b5190b5 1158
a50a3493 1159 if (!entry) /* non-existent */
79072805 1160 continue;
72311751 1161 bep = aep+oldsize;
4c9d89c5 1162 do {
eb160463 1163 if ((HeHASH(entry) & newsize) != (U32)i) {
fde52b5c 1164 *oentry = HeNEXT(entry);
72311751 1165 HeNEXT(entry) = *bep;
72311751 1166 *bep = entry;
4b5190b5 1167 right_length++;
79072805 1168 }
4b5190b5 1169 else {
fde52b5c 1170 oentry = &HeNEXT(entry);
4b5190b5
NC
1171 left_length++;
1172 }
4c9d89c5
NC
1173 entry = *oentry;
1174 } while (entry);
4b5190b5
NC
1175 /* I think we don't actually need to keep track of the longest length,
1176 merely flag if anything is too long. But for the moment while
1177 developing this code I'll track it. */
1178 if (left_length > longest_chain)
1179 longest_chain = left_length;
1180 if (right_length > longest_chain)
1181 longest_chain = right_length;
1182 }
1183
1184
1185 /* Pick your policy for "hashing isn't working" here: */
fdcd69b6 1186 if (longest_chain <= HV_MAX_LENGTH_BEFORE_SPLIT /* split worked? */
4b5190b5
NC
1187 || HvREHASH(hv)) {
1188 return;
79072805 1189 }
4b5190b5
NC
1190
1191 if (hv == PL_strtab) {
1192 /* Urg. Someone is doing something nasty to the string table.
1193 Can't win. */
1194 return;
1195 }
1196
1197 /* Awooga. Awooga. Pathological data. */
6c9570dc 1198 /*PerlIO_printf(PerlIO_stderr(), "%p %d of %d with %d/%d buckets\n", (void*)hv,
4b5190b5
NC
1199 longest_chain, HvTOTALKEYS(hv), HvFILL(hv), 1+HvMAX(hv));*/
1200
1201 ++newsize;
a02a5408 1202 Newxz(a, PERL_HV_ARRAY_ALLOC_BYTES(newsize)
b79f7545
NC
1203 + (SvOOK(hv) ? sizeof(struct xpvhv_aux) : 0), char);
1204 if (SvOOK(hv)) {
1205 Copy(HvAUX(hv), &a[newsize * sizeof(HE*)], 1, struct xpvhv_aux);
1206 }
1207
4b5190b5
NC
1208 was_shared = HvSHAREKEYS(hv);
1209
4b5190b5
NC
1210 HvSHAREKEYS_off(hv);
1211 HvREHASH_on(hv);
1212
7b2c381c 1213 aep = HvARRAY(hv);
4b5190b5
NC
1214
1215 for (i=0; i<newsize; i++,aep++) {
a3b680e6 1216 register HE *entry = *aep;
4b5190b5
NC
1217 while (entry) {
1218 /* We're going to trash this HE's next pointer when we chain it
1219 into the new hash below, so store where we go next. */
9d4ba2ae 1220 HE * const next = HeNEXT(entry);
4b5190b5 1221 UV hash;
a3b680e6 1222 HE **bep;
4b5190b5
NC
1223
1224 /* Rehash it */
1225 PERL_HASH_INTERNAL(hash, HeKEY(entry), HeKLEN(entry));
1226
1227 if (was_shared) {
1228 /* Unshare it. */
aec46f14 1229 HEK * const new_hek
4b5190b5
NC
1230 = save_hek_flags(HeKEY(entry), HeKLEN(entry),
1231 hash, HeKFLAGS(entry));
1232 unshare_hek (HeKEY_hek(entry));
1233 HeKEY_hek(entry) = new_hek;
1234 } else {
1235 /* Not shared, so simply write the new hash in. */
1236 HeHASH(entry) = hash;
1237 }
1238 /*PerlIO_printf(PerlIO_stderr(), "%d ", HeKFLAGS(entry));*/
1239 HEK_REHASH_on(HeKEY_hek(entry));
1240 /*PerlIO_printf(PerlIO_stderr(), "%d\n", HeKFLAGS(entry));*/
1241
1242 /* Copy oentry to the correct new chain. */
1243 bep = ((HE**)a) + (hash & (I32) xhv->xhv_max);
4b5190b5
NC
1244 HeNEXT(entry) = *bep;
1245 *bep = entry;
1246
1247 entry = next;
1248 }
1249 }
7b2c381c
NC
1250 Safefree (HvARRAY(hv));
1251 HvARRAY(hv) = (HE **)a;
79072805
LW
1252}
1253
72940dca 1254void
864dbfa3 1255Perl_hv_ksplit(pTHX_ HV *hv, IV newmax)
72940dca 1256{
97aff369 1257 dVAR;
cbec9347 1258 register XPVHV* xhv = (XPVHV*)SvANY(hv);
a3b680e6 1259 const I32 oldsize = (I32) xhv->xhv_max+1; /* HvMAX(hv)+1 (sick) */
72940dca 1260 register I32 newsize;
1261 register I32 i;
72311751
GS
1262 register char *a;
1263 register HE **aep;
72940dca 1264
7918f24d
NC
1265 PERL_ARGS_ASSERT_HV_KSPLIT;
1266
72940dca 1267 newsize = (I32) newmax; /* possible truncation here */
1268 if (newsize != newmax || newmax <= oldsize)
1269 return;
1270 while ((newsize & (1 + ~newsize)) != newsize) {
1271 newsize &= ~(newsize & (1 + ~newsize)); /* get proper power of 2 */
1272 }
1273 if (newsize < newmax)
1274 newsize *= 2;
1275 if (newsize < newmax)
1276 return; /* overflow detection */
1277
7b2c381c 1278 a = (char *) HvARRAY(hv);
72940dca 1279 if (a) {
3280af22 1280 PL_nomemok = TRUE;
8d6dde3e 1281#if defined(STRANGE_MALLOC) || defined(MYMALLOC)
b79f7545
NC
1282 Renew(a, PERL_HV_ARRAY_ALLOC_BYTES(newsize)
1283 + (SvOOK(hv) ? sizeof(struct xpvhv_aux) : 0), char);
8aacddc1 1284 if (!a) {
4a33f861 1285 PL_nomemok = FALSE;
422a93e5
GA
1286 return;
1287 }
b79f7545 1288 if (SvOOK(hv)) {
7a9b70e9 1289 Copy(&a[oldsize * sizeof(HE*)], &a[newsize * sizeof(HE*)], 1, struct xpvhv_aux);
b79f7545 1290 }
72940dca 1291#else
a02a5408 1292 Newx(a, PERL_HV_ARRAY_ALLOC_BYTES(newsize)
b79f7545 1293 + (SvOOK(hv) ? sizeof(struct xpvhv_aux) : 0), char);
8aacddc1 1294 if (!a) {
3280af22 1295 PL_nomemok = FALSE;
422a93e5
GA
1296 return;
1297 }
7b2c381c 1298 Copy(HvARRAY(hv), a, oldsize * sizeof(HE*), char);
b79f7545
NC
1299 if (SvOOK(hv)) {
1300 Copy(HvAUX(hv), &a[newsize * sizeof(HE*)], 1, struct xpvhv_aux);
1301 }
9a87bd09 1302 Safefree(HvARRAY(hv));
72940dca 1303#endif
3280af22 1304 PL_nomemok = FALSE;
72311751 1305 Zero(&a[oldsize * sizeof(HE*)], (newsize-oldsize) * sizeof(HE*), char); /* zero 2nd half*/
72940dca 1306 }
1307 else {
a02a5408 1308 Newxz(a, PERL_HV_ARRAY_ALLOC_BYTES(newsize), char);
72940dca 1309 }
cbec9347 1310 xhv->xhv_max = --newsize; /* HvMAX(hv) = --newsize */
7b2c381c 1311 HvARRAY(hv) = (HE **) a;
f4431c56 1312 if (!xhv->xhv_keys /* !HvTOTALKEYS(hv) */) /* skip rest if no entries */
72940dca 1313 return;
1314
72311751
GS
1315 aep = (HE**)a;
1316 for (i=0; i<oldsize; i++,aep++) {
a50a3493
NC
1317 HE **oentry = aep;
1318 HE *entry = *aep;
1319
1320 if (!entry) /* non-existent */
72940dca 1321 continue;
4c9d89c5 1322 do {
6136c704
AL
1323 register I32 j = (HeHASH(entry) & newsize);
1324
1325 if (j != i) {
72940dca 1326 j -= i;
1327 *oentry = HeNEXT(entry);
4d0fbddd 1328 HeNEXT(entry) = aep[j];
72311751 1329 aep[j] = entry;
72940dca 1330 }
1331 else
1332 oentry = &HeNEXT(entry);
4c9d89c5
NC
1333 entry = *oentry;
1334 } while (entry);
72940dca 1335 }
1336}
1337
b3ac6de7 1338HV *
864dbfa3 1339Perl_newHVhv(pTHX_ HV *ohv)
b3ac6de7 1340{
749123ff 1341 dVAR;
9d4ba2ae 1342 HV * const hv = newHV();
f4431c56 1343 STRLEN hv_max;
4beac62f 1344
f4431c56 1345 if (!ohv || !HvTOTALKEYS(ohv))
4beac62f 1346 return hv;
4beac62f 1347 hv_max = HvMAX(ohv);
b3ac6de7 1348
ad64d0ec 1349 if (!SvMAGICAL((const SV *)ohv)) {
b56ba0bf 1350 /* It's an ordinary hash, so copy it fast. AMS 20010804 */
eb160463 1351 STRLEN i;
a3b680e6 1352 const bool shared = !!HvSHAREKEYS(ohv);
aec46f14 1353 HE **ents, ** const oents = (HE **)HvARRAY(ohv);
ff875642 1354 char *a;
a02a5408 1355 Newx(a, PERL_HV_ARRAY_ALLOC_BYTES(hv_max+1), char);
ff875642 1356 ents = (HE**)a;
b56ba0bf
AMS
1357
1358 /* In each bucket... */
1359 for (i = 0; i <= hv_max; i++) {
6136c704 1360 HE *prev = NULL;
aec46f14 1361 HE *oent = oents[i];
b56ba0bf
AMS
1362
1363 if (!oent) {
1364 ents[i] = NULL;
1365 continue;
1366 }
1367
1368 /* Copy the linked list of entries. */
aec46f14 1369 for (; oent; oent = HeNEXT(oent)) {
a3b680e6
AL
1370 const U32 hash = HeHASH(oent);
1371 const char * const key = HeKEY(oent);
1372 const STRLEN len = HeKLEN(oent);
1373 const int flags = HeKFLAGS(oent);
6136c704 1374 HE * const ent = new_HE();
c3acb9e0 1375 SV *const val = HeVAL(oent);
b56ba0bf 1376
c3acb9e0 1377 HeVAL(ent) = SvIMMORTAL(val) ? val : newSVsv(val);
19692e8d 1378 HeKEY_hek(ent)
6e838c70 1379 = shared ? share_hek_flags(key, len, hash, flags)
19692e8d 1380 : save_hek_flags(key, len, hash, flags);
b56ba0bf
AMS
1381 if (prev)
1382 HeNEXT(prev) = ent;
1383 else
1384 ents[i] = ent;
1385 prev = ent;
1386 HeNEXT(ent) = NULL;
1387 }
1388 }
1389
1390 HvMAX(hv) = hv_max;
8aacddc1 1391 HvTOTALKEYS(hv) = HvTOTALKEYS(ohv);
b56ba0bf 1392 HvARRAY(hv) = ents;
aec46f14 1393 } /* not magical */
b56ba0bf
AMS
1394 else {
1395 /* Iterate over ohv, copying keys and values one at a time. */
b3ac6de7 1396 HE *entry;
bfcb3514
NC
1397 const I32 riter = HvRITER_get(ohv);
1398 HE * const eiter = HvEITER_get(ohv);
f4431c56 1399 STRLEN hv_fill = HvFILL(ohv);
b56ba0bf
AMS
1400
1401 /* Can we use fewer buckets? (hv_max is always 2^n-1) */
1402 while (hv_max && hv_max + 1 >= hv_fill * 2)
1403 hv_max = hv_max / 2;
1404 HvMAX(hv) = hv_max;
1405
4a76a316 1406 hv_iterinit(ohv);
e16e2ff8 1407 while ((entry = hv_iternext_flags(ohv, 0))) {
c3acb9e0 1408 SV *const val = HeVAL(entry);
04fe65b0 1409 (void)hv_store_flags(hv, HeKEY(entry), HeKLEN(entry),
c3acb9e0
NC
1410 SvIMMORTAL(val) ? val : newSVsv(val),
1411 HeHASH(entry), HeKFLAGS(entry));
b3ac6de7 1412 }
bfcb3514
NC
1413 HvRITER_set(ohv, riter);
1414 HvEITER_set(ohv, eiter);
b3ac6de7 1415 }
1c846c1f 1416
b3ac6de7
IZ
1417 return hv;
1418}
1419
defdfed5
Z
1420/*
1421=for apidoc Am|HV *|hv_copy_hints_hv|HV *ohv
1422
1423A specialised version of L</newHVhv> for copying C<%^H>. I<ohv> must be
1424a pointer to a hash (which may have C<%^H> magic, but should be generally
1425non-magical), or C<NULL> (interpreted as an empty hash). The content
1426of I<ohv> is copied to a new hash, which has the C<%^H>-specific magic
1427added to it. A pointer to the new hash is returned.
1428
1429=cut
1430*/
1431
5b9c0671
NC
1432HV *
1433Perl_hv_copy_hints_hv(pTHX_ HV *const ohv)
1434{
1435 HV * const hv = newHV();
5b9c0671 1436
f4431c56 1437 if (ohv && HvTOTALKEYS(ohv)) {
5b9c0671 1438 STRLEN hv_max = HvMAX(ohv);
f4431c56 1439 STRLEN hv_fill = HvFILL(ohv);
5b9c0671
NC
1440 HE *entry;
1441 const I32 riter = HvRITER_get(ohv);
1442 HE * const eiter = HvEITER_get(ohv);
1443
1444 while (hv_max && hv_max + 1 >= hv_fill * 2)
1445 hv_max = hv_max / 2;
1446 HvMAX(hv) = hv_max;
1447
1448 hv_iterinit(ohv);
1449 while ((entry = hv_iternext_flags(ohv, 0))) {
1450 SV *const sv = newSVsv(HeVAL(entry));
e3b1b6b1 1451 SV *heksv = newSVhek(HeKEY_hek(entry));
5b9c0671 1452 sv_magic(sv, NULL, PERL_MAGIC_hintselem,
e3b1b6b1
RGS
1453 (char *)heksv, HEf_SVKEY);
1454 SvREFCNT_dec(heksv);
04fe65b0
RGS
1455 (void)hv_store_flags(hv, HeKEY(entry), HeKLEN(entry),
1456 sv, HeHASH(entry), HeKFLAGS(entry));
5b9c0671
NC
1457 }
1458 HvRITER_set(ohv, riter);
1459 HvEITER_set(ohv, eiter);
1460 }
1461 hv_magic(hv, NULL, PERL_MAGIC_hints);
1462 return hv;
1463}
1464
79072805 1465void
864dbfa3 1466Perl_hv_free_ent(pTHX_ HV *hv, register HE *entry)
79072805 1467{
97aff369 1468 dVAR;
16bdeea2
GS
1469 SV *val;
1470
7918f24d
NC
1471 PERL_ARGS_ASSERT_HV_FREE_ENT;
1472
68dc0745 1473 if (!entry)
79072805 1474 return;
16bdeea2 1475 val = HeVAL(entry);
00169e2c 1476 if (val && isGV(val) && isGV_with_GP(val) && GvCVu(val) && HvENAME(hv))
803f2748 1477 mro_method_changed_in(hv); /* deletion of method from stash */
16bdeea2 1478 SvREFCNT_dec(val);
68dc0745 1479 if (HeKLEN(entry) == HEf_SVKEY) {
1480 SvREFCNT_dec(HeKEY_sv(entry));
8aacddc1 1481 Safefree(HeKEY_hek(entry));
44a8e56a 1482 }
1483 else if (HvSHAREKEYS(hv))
68dc0745 1484 unshare_hek(HeKEY_hek(entry));
fde52b5c 1485 else
68dc0745 1486 Safefree(HeKEY_hek(entry));
d33b2eba 1487 del_HE(entry);
79072805
LW
1488}
1489
f1c32fec 1490
79072805 1491void
864dbfa3 1492Perl_hv_delayfree_ent(pTHX_ HV *hv, register HE *entry)
79072805 1493{
97aff369 1494 dVAR;
7918f24d
NC
1495
1496 PERL_ARGS_ASSERT_HV_DELAYFREE_ENT;
1497
68dc0745 1498 if (!entry)
79072805 1499 return;
bc4947fc
NC
1500 /* SvREFCNT_inc to counter the SvREFCNT_dec in hv_free_ent */
1501 sv_2mortal(SvREFCNT_inc(HeVAL(entry))); /* free between statements */
68dc0745 1502 if (HeKLEN(entry) == HEf_SVKEY) {
bc4947fc 1503 sv_2mortal(SvREFCNT_inc(HeKEY_sv(entry)));
44a8e56a 1504 }
bc4947fc 1505 hv_free_ent(hv, entry);
79072805
LW
1506}
1507
954c1994
GS
1508/*
1509=for apidoc hv_clear
1510
1511Clears a hash, making it empty.
1512
1513=cut
1514*/
1515
79072805 1516void
864dbfa3 1517Perl_hv_clear(pTHX_ HV *hv)
79072805 1518{
27da23d5 1519 dVAR;
cbec9347 1520 register XPVHV* xhv;
79072805
LW
1521 if (!hv)
1522 return;
49293501 1523
ecae49c0
NC
1524 DEBUG_A(Perl_hv_assert(aTHX_ hv));
1525
34c3c4e3
DM
1526 xhv = (XPVHV*)SvANY(hv);
1527
7b2c381c 1528 if (SvREADONLY(hv) && HvARRAY(hv) != NULL) {
34c3c4e3 1529 /* restricted hash: convert all keys to placeholders */
b464bac0
AL
1530 STRLEN i;
1531 for (i = 0; i <= xhv->xhv_max; i++) {
7b2c381c 1532 HE *entry = (HvARRAY(hv))[i];
3a676441
JH
1533 for (; entry; entry = HeNEXT(entry)) {
1534 /* not already placeholder */
7996736c 1535 if (HeVAL(entry) != &PL_sv_placeholder) {
3a676441 1536 if (HeVAL(entry) && SvREADONLY(HeVAL(entry))) {
6136c704 1537 SV* const keysv = hv_iterkeysv(entry);
3a676441 1538 Perl_croak(aTHX_
95b63a38
JH
1539 "Attempt to delete readonly key '%"SVf"' from a restricted hash",
1540 (void*)keysv);
3a676441
JH
1541 }
1542 SvREFCNT_dec(HeVAL(entry));
7996736c 1543 HeVAL(entry) = &PL_sv_placeholder;
ca732855 1544 HvPLACEHOLDERS(hv)++;
3a676441 1545 }
34c3c4e3
DM
1546 }
1547 }
df8c6964 1548 goto reset;
49293501
MS
1549 }
1550
463ee0b2 1551 hfreeentries(hv);
ca732855 1552 HvPLACEHOLDERS_set(hv, 0);
7b2c381c 1553 if (HvARRAY(hv))
41f62432 1554 Zero(HvARRAY(hv), xhv->xhv_max+1 /* HvMAX(hv)+1 */, HE*);
a0d0e21e
LW
1555
1556 if (SvRMAGICAL(hv))
ad64d0ec 1557 mg_clear(MUTABLE_SV(hv));
574c8022 1558
19692e8d 1559 HvHASKFLAGS_off(hv);
bb443f97 1560 HvREHASH_off(hv);
df8c6964 1561 reset:
b79f7545 1562 if (SvOOK(hv)) {
00169e2c 1563 if(HvENAME_get(hv))
dd69841b 1564 mro_isa_changed_in(hv);
bfcb3514
NC
1565 HvEITER_set(hv, NULL);
1566 }
79072805
LW
1567}
1568
3540d4ce
AB
1569/*
1570=for apidoc hv_clear_placeholders
1571
1572Clears any placeholders from a hash. If a restricted hash has any of its keys
1573marked as readonly and the key is subsequently deleted, the key is not actually
1574deleted but is marked by assigning it a value of &PL_sv_placeholder. This tags
1575it so it will be ignored by future operations such as iterating over the hash,
4cdaeff7 1576but will still allow the hash to have a value reassigned to the key at some
3540d4ce
AB
1577future point. This function clears any such placeholder keys from the hash.
1578See Hash::Util::lock_keys() for an example of its use.
1579
1580=cut
1581*/
1582
1583void
1584Perl_hv_clear_placeholders(pTHX_ HV *hv)
1585{
27da23d5 1586 dVAR;
b3ca2e83
NC
1587 const U32 items = (U32)HvPLACEHOLDERS_get(hv);
1588
7918f24d
NC
1589 PERL_ARGS_ASSERT_HV_CLEAR_PLACEHOLDERS;
1590
b3ca2e83
NC
1591 if (items)
1592 clear_placeholders(hv, items);
1593}
1594
1595static void
1596S_clear_placeholders(pTHX_ HV *hv, U32 items)
1597{
1598 dVAR;
b464bac0 1599 I32 i;
d3677389 1600
7918f24d
NC
1601 PERL_ARGS_ASSERT_CLEAR_PLACEHOLDERS;
1602
d3677389
NC
1603 if (items == 0)
1604 return;
1605
b464bac0 1606 i = HvMAX(hv);
d3677389
NC
1607 do {
1608 /* Loop down the linked list heads */
6136c704 1609 bool first = TRUE;
d3677389 1610 HE **oentry = &(HvARRAY(hv))[i];
cf6db12b 1611 HE *entry;
d3677389 1612
cf6db12b 1613 while ((entry = *oentry)) {
d3677389
NC
1614 if (HeVAL(entry) == &PL_sv_placeholder) {
1615 *oentry = HeNEXT(entry);
2e58978b 1616 if (entry == HvEITER_get(hv))
d3677389
NC
1617 HvLAZYDEL_on(hv);
1618 else
1619 hv_free_ent(hv, entry);
1620
1621 if (--items == 0) {
1622 /* Finished. */
5d88ecd7 1623 HvTOTALKEYS(hv) -= (IV)HvPLACEHOLDERS_get(hv);
d3677389
NC
1624 if (HvKEYS(hv) == 0)
1625 HvHASKFLAGS_off(hv);
5d88ecd7 1626 HvPLACEHOLDERS_set(hv, 0);
d3677389
NC
1627 return;
1628 }
213ce8b3
NC
1629 } else {
1630 oentry = &HeNEXT(entry);
6136c704 1631 first = FALSE;
d3677389
NC
1632 }
1633 }
1634 } while (--i >= 0);
1635 /* You can't get here, hence assertion should always fail. */
1636 assert (items == 0);
1637 assert (0);
3540d4ce
AB
1638}
1639
/*
 * S_hfreeentries: free every entry (HE) reachable from hv's bucket array.
 *
 * While entries are being freed, HvARRAY(hv) is set to NULL and the key
 * count to 0 so that code run from destructors sees an empty hash.  If
 * such code installs a new array in the meantime, the loop runs again on
 * that array; after 100 rounds it gives up with a panic.  The name, name
 * count and MRO metadata held in the aux structure are carried across the
 * operation.  On return HvARRAY(hv) is the original array again; this
 * function does not clear the slots of that array itself.
 */
76e3520e 1640STATIC void
cea2e8a9 1641S_hfreeentries(pTHX_ HV *hv)
79072805 1642{
23976bdd 1643 /* This is the array that we're going to restore */
fd7de8a8 1644 HE **const orig_array = HvARRAY(hv);
2d0d1ecc
FC
1645 HE **tmp_array = NULL;
1646 const bool has_aux = SvOOK(hv);
1647 struct xpvhv_aux * current_aux = NULL;
/* Upper bound on the number of rounds of the loop below. */
23976bdd 1648 int attempts = 100;
745edda6
FC
1649
/* mpm: whether mro_package_moved() should be called for nested packages
 * as they are freed -- only outside global destruction and only when hv
 * has an effective name. */
1650 const bool mpm = PL_phase != PERL_PHASE_DESTRUCT && HvENAME(hv);
3abe233e 1651
7918f24d
NC
1652 PERL_ARGS_ASSERT_HFREEENTRIES;
1653
fd7de8a8 1654 if (!orig_array)
79072805 1655 return;
a0d0e21e 1656
23976bdd
NC
1657 /* orig_array remains unchanged throughout the loop. If after freeing all
1658 the entries it turns out that one of the little blighters has triggered
1659 an action that has caused HvARRAY to be re-allocated, then we set
1660 array to the new HvARRAY, and try again. */
1661
1662 while (1) {
1663 /* This is the one we're going to try to empty. First time round
1664 it's the original array. (Hopefully there will only be 1 time
1665 round) */
6136c704 1666 HE ** const array = HvARRAY(hv);
7440661e 1667 I32 i = HvMAX(hv);
23976bdd 1668
2d0d1ecc
FC
1669 struct xpvhv_aux *iter = SvOOK(hv) ? HvAUX(hv) : NULL;
1670
1671 /* make everyone else think the array is empty, so that the destructors
1672 * called for freed entries can't recursively mess with us */
1673 HvARRAY(hv) = NULL;
23976bdd
NC
1674
1675 if (SvOOK(hv)) {
7440661e 1676 HE *entry;
2d0d1ecc
FC
1677
1678 SvFLAGS(hv) &= ~SVf_OOK; /* Goodbye, aux structure. */
1679 /* What aux structure? */
1680 /* (But we still have a pointer to it in iter.) */
1681
47f1cf77
FC
1682 /* Copy the name and MRO stuff to a new aux structure
1683 if present. */
1684 if (iter->xhv_name || iter->xhv_mro_meta) {
2d0d1ecc
FC
1685 struct xpvhv_aux * const newaux = hv_auxinit(hv);
1686 newaux->xhv_name = iter->xhv_name;
1687 newaux->xhv_name_count = iter->xhv_name_count;
1688 iter->xhv_name = NULL;
47f1cf77
FC
1689 newaux->xhv_mro_meta = iter->xhv_mro_meta;
1690 iter->xhv_mro_meta = NULL;
2d0d1ecc
FC
1691 }
1692
47f1cf77
FC
1693 /* Because we have taken xhv_name and
1694 xhv_mro_meta out, the only allocated
2d0d1ecc 1695 pointers in the aux structure that might exist are the back-
47f1cf77 1696 reference array and xhv_eiter.
2d0d1ecc
FC
1697 */
1698
cdb996f4
DM
1699 /* weak references: if called from sv_clear(), the backrefs
1700 * should already have been killed; if there are any left, it's
1701 * because we're doing hv_clear() or hv_undef(), and the HV
1702 * will continue to live.
1703 * Because while freeing the entries we fake up a NULL HvARRAY
1704 * (and hence HvAUX), we need to store the backref array
1705 * somewhere else; but it still needs to be visible in case
1706 * any of the things we free happen to call sv_del_backref().
1707 * We do this by storing it in magic instead.
1708 * If, during the entry freeing, a destructor happens to add
1709 * a new weak backref, then sv_add_backref will look in both
1710 * places (magic in HvAUX) for the AV, but will create a new
8ac9a371
DM
1711 * AV in HvAUX if it can't find one (if it finds it in magic,
1712 * it moves it back into HvAUX). So at the end of the iteration
1713 * we have to allow for this. */
1714
09aad8f0
DM
1715
1716 if (iter->xhv_backreferences) {
5648c0ae
DM
1717 if (SvTYPE(iter->xhv_backreferences) == SVt_PVAV) {
1718 /* The sv_magic will increase the reference count of the AV,
1719 so we need to drop it first. */
09aad8f0 1720 SvREFCNT_dec(iter->xhv_backreferences);
5648c0ae
DM
1721 if (AvFILLp(iter->xhv_backreferences) == -1) {
1722 /* Turns out that the array is empty. Just free it. */
1723 SvREFCNT_dec(iter->xhv_backreferences);
1b8791d1 1724
5648c0ae
DM
1725 } else {
1726 sv_magic(MUTABLE_SV(hv),
1727 MUTABLE_SV(iter->xhv_backreferences),
1728 PERL_MAGIC_backref, NULL, 0);
1729 }
1730 }
1731 else {
/* Not an AV: attach empty backref magic, then store the pointer in
 * mg_obj directly. */
1732 MAGIC *mg;
1733 sv_magic(MUTABLE_SV(hv), NULL, PERL_MAGIC_backref, NULL, 0);
1734 mg = mg_find(MUTABLE_SV(hv), PERL_MAGIC_backref);
1735 mg->mg_obj = (SV*)iter->xhv_backreferences;
09aad8f0
DM
1736 }
1737 iter->xhv_backreferences = NULL;
5b285ea4 1738 }
86f55936 1739
23976bdd
NC
1740 entry = iter->xhv_eiter; /* HvEITER(hv) */
1741 if (entry && HvLAZYDEL(hv)) { /* was deleted earlier? */
1742 HvLAZYDEL_off(hv);
1743 hv_free_ent(hv, entry);
1744 }
1745 iter->xhv_riter = -1; /* HvRITER(hv) = -1 */
4608196e 1746 iter->xhv_eiter = NULL; /* HvEITER(hv) = NULL */
b79f7545
23976bdd 1748 /* There are now no allocated pointers in the aux structure. */
a0d0e21e 1749 }
bfcb3514 1750
2d0d1ecc
FC
1751 /* If there are no keys, there is nothing left to free. */
1752 if (!((XPVHV*) SvANY(hv))->xhv_keys) break;
23976bdd 1753
2d0d1ecc
FC
1754 /* Since we have removed the HvARRAY (and possibly replaced it by
1755 calling hv_auxinit), set the number of keys accordingly. */
1756 ((XPVHV*) SvANY(hv))->xhv_keys = 0;
7440661e
NC
1757
1758 do {
1759 /* Loop down the linked list heads */
1760 HE *entry = array[i];
1761
1762 while (entry) {
23976bdd
NC
1763 register HE * const oentry = entry;
/* Advance before freeing: oentry is released by hv_free_ent() below. */
1764 entry = HeNEXT(entry);
745edda6
FC
1765 if (
1766 mpm && HeVAL(oentry) && isGV(HeVAL(oentry)) &&
1767 GvHV(HeVAL(oentry)) && HvENAME(GvHV(HeVAL(oentry)))
1768 ) {
1769 STRLEN klen;
1770 const char * const key = HePV(oentry,klen);
1771 if (klen > 1 && key[klen-1]==':' && key[klen-2]==':') {
1772 mro_package_moved(
1773 NULL, GvHV(HeVAL(oentry)),
afdbe55d 1774 (GV *)HeVAL(oentry), 0
745edda6
FC
1775 );
1776 }
1777 }
23976bdd
NC
1778 hv_free_ent(hv, oentry);
1779 }
7440661e 1780 } while (--i >= 0);
b79f7545 1781
23976bdd
NC
1782 /* As there are no allocated pointers in the aux structure, it's now
1783 safe to free the array we just cleaned up, if it's not the one we're
1784 going to put back. */
1785 if (array != orig_array) {
1786 Safefree(array);
1787 }
b79f7545 1788
23976bdd
NC
1789 if (!HvARRAY(hv)) {
1790 /* Good. No-one added anything this time round. */
1791 break;
bfcb3514 1792 }
b79f7545 1793
23976bdd
NC
1794 if (--attempts == 0) {
1795 Perl_die(aTHX_ "panic: hfreeentries failed to free hash - something is repeatedly re-creating entries");
1796 }
6136c704 1797 }
23976bdd 1798
2d0d1ecc
FC
1799 /* Set aside the current array for now, in case we still need it. */
1800 if (SvOOK(hv)) current_aux = HvAUX(hv);
1801 if (HvARRAY(hv) && HvARRAY(hv) != orig_array)
1802 tmp_array = HvARRAY(hv);
1803
23976bdd
NC
1804 HvARRAY(hv) = orig_array;
1805
/* Re-enable the aux flag only if the hash had an aux structure on entry
 * and still has one now. */
3905af2e 1806 if (has_aux && current_aux)
23976bdd 1807 SvFLAGS(hv) |= SVf_OOK;
2d0d1ecc
FC
1808 else
1809 SvFLAGS(hv) &=~SVf_OOK;
1810
47f1cf77
FC
1811 /* If the hash was actually a symbol table, put the name and MRO
1812 caches back. */
2d0d1ecc
FC
1813 if (current_aux) {
1814 struct xpvhv_aux * const aux
1815 = SvOOK(hv) ? HvAUX(hv) : hv_auxinit(hv);
1816 aux->xhv_name = current_aux->xhv_name;
1817 aux->xhv_name_count = current_aux->xhv_name_count;
47f1cf77 1818 aux->xhv_mro_meta = current_aux->xhv_mro_meta;
1b8791d1 1819 }
2d0d1ecc
FC
1820
1821 if (tmp_array) Safefree(tmp_array);
79072805
LW
1822}
1823
954c1994
GS
1824/*
1825=for apidoc hv_undef
1826
1827Undefines the hash.
1828
1829=cut
1830*/
1831
79072805 1832void
8581adba 1833Perl_hv_undef_flags(pTHX_ HV *hv, U32 flags)
79072805 1834{
97aff369 1835 dVAR;
cbec9347 1836 register XPVHV* xhv;
bfcb3514 1837 const char *name;
86f55936 1838
79072805
LW
1839 if (!hv)
1840 return;
ecae49c0 1841 DEBUG_A(Perl_hv_assert(aTHX_ hv));
cbec9347 1842 xhv = (XPVHV*)SvANY(hv);
dd69841b 1843
745edda6
FC
1844 /* The name must be deleted before the call to hfreeeeentries so that
1845 CVs are anonymised properly. But the effective name must be pre-
1846 served until after that call (and only deleted afterwards if the
1847 call originated from sv_clear). For stashes with one name that is
1848 both the canonical name and the effective name, hv_name_set has to
1849 allocate an array for storing the effective name. We can skip that
1850 during global destruction, as it does not matter where the CVs point
1851 if they will be freed anyway. */
1852 if (PL_phase != PERL_PHASE_DESTRUCT && (name = HvNAME(hv))) {
04fe65b0
RGS
1853 if (PL_stashcache)
1854 (void)hv_delete(PL_stashcache, name, HvNAMELEN_get(hv), G_DISCARD);
bd61b366 1855 hv_name_set(hv, NULL, 0, 0);
85e6fe83 1856 }
2d0d1ecc 1857 hfreeentries(hv);
47f1cf77
FC
1858 if (SvOOK(hv)) {
1859 struct xpvhv_aux * const aux = HvAUX(hv);
1860 struct mro_meta *meta;
745edda6
FC
1861 bool zeroed = FALSE;
1862
1863 if ((name = HvENAME_get(hv))) {
1864 if (PL_phase != PERL_PHASE_DESTRUCT) {
1865 /* This must come at this point in case
1866 mro_isa_changed_in dies. */
1867 Zero(HvARRAY(hv), xhv->xhv_max+1 /* HvMAX(hv)+1 */, HE*);
1868 zeroed = TRUE;
1869
1870 mro_isa_changed_in(hv);
1871 }
1872 if (PL_stashcache)
1873 (void)hv_delete(
1874 PL_stashcache, name, HvENAMELEN_get(hv), G_DISCARD
1875 );
1876 }
1877
1878 /* If this call originated from sv_clear, then we must check for
1879 * effective names that need freeing, as well as the usual name. */
1880 name = HvNAME(hv);
1881 if (flags & HV_NAME_SETALL ? (const char *)aux->xhv_name : name) {
1882 if (name && PL_stashcache)
2d0d1ecc 1883 (void)hv_delete(PL_stashcache, name, HvNAMELEN_get(hv), G_DISCARD);
745edda6 1884 hv_name_set(hv, NULL, 0, flags);
47f1cf77
FC
1885 }
1886 if((meta = aux->xhv_mro_meta)) {
1887 if (meta->mro_linear_all) {
1888 SvREFCNT_dec(MUTABLE_SV(meta->mro_linear_all));
1889 meta->mro_linear_all = NULL;
1890 /* This is just acting as a shortcut pointer. */
1891 meta->mro_linear_current = NULL;
1892 } else if (meta->mro_linear_current) {
1893 /* Only the current MRO is stored, so this owns the data.
1894 */
1895 SvREFCNT_dec(meta->mro_linear_current);
1896 meta->mro_linear_current = NULL;
1897 }
1898 if(meta->mro_nextmethod) SvREFCNT_dec(meta->mro_nextmethod);
1899 SvREFCNT_dec(meta->isa);
1900 Safefree(meta);
1901 aux->xhv_mro_meta = NULL;
1902 }
745edda6
FC
1903 if (!aux->xhv_name)
1904 SvFLAGS(hv) &= ~SVf_OOK;
1905 else if (!zeroed)
1906 Zero(HvARRAY(hv), xhv->xhv_max+1 /* HvMAX(hv)+1 */, HE*);
1907 }
1908 if (!SvOOK(hv)) {
1909 Safefree(HvARRAY(hv));
1910 xhv->xhv_max = 7; /* HvMAX(hv) = 7 (it's a normal hash) */
1911 HvARRAY(hv) = 0;
2d0d1ecc 1912 }
ca732855 1913 HvPLACEHOLDERS_set(hv, 0);
a0d0e21e
LW
1914
1915 if (SvRMAGICAL(hv))
ad64d0ec 1916 mg_clear(MUTABLE_SV(hv));
79072805
LW
1917}
1918
4d0fbddd
NC
1919/*
1920=for apidoc hv_fill
1921
1922Returns the number of hash buckets that happen to be in use. This function is
1923wrapped by the macro C<HvFILL>.
1924
1925Previously this value was stored in the HV structure, rather than being
1926calculated on demand.
1927
1928=cut
1929*/
1930
1931STRLEN
1932Perl_hv_fill(pTHX_ HV const *const hv)
1933{
1934 STRLEN count = 0;
1935 HE **ents = HvARRAY(hv);
1936
1937 PERL_ARGS_ASSERT_HV_FILL;
1938
1939 if (ents) {
fcd24582
NC
1940 HE *const *const last = ents + HvMAX(hv);
1941 count = last + 1 - ents;
4d0fbddd
NC
1942
1943 do {
fcd24582
NC
1944 if (!*ents)
1945 --count;
1946 } while (++ents <= last);
4d0fbddd
NC
1947 }
1948 return count;
1949}
1950
b464bac0 1951static struct xpvhv_aux*
5f66b61c 1952S_hv_auxinit(HV *hv) {
bfcb3514 1953 struct xpvhv_aux *iter;
b79f7545 1954 char *array;
bfcb3514 1955
7918f24d
NC
1956 PERL_ARGS_ASSERT_HV_AUXINIT;
1957
b79f7545 1958 if (!HvARRAY(hv)) {
a02a5408 1959 Newxz(array, PERL_HV_ARRAY_ALLOC_BYTES(HvMAX(hv) + 1)
b79f7545
NC
1960 + sizeof(struct xpvhv_aux), char);
1961 } else {
1962 array = (char *) HvARRAY(hv);
1963 Renew(array, PERL_HV_ARRAY_ALLOC_BYTES(HvMAX(hv) + 1)
1964 + sizeof(struct xpvhv_aux), char);
1965 }
1966 HvARRAY(hv) = (HE**) array;
1967 /* SvOOK_on(hv) attacks the IV flags. */
1968 SvFLAGS(hv) |= SVf_OOK;
1969 iter = HvAUX(hv);
bfcb3514
NC
1970
1971 iter->xhv_riter = -1; /* HvRITER(hv) = -1 */
4608196e 1972 iter->xhv_eiter = NULL; /* HvEITER(hv) = NULL */
bfcb3514 1973 iter->xhv_name = 0;
b7247a80 1974 iter->xhv_name_count = 0;
86f55936 1975 iter->xhv_backreferences = 0;
e1a479c5 1976 iter->xhv_mro_meta = NULL;
bfcb3514
NC
1977 return iter;
1978}
1979
954c1994
GS
1980/*
1981=for apidoc hv_iterinit
1982
1983Prepares a starting point to traverse a hash table. Returns the number of
b24b84ef 1984keys in the hash (i.e. the same as C<HvKEYS(hv)>). The return value is
1c846c1f 1985currently only meaningful for hashes without tie magic.
954c1994
GS
1986
1987NOTE: Before version 5.004_65, C<hv_iterinit> used to return the number of
1988hash buckets that happen to be in use. If you still need that esoteric
b24b84ef 1989value, you can get it through the macro C<HvFILL(hv)>.
954c1994 1990
e16e2ff8 1991
954c1994
GS
1992=cut
1993*/
1994
79072805 1995I32
864dbfa3 1996Perl_hv_iterinit(pTHX_ HV *hv)
79072805 1997{
7918f24d
NC
1998 PERL_ARGS_ASSERT_HV_ITERINIT;
1999
2000 /* FIXME: Are we not NULL, or do we croak? Place bets now! */
2001
aa689395 2002 if (!hv)
cea2e8a9 2003 Perl_croak(aTHX_ "Bad hash");
bfcb3514 2004
b79f7545 2005 if (SvOOK(hv)) {
6136c704 2006 struct xpvhv_aux * const iter = HvAUX(hv);
0bd48802 2007 HE * const entry = iter->xhv_eiter; /* HvEITER(hv) */
bfcb3514
NC
2008 if (entry && HvLAZYDEL(hv)) { /* was deleted earlier? */
2009 HvLAZYDEL_off(hv);
2010 hv_free_ent(hv, entry);
2011 }
2012 iter->xhv_riter = -1; /* HvRITER(hv) = -1 */
4608196e 2013 iter->xhv_eiter = NULL; /* HvEITER(hv) = NULL */
bfcb3514 2014 } else {
6136c704 2015 hv_auxinit(hv);
72940dca 2016 }
44a2ac75 2017
cbec9347 2018 /* used to be xhv->xhv_fill before 5.004_65 */
5d88ecd7 2019 return HvTOTALKEYS(hv);
79072805 2020}
bfcb3514
NC
2021
2022I32 *
2023Perl_hv_riter_p(pTHX_ HV *hv) {
2024 struct xpvhv_aux *iter;
2025
7918f24d
NC
2026 PERL_ARGS_ASSERT_HV_RITER_P;
2027
bfcb3514
NC
2028 if (!hv)
2029 Perl_croak(aTHX_ "Bad hash");
2030
6136c704 2031 iter = SvOOK(hv) ? HvAUX(hv) : hv_auxinit(hv);
bfcb3514
NC
2032 return &(iter->xhv_riter);
2033}
2034
2035HE **
2036Perl_hv_eiter_p(pTHX_ HV *hv) {
2037 struct xpvhv_aux *iter;
2038
7918f24d
NC
2039 PERL_ARGS_ASSERT_HV_EITER_P;
2040
bfcb3514
NC
2041 if (!hv)
2042 Perl_croak(aTHX_ "Bad hash");
2043
6136c704 2044 iter = SvOOK(hv) ? HvAUX(hv) : hv_auxinit(hv);
bfcb3514
NC
2045 return &(iter->xhv_eiter);
2046}
2047
2048void
2049Perl_hv_riter_set(pTHX_ HV *hv, I32 riter) {
2050 struct xpvhv_aux *iter;
2051
7918f24d
NC
2052 PERL_ARGS_ASSERT_HV_RITER_SET;
2053
bfcb3514
NC
2054 if (!hv)
2055 Perl_croak(aTHX_ "Bad hash");
2056
b79f7545
NC
2057 if (SvOOK(hv)) {
2058 iter = HvAUX(hv);
2059 } else {
bfcb3514
NC
2060 if (riter == -1)
2061 return;
2062
6136c704 2063 iter = hv_auxinit(hv);
bfcb3514
NC
2064 }
2065 iter->xhv_riter = riter;
2066}
2067
2068void
2069Perl_hv_eiter_set(pTHX_ HV *hv, HE *eiter) {
2070 struct xpvhv_aux *iter;
2071
7918f24d
NC
2072 PERL_ARGS_ASSERT_HV_EITER_SET;
2073
bfcb3514
NC
2074 if (!hv)
2075 Perl_croak(aTHX_ "Bad hash");
2076
b79f7545
NC
2077 if (SvOOK(hv)) {
2078 iter = HvAUX(hv);
2079 } else {
bfcb3514
NC
2080 /* 0 is the default so don't go malloc()ing a new structure just to
2081 hold 0. */
2082 if (!eiter)
2083 return;
2084
6136c704 2085 iter = hv_auxinit(hv);
bfcb3514
NC
2086 }
2087 iter->xhv_eiter = eiter;
2088}
2089
bfcb3514 2090void
4164be69 2091Perl_hv_name_set(pTHX_ HV *hv, const char *name, U32 len, U32 flags)
bfcb3514 2092{
97aff369 2093 dVAR;
b79f7545 2094 struct xpvhv_aux *iter;
7423f6db 2095 U32 hash;
78b79c77 2096 HEK **spot;
46c461b5 2097
7918f24d 2098 PERL_ARGS_ASSERT_HV_NAME_SET;
46c461b5 2099 PERL_UNUSED_ARG(flags);
bfcb3514 2100
4164be69
NC
2101 if (len > I32_MAX)
2102 Perl_croak(aTHX_ "panic: hv name too long (%"UVuf")", (UV) len);
2103
b79f7545
NC
2104 if (SvOOK(hv)) {
2105 iter = HvAUX(hv);
7423f6db 2106 if (iter->xhv_name) {
b7247a80 2107 if(iter->xhv_name_count) {
745edda6 2108 if(flags & HV_NAME_SETALL) {
b7247a80 2109 HEK ** const name = (HEK **)HvAUX(hv)->xhv_name;
78b79c77
FC
2110 HEK **hekp = name + (
2111 iter->xhv_name_count < 0
2112 ? -iter->xhv_name_count
2113 : iter->xhv_name_count
2114 );
2115 while(hekp-- > name+1)
b7247a80 2116 unshare_hek_or_pvn(*hekp, 0, 0, 0);
78b79c77
FC
2117 /* The first elem may be null. */
2118 if(*name) unshare_hek_or_pvn(*name, 0, 0, 0);
b7247a80 2119 Safefree(name);
78b79c77
FC
2120 spot = &iter->xhv_name;
2121 iter->xhv_name_count = 0;
2122 }
2123 else {
78b79c77
FC
2124 if(iter->xhv_name_count > 0) {
2125 /* shift some things over */
4c2bfb4f
FC
2126 Renewc(
2127 iter->xhv_name, iter->xhv_name_count + 1, HEK *, HEK
2128 );
2129 spot = (HEK **)iter->xhv_name;
2130 spot[iter->xhv_name_count] = spot[1];
78b79c77 2131 spot[1] = spot[0];
4c2bfb4f 2132 iter->xhv_name_count = -(iter->xhv_name_count + 1);
78b79c77 2133 }
4c2bfb4f 2134 else if(*(spot = (HEK **)iter->xhv_name)) {
78b79c77
FC
2135 unshare_hek_or_pvn(*spot, 0, 0, 0);
2136 }
2137 }
2138 }
745edda6 2139 else if (flags & HV_NAME_SETALL) {
78b79c77
FC
2140 unshare_hek_or_pvn(iter->xhv_name, 0, 0, 0);
2141 spot = &iter->xhv_name;
b7247a80 2142 }
745edda6
FC
2143 else {
2144 HEK * const existing_name = iter->xhv_name;
2145 Newxc(iter->xhv_name, 2, HEK *, HEK);
2146 iter->xhv_name_count = -2;
2147 spot = (HEK **)iter->xhv_name;
2148 spot[1] = existing_name;
2149 }
7423f6db 2150 }
745edda6 2151 else { spot = &iter->xhv_name; iter->xhv_name_count = 0; }
16580ff5 2152 } else {
bfcb3514
NC
2153 if (name == 0)
2154 return;
2155
6136c704 2156 iter = hv_auxinit(hv);
78b79c77 2157 spot = &iter->xhv_name;
bfcb3514 2158 }
7423f6db 2159 PERL_HASH(hash, name, len);
78b79c77 2160 *spot = name ? share_hek(name, len, hash) : NULL;
bfcb3514
NC
2161}
2162
99206677
FC
2163/*
2164=for apidoc hv_ename_add
2165
2166Adds a name to a stash's internal list of effective names. See
2167C<hv_ename_delete>.
2168
2169This is called when a stash is assigned to a new location in the symbol
2170table.
2171
2172=cut
2173*/
2174
ee72b38d 2175void
27a1175b 2176Perl_hv_ename_add(pTHX_ HV *hv, const char *name, U32 len, U32 flags)
ee72b38d
FC
2177{
2178 dVAR;
2179 struct xpvhv_aux *aux = SvOOK(hv) ? HvAUX(hv) : hv_auxinit(hv);
2180 U32 hash;
2181
78b79c77 2182 PERL_ARGS_ASSERT_HV_ENAME_ADD;
27a1175b 2183 PERL_UNUSED_ARG(flags);
ee72b38d
FC
2184
2185 if (len > I32_MAX)
2186 Perl_croak(aTHX_ "panic: hv name too long (%"UVuf")", (UV) len);
2187
2188 PERL_HASH(hash, name, len);
2189
ee72b38d
FC
2190 if (aux->xhv_name_count) {
2191 HEK ** const xhv_name = (HEK **)aux->xhv_name;
78b79c77
FC
2192 I32 count = aux->xhv_name_count;
2193 HEK **hekp = xhv_name + (count < 0 ? -count : count);
ee72b38d
FC
2194 while (hekp-- > xhv_name)
2195 if (
2196 HEK_LEN(*hekp) == (I32)len && memEQ(HEK_KEY(*hekp), name, len)
78b79c77
FC
2197 ) {
2198 if (hekp == xhv_name && count < 0)
2199 aux->xhv_name_count = -count;
2200 return;
2201 }
2202 if (count < 0) aux->xhv_name_count--, count = -count;
2203 else aux->xhv_name_count++;
2204 Renewc(aux->xhv_name, count + 1, HEK *, HEK);
ee72b38d
FC
2205 ((HEK **)aux->xhv_name)[count] = share_hek(name, len, hash);
2206 }
2207 else {
2208 HEK *existing_name = aux->xhv_name;
2209 if (
78b79c77 2210 existing_name && HEK_LEN(existing_name) == (I32)len
ee72b38d
FC
2211 && memEQ(HEK_KEY(existing_name), name, len)
2212 ) return;
96517a90 2213 Newxc(aux->xhv_name, 2, HEK *, HEK);
78b79c77 2214 aux->xhv_name_count = existing_name ? 2 : -2;
ee72b38d
FC
2215 *(HEK **)aux->xhv_name = existing_name;
2216 ((HEK **)aux->xhv_name)[1] = share_hek(name, len, hash);
2217 }
2218}
2219
99206677
FC
2220/*
2221=for apidoc hv_ename_delete
2222
2223Removes a name from a stash's internal list of effective names. If this is
2224the name returned by C<HvENAME>, then another name in the list will take
2225its place (C<HvENAME> will use it).
2226
2227This is called when a stash is deleted from the symbol table.
2228
2229=cut
2230*/
2231
ee72b38d 2232void
27a1175b 2233Perl_hv_ename_delete(pTHX_ HV *hv, const char *name, U32 len, U32 flags)
ee72b38d
FC
2234{
2235 dVAR;
2236 struct xpvhv_aux *aux;
2237
78b79c77 2238 PERL_ARGS_ASSERT_HV_ENAME_DELETE;
27a1175b 2239 PERL_UNUSED_ARG(flags);
ee72b38d
FC
2240
2241 if (len > I32_MAX)
2242 Perl_croak(aTHX_ "panic: hv name too long (%"UVuf")", (UV) len);
2243
2244 if (!SvOOK(hv)) return;
2245
2246 aux = HvAUX(hv);
2247 if (!aux->xhv_name) return;
2248
2249 if (aux->xhv_name_count) {
2250 HEK ** const namep = (HEK **)aux->xhv_name;
78b79c77
FC
2251 I32 const count = aux->xhv_name_count;
2252 HEK **victim = namep + (count < 0 ? -count : count);
2253 while (victim-- > namep + 1)
ee72b38d
FC
2254 if (
2255 HEK_LEN(*victim) == (I32)len
2256 && memEQ(HEK_KEY(*victim), name, len)
2257 ) {
2258 unshare_hek_or_pvn(*victim, 0, 0, 0);
78b79c77
FC
2259 if (count < 0) ++aux->xhv_name_count;
2260 else --aux->xhv_name_count;
2261 if (
2262 (aux->xhv_name_count == 1 || aux->xhv_name_count == -1)
2263 && !*namep
2264 ) { /* if there are none left */
ee72b38d
FC
2265 Safefree(namep);
2266 aux->xhv_name = NULL;
78b79c77 2267 aux->xhv_name_count = 0;
ee72b38d
FC
2268 }
2269 else {
2270 /* Move the last one back to fill the empty slot. It
2271 does not matter what order they are in. */
78b79c77 2272 *victim = *(namep + (count < 0 ? -count : count) - 1);
ee72b38d
FC
2273 }
2274 return;
2275 }
78b79c77
FC
2276 if (
2277 count > 0 && HEK_LEN(*namep) == (I32)len
2278 && memEQ(HEK_KEY(*namep),name,len)
2279 ) {
2280 aux->xhv_name_count = -count;
2281 }
ee72b38d
FC
2282 }
2283 else if(
2284 HEK_LEN(aux->xhv_name) == (I32)len
2285 && memEQ(HEK_KEY(aux->xhv_name), name, len)
2286 ) {
3f783763
FC
2287 const HEK * const namehek = aux->xhv_name;
2288 Newxc(aux->xhv_name, 1, HEK *, HEK);
2289 *(const HEK **)aux->xhv_name = namehek;
2290 aux->xhv_name_count = -1;
ee72b38d
FC
2291 }
2292}
2293
86f55936
NC
2294AV **
2295Perl_hv_backreferences_p(pTHX_ HV *hv) {
6136c704 2296 struct xpvhv_aux * const iter = SvOOK(hv) ? HvAUX(hv) : hv_auxinit(hv);
7918f24d
NC
2297
2298 PERL_ARGS_ASSERT_HV_BACKREFERENCES_P;
96a5add6 2299 PERL_UNUSED_CONTEXT;
7918f24d 2300
86f55936
NC
2301 return &(iter->xhv_backreferences);
2302}
2303
09aad8f0
DM
2304void
2305Perl_hv_kill_backrefs(pTHX_ HV *hv) {
2306 AV *av;
2307
2308 PERL_ARGS_ASSERT_HV_KILL_BACKREFS;
2309
2310 if (!SvOOK(hv))
2311 return;
2312
2313 av = HvAUX(hv)->xhv_backreferences;
2314
2315 if (av) {
2316 HvAUX(hv)->xhv_backreferences = 0;
2317 Perl_sv_kill_backrefs(aTHX_ MUTABLE_SV(hv), av);
5648c0ae
DM
2318 if (SvTYPE(av) == SVt_PVAV)
2319 SvREFCNT_dec(av);
09aad8f0
DM
2320 }
2321}
2322
954c1994 2323/*
7a7b9979
NC
2324hv_iternext is implemented as a macro in hv.h
2325
954c1994
GS
2326=for apidoc hv_iternext
2327
2328Returns entries from a hash iterator. See C<hv_iterinit>.
2329
fe7bca90
NC
2330You may call C<hv_delete> or C<hv_delete_ent> on the hash entry that the
2331iterator currently points to, without losing your place or invalidating your
2332iterator. Note that in this case the current entry is deleted from the hash
2333with your iterator holding the last reference to it. Your iterator is flagged
2334to free the entry on the next call to C<hv_iternext>, so you must not discard
2335your iterator immediately else the entry will leak - call C<hv_iternext> to
2336trigger the resource deallocation.
2337
fe7bca90
NC
2338=for apidoc hv_iternext_flags
2339
2340Returns entries from a hash iterator. See C<hv_iterinit> and C<hv_iternext>.
2341The C<flags> value will normally be zero; if HV_ITERNEXT_WANTPLACEHOLDERS is
2342set, the placeholder keys (for restricted hashes) will be returned in addition
2343to normal keys. By default placeholders are automatically skipped over.
7996736c
MHM
2344Currently a placeholder is implemented with a value that is
2345C<&Perl_sv_placeholder>. Note that the implementation of placeholders and
fe7bca90
NC
2346restricted hashes may change, and the implementation currently is
2347insufficiently abstracted for any change to be tidy.
e16e2ff8 2348
fe7bca90 2349=cut
e16e2ff8
NC
2350*/
2351
2352HE *
2353Perl_hv_iternext_flags(pTHX_ HV *hv, I32 flags)
2354{
27da23d5 2355 dVAR;
cbec9347 2356 register XPVHV* xhv;
79072805 2357 register HE *entry;
a0d0e21e 2358 HE *oldentry;
463ee0b2 2359 MAGIC* mg;
bfcb3514 2360 struct xpvhv_aux *iter;
79072805 2361
7918f24d
NC
2362 PERL_ARGS_ASSERT_HV_ITERNEXT_FLAGS;
2363
79072805 2364 if (!hv)
cea2e8a9 2365 Perl_croak(aTHX_ "Bad hash");
81714fb9 2366
cbec9347 2367 xhv = (XPVHV*)SvANY(hv);
bfcb3514 2368
b79f7545 2369 if (!SvOOK(hv)) {
bfcb3514
NC
2370 /* Too many things (well, pp_each at least) merrily assume that you can
2371 call iv_iternext without calling hv_iterinit, so we'll have to deal
2372 with it. */
2373 hv_iterinit(hv);
bfcb3514 2374 }
b79f7545 2375 iter = HvAUX(hv);
bfcb3514
NC
2376
2377 oldentry = entry = iter->xhv_eiter; /* HvEITER(hv) */
e62cc96a 2378 if (SvMAGICAL(hv) && SvRMAGICAL(hv)) {
ad64d0ec 2379 if ( ( mg = mg_find((const SV *)hv, PERL_MAGIC_tied) ) ) {
e62cc96a
YO
2380 SV * const key = sv_newmortal();
2381 if (entry) {
2382 sv_setsv(key, HeSVKEY_force(entry));
2383 SvREFCNT_dec(HeSVKEY(entry)); /* get rid of previous key */
2384 }
2385 else {
2386 char *k;
2387 HEK *hek;
2388
2389 /* one HE per MAGICAL hash */
2390 iter->xhv_eiter = entry = new_HE(); /* HvEITER(hv) = new_HE() */
2391 Zero(entry, 1, HE);
ad64d0ec 2392 Newxz(k, HEK_BASESIZE + sizeof(const SV *), char);
e62cc96a
YO
2393 hek = (HEK*)k;
2394 HeKEY_hek(entry) = hek;
2395 HeKLEN(entry) = HEf_SVKEY;
2396 }
ad64d0ec 2397 magic_nextpack(MUTABLE_SV(hv),mg,key);
e62cc96a
YO
2398 if (SvOK(key)) {
2399 /* force key to stay around until next time */
2400 HeSVKEY_set(entry, SvREFCNT_inc_simple_NN(key));
2401 return entry; /* beware, hent_val is not set */
2402 }
ef8d46e8 2403 SvREFCNT_dec(HeVAL(entry));
e62cc96a
YO
2404 Safefree(HeKEY_hek(entry));
2405 del_HE(entry);
2406 iter->xhv_eiter = NULL; /* HvEITER(hv) = NULL */
2407 return NULL;
81714fb9 2408 }
79072805 2409 }
7ee146b1 2410#if defined(DYNAMIC_ENV_FETCH) && !defined(__riscos__) /* set up %ENV for iteration */
ad64d0ec
NC
2411 if (!entry && SvRMAGICAL((const SV *)hv)
2412 && mg_find((const SV *)hv, PERL_MAGIC_env)) {
f675dbe5 2413 prime_env_iter();
03026e68
JM
2414#ifdef VMS
2415 /* The prime_env_iter() on VMS just loaded up new hash values
2416 * so the iteration count needs to be reset back to the beginning
2417 */
2418 hv_iterinit(hv);
2419 iter = HvAUX(hv);
2420 oldentry = entry = iter->xhv_eiter; /* HvEITER(hv) */
2421#endif
2422 }
f675dbe5 2423#endif
463ee0b2 2424
b79f7545
NC
2425 /* hv_iterint now ensures this. */
2426 assert (HvARRAY(hv));
2427
015a5f36 2428 /* At start of hash, entry is NULL. */
fde52b5c 2429 if (entry)
8aacddc1 2430 {
fde52b5c 2431 entry = HeNEXT(entry);
e16e2ff8
NC
2432 if (!(flags & HV_ITERNEXT_WANTPLACEHOLDERS)) {
2433 /*
2434 * Skip past any placeholders -- don't want to include them in
2435 * any iteration.
2436 */
7996736c 2437 while (entry && HeVAL(entry) == &PL_sv_placeholder) {
e16e2ff8
NC
2438 entry = HeNEXT(entry);
2439 }
8aacddc1
NIS
2440 }
2441 }
015a5f36 2442
9eb4ebd1
NC
2443 /* Skip the entire loop if the hash is empty. */
2444 if ((flags & HV_ITERNEXT_WANTPLACEHOLDERS)
2445 ? HvTOTALKEYS(hv) : HvUSEDKEYS(hv)) {
900ac051
MM
2446 while (!entry) {
2447 /* OK. Come to the end of the current list. Grab the next one. */
2448
2449 iter->xhv_riter++; /* HvRITER(hv)++ */
2450 if (iter->xhv_riter > (I32)xhv->xhv_max /* HvRITER(hv) > HvMAX(hv) */) {
2451 /* There is no next one. End of the hash. */
2452 iter->xhv_riter = -1; /* HvRITER(hv) = -1 */
2453 break;
2454 }
2455 entry = (HvARRAY(hv))[iter->xhv_riter];
8aacddc1 2456
900ac051
MM
2457 if (!(flags & HV_ITERNEXT_WANTPLACEHOLDERS)) {
2458 /* If we have an entry, but it's a placeholder, don't count it.
2459 Try the next. */
2460 while (entry && HeVAL(entry) == &PL_sv_placeholder)
2461 entry = HeNEXT(entry);
2462 }
2463 /* Will loop again if this linked list starts NULL
2464 (for HV_ITERNEXT_WANTPLACEHOLDERS)
2465 or if we run through it and find only placeholders. */
015a5f36 2466 }
fde52b5c 2467 }
79072805 2468
72940dca 2469 if (oldentry && HvLAZYDEL(hv)) { /* was deleted earlier? */
2470 HvLAZYDEL_off(hv);
68dc0745 2471 hv_free_ent(hv, oldentry);
72940dca 2472 }
a0d0e21e 2473
fdcd69b6 2474 /*if (HvREHASH(hv) && entry && !HeKREHASH(entry))
6c9570dc 2475 PerlIO_printf(PerlIO_stderr(), "Awooga %p %p\n", (void*)hv, (void*)entry);*/
fdcd69b6 2476
bfcb3514 2477 iter->xhv_eiter = entry; /* HvEITER(hv) = entry */
79072805
LW
2478 return entry;
2479}
2480
954c1994
GS
2481/*
2482=for apidoc hv_iterkey
2483
2484Returns the key from the current position of the hash iterator. See
2485C<hv_iterinit>.
2486
2487=cut
2488*/
2489
79072805 2490char *
864dbfa3 2491Perl_hv_iterkey(pTHX_ register HE *entry, I32 *retlen)
79072805 2492{
7918f24d
NC
2493 PERL_ARGS_ASSERT_HV_ITERKEY;
2494
fde52b5c 2495 if (HeKLEN(entry) == HEf_SVKEY) {
fb73857a 2496 STRLEN len;
0bd48802 2497 char * const p = SvPV(HeKEY_sv(entry), len);
fb73857a 2498 *retlen = len;
2499 return p;
fde52b5c 2500 }
2501 else {
2502 *retlen = HeKLEN(entry);
2503 return HeKEY(entry);
2504 }
2505}
2506
2507/* unlike hv_iterval(), this always returns a mortal copy of the key */
954c1994
GS
2508/*
2509=for apidoc hv_iterkeysv
2510
2511Returns the key as an C<SV*> from the current position of the hash
2512iterator. The return value will always be a mortal copy of the key. Also
2513see C<hv_iterinit>.
2514
2515=cut
2516*/
2517
fde52b5c 2518SV *
864dbfa3 2519Perl_hv_iterkeysv(pTHX_ register HE *entry)
fde52b5c 2520{
7918f24d
NC
2521 PERL_ARGS_ASSERT_HV_ITERKEYSV;
2522
c1b02ed8 2523 return sv_2mortal(newSVhek(HeKEY_hek(entry)));
79072805
LW
2524}
2525
954c1994
GS
2526/*
2527=for apidoc hv_iterval
2528
2529Returns the value from the current position of the hash iterator. See
2530C<hv_iterkey>.
2531
2532=cut
2533*/
2534
79072805 2535SV *
864dbfa3 2536Perl_hv_iterval(pTHX_ HV *hv, register HE *entry)
79072805 2537{
7918f24d
NC
2538 PERL_ARGS_ASSERT_HV_ITERVAL;
2539
8990e307 2540 if (SvRMAGICAL(hv)) {
ad64d0ec 2541 if (mg_find((const SV *)hv, PERL_MAGIC_tied)) {
c4420975 2542 SV* const sv = sv_newmortal();
bbce6d69 2543 if (HeKLEN(entry) == HEf_SVKEY)
ad64d0ec 2544 mg_copy(MUTABLE_SV(hv), sv, (char*)HeKEY_sv(entry), HEf_SVKEY);
a3b680e6 2545 else
ad64d0ec 2546 mg_copy(MUTABLE_SV(hv), sv, HeKEY(entry), HeKLEN(entry));
463ee0b2
LW
2547 return sv;
2548 }
79072805 2549 }
fde52b5c 2550 return HeVAL(entry);
79072805
LW
2551}
2552
954c1994
GS
2553/*
2554=for apidoc hv_iternextsv
2555
2556Performs an C<hv_iternext>, C<hv_iterkey>, and C<hv_iterval> in one
2557operation.
2558
2559=cut
2560*/
2561
a0d0e21e 2562SV *
864dbfa3 2563Perl_hv_iternextsv(pTHX_ HV *hv, char **key, I32 *retlen)
a0d0e21e 2564{
0bd48802
AL
2565 HE * const he = hv_iternext_flags(hv, 0);
2566
7918f24d
NC
2567 PERL_ARGS_ASSERT_HV_ITERNEXTSV;
2568
0bd48802 2569 if (!he)
a0d0e21e
LW
2570 return NULL;
2571 *key = hv_iterkey(he, retlen);
2572 return hv_iterval(hv, he);
2573}
2574
954c1994 2575/*
bc5cdc23
NC
2576
2577Now a macro in hv.h
2578
954c1994
GS
2579=for apidoc hv_magic
2580
2581Adds magic to a hash. See C<sv_magic>.
2582
2583=cut
2584*/
2585
bbce6d69 2586/* possibly free a shared string if no one has access to it
fde52b5c 2587 * len and hash must both be valid for str.
2588 */
bbce6d69 2589void
864dbfa3 2590Perl_unsharepvn(pTHX_ const char *str, I32 len, U32 hash)
fde52b5c 2591{
19692e8d
NC
2592 unshare_hek_or_pvn (NULL, str, len, hash);
2593}
2594
2595
2596void
2597Perl_unshare_hek(pTHX_ HEK *hek)
2598{
bf11fd37 2599 assert(hek);
19692e8d
NC
2600 unshare_hek_or_pvn(hek, NULL, 0, 0);
2601}
2602
2603/* possibly free a shared string if no one has access to it
2604 hek if non-NULL takes priority over the other 3, else str, len and hash
2605 are used. If so, len and hash must both be valid for str.
2606 */
df132699 2607STATIC void
97ddebaf 2608S_unshare_hek_or_pvn(pTHX_ const HEK *hek, const char *str, I32 len, U32 hash)
19692e8d 2609{
97aff369 2610 dVAR;
cbec9347 2611 register XPVHV* xhv;
20454177 2612 HE *entry;
fde52b5c 2613 register HE **oentry;
45d1cc86 2614 HE **first;
c3654f1a 2615 bool is_utf8 = FALSE;
19692e8d 2616 int k_flags = 0;
aec46f14 2617 const char * const save = str;
cbbf8932 2618 struct shared_he *he = NULL;
c3654f1a 2619
19692e8d 2620 if (hek) {
cbae3960
NC
2621 /* Find the shared he which is just before us in memory. */
2622 he = (struct shared_he *)(((char *)hek)
2623 - STRUCT_OFFSET(struct shared_he,
2624 shared_he_hek));
2625
2626 /* Assert that the caller passed us a genuine (or at least consistent)
2627 shared hek */
2628 assert (he->shared_he_he.hent_hek == hek);
29404ae0 2629
de616631
NC
2630 if (he->shared_he_he.he_valu.hent_refcount - 1) {
2631 --he->shared_he_he.he_valu.hent_refcount;
29404ae0
NC
2632 return;
2633 }
29404ae0 2634
19692e8d
NC
2635 hash = HEK_HASH(hek);
2636 } else if (len < 0) {
2637 STRLEN tmplen = -len;
2638 is_utf8 = TRUE;
2639 /* See the note in hv_fetch(). --jhi */
2640 str = (char*)bytes_from_utf8((U8*)str, &tmplen, &is_utf8);
2641 len = tmplen;
2642 if (is_utf8)
2643 k_flags = HVhek_UTF8;
2644 if (str != save)
2645 k_flags |= HVhek_WASUTF8 | HVhek_FREEKEY;
c3654f1a 2646 }
1c846c1f 2647
de616631 2648 /* what follows was the moral equivalent of:
6b88bc9c 2649 if ((Svp = hv_fetch(PL_strtab, tmpsv, FALSE, hash))) {
a0714e2c 2650 if (--*Svp == NULL)
6b88bc9c 2651 hv_delete(PL_strtab, str, len, G_DISCARD, hash);
bbce6d69 2652 } */
cbec9347 2653 xhv = (XPVHV*)SvANY(PL_strtab);
fde52b5c 2654 /* assert(xhv_array != 0) */
45d1cc86 2655 first = oentry = &(HvARRAY(PL_strtab))[hash & (I32) HvMAX(PL_strtab)];
6c1b96a1
NC
2656 if (he) {
2657 const HE *const he_he = &(he->shared_he_he);
45d1cc86 2658 for (entry = *oentry; entry; oentry = &HeNEXT(entry), entry = *oentry) {
35ab5632
NC
2659 if (entry == he_he)
2660 break;
19692e8d
NC
2661 }
2662 } else {
35a4481c 2663 const int flags_masked = k_flags & HVhek_MASK;
45d1cc86 2664 for (entry = *oentry; entry; oentry = &HeNEXT(entry), entry = *oentry) {
19692e8d
NC
2665 if (HeHASH(entry) != hash) /* strings can't be equal */
2666 continue;
2667 if (HeKLEN(entry) != len)
2668 continue;
2669 if (HeKEY(entry) != str && memNE(HeKEY(entry),str,len)) /* is this it? */
2670 continue;
2671 if (HeKFLAGS(entry) != flags_masked)
2672 continue;
19692e8d
NC
2673 break;
2674 }
2675 }
2676
35ab5632
NC
2677 if (entry) {
2678 if (--entry->he_valu.hent_refcount == 0) {
19692e8d 2679 *oentry = HeNEXT(entry);
cbae3960 2680 Safefree(entry);
4c7185a0 2681 xhv->xhv_keys--; /* HvTOTALKEYS(hv)-- */
19692e8d 2682 }
fde52b5c 2683 }
19692e8d 2684
9b387841
NC
2685 if (!entry)
2686 Perl_ck_warner_d(aTHX_ packWARN(WARN_INTERNAL),
2687 "Attempt to free non-existent shared string '%s'%s"
2688 pTHX__FORMAT,
2689 hek ? HEK_KEY(hek) : str,
2690 ((k_flags & HVhek_UTF8) ? " (utf8)" : "") pTHX__VALUE);
19692e8d
NC
2691 if (k_flags & HVhek_FREEKEY)
2692 Safefree(str);
fde52b5c 2693}
2694
bbce6d69 2695/* get a (constant) string ptr from the global string table
2696 * string will get added if it is not already there.
fde52b5c 2697 * len and hash must both be valid for str.
2698 */
bbce6d69 2699HEK *
864dbfa3 2700Perl_share_hek(pTHX_ const char *str, I32 len, register U32 hash)
fde52b5c 2701{
da58a35d 2702 bool is_utf8 = FALSE;
19692e8d 2703 int flags = 0;
aec46f14 2704 const char * const save = str;
da58a35d 2705
7918f24d
NC
2706 PERL_ARGS_ASSERT_SHARE_HEK;
2707
da58a35d 2708 if (len < 0) {
77caf834 2709 STRLEN tmplen = -len;
da58a35d 2710 is_utf8 = TRUE;
77caf834
JH
2711 /* See the note in hv_fetch(). --jhi */
2712 str = (char*)bytes_from_utf8((U8*)str, &tmplen, &is_utf8);
2713 len = tmplen;
19692e8d
NC
2714 /* If we were able to downgrade here, then than means that we were passed
2715 in a key which only had chars 0-255, but was utf8 encoded. */
2716 if (is_utf8)
2717 flags = HVhek_UTF8;
2718 /* If we found we were able to downgrade the string to bytes, then
2719 we should flag that it needs upgrading on keys or each. Also flag
2720 that we need share_hek_flags to free the string. */
2721 if (str != save)
2722 flags |= HVhek_WASUTF8 | HVhek_FREEKEY;
2723 }
2724
6e838c70 2725 return share_hek_flags (str, len, hash, flags);
19692e8d
NC
2726}
2727
6e838c70 2728STATIC HEK *
19692e8d
NC
2729S_share_hek_flags(pTHX_ const char *str, I32 len, register U32 hash, int flags)
2730{
97aff369 2731 dVAR;
19692e8d 2732 register HE *entry;
35a4481c 2733 const int flags_masked = flags & HVhek_MASK;
263cb4a6 2734 const U32 hindex = hash & (I32) HvMAX(PL_strtab);
7918f24d
NC
2735 register XPVHV * const xhv = (XPVHV*)SvANY(PL_strtab);
2736
2737 PERL_ARGS_ASSERT_SHARE_HEK_FLAGS;
bbce6d69 2738
fde52b5c 2739 /* what follows is the moral equivalent of:
1c846c1f 2740
6b88bc9c 2741 if (!(Svp = hv_fetch(PL_strtab, str, len, FALSE)))
a0714e2c 2742 hv_store(PL_strtab, str, len, NULL, hash);
fdcd69b6
NC
2743
2744 Can't rehash the shared string table, so not sure if it's worth
2745 counting the number of entries in the linked list
bbce6d69 2746 */
7918f24d 2747
fde52b5c 2748 /* assert(xhv_array != 0) */
263cb4a6
NC
2749 entry = (HvARRAY(PL_strtab))[hindex];
2750 for (;entry; entry = HeNEXT(entry)) {
fde52b5c 2751 if (HeHASH(entry) != hash) /* strings can't be equal */
2752 continue;
2753 if (HeKLEN(entry) != len)
2754 continue;
1c846c1f 2755 if (HeKEY(entry) != str && memNE(HeKEY(entry),str,len)) /* is this it? */
fde52b5c 2756 continue;
19692e8d 2757 if (HeKFLAGS(entry) != flags_masked)
c3654f1a 2758 continue;
fde52b5c 2759 break;
2760 }
263cb4a6
NC
2761
2762 if (!entry) {
45d1cc86
NC
2763 /* What used to be head of the list.
2764 If this is NULL, then we're the first entry for this slot, which
2765 means we need to increate fill. */
cbae3960
NC
2766 struct shared_he *new_entry;
2767 HEK *hek;
2768 char *k;
263cb4a6
NC
2769 HE **const head = &HvARRAY(PL_strtab)[hindex];
2770 HE *const next = *head;
cbae3960
NC
2771
2772 /* We don't actually store a HE from the arena and a regular HEK.
2773 Instead we allocate one chunk of memory big enough for both,
2774 and put the HEK straight after the HE. This way we can find the
2775 HEK directly from the HE.
2776 */
2777
a02a5408 2778 Newx(k, STRUCT_OFFSET(struct shared_he,
cbae3960
NC
2779 shared_he_hek.hek_key[0]) + len + 2, char);
2780 new_entry = (struct shared_he *)k;
2781 entry = &(new_entry->shared_he_he);
2782 hek = &(new_entry->shared_he_hek);
2783
2784 Copy(str, HEK_KEY(hek), len, char);
2785 HEK_KEY(hek)[len] = 0;
2786 HEK_LEN(hek) = len;
2787 HEK_HASH(hek) = hash;
2788 HEK_FLAGS(hek) = (unsigned char)flags_masked;
2789
2790 /* Still "point" to the HEK, so that other code need not know what
2791 we're up to. */
2792 HeKEY_hek(entry) = hek;
de616631 2793 entry->he_valu.hent_refcount = 0;
263cb4a6
NC
2794 HeNEXT(entry) = next;
2795 *head = entry;
cbae3960 2796
4c7185a0 2797 xhv->xhv_keys++; /* HvTOTALKEYS(hv)++ */
263cb4a6 2798 if (!next) { /* initial entry? */
5ac36297 2799 } else if (xhv->xhv_keys > xhv->xhv_max /* HvKEYS(hv) > HvMAX(hv) */) {
cbec9347 2800 hsplit(PL_strtab);
bbce6d69 2801 }
2802 }
2803
de616631 2804 ++entry->he_valu.hent_refcount;
19692e8d
NC
2805
2806 if (flags & HVhek_FREEKEY)
f9a63242 2807 Safefree(str);
19692e8d 2808
6e838c70 2809 return HeKEY_hek(entry);
fde52b5c 2810}
ecae49c0 2811
ca732855
NC
2812I32 *
2813Perl_hv_placeholders_p(pTHX_ HV *hv)
2814{
2815 dVAR;
ad64d0ec 2816 MAGIC *mg = mg_find((const SV *)hv, PERL_MAGIC_rhash);
ca732855 2817
7918f24d
NC
2818 PERL_ARGS_ASSERT_HV_PLACEHOLDERS_P;
2819
ca732855 2820 if (!mg) {
ad64d0ec 2821 mg = sv_magicext(MUTABLE_SV(hv), 0, PERL_MAGIC_rhash, 0, 0, 0);
ca732855
NC
2822
2823 if (!mg) {
2824 Perl_die(aTHX_ "panic: hv_placeholders_p");
2825 }
2826 }
2827 return &(mg->mg_len);
2828}
2829
2830
2831I32
0c289d13 2832Perl_hv_placeholders_get(pTHX_ const HV *hv)
ca732855
NC
2833{
2834 dVAR;
0c289d13 2835 MAGIC * const mg = mg_find((const SV *)hv, PERL_MAGIC_rhash);
ca732855 2836
7918f24d
NC
2837 PERL_ARGS_ASSERT_HV_PLACEHOLDERS_GET;
2838
ca732855
NC
2839 return mg ? mg->mg_len : 0;
2840}
2841
2842void
ac1e784a 2843Perl_hv_placeholders_set(pTHX_ HV *hv, I32 ph)
ca732855
NC
2844{
2845 dVAR;
ad64d0ec 2846 MAGIC * const mg = mg_find((const SV *)hv, PERL_MAGIC_rhash);
ca732855 2847
7918f24d
NC
2848 PERL_ARGS_ASSERT_HV_PLACEHOLDERS_SET;
2849
ca732855
NC
2850 if (mg) {
2851 mg->mg_len = ph;
2852 } else if (ph) {
ad64d0ec 2853 if (!sv_magicext(MUTABLE_SV(hv), 0, PERL_MAGIC_rhash, 0, 0, ph))
ca732855
NC
2854 Perl_die(aTHX_ "panic: hv_placeholders_set");
2855 }
2856 /* else we don't need to add magic to record 0 placeholders. */
2857}
ecae49c0 2858
2a49f0f5 2859STATIC SV *
7b0bddfa
NC
2860S_refcounted_he_value(pTHX_ const struct refcounted_he *he)
2861{
0b2d3faa 2862 dVAR;
7b0bddfa 2863 SV *value;
7918f24d
NC
2864
2865 PERL_ARGS_ASSERT_REFCOUNTED_HE_VALUE;
2866
7b0bddfa
NC
2867 switch(he->refcounted_he_data[0] & HVrhek_typemask) {
2868 case HVrhek_undef:
2869 value = newSV(0);
2870 break;
2871 case HVrhek_delete:
2872 value = &PL_sv_placeholder;
2873 break;
2874 case HVrhek_IV:
44ebaf21
NC
2875 value = newSViv(he->refcounted_he_val.refcounted_he_u_iv);
2876 break;
2877 case HVrhek_UV:
2878 value = newSVuv(he->refcounted_he_val.refcounted_he_u_uv);
7b0bddfa
NC
2879 break;
2880 case HVrhek_PV:
44ebaf21 2881 case HVrhek_PV_UTF8:
7b0bddfa
NC
2882 /* Create a string SV that directly points to the bytes in our
2883 structure. */
b9f83d2f 2884 value = newSV_type(SVt_PV);
7b0bddfa
NC
2885 SvPV_set(value, (char *) he->refcounted_he_data + 1);
2886 SvCUR_set(value, he->refcounted_he_val.refcounted_he_u_len);
2887 /* This stops anything trying to free it */
2888 SvLEN_set(value, 0);
2889 SvPOK_on(value);
2890 SvREADONLY_on(value);
44ebaf21 2891 if ((he->refcounted_he_data[0] & HVrhek_typemask) == HVrhek_PV_UTF8)
7b0bddfa
NC
2892 SvUTF8_on(value);
2893 break;
2894 default:
20439bc7
Z
2895 Perl_croak(aTHX_ "panic: refcounted_he_value bad flags %"UVxf,
2896 (UV)he->refcounted_he_data[0]);
7b0bddfa
NC
2897 }
2898 return value;
2899}
2900
ecae49c0 2901/*
20439bc7 2902=for apidoc m|HV *|refcounted_he_chain_2hv|const struct refcounted_he *c|U32 flags
8dff4fc5 2903
20439bc7
Z
2904Generates and returns a C<HV *> representing the content of a
2905C<refcounted_he> chain.
2906I<flags> is currently unused and must be zero.
8dff4fc5
BM
2907
2908=cut
2909*/
2910HV *
20439bc7 2911Perl_refcounted_he_chain_2hv(pTHX_ const struct refcounted_he *chain, U32 flags)
8dff4fc5 2912{
20439bc7
Z
2913 dVAR;
2914 HV *hv;
2915 U32 placeholders, max;
b3ca2e83 2916
20439bc7
Z
2917 if (flags)
2918 Perl_croak(aTHX_ "panic: refcounted_he_chain_2hv bad flags %"UVxf,
2919 (UV)flags);
b3ca2e83 2920
b3ca2e83
NC
2921 /* We could chase the chain once to get an idea of the number of keys,
2922 and call ksplit. But for now we'll make a potentially inefficient
2923 hash with only 8 entries in its array. */
20439bc7
Z
2924 hv = newHV();
2925 max = HvMAX(hv);
b3ca2e83
NC
2926 if (!HvARRAY(hv)) {
2927 char *array;
2928 Newxz(array, PERL_HV_ARRAY_ALLOC_BYTES(max + 1), char);
2929 HvARRAY(hv) = (HE**)array;
2930 }
2931
20439bc7 2932 placeholders = 0;
b3ca2e83 2933 while (chain) {
cbb1fbea 2934#ifdef USE_ITHREADS
b6bbf3fa 2935 U32 hash = chain->refcounted_he_hash;
cbb1fbea
NC
2936#else
2937 U32 hash = HEK_HASH(chain->refcounted_he_hek);
2938#endif
b3ca2e83
NC
2939 HE **oentry = &((HvARRAY(hv))[hash & max]);
2940 HE *entry = *oentry;
b6bbf3fa 2941 SV *value;
cbb1fbea 2942
b3ca2e83
NC
2943 for (; entry; entry = HeNEXT(entry)) {
2944 if (HeHASH(entry) == hash) {
9f769845
NC
2945 /* We might have a duplicate key here. If so, entry is older
2946 than the key we've already put in the hash, so if they are
2947 the same, skip adding entry. */
2948#ifdef USE_ITHREADS
2949 const STRLEN klen = HeKLEN(entry);
2950 const char *const key = HeKEY(entry);
2951 if (klen == chain->refcounted_he_keylen
2952 && (!!HeKUTF8(entry)
2953 == !!(chain->refcounted_he_data[0] & HVhek_UTF8))
2954 && memEQ(key, REF_HE_KEY(chain), klen))
2955 goto next_please;
2956#else
2957 if (HeKEY_hek(entry) == chain->refcounted_he_hek)
2958 goto next_please;
2959 if (HeKLEN(entry) == HEK_LEN(chain->refcounted_he_hek)
2960 && HeKUTF8(entry) == HEK_UTF8(chain->refcounted_he_hek)
2961 && memEQ(HeKEY(entry), HEK_KEY(chain->refcounted_he_hek),
2962 HeKLEN(entry)))
2963 goto next_please;
2964#endif
b3ca2e83
NC
2965 }
2966 }
2967 assert (!entry);
2968 entry = new_HE();
2969
cbb1fbea
NC
2970#ifdef USE_ITHREADS
2971 HeKEY_hek(entry)
7b0bddfa 2972 = share_hek_flags(REF_HE_KEY(chain),
b6bbf3fa
NC
2973 chain->refcounted_he_keylen,
2974 chain->refcounted_he_hash,
2975 (chain->refcounted_he_data[0]
2976 & (HVhek_UTF8|HVhek_WASUTF8)));
cbb1fbea 2977#else
71ad1b0c 2978 HeKEY_hek(entry) = share_hek_hek(chain->refcounted_he_hek);
cbb1fbea 2979#endif
7b0bddfa
NC
2980 value = refcounted_he_value(chain);
2981 if (value == &PL_sv_placeholder)
b3ca2e83 2982 placeholders++;
b6bbf3fa 2983 HeVAL(entry) = value;
b3ca2e83
NC
2984
2985 /* Link it into the chain. */
2986 HeNEXT(entry) = *oentry;
b3ca2e83
NC
2987 *oentry = entry;
2988
2989 HvTOTALKEYS(hv)++;
2990
2991 next_please:
71ad1b0c 2992 chain = chain->refcounted_he_next;
b3ca2e83
NC
2993 }
2994
2995 if (placeholders) {
2996 clear_placeholders(hv, placeholders);
2997 HvTOTALKEYS(hv) -= placeholders;
2998 }
2999
3000 /* We could check in the loop to see if we encounter any keys with key
3001 flags, but it's probably not worth it, as this per-hash flag is only
3002 really meant as an optimisation for things like Storable. */
3003 HvHASKFLAGS_on(hv);
def9038f 3004 DEBUG_A(Perl_hv_assert(aTHX_ hv));
b3ca2e83
NC
3005
3006 return hv;
3007}
3008
20439bc7
Z
3009/*
3010=for apidoc m|SV *|refcounted_he_fetch_pvn|const struct refcounted_he *chain|const char *keypv|STRLEN keylen|U32 hash|U32 flags
3011
3012Search along a C<refcounted_he> chain for an entry with the key specified
3013by I<keypv> and I<keylen>. If I<flags> has the C<REFCOUNTED_HE_KEY_UTF8>
3014bit set, the key octets are interpreted as UTF-8, otherwise they
3015are interpreted as Latin-1. I<hash> is a precomputed hash of the key
3016string, or zero if it has not been precomputed. Returns a mortal scalar
3017representing the value associated with the key, or C<&PL_sv_placeholder>
3018if there is no value associated with the key.
3019
3020=cut
3021*/
3022
7b0bddfa 3023SV *
20439bc7
Z
3024Perl_refcounted_he_fetch_pvn(pTHX_ const struct refcounted_he *chain,
3025 const char *keypv, STRLEN keylen, U32 hash, U32 flags)
7b0bddfa 3026{
0b2d3faa 3027 dVAR;
20439bc7
Z
3028 U8 utf8_flag;
3029 PERL_ARGS_ASSERT_REFCOUNTED_HE_FETCH_PVN;
7b0bddfa 3030
20439bc7
Z
3031 if (flags & ~REFCOUNTED_HE_KEY_UTF8)
3032 Perl_croak(aTHX_ "panic: refcounted_he_fetch_pvn bad flags %"UVxf,
3033 (UV)flags);
3034 if (!chain)
3035 return &PL_sv_placeholder;
3036 if (flags & REFCOUNTED_HE_KEY_UTF8) {
3037 /* For searching purposes, canonicalise to Latin-1 where possible. */
3038 const char *keyend = keypv + keylen, *p;
3039 STRLEN nonascii_count = 0;
3040 for (p = keypv; p != keyend; p++) {
3041 U8 c = (U8)*p;
3042 if (c & 0x80) {
3043 if (!((c & 0xfe) == 0xc2 && ++p != keyend &&
3044 (((U8)*p) & 0xc0) == 0x80))
3045 goto canonicalised_key;
3046 nonascii_count++;
3047 }
cd1d2f8a 3048 }
20439bc7
Z
3049 if (nonascii_count) {
3050 char *q;
3051 const char *p = keypv, *keyend = keypv + keylen;
3052 keylen -= nonascii_count;
3053 Newx(q, keylen, char);
3054 SAVEFREEPV(q);
3055 keypv = q;
3056 for (; p != keyend; p++, q++) {
3057 U8 c = (U8)*p;
3058 *q = (char)
3059 ((c & 0x80) ? ((c & 0x03) << 6) | (((U8)*++p) & 0x3f) : c);
cd1d2f8a
NC
3060 }
3061 }
20439bc7
Z
3062 flags &= ~REFCOUNTED_HE_KEY_UTF8;
3063 canonicalised_key: ;
3064 }
3065 utf8_flag = (flags & REFCOUNTED_HE_KEY_UTF8) ? HVhek_UTF8 : 0;
3066 if (!hash)
3067 PERL_HASH(hash, keypv, keylen);
7b0bddfa 3068
20439bc7
Z
3069 for (; chain; chain = chain->refcounted_he_next) {
3070 if (
7b0bddfa 3071#ifdef USE_ITHREADS
20439bc7
Z
3072 hash == chain->refcounted_he_hash &&
3073 keylen == chain->refcounted_he_keylen &&
3074 memEQ(REF_HE_KEY(chain), keypv, keylen) &&
3075 utf8_flag == (chain->refcounted_he_data[0] & HVhek_UTF8)
7b0bddfa 3076#else
20439bc7
Z
3077 hash == HEK_HASH(chain->refcounted_he_hek) &&
3078 keylen == (STRLEN)HEK_LEN(chain->refcounted_he_hek) &&
3079 memEQ(HEK_KEY(chain->refcounted_he_hek), keypv, keylen) &&
3080 utf8_flag == (HEK_FLAGS(chain->refcounted_he_hek) & HVhek_UTF8)
7b0bddfa 3081#endif
20439bc7
Z
3082 )
3083 return sv_2mortal(refcounted_he_value(chain));
7b0bddfa 3084 }
20439bc7
Z
3085 return &PL_sv_placeholder;
3086}
7b0bddfa 3087
20439bc7
Z
3088/*
3089=for apidoc m|SV *|refcounted_he_fetch_pv|const struct refcounted_he *chain|const char *key|U32 hash|U32 flags
7b0bddfa 3090
20439bc7
Z
3091Like L</refcounted_he_fetch_pvn>, but takes a nul-terminated string
3092instead of a string/length pair.
3093
3094=cut
3095*/
3096
3097SV *
3098Perl_refcounted_he_fetch_pv(pTHX_ const struct refcounted_he *chain,
3099 const char *key, U32 hash, U32 flags)
3100{
3101 PERL_ARGS_ASSERT_REFCOUNTED_HE_FETCH_PV;
3102 return refcounted_he_fetch_pvn(chain, key, strlen(key), hash, flags);
7b0bddfa
NC
3103}
3104
b3ca2e83 3105/*
20439bc7
Z
3106=for apidoc m|SV *|refcounted_he_fetch_sv|const struct refcounted_he *chain|SV *key|U32 hash|U32 flags
3107
3108Like L</refcounted_he_fetch_pvn>, but takes a Perl scalar instead of a
3109string/length pair.
3110
3111=cut
3112*/
b3ca2e83 3113
20439bc7
Z
3114SV *
3115Perl_refcounted_he_fetch_sv(pTHX_ const struct refcounted_he *chain,
3116 SV *key, U32 hash, U32 flags)
3117{
3118 const char *keypv;
3119 STRLEN keylen;
3120 PERL_ARGS_ASSERT_REFCOUNTED_HE_FETCH_SV;
3121 if (flags & REFCOUNTED_HE_KEY_UTF8)
3122 Perl_croak(aTHX_ "panic: refcounted_he_fetch_sv bad flags %"UVxf,
3123 (UV)flags);
3124 keypv = SvPV_const(key, keylen);
3125 if (SvUTF8(key))
3126 flags |= REFCOUNTED_HE_KEY_UTF8;
3127 if (!hash && SvIsCOW_shared_hash(key))
3128 hash = SvSHARED_HASH(key);
3129 return refcounted_he_fetch_pvn(chain, keypv, keylen, hash, flags);
3130}
3131
3132/*
3133=for apidoc m|struct refcounted_he *|refcounted_he_new_pvn|struct refcounted_he *parent|const char *keypv|STRLEN keylen|U32 hash|SV *value|U32 flags
3134
3135Creates a new C<refcounted_he>. This consists of a single key/value
3136pair and a reference to an existing C<refcounted_he> chain (which may
3137be empty), and thus forms a longer chain. When using the longer chain,
3138the new key/value pair takes precedence over any entry for the same key
3139further along the chain.
3140
3141The new key is specified by I<keypv> and I<keylen>. If I<flags> has
3142the C<REFCOUNTED_HE_KEY_UTF8> bit set, the key octets are interpreted
3143as UTF-8, otherwise they are interpreted as Latin-1. I<hash> is
3144a precomputed hash of the key string, or zero if it has not been
3145precomputed.
3146
3147I<value> is the scalar value to store for this key. I<value> is copied
3148by this function, which thus does not take ownership of any reference
3149to it, and later changes to the scalar will not be reflected in the
3150value visible in the C<refcounted_he>. Complex types of scalar will not
3151be stored with referential integrity, but will be coerced to strings.
3152I<value> may be either null or C<&PL_sv_placeholder> to indicate that no
3153value is to be associated with the key; this, as with any non-null value,
3154takes precedence over the existence of a value for the key further along
3155the chain.
3156
3157I<parent> points to the rest of the C<refcounted_he> chain to be
3158attached to the new C<refcounted_he>. This function takes ownership
3159of one reference to I<parent>, and returns one reference to the new
3160C<refcounted_he>.
b3ca2e83
NC
3161
3162=cut
3163*/
3164
3165struct refcounted_he *
20439bc7
Z
3166Perl_refcounted_he_new_pvn(pTHX_ struct refcounted_he *parent,
3167 const char *keypv, STRLEN keylen, U32 hash, SV *value, U32 flags)
3168{
7a89be66 3169 dVAR;
b6bbf3fa 3170 STRLEN value_len = 0;
95b63a38 3171 const char *value_p = NULL;
20439bc7 3172 bool is_pv;
b6bbf3fa 3173 char value_type;
20439bc7
Z
3174 char hekflags;
3175 STRLEN key_offset = 1;
3176 struct refcounted_he *he;
3177 PERL_ARGS_ASSERT_REFCOUNTED_HE_NEW_PVN;
b6bbf3fa 3178
20439bc7
Z
3179 if (!value || value == &PL_sv_placeholder) {
3180 value_type = HVrhek_delete;
3181 } else if (SvPOK(value)) {
b6bbf3fa
NC
3182 value_type = HVrhek_PV;
3183 } else if (SvIOK(value)) {
ad64d0ec 3184 value_type = SvUOK((const SV *)value) ? HVrhek_UV : HVrhek_IV;
b6bbf3fa
NC
3185 } else if (!SvOK(value)) {
3186 value_type = HVrhek_undef;
3187 } else {
3188 value_type = HVrhek_PV;
3189 }
20439bc7
Z
3190 is_pv = value_type == HVrhek_PV;
3191 if (is_pv) {
012da8e5
NC
3192 /* Do it this way so that the SvUTF8() test is after the SvPV, in case
3193 the value is overloaded, and doesn't yet have the UTF-8flag set. */
b6bbf3fa 3194 value_p = SvPV_const(value, value_len);
012da8e5
NC
3195 if (SvUTF8(value))
3196 value_type = HVrhek_PV_UTF8;
20439bc7
Z
3197 key_offset = value_len + 2;
3198 }
3199 hekflags = value_type;
3200
3201 if (flags & REFCOUNTED_HE_KEY_UTF8) {
3202 /* Canonicalise to Latin-1 where possible. */
3203 const char *keyend = keypv + keylen, *p;
3204 STRLEN nonascii_count = 0;
3205 for (p = keypv; p != keyend; p++) {
3206 U8 c = (U8)*p;
3207 if (c & 0x80) {
3208 if (!((c & 0xfe) == 0xc2 && ++p != keyend &&
3209 (((U8)*p) & 0xc0) == 0x80))
3210 goto canonicalised_key;
3211 nonascii_count++;
3212 }
3213 }
3214 if (nonascii_count) {
3215 char *q;
3216 const char *p = keypv, *keyend = keypv + keylen;
3217 keylen -= nonascii_count;
3218 Newx(q, keylen, char);
3219 SAVEFREEPV(q);
3220 keypv = q;
3221 for (; p != keyend; p++, q++) {
3222 U8 c = (U8)*p;
3223 *q = (char)
3224 ((c & 0x80) ? ((c & 0x03) << 6) | (((U8)*++p) & 0x3f) : c);
3225 }
3226 }
3227 flags &= ~REFCOUNTED_HE_KEY_UTF8;
3228 canonicalised_key: ;
b6bbf3fa 3229 }
20439bc7
Z
3230 if (flags & REFCOUNTED_HE_KEY_UTF8)
3231 hekflags |= HVhek_UTF8;
3232 if (!hash)
3233 PERL_HASH(hash, keypv, keylen);
012da8e5 3234
0de694c5 3235#ifdef USE_ITHREADS
10edeb5d
JH
3236 he = (struct refcounted_he*)
3237 PerlMemShared_malloc(sizeof(struct refcounted_he) - 1
20439bc7 3238 + keylen
20439bc7 3239 + key_offset);
0de694c5
NC
3240#else
3241 he = (struct refcounted_he*)
3242 PerlMemShared_malloc(sizeof(struct refcounted_he) - 1
3243 + key_offset);
3244#endif
b3ca2e83 3245
71ad1b0c 3246 he->refcounted_he_next = parent;
b6bbf3fa 3247
012da8e5 3248 if (is_pv) {
20439bc7 3249 Copy(value_p, he->refcounted_he_data + 1, value_len + 1, char);
b6bbf3fa 3250 he->refcounted_he_val.refcounted_he_u_len = value_len;
b6bbf3fa 3251 } else if (value_type == HVrhek_IV) {
20439bc7 3252 he->refcounted_he_val.refcounted_he_u_iv = SvIVX(value);
012da8e5 3253 } else if (value_type == HVrhek_UV) {
20439bc7 3254 he->refcounted_he_val.refcounted_he_u_uv = SvUVX(value);
b6bbf3fa
NC
3255 }
3256
cbb1fbea 3257#ifdef USE_ITHREADS
b6bbf3fa 3258 he->refcounted_he_hash = hash;
20439bc7
Z
3259 he->refcounted_he_keylen = keylen;
3260 Copy(keypv, he->refcounted_he_data + key_offset, keylen, char);
cbb1fbea 3261#else
20439bc7 3262 he->refcounted_he_hek = share_hek_flags(keypv, keylen, hash, hekflags);
cbb1fbea 3263#endif
b6bbf3fa 3264
20439bc7 3265 he->refcounted_he_data[0] = hekflags;
b3ca2e83
NC
3266 he->refcounted_he_refcnt = 1;
3267
3268 return he;
3269}
3270
3271/*
20439bc7 3272=for apidoc m|struct refcounted_he *|refcounted_he_new_pv|struct refcounted_he *parent|const char *key|U32 hash|SV *value|U32 flags
b3ca2e83 3273
20439bc7
Z
3274Like L</refcounted_he_new_pvn>, but takes a nul-terminated string instead
3275of a string/length pair.
3276
3277=cut
3278*/
3279
3280struct refcounted_he *
3281Perl_refcounted_he_new_pv(pTHX_ struct refcounted_he *parent,
3282 const char *key, U32 hash, SV *value, U32 flags)
3283{
3284 PERL_ARGS_ASSERT_REFCOUNTED_HE_NEW_PV;
3285 return refcounted_he_new_pvn(parent, key, strlen(key), hash, value, flags);
3286}
3287
3288/*
3289=for apidoc m|struct refcounted_he *|refcounted_he_new_sv|struct refcounted_he *parent|SV *key|U32 hash|SV *value|U32 flags
3290
3291Like L</refcounted_he_new_pvn>, but takes a Perl scalar instead of a
3292string/length pair.
3293
3294=cut
3295*/
3296
3297struct refcounted_he *
3298Perl_refcounted_he_new_sv(pTHX_ struct refcounted_he *parent,
3299 SV *key, U32 hash, SV *value, U32 flags)
3300{
3301 const char *keypv;
3302 STRLEN keylen;
3303 PERL_ARGS_ASSERT_REFCOUNTED_HE_NEW_SV;
3304 if (flags & REFCOUNTED_HE_KEY_UTF8)
3305 Perl_croak(aTHX_ "panic: refcounted_he_new_sv bad flags %"UVxf,
3306 (UV)flags);
3307 keypv = SvPV_const(key, keylen);
3308 if (SvUTF8(key))
3309 flags |= REFCOUNTED_HE_KEY_UTF8;
3310 if (!hash && SvIsCOW_shared_hash(key))
3311 hash = SvSHARED_HASH(key);
3312 return refcounted_he_new_pvn(parent, keypv, keylen, hash, value, flags);
3313}
3314
3315/*
3316=for apidoc m|void|refcounted_he_free|struct refcounted_he *he
3317
3318Decrements the reference count of a C<refcounted_he> by one. If the
3319reference count reaches zero the structure's memory is freed, which
3320(recursively) causes a reduction of its parent C<refcounted_he>'s
3321reference count. It is safe to pass a null pointer to this function:
3322no action occurs in this case.
b3ca2e83
NC
3323
3324=cut
3325*/
3326
3327void
3328Perl_refcounted_he_free(pTHX_ struct refcounted_he *he) {
53d44271 3329 dVAR;
57ca3b03
AL
3330 PERL_UNUSED_CONTEXT;
3331
b3ca2e83
NC
3332 while (he) {
3333 struct refcounted_he *copy;
cbb1fbea 3334 U32 new_count;
b3ca2e83 3335
cbb1fbea
NC
3336 HINTS_REFCNT_LOCK;
3337 new_count = --he->refcounted_he_refcnt;
3338 HINTS_REFCNT_UNLOCK;
3339
3340 if (new_count) {
b3ca2e83 3341 return;
cbb1fbea 3342 }
b3ca2e83 3343
b6bbf3fa 3344#ifndef USE_ITHREADS
71ad1b0c 3345 unshare_hek_or_pvn (he->refcounted_he_hek, 0, 0, 0);
cbb1fbea 3346#endif
b3ca2e83 3347 copy = he;
71ad1b0c 3348 he = he->refcounted_he_next;
b6bbf3fa 3349 PerlMemShared_free(copy);
b3ca2e83
NC
3350 }
3351}
3352
20439bc7
Z
3353/*
3354=for apidoc m|struct refcounted_he *|refcounted_he_inc|struct refcounted_he *he
3355
3356Increment the reference count of a C<refcounted_he>. The pointer to the
3357C<refcounted_he> is also returned. It is safe to pass a null pointer
3358to this function: no action occurs and a null pointer is returned.
3359
3360=cut
3361*/
3362
3363struct refcounted_he *
3364Perl_refcounted_he_inc(pTHX_ struct refcounted_he *he)
3365{
3366 if (he) {
3367 HINTS_REFCNT_LOCK;
3368 he->refcounted_he_refcnt++;
3369 HINTS_REFCNT_UNLOCK;
3370 }
3371 return he;
3372}
3373
47550813
NC
3374/* pp_entereval is aware that labels are stored with a key ':' at the top of
3375 the linked list. */
dca6062a 3376const char *
ce42d03d 3377Perl_fetch_cop_label(pTHX_ COP *const cop, STRLEN *len, U32 *flags) {
d6747b7a
NC
3378 struct refcounted_he *const chain = cop->cop_hints_hash;
3379
3380 PERL_ARGS_ASSERT_FETCH_COP_LABEL;
3381
dca6062a
NC
3382 if (!chain)
3383 return NULL;
3384#ifdef USE_ITHREADS
3385 if (chain->refcounted_he_keylen != 1)
3386 return NULL;
3387 if (*REF_HE_KEY(chain) != ':')
3388 return NULL;
3389#else
3390 if ((STRLEN)HEK_LEN(chain->refcounted_he_hek) != 1)
3391 return NULL;
3392 if (*HEK_KEY(chain->refcounted_he_hek) != ':')
3393 return NULL;
3394#endif
012da8e5
NC
3395 /* Stop anyone trying to really mess us up by adding their own value for
3396 ':' into %^H */
3397 if ((chain->refcounted_he_data[0] & HVrhek_typemask) != HVrhek_PV
3398 && (chain->refcounted_he_data[0] & HVrhek_typemask) != HVrhek_PV_UTF8)
3399 return NULL;
3400
dca6062a
NC
3401 if (len)
3402 *len = chain->refcounted_he_val.refcounted_he_u_len;
3403 if (flags) {
3404 *flags = ((chain->refcounted_he_data[0] & HVrhek_typemask)
3405 == HVrhek_PV_UTF8) ? SVf_UTF8 : 0;
3406 }
3407 return chain->refcounted_he_data + 1;
3408}
3409
a77ac40c
NC
3410void
3411Perl_store_cop_label(pTHX_ COP *const cop, const char *label, STRLEN len,
3412 U32 flags)
012da8e5 3413{
20439bc7 3414 SV *labelsv;
547bb267
NC
3415 PERL_ARGS_ASSERT_STORE_COP_LABEL;
3416
a77ac40c
NC
3417 if (flags & ~(SVf_UTF8))
3418 Perl_croak(aTHX_ "panic: store_cop_label illegal flag bits 0x%" UVxf,
3419 (UV)flags);
20439bc7
Z
3420 labelsv = sv_2mortal(newSVpvn(label, len));
3421 if (flags & SVf_UTF8)
3422 SvUTF8_on(labelsv);
a77ac40c 3423 cop->cop_hints_hash
20439bc7 3424 = refcounted_he_new_pvs(cop->cop_hints_hash, ":", labelsv, 0);
012da8e5
NC
3425}
3426
/*
=for apidoc hv_assert

Check that a hash is in an internally consistent state.

=cut
*/

#ifdef DEBUGGING

/* Walks every entry of hv (placeholders included) and cross-checks what it
   finds against the hash's own bookkeeping: the key and placeholder counts
   (skipped for tied hashes), the HASKFLAGS flag, and that no key has both
   the UTF8 and WASUTF8 flags.  Each problem is reported on Perl_debug_log
   and, if there was any, the hash is dumped with sv_dump().  The iterator
   position that was current on entry is put back before returning.  */
void
Perl_hv_assert(pTHX_ HV *hv)
{
    dVAR;
    HE* entry;
    int withflags = 0;
    int placeholders = 0;
    int real = 0;
    int bad = 0;
    const I32 riter = HvRITER_get(hv);
    HE *eiter = HvEITER_get(hv);

    PERL_ARGS_ASSERT_HV_ASSERT;

    (void)hv_iterinit(hv);

    while ((entry = hv_iternext_flags(hv, HV_ITERNEXT_WANTPLACEHOLDERS))) {
        /* sanity check the values */
        if (HeVAL(entry) == &PL_sv_placeholder)
            placeholders++;
        else
            real++;
        /* sanity check the keys */
        if (HeSVKEY(entry)) {
            NOOP; /* Don't know what to check on SV keys.  */
        } else if (HeKUTF8(entry)) {
            withflags++;
            if (HeKWASUTF8(entry)) {
                PerlIO_printf(Perl_debug_log,
                              "hash key has both WASUTF8 and UTF8: '%.*s'\n",
                              (int) HeKLEN(entry),  HeKEY(entry));
                bad = 1;
            }
        } else if (HeKWASUTF8(entry))
            withflags++;
    }
    if (!SvTIED_mg((const SV *)hv, PERL_MAGIC_tied)) {
        /* The format supplies the "(s)" suffix itself, so the noun passed
           in must be singular. */
        static const char bad_count[] = "Count %d %s(s), but hash reports %d\n";
        const int nhashkeys = HvUSEDKEYS(hv);
        const int nhashplaceholders = HvPLACEHOLDERS_get(hv);

        if (nhashkeys != real) {
            PerlIO_printf(Perl_debug_log, bad_count, real, "key", nhashkeys );
            bad = 1;
        }
        if (nhashplaceholders != placeholders) {
            PerlIO_printf(Perl_debug_log, bad_count, placeholders, "placeholder", nhashplaceholders );
            bad = 1;
        }
    }
    if (withflags && ! HvHASKFLAGS(hv)) {
        PerlIO_printf(Perl_debug_log,
                      "Hash has HASKFLAGS off but I count %d key(s) with flags\n",
                      withflags);
        bad = 1;
    }
    if (bad) {
        sv_dump(MUTABLE_SV(hv));
    }
    HvRITER_set(hv, riter);		/* Restore hash iterator state */
    HvEITER_set(hv, eiter);
}

#endif
3501
af3babe4
NC
3502/*
3503 * Local variables:
3504 * c-indentation-style: bsd
3505 * c-basic-offset: 4
3506 * indent-tabs-mode: t
3507 * End:
3508 *
37442d52
RGS
3509 * ex: set ts=8 sts=4 sw=4 noet:
3510 */