X-Git-Url: https://perl5.git.perl.org/perl5.git/blobdiff_plain/ac7a6f5849b5fd57b2e837f4ddbc18c992610e9c..3c239bea80af65ef9ef306b586824cecbad9e09c:/inline_invlist.c diff --git a/inline_invlist.c b/inline_invlist.c index b194c0d..1875a05 100644 --- a/inline_invlist.c +++ b/inline_invlist.c @@ -8,63 +8,44 @@ #if defined(PERL_IN_UTF8_C) || defined(PERL_IN_REGCOMP_C) || defined(PERL_IN_REGEXEC_C) -#define INVLIST_LEN_OFFSET 0 /* Number of elements in the inversion list */ -#define INVLIST_ITER_OFFSET 1 /* Current iteration position */ -#define INVLIST_PREVIOUS_INDEX_OFFSET 2 /* Place to cache index of previous - result */ - -/* This is a combination of a version and data structure type, so that one - * being passed in can be validated to be an inversion list of the correct - * vintage. When the structure of the header is changed, a new random number - * in the range 2**31-1 should be generated and the new() method changed to - * insert that at this location. Then, if an auxiliary program doesn't change - * correspondingly, it will be discovered immediately */ -#define INVLIST_VERSION_ID_OFFSET 3 -#define INVLIST_VERSION_ID 1039476070 - -#define INVLIST_ZERO_OFFSET 4 /* 0 or 1 */ -/* The UV at position ZERO contains either 0 or 1. If 0, the inversion list - * contains the code point U+00000, and begins at element [0] in the array, - * which always contains 0. If 1, the inversion list doesn't contain U+0000, - * and it begins at element [1]. Inverting an inversion list consists of - * adding or removing the 0 at the beginning of it. By reserving a space for - * that 0, inversion can be made very fast: we just flip this UV */ - -/* For safety, when adding new elements, remember to #undef them at the end of - * the inversion list code section */ - -#define HEADER_LENGTH (INVLIST_ZERO_OFFSET + 2) /* includes 1 for the constant - 0 element */ - /* An element is in an inversion list iff its index is even numbered: 0, 2, 4, * etc */ #define ELEMENT_RANGE_MATCHES_INVLIST(i) (! ((i) & 1)) #define PREV_RANGE_MATCHES_INVLIST(i) (! ELEMENT_RANGE_MATCHES_INVLIST(i)) -PERL_STATIC_INLINE UV* -S__get_invlist_len_addr(pTHX_ SV* invlist) +/* This converts to/from our UVs to what the SV code is expecting: bytes. */ +#define TO_INTERNAL_SIZE(x) ((x) * sizeof(UV)) +#define FROM_INTERNAL_SIZE(x) ((x)/ sizeof(UV)) + +PERL_STATIC_INLINE bool* +S_get_invlist_offset_addr(SV* invlist) { - /* Return the address of the UV that contains the current number - * of used elements in the inversion list */ + /* Return the address of the field that says whether the inversion list is + * offset (it contains 1) or not (contains 0) */ + PERL_ARGS_ASSERT_GET_INVLIST_OFFSET_ADDR; - PERL_ARGS_ASSERT__GET_INVLIST_LEN_ADDR; + assert(SvTYPE(invlist) == SVt_INVLIST); - return (UV *) (SvPVX(invlist) + (INVLIST_LEN_OFFSET * sizeof (UV))); + return &(((XINVLIST*) SvANY(invlist))->is_offset); } PERL_STATIC_INLINE UV -S__invlist_len(pTHX_ SV* const invlist) +S__invlist_len(SV* const invlist) { /* Returns the current number of elements stored in the inversion list's * array */ PERL_ARGS_ASSERT__INVLIST_LEN; - return *_get_invlist_len_addr(invlist); + assert(SvTYPE(invlist) == SVt_INVLIST); + + return (SvCUR(invlist) == 0) + ? 0 + : FROM_INTERNAL_SIZE(SvCUR(invlist)) - *get_invlist_offset_addr(invlist); } PERL_STATIC_INLINE bool -S__invlist_contains_cp(pTHX_ SV* const invlist, const UV cp) +S__invlist_contains_cp(SV* const invlist, const UV cp) { /* Does contain code point as part of the set? */ @@ -75,4 +56,11 @@ S__invlist_contains_cp(pTHX_ SV* const invlist, const UV cp) return index >= 0 && ELEMENT_RANGE_MATCHES_INVLIST(index); } +# if defined(PERL_IN_UTF8_C) || defined(PERL_IN_REGEXEC_C) + +/* These symbols are only needed later in regcomp.c */ +# undef TO_INTERNAL_SIZE +# undef FROM_INTERNAL_SIZE +# endif + #endif