regcomp.c: Fix comment

[perl5.git] / numeric.c
diff --git a/numeric.c b/numeric.c

index 1900d10..7065486 100644 (file)
--- a/numeric.c
+++ b/numeric.c
@@ -39,7 +39,7 @@ Perl_cast_ulong(NV f)
      if (f < U32_MAX_P1_HALF)
        return (U32) f;
      f -= U32_MAX_P1_HALF;
-    return ((U32) f) | (1 + U32_MAX >> 1);
+    return ((U32) f) | (1 + (U32_MAX >> 1));
  #else
      return (U32) f;
  #endif
@@ -57,7 +57,7 @@ Perl_cast_i32(NV f)
      if (f < U32_MAX_P1_HALF)
        return (I32)(U32) f;
      f -= U32_MAX_P1_HALF;
-    return (I32)(((U32) f) | (1 + U32_MAX >> 1));
+    return (I32)(((U32) f) | (1 + (U32_MAX >> 1)));
  #else
      return (I32)(U32) f;
  #endif
@@ -76,7 +76,7 @@ Perl_cast_iv(NV f)
      if (f < UV_MAX_P1_HALF)
        return (IV)(UV) f;
      f -= UV_MAX_P1_HALF;
-    return (IV)(((UV) f) | (1 + UV_MAX >> 1));
+    return (IV)(((UV) f) | (1 + (UV_MAX >> 1)));
  #else
      return (IV)(UV) f;
  #endif
@@ -94,7 +94,7 @@ Perl_cast_uv(NV f)
      if (f < UV_MAX_P1_HALF)
        return (UV) f;
      f -= UV_MAX_P1_HALF;
-    return ((UV) f) | (1 + UV_MAX >> 1);
+    return ((UV) f) | (1 + (UV_MAX >> 1));
  #else
      return (UV) f;
  #endif
@@ -108,7 +108,7 @@ Perl_cast_uv(NV f)
  converts a string representing a binary number to numeric form.
  
  On entry C<start> and C<*len> give the string to scan, C<*flags> gives
-conversion flags, and C<result> should be NULL or a pointer to an NV.
+conversion flags, and C<result> should be C<NULL> or a pointer to an NV.
  The scan stops at the end of the string, or the first invalid character.
  Unless C<PERL_SCAN_SILENT_ILLDIGIT> is set in C<*flags>, encountering an
  invalid character will also trigger a warning.
@@ -116,15 +116,15 @@ On return C<*len> is set to the length of the scanned string,
  and C<*flags> gives output flags.
  
  If the value is <= C<UV_MAX> it is returned as a UV, the output flags are clear,
-and nothing is written to C<*result>.  If the value is > UV_MAX C<grok_bin>
-returns UV_MAX, sets C<PERL_SCAN_GREATER_THAN_UV_MAX> in the output flags,
+and nothing is written to C<*result>.  If the value is > C<UV_MAX>, C<grok_bin>
+returns C<UV_MAX>, sets C<PERL_SCAN_GREATER_THAN_UV_MAX> in the output flags,
  and writes the value to C<*result> (or the value is discarded if C<result>
  is NULL).
  
-The binary number may optionally be prefixed with "0b" or "b" unless
+The binary number may optionally be prefixed with C<"0b"> or C<"b"> unless
  C<PERL_SCAN_DISALLOW_PREFIX> is set in C<*flags> on entry.  If
  C<PERL_SCAN_ALLOW_UNDERSCORES> is set in C<*flags> then the binary
-number may use '_' characters to separate digits.
+number may use C<"_"> characters to separate digits.
  
  =cut
  
@@ -231,23 +231,23 @@ Perl_grok_bin(pTHX_ const char *start, STRLEN *len_p, I32 *flags, NV *result)
  converts a string representing a hex number to numeric form.
  
  On entry C<start> and C<*len_p> give the string to scan, C<*flags> gives
-conversion flags, and C<result> should be NULL or a pointer to an NV.
+conversion flags, and C<result> should be C<NULL> or a pointer to an NV.
  The scan stops at the end of the string, or the first invalid character.
  Unless C<PERL_SCAN_SILENT_ILLDIGIT> is set in C<*flags>, encountering an
  invalid character will also trigger a warning.
  On return C<*len> is set to the length of the scanned string,
  and C<*flags> gives output flags.
  
-If the value is <= UV_MAX it is returned as a UV, the output flags are clear,
-and nothing is written to C<*result>.  If the value is > UV_MAX C<grok_hex>
-returns UV_MAX, sets C<PERL_SCAN_GREATER_THAN_UV_MAX> in the output flags,
+If the value is <= C<UV_MAX> it is returned as a UV, the output flags are clear,
+and nothing is written to C<*result>.  If the value is > C<UV_MAX>, C<grok_hex>
+returns C<UV_MAX>, sets C<PERL_SCAN_GREATER_THAN_UV_MAX> in the output flags,
  and writes the value to C<*result> (or the value is discarded if C<result>
-is NULL).
+is C<NULL>).
  
-The hex number may optionally be prefixed with "0x" or "x" unless
+The hex number may optionally be prefixed with C<"0x"> or C<"x"> unless
  C<PERL_SCAN_DISALLOW_PREFIX> is set in C<*flags> on entry.  If
  C<PERL_SCAN_ALLOW_UNDERSCORES> is set in C<*flags> then the hex
-number may use '_' characters to separate digits.
+number may use C<"_"> characters to separate digits.
  
  =cut
  
@@ -352,21 +352,21 @@ Perl_grok_hex(pTHX_ const char *start, STRLEN *len_p, I32 *flags, NV *result)
  converts a string representing an octal number to numeric form.
  
  On entry C<start> and C<*len> give the string to scan, C<*flags> gives
-conversion flags, and C<result> should be NULL or a pointer to an NV.
+conversion flags, and C<result> should be C<NULL> or a pointer to an NV.
  The scan stops at the end of the string, or the first invalid character.
  Unless C<PERL_SCAN_SILENT_ILLDIGIT> is set in C<*flags>, encountering an
  8 or 9 will also trigger a warning.
  On return C<*len> is set to the length of the scanned string,
  and C<*flags> gives output flags.
  
-If the value is <= UV_MAX it is returned as a UV, the output flags are clear,
-and nothing is written to C<*result>.  If the value is > UV_MAX C<grok_oct>
-returns UV_MAX, sets C<PERL_SCAN_GREATER_THAN_UV_MAX> in the output flags,
+If the value is <= C<UV_MAX> it is returned as a UV, the output flags are clear,
+and nothing is written to C<*result>.  If the value is > C<UV_MAX>, C<grok_oct>
+returns C<UV_MAX>, sets C<PERL_SCAN_GREATER_THAN_UV_MAX> in the output flags,
  and writes the value to C<*result> (or the value is discarded if C<result>
-is NULL).
+is C<NULL>).
  
  If C<PERL_SCAN_ALLOW_UNDERSCORES> is set in C<*flags> then the octal
-number may use '_' characters to separate digits.
+number may use C<"_"> characters to separate digits.
  
  =cut
  
@@ -551,7 +551,7 @@ Perl_grok_numeric_radix(pTHX_ const char **sp, const char *send)
  /*
  =for apidoc grok_infnan
  
-Helper for grok_number(), accepts various ways of spelling "infinity"
+Helper for C<grok_number()>, accepts various ways of spelling "infinity"
  or "not a number", and returns one of the following flag combinations:
  
    IS_NUMBER_INFINITE
@@ -560,11 +560,11 @@ or "not a number", and returns one of the following flag combinations:
    IS_NUMBER_NAN | IS_NUMBER_NEG
    0
  
-possibly |-ed with IS_NUMBER_TRAILING.
+possibly |-ed with C<IS_NUMBER_TRAILING>.
  
-If an infinity or a not-a-number is recognized, the *sp will point to
+If an infinity or a not-a-number is recognized, C<*sp> will point to
  one byte past the end of the recognized string.  If the recognition fails,
-zero is returned, and the *sp will not move.
+zero is returned, and C<*sp> will not move.
  
  =cut
  */
@@ -574,6 +574,7 @@ Perl_grok_infnan(pTHX_ const char** sp, const char* send)
  {
      const char* s = *sp;
      int flags = 0;
+#if defined(NV_INF) || defined(NV_NAN)
      bool odh = FALSE; /* one-dot-hash: 1.#INF */
  
      PERL_ARGS_ASSERT_GROK_INFNAN;
@@ -798,6 +799,9 @@ Perl_grok_infnan(pTHX_ const char** sp, const char* send)
      while (s < send && isSPACE(*s))
          s++;
  
+#else
+    PERL_UNUSED_ARG(send);
+#endif /* #if defined(NV_INF) || defined(NV_NAN) */
      *sp = s;
      return flags;
  }
@@ -807,20 +811,20 @@ Perl_grok_infnan(pTHX_ const char** sp, const char* send)
  
  Recognise (or not) a number.  The type of the number is returned
  (0 if unrecognised), otherwise it is a bit-ORed combination of
-IS_NUMBER_IN_UV, IS_NUMBER_GREATER_THAN_UV_MAX, IS_NUMBER_NOT_INT,
-IS_NUMBER_NEG, IS_NUMBER_INFINITY, IS_NUMBER_NAN (defined in perl.h).
-
-If the value of the number can fit in a UV, it is returned in the *valuep
-IS_NUMBER_IN_UV will be set to indicate that *valuep is valid, IS_NUMBER_IN_UV
-will never be set unless *valuep is valid, but *valuep may have been assigned
-to during processing even though IS_NUMBER_IN_UV is not set on return.
-If valuep is NULL, IS_NUMBER_IN_UV will be set for the same cases as when
-valuep is non-NULL, but no actual assignment (or SEGV) will occur.
-
-IS_NUMBER_NOT_INT will be set with IS_NUMBER_IN_UV if trailing decimals were
-seen (in which case *valuep gives the true value truncated to an integer), and
-IS_NUMBER_NEG if the number is negative (in which case *valuep holds the
-absolute value).  IS_NUMBER_IN_UV is not set if e notation was used or the
+C<IS_NUMBER_IN_UV>, C<IS_NUMBER_GREATER_THAN_UV_MAX>, C<IS_NUMBER_NOT_INT>,
+C<IS_NUMBER_NEG>, C<IS_NUMBER_INFINITY>, C<IS_NUMBER_NAN> (defined in perl.h).
+
+If the value of the number can fit in a UV, it is returned in C<*valuep>.
+C<IS_NUMBER_IN_UV> will be set to indicate that C<*valuep> is valid, C<IS_NUMBER_IN_UV>
+will never be set unless C<*valuep> is valid, but C<*valuep> may have been assigned
+to during processing even though C<IS_NUMBER_IN_UV> is not set on return.
+If C<valuep> is C<NULL>, C<IS_NUMBER_IN_UV> will be set for the same cases as when
+C<valuep> is non-C<NULL>, but no actual assignment (or SEGV) will occur.
+
+C<IS_NUMBER_NOT_INT> will be set with C<IS_NUMBER_IN_UV> if trailing decimals were
+seen (in which case C<*valuep> gives the true value truncated to an integer), and
+C<IS_NUMBER_NEG> if the number is negative (in which case C<*valuep> holds the
+absolute value).  C<IS_NUMBER_IN_UV> is not set if e notation was used or the
  number is larger than a UV.
  
  C<flags> allows only C<PERL_SCAN_TRAILING>, which allows for trailing
@@ -829,7 +833,7 @@ C<IS_NUMBER_TRAILING> on the result.
  
  =for apidoc grok_number
  
-Identical to grok_number_flags() with flags set to zero.
+Identical to C<grok_number_flags()> with C<flags> set to zero.
  
  =cut
   */
@@ -1009,7 +1013,7 @@ Perl_grok_number_flags(pTHX_ const char *pv, STRLEN len, UV *valuep, U32 flags)
      s++;
    if (s >= send)
      return numtype;
-  if (len == 10 && memEQ(pv, "0 but true", 10)) {
+  if (memEQs(pv, len, "0 but true")) {
      if (valuep)
        *valuep = 0;
      return IS_NUMBER_IN_UV;
@@ -1018,7 +1022,7 @@ Perl_grok_number_flags(pTHX_ const char *pv, STRLEN len, UV *valuep, U32 flags)
    if ((s + 2 < send) && strchr("inqs#", toFOLD(*s))) {
        /* Really detect inf/nan. Start at d, not s, since the above
         * code might have already consumed the "1." or "1". */
-      int infnan = Perl_grok_infnan(aTHX_ &d, send);
+      const int infnan = Perl_grok_infnan(aTHX_ &d, send);
        if ((infnan & IS_NUMBER_INFINITY)) {
            return (numtype | infnan); /* Keep sign for infinity. */
        }
@@ -1085,7 +1089,7 @@ Perl_grok_atoUV(const char *pv, UV *valptr, const char** endptr)
                  /* This could be unrolled like in grok_number(), but
                   * the expected uses of this are not speed-needy, and
                   * unlikely to need full 64-bitness. */
-                U8 digit = *s++ - '0';
+                const U8 digit = *s++ - '0';
                  if (val < uv_max_div_10 ||
                      (val == uv_max_div_10 && digit <= uv_max_mod_10)) {
                      val = val * 10 + digit;
@@ -1138,7 +1142,7 @@ S_mulexp10(NV value, I32 exponent)
       * a hammer.  Therefore we need to catch potential overflows before
       * it's too late. */
  
-#if ((defined(VMS) && !defined(_IEEE_FP)) || defined(_UNICOS)) && defined(NV_MAX_10_EXP)
+#if ((defined(VMS) && !defined(_IEEE_FP)) || defined(_UNICOS) || defined(DOUBLE_IS_VAX_FLOAT)) && defined(NV_MAX_10_EXP)
      STMT_START {
         const NV exp_v = log10(value);
         if (exponent >= NV_MAX_10_EXP || exponent + exp_v >= NV_MAX_10_EXP)
@@ -1185,7 +1189,11 @@ S_mulexp10(NV value, I32 exponent)
             result *= power;
  #ifdef FP_OVERFLOWS_TO_ZERO
              if (result == 0)
+# ifdef NV_INF
                  return value < 0 ? -NV_INF : NV_INF;
+# else
+                return value < 0 ? -FLT_MAX : FLT_MAX;
+# endif
  #endif
             /* Floating point exceptions are supposed to be turned off,
              *  but if we're obviously done, don't risk another iteration.  
@@ -1201,21 +1209,26 @@ S_mulexp10(NV value, I32 exponent)
  NV
  Perl_my_atof(pTHX_ const char* s)
  {
+    /* 's' must be NUL terminated */
+
      NV x = 0.0;
+
+    PERL_ARGS_ASSERT_MY_ATOF;
+
  #ifdef USE_QUADMATH
+
      Perl_my_atof2(aTHX_ s, &x);
-    return x;
+
+#elif ! defined(USE_LOCALE_NUMERIC)
+
+    Perl_atof2(s, x);
+
  #else
-#  ifdef USE_LOCALE_NUMERIC
-    PERL_ARGS_ASSERT_MY_ATOF;
  
      {
          DECLARATION_FOR_LC_NUMERIC_MANIPULATION;
          STORE_LC_NUMERIC_SET_TO_NEEDED();
          if (PL_numeric_radix_sv && IN_LC(LC_NUMERIC)) {
-            const char *standard = NULL, *local = NULL;
-            bool use_standard_radix;
-
              /* Look through the string for the first thing that looks like a
               * decimal point: either the value in the current locale or the
               * standard fallback of '.'. The one which appears earliest in the
@@ -1223,10 +1236,11 @@ Perl_my_atof(pTHX_ const char* s)
               * that we have to determine this beforehand because on some
               * systems, Perl_atof2 is just a wrapper around the system's atof.
               * */
-            standard = strchr(s, '.');
-            local = strstr(s, SvPV_nolen(PL_numeric_radix_sv));
-
-            use_standard_radix = standard && (!local || standard < local);
+            const char * const standard_pos = strchr(s, '.');
+            const char * const local_pos
+                                  = strstr(s, SvPV_nolen(PL_numeric_radix_sv));
+            const bool use_standard_radix
+                    = standard_pos && (!local_pos || standard_pos < local_pos);
  
              if (use_standard_radix)
                  SET_NUMERIC_STANDARD();
@@ -1240,13 +1254,13 @@ Perl_my_atof(pTHX_ const char* s)
              Perl_atof2(s, x);
          RESTORE_LC_NUMERIC();
      }
-#  else
-    Perl_atof2(s, x);
-#  endif
+
  #endif
+
      return x;
  }
  
+#if defined(NV_INF) || defined(NV_NAN)
  
  #ifdef USING_MSVC6
  #  pragma warning(push)
@@ -1257,7 +1271,7 @@ S_my_atof_infnan(pTHX_ const char* s, bool negative, const char* send, NV* value
  {
      const char *p0 = negative ? s - 1 : s;
      const char *p = p0;
-    int infnan = grok_infnan(&p, send);
+    const int infnan = grok_infnan(&p, send);
      if (infnan && p != p0) {
          /* If we can generate inf/nan directly, let's do so. */
  #ifdef NV_INF
@@ -1276,8 +1290,6 @@ S_my_atof_infnan(pTHX_ const char* s, bool negative, const char* send, NV* value
          /* If still here, we didn't have either NV_INF or NV_NAN,
           * and can try falling back to native strtod/strtold.
           *
-         * (Though, are our NV_INF or NV_NAN ever not defined?)
-         *
           * The native interface might not recognize all the possible
           * inf/nan strings Perl recognizes.  What we can try
           * is to try faking the input.  We will try inf/-inf/nan
@@ -1286,36 +1298,44 @@ S_my_atof_infnan(pTHX_ const char* s, bool negative, const char* send, NV* value
              const char* fake = NULL;
              char* endp;
              NV nv;
+#ifdef NV_INF
              if ((infnan & IS_NUMBER_INFINITY)) {
                  fake = ((infnan & IS_NUMBER_NEG)) ? "-inf" : "inf";
              }
-            else if ((infnan & IS_NUMBER_NAN)) {
+#endif
+#ifdef NV_NAN
+            if ((infnan & IS_NUMBER_NAN)) {
                  fake = "nan";
              }
+#endif
              assert(fake);
              nv = Perl_strtod(fake, &endp);
              if (fake != endp) {
+#ifdef NV_INF
                  if ((infnan & IS_NUMBER_INFINITY)) {
-#ifdef Perl_isinf
+#  ifdef Perl_isinf
                      if (Perl_isinf(nv))
                          *value = nv;
-#else
+#  else
                      /* last resort, may generate SIGFPE */
                      *value = Perl_exp((NV)1e9);
                      if ((infnan & IS_NUMBER_NEG))
                          *value = -*value;
-#endif
+#  endif
                      return (char*)p; /* p, not endp */
                  }
-                else if ((infnan & IS_NUMBER_NAN)) {
-#ifdef Perl_isnan
+#endif
+#ifdef NV_NAN
+                if ((infnan & IS_NUMBER_NAN)) {
+#  ifdef Perl_isnan
                      if (Perl_isnan(nv))
                          *value = nv;
-#else
+#  else
                      /* last resort, may generate SIGFPE */
                      *value = Perl_log((NV)-1.0);
-#endif
+#  endif
                      return (char*)p; /* p, not endp */
+#endif
                  }
              }
          }
@@ -1327,6 +1347,8 @@ S_my_atof_infnan(pTHX_ const char* s, bool negative, const char* send, NV* value
  #  pragma warning(pop)
  #endif
  
+#endif /* if defined(NV_INF) || defined(NV_NAN) */
+
  char*
  Perl_my_atof2(pTHX_ const char* orig, NV* value)
  {
@@ -1409,11 +1431,13 @@ Perl_my_atof2(pTHX_ const char* orig, NV* value)
  /* the max number we can accumulate in a UV, and still safely do 10*N+9 */
  #define MAX_ACCUMULATE ( (UV) ((UV_MAX - 9)/10))
  
+#if defined(NV_INF) || defined(NV_NAN)
      {
-        const char* endp;
+        char* endp;
          if ((endp = S_my_atof_infnan(aTHX_ s, negative, send, value)))
-            return (char*)endp;
+            return endp;
      }
+#endif
  
      /* we accumulate digits into an integer; when this becomes too
       * large, we add the total to NV and start again */
@@ -1470,9 +1494,9 @@ Perl_my_atof2(pTHX_ const char* orig, NV* value)
         else if (!seen_dp && GROK_NUMERIC_RADIX(&s, send)) {
             seen_dp = 1;
             if (sig_digits > MAX_SIG_DIGITS) {
-               do {
+               while (isDIGIT(*s)) {
                     ++s;
-               } while (isDIGIT(*s));
+               }
                 break;
             }
         }
@@ -1525,9 +1549,9 @@ Perl_my_atof2(pTHX_ const char* orig, NV* value)
  /*
  =for apidoc isinfnan
  
-Perl_isinfnan() is utility function that returns true if the NV
-argument is either an infinity or a NaN, false otherwise.  To test
-in more detail, use Perl_isinf() and Perl_isnan().
+C<Perl_isinfnan()> is utility function that returns true if the NV
+argument is either an infinity or a C<NaN>, false otherwise.  To test
+in more detail, use C<Perl_isinf()> and C<Perl_isnan()>.
  
  This is also the logical inverse of Perl_isfinite().
  
@@ -1536,6 +1560,7 @@ This is also the logical inverse of Perl_isfinite().
  bool
  Perl_isinfnan(NV nv)
  {
+  PERL_UNUSED_ARG(nv);
  #ifdef Perl_isinf
      if (Perl_isinf(nv))
          return TRUE;
@@ -1550,9 +1575,9 @@ Perl_isinfnan(NV nv)
  /*
  =for apidoc
  
-Checks whether the argument would be either an infinity or NaN when used
+Checks whether the argument would be either an infinity or C<NaN> when used
  as a number, but is careful not to trigger non-numeric or uninitialized
-warnings.  it assumes the caller has done SvGETMAGIC(sv) already.
+warnings.  it assumes the caller has done C<SvGETMAGIC(sv)> already.
  
  =cut
  */
@@ -1610,19 +1635,19 @@ Perl_my_frexpl(long double x, int *e) {
  Return a non-zero integer if the sign bit on an NV is set, and 0 if
  it is not.  
  
-If Configure detects this system has a signbit() that will work with
-our NVs, then we just use it via the #define in perl.h.  Otherwise,
+If F<Configure> detects this system has a C<signbit()> that will work with
+our NVs, then we just use it via the C<#define> in F<perl.h>.  Otherwise,
  fall back on this implementation.  The main use of this function
-is catching -0.0.
+is catching C<-0.0>.
  
-Configure notes:  This function is called 'Perl_signbit' instead of a
-plain 'signbit' because it is easy to imagine a system having a signbit()
+C<Configure> notes:  This function is called C<'Perl_signbit'> instead of a
+plain C<'signbit'> because it is easy to imagine a system having a C<signbit()>
  function or macro that doesn't happen to work with our particular choice
-of NVs.  We shouldn't just re-#define signbit as Perl_signbit and expect
+of NVs.  We shouldn't just re-C<#define> C<signbit> as C<Perl_signbit> and expect
  the standard system headers to be happy.  Also, this is a no-context
-function (no pTHX_) because Perl_signbit() is usually re-#defined in
-perl.h as a simple macro call to the system's signbit().
-Users should just always call Perl_signbit().
+function (no C<pTHX_>) because C<Perl_signbit()> is usually re-C<#defined> in
+F<perl.h> as a simple macro call to the system's C<signbit()>.
+Users should just always call C<Perl_signbit()>.
  
  =cut
  */
@@ -1630,10 +1655,22 @@ Users should just always call Perl_signbit().
  int
  Perl_signbit(NV x) {
  #  ifdef Perl_fp_class_nzero
-    if (x == 0)
-        return Perl_fp_class_nzero(x);
-#  endif
+    return Perl_fp_class_nzero(x);
+    /* Try finding the high byte, and assume it's highest bit
+     * is the sign.  This assumption is probably wrong somewhere. */
+#  elif defined(USE_LONG_DOUBLE) && LONG_DOUBLEKIND == LONG_DOUBLE_IS_X86_80_BIT_LITTLE_ENDIAN
+    return (((unsigned char *)&x)[9] & 0x80);
+#  elif defined(NV_LITTLE_ENDIAN)
+    /* Note that NVSIZE is sizeof(NV), which would make the below be
+     * wrong if the end bytes are unused, which happens with the x86
+     * 80-bit long doubles, which is why take care of that above. */
+    return (((unsigned char *)&x)[NVSIZE - 1] & 0x80);
+#  elif defined(NV_BIG_ENDIAN)
+    return (((unsigned char *)&x)[0] & 0x80);
+#  else
+    /* This last resort fallback is wrong for the negative zero. */
      return (x < 0.0) ? 1 : 0;
+#  endif
  }
  #endif