PERL_GLOBAL_STRUCT_PRIVATE: fix scope.c:arg_counts

[perl5.git] / utf8.h
diff --git a/utf8.h b/utf8.h

index 2ec14fc..affa2d6 100644 (file)
--- a/utf8.h
+++ b/utf8.h
@@ -76,10 +76,15 @@ the string is invariant.
                                  utf8n_to_uvchr_error(s, len, lenp, flags, 0)
  
  #define to_uni_fold(c, p, lenp) _to_uni_fold_flags(c, p, lenp, FOLD_FLAGS_FULL)
-#define to_utf8_fold(c, p, lenp) _to_utf8_fold_flags(c, p, lenp, FOLD_FLAGS_FULL)
-#define to_utf8_lower(a,b,c) _to_utf8_lower_flags(a,b,c,0)
-#define to_utf8_upper(a,b,c) _to_utf8_upper_flags(a,b,c,0)
-#define to_utf8_title(a,b,c) _to_utf8_title_flags(a,b,c,0)
+
+#define to_utf8_fold(s, r, lenr)                                                \
+    _to_utf8_fold_flags (s, NULL, r, lenr, FOLD_FLAGS_FULL, __FILE__, __LINE__)
+#define to_utf8_lower(s, r, lenr)                                               \
+                  _to_utf8_lower_flags(s, NULL, r ,lenr, 0, __FILE__, __LINE__)
+#define to_utf8_upper(s, r, lenr)                                               \
+                  _to_utf8_upper_flags(s, NULL, r, lenr, 0, __FILE__, __LINE__)
+#define to_utf8_title(s, r, lenr)                                               \
+                  _to_utf8_title_flags(s, NULL, r, lenr ,0, __FILE__, __LINE__)
  
  #define foldEQ_utf8(s1, pe1, l1, u1, s2, pe2, l2, u2) \
                     foldEQ_utf8_flags(s1, pe1, l1, u1, s2, pe2, l2, u2, 0)
@@ -702,7 +707,7 @@ with a ptr argument.
  /* A Unicode character can fold to up to 3 characters */
  #define UTF8_MAX_FOLD_CHAR_EXPAND 3
  
-#define IN_BYTES (CopHINTS_get(PL_curcop) & HINT_BYTES)
+#define IN_BYTES UNLIKELY(CopHINTS_get(PL_curcop) & HINT_BYTES)
  
  /*
  
@@ -721,12 +726,12 @@ case any call to string overloading updates the internal UTF-8 encoding flag.
   * Is so within 'feature unicode_strings' or 'locale :not_characters', and not
   * within 'use bytes'.  UTF-8 locales are not tested for here, but perhaps
   * could be */
-#define IN_UNI_8_BIT                                                             \
-           (((CopHINTS_get(PL_curcop) & (HINT_UNI_8_BIT))                       \
-               || (CopHINTS_get(PL_curcop) & HINT_LOCALE_PARTIAL                 \
-                   /* -1 below is for :not_characters */                         \
-                   && _is_in_locale_category(FALSE, -1)))                        \
-              && ! IN_BYTES)
+#define IN_UNI_8_BIT                                                    \
+           ((    (      (CopHINTS_get(PL_curcop) & HINT_UNI_8_BIT))    \
+                   || (   CopHINTS_get(PL_curcop) & HINT_LOCALE_PARTIAL \
+                            /* -1 below is for :not_characters */       \
+                       && _is_in_locale_category(FALSE, -1)))           \
+              && (! IN_BYTES))
  
  
  #define UTF8_ALLOW_EMPTY               0x0001  /* Allow a zero length string */
@@ -779,6 +784,7 @@ case any call to string overloading updates the internal UTF-8 encoding flag.
  #define UTF8_WARN_FE_FF                 UTF8_WARN_ABOVE_31_BIT
  
  #define UTF8_CHECK_ONLY                        0x10000
+#define _UTF8_NO_CONFIDENCE_IN_CURLEN   0x20000  /* Internal core use only */
  
  /* For backwards source compatibility.  They do nothing, as the default now
   * includes what they used to mean.  The first one's meaning was to allow the
@@ -796,10 +802,10 @@ case any call to string overloading updates the internal UTF-8 encoding flag.
  #define UTF8_WARN_ILLEGAL_INTERCHANGE \
                            (UTF8_WARN_ILLEGAL_C9_INTERCHANGE|UTF8_WARN_NONCHAR)
  
-/* This is used typically for code that is willing to accept inputs of
- * illformed UTF-8 sequences, for whatever reason.  However, all such sequences
- * evaluate to the REPLACEMENT CHARACTER unless other flags overriding this are
- * also present. */
+/* This is typically used for code that processes UTF-8 input and doesn't want
+ * to have to deal with any malformations that might be present.  Each such
+ * malformation is safely replaced by the REPLACEMENT CHARACTER, unless other
+ * flags overriding this are also present. */
  #define UTF8_ALLOW_ANY ( UTF8_ALLOW_CONTINUATION                                \
                          |UTF8_ALLOW_NON_CONTINUATION                            \
                          |UTF8_ALLOW_SHORT                                       \