ICU-59117.0.1.tar.gz

[apple/icu.git] / icuSources / common / ucase.cpp
diff --git a/icuSources/common/ucase.cpp b/icuSources/common/ucase.cpp

index b04c2d40cf0c45a1d669eda6c7ca8c1cd3f5fde1..706d7289691293147407418c2ed5f27a6da93175 100644 (file)
--- a/icuSources/common/ucase.cpp
+++ b/icuSources/common/ucase.cpp
@@ -1,3 +1,5 @@
+// © 2016 and later: Unicode, Inc. and others.
+// License & terms of use: http://www.unicode.org/copyright.html
  /*
  *******************************************************************************
  *
@@ -6,7 +8,7 @@
  *
  *******************************************************************************
  *   file name:  ucase.cpp
-*   encoding:   US-ASCII
+*   encoding:   UTF-8
  *   tab size:   8 (not used)
  *   indentation:4
  *
@@ -44,13 +46,6 @@ struct UCaseProps {
  #define INCLUDED_FROM_UCASE_CPP
  #include "ucase_props_data.h"
  
-/* UCaseProps singleton ----------------------------------------------------- */
-
-U_CAPI const UCaseProps * U_EXPORT2
-ucase_getSingleton() {
-    return &ucase_props_singleton;
-}
-
  /* set of property starts for UnicodeSet ------------------------------------ */
  
  static UBool U_CALLCONV
@@ -62,13 +57,13 @@ _enumPropertyStartsRange(const void *context, UChar32 start, UChar32 /*end*/, ui
  }
  
  U_CFUNC void U_EXPORT2
-ucase_addPropertyStarts(const UCaseProps *csp, const USetAdder *sa, UErrorCode *pErrorCode) {
+ucase_addPropertyStarts(const USetAdder *sa, UErrorCode *pErrorCode) {
      if(U_FAILURE(*pErrorCode)) {
          return;
      }
  
      /* add the start code point of each same-value range of the trie */
-    utrie2_enum(&csp->trie, NULL, _enumPropertyStartsRange, sa);
+    utrie2_enum(&ucase_props_singleton.trie, NULL, _enumPropertyStartsRange, sa);
  
      /* add code points with hardcoded properties, plus the ones following them */
  
@@ -131,14 +126,14 @@ static const uint8_t flagsOffset[256]={
  /* simple case mappings ----------------------------------------------------- */
  
  U_CAPI UChar32 U_EXPORT2
-ucase_tolower(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_tolower(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)>=UCASE_UPPER) {
              c+=UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props);
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props);
          uint16_t excWord=*pe++;
          if(HAS_SLOT(excWord, UCASE_EXC_LOWER)) {
              GET_SLOT_VALUE(excWord, UCASE_EXC_LOWER, pe, c);
@@ -148,14 +143,14 @@ ucase_tolower(const UCaseProps *csp, UChar32 c) {
  }
  
  U_CAPI UChar32 U_EXPORT2
-ucase_toupper(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_toupper(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)==UCASE_LOWER) {
              c+=UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props);
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props);
          uint16_t excWord=*pe++;
          if(HAS_SLOT(excWord, UCASE_EXC_UPPER)) {
              GET_SLOT_VALUE(excWord, UCASE_EXC_UPPER, pe, c);
@@ -165,14 +160,14 @@ ucase_toupper(const UCaseProps *csp, UChar32 c) {
  }
  
  U_CAPI UChar32 U_EXPORT2
-ucase_totitle(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_totitle(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)==UCASE_LOWER) {
              c+=UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props);
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props);
          uint16_t excWord=*pe++;
          int32_t idx;
          if(HAS_SLOT(excWord, UCASE_EXC_TITLE)) {
@@ -196,7 +191,7 @@ static const UChar iDotTilde[3] = { 0x69, 0x307, 0x303 };
  
  
  U_CFUNC void U_EXPORT2
-ucase_addCaseClosure(const UCaseProps *csp, UChar32 c, const USetAdder *sa) {
+ucase_addCaseClosure(UChar32 c, const USetAdder *sa) {
      uint16_t props;
  
      /*
@@ -227,7 +222,7 @@ ucase_addCaseClosure(const UCaseProps *csp, UChar32 c, const USetAdder *sa) {
          break;
      }
  
-    props=UTRIE2_GET16(&csp->trie, c);
+    props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)!=UCASE_NONE) {
              /* add the one simple case mapping, no matter what type it is */
@@ -241,7 +236,7 @@ ucase_addCaseClosure(const UCaseProps *csp, UChar32 c, const USetAdder *sa) {
           * c has exceptions, so there may be multiple simple and/or
           * full case mappings. Add them all.
           */
-        const uint16_t *pe0, *pe=GET_EXCEPTIONS(csp, props);
+        const uint16_t *pe0, *pe=GET_EXCEPTIONS(&ucase_props_singleton, props);
          const UChar *closure;
          uint16_t excWord=*pe++;
          int32_t idx, closureLength, fullLength, length;
@@ -336,10 +331,10 @@ strcmpMax(const UChar *s, int32_t length, const UChar *t, int32_t max) {
  }
  
  U_CFUNC UBool U_EXPORT2
-ucase_addStringCaseClosure(const UCaseProps *csp, const UChar *s, int32_t length, const USetAdder *sa) {
+ucase_addStringCaseClosure(const UChar *s, int32_t length, const USetAdder *sa) {
      int32_t i, start, limit, result, unfoldRows, unfoldRowWidth, unfoldStringWidth;
  
-    if(csp->unfold==NULL || s==NULL) {
+    if(ucase_props_singleton.unfold==NULL || s==NULL) {
          return FALSE; /* no reverse case folding data, or no string */
      }
      if(length<=1) {
@@ -353,7 +348,7 @@ ucase_addStringCaseClosure(const UCaseProps *csp, const UChar *s, int32_t length
          return FALSE;
      }
  
-    const uint16_t *unfold=csp->unfold;
+    const uint16_t *unfold=ucase_props_singleton.unfold;
      unfoldRows=unfold[UCASE_UNFOLD_ROWS];
      unfoldRowWidth=unfold[UCASE_UNFOLD_ROW_WIDTH];
      unfoldStringWidth=unfold[UCASE_UNFOLD_STRING_WIDTH];
@@ -379,7 +374,7 @@ ucase_addStringCaseClosure(const UCaseProps *csp, const UChar *s, int32_t length
              for(i=unfoldStringWidth; i<unfoldRowWidth && p[i]!=0;) {
                  U16_NEXT_UNSAFE(p, i, c);
                  sa->add(sa->set, c);
-                ucase_addCaseClosure(csp, c, sa);
+                ucase_addCaseClosure(c, sa);
              }
              return TRUE;
          } else if(result<0) {
@@ -428,38 +423,38 @@ U_NAMESPACE_END
  
  /** @return UCASE_NONE, UCASE_LOWER, UCASE_UPPER, UCASE_TITLE */
  U_CAPI int32_t U_EXPORT2
-ucase_getType(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_getType(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      return UCASE_GET_TYPE(props);
  }
  
  /** @return same as ucase_getType() and set bit 2 if c is case-ignorable */
  U_CAPI int32_t U_EXPORT2
-ucase_getTypeOrIgnorable(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_getTypeOrIgnorable(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      return UCASE_GET_TYPE_AND_IGNORABLE(props);
  }
  
  /** @return UCASE_NO_DOT, UCASE_SOFT_DOTTED, UCASE_ABOVE, UCASE_OTHER_ACCENT */
  static inline int32_t
-getDotType(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+getDotType(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          return props&UCASE_DOT_MASK;
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props);
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props);
          return (*pe>>UCASE_EXC_DOT_SHIFT)&UCASE_DOT_MASK;
      }
  }
  
  U_CAPI UBool U_EXPORT2
-ucase_isSoftDotted(const UCaseProps *csp, UChar32 c) {
-    return (UBool)(getDotType(csp, c)==UCASE_SOFT_DOTTED);
+ucase_isSoftDotted(UChar32 c) {
+    return (UBool)(getDotType(c)==UCASE_SOFT_DOTTED);
  }
  
  U_CAPI UBool U_EXPORT2
-ucase_isCaseSensitive(const UCaseProps *csp, UChar32 c) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_isCaseSensitive(UChar32 c) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      return (UBool)((props&UCASE_SENSITIVE)!=0);
  }
  
@@ -543,12 +538,10 @@ ucase_isCaseSensitive(const UCaseProps *csp, UChar32 c) {
   *     zero or more case-ignorable characters.
   */
  
-#define is_a(c) ((c)=='a' || (c)=='A')
  #define is_d(c) ((c)=='d' || (c)=='D')
  #define is_e(c) ((c)=='e' || (c)=='E')
  #define is_i(c) ((c)=='i' || (c)=='I')
  #define is_l(c) ((c)=='l' || (c)=='L')
-#define is_n(c) ((c)=='n' || (c)=='N')
  #define is_r(c) ((c)=='r' || (c)=='R')
  #define is_t(c) ((c)=='t' || (c)=='T')
  #define is_u(c) ((c)=='u' || (c)=='U')
@@ -563,16 +556,7 @@ ucase_isCaseSensitive(const UCaseProps *csp, UChar32 c) {
   * Accepts both 2- and 3-letter codes and accepts case variants.
   */
  U_CFUNC int32_t
-ucase_getCaseLocale(const char *locale, int32_t *locCache) {
-    int32_t result;
-    char c;
-
-    if(locCache!=NULL && (result=*locCache)!=UCASE_LOC_UNKNOWN) {
-        return result;
-    }
-
-    result=UCASE_LOC_ROOT;
-
+ucase_getCaseLocale(const char *locale) {
      /*
       * This function used to use uloc_getLanguage(), but the current code
       * removes the dependency of this low-level code on uloc implementation code
@@ -582,61 +566,149 @@ ucase_getCaseLocale(const char *locale, int32_t *locCache) {
       * Because this code does not want to depend on uloc, the caller must
       * pass in a non-NULL locale, i.e., may need to call uloc_getDefault().
       */
-    c=*locale++;
-    if(is_t(c)) {
-        /* tr or tur? */
+    char c=*locale++;
+    // Fastpath for English "en" which is often used for default (=root locale) case mappings,
+    // and for Chinese "zh": Very common but no special case mapping behavior.
+    // Then check lowercase vs. uppercase to reduce the number of comparisons
+    // for other locales without special behavior.
+    if(c=='e') {
+        /* el or ell? */
          c=*locale++;
-        if(is_u(c)) {
+        if(is_l(c)) {
              c=*locale++;
-        }
-        if(is_r(c)) {
-            c=*locale;
+            if(is_l(c)) {
+                c=*locale;
+            }
              if(is_sep(c)) {
-                result=UCASE_LOC_TURKISH;
+                return UCASE_LOC_GREEK;
              }
          }
-    } else if(is_a(c)) {
-        /* az or aze? */
-        c=*locale++;
-        if(is_z(c)) {
+        // en, es, ... -> root
+    } else if(c=='z') {
+        return UCASE_LOC_ROOT;
+#if U_CHARSET_FAMILY==U_ASCII_FAMILY
+    } else if(c>='a') {  // ASCII a-z = 0x61..0x7a, after A-Z
+#elif U_CHARSET_FAMILY==U_EBCDIC_FAMILY
+    } else if(c<='z') {  // EBCDIC a-z = 0x81..0xa9 with two gaps, before A-Z
+#else
+#   error Unknown charset family!
+#endif
+        // lowercase c
+        if(c=='t') {
+            /* tr or tur? */
              c=*locale++;
-            if(is_e(c)) {
+            if(is_u(c)) {
+                c=*locale++;
+            }
+            if(is_r(c)) {
                  c=*locale;
+                if(is_sep(c)) {
+                    return UCASE_LOC_TURKISH;
+                }
              }
-            if(is_sep(c)) {
-                result=UCASE_LOC_TURKISH;
+        } else if(c=='a') {
+            /* az or aze? */
+            c=*locale++;
+            if(is_z(c)) {
+                c=*locale++;
+                if(is_e(c)) {
+                    c=*locale;
+                }
+                if(is_sep(c)) {
+                    return UCASE_LOC_TURKISH;
+                }
              }
-        }
-    } else if(is_l(c)) {
-        /* lt or lit? */
-        c=*locale++;
-        if(is_i(c)) {
+        } else if(c=='l') {
+            /* lt or lit? */
              c=*locale++;
-        }
-        if(is_t(c)) {
-            c=*locale;
-            if(is_sep(c)) {
-                result=UCASE_LOC_LITHUANIAN;
+            if(is_i(c)) {
+                c=*locale++;
+            }
+            if(is_t(c)) {
+                c=*locale;
+                if(is_sep(c)) {
+                    return UCASE_LOC_LITHUANIAN;
+                }
+            }
+        } else if(c=='n') {
+            /* nl or nld? */
+            c=*locale++;
+            if(is_l(c)) {
+                c=*locale++;
+                if(is_d(c)) {
+                    c=*locale;
+                }
+                if(is_sep(c)) {
+                    return UCASE_LOC_DUTCH;
+                }
              }
          }
-    } else if(is_n(c)) {
-        /* nl or nld? */
-        c=*locale++;
-        if(is_l(c)) {
+    } else {
+        // uppercase c
+        // Same code as for lowercase c but also check for 'E'.
+        if(c=='T') {
+            /* tr or tur? */
              c=*locale++;
-            if(is_d(c)) {
+            if(is_u(c)) {
+                c=*locale++;
+            }
+            if(is_r(c)) {
                  c=*locale;
+                if(is_sep(c)) {
+                    return UCASE_LOC_TURKISH;
+                }
              }
-            if(is_sep(c)) {
-                result=UCASE_LOC_DUTCH;
+        } else if(c=='A') {
+            /* az or aze? */
+            c=*locale++;
+            if(is_z(c)) {
+                c=*locale++;
+                if(is_e(c)) {
+                    c=*locale;
+                }
+                if(is_sep(c)) {
+                    return UCASE_LOC_TURKISH;
+                }
+            }
+        } else if(c=='L') {
+            /* lt or lit? */
+            c=*locale++;
+            if(is_i(c)) {
+                c=*locale++;
+            }
+            if(is_t(c)) {
+                c=*locale;
+                if(is_sep(c)) {
+                    return UCASE_LOC_LITHUANIAN;
+                }
+            }
+        } else if(c=='E') {
+            /* el or ell? */
+            c=*locale++;
+            if(is_l(c)) {
+                c=*locale++;
+                if(is_l(c)) {
+                    c=*locale;
+                }
+                if(is_sep(c)) {
+                    return UCASE_LOC_GREEK;
+                }
+            }
+        } else if(c=='N') {
+            /* nl or nld? */
+            c=*locale++;
+            if(is_l(c)) {
+                c=*locale++;
+                if(is_d(c)) {
+                    c=*locale;
+                }
+                if(is_sep(c)) {
+                    return UCASE_LOC_DUTCH;
+                }
              }
          }
      }
-
-    if(locCache!=NULL) {
-        *locCache=result;
-    }
-    return result;
+    return UCASE_LOC_ROOT;
  }
  
  /*
@@ -648,7 +720,7 @@ ucase_getCaseLocale(const char *locale, int32_t *locCache) {
   * it is also cased or not.
   */
  static UBool
-isFollowedByCasedLetter(const UCaseProps *csp, UCaseContextIterator *iter, void *context, int8_t dir) {
+isFollowedByCasedLetter(UCaseContextIterator *iter, void *context, int8_t dir) {
      UChar32 c;
  
      if(iter==NULL) {
@@ -656,7 +728,7 @@ isFollowedByCasedLetter(const UCaseProps *csp, UCaseContextIterator *iter, void
      }
  
      for(/* dir!=0 sets direction */; (c=iter(context, dir))>=0; dir=0) {
-        int32_t type=ucase_getTypeOrIgnorable(csp, c);
+        int32_t type=ucase_getTypeOrIgnorable(c);
          if(type&4) {
              /* case-ignorable, continue with the loop */
          } else if(type!=UCASE_NONE) {
@@ -671,7 +743,7 @@ isFollowedByCasedLetter(const UCaseProps *csp, UCaseContextIterator *iter, void
  
  /* Is preceded by Soft_Dotted character with no intervening cc=230 ? */
  static UBool
-isPrecededBySoftDotted(const UCaseProps *csp, UCaseContextIterator *iter, void *context) {
+isPrecededBySoftDotted(UCaseContextIterator *iter, void *context) {
      UChar32 c;
      int32_t dotType;
      int8_t dir;
@@ -681,7 +753,7 @@ isPrecededBySoftDotted(const UCaseProps *csp, UCaseContextIterator *iter, void *
      }
  
      for(dir=-1; (c=iter(context, dir))>=0; dir=0) {
-        dotType=getDotType(csp, c);
+        dotType=getDotType(c);
          if(dotType==UCASE_SOFT_DOTTED) {
              return TRUE; /* preceded by TYPE_i */
          } else if(dotType!=UCASE_OTHER_ACCENT) {
@@ -728,7 +800,7 @@ isPrecededBySoftDotted(const UCaseProps *csp, UCaseContextIterator *iter, void *
  
  /* Is preceded by base character 'I' with no intervening cc=230 ? */
  static UBool
-isPrecededBy_I(const UCaseProps *csp, UCaseContextIterator *iter, void *context) {
+isPrecededBy_I(UCaseContextIterator *iter, void *context) {
      UChar32 c;
      int32_t dotType;
      int8_t dir;
@@ -741,7 +813,7 @@ isPrecededBy_I(const UCaseProps *csp, UCaseContextIterator *iter, void *context)
          if(c==0x49) {
              return TRUE; /* preceded by I */
          }
-        dotType=getDotType(csp, c);
+        dotType=getDotType(c);
          if(dotType!=UCASE_OTHER_ACCENT) {
              return FALSE; /* preceded by different base character (not I), or intervening cc==230 */
          }
@@ -752,7 +824,7 @@ isPrecededBy_I(const UCaseProps *csp, UCaseContextIterator *iter, void *context)
  
  /* Is followed by one or more cc==230 ? */
  static UBool
-isFollowedByMoreAbove(const UCaseProps *csp, UCaseContextIterator *iter, void *context) {
+isFollowedByMoreAbove(UCaseContextIterator *iter, void *context) {
      UChar32 c;
      int32_t dotType;
      int8_t dir;
@@ -762,7 +834,7 @@ isFollowedByMoreAbove(const UCaseProps *csp, UCaseContextIterator *iter, void *c
      }
  
      for(dir=1; (c=iter(context, dir))>=0; dir=0) {
-        dotType=getDotType(csp, c);
+        dotType=getDotType(c);
          if(dotType==UCASE_ABOVE) {
              return TRUE; /* at least one cc==230 following */
          } else if(dotType!=UCASE_OTHER_ACCENT) {
@@ -775,7 +847,7 @@ isFollowedByMoreAbove(const UCaseProps *csp, UCaseContextIterator *iter, void *c
  
  /* Is followed by a dot above (without cc==230 in between) ? */
  static UBool
-isFollowedByDotAbove(const UCaseProps *csp, UCaseContextIterator *iter, void *context) {
+isFollowedByDotAbove(UCaseContextIterator *iter, void *context) {
      UChar32 c;
      int32_t dotType;
      int8_t dir;
@@ -788,7 +860,7 @@ isFollowedByDotAbove(const UCaseProps *csp, UCaseContextIterator *iter, void *co
          if(c==0x307) {
              return TRUE;
          }
-        dotType=getDotType(csp, c);
+        dotType=getDotType(c);
          if(dotType!=UCASE_OTHER_ACCENT) {
              return FALSE; /* next base character or cc==230 in between */
          }
@@ -798,19 +870,20 @@ isFollowedByDotAbove(const UCaseProps *csp, UCaseContextIterator *iter, void *co
  }
  
  U_CAPI int32_t U_EXPORT2
-ucase_toFullLower(const UCaseProps *csp, UChar32 c,
+ucase_toFullLower(UChar32 c,
                    UCaseContextIterator *iter, void *context,
                    const UChar **pString,
-                  const char *locale, int32_t *locCache)
-{
+                  int32_t loc) {
+    // The sign of the result has meaning, input must be non-negative so that it can be returned as is.
+    U_ASSERT(c >= 0);
      UChar32 result=c;
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)>=UCASE_UPPER) {
              result=c+UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props), *pe2;
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props), *pe2;
          uint16_t excWord=*pe++;
          int32_t full;
  
@@ -818,7 +891,6 @@ ucase_toFullLower(const UCaseProps *csp, UChar32 c,
  
          if(excWord&UCASE_EXC_CONDITIONAL_SPECIAL) {
              /* use hardcoded conditions and mappings */
-            int32_t loc=ucase_getCaseLocale(locale, locCache);
  
              /*
               * Test for conditional mappings first
@@ -829,7 +901,7 @@ ucase_toFullLower(const UCaseProps *csp, UChar32 c,
              if( loc==UCASE_LOC_LITHUANIAN &&
                      /* base characters, find accents above */
                      (((c==0x49 || c==0x4a || c==0x12e) &&
-                        isFollowedByMoreAbove(csp, iter, context)) ||
+                        isFollowedByMoreAbove(iter, context)) ||
                      /* precomposed with accent above, no need to find one */
                      (c==0xcc || c==0xcd || c==0x128))
              ) {
@@ -881,7 +953,7 @@ ucase_toFullLower(const UCaseProps *csp, UChar32 c,
                      0130; 0069; 0130; 0130; az # LATIN CAPITAL LETTER I WITH DOT ABOVE
                   */
                  return 0x69;
-            } else if(loc==UCASE_LOC_TURKISH && c==0x307 && isPrecededBy_I(csp, iter, context)) {
+            } else if(loc==UCASE_LOC_TURKISH && c==0x307 && isPrecededBy_I(iter, context)) {
                  /*
                      # When lowercasing, remove dot_above in the sequence I + dot_above, which will turn into i.
                      # This matches the behavior of the canonically equivalent I-dot_above
@@ -890,7 +962,7 @@ ucase_toFullLower(const UCaseProps *csp, UChar32 c,
                      0307; ; 0307; 0307; az After_I; # COMBINING DOT ABOVE
                   */
                  return 0; /* remove the dot (continue without output) */
-            } else if(loc==UCASE_LOC_TURKISH && c==0x49 && !isFollowedByDotAbove(csp, iter, context)) {
+            } else if(loc==UCASE_LOC_TURKISH && c==0x49 && !isFollowedByDotAbove(iter, context)) {
                  /*
                      # When lowercasing, unless an I is before a dot_above, it turns into a dotless i.
  
@@ -907,8 +979,8 @@ ucase_toFullLower(const UCaseProps *csp, UChar32 c,
                  *pString=iDot;
                  return 2;
              } else if(  c==0x3a3 &&
-                        !isFollowedByCasedLetter(csp, iter, context, 1) &&
-                        isFollowedByCasedLetter(csp, iter, context, -1) /* -1=preceded */
+                        !isFollowedByCasedLetter(iter, context, 1) &&
+                        isFollowedByCasedLetter(iter, context, -1) /* -1=preceded */
              ) {
                  /* greek capital sigma maps depending on surrounding cased letters (see SpecialCasing.txt) */
                  /*
@@ -942,19 +1014,21 @@ ucase_toFullLower(const UCaseProps *csp, UChar32 c,
  
  /* internal */
  static int32_t
-toUpperOrTitle(const UCaseProps *csp, UChar32 c,
+toUpperOrTitle(UChar32 c,
                 UCaseContextIterator *iter, void *context,
                 const UChar **pString,
-               const char *locale, int32_t *locCache,
+               int32_t loc,
                 UBool upperNotTitle) {
+    // The sign of the result has meaning, input must be non-negative so that it can be returned as is.
+    U_ASSERT(c >= 0);
      UChar32 result=c;
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)==UCASE_LOWER) {
              result=c+UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props), *pe2;
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props), *pe2;
          uint16_t excWord=*pe++;
          int32_t full, idx;
  
@@ -962,8 +1036,6 @@ toUpperOrTitle(const UCaseProps *csp, UChar32 c,
  
          if(excWord&UCASE_EXC_CONDITIONAL_SPECIAL) {
              /* use hardcoded conditions and mappings */
-            int32_t loc=ucase_getCaseLocale(locale, locCache);
-
              if(loc==UCASE_LOC_TURKISH && c==0x69) {
                  /*
                      # Turkish and Azeri
@@ -977,7 +1049,7 @@ toUpperOrTitle(const UCaseProps *csp, UChar32 c,
                      0069; 0069; 0130; 0130; az; # LATIN SMALL LETTER I
                  */
                  return 0x130;
-            } else if(loc==UCASE_LOC_LITHUANIAN && c==0x307 && isPrecededBySoftDotted(csp, iter, context)) {
+            } else if(loc==UCASE_LOC_LITHUANIAN && c==0x307 && isPrecededBySoftDotted(iter, context)) {
                  /*
                      # Lithuanian
  
@@ -1035,19 +1107,19 @@ toUpperOrTitle(const UCaseProps *csp, UChar32 c,
  }
  
  U_CAPI int32_t U_EXPORT2
-ucase_toFullUpper(const UCaseProps *csp, UChar32 c,
+ucase_toFullUpper(UChar32 c,
                    UCaseContextIterator *iter, void *context,
                    const UChar **pString,
-                  const char *locale, int32_t *locCache) {
-    return toUpperOrTitle(csp, c, iter, context, pString, locale, locCache, TRUE);
+                  int32_t caseLocale) {
+    return toUpperOrTitle(c, iter, context, pString, caseLocale, TRUE);
  }
  
  U_CAPI int32_t U_EXPORT2
-ucase_toFullTitle(const UCaseProps *csp, UChar32 c,
+ucase_toFullTitle(UChar32 c,
                    UCaseContextIterator *iter, void *context,
                    const UChar **pString,
-                  const char *locale, int32_t *locCache) {
-    return toUpperOrTitle(csp, c, iter, context, pString, locale, locCache, FALSE);
+                  int32_t caseLocale) {
+    return toUpperOrTitle(c, iter, context, pString, caseLocale, FALSE);
  }
  
  /* case folding ------------------------------------------------------------- */
@@ -1093,14 +1165,14 @@ ucase_toFullTitle(const UCaseProps *csp, UChar32 c,
  
  /* return the simple case folding mapping for c */
  U_CAPI UChar32 U_EXPORT2
-ucase_fold(const UCaseProps *csp, UChar32 c, uint32_t options) {
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+ucase_fold(UChar32 c, uint32_t options) {
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)>=UCASE_UPPER) {
              c+=UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props);
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props);
          uint16_t excWord=*pe++;
          int32_t idx;
          if(excWord&UCASE_EXC_CONDITIONAL_FOLD) {
@@ -1153,18 +1225,19 @@ ucase_fold(const UCaseProps *csp, UChar32 c, uint32_t options) {
   */
  
  U_CAPI int32_t U_EXPORT2
-ucase_toFullFolding(const UCaseProps *csp, UChar32 c,
+ucase_toFullFolding(UChar32 c,
                      const UChar **pString,
-                    uint32_t options)
-{
+                    uint32_t options) {
+    // The sign of the result has meaning, input must be non-negative so that it can be returned as is.
+    U_ASSERT(c >= 0);
      UChar32 result=c;
-    uint16_t props=UTRIE2_GET16(&csp->trie, c);
+    uint16_t props=UTRIE2_GET16(&ucase_props_singleton.trie, c);
      if(!PROPS_HAS_EXCEPTION(props)) {
          if(UCASE_GET_TYPE(props)>=UCASE_UPPER) {
              result=c+UCASE_GET_DELTA(props);
          }
      } else {
-        const uint16_t *pe=GET_EXCEPTIONS(csp, props), *pe2;
+        const uint16_t *pe=GET_EXCEPTIONS(&ucase_props_singleton, props), *pe2;
          uint16_t excWord=*pe++;
          int32_t full, idx;
  
@@ -1226,66 +1299,59 @@ ucase_toFullFolding(const UCaseProps *csp, UChar32 c,
  
  /* case mapping properties API ---------------------------------------------- */
  
-#define GET_CASE_PROPS() &ucase_props_singleton
-
  /* public API (see uchar.h) */
  
  U_CAPI UBool U_EXPORT2
  u_isULowercase(UChar32 c) {
-    return (UBool)(UCASE_LOWER==ucase_getType(GET_CASE_PROPS(), c));
+    return (UBool)(UCASE_LOWER==ucase_getType(c));
  }
  
  U_CAPI UBool U_EXPORT2
  u_isUUppercase(UChar32 c) {
-    return (UBool)(UCASE_UPPER==ucase_getType(GET_CASE_PROPS(), c));
+    return (UBool)(UCASE_UPPER==ucase_getType(c));
  }
  
  /* Transforms the Unicode character to its lower case equivalent.*/
  U_CAPI UChar32 U_EXPORT2
  u_tolower(UChar32 c) {
-    return ucase_tolower(GET_CASE_PROPS(), c);
+    return ucase_tolower(c);
  }
      
  /* Transforms the Unicode character to its upper case equivalent.*/
  U_CAPI UChar32 U_EXPORT2
  u_toupper(UChar32 c) {
-    return ucase_toupper(GET_CASE_PROPS(), c);
+    return ucase_toupper(c);
  }
  
  /* Transforms the Unicode character to its title case equivalent.*/
  U_CAPI UChar32 U_EXPORT2
  u_totitle(UChar32 c) {
-    return ucase_totitle(GET_CASE_PROPS(), c);
+    return ucase_totitle(c);
  }
  
  /* return the simple case folding mapping for c */
  U_CAPI UChar32 U_EXPORT2
  u_foldCase(UChar32 c, uint32_t options) {
-    return ucase_fold(GET_CASE_PROPS(), c, options);
+    return ucase_fold(c, options);
  }
  
  U_CFUNC int32_t U_EXPORT2
  ucase_hasBinaryProperty(UChar32 c, UProperty which) {
      /* case mapping properties */
      const UChar *resultString;
-    int32_t locCache;
-    const UCaseProps *csp=GET_CASE_PROPS();
-    if(csp==NULL) {
-        return FALSE;
-    }
      switch(which) {
      case UCHAR_LOWERCASE:
-        return (UBool)(UCASE_LOWER==ucase_getType(csp, c));
+        return (UBool)(UCASE_LOWER==ucase_getType(c));
      case UCHAR_UPPERCASE:
-        return (UBool)(UCASE_UPPER==ucase_getType(csp, c));
+        return (UBool)(UCASE_UPPER==ucase_getType(c));
      case UCHAR_SOFT_DOTTED:
-        return ucase_isSoftDotted(csp, c);
+        return ucase_isSoftDotted(c);
      case UCHAR_CASE_SENSITIVE:
-        return ucase_isCaseSensitive(csp, c);
+        return ucase_isCaseSensitive(c);
      case UCHAR_CASED:
-        return (UBool)(UCASE_NONE!=ucase_getType(csp, c));
+        return (UBool)(UCASE_NONE!=ucase_getType(c));
      case UCHAR_CASE_IGNORABLE:
-        return (UBool)(ucase_getTypeOrIgnorable(csp, c)>>2);
+        return (UBool)(ucase_getTypeOrIgnorable(c)>>2);
      /*
       * Note: The following Changes_When_Xyz are defined as testing whether
       * the NFD form of the input changes when Xyz-case-mapped.
@@ -1299,21 +1365,17 @@ ucase_hasBinaryProperty(UChar32 c, UProperty which) {
       * start sets for normalization and case mappings.
       */
      case UCHAR_CHANGES_WHEN_LOWERCASED:
-        locCache=UCASE_LOC_ROOT;
-        return (UBool)(ucase_toFullLower(csp, c, NULL, NULL, &resultString, "", &locCache)>=0);
+        return (UBool)(ucase_toFullLower(c, NULL, NULL, &resultString, UCASE_LOC_ROOT)>=0);
      case UCHAR_CHANGES_WHEN_UPPERCASED:
-        locCache=UCASE_LOC_ROOT;
-        return (UBool)(ucase_toFullUpper(csp, c, NULL, NULL, &resultString, "", &locCache)>=0);
+        return (UBool)(ucase_toFullUpper(c, NULL, NULL, &resultString, UCASE_LOC_ROOT)>=0);
      case UCHAR_CHANGES_WHEN_TITLECASED:
-        locCache=UCASE_LOC_ROOT;
-        return (UBool)(ucase_toFullTitle(csp, c, NULL, NULL, &resultString, "", &locCache)>=0);
+        return (UBool)(ucase_toFullTitle(c, NULL, NULL, &resultString, UCASE_LOC_ROOT)>=0);
      /* case UCHAR_CHANGES_WHEN_CASEFOLDED: -- in uprops.c */
      case UCHAR_CHANGES_WHEN_CASEMAPPED:
-        locCache=UCASE_LOC_ROOT;
          return (UBool)(
-            ucase_toFullLower(csp, c, NULL, NULL, &resultString, "", &locCache)>=0 ||
-            ucase_toFullUpper(csp, c, NULL, NULL, &resultString, "", &locCache)>=0 ||
-            ucase_toFullTitle(csp, c, NULL, NULL, &resultString, "", &locCache)>=0);
+            ucase_toFullLower(c, NULL, NULL, &resultString, UCASE_LOC_ROOT)>=0 ||
+            ucase_toFullUpper(c, NULL, NULL, &resultString, UCASE_LOC_ROOT)>=0 ||
+            ucase_toFullTitle(c, NULL, NULL, &resultString, UCASE_LOC_ROOT)>=0);
      default:
          return FALSE;
      }