ICU-62108.0.1.tar.gz

[apple/icu.git] / icuSources / common / utrie2.h
diff --git a/icuSources/common/utrie2.h b/icuSources/common/utrie2.h

index 4e7ead05215326f98272ebbf056d257cc8bfa2cd..8e1caa5e90bde2a5fff8a6bcbac75dc0b1b86bba 100644 (file)
--- a/icuSources/common/utrie2.h
+++ b/icuSources/common/utrie2.h
@@ -1,12 +1,14 @@
+// © 2016 and later: Unicode, Inc. and others.
+// License & terms of use: http://www.unicode.org/copyright.html
  /*
  ******************************************************************************
  *
-*   Copyright (C) 2001-2010, International Business Machines
+*   Copyright (C) 2001-2014, International Business Machines
  *   Corporation and others.  All Rights Reserved.
  *
  ******************************************************************************
  *   file name:  utrie2.h
-*   encoding:   US-ASCII
+*   encoding:   UTF-8
  *   tab size:   8 (not used)
  *   indentation:4
  *
@@ -18,6 +20,8 @@
  #define __UTRIE2_H__
  
  #include "unicode/utypes.h"
+#include "unicode/utf8.h"
+#include "putilimp.h"
  #include "udataswp.h"
  
  U_CDECL_BEGIN
@@ -51,6 +55,8 @@ typedef struct UTrie UTrie;
   *   is truncated, omitting both the BMP portion and the high range.
   * - There is a special small index for 2-byte UTF-8, and the initial data
   *   entries are designed for fast 1/2-byte UTF-8 lookup.
+ *   Starting with ICU 60, C0 and C1 are not recognized as UTF-8 lead bytes any more at all,
+ *   and the associated 2-byte indexes are unused.
   */
  
  /**
@@ -318,7 +324,7 @@ utrie2_isFrozen(const UTrie2 *trie);
   * @see utrie2_openFromSerialized()
   */
  U_CAPI int32_t U_EXPORT2
-utrie2_serialize(UTrie2 *trie,
+utrie2_serialize(const UTrie2 *trie,
                   void *data, int32_t capacity,
                   UErrorCode *pErrorCode);
  
@@ -618,8 +624,9 @@ U_CDECL_END
  
  /* C++ convenience wrappers ------------------------------------------------- */
  
-#ifdef XP_CPLUSPLUS
+#ifdef __cplusplus
  
+#include "unicode/utf.h"
  #include "mutex.h"
  
  U_NAMESPACE_BEGIN
@@ -657,19 +664,6 @@ public:
      const UChar *limit;
  };
  
-class UTrie2Singleton {
-public:
-    UTrie2Singleton(SimpleSingleton &s) : singleton(s) {}
-    void deleteInstance() {
-        utrie2_close((UTrie2 *)singleton.fInstance);
-        singleton.reset();
-    }
-    UTrie2 *getInstance(InstantiatorFn *instantiator, const void *context,
-                        UErrorCode &errorCode);
-private:
-    SimpleSingleton &singleton;
-};
-
  U_NAMESPACE_END
  
  #endif
@@ -942,29 +936,29 @@ utrie2_internalU8PrevIndex(const UTrie2 *trie, UChar32 c,
  /** Internal UTF-8 next-post-increment: get the next code point's data. */
  #define _UTRIE2_U8_NEXT(trie, ascii, data, src, limit, result) { \
      uint8_t __lead=(uint8_t)*(src)++; \
-    if(__lead<0xc0) { \
+    if(U8_IS_SINGLE(__lead)) { \
          (result)=(trie)->ascii[__lead]; \
      } else { \
          uint8_t __t1, __t2; \
-        if( /* handle U+0000..U+07FF inline */ \
-            __lead<0xe0 && (src)<(limit) && \
-            (__t1=(uint8_t)(*(src)-0x80))<=0x3f \
-        ) { \
-            ++(src); \
-            (result)=(trie)->data[ \
-                (trie)->index[(UTRIE2_UTF8_2B_INDEX_2_OFFSET-0xc0)+__lead]+ \
-                __t1]; \
-        } else if( /* handle U+0000..U+CFFF inline */ \
-            __lead<0xed && ((src)+1)<(limit) && \
-            (__t1=(uint8_t)(*(src)-0x80))<=0x3f && (__lead>0xe0 || __t1>=0x20) && \
+        if( /* handle U+0800..U+FFFF inline */ \
+            0xe0<=__lead && __lead<0xf0 && ((src)+1)<(limit) && \
+            U8_IS_VALID_LEAD3_AND_T1(__lead, __t1=(uint8_t)*(src)) && \
              (__t2=(uint8_t)(*((src)+1)-0x80))<= 0x3f \
          ) { \
              (src)+=2; \
              (result)=(trie)->data[ \
                  ((int32_t)((trie)->index[((__lead-0xe0)<<(12-UTRIE2_SHIFT_2))+ \
-                                         (__t1<<(6-UTRIE2_SHIFT_2))+(__t2>>UTRIE2_SHIFT_2)]) \
+                                         ((__t1&0x3f)<<(6-UTRIE2_SHIFT_2))+(__t2>>UTRIE2_SHIFT_2)]) \
                  <<UTRIE2_INDEX_SHIFT)+ \
                  (__t2&UTRIE2_DATA_MASK)]; \
+        } else if( /* handle U+0080..U+07FF inline */ \
+            __lead<0xe0 && __lead>=0xc2 && (src)<(limit) && \
+            (__t1=(uint8_t)(*(src)-0x80))<=0x3f \
+        ) { \
+            ++(src); \
+            (result)=(trie)->data[ \
+                (trie)->index[(UTRIE2_UTF8_2B_INDEX_2_OFFSET-0xc0)+__lead]+ \
+                __t1]; \
          } else { \
              int32_t __index=utrie2_internalU8NextIndex((trie), __lead, (const uint8_t *)(src), \
                                                                         (const uint8_t *)(limit)); \
@@ -977,7 +971,7 @@ utrie2_internalU8PrevIndex(const UTrie2 *trie, UChar32 c,
  /** Internal UTF-8 pre-decrement-previous: get the previous code point's data. */
  #define _UTRIE2_U8_PREV(trie, ascii, data, start, src, result) { \
      uint8_t __b=(uint8_t)*--(src); \
-    if(__b<0x80) { \
+    if(U8_IS_SINGLE(__b)) { \
          (result)=(trie)->ascii[__b]; \
      } else { \
          int32_t __index=utrie2_internalU8PrevIndex((trie), __b, (const uint8_t *)(start), \
@@ -989,11 +983,4 @@ utrie2_internalU8PrevIndex(const UTrie2 *trie, UChar32 c,
  
  U_CDECL_END
  
-/**
- * Work around MSVC 2003 optimization bugs.
- */
-#if defined (U_HAVE_MSVC_2003_OR_EARLIER)
-#pragma optimize("", off)
-#endif
-
  #endif