ICU-64252.0.1.tar.gz

[apple/icu.git] / icuSources / test / cintltst / ccapitst.c
diff --git a/icuSources/test/cintltst/ccapitst.c b/icuSources/test/cintltst/ccapitst.c

index 16c9d9de2c234055c8c636ced4b30b48c00a674b..22785b386616a940fabd920e9c47ee8e6a59ea20 100644 (file)
--- a/icuSources/test/cintltst/ccapitst.c
+++ b/icuSources/test/cintltst/ccapitst.c
@@ -1,6 +1,8 @@
+// © 2016 and later: Unicode, Inc. and others.
+// License & terms of use: http://www.unicode.org/copyright.html
  /********************************************************************
   * COPYRIGHT: 
- * Copyright (c) 1997-2015, International Business Machines Corporation and
+ * Copyright (c) 1997-2016, International Business Machines Corporation and
   * others. All Rights Reserved.
   ********************************************************************/
  /*****************************************************************************
@@ -22,6 +24,7 @@
  #include "unicode/putil.h"
  #include "unicode/uset.h"
  #include "unicode/ustring.h"
+#include "unicode/utf8.h"
  #include "ucnv_bld.h" /* for sizeof(UConverter) */
  #include "cmemory.h"  /* for UAlignedMemory */
  #include "cintltst.h"
@@ -412,7 +415,7 @@ static void TestConvert()
          const uint8_t source[]={ 0x00, 0x04, 0x05, 0x06, 0xa2, 0xb4, 0x00};
          const uint8_t expectedTarget[]={ 0x00, 0x37, 0x2d, 0x2e, 0x0e, 0x49, 0x62, 0x0f, 0x00};
          char *target=0;
-        sourceLimit=sizeof(source)/sizeof(source[0]);
+        sourceLimit=UPRV_LENGTHOF(source);
          err=U_ZERO_ERROR;
          targetLimit=0;
              
@@ -447,14 +450,14 @@ static void TestConvert()
              }
  
              err=U_ILLEGAL_ARGUMENT_ERROR;
-            sourceLimit=sizeof(source)/sizeof(source[0]);
+            sourceLimit=UPRV_LENGTHOF(source);
              i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err);
              if(i !=0 ){
                  log_err("FAILURE! ucnv_convert() with err=U_ILLEGAL_ARGUMENT_ERROR is expected to return 0\n");
              }
  
              err=U_ZERO_ERROR;
-            sourceLimit=sizeof(source)/sizeof(source[0]);
+            sourceLimit=UPRV_LENGTHOF(source);
              targetLimit=0;
              i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err);
              if(!(U_FAILURE(err) && err==U_BUFFER_OVERFLOW_ERROR)){
@@ -849,7 +852,7 @@ static void TestConvert()
  
  
          /*Reads in the file*/
-        while(!feof(ucs_file_in)&&(i+=fread(ucs_file_buffer+i, sizeof(UChar), 1, ucs_file_in)))
+        while(!feof(ucs_file_in)&&(i+=(int32_t)fread(ucs_file_buffer+i, sizeof(UChar), 1, ucs_file_in)))
          {
              myUChar = ucs_file_buffer[i-1];
              
@@ -892,7 +895,7 @@ static void TestConvert()
                       NULL,
                       targetcapacity2,
                       output_cp_buffer,
-                     strlen(output_cp_buffer),
+                     (int32_t)strlen(output_cp_buffer),
                       &err);
          /*if there is an buffer overflow then trap the values and pass them and make the actual call*/
  
@@ -904,7 +907,7 @@ static void TestConvert()
                     uchar2,
                     targetsize+1,
                     output_cp_buffer,
-                   strlen(output_cp_buffer),
+                   (int32_t)strlen(output_cp_buffer),
                     &err);
  
              if(U_FAILURE(err))
@@ -944,12 +947,12 @@ static void TestConvert()
              log_err("\nFAILURE: ucnv_fromUChars with targetLength 0 is expected to fail and throw U_BUFFER_OVERFLOW_ERROR\n");
          }
          /*toUChars with error conditions*/
-        targetsize = ucnv_toUChars(myConverter, uchar2, targetsize, output_cp_buffer, strlen(output_cp_buffer), &err);
+        targetsize = ucnv_toUChars(myConverter, uchar2, targetsize, output_cp_buffer, (int32_t)strlen(output_cp_buffer), &err);
          if(targetsize != 0){
              log_err("\nFAILURE: ucnv_toUChars with err != U_ZERO_ERROR is expected to fail and return 0\n");
          }
          err=U_ZERO_ERROR;
-        targetsize = ucnv_toUChars(myConverter, uchar2, -1, output_cp_buffer, strlen(output_cp_buffer), &err);
+        targetsize = ucnv_toUChars(myConverter, uchar2, -1, output_cp_buffer, (int32_t)strlen(output_cp_buffer), &err);
          if(targetsize != 0 || err != U_ILLEGAL_ARGUMENT_ERROR){
              log_err("\nFAILURE: ucnv_toUChars with targetsize < 0 is expected to throw U_ILLEGAL_ARGUMENT_ERROR and return 0\n");
          }
@@ -959,7 +962,7 @@ static void TestConvert()
              log_err("\nFAILURE: ucnv_toUChars with sourceLength 0 is expected to return 0\n");
          }
          targetcapacity2=0; 
-        targetsize = ucnv_toUChars(myConverter, NULL, targetcapacity2, output_cp_buffer,  strlen(output_cp_buffer), &err);
+        targetsize = ucnv_toUChars(myConverter, NULL, targetcapacity2, output_cp_buffer, (int32_t)strlen(output_cp_buffer), &err);
          if (err != U_STRING_NOT_TERMINATED_WARNING) {
              log_err("\nFAILURE: ucnv_toUChars(targetLength)->%s instead of U_STRING_NOT_TERMINATED_WARNING\n",
                      u_errorName(err));
@@ -1165,7 +1168,7 @@ static void TestAlias() {
          { "UTF32_PlatformEndian", "UTF32_PlatformEndian" },
          { "UTF-32",   "ucs-4" }
      };
-    int32_t CONVERTERS_NAMES_LENGTH = sizeof(CONVERTERS_NAMES) / sizeof(*CONVERTERS_NAMES);
+    int32_t CONVERTERS_NAMES_LENGTH = UPRV_LENGTHOF(CONVERTERS_NAMES);
  
      /* When there are bugs in gencnval or in ucnv_io, converters can
         appear to have no aliases. */
@@ -1693,16 +1696,16 @@ static void TestConvertSafeClone()
  
      char *pCharBuffer;
      const char *pConstCharBuffer;
-    const char *charBufferLimit = charBuffer + sizeof(charBuffer)/sizeof(*charBuffer);
+    const char *charBufferLimit = charBuffer + UPRV_LENGTHOF(charBuffer);
      UChar uniBuffer[] = {0x0058, 0x0059, 0x005A}; /* "XYZ" */
      UChar uniCharBuffer[20];
      char  charSourceBuffer[] = { 0x1b, 0x24, 0x42 };
      const char *pCharSource = charSourceBuffer;
      const char *pCharSourceLimit = charSourceBuffer + sizeof(charSourceBuffer);
      UChar *pUCharTarget = uniCharBuffer;
-    UChar *pUCharTargetLimit = uniCharBuffer + sizeof(uniCharBuffer)/sizeof(*uniCharBuffer);
+    UChar *pUCharTargetLimit = uniCharBuffer + UPRV_LENGTHOF(uniCharBuffer);
      const UChar * pUniBuffer;
-    const UChar *uniBufferLimit = uniBuffer + sizeof(uniBuffer)/sizeof(*uniBuffer);
+    const UChar *uniBufferLimit = uniBuffer + UPRV_LENGTHOF(uniBuffer);
      int32_t idx, j;
  
      err = U_ZERO_ERROR;
@@ -1893,7 +1896,7 @@ static void TestCCSID() {
      int32_t ccsids[]={ 37, 850, 943, 949, 950, 1047, 1252, 1392, 33722 };
      int32_t i, ccsid;
  
-    for(i=0; i<(int32_t)(sizeof(ccsids)/sizeof(int32_t)); ++i) {
+    for(i=0; i<UPRV_LENGTHOF(ccsids); ++i) {
          ccsid=ccsids[i];
  
          errorCode=U_ZERO_ERROR;
@@ -2492,6 +2495,26 @@ static UBool getTestChar(UConverter *cnv, const char *converterName,
      return TRUE;
  }
  
+static UBool isOneTruncatedUTF8(const char *s, int32_t length) {
+    if(length==0) {
+        return FALSE;
+    } else if(length==1) {
+        return U8_IS_LEAD(s[0]);
+    } else {
+        int32_t count=U8_COUNT_TRAIL_BYTES(s[0]);
+        if(length<=count) {
+            // 2 or more bytes, but fewer than the lead byte indicates.
+            int32_t oneLength=0;
+            U8_FWD_1(s, oneLength, length);
+            // Truncated if we reach the end of the string.
+            // Not true if the lead byte and first trail byte do not start a valid sequence,
+            // e.g., E0 80 -> oneLength=1.
+            return oneLength==length;
+        }
+        return FALSE;
+    }
+}
+
  static void testFromTruncatedUTF8(UConverter *utf8Cnv, UConverter *cnv, const char *converterName,
                                    char charUTF8[4], int32_t charUTF8Length,
                                    char char0[8], int32_t char0Length,
@@ -2522,8 +2545,8 @@ static void testFromTruncatedUTF8(UConverter *utf8Cnv, UConverter *cnv, const ch
  
      for(i=0; i<UPRV_LENGTHOF(badUTF8); ++i) {
          /* truncated sequence? */
-        int32_t length=strlen(badUTF8[i]);
-        if(length>=(1+U8_COUNT_TRAIL_BYTES(badUTF8[i][0]))) {
+        int32_t length = (int32_t)strlen(badUTF8[i]);
+        if(!isOneTruncatedUTF8(badUTF8[i], length)) {
              continue;
          }
  
@@ -2585,7 +2608,7 @@ static void testFromBadUTF8(UConverter *utf8Cnv, UConverter *cnv, const char *co
      expectLength=char0Length;
  
      for(i=0; i<UPRV_LENGTHOF(badUTF8); ++i) {
-        int32_t length=strlen(badUTF8[i]);
+        int32_t length = (int32_t)strlen(badUTF8[i]);
          memcpy(utf8+utf8Length, badUTF8[i], length);
          utf8Length+=length;
  
@@ -2898,7 +2921,7 @@ static void TestLMBCSMaxChar(void) {
          { 4, "HZ"},
  
          { 3, "ISO-2022"},
-        { 3, "ISO-2022-KR"},
+        { 8, "ISO-2022-KR"},
          { 6, "ISO-2022-JP"},
          { 8, "ISO-2022-CN"},