ICU-64252.0.1.tar.gz

[apple/icu.git] / icuSources / test / cintltst / nucnvtst.c
diff --git a/icuSources/test/cintltst/nucnvtst.c b/icuSources/test/cintltst/nucnvtst.c

index 6791a1ebbec03761cc4bb2bbefdc0ebbc4c2dd22..ba8d131361372466f25a3886e5248d65153d6901 100644 (file)
--- a/icuSources/test/cintltst/nucnvtst.c
+++ b/icuSources/test/cintltst/nucnvtst.c
@@ -1,11 +1,13 @@
+// © 2016 and later: Unicode, Inc. and others.
+// License & terms of use: http://www.unicode.org/copyright.html
  /********************************************************************
   * COPYRIGHT:
- * Copyright (c) 1997-2006,2008 International Business Machines Corporation and
+ * Copyright (c) 1997-2016, International Business Machines Corporation and
   * others. All Rights Reserved.
   ********************************************************************/
  /*******************************************************************************
  *
-* File CCONVTST.C
+* File nucnvtst.c
  *
  * Modification History:
  *        Name                     Description
@@ -17,18 +19,23 @@
  #include "unicode/uloc.h"
  #include "unicode/ucnv.h"
  #include "unicode/ucnv_err.h"
+#include "unicode/ucnv_cb.h"
  #include "cintltst.h"
  #include "unicode/utypes.h"
  #include "unicode/ustring.h"
  #include "unicode/ucol.h"
+#include "unicode/utf16.h"
  #include "cmemory.h"
+#include "nucnvtst.h"
  
  static void TestNextUChar(UConverter* cnv, const char* source, const char* limit, const int32_t results[], const char* message);
  static void TestNextUCharError(UConverter* cnv, const char* source, const char* limit, UErrorCode expected, const char* message);
  #if !UCONFIG_NO_COLLATION
  static void TestJitterbug981(void);
  #endif
+#if !UCONFIG_NO_LEGACY_CONVERSION
  static void TestJitterbug1293(void);
+#endif
  static void TestNewConvertWithBufferSizes(int32_t osize, int32_t isize) ;
  static void TestConverterTypesAndStarters(void);
  static void TestAmbiguous(void);
@@ -49,6 +56,9 @@ static void TestLATIN1(void);
  static void TestSBCS(void);
  static void TestDBCS(void);
  static void TestMBCS(void);
+#if !UCONFIG_NO_LEGACY_CONVERSION && !UCONFIG_NO_FILE_IO
+static void TestICCRunout(void);
+#endif
  
  #ifdef U_ENABLE_GENERIC_ISO_2022
  static void TestISO_2022(void);
@@ -60,7 +70,12 @@ static void TestISO_2022_JP_2(void);
  static void TestISO_2022_KR(void);
  static void TestISO_2022_KR_1(void);
  static void TestISO_2022_CN(void);
+#if 0
+   /*
+    * ICU 4.4 (ticket #7314) removes mappings for CNS 11643 planes 3..7
+    */
  static void TestISO_2022_CN_EXT(void);
+#endif
  static void TestJIS(void);
  static void TestHZ(void);
  #endif
@@ -73,15 +88,26 @@ static void TestGB18030(void);
  static void TestLMBCS(void);
  static void TestJitterbug255(void);
  static void TestEBCDICUS4XML(void);
+#if 0
+   /*
+    * ICU 4.4 (ticket #7314) removes mappings for CNS 11643 planes 3..7
+    */
  static void TestJitterbug915(void);
+#endif
  static void TestISCII(void);
  
  static void TestCoverageMBCS(void);
  static void TestJitterbug2346(void);
  static void TestJitterbug2411(void);
+static void TestJB5275(void);
+static void TestJB5275_1(void);
  static void TestJitterbug6175(void);
+
+static void TestIsFixedWidth(void);
  #endif
  
+static void TestInBufSizes(void);
+
  static void TestRoundTrippingAllUTF(void);
  static void TestConv(const uint16_t in[],
                       int len,
@@ -89,7 +115,6 @@ static void TestConv(const uint16_t in[],
                       const char* lang,
                       char byteArr[],
                       int byteArrLen);
-void addTestNewConvert(TestNode** root);
  
  /* open a converter, using test data if it begins with '@' */
  static UConverter *my_ucnv_open(const char *cnv, UErrorCode *err);
@@ -224,8 +249,10 @@ static void TestOutBufSizes(void)
  
  void addTestNewConvert(TestNode** root)
  {
+#if !UCONFIG_NO_FILE_IO
     addTest(root, &TestInBufSizes, "tsconv/nucnvtst/TestInBufSizes");
     addTest(root, &TestOutBufSizes, "tsconv/nucnvtst/TestOutBufSizes");
+#endif
     addTest(root, &TestConverterTypesAndStarters, "tsconv/nucnvtst/TestConverterTypesAndStarters");
     addTest(root, &TestAmbiguous, "tsconv/nucnvtst/TestAmbiguous");
     addTest(root, &TestSignatureDetection, "tsconv/nucnvtst/TestSignatureDetection");
@@ -250,7 +277,10 @@ void addTestNewConvert(TestNode** root)
  
  #if !UCONFIG_NO_LEGACY_CONVERSION
     addTest(root, &TestSBCS, "tsconv/nucnvtst/TestSBCS");
+#if !UCONFIG_NO_FILE_IO
     addTest(root, &TestDBCS, "tsconv/nucnvtst/TestDBCS");
+   addTest(root, &TestICCRunout, "tsconv/nucnvtst/TestICCRunout");
+#endif
     addTest(root, &TestMBCS, "tsconv/nucnvtst/TestMBCS");
  
  #ifdef U_ENABLE_GENERIC_ISO_2022
@@ -264,8 +294,11 @@ void addTestNewConvert(TestNode** root)
     addTest(root, &TestISO_2022_KR, "tsconv/nucnvtst/TestISO_2022_KR");
     addTest(root, &TestISO_2022_KR_1, "tsconv/nucnvtst/TestISO_2022_KR_1");
     addTest(root, &TestISO_2022_CN, "tsconv/nucnvtst/TestISO_2022_CN");
+   /*
+    * ICU 4.4 (ticket #7314) removes mappings for CNS 11643 planes 3..7
     addTest(root, &TestISO_2022_CN_EXT, "tsconv/nucnvtst/TestISO_2022_CN_EXT");
     addTest(root, &TestJitterbug915, "tsconv/nucnvtst/TestJitterbug915");
+    */
     addTest(root, &TestHZ, "tsconv/nucnvtst/TestHZ");
  #endif
  
@@ -277,7 +310,8 @@ void addTestNewConvert(TestNode** root)
     addTest(root, &TestJitterbug255, "tsconv/nucnvtst/TestJitterbug255");
     addTest(root, &TestEBCDICUS4XML, "tsconv/nucnvtst/TestEBCDICUS4XML");
     addTest(root, &TestISCII, "tsconv/nucnvtst/TestISCII");
-
+   addTest(root, &TestJB5275, "tsconv/nucnvtst/TestJB5275");
+   addTest(root, &TestJB5275_1, "tsconv/nucnvtst/TestJB5275_1");
  #if !UCONFIG_NO_COLLATION
     addTest(root, &TestJitterbug981, "tsconv/nucnvtst/TestJitterbug981");
  #endif
@@ -286,7 +320,7 @@ void addTestNewConvert(TestNode** root)
  #endif
  
  
-#if !UCONFIG_NO_LEGACY_CONVERSION
+#if !UCONFIG_NO_LEGACY_CONVERSION && !UCONFIG_NO_FILE_IO
     addTest(root, &TestCoverageMBCS, "tsconv/nucnvtst/TestCoverageMBCS");
  #endif
  
@@ -296,6 +330,8 @@ void addTestNewConvert(TestNode** root)
     addTest(root, &TestJitterbug2346, "tsconv/nucnvtst/TestJitterbug2346");
     addTest(root, &TestJitterbug2411, "tsconv/nucnvtst/TestJitterbug2411");
     addTest(root, &TestJitterbug6175, "tsconv/nucnvtst/TestJitterbug6175");
+
+   addTest(root, &TestIsFixedWidth, "tsconv/nucnvtst/TestIsFixedWidth");
  #endif
  }
  
@@ -369,7 +405,7 @@ static ETestConvertResult testConvertFromU( const UChar *source, int sourceLen,
      targ = junkout;
      offs = junokout;
  
-    realBufferSize = (sizeof(junkout)/sizeof(junkout[0]));
+    realBufferSize = UPRV_LENGTHOF(junkout);
      realBufferEnd = junkout + realBufferSize;
      realSourceEnd = source + sourceLen;
  
@@ -410,7 +446,7 @@ static ETestConvertResult testConvertFromU( const UChar *source, int sourceLen,
      log_verbose("\nConversion done [%d uchars in -> %d chars out]. \nResult :",
                  sourceLen, targ-junkout);
  
-    if(VERBOSITY)
+    if(getTestOption(VERBOSITY_OPTION))
      {
        char junk[9999];
        char offset_str[9999];
@@ -436,9 +472,9 @@ static ETestConvertResult testConvertFromU( const UChar *source, int sourceLen,
      if(expectLen != targ-junkout) {
        log_err("Expected %d chars out, got %d %s\n", expectLen, targ-junkout, gNuConvTestName);
        log_verbose("Expected %d chars out, got %d %s\n", expectLen, targ-junkout, gNuConvTestName);
-      printf("\nGot:");
+      fprintf(stderr, "Got:\n");
        printSeqErr((const unsigned char*)junkout, (int32_t)(targ-junkout));
-      printf("\nExpected:");
+      fprintf(stderr, "Expected:\n");
        printSeqErr((const unsigned char*)expect, expectLen);
        return TC_MISMATCH;
      }
@@ -469,9 +505,9 @@ static ETestConvertResult testConvertFromU( const UChar *source, int sourceLen,
      } else {
        log_err("String does not match u->%s\n", gNuConvTestName);
        printUSeqErr(source, sourceLen);
-      printf("\nGot:");
+      fprintf(stderr, "Got:\n");
        printSeqErr((const unsigned char *)junkout, expectLen);
-      printf("\nExpected:");
+      fprintf(stderr, "Expected:\n");
        printSeqErr((const unsigned char *)expect, expectLen);
        
        return TC_MISMATCH;
@@ -527,7 +563,7 @@ static ETestConvertResult testConvertToU( const uint8_t *source, int sourcelen,
      targ = junkout;
      offs = junokout;
  
-    realBufferSize = (sizeof(junkout)/sizeof(junkout[0]));
+    realBufferSize = UPRV_LENGTHOF(junkout);
      realBufferEnd = junkout + realBufferSize;
      realSourceEnd = src + sourcelen;
  
@@ -571,7 +607,7 @@ static ETestConvertResult testConvertToU( const uint8_t *source, int sourcelen,
  
      log_verbose("\nConversion done. %d bytes -> %d chars.\nResult :",
          sourcelen, targ-junkout);
-    if(VERBOSITY)
+    if(getTestOption(VERBOSITY_OPTION))
      {
          char junk[9999];
          char offset_str[9999];
@@ -649,15 +685,17 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
  /** test chars #1 */
      /*  1 2 3  1Han 2Han 3Han .  */
      static const UChar   sampleText[] =
-     { 0x0031, 0x0032, 0x0033, 0x0000, 0x4e00, 0x4e8c, 0x4e09, 0x002E };
+     { 0x0031, 0x0032, 0x0033, 0x0000, 0x4e00, 0x4e8c, 0x4e09, 0x002E, 0xD840, 0xDC21 };
+    static const UChar sampleTextRoundTripUnmappable[] =
+    { 0x0031, 0x0032, 0x0033, 0x0000, 0x4e00, 0x4e8c, 0x4e09, 0x002E, 0xfffd };
  
  
      static const uint8_t expectedUTF8[] =
-     { 0x31, 0x32, 0x33, 0x00, 0xe4, 0xb8, 0x80, 0xe4, 0xba, 0x8c, 0xe4, 0xb8, 0x89, 0x2E };
+     { 0x31, 0x32, 0x33, 0x00, 0xe4, 0xb8, 0x80, 0xe4, 0xba, 0x8c, 0xe4, 0xb8, 0x89, 0x2E, 0xf0, 0xa0, 0x80, 0xa1 };
      static const int32_t toUTF8Offs[] =
-     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x04, 0x04, 0x05, 0x05, 0x05, 0x06, 0x06, 0x06, 0x07};
+     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x04, 0x04, 0x05, 0x05, 0x05, 0x06, 0x06, 0x06, 0x07, 0x08, 0x08, 0x08, 0x08 };
      static const int32_t fmUTF8Offs[] =
-     { 0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0007, 0x000a, 0x000d };
+     { 0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0007, 0x000a, 0x000d, 0x000e, 0x000e };
  
  #ifdef U_ENABLE_GENERIC_ISO_2022
      /* Same as UTF8, but with ^[%B preceding */
@@ -672,59 +710,59 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
  
      /*  1 2 3 0, <SO> h1 h2 h3 <SI> . EBCDIC_STATEFUL */
      static const uint8_t expectedIBM930[] =
-     { 0xF1, 0xF2, 0xF3, 0x00, 0x0E, 0x45, 0x41, 0x45, 0x42, 0x45, 0x43, 0x0F, 0x4B };
+     { 0xF1, 0xF2, 0xF3, 0x00, 0x0E, 0x45, 0x41, 0x45, 0x42, 0x45, 0x43, 0x0F, 0x4B, 0x0e, 0xfe, 0xfe, 0x0f };
      static const int32_t toIBM930Offs[] =
-     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07, };
+     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07, 0x08, 0x08, 0x08, -1 };
      static const int32_t fmIBM930Offs[] =
-     { 0x0000, 0x0001, 0x0002, 0x0003, 0x0005, 0x0007, 0x0009, 0x000c};
+     { 0x0000, 0x0001, 0x0002, 0x0003, 0x0005, 0x0007, 0x0009, 0x000c, 0x000e };
  
      /* 1 2 3 0 h1 h2 h3 . MBCS*/
      static const uint8_t expectedIBM943[] =
-     {  0x31, 0x32, 0x33, 0x00, 0x88, 0xea, 0x93, 0xf1, 0x8e, 0x4f, 0x2e };
+     {  0x31, 0x32, 0x33, 0x00, 0x88, 0xea, 0x93, 0xf1, 0x8e, 0x4f, 0x2e, 0xfc, 0xfc };
      static const int32_t toIBM943Offs    [] =
-     {  0x00, 0x01, 0x02, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07 };
+     {  0x00, 0x01, 0x02, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x08, 0x08 };
      static const int32_t fmIBM943Offs[] =
-     { 0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0006, 0x0008, 0x000a};
+     { 0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0006, 0x0008, 0x000a, 0x000b };
  
      /* 1 2 3 0 h1 h2 h3 . DBCS*/
      static const uint8_t expectedIBM9027[] =
-     {  0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0x4c, 0x41, 0x4c, 0x48, 0x4c, 0x55, 0xfe, 0xfe};
+     {  0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0xfe, 0x4c, 0x41, 0x4c, 0x48, 0x4c, 0x55, 0xfe, 0xfe, 0xfe, 0xfe };
      static const int32_t toIBM9027Offs    [] =
-     {  0x00, 0x00, 0x01, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07};
+     {  0x00, 0x00, 0x01, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07, 0x08, 0x08 };
  
       /* 1 2 3 0 <?> <?> <?> . SBCS*/
      static const uint8_t expectedIBM920[] =
-     {  0x31, 0x32, 0x33, 0x00, 0x1a, 0x1a, 0x1a, 0x2e };
+     {  0x31, 0x32, 0x33, 0x00, 0x1a, 0x1a, 0x1a, 0x2e, 0x1a };
      static const int32_t toIBM920Offs    [] =
-     {  0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07 };
+     {  0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08 };
  
      /* 1 2 3 0 <?> <?> <?> . SBCS*/
      static const uint8_t expectedISO88593[] =
-     { 0x31, 0x32, 0x33, 0x00, 0x1a, 0x1a, 0x1a, 0x2E };
+     { 0x31, 0x32, 0x33, 0x00, 0x1a, 0x1a, 0x1a, 0x2E, 0x1a };
      static const int32_t toISO88593Offs[]     =
-     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07};
+     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08 };
  
      /* 1 2 3 0 <?> <?> <?> . <?> LATIN_1*/
      static const uint8_t expectedLATIN1[] =
-     { 0x31, 0x32, 0x33, 0x00, 0x1a, 0x1a, 0x1a, 0x2E };
+     { 0x31, 0x32, 0x33, 0x00, 0x1a, 0x1a, 0x1a, 0x2E, 0x1a };
      static const int32_t toLATIN1Offs[]     =
-     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07};
+     { 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08 };
  
  
      /*  etc */
      static const uint8_t expectedUTF16BE[] =
-     { 0x00, 0x31, 0x00, 0x32, 0x00, 0x33, 0x00, 0x00, 0x4e, 0x00, 0x4e, 0x8c, 0x4e, 0x09, 0x00, 0x2e };
+     { 0x00, 0x31, 0x00, 0x32, 0x00, 0x33, 0x00, 0x00, 0x4e, 0x00, 0x4e, 0x8c, 0x4e, 0x09, 0x00, 0x2e, 0xd8, 0x40, 0xdc, 0x21 };
      static const int32_t toUTF16BEOffs[]=
-     { 0x00, 0x00, 0x01, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07};
+     { 0x00, 0x00, 0x01, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07, 0x08, 0x08, 0x08, 0x08 };
      static const int32_t fmUTF16BEOffs[] =
-     { 0x0000, 0x0002, 0x0004, 0x0006, 0x0008, 0x000a, 0x000c,  0x000e };
+     { 0x0000, 0x0002, 0x0004, 0x0006, 0x0008, 0x000a, 0x000c,  0x000e, 0x0010, 0x0010 };
  
      static const uint8_t expectedUTF16LE[] =
-     { 0x31, 0x00, 0x32, 0x00, 0x33, 0x00, 0x00, 0x00, 0x00, 0x4e, 0x8c, 0x4e, 0x09, 0x4e, 0x2e, 0x00 };
+     { 0x31, 0x00, 0x32, 0x00, 0x33, 0x00, 0x00, 0x00, 0x00, 0x4e, 0x8c, 0x4e, 0x09, 0x4e, 0x2e, 0x00, 0x40, 0xd8, 0x21, 0xdc };
      static const int32_t toUTF16LEOffs[]=
-     { 0x00, 0x00, 0x01, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06,  0x07, 0x07};
+     { 0x00, 0x00, 0x01, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04, 0x05, 0x05, 0x06, 0x06,  0x07, 0x07, 0x08, 0x08, 0x08, 0x08 };
      static const int32_t fmUTF16LEOffs[] =
-     { 0x0000, 0x0002, 0x0004, 0x0006, 0x0008, 0x000a, 0x000c,  0x000e };
+     { 0x0000, 0x0002, 0x0004, 0x0006, 0x0008, 0x000a, 0x000c, 0x000e, 0x0010, 0x0010 };
  
      static const uint8_t expectedUTF32BE[] =
       { 0x00, 0x00, 0x00, 0x31,
@@ -734,7 +772,8 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
         0x00, 0x00, 0x4e, 0x00,
         0x00, 0x00, 0x4e, 0x8c,
         0x00, 0x00, 0x4e, 0x09,
-       0x00, 0x00, 0x00, 0x2e };
+       0x00, 0x00, 0x00, 0x2e,
+       0x00, 0x02, 0x00, 0x21 };
      static const int32_t toUTF32BEOffs[]=
       { 0x00, 0x00, 0x00, 0x00,
         0x01, 0x01, 0x01, 0x01,
@@ -744,9 +783,10 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
         0x05, 0x05, 0x05, 0x05,
         0x06, 0x06, 0x06, 0x06,
         0x07, 0x07, 0x07, 0x07,
+       0x08, 0x08, 0x08, 0x08,
         0x08, 0x08, 0x08, 0x08 };
      static const int32_t fmUTF32BEOffs[] =
-     { 0x0000, 0x0004, 0x0008, 0x000c, 0x0010, 0x0014, 0x0018,  0x001c };
+     { 0x0000, 0x0004, 0x0008, 0x000c, 0x0010, 0x0014, 0x0018,  0x001c, 0x0020, 0x0020 };
  
      static const uint8_t expectedUTF32LE[] =
       { 0x31, 0x00, 0x00, 0x00,
@@ -756,7 +796,8 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
         0x00, 0x4e, 0x00, 0x00,
         0x8c, 0x4e, 0x00, 0x00,
         0x09, 0x4e, 0x00, 0x00,
-       0x2e, 0x00, 0x00, 0x00 };
+       0x2e, 0x00, 0x00, 0x00,
+       0x21, 0x00, 0x02, 0x00 };
      static const int32_t toUTF32LEOffs[]=
       { 0x00, 0x00, 0x00, 0x00,
         0x01, 0x01, 0x01, 0x01,
@@ -766,9 +807,10 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
         0x05, 0x05, 0x05, 0x05,
         0x06, 0x06, 0x06, 0x06,
         0x07, 0x07, 0x07, 0x07,
+       0x08, 0x08, 0x08, 0x08,
         0x08, 0x08, 0x08, 0x08 };
      static const int32_t fmUTF32LEOffs[] =
-     { 0x0000, 0x0004, 0x0008, 0x000c, 0x0010, 0x0014, 0x0018,  0x001c };
+     { 0x0000, 0x0004, 0x0008, 0x000c, 0x0010, 0x0014, 0x0018, 0x001c, 0x0020, 0x0020 };
  
  
  
@@ -793,7 +835,7 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
  
  
      /*UTF-8*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedUTF8, sizeof(expectedUTF8), "UTF8", toUTF8Offs,FALSE );
  
      log_verbose("Test surrogate behaviour for UTF8\n");
@@ -804,7 +846,7 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
                             0xef, 0xbf, 0xbd
          };
          static const int32_t offsets[]={ 0, 0, 0, 1, 1, 1, 1, 3, 3, 3 };
-        testConvertFromU(testinput, sizeof(testinput)/sizeof(testinput[0]),
+        testConvertFromU(testinput, UPRV_LENGTHOF(testinput),
                           expectedUTF8test2, sizeof(expectedUTF8test2), "UTF8", offsets,FALSE );
  
  
@@ -812,47 +854,47 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
  
  #if !UCONFIG_NO_LEGACY_CONVERSION && defined(U_ENABLE_GENERIC_ISO_2022)
      /*ISO-2022*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedISO2022, sizeof(expectedISO2022), "ISO_2022", toISO2022Offs,FALSE );
  #endif
  
      /*UTF16 LE*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedUTF16LE, sizeof(expectedUTF16LE), "utf-16le", toUTF16LEOffs,FALSE );
      /*UTF16 BE*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedUTF16BE, sizeof(expectedUTF16BE), "utf-16be", toUTF16BEOffs,FALSE );
      /*UTF32 LE*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedUTF32LE, sizeof(expectedUTF32LE), "utf-32le", toUTF32LEOffs,FALSE );
      /*UTF32 BE*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedUTF32BE, sizeof(expectedUTF32BE), "utf-32be", toUTF32BEOffs,FALSE );
  
      /*LATIN_1*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedLATIN1, sizeof(expectedLATIN1), "LATIN_1", toLATIN1Offs,FALSE );
  
  #if !UCONFIG_NO_LEGACY_CONVERSION
      /*EBCDIC_STATEFUL*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedIBM930, sizeof(expectedIBM930), "ibm-930", toIBM930Offs,FALSE );
  
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedISO88593, sizeof(expectedISO88593), "iso-8859-3", toISO88593Offs,FALSE );
  
      /*MBCS*/
  
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedIBM943, sizeof(expectedIBM943), "ibm-943", toIBM943Offs,FALSE );
      /*DBCS*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedIBM9027, sizeof(expectedIBM9027), "@ibm9027", toIBM9027Offs,FALSE );
      /*SBCS*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedIBM920, sizeof(expectedIBM920), "ibm-920", toIBM920Offs,FALSE );
      /*SBCS*/
-    testConvertFromU(sampleText, sizeof(sampleText)/sizeof(sampleText[0]),
+    testConvertFromU(sampleText, UPRV_LENGTHOF(sampleText),
          expectedISO88593, sizeof(expectedISO88593), "iso-8859-3", toISO88593Offs,FALSE );
  #endif
  
@@ -861,51 +903,51 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
  
      /*UTF-8*/
      testConvertToU(expectedUTF8, sizeof(expectedUTF8),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "utf8", fmUTF8Offs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "utf8", fmUTF8Offs,FALSE);
  #if !UCONFIG_NO_LEGACY_CONVERSION && defined(U_ENABLE_GENERIC_ISO_2022)
      /*ISO-2022*/
      testConvertToU(expectedISO2022, sizeof(expectedISO2022),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "ISO_2022", fmISO2022Offs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "ISO_2022", fmISO2022Offs,FALSE);
  #endif
  
      /*UTF16 LE*/
      testConvertToU(expectedUTF16LE, sizeof(expectedUTF16LE),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "utf-16le", fmUTF16LEOffs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "utf-16le", fmUTF16LEOffs,FALSE);
      /*UTF16 BE*/
      testConvertToU(expectedUTF16BE, sizeof(expectedUTF16BE),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "utf-16be", fmUTF16BEOffs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "utf-16be", fmUTF16BEOffs,FALSE);
      /*UTF32 LE*/
      testConvertToU(expectedUTF32LE, sizeof(expectedUTF32LE),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "utf-32le", fmUTF32LEOffs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "utf-32le", fmUTF32LEOffs,FALSE);
      /*UTF32 BE*/
      testConvertToU(expectedUTF32BE, sizeof(expectedUTF32BE),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "utf-32be", fmUTF32BEOffs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "utf-32be", fmUTF32BEOffs,FALSE);
  
  #if !UCONFIG_NO_LEGACY_CONVERSION
      /*EBCDIC_STATEFUL*/
-    testConvertToU(expectedIBM930, sizeof(expectedIBM930),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "ibm-930", fmIBM930Offs,FALSE);
+    testConvertToU(expectedIBM930, sizeof(expectedIBM930), sampleTextRoundTripUnmappable, 
+            UPRV_LENGTHOF(sampleTextRoundTripUnmappable), "ibm-930", fmIBM930Offs,FALSE);
      /*MBCS*/
-    testConvertToU(expectedIBM943, sizeof(expectedIBM943),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "ibm-943", fmIBM943Offs,FALSE);
+    testConvertToU(expectedIBM943, sizeof(expectedIBM943),sampleTextRoundTripUnmappable, 
+            UPRV_LENGTHOF(sampleTextRoundTripUnmappable), "ibm-943", fmIBM943Offs,FALSE);
  #endif
  
      /* Try it again to make sure it still works */
      testConvertToU(expectedUTF16LE, sizeof(expectedUTF16LE),
-        sampleText, sizeof(sampleText)/sizeof(sampleText[0]), "utf-16le", fmUTF16LEOffs,FALSE);
+        sampleText, UPRV_LENGTHOF(sampleText), "utf-16le", fmUTF16LEOffs,FALSE);
  
  #if !UCONFIG_NO_LEGACY_CONVERSION
      testConvertToU(expectedMaltese913, sizeof(expectedMaltese913),
-        malteseUChars, sizeof(malteseUChars)/sizeof(malteseUChars[0]), "latin3", NULL,FALSE);
+        malteseUChars, UPRV_LENGTHOF(malteseUChars), "latin3", NULL,FALSE);
  
-    testConvertFromU(malteseUChars, sizeof(malteseUChars)/sizeof(malteseUChars[0]),
+    testConvertFromU(malteseUChars, UPRV_LENGTHOF(malteseUChars),
          expectedMaltese913, sizeof(expectedMaltese913), "iso-8859-3", NULL,FALSE );
  
      /*LMBCS*/
-    testConvertFromU(LMBCSUChars, sizeof(LMBCSUChars)/sizeof(LMBCSUChars[0]),
+    testConvertFromU(LMBCSUChars, UPRV_LENGTHOF(LMBCSUChars),
          expectedLMBCS, sizeof(expectedLMBCS), "LMBCS-1", toLMBCSOffs,FALSE );
      testConvertToU(expectedLMBCS, sizeof(expectedLMBCS),
-        LMBCSUChars, sizeof(LMBCSUChars)/sizeof(LMBCSUChars[0]), "LMBCS-1", fmLMBCSOffs,FALSE);
+        LMBCSUChars, UPRV_LENGTHOF(LMBCSUChars), "LMBCS-1", fmLMBCSOffs,FALSE);
  #endif
  
      /* UTF-7 examples are mostly from http://www.imc.org/rfc2152 */
@@ -916,12 +958,12 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
                  Hi Mom -+Jjo--!
                  A+ImIDkQ.
                  +-
-                +ZeVnLIqe
+                +ZeVnLIqe-
              */
              0x48, 0x69, 0x20, 0x4d, 0x6f, 0x6d, 0x20, 0x2d, 0x2b, 0x4a, 0x6a, 0x6f, 0x2d, 0x2d, 0x21,
              0x41, 0x2b, 0x49, 0x6d, 0x49, 0x44, 0x6b, 0x51, 0x2e,
              0x2b, 0x2d,
-            0x2b, 0x5a, 0x65, 0x56, 0x6e, 0x4c, 0x49, 0x71, 0x65
+            0x2b, 0x5a, 0x65, 0x56, 0x6e, 0x4c, 0x49, 0x71, 0x65, 0x2d
          };
          static const UChar unicode[] = {
              /*
@@ -945,7 +987,7 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
              0, 1, 2, 3, 4, 5, 6, 7, 8, 8, 8, 8, 8, 9, 10,
              11, 12, 12, 12, 13, 13, 13, 13, 14,
              15, 15,
-            16, 16, 16, 17, 17, 17, 18, 18, 18
+            16, 16, 16, 17, 17, 17, 18, 18, 18, 18
          };
  
          /* same but escaping set O (the exclamation mark) */
@@ -954,12 +996,12 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
                  Hi Mom -+Jjo--+ACE-
                  A+ImIDkQ.
                  +-
-                +ZeVnLIqe
+                +ZeVnLIqe-
              */
              0x48, 0x69, 0x20, 0x4d, 0x6f, 0x6d, 0x20, 0x2d, 0x2b, 0x4a, 0x6a, 0x6f, 0x2d, 0x2d, 0x2b, 0x41, 0x43, 0x45, 0x2d,
              0x41, 0x2b, 0x49, 0x6d, 0x49, 0x44, 0x6b, 0x51, 0x2e,
              0x2b, 0x2d,
-            0x2b, 0x5a, 0x65, 0x56, 0x6e, 0x4c, 0x49, 0x71, 0x65
+            0x2b, 0x5a, 0x65, 0x56, 0x6e, 0x4c, 0x49, 0x71, 0x65, 0x2d
          };
          static const int32_t toUnicodeOffsetsR[] = {
              0, 1, 2, 3, 4, 5, 6, 7, 9, 13, 15,
@@ -971,16 +1013,16 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
              0, 1, 2, 3, 4, 5, 6, 7, 8, 8, 8, 8, 8, 9, 10, 10, 10, 10, 10,
              11, 12, 12, 12, 13, 13, 13, 13, 14,
              15, 15,
-            16, 16, 16, 17, 17, 17, 18, 18, 18
+            16, 16, 16, 17, 17, 17, 18, 18, 18, 18
          };
  
-        testConvertFromU(unicode, sizeof(unicode)/U_SIZEOF_UCHAR, utf7, sizeof(utf7), "UTF-7", fromUnicodeOffsets,FALSE);
+        testConvertFromU(unicode, UPRV_LENGTHOF(unicode), utf7, sizeof(utf7), "UTF-7", fromUnicodeOffsets,FALSE);
  
-        testConvertToU(utf7, sizeof(utf7), unicode, sizeof(unicode)/U_SIZEOF_UCHAR, "UTF-7", toUnicodeOffsets,FALSE);
+        testConvertToU(utf7, sizeof(utf7), unicode, UPRV_LENGTHOF(unicode), "UTF-7", toUnicodeOffsets,FALSE);
  
-        testConvertFromU(unicode, sizeof(unicode)/U_SIZEOF_UCHAR, utf7Restricted, sizeof(utf7Restricted), "UTF-7,version=1", fromUnicodeOffsetsR,FALSE);
+        testConvertFromU(unicode, UPRV_LENGTHOF(unicode), utf7Restricted, sizeof(utf7Restricted), "UTF-7,version=1", fromUnicodeOffsetsR,FALSE);
  
-        testConvertToU(utf7Restricted, sizeof(utf7Restricted), unicode, sizeof(unicode)/U_SIZEOF_UCHAR, "UTF-7,version=1", toUnicodeOffsetsR,FALSE);
+        testConvertToU(utf7Restricted, sizeof(utf7Restricted), unicode, UPRV_LENGTHOF(unicode), "UTF-7,version=1", toUnicodeOffsetsR,FALSE);
      }
  
      /*
@@ -1054,9 +1096,9 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
              35, 36, 36, 36, 37, 37, 37, 37, 37
          };
  
-        testConvertFromU(unicode, sizeof(unicode)/U_SIZEOF_UCHAR, imap, sizeof(imap), "IMAP-mailbox-name", fromUnicodeOffsets,FALSE);
+        testConvertFromU(unicode, UPRV_LENGTHOF(unicode), imap, sizeof(imap), "IMAP-mailbox-name", fromUnicodeOffsets,FALSE);
  
-        testConvertToU(imap, sizeof(imap), unicode, sizeof(unicode)/U_SIZEOF_UCHAR, "IMAP-mailbox-name", toUnicodeOffsets,FALSE);
+        testConvertToU(imap, sizeof(imap), unicode, UPRV_LENGTHOF(unicode), "IMAP-mailbox-name", toUnicodeOffsets,FALSE);
      }
  
      /* Test UTF-8 bad data handling*/
@@ -1071,29 +1113,39 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
              0xf4, 0x8f, 0xbf, 0xbf,         /* 10FFFF */
              0xdf, 0xbf,                     /* 7ff */
              0xbf,                           /* truncated tail */
-            0xf4, 0x90, 0x80, 0x80,         /* 11FFFF */
+            0xf4, 0x90, 0x80, 0x80,         /* 110000 */
              0x02
          };
  
          static const uint16_t utf8Expected[]={
              0x0061,
-            0xfffd,
+            0xfffd, 0xfffd, 0xfffd, 0xfffd,
              0x0000,
              0x0062,
-            0xfffd,
-            0xfffd,
+            0xfffd, 0xfffd, 0xfffd, 0xfffd, 0xfffd,
+            0xfffd, 0xfffd, 0xfffd, 0xfffd, 0xfffd,
              0xdbff, 0xdfff,
              0x07ff,
              0xfffd,
-            0xfffd,
+            0xfffd, 0xfffd, 0xfffd, 0xfffd,
              0x0002
          };
  
          static const int32_t utf8Offsets[]={
-            0, 1, 5, 6, 7, 12, 17, 17, 21, 23, 24, 28
+            0,
+            1, 2, 3, 4,
+            5,
+            6,
+            7, 8, 9, 10, 11,
+            12, 13, 14, 15, 16,
+            17, 17,
+            21,
+            23,
+            24, 25, 26, 27,
+            28
          };
          testConvertToU(utf8, sizeof(utf8),
-                       utf8Expected, sizeof(utf8Expected)/sizeof(utf8Expected[0]), "utf-8", utf8Offsets ,FALSE);
+                       utf8Expected, UPRV_LENGTHOF(utf8Expected), "utf-8", utf8Offsets ,FALSE);
  
      }
  
@@ -1145,8 +1197,8 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
          };
  
          testConvertToU(utf32, sizeof(utf32),
-                       utf32Expected, sizeof(utf32Expected)/sizeof(utf32Expected[0]), "utf-32be", utf32Offsets ,FALSE);
-        testConvertFromU(utf32Expected, sizeof(utf32Expected)/sizeof(utf32Expected[0]),
+                       utf32Expected, UPRV_LENGTHOF(utf32Expected), "utf-32be", utf32Offsets ,FALSE);
+        testConvertFromU(utf32Expected, UPRV_LENGTHOF(utf32Expected),
              utf32ExpectedBack, sizeof(utf32ExpectedBack), "utf-32be", utf32OffsetsBack, FALSE);
      }
  
@@ -1198,8 +1250,8 @@ static void TestNewConvertWithBufferSizes(int32_t outsize, int32_t insize )
              8,8,8,8
          };
          testConvertToU(utf32, sizeof(utf32),
-            utf32Expected, sizeof(utf32Expected)/sizeof(utf32Expected[0]), "utf-32le", utf32Offsets,FALSE );
-        testConvertFromU(utf32Expected, sizeof(utf32Expected)/sizeof(utf32Expected[0]),
+            utf32Expected, UPRV_LENGTHOF(utf32Expected), "utf-32le", utf32Offsets,FALSE );
+        testConvertFromU(utf32Expected, UPRV_LENGTHOF(utf32Expected),
              utf32ExpectedBack, sizeof(utf32ExpectedBack), "utf-32le", utf32OffsetsBack, FALSE);
      }
  }
@@ -1236,7 +1288,7 @@ static void TestCoverageMBCS(){
          int32_t  totest1Offs[]        = { 0, 1, 2, 3, 5, };
  
          /*from Unicode*/
-        testConvertFromU(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]),
+        testConvertFromU(unicodeInput, UPRV_LENGTHOF(unicodeInput),
              expectedtest1, sizeof(expectedtest1), "@test1", totest1Offs,FALSE );
      }
  
@@ -1254,12 +1306,12 @@ static void TestCoverageMBCS(){
          int32_t fromtest3Offs[]       = { 0, 1, 2, 3, 6, 6, 7, 7, 10 };
  
          /*from Unicode*/
-        testConvertFromU(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]),
+        testConvertFromU(unicodeInput, UPRV_LENGTHOF(unicodeInput),
              expectedtest3, sizeof(expectedtest3), "@test3", totest3Offs,FALSE );
  
          /*to Unicode*/
          testConvertToU(test3input, sizeof(test3input),
-            expectedUnicode, sizeof(expectedUnicode)/sizeof(expectedUnicode[0]), "@test3", fromtest3Offs ,FALSE);
+            expectedUnicode, UPRV_LENGTHOF(expectedUnicode), "@test3", fromtest3Offs ,FALSE);
  
      }
  
@@ -1277,12 +1329,12 @@ static void TestCoverageMBCS(){
          static const int32_t fromtest4Offs[] = { 0, 1, 2, 3, 7, 7, 8, 8, 12,};
  
          /*from Unicode*/
-        testConvertFromU(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]),
+        testConvertFromU(unicodeInput, UPRV_LENGTHOF(unicodeInput),
              expectedtest4, sizeof(expectedtest4), "@test4", totest4Offs,FALSE );
  
          /*to Unicode*/
          testConvertToU(test4input, sizeof(test4input),
-            expectedUnicode, sizeof(expectedUnicode)/sizeof(expectedUnicode[0]), "@test4", fromtest4Offs,FALSE );
+            expectedUnicode, UPRV_LENGTHOF(expectedUnicode), "@test4", fromtest4Offs,FALSE );
  
      }
  #if 0
@@ -1416,7 +1468,7 @@ static void TestConverterTypesAndStarters()
  
  static void
  TestAmbiguousConverter(UConverter *cnv) {
-    static const char inBytes[2]={ 0x61, 0x5c };
+    static const char inBytes[3]={ 0x61, 0x5B, 0x5c };
      UChar outUnicode[20]={ 0, 0, 0, 0 };
  
      const char *s;
@@ -1424,34 +1476,36 @@ TestAmbiguousConverter(UConverter *cnv) {
      UErrorCode errorCode;
      UBool isAmbiguous;
  
-    /* try to convert an 'a' and a US-ASCII backslash */
+    /* try to convert an 'a', a square bracket and a US-ASCII backslash */
      errorCode=U_ZERO_ERROR;
      s=inBytes;
      u=outUnicode;
-    ucnv_toUnicode(cnv, &u, u+20, &s, s+2, NULL, TRUE, &errorCode);
+    ucnv_toUnicode(cnv, &u, u+20, &s, s+3, NULL, TRUE, &errorCode);
      if(U_FAILURE(errorCode)) {
          /* we do not care about general failures in this test; the input may just not be mappable */
          return;
      }
  
-    if(outUnicode[0]!=0x61 || outUnicode[1]==0xfffd) {
-        /* not an ASCII-family encoding, or 0x5c is unassigned/illegal: this test is not applicable */
+    if(outUnicode[0]!=0x61 || outUnicode[1]!=0x5B || outUnicode[2]==0xfffd) {
+        /* not a close ASCII-family encoding, or 0x5c is unassigned/illegal: this test is not applicable */
+        /* There are some encodings that are partially ASCII based,
+        like the ISO-7 and GSM series of codepages, which we ignore. */
          return;
      }
  
      isAmbiguous=ucnv_isAmbiguous(cnv);
  
      /* check that outUnicode[1]!=0x5c is exactly the same as ucnv_isAmbiguous() */
-    if((outUnicode[1]!=0x5c)!=isAmbiguous) {
+    if((outUnicode[2]!=0x5c)!=isAmbiguous) {
          log_err("error: converter \"%s\" needs a backslash fix: %d but ucnv_isAmbiguous()==%d\n",
-            ucnv_getName(cnv, &errorCode), outUnicode[1]!=0x5c, isAmbiguous);
+            ucnv_getName(cnv, &errorCode), outUnicode[2]!=0x5c, isAmbiguous);
          return;
      }
  
-    if(outUnicode[1]!=0x5c) {
+    if(outUnicode[2]!=0x5c) {
          /* needs fixup, fix it */
          ucnv_fixFileSeparator(cnv, outUnicode, (int32_t)(u-outUnicode));
-        if(outUnicode[1]!=0x5c) {
+        if(outUnicode[2]!=0x5c) {
              /* the fix failed */
              log_err("error: ucnv_fixFileSeparator(%s) failed\n", ucnv_getName(cnv, &errorCode));
              return;
@@ -1473,7 +1527,7 @@ static void TestAmbiguous()
          0
      };
      UChar asciiResult[200], sjisResult[200];
-    int32_t asciiLength = 0, sjisLength = 0, i;
+    int32_t /*asciiLength = 0,*/ sjisLength = 0, i;
      const char *name;
  
      /* enumerate all converters */
@@ -1504,7 +1558,7 @@ static void TestAmbiguous()
          return;
      }
      /* convert target from SJIS to Unicode */
-    sjisLength = ucnv_toUChars(sjis_cnv, sjisResult, sizeof(sjisResult)/U_SIZEOF_UCHAR, target, (int32_t)strlen(target), &status);
+    sjisLength = ucnv_toUChars(sjis_cnv, sjisResult, UPRV_LENGTHOF(sjisResult), target, (int32_t)strlen(target), &status);
      if (U_FAILURE(status))
      {
          log_err("Failed to convert the SJIS string.\n");
@@ -1513,11 +1567,10 @@ static void TestAmbiguous()
          return;
      }
      /* convert target from Latin-1 to Unicode */
-    asciiLength = ucnv_toUChars(ascii_cnv, asciiResult, sizeof(asciiResult)/U_SIZEOF_UCHAR, target, (int32_t)strlen(target), &status);
+    /*asciiLength =*/ ucnv_toUChars(ascii_cnv, asciiResult, UPRV_LENGTHOF(asciiResult), target, (int32_t)strlen(target), &status);
      if (U_FAILURE(status))
      {
          log_err("Failed to convert the Latin-1 string.\n");
-        free(sjisResult);
          ucnv_close(sjis_cnv);
          ucnv_close(ascii_cnv);
          return;
@@ -1525,8 +1578,6 @@ static void TestAmbiguous()
      if (!ucnv_isAmbiguous(sjis_cnv))
      {
          log_err("SJIS converter should contain ambiguous character mappings.\n");
-        free(sjisResult);
-        free(asciiResult);
          ucnv_close(sjis_cnv);
          ucnv_close(ascii_cnv);
          return;
@@ -1624,7 +1675,7 @@ TestSignatureDetection(){
          int32_t signatureLength = -1;
          const char* source = NULL;
          const char* enc = NULL;
-        for( ; i<sizeof(data)/sizeof(char*); i++){
+        for( ; i<UPRV_LENGTHOF(data); i++){
              err = U_ZERO_ERROR;
              source = data[i];
              enc = ucnv_detectUnicodeSignature(source, -1 , &signatureLength, &err);
@@ -1737,7 +1788,7 @@ TestSignatureDetection(){
          int32_t sourceLength=-1;
          const char* source = NULL;
          const char* enc = NULL;
-        for( ; i<sizeof(data)/sizeof(char*); i++){
+        for( ; i<UPRV_LENGTHOF(data); i++){
              err = U_ZERO_ERROR;
              source = data[i];
              sourceLength = len[i];
@@ -1759,8 +1810,7 @@ TestSignatureDetection(){
      }
  }
  
-void
-static TestUTF7() {
+static void TestUTF7() {
      /* test input */
      static const uint8_t in[]={
          /* H - +Jjo- - ! +- +2AHcAQ */
@@ -1790,7 +1840,7 @@ static TestUTF7() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("UTF-7", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a UTF-7 converter: %s\n", u_errorName(errorCode)); /* sholdn't be a data err */
+        log_data_err("Unable to open a UTF-7 converter: %s\n", u_errorName(errorCode));
          return;
      }
      TestNextUChar(cnv, source, limit, results, "UTF-7");
@@ -1803,8 +1853,7 @@ static TestUTF7() {
      ucnv_close(cnv);
  }
  
-void
-static TestIMAP() {
+static void TestIMAP() {
      /* test input */
      static const uint8_t in[]={
          /* H - &Jjo- - ! &- &2AHcAQ- \ */
@@ -1834,7 +1883,7 @@ static TestIMAP() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("IMAP-mailbox-name", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a IMAP-mailbox-name converter: %s\n", u_errorName(errorCode)); /* sholdn't be a data err */
+        log_data_err("Unable to open a IMAP-mailbox-name converter: %s\n", u_errorName(errorCode));
          return;
      }
      TestNextUChar(cnv, source, limit, results, "IMAP-mailbox-name");
@@ -1847,8 +1896,7 @@ static TestIMAP() {
      ucnv_close(cnv);
  }
  
-void
-static TestUTF8() {
+static void TestUTF8() {
      /* test input */
      static const uint8_t in[]={
          0x61,
@@ -1913,8 +1961,7 @@ static TestUTF8() {
      ucnv_close(cnv);
  }
  
-void
-static TestCESU8() {
+static void TestCESU8() {
      /* test input */
      static const uint8_t in[]={
          0x61,
@@ -1969,7 +2016,7 @@ static TestCESU8() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("CESU-8", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a CESU-8 converter: %s\n", u_errorName(errorCode));
+        log_data_err("Unable to open a CESU-8 converter: %s\n", u_errorName(errorCode));
          return;
      }
      TestNextUChar(cnv, source, limit, results, "CESU-8");
@@ -1985,8 +2032,7 @@ static TestCESU8() {
      ucnv_close(cnv);
  }
  
-void
-static TestUTF16() {
+static void TestUTF16() {
      /* test input */
      static const uint8_t in1[]={
          0xfe, 0xff, 0x4e, 0x00, 0xfe, 0xff
@@ -2044,8 +2090,7 @@ static TestUTF16() {
      ucnv_close(cnv);
  }
  
-void
-static TestUTF16BE() {
+static void TestUTF16BE() {
      /* test input */
      static const uint8_t in[]={
          0x00, 0x61,
@@ -2155,8 +2200,7 @@ TestUTF16LE() {
      ucnv_close(cnv);
  }
  
-void
-static TestUTF32() {
+static void TestUTF32() {
      /* test input */
      static const uint8_t in1[]={
          0x00, 0x00, 0xfe, 0xff,   0x00, 0x10, 0x0f, 0x00,   0x00, 0x00, 0xfe, 0xff
@@ -2192,7 +2236,7 @@ static TestUTF32() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("UTF-32", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a UTF-32 converter: %s\n", u_errorName(errorCode));
+        log_data_err("Unable to open a UTF-32 converter: %s\n", u_errorName(errorCode));
          return;
      }
  
@@ -2268,7 +2312,7 @@ TestUTF32BE() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("UTF-32BE", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a UTF-32BE converter: %s\n", u_errorName(errorCode));
+        log_data_err("Unable to open a UTF-32BE converter: %s\n", u_errorName(errorCode));
          return;
      }
      TestNextUChar(cnv, source, limit, results, "UTF-32BE");
@@ -2339,7 +2383,7 @@ TestUTF32LE() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("UTF-32LE", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a UTF-32LE converter: %s\n", u_errorName(errorCode));
+        log_data_err("Unable to open a UTF-32LE converter: %s\n", u_errorName(errorCode));
          return;
      }
      TestNextUChar(cnv, source, limit, results, "UTF-32LE");
@@ -2472,7 +2516,7 @@ TestLATIN1() {
      UErrorCode errorCode=U_ZERO_ERROR;
      UConverter *cnv=ucnv_open("LATIN_1", &errorCode);
      if(U_FAILURE(errorCode)) {
-        log_err("Unable to open a LATIN_1 converter: %s\n", u_errorName(errorCode));
+        log_data_err("Unable to open a LATIN_1 converter: %s\n", u_errorName(errorCode));
          return;
      }
      TestNextUChar(cnv, source, limit, results, "LATIN_1");
@@ -2605,7 +2649,7 @@ TestMBCS() {
      TestNextUCharError(cnv, source, source, U_INDEX_OUTOFBOUNDS_ERROR, "sourceLimit <= source");
      /*Test for the condition where there is an invalid character*/
      {
-        static const uint8_t source2[]={0xa1, 0x01};
+        static const uint8_t source2[]={0xa1, 0x80};
          TestNextUCharError(cnv, (const char*)source2, (const char*)source2+sizeof(source2), U_ZERO_ERROR, "an invalid character");
      }
      /*Test for the condition where we have a truncated char*/
@@ -2618,6 +2662,62 @@ TestMBCS() {
  
  }
  
+#if !UCONFIG_NO_LEGACY_CONVERSION && !UCONFIG_NO_FILE_IO
+/* Calls ucnv_getNextUChar() three times on a 3-byte ibm-1363 input; the third call must yield 0xFFFF with U_INDEX_OUTOFBOUNDS_ERROR. */
+static void TestICCRunout() {
+/*    { "ibm-1363", :bin{ a2aea2 }, "\u00a1\u001a", :intvector{ 0, 2 }, :int{1}, :int{0}, "\", "?", :bin{""} } */
+    /* NOTE(review): the line above looks like the conversion test-data entry this case was derived from - confirm. */
+    const char *cnvName = "ibm-1363";
+    UErrorCode status = U_ZERO_ERROR;
+    const char sourceData[] = { (char)0xa2, (char)0xae, (char)0xa2 };
+    /* UChar   expectUData[] = { 0x00a1, 0x001a }; */
+    const char *source = sourceData;
+    const char *sourceLim = sourceData+sizeof(sourceData);
+    UChar c1, c2, c3;
+    UConverter *cnv=ucnv_open(cnvName, &status);
+    if(U_FAILURE(status)) {
+        log_data_err("Unable to open %s converter: %s\n", cnvName, u_errorName(status));
+        return;
+    }
+
+#if 0
+    {
+    UChar   targetBuf[256];
+    UChar   *target = targetBuf;
+    UChar   *targetLim = target+256;
+    ucnv_toUnicode(cnv, &target, targetLim, &source, sourceLim, NULL, TRUE, &status);
+
+    log_info("After convert: target@%d, source@%d, status%s\n",
+            (int)(target-targetBuf), (int)(source-sourceData), u_errorName(status));
+
+    if(U_FAILURE(status)) {
+       log_err("Failed to convert: %s\n", u_errorName(status));
+    } else {
+       /* nothing to report on success */
+    }
+    }
+#endif
+    /* Pointer differences are ptrdiff_t; cast them to int so the argument matches the %d conversion. */
+    c1=ucnv_getNextUChar(cnv, &source, sourceLim, &status);
+    log_verbose("c1: U+%04X, source@%d, status %s\n", c1, (int)(source-sourceData), u_errorName(status));
+
+    c2=ucnv_getNextUChar(cnv, &source, sourceLim, &status);
+    log_verbose("c2: U+%04X, source@%d, status %s\n", c2, (int)(source-sourceData), u_errorName(status));
+
+    c3=ucnv_getNextUChar(cnv, &source, sourceLim, &status);
+    log_verbose("c3: U+%04X, source@%d, status %s\n", c3, (int)(source-sourceData), u_errorName(status));
+    /* status is never reset between the calls, so this inspects whatever it holds after the third call. */
+    if(status==U_INDEX_OUTOFBOUNDS_ERROR && c3==0xFFFF) {
+        log_verbose("OK\n");
+    } else {
+        log_err("FAIL: c3 was not FFFF or err was not U_INDEX_OUTOFBOUNDS_ERROR\n");
+    }
+
+    ucnv_close(cnv);
+
+}
+#endif
+
  #ifdef U_ENABLE_GENERIC_ISO_2022
  
  static void
@@ -2687,7 +2787,7 @@ TestSmallTargetBuffer(const uint16_t* source, const UChar* sourceLimit,UConverte
      char *cTarget;
      const char *cTargetLimit;
      char *cBuf;
-    UChar *uBuf,*test;
+    UChar *uBuf; /*,*test;*/
      int32_t uBufSize = 120;
      int len=0;
      int i=2;
@@ -2735,7 +2835,7 @@ TestSmallTargetBuffer(const uint16_t* source, const UChar* sourceLimit,UConverte
          }while(cSource<cSourceLimit);
  
          uSource = source;
-        test =uBuf;
+        /*test =uBuf;*/
          for(len=0;len<(int)(source - sourceLimit);len++){
              if(uBuf[len]!=uSource[len]){
                  log_err("Expected : \\u%04X \t Got: \\u%04X\n",uSource[len],(int)uBuf[len]) ;
@@ -2803,7 +2903,7 @@ static void TestSmallSourceBuffer(const uint16_t* source, const UChar* sourceLim
      char *cTarget;
      const char *cTargetLimit;
      char *cBuf;
-    UChar *uBuf,*test;
+    UChar *uBuf; /*,*test;*/
      int32_t uBufSize = 120;
      int len=0;
      int i=2;
@@ -2857,7 +2957,7 @@ static void TestSmallSourceBuffer(const uint16_t* source, const UChar* sourceLim
          }while(cSource<cTarget);
  
          uSource = source;
-        test =uBuf;
+        /*test =uBuf;*/
          for(;len<(int)(source - sourceLimit);len++){
              if(uBuf[len]!=uSource[len]){
                  log_err("Expected : \\u%04X \t Got: \\u%04X\n",uSource[len],(int)uBuf[len]) ;
@@ -2870,14 +2970,14 @@ static void TestSmallSourceBuffer(const uint16_t* source, const UChar* sourceLim
  static void
  TestGetNextUChar2022(UConverter* cnv, const char* source, const char* limit,
                       const uint16_t results[], const char* message){
-     const char* s0;
+/*     const char* s0; */
       const char* s=(char*)source;
       const uint16_t *r=results;
       UErrorCode errorCode=U_ZERO_ERROR;
       uint32_t c,exC;
       ucnv_reset(cnv);
       while(s<limit) {
-        s0=s;
+        /* s0=s; */
          c=ucnv_getNextUChar(cnv, &s, limit, &errorCode);
          if(errorCode==U_INDEX_OUTOFBOUNDS_ERROR) {
              break; /* no more significant input */
@@ -2885,9 +2985,9 @@ TestGetNextUChar2022(UConverter* cnv, const char* source, const char* limit,
              log_err("%s ucnv_getNextUChar() failed: %s\n", message, u_errorName(errorCode));
              break;
          } else {
-            if(UTF_IS_FIRST_SURROGATE(*r)){
+            if(U16_IS_LEAD(*r)){
                  int i =0, len = 2;
-                UTF_NEXT_CHAR_SAFE(r, i, len, exC, FALSE);
+                U16_NEXT(r, i, len, exC);
                  r++;
              }else{
                  exC = *r;
@@ -3011,7 +3111,7 @@ TestHZ() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 5);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -3040,9 +3140,9 @@ TestHZ() {
          test++;
      }
      TestGetNextUChar2022(cnv, cBuf, cTarget, in, "HZ encoding");
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestToAndFromUChars(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestToAndFromUChars(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      TestJitterbug930("csISO2022JP");
      ucnv_close(cnv);
      free(offsets);
@@ -3188,7 +3288,7 @@ TestISCII(){
          0xEF, 0x30,
  
      };
-    testConvertToU(byteArr,(sizeof(byteArr)),in,(sizeof(in)/U_SIZEOF_UCHAR),"x-iscii-de",NULL,TRUE);
+    testConvertToU(byteArr,(sizeof(byteArr)),in,UPRV_LENGTHOF(in),"x-iscii-de",NULL,TRUE);
      TestConv(in,(sizeof(in)/2),"ISCII,version=0","hindi", (char *)byteArr,sizeof(byteArr));    
  
  }
@@ -3201,7 +3301,7 @@ TestISO_2022_JP() {
          0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x004A, 0x000D, 0x000A,
          0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x000D, 0x000A,
          0x3005, 0x3006, 0x3007, 0x30FC, 0x2015, 0x2010, 0xFF0F, 0x005C, 0x000D, 0x000A,
-        0x301C, 0x2016, 0x2026, 0x2025, 0x2018, 0x2019, 0x201C, 0x000D, 0x000A,
+        0x3013, 0x2018, 0x2026, 0x2025, 0x2018, 0x2019, 0x201C, 0x000D, 0x000A,
          0x201D, 0x3014, 0x000D, 0x000A,
          0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A,
          0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A,
@@ -3230,7 +3330,7 @@ TestISO_2022_JP() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 5);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -3260,10 +3360,10 @@ TestISO_2022_JP() {
          test++;
      }
  
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      TestGetNextUChar2022(cnv, cBuf, cTarget, in, "ISO-2022-JP encoding");
-    TestToAndFromUChars(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestToAndFromUChars(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      TestJitterbug930("csISO2022JP");
      ucnv_close(cnv);
      free(uBuf);
@@ -3389,9 +3489,9 @@ unescape(UChar* dst, int32_t dstLen,const char* src,int32_t srcLen,UErrorCode *s
          }
          if(dstIndex < dstLen){
              if(c>0xFFFF){
-               dst[dstIndex++] = UTF16_LEAD(c);
+               dst[dstIndex++] = U16_LEAD(c);
                 if(dstIndex<dstLen){
-                    dst[dstIndex]=UTF16_TRAIL(c);
+                    dst[dstIndex]=U16_TRAIL(c);
                 }else{
                     *status=U_BUFFER_OVERFLOW_ERROR;
                 }
@@ -3429,8 +3529,8 @@ TestFullRoundtrip(const char* cp){
              usource[0] =(UChar) i;
              len=1;
          }else{
-            usource[0]=UTF16_LEAD(i);
-            usource[1]=UTF16_TRAIL(i);
+            usource[0]=U16_LEAD(i);
+            usource[1]=U16_TRAIL(i);
              len=2;
          }
          ulen=len;
@@ -3460,7 +3560,7 @@ TestFullRoundtrip(const char* cp){
  
  static void
  TestRoundTrippingAllUTF(void){
-    if(!QUICK){
+    if(!getTestOption(QUICK_OPTION)){
          log_verbose("Running exhaustive round trip test for BOCU-1\n");
          TestFullRoundtrip("BOCU-1");
          log_verbose("Running exhaustive round trip test for SCSU\n");
@@ -3487,8 +3587,19 @@ TestRoundTrippingAllUTF(void){
          TestFullRoundtrip("UTF-7,version=1");
          log_verbose("Running exhaustive round trip test for IMAP-mailbox-name\n");
          TestFullRoundtrip("IMAP-mailbox-name");
-        log_verbose("Running exhaustive round trip test for GB18030\n");
-        TestFullRoundtrip("GB18030");
+        /*
+         *
+         * With the update to GB18030 2005 (Ticket #8274), this test will fail because the 2005 version of
+         * GB18030 contains mappings to actual Unicode codepoints (which were previously mapped to PUA).
+         * The old mappings remain as fallbacks.
+         * This test may be reintroduced at a later time.
+         *
+         * 110118 - mow
+         */
+         /*
+         log_verbose("Running exhaustive round trip test for GB18030\n");
+         TestFullRoundtrip("GB18030");
+         */
      }
  }
  
@@ -3649,7 +3760,7 @@ TestSCSU() {
            "\\uf95b\\u2458\\u2468\\u0e20\\uf51b\\ue36e\\ubfc1\\u0080\\u02dd\\uf1b5\\u0cf3\\u6059\\u7489",
      };
      int i=0;
-    for(;i<sizeof(fTestCases)/sizeof(*fTestCases);i++){
+    for(;i<UPRV_LENGTHOF(fTestCases);i++){
          const char* cSrc = fTestCases[i];
          UErrorCode status = U_ZERO_ERROR;
          int32_t cSrcLen,srcLen;
@@ -3729,7 +3840,7 @@ TestISO_2022_JP_1() {
          0x52C8, 0x52CC, 0x52CF, 0x52D1, 0x52D4, 0x52D6, 0x52DB, 0x52DC, 0x000D, 0x000A,
          0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x000D, 0x000A,
          0x3005, 0x3006, 0x3007, 0x30FC, 0x2015, 0x2010, 0xFF0F, 0x005C, 0x000D, 0x000A,
-        0x301C, 0x2016, 0x2026, 0x2025, 0x2018, 0x2019, 0x201C, 0x000D, 0x000A,
+        0x3013, 0x2018, 0x2026, 0x2025, 0x2018, 0x2019, 0x201C, 0x000D, 0x000A,
          0x201D, 0x000D, 0x000A,
          0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A,
          0x4F94, 0x4F97, 0x52BA, 0x52BB, 0x52BD, 0x52C0, 0x52C4, 0x52C6, 0x000D, 0x000A,
@@ -3761,7 +3872,7 @@ TestISO_2022_JP_1() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 5);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -3796,8 +3907,8 @@ TestISO_2022_JP_1() {
          static const uint8_t source2[]={0x0e,0x24,0x053};
          TestNextUCharError(cnv, (const char*)source2, (const char*)source2+sizeof(source2), U_ZERO_ERROR, "an invalid character [ISO-2022-JP-1]");
      }
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      ucnv_close(cnv);
      free(uBuf);
      free(cBuf);
@@ -3851,7 +3962,7 @@ TestISO_2022_JP_2() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 5);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -3879,9 +3990,9 @@ TestISO_2022_JP_2() {
          uSource++;
          test++;
      }
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestToAndFromUChars(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestToAndFromUChars(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      /*Test for the condition where there is an invalid character*/
      ucnv_reset(cnv);
      {
@@ -3898,11 +4009,11 @@ static void
  TestISO_2022_KR() {
      /* test input */
      static const uint16_t in[]={
-                    0x9F4B,0x9F4E,0x9F52,0x9F5F,0x9F61,0x9F66,0x9F67,0x9F6A,0x000A,0x000D
-                   ,0x9F6C,0x9F77,0x9F8D,0x9F90,0x9F95,0x9F9C,0xAC00,0xAC01,0xAC02,0xAC04
+                    0x9F4B,0x9F4E,0x9F52,0x9F5F,0x9F61,0x9F67,0x9F6A,0x000A,0x000D
+                   ,0x9F6C,0x9F77,0x9F8D,0x9F90,0x9F95,0x9F9C,0xAC00,0xAC01,0xAC04
                     ,0xAC07,0xAC08,0xAC09,0x0025,0x0026,0x0027,0x000A,0x000D,0x0028,0x0029
                     ,0x002A,0x002B,0x002C,0x002D,0x002E,0x53C3,0x53C8,0x53C9,0x53CA,0x53CB
-                   ,0x53CD,0x53D4,0x53D6,0x53D7,0x53DB,0x000A,0x000D,0x53DF,0x53E1,0x53E2
+                   ,0x53CD,0x53D4,0x53D6,0x53D7,0x53DB,0x000A,0x000D,0x53E1,0x53E2
                     ,0x53E3,0x53E4,0x000A,0x000D};
      const UChar* uSource;
      const UChar* uSourceLimit;
@@ -3928,7 +4039,7 @@ TestISO_2022_KR() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 5);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -3956,9 +4067,9 @@ TestISO_2022_KR() {
          test++;
      }
      TestGetNextUChar2022(cnv, cBuf, cTarget, in, "ISO-2022-KR encoding");
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestToAndFromUChars(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestToAndFromUChars(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      TestJitterbug930("csISO2022KR");
      /*Test for the condition where there is an invalid character*/
      ucnv_reset(cnv);
@@ -4007,7 +4118,7 @@ TestISO_2022_KR_1() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 5);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -4036,10 +4147,10 @@ TestISO_2022_KR_1() {
      }
      ucnv_reset(cnv);
      TestGetNextUChar2022(cnv, cBuf, cTarget, in, "ISO-2022-KR encoding");
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      ucnv_reset(cnv);
-    TestToAndFromUChars(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestToAndFromUChars(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
          /*Test for the condition where there is an invalid character*/
      ucnv_reset(cnv);
      {
@@ -4156,15 +4267,19 @@ TestJIS(){
          };
  
          testConvertToU(sampleTextJIS,sizeof(sampleTextJIS),expectedISO2022JIS,
-            sizeof(expectedISO2022JIS)/sizeof(expectedISO2022JIS[0]),"JIS", toISO2022JISOffs,TRUE);
+            UPRV_LENGTHOF(expectedISO2022JIS),"JIS", toISO2022JISOffs,TRUE);
          testConvertToU(sampleTextJIS7,sizeof(sampleTextJIS7),expectedISO2022JIS7,
-            sizeof(expectedISO2022JIS7)/sizeof(expectedISO2022JIS7[0]),"JIS7", toISO2022JIS7Offs,TRUE);
+            UPRV_LENGTHOF(expectedISO2022JIS7),"JIS7", toISO2022JIS7Offs,TRUE);
          testConvertToU(sampleTextJIS8,sizeof(sampleTextJIS8),expectedISO2022JIS8,
-            sizeof(expectedISO2022JIS8)/sizeof(expectedISO2022JIS8[0]),"JIS8", toISO2022JIS8Offs,TRUE);
+            UPRV_LENGTHOF(expectedISO2022JIS8),"JIS8", toISO2022JIS8Offs,TRUE);
      }
  
  }
  
+
+#if 0
+ ICU 4.4 (ticket #7314) removes mappings for CNS 11643 planes 3..7
+
  static void TestJitterbug915(){
  /* tests for roundtripping of the below sequence
  \x1b$)G\x0E#!#"###$#%#&#'#(#)#*#+          / *plane 1 * /
@@ -4309,7 +4424,7 @@ TestISO_2022_CN_EXT() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 10);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -4339,8 +4454,8 @@ TestISO_2022_CN_EXT() {
          uSource++;
          test++;
      }
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      /*Test for the condition where there is an invalid character*/
      ucnv_reset(cnv);
      {
@@ -4352,6 +4467,7 @@ TestISO_2022_CN_EXT() {
      free(cBuf);
      free(offsets);
  }
+#endif
  
  static void
  TestISO_2022_CN() {
@@ -4407,7 +4523,7 @@ TestISO_2022_CN() {
      uBuf =  (UChar*)malloc(uBufSize * sizeof(UChar)*5);
      cBuf =(char*)malloc(uBufSize * sizeof(char) * 10);
      uSource = (const UChar*)in;
-    uSourceLimit=(const UChar*)in + (sizeof(in)/sizeof(in[0]));
+    uSourceLimit=(const UChar*)in + UPRV_LENGTHOF(in);
      cTarget = cBuf;
      cTargetLimit = cBuf +uBufSize*5;
      uTarget = uBuf;
@@ -4438,9 +4554,9 @@ TestISO_2022_CN() {
          test++;
      }
      TestGetNextUChar2022(cnv, cBuf, cTarget, in, "ISO-2022-CN encoding");
-    TestSmallTargetBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestSmallSourceBuffer(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
-    TestToAndFromUChars(in,(const UChar*)in + (sizeof(in)/sizeof(in[0])),cnv);
+    TestSmallTargetBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestSmallSourceBuffer(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
+    TestToAndFromUChars(in,(const UChar*)in + UPRV_LENGTHOF(in),cnv);
      TestJitterbug930("csISO2022CN");
      /*Test for the condition where there is an invalid character*/
      ucnv_reset(cnv);
@@ -4465,10 +4581,12 @@ typedef struct {
  /* Callback for TestJitterbug6175, should only get called for empty segment errors */
  static void UCNV_TO_U_CALLBACK_EMPTYSEGMENT( const void *context, UConverterToUnicodeArgs *toArgs, const char* codeUnits,
                                               int32_t length, UConverterCallbackReason reason, UErrorCode * err ) {
-    if (reason > UCNV_IRREGULAR)
+    if (reason > UCNV_IRREGULAR) {
          return;
-    if (reason != UCNV_IRREGULAR)
+    }
+    if (reason != UCNV_IRREGULAR) {
          log_err("toUnicode callback invoked for empty segment but reason is not UCNV_IRREGULAR\n");
+    }
      /* Standard stuff below from UCNV_TO_U_CALLBACK_SUBSTITUTE */
      *err = U_ZERO_ERROR;
      ucnv_cbToUWriteSub(toArgs,0,err);
@@ -4802,14 +4920,14 @@ TestLMBCS() {
  
         UChar Out [sizeof(pszUnicode) + 1];
         UChar * pOut = Out;
-       UChar * OutLimit = Out + sizeof(pszUnicode)/sizeof(UChar);
+       UChar * OutLimit = Out + UPRV_LENGTHOF(pszUnicode);
  
         int32_t off [sizeof(offsets)];
  
        /* last 'offset' in expected results is just the final size.
           (Makes other tests easier). Compensate here: */
  
-       off[(sizeof(offsets)/sizeof(offsets[0]))-1] = sizeof(pszLMBCS);
+       off[UPRV_LENGTHOF(offsets)-1] = sizeof(pszLMBCS);
  
  
  
@@ -4892,8 +5010,8 @@ TestLMBCS() {
  
        /* 0192 (hook) converts to both group 3 & group 1. input locale should differentiate */
        ucnv_fromUnicode (cnv16he,
-                        &pLMBCSIn, (pLMBCSIn + sizeof(lmbcsString)/sizeof(lmbcsString[0])),
-                        &pUniOut, pUniOut + sizeof(uniString)/sizeof(uniString[0]),
+                        &pLMBCSIn, (pLMBCSIn + UPRV_LENGTHOF(lmbcsString)),
+                        &pUniOut, pUniOut + UPRV_LENGTHOF(uniString),
                          NULL, 1, &errorCode);
  
        if (lmbcsString[0] != 0x3 || lmbcsString[1] != 0x83)
@@ -4904,8 +5022,8 @@ TestLMBCS() {
        pLMBCSIn= (char *)lmbcsString;
        pUniOut = uniString;
        ucnv_fromUnicode (cnv01us,
-                        &pLMBCSIn, (const char *)(lmbcsString + sizeof(lmbcsString)/sizeof(lmbcsString[0])),
-                        &pUniOut, pUniOut + sizeof(uniString)/sizeof(uniString[0]),
+                        &pLMBCSIn, (const char *)(lmbcsString + UPRV_LENGTHOF(lmbcsString)),
+                        &pUniOut, pUniOut + UPRV_LENGTHOF(uniString),
                          NULL, 1, &errorCode);
  
        if (lmbcsString[0] != 0x9F)
@@ -4972,7 +5090,7 @@ TestLMBCS() {
  
         UChar Out [sizeof(pszUnicode) + 1];
         UChar * pOut = Out;
-       UChar * OutLimit = Out + sizeof(pszUnicode)/sizeof(UChar);
+       UChar * OutLimit = Out + UPRV_LENGTHOF(pszUnicode);
  
  
         cnv = ucnv_open(NAME_LMBCS_1, &errorCode);
@@ -5033,11 +5151,14 @@ TestLMBCS() {
           errorCode=U_ZERO_ERROR;
  
           /* negative source request should always return U_ILLEGAL_ARGUMENT_ERROR */
-         ucnv_fromUnicode(cnv, &pLOut,pLOut+1,&pUIn,pUIn-1,off,FALSE, &errorCode);
+         pUIn++;
+         ucnv_fromUnicode(cnv, &pLOut, pLOut+1, &pUIn, pUIn-1, off, FALSE, &errorCode);
           if (errorCode != U_ILLEGAL_ARGUMENT_ERROR)
           {
              log_err("Unexpected Error on negative source request to ucnv_fromUnicode: %s\n", u_errorName(errorCode));
           }
+         pUIn--;
+         
           errorCode=U_ZERO_ERROR;
           ucnv_toUnicode(cnv, &pUOut,pUOut+1,(const char **)&pLIn,(const char *)(pLIn-1),off,FALSE, &errorCode);
           if (errorCode != U_ILLEGAL_ARGUMENT_ERROR)
@@ -5078,7 +5199,7 @@ TestLMBCS() {
           /* running out of target room : U_BUFFER_OVERFLOW_ERROR */
  
           pUIn = pszUnicode;
-         ucnv_fromUnicode(cnv, &pLOut,pLOut+offsets[4],&pUIn,pUIn+sizeof(pszUnicode)/sizeof(UChar),off,FALSE, &errorCode);
+         ucnv_fromUnicode(cnv, &pLOut,pLOut+offsets[4],&pUIn,pUIn+UPRV_LENGTHOF(pszUnicode),off,FALSE, &errorCode);
           if (errorCode != U_BUFFER_OVERFLOW_ERROR || pLOut != LOut + offsets[4] || pUIn != pszUnicode+4 )
           {
              log_err("Unexpected results on out of target room to ucnv_fromUnicode\n");
@@ -5106,7 +5227,7 @@ TestLMBCS() {
           pUOut = UOut;
  
           ucnv_setToUCallBack(cnv, UCNV_TO_U_CALLBACK_STOP, NULL, NULL, NULL, &errorCode);
-         ucnv_toUnicode(cnv, &pUOut,pUOut+sizeof(UOut)/sizeof(UChar),(const char **)&pLIn,(const char *)(pLIn+5),off,TRUE, &errorCode);
+         ucnv_toUnicode(cnv, &pUOut,pUOut+UPRV_LENGTHOF(UOut),(const char **)&pLIn,(const char *)(pLIn+5),off,TRUE, &errorCode);
           if (UOut[0] != 0xD801 || errorCode != U_TRUNCATED_CHAR_FOUND || pUOut != UOut + 1 || pLIn != LIn + 5)
           {
              log_err("Unexpected results on chopped low surrogate\n");
@@ -5120,7 +5241,7 @@ TestLMBCS() {
           errorCode = U_ZERO_ERROR;
           pUOut = UOut;
  
-         ucnv_toUnicode(cnv, &pUOut,pUOut+sizeof(UOut)/sizeof(UChar),(const char **)&pLIn,(const char *)(pLIn+3),off,TRUE, &errorCode);
+         ucnv_toUnicode(cnv, &pUOut,pUOut+UPRV_LENGTHOF(UOut),(const char **)&pLIn,(const char *)(pLIn+3),off,TRUE, &errorCode);
           if (UOut[0] != 0xD801 || U_FAILURE(errorCode) || pUOut != UOut + 1 || pLIn != LIn + 3)
           {
              log_err("Unexpected results on chopped at surrogate boundary \n");
@@ -5137,7 +5258,7 @@ TestLMBCS() {
           errorCode = U_ZERO_ERROR;
           pUOut = UOut;
  
-         ucnv_toUnicode(cnv, &pUOut,pUOut+sizeof(UOut)/sizeof(UChar),(const char **)&pLIn,(const char *)(pLIn+6),off,TRUE, &errorCode);
+         ucnv_toUnicode(cnv, &pUOut,pUOut+UPRV_LENGTHOF(UOut),(const char **)&pLIn,(const char *)(pLIn+6),off,TRUE, &errorCode);
           if (UOut[0] != 0xD801 || UOut[1] != 0xC9D0 || U_FAILURE(errorCode) || pUOut != UOut + 2 || pLIn != LIn + 6)
           {
              log_err("Unexpected results after unpaired surrogate plus valid Unichar \n");
@@ -5154,7 +5275,7 @@ TestLMBCS() {
           errorCode = U_ZERO_ERROR;
           pUOut = UOut;
  
-         ucnv_toUnicode(cnv, &pUOut,pUOut+sizeof(UOut)/sizeof(UChar),(const char **)&pLIn,(const char *)(pLIn+5),off,TRUE, &errorCode);
+         ucnv_toUnicode(cnv, &pUOut,pUOut+UPRV_LENGTHOF(UOut),(const char **)&pLIn,(const char *)(pLIn+5),off,TRUE, &errorCode);
           if (UOut[0] != 0xD801 || errorCode != U_TRUNCATED_CHAR_FOUND || pUOut != UOut + 1 || pLIn != LIn + 5)
           {
              log_err("Unexpected results after unpaired surrogate plus chopped Unichar \n");
@@ -5171,7 +5292,7 @@ TestLMBCS() {
           errorCode = U_ZERO_ERROR;
           pUOut = UOut;
  
-         ucnv_toUnicode(cnv, &pUOut,pUOut+sizeof(UOut)/sizeof(UChar),(const char **)&pLIn,(const char *)(pLIn+5),off,TRUE, &errorCode);
+         ucnv_toUnicode(cnv, &pUOut,pUOut+UPRV_LENGTHOF(UOut),(const char **)&pLIn,(const char *)(pLIn+5),off,TRUE, &errorCode);
           if (UOut[0] != 0xD801 || UOut[1] != 0x1B || U_FAILURE(errorCode) || pUOut != UOut + 2 || pLIn != LIn + 5)
           {
              log_err("Unexpected results after unpaired surrogate plus valid non-Unichar\n");
@@ -5187,7 +5308,7 @@ TestLMBCS() {
           errorCode = U_ZERO_ERROR;
           pUOut = UOut;
  
-         ucnv_toUnicode(cnv, &pUOut,pUOut+sizeof(UOut)/sizeof(UChar),(const char **)&pLIn,(const char *)(pLIn+4),off,TRUE, &errorCode);
+         ucnv_toUnicode(cnv, &pUOut,pUOut+UPRV_LENGTHOF(UOut),(const char **)&pLIn,(const char *)(pLIn+4),off,TRUE, &errorCode);
  
           if (UOut[0] != 0xD801 || errorCode != U_TRUNCATED_CHAR_FOUND || pUOut != UOut + 1 || pLIn != LIn + 4)
           {
@@ -5205,7 +5326,7 @@ static void TestJitterbug255()
      const char *testBuffer = (const char *)testBytes;
      const char *testEnd = (const char *)testBytes + sizeof(testBytes);
      UErrorCode status = U_ZERO_ERROR;
-    UChar32 result;
+    /*UChar32 result;*/
      UConverter *cnv = 0;
  
      cnv = ucnv_open("shift-jis", &status);
@@ -5215,7 +5336,7 @@ static void TestJitterbug255()
      }
      while (testBuffer != testEnd)
      {
-        result = ucnv_getNextUChar (cnv, &testBuffer, testEnd , &status);
+        /*result = */ucnv_getNextUChar (cnv, &testBuffer, testEnd , &status);
          if (U_FAILURE(status))
          {
              log_err("Failed to convert the next UChar for SJIS.\n");
@@ -5275,16 +5396,23 @@ static void TestJitterbug981(){
      int numNeeded=0;
      utf8cnv = ucnv_open ("utf8", &status);
      if(U_FAILURE(status)){
-        log_err("Could not open UTF-8 converter. Error: %s", u_errorName(status));
+        log_err("Could not open UTF-8 converter. Error: %s\n", u_errorName(status));
          return;
      }
      myCollator = ucol_open("zh", &status);
      if(U_FAILURE(status)){
-        log_err("Could not open collator for zh locale. Error: %s", u_errorName(status));
+        log_data_err("Could not open collator for zh locale. Error: %s\n", u_errorName(status));
+        ucnv_close(utf8cnv);
          return;
      }
  
      rules = ucol_getRules(myCollator, &rules_length);
+    if(rules_length == 0) {
+        log_data_err("missing zh tailoring rule string\n");
+        ucol_close(myCollator);
+        ucnv_close(utf8cnv);
+        return;
+    }
      buff_size = rules_length * ucnv_getMaxCharSize(utf8cnv);
      buff = malloc(buff_size);
  
@@ -5294,13 +5422,14 @@ static void TestJitterbug981(){
          status = U_ZERO_ERROR;
          if(target_cap >= buff_size) {
              log_err("wanted %d bytes, only %d available\n", target_cap, buff_size);
-            return;
+            break;
          }
          bytes_needed = ucnv_fromUChars(utf8cnv, buff, target_cap,
              rules, rules_length, &status);
          target_cap = (bytes_needed > target_cap) ? bytes_needed : target_cap +1;
          if(numNeeded!=0 && numNeeded!= bytes_needed){
              log_err("ucnv_fromUChars returns different values for required capacity in pre-flight and conversion modes");
+            break;
          }
          numNeeded = bytes_needed;
      } while (status == U_BUFFER_OVERFLOW_ERROR);
@@ -5311,6 +5440,7 @@ static void TestJitterbug981(){
  
  #endif
  
+#if !UCONFIG_NO_LEGACY_CONVERSION
  static void TestJitterbug1293(){
      static const UChar src[] = {0x30DE, 0x30A4, 0x5E83, 0x544A, 0x30BF, 0x30A4, 0x30D7,0x000};
      char target[256];
@@ -5338,4 +5468,146 @@ static void TestJitterbug1293(){
      }
      ucnv_close(conv);
  }
+#endif
+
+static void TestJB5275_1(){
+    /* Converts an ISCII byte string with the "iscii-gur" converter and compares the produced UChars with expected[]. */
+    static const char* data = "\x3B\xB3\x0A" /* Easy characters */
+                                "\xC0\xE9\xBF\xE9\xE8\xD8\x0A" /* Gurmukhi test */
+                                /* Switch script: */
+                                "\xEF\x43\xC0\xE9\xBF\xE9\xE8\xD8\x0A" /* Bengali test */
+                                "\x3B\xB3\x0A" /* Easy characters - new line, so should default!*/
+                                "\xEF\x40\x3B\xB3\x0A"; /* presumably \xEF\x40 selects the default script again (expected[] labels this group "Back to Gurmukhi") - confirm */
+    static const UChar expected[] ={ 
+            0x003b, 0x0a15, 0x000a, /* Easy characters */
+            0x0a5c, 0x0a4d, 0x0a39, 0x0a5c, 0x0a4d, 0x0a39, 0x000a, /* Gurmukhi test */
+            0x09dd, 0x09dc, 0x09cd, 0x09b9, 0x000a, /* Switch script: to Bengali*/ 
+            0x003b, 0x0a15, 0x000a, /* Easy characters - new line, so should default!*/
+            0x003b, 0x0a15, 0x000a /* Back to Gurmukhi*/
+    };
+    /* dest receives the converted output; target/targetLimit and source/sourceLimit bound the ucnv_toUnicode call. */
+    UErrorCode status = U_ZERO_ERROR;
+    UConverter* conv = ucnv_open("iscii-gur", &status);
+    UChar dest[100] = {'\0'};
+    UChar* target = dest;
+    UChar* targetLimit = dest+100;
+    const char* source = data;
+    const char* sourceLimit = data+strlen(data);
+    const UChar* exp = expected; /* read cursor into expected[], advanced in step with target below */
+    /* Without the converter nothing can be tested: report through log_data_err and return. */
+    if (U_FAILURE(status)) {
+        log_data_err("Unable to open converter: iscii-gur got errorCode: %s\n", u_errorName(status));
+        return;
+    }
+    /* Convert all of data in a single call (NULL offsets, flush=TRUE). */
+    log_verbose("Testing switching back to default script when new line is encountered.\n");
+    ucnv_toUnicode(conv, &target, targetLimit, &source, sourceLimit, NULL, TRUE, &status);
+    if(U_FAILURE(status)){ /* a failed conversion is logged, but the comparison below still runs on whatever was produced */
+        log_err("conversion failed: %s \n", u_errorName(status));
+    }
+    targetLimit = target; /* target was advanced by the conversion; it now marks the end of the produced output */
+    target = dest; /* rewind to the start of the output for the comparison */
+    printUSeq(target, (int)(targetLimit-target)); /* printUSeq is defined elsewhere; presumably it logs the sequence - confirm */
+    while(target<targetLimit){ /* NOTE(review): bounded by the produced length only; exp is never checked against the end of expected[] */
+        if(*exp!=*target){
+            log_err("did not get the expected output. \\u%04X != \\u%04X (got)\n", *exp, *target);
+        }
+        target++;
+        exp++;
+    }
+    ucnv_close(conv);
+}
+
+static void TestJB5275(){ /* Converts an ISCII byte string containing several \xEF script-switch sequences with the "iscii" converter and compares the output with expected[]. */
+    static const char* data = 
+    /* "\xEF\x42\xEF\x41\xA4\xD5\xE5\xB3\xEA\x0A"  unsupported sequence \xEF\x41 */
+    /* "\xEF\x42\xEF\x41\xD4\xDA\xB3\xE8\xEA\x0A"  unsupported sequence \xEF\x41  */
+    /* "\xEF\x44\xEF\x41\xC8\xE1\x8B\xDB\xB3\xE8 \xB3\xE4\xC1\xE8\x0A"  unsupported sequence \xEF\x41 */
+        "\xEF\x4B\xC0\xE9\xBF\xE9\xE8\xD8\x0A"  /* Gurmukhi test */
+        "\xEF\x4A\xC0\xD4\xBF\xD4\xE8\xD8\x0A"  /* Gujarati test */
+        "\xEF\x48\x38\xB3\x0A"  /* Kannada test */
+        "\xEF\x49\x39\xB3\x0A"  /* Malayalam test */
+        "\xEF\x4A\x3A\xB3\x0A"  /* Gujarati test */
+        "\xEF\x4B\x3B\xB3\x0A"  /* Punjabi test */
+        /* "\xEF\x4C\x3C\xB3\x0A"  unsupported sequence \xEF\x41 (NOTE(review): presumably \xEF\x4C is meant - confirm) */;
+    static const UChar expected[] ={ 
+        0x0A5C, 0x0A4D, 0x0A39, 0x0A5C, 0x0A4D, 0x0A39, 0x000A, /* Gurmukhi test */
+        0x0AA2, 0x0AB5, 0x0AA1, 0x0AB5, 0x0ACD, 0x0AB9, 0x000A,     /* Gujarati test */
+        0x0038, 0x0C95, 0x000A, /* Kannada test */
+        0x0039, 0x0D15, 0x000A, /* Malayalam test */
+        0x003A, 0x0A95, 0x000A, /* Gujarati test */
+        0x003B, 0x0A15, 0x000A, /* Punjabi test */
+    };
+    /* NOTE(review): the result of ucnv_open is not checked before converting; presumably ucnv_toUnicode does nothing when status already holds a failure - confirm. */
+    UErrorCode status = U_ZERO_ERROR;
+    UConverter* conv = ucnv_open("iscii", &status);
+    UChar dest[100] = {'\0'};
+    UChar* target = dest;
+    UChar* targetLimit = dest+100;
+    const char* source = data;
+    const char* sourceLimit = data+strlen(data);
+    const UChar* exp = expected; /* read cursor into expected[], advanced in step with target below */
+    ucnv_toUnicode(conv, &target, targetLimit, &source, sourceLimit, NULL, TRUE, &status); /* whole input in one call: NULL offsets, flush=TRUE */
+    if(U_FAILURE(status)){ /* the failure is logged, but the comparison below still runs on whatever was produced */
+        log_data_err("conversion failed: %s \n", u_errorName(status));
+    }
+    targetLimit = target; /* target was advanced by the conversion; it now marks the end of the produced output */
+    target = dest; /* rewind to the start of the output for the comparison */
+    /* printUSeq is defined elsewhere; presumably it logs the converted sequence - confirm. */
+    printUSeq(target, (int)(targetLimit-target));
+    /* NOTE(review): only the units actually produced are compared; exp is not bounded by the length of expected[]. */
+    while(target<targetLimit){
+        if(*exp!=*target){
+            log_err("did not get the expected output. \\u%04X != \\u%04X (got)\n", *exp, *target);
+        }
+        target++;
+        exp++;
+    }
+    ucnv_close(conv);
+}
+
+static void
+TestIsFixedWidth() { /* Checks the result of ucnv_isFixedWidth() for a list of converters expected to be fixed-width and a list expected not to be. */
+    UErrorCode status = U_ZERO_ERROR;
+    UConverter *cnv = NULL;
+    int32_t i;
+    /* Converter names for which ucnv_isFixedWidth() is expected to return TRUE. */
+    const char *fixedWidth[] = {
+            "US-ASCII",
+            "UTF32",
+            "ibm-5478_P100-1995"
+    };
+    /* Converter names for which ucnv_isFixedWidth() is expected to return FALSE. */
+    const char *notFixedWidth[] = {
+            "GB18030",
+            "UTF8",
+            "windows-949-2000",
+            "UTF16"
+    };
  
+    for (i = 0; i < UPRV_LENGTHOF(fixedWidth); i++) {
+        cnv = ucnv_open(fixedWidth[i], &status);
+        if (cnv == NULL || U_FAILURE(status)) {
+            log_data_err("Error open converter: %s - %s \n", fixedWidth[i], u_errorName(status));
+            continue; /* NOTE(review): status is not reset here, so a failure presumably carries over into the following ucnv_open calls - confirm */
+        }
+        /* NOTE(review): status is not examined after ucnv_isFixedWidth(); only its return value is tested. */
+        if (!ucnv_isFixedWidth(cnv, &status)) {
+            log_err("%s is a fixedWidth converter but returned FALSE.\n", fixedWidth[i]);
+        }
+        ucnv_close(cnv);
+    }
+    /* Same procedure with the inverted expectation for the notFixedWidth list. */
+    for (i = 0; i < UPRV_LENGTHOF(notFixedWidth); i++) {
+        cnv = ucnv_open(notFixedWidth[i], &status);
+        if (cnv == NULL || U_FAILURE(status)) {
+            log_data_err("Error open converter: %s - %s \n", notFixedWidth[i], u_errorName(status));
+            continue; /* NOTE(review): as above, status keeps its failure value for the next iteration */
+        }
+
+        if (ucnv_isFixedWidth(cnv, &status)) {
+            log_err("%s is NOT a fixedWidth converter but returned TRUE.\n", notFixedWidth[i]);
+        }
+        ucnv_close(cnv);
+    }
+}