Don't use native MSW functions in wxString::CmpNoCase().

author Vadim Zeitlin <vadim@wxwidgets.org>

Mon, 20 Sep 2010 12:52:26 +0000 (12:52 +0000)

committer Vadim Zeitlin <vadim@wxwidgets.org>

Mon, 20 Sep 2010 12:52:26 +0000 (12:52 +0000)
author Vadim Zeitlin <vadim@wxwidgets.org>
Mon, 20 Sep 2010 12:52:26 +0000 (12:52 +0000)
committer Vadim Zeitlin <vadim@wxwidgets.org>
Mon, 20 Sep 2010 12:52:26 +0000 (12:52 +0000)
diff --git a/src/common/string.cpp b/src/common/string.cpp

index a0d42cb42f520792cd1bd7191f3fc11d1a27dd68..96c9c526f4880c67ff1bee264db2a4650037f182 100644 (file)
--- a/src/common/string.cpp
+++ b/src/common/string.cpp
@@ -1083,40 +1083,63 @@ size_t wxString::find_last_not_of(const wxOtherCharType* sz, size_t nStart,
  
  int wxString::CmpNoCase(const wxString& s) const
  {
-#if defined(__WXMSW__) && !wxUSE_UNICODE_UTF8
-    // Prefer to use CompareString() if available as it's more efficient than
-    // doing it manually or even using wxStricmp() (see #10375)
-    //
-    // Also note that not using NORM_STRINGSORT may result in not having a
-    // strict weak ordering (e.g. s1 < s2 and s2 < s3 but s3 < s1) and so break
-    // algorithms such as std::sort that rely on it. It's also more consistent
-    // with the fall back version below.
-    switch ( ::CompareString(LOCALE_USER_DEFAULT,
-                             NORM_IGNORECASE | SORT_STRINGSORT,
-                             m_impl.c_str(), m_impl.length(),
-                             s.m_impl.c_str(), s.m_impl.length()) )
+#if !wxUSE_UNICODE_UTF8
+    // We compare NUL-delimited chunks of the strings inside the loop. We will
+    // do as many iterations as there are embedded NULs in the string, i.e.
+    // usually we will run it just once.
+
+    typedef const wxStringImpl::value_type *pchar_type;
+    const pchar_type thisBegin = m_impl.c_str();
+    const pchar_type thatBegin = s.m_impl.c_str();
+
+    const pchar_type thisEnd = thisBegin + m_impl.length();
+    const pchar_type thatEnd = thatBegin + s.m_impl.length();
+
+    pchar_type thisCur = thisBegin;
+    pchar_type thatCur = thatBegin;
+
+    int rc;
+    for ( ;; )
      {
-        case CSTR_LESS_THAN:
-            return -1;
+        // Compare until the next NUL, if the strings differ this is the final
+        // result.
+        rc = wxStricmp(thisCur, thatCur);
+        if ( rc )
+            break;
  
-        case CSTR_EQUAL:
-            return 0;
+        const size_t lenChunk = wxStrlen(thisCur);
+        thisCur += lenChunk;
+        thatCur += lenChunk;
  
-        case CSTR_GREATER_THAN:
-            return 1;
+        // Skip all the NULs as wxStricmp() doesn't handle them.
+        for ( ; !*thisCur; thisCur++, thatCur++ )
+        {
+            // Check if we exhausted either of the strings.
+            if ( thisCur == thisEnd )
+            {
+                // This one is exhausted, is the other one too?
+                return thatCur == thatEnd ? 0 : -1;
+            }
  
-        default:
-            wxFAIL_MSG( "unexpected CompareString() return value" );
-            // fall through
+            if ( thatCur == thatEnd )
+            {
+                // Because of the test above we know that this one is not
+                // exhausted yet so it's greater than the other one that is.
+                return 1;
+            }
  
-        case 0:
-            wxLogLastError("CompareString");
-            // use generic code below
+            if ( *thatCur )
+            {
+                // Anything non-NUL is greater than NUL.
+                return -1;
+            }
+        }
      }
-#endif // __WXMSW__ && !wxUSE_UNICODE_UTF8
  
-    // do the comparison manually: notice that we can't use wxStricmp() as it
-    // doesn't handle embedded NULs
+    return rc;
+#else // wxUSE_UNICODE_UTF8
+    // CRT functions can't be used for case-insensitive comparison of UTF-8
+    // strings so do it in the naive, simple and inefficient way.
  
      // FIXME-UTF8: use wxUniChar::ToLower/ToUpper once added
      const_iterator i1 = begin();
@@ -1140,6 +1163,7 @@ int wxString::CmpNoCase(const wxString& s) const
      else if ( len1 > len2 )
          return 1;
      return 0;
+#endif // !wxUSE_UNICODE_UTF8/wxUSE_UNICODE_UTF8
  }
  
  
diff --git a/tests/strings/strings.cpp b/tests/strings/strings.cpp

index b613cb65b02507e49548790ef74ef7027cac5fd1..16a72b7c6dfade46e3d54d7b070899e6b80506ed 100644 (file)
--- a/tests/strings/strings.cpp
+++ b/tests/strings/strings.cpp
@@ -455,6 +455,10 @@ void StringTestCase::Compare()
      CPPUNIT_ASSERT( s1 != neq2 );
      CPPUNIT_ASSERT( s1 != neq3 );
      CPPUNIT_ASSERT( s1 != neq4 );
+
+    CPPUNIT_ASSERT( wxString("\n").Cmp(" ") < 0 );
+    CPPUNIT_ASSERT( wxString("'").Cmp("!") > 0 );
+    CPPUNIT_ASSERT( wxString("!").Cmp("z") < 0 );
  }
  
  void StringTestCase::CompareNoCase()
@@ -502,6 +506,10 @@ void StringTestCase::CompareNoCase()
      CPPUNIT_CNCNEQ_ASSERT( s1, neq );
      CPPUNIT_CNCNEQ_ASSERT( s1, neq2 );
      CPPUNIT_CNCNEQ_ASSERT( s1, neq3 );
+
+    CPPUNIT_ASSERT( wxString("\n").CmpNoCase(" ") < 0 );
+    CPPUNIT_ASSERT( wxString("'").CmpNoCase("!") > 0);
+    CPPUNIT_ASSERT( wxString("!").Cmp("Z") < 0 );
  }
  
  void StringTestCase::Contains()
author	Vadim Zeitlin <vadim@wxwidgets.org>
	Mon, 20 Sep 2010 12:52:26 +0000 (12:52 +0000)
committer	Vadim Zeitlin <vadim@wxwidgets.org>
	Mon, 20 Sep 2010 12:52:26 +0000 (12:52 +0000)
src/common/string.cpp		patch | blob | blame | history
tests/strings/strings.cpp		patch | blob | blame | history