From 8f93a29f8e50aa9dc6076a900ad6d316fafddcc3 Mon Sep 17 00:00:00 2001
From: =?utf8?q?V=C3=A1clav=20Slav=C3=ADk?= <vslavik@fastmail.fm>
Date: Mon, 26 Mar 2007 20:28:04 +0000
Subject: [PATCH] Preparing wxString for UTF-8 representation: 1) split into
 wxStringImpl class that has std::string-like API and operates on char* or
 wchar_t* data and wxString class that provides Unicode iterators and indexes
 2) added both char* and wchar_t* versions of many wxString methods to avoid
 having to use _T()

git-svn-id: https://svn.wxwidgets.org/svn/wx/wxWidgets/trunk@45078 c3d73ce0-8a6f-49c7-b76d-6d57e0e08775
---
 include/wx/chartype.h    |   25 +
 include/wx/string.h      | 1596 +++++++++++++++++++++++++-------------
 include/wx/strvararg.h   |   20 +-
 src/common/string.cpp    |  801 ++++++++++++-------
 src/common/strvararg.cpp |    6 +-
 5 files changed, 1605 insertions(+), 843 deletions(-)
diff --git a/include/wx/chartype.h b/include/wx/chartype.h
index c73722946a..934e13d1bc 100644
--- a/include/wx/chartype.h
+++ b/include/wx/chartype.h
@@ -183,6 +183,31 @@
     #endif /* __WCHAR_TYPE__ */
 #endif /* ASCII/Unicode */
 
+/* ------------------------------------------------------------------------- */
+/* define wxStringCharType                                                   */
+/* ------------------------------------------------------------------------- */
+
+/* depending on the platform, a Unicode build can store wxStrings either as
+   wchar_t* or as UTF-8 encoded char*: */
+#if wxUSE_UNICODE
+    /* for now, all Unicode builds are wchar_t* based: */
+    #define wxUSE_UNICODE_WCHAR 1
+    #define wxUSE_UNICODE_UTF8  0
+#else
+    #define wxUSE_UNICODE_WCHAR 0
+    #define wxUSE_UNICODE_UTF8  0
+#endif
+
+/* define char type used by wxString internal representation: */
+#if wxUSE_UNICODE_UTF8
+    typedef char wxStringCharType;
+#elif wxUSE_UNICODE_WCHAR
+    typedef wchar_t wxStringCharType;
+#else
+    typedef char wxStringCharType;
+#endif
+
+
 /* ------------------------------------------------------------------------- */
 /* define _T() and related macros                                            */
 /* ------------------------------------------------------------------------- */
diff --git a/include/wx/string.h b/include/wx/string.h
index ae60ab5125..2bb59dc033 100644
--- a/include/wx/string.h
+++ b/include/wx/string.h
@@ -52,7 +52,6 @@
 #endif
 
 #include "wx/wxchar.h"      // for wxChar, wxStrlen() etc.
-#include "wx/unichar.h"
 #include "wx/strvararg.h"
 #include "wx/buffer.h"      // for wxCharBuffer
 #include "wx/strconv.h"     // for wxConvertXXX() macros and wxMBConv classes
@@ -83,7 +82,7 @@ class WXDLLIMPEXP_BASE wxString;
 // deprecated in favour of wxString::npos, don't use in new code
 //
 // maximum possible length for a string means "take all string" everywhere
-#define wxSTRING_MAXLEN wxStringBase::npos
+#define wxSTRING_MAXLEN wxString::npos
 
 #endif // WXWIN_COMPATIBILITY_2_6
 
@@ -180,12 +179,15 @@ inline int Stricmp(const char *psz1, const char *psz2)
 // FIXME-UTF8: using std::string as wxString base class is currently broken,
 //             so we use the standard wxString with std::string conversion
 //             enabled, this is API-compatible.
+#if 1
 #define wxUSE_STL_BASED_WXSTRING 0
 #if wxUSE_STL
     #undef wxUSE_STD_STRING
     #define wxUSE_STD_STRING 1
 #endif
-//#define wxUSE_STL_BASED_WXSTRING  wxUSE_STL
+#else
+#define wxUSE_STL_BASED_WXSTRING  wxUSE_STL
+#endif
 
 // in both cases we need to define wxStdString
 #if wxUSE_STL_BASED_WXSTRING || wxUSE_STD_STRING
@@ -194,7 +196,7 @@ inline int Stricmp(const char *psz1, const char *psz2)
 #include <string>
 #include "wx/afterstd.h"
 
-#if wxUSE_UNICODE
+#if wxUSE_UNICODE_WCHAR
     #ifdef HAVE_STD_WSTRING
         typedef std::wstring wxStdString;
     #else
@@ -208,23 +210,20 @@ inline int Stricmp(const char *psz1, const char *psz2)
 
 #if wxUSE_STL_BASED_WXSTRING
 
-    // we don't need an extra ctor from std::string when copy ctor already does
-    // the work
+    // we always want ctor from std::string when using std::string internally
     #undef wxUSE_STD_STRING
-    #define wxUSE_STD_STRING 0
+    #define wxUSE_STD_STRING 1
 
     #if (defined(__GNUG__) && (__GNUG__ < 3)) || \
         (defined(_MSC_VER) && (_MSC_VER <= 1200))
         #define wxSTRING_BASE_HASNT_CLEAR
     #endif
 
-    typedef wxStdString wxStringBase;
+    typedef wxStdString wxStringImpl;
 #else // if !wxUSE_STL_BASED_WXSTRING
 
-#if !defined(HAVE_STD_STRING_COMPARE) && \
-    (!defined(__WX_SETUP_H__) || wxUSE_STL_BASED_WXSTRING == 0)
-    #define HAVE_STD_STRING_COMPARE
-#endif
+// in non-STL mode, compare() is implemented in wxString and not wxStringImpl
+#undef HAVE_STD_STRING_COMPARE
 
 // ---------------------------------------------------------------------------
 // string data prepended with some housekeeping info (used by wxString class),
@@ -267,14 +266,15 @@ struct WXDLLIMPEXP_BASE wxStringData
   bool  IsValid() const   { return (nRefs != 0); }
 };
 
-class WXDLLIMPEXP_BASE wxStringBase
+class WXDLLIMPEXP_BASE wxStringImpl
 {
-public :
+public:
   // an 'invalid' value for string index, moved to this place due to a CW bug
   static const size_t npos;
+
 protected:
   // points to data preceded by wxStringData structure with ref count info
-  wxChar *m_pchData;
+  wxStringCharType *m_pchData;
 
   // accessor to string data
   wxStringData* GetStringData() const { return (wxStringData*)m_pchData - 1; }
@@ -282,9 +282,9 @@ protected:
   // string (re)initialization functions
     // initializes the string to the empty value (must be called only from
     // ctors, use Reinit() otherwise)
-  void Init() { m_pchData = (wxChar *)wxEmptyString; }
+  void Init() { m_pchData = (wxStringCharType *)wxEmptyString; }
     // initializes the string with (a part of) C-string
-  void InitWith(const wxChar *psz, size_t nPos = 0, size_t nLen = npos);
+  void InitWith(const wxStringCharType *psz, size_t nPos = 0, size_t nLen = npos);
     // as Init, but also frees old data
   void Reinit() { GetStringData()->Unlock(); Init(); }
 
@@ -292,11 +292,11 @@ protected:
     // allocates memory for string of length nLen
   bool AllocBuffer(size_t nLen);
     // effectively copies data to string
-  bool AssignCopy(size_t, const wxChar *);
+  bool AssignCopy(size_t, const wxStringCharType *);
 
   // append a (sub)string
-  bool ConcatSelf(size_t nLen, const wxChar *src, size_t nMaxLen);
-  bool ConcatSelf(size_t nLen, const wxChar *src)
+  bool ConcatSelf(size_t nLen, const wxStringCharType *src, size_t nMaxLen);
+  bool ConcatSelf(size_t nLen, const wxStringCharType *src)
     { return ConcatSelf(nLen, src, nLen); }
 
   // functions called before writing to the string: they copy it if there
@@ -306,179 +306,24 @@ protected:
 
     // compatibility with wxString
   bool Alloc(size_t nLen);
+
 public:
   // standard types
-  typedef wxUniChar value_type;
-  typedef wxUniChar char_type;
-  typedef wxUniCharRef reference;
-  typedef wxChar* pointer;
-  typedef const wxChar* const_pointer;
-
+  typedef wxStringCharType value_type;
+  typedef wxStringCharType char_type;
   typedef size_t size_type;
-  typedef wxUniChar const_reference;
-
-  #define WX_STR_ITERATOR_IMPL(iterator_name, pointer_type,                 \
-                               reference_type, reference_ctor)              \
-      public:                                                               \
-          typedef wxUniChar value_type;                                     \
-          typedef reference_type reference;                                 \
-          typedef pointer_type pointer;                                     \
-                                                                            \
-          iterator_name(const iterator_name& i) : m_cur(i.m_cur) {}         \
-                                                                            \
-          reference operator*() const { return reference_ctor; }            \
-                                                                            \
-          iterator_name& operator++()                                       \
-            { ++m_cur; return *this; }                                      \
-          iterator_name operator++(int)                                     \
-            { iterator_name tmp = *this; ++m_cur; return tmp; }             \
-          iterator_name& operator--()                                       \
-            { --m_cur; return *this; }                                      \
-          iterator_name operator--(int)                                     \
-            { iterator_name tmp = *this; --m_cur; return tmp; }             \
-                                                                            \
-          iterator_name operator+(int n) const                              \
-            { return iterator_name(m_cur + n); }                            \
-          iterator_name operator+(size_t n) const                           \
-            { return iterator_name(m_cur + n); }                            \
-          iterator_name operator-(int n) const                              \
-            { return iterator_name(m_cur - n); }                            \
-          iterator_name operator-(size_t n) const                           \
-            { return iterator_name(m_cur - n); }                            \
-          iterator_name operator+=(int n)                                   \
-            { m_cur += n; return *this; }                                   \
-          iterator_name operator+=(size_t n)                                \
-            { m_cur += n; return *this; }                                   \
-          iterator_name operator-=(int n)                                   \
-            { m_cur -= n; return *this; }                                   \
-          iterator_name operator-=(size_t n)                                \
-            { m_cur -= n; return *this; }                                   \
-                                                                            \
-          unsigned operator-(const iterator_name& i) const                  \
-            { return m_cur - i.m_cur; }                                     \
-                                                                            \
-          bool operator==(const iterator_name&i) const                      \
-            { return m_cur == i.m_cur; }                                    \
-          bool operator!=(const iterator_name& i) const                     \
-            { return m_cur != i.m_cur; }                                    \
-                                                                            \
-          bool operator<(const iterator_name& i) const                      \
-            { return m_cur < i.m_cur; }                                     \
-          bool operator>(const iterator_name& i) const                      \
-            { return m_cur > i.m_cur; }                                     \
-          bool operator<=(const iterator_name& i) const                     \
-            { return m_cur <= i.m_cur; }                                    \
-          bool operator>=(const iterator_name& i) const                     \
-            { return m_cur >= i.m_cur; }                                    \
-                                                                            \
-      protected:                                                            \
-          /* for internal wxString use only: */                             \
-          iterator_name(pointer ptr) : m_cur(ptr) {}                        \
-          operator pointer() const { return m_cur; }                        \
-                                                                            \
-          friend class WXDLLIMPEXP_BASE wxString;                           \
-          friend class WXDLLIMPEXP_BASE wxStringBase;                       \
-          friend class wxCStrData;                                          \
-                                                                            \
-      protected:                                                            \
-          pointer m_cur;
-
-  class const_iterator;
-
-  class iterator
-  {
-      WX_STR_ITERATOR_IMPL(iterator, wxChar*, wxUniCharRef,
-                           wxUniCharRef::CreateForString(m_cur))
-
-      friend class const_iterator;
-  };
-
-  class const_iterator
-  {
-      // NB: reference_type is intentionally value, not reference, the character
-      //     may be encoded differently in wxString data:
-      WX_STR_ITERATOR_IMPL(const_iterator, const wxChar*, wxUniChar,
-                           wxUniChar(*m_cur))
-
-  public:
-      const_iterator(const iterator& i) : m_cur(i.m_cur) {}
-  };
-
-  #undef WX_STR_ITERATOR
-
-  template <typename T>
-  class reverse_iterator_impl
-  {
-  public:
-      typedef T iterator_type;
-      typedef typename T::value_type value_type;
-      typedef typename T::reference reference;
-      typedef typename T::pointer *pointer;
-
-      reverse_iterator_impl(iterator_type i) : m_cur(i) {}
-      reverse_iterator_impl(const reverse_iterator_impl& ri)
-          : m_cur(ri.m_cur) {}
-
-      iterator_type base() const { return m_cur; }
-
-      reference operator*() const { return *(m_cur-1); }
-
-      reverse_iterator_impl& operator++()
-        { --m_cur; return *this; }
-      reverse_iterator_impl operator++(int)
-        { reverse_iterator_impl tmp = *this; --m_cur; return tmp; }
-      reverse_iterator_impl& operator--()
-        { ++m_cur; return *this; }
-      reverse_iterator_impl operator--(int)
-        { reverse_iterator_impl tmp = *this; ++m_cur; return tmp; }
-
-      reverse_iterator_impl operator+(int n) const
-        { return reverse_iterator_impl(m_cur - n); }
-      reverse_iterator_impl operator+(size_t n) const
-        { return reverse_iterator_impl(m_cur - n); }
-      reverse_iterator_impl operator-(int n) const
-        { return reverse_iterator_impl(m_cur + n); }
-      reverse_iterator_impl operator-(size_t n) const
-        { return reverse_iterator_impl(m_cur + n); }
-      reverse_iterator_impl operator+=(int n)
-        { m_cur -= n; return *this; }
-      reverse_iterator_impl operator+=(size_t n)
-        { m_cur -= n; return *this; }
-      reverse_iterator_impl operator-=(int n)
-        { m_cur += n; return *this; }
-      reverse_iterator_impl operator-=(size_t n)
-        { m_cur += n; return *this; }
-
-      unsigned operator-(const reverse_iterator_impl& i) const
-        { return i.m_cur - m_cur; }
-
-      bool operator==(const reverse_iterator_impl& ri) const
-        { return m_cur == ri.m_cur; }
-      bool operator!=(const reverse_iterator_impl& ri) const
-        { return !(*this == ri); }
-
-      bool operator<(const reverse_iterator_impl& i) const
-        { return m_cur > i.m_cur; }
-      bool operator>(const reverse_iterator_impl& i) const
-        { return m_cur < i.m_cur; }
-      bool operator<=(const reverse_iterator_impl& i) const
-        { return m_cur >= i.m_cur; }
-      bool operator>=(const reverse_iterator_impl& i) const
-        { return m_cur <= i.m_cur; }
-
-  private:
-      iterator_type m_cur;
-  };
-
-  typedef reverse_iterator_impl<iterator> reverse_iterator;
-  typedef reverse_iterator_impl<const_iterator> const_reverse_iterator;
-
+  typedef value_type& reference;
+  typedef const value_type& const_reference;
+  typedef value_type* pointer;
+  typedef const value_type* const_pointer;
+  typedef value_type *iterator;
+  typedef const value_type *const_iterator;
 
   // constructors and destructor
     // ctor for an empty string
-  wxStringBase() { Init(); }
+  wxStringImpl() { Init(); }
     // copy ctor
-  wxStringBase(const wxStringBase& stringSrc)
+  wxStringImpl(const wxStringImpl& stringSrc)
   {
     wxASSERT_MSG( stringSrc.GetStringData()->IsValid(),
                   _T("did you forget to call UngetWriteBuf()?") );
@@ -493,19 +338,15 @@ public:
     }
   }
     // string containing nRepeat copies of ch
-  wxStringBase(size_type nRepeat, wxUniChar ch);
+  wxStringImpl(size_type nRepeat, wxStringCharType ch);
     // ctor takes first nLength characters from C string
     // (default value of npos means take all the string)
-  wxStringBase(const wxChar *psz)
+  wxStringImpl(const wxStringCharType *psz)
       { InitWith(psz, 0, npos); }
-  wxStringBase(const wxChar *psz, size_t nLength)
-      { InitWith(psz, 0, nLength); }
-  wxStringBase(const wxChar *psz,
-               const wxMBConv& WXUNUSED(conv),
-               size_t nLength = npos)
+  wxStringImpl(const wxStringCharType *psz, size_t nLength)
       { InitWith(psz, 0, nLength); }
     // take nLen chars starting at nPos
-  wxStringBase(const wxStringBase& str, size_t nPos, size_t nLen)
+  wxStringImpl(const wxStringImpl& str, size_t nPos, size_t nLen)
   {
     wxASSERT_MSG( str.GetStringData()->IsValid(),
                   _T("did you forget to call UngetWriteBuf()?") );
@@ -514,10 +355,10 @@ public:
     InitWith(str.c_str(), nPos, nLen);
   }
     // take all characters from pStart to pEnd
-  wxStringBase(const void *pStart, const void *pEnd);
+  wxStringImpl(const void *pStart, const void *pEnd);
 
     // dtor is not virtual, this class must not be inherited from!
-  ~wxStringBase()
+  ~wxStringImpl()
   {
 #if defined(__VISUALC__) && (__VISUALC__ >= 1200)
       //RN - according to the above VC++ does indeed inline this,
@@ -534,11 +375,11 @@ public:
 #endif
   // overloaded assignment
     // from another wxString
-  wxStringBase& operator=(const wxStringBase& stringSrc);
+  wxStringImpl& operator=(const wxStringImpl& stringSrc);
     // from a character
-  wxStringBase& operator=(wxUniChar ch);
+  wxStringImpl& operator=(wxStringCharType ch);
     // from a C string
-  wxStringBase& operator=(const wxChar *psz);
+  wxStringImpl& operator=(const wxStringCharType *psz);
 
     // return the length of the string
   size_type length() const { return GetStringData()->nDataLength; }
@@ -547,7 +388,7 @@ public:
     // return the maximum size of the string
   size_type max_size() const { return npos; }
     // resize the string, filling the space with c if c != 0
-  void resize(size_t nSize, wxUniChar ch = wxT('\0'));
+  void resize(size_t nSize, wxStringCharType ch = '\0');
     // delete the contents of the string
   void clear() { erase(0, npos); }
     // returns true if the string is empty
@@ -565,47 +406,47 @@ public:
   {
     wxASSERT_VALID_INDEX( n );
     CopyBeforeWrite();
-    return wxUniCharRef::CreateForString(&m_pchData[n]);
-  }
+    return m_pchData[n];
+  } // FIXME-UTF8: not useful for us...?
 
   // lib.string.modifiers
     // append elements str[pos], ..., str[pos+n]
-  wxStringBase& append(const wxStringBase& str, size_t pos, size_t n)
+  wxStringImpl& append(const wxStringImpl& str, size_t pos, size_t n)
   {
     wxASSERT(pos <= str.length());
     ConcatSelf(n, str.c_str() + pos, str.length() - pos);
     return *this;
   }
     // append a string
-  wxStringBase& append(const wxStringBase& str)
+  wxStringImpl& append(const wxStringImpl& str)
     { ConcatSelf(str.length(), str.c_str()); return *this; }
     // append first n (or all if n == npos) characters of sz
-  wxStringBase& append(const wxChar *sz)
+  wxStringImpl& append(const wxStringCharType *sz)
     { ConcatSelf(wxStrlen(sz), sz); return *this; }
-  wxStringBase& append(const wxChar *sz, size_t n)
+  wxStringImpl& append(const wxStringCharType *sz, size_t n)
     { ConcatSelf(n, sz); return *this; }
     // append n copies of ch
-  wxStringBase& append(size_t n, wxUniChar ch);
+  wxStringImpl& append(size_t n, wxStringCharType ch);
     // append from first to last
-  wxStringBase& append(const_iterator first, const_iterator last)
+  wxStringImpl& append(const_iterator first, const_iterator last)
     { ConcatSelf(last - first, first); return *this; }
 
     // same as `this_string = str'
-  wxStringBase& assign(const wxStringBase& str)
+  wxStringImpl& assign(const wxStringImpl& str)
     { return *this = str; }
     // same as ` = str[pos..pos + n]
-  wxStringBase& assign(const wxStringBase& str, size_t pos, size_t n)
+  wxStringImpl& assign(const wxStringImpl& str, size_t pos, size_t n)
     { clear(); return append(str, pos, n); }
     // same as `= first n (or all if n == npos) characters of sz'
-  wxStringBase& assign(const wxChar *sz)
+  wxStringImpl& assign(const wxStringCharType *sz)
     { clear(); return append(sz, wxStrlen(sz)); }
-  wxStringBase& assign(const wxChar *sz, size_t n)
+  wxStringImpl& assign(const wxStringCharType *sz, size_t n)
     { clear(); return append(sz, n); }
     // same as `= n copies of ch'
-  wxStringBase& assign(size_t n, wxUniChar ch)
+  wxStringImpl& assign(size_t n, wxStringCharType ch)
     { clear(); return append(n, ch); }
     // assign from first to last
-  wxStringBase& assign(const_iterator first, const_iterator last)
+  wxStringImpl& assign(const_iterator first, const_iterator last)
     { clear(); return append(first, last); }
 
     // first valid index position
@@ -615,21 +456,14 @@ public:
   const_iterator end() const { return m_pchData + length(); }
   iterator end();
 
-    // first element of the reversed string
-  const_reverse_iterator rbegin() const { return const_reverse_iterator(end()); }
-  reverse_iterator rbegin() { return reverse_iterator(end()); }
-    // one beyond the end of the reversed string
-  const_reverse_iterator rend() const { return const_reverse_iterator(begin()); }
-  reverse_iterator rend() { return reverse_iterator(begin()); }
-
     // insert another string
-  wxStringBase& insert(size_t nPos, const wxStringBase& str)
+  wxStringImpl& insert(size_t nPos, const wxStringImpl& str)
   {
     wxASSERT( str.GetStringData()->IsValid() );
     return insert(nPos, str.c_str(), str.length());
   }
     // insert n chars of str starting at nStart (in str)
-  wxStringBase& insert(size_t nPos, const wxStringBase& str, size_t nStart, size_t n)
+  wxStringImpl& insert(size_t nPos, const wxStringImpl& str, size_t nStart, size_t n)
   {
     wxASSERT( str.GetStringData()->IsValid() );
     wxASSERT( nStart < str.length() );
@@ -638,19 +472,19 @@ public:
     return insert(nPos, str.c_str() + nStart, n);
   }
     // insert first n (or all if n == npos) characters of sz
-  wxStringBase& insert(size_t nPos, const wxChar *sz, size_t n = npos);
+  wxStringImpl& insert(size_t nPos, const wxStringCharType *sz, size_t n = npos);
     // insert n copies of ch
-  wxStringBase& insert(size_t nPos, size_t n, wxUniChar ch)
-    { return insert(nPos, wxStringBase(n, ch)); }
-  iterator insert(iterator it, wxUniChar ch)
+  wxStringImpl& insert(size_t nPos, size_t n, wxStringCharType ch)// FIXME-UTF8: tricky
+    { return insert(nPos, wxStringImpl(n, ch)); }
+  iterator insert(iterator it, wxStringCharType ch) // FIXME-UTF8: tricky
     { size_t idx = it - begin(); insert(idx, 1, ch); return begin() + idx; }
   void insert(iterator it, const_iterator first, const_iterator last)
     { insert(it - begin(), first, last - first); }
-  void insert(iterator it, size_type n, wxUniChar ch)
+  void insert(iterator it, size_type n, wxStringCharType ch)
     { insert(it - begin(), n, ch); }
 
     // delete characters from nStart to nStart + nLen
-  wxStringBase& erase(size_type pos = 0, size_type n = npos);
+  wxStringImpl& erase(size_type pos = 0, size_type n = npos);
   iterator erase(iterator first, iterator last)
   {
     size_t idx = first - begin();
@@ -660,138 +494,92 @@ public:
   iterator erase(iterator first);
 
   // explicit conversion to C string (use this with printf()!)
-  const wxChar* c_str() const { return m_pchData; }
-  const wxChar* data() const { return m_pchData; }
+  const wxStringCharType* c_str() const { return m_pchData; }
+  const wxStringCharType* data() const { return m_pchData; }
 
     // replaces the substring of length nLen starting at nStart
-  wxStringBase& replace(size_t nStart, size_t nLen, const wxChar* sz);
+  wxStringImpl& replace(size_t nStart, size_t nLen, const wxStringCharType* sz);
     // replaces the substring of length nLen starting at nStart
-  wxStringBase& replace(size_t nStart, size_t nLen, const wxStringBase& str)
+  wxStringImpl& replace(size_t nStart, size_t nLen, const wxStringImpl& str)
     { return replace(nStart, nLen, str.c_str()); }
     // replaces the substring with nCount copies of ch
-  wxStringBase& replace(size_t nStart, size_t nLen, size_t nCount, wxUniChar ch);
+  wxStringImpl& replace(size_t nStart, size_t nLen, size_t nCount, wxStringCharType ch);
     // replaces a substring with another substring
-  wxStringBase& replace(size_t nStart, size_t nLen,
-                        const wxStringBase& str, size_t nStart2, size_t nLen2);
+  wxStringImpl& replace(size_t nStart, size_t nLen,
+                        const wxStringImpl& str, size_t nStart2, size_t nLen2);
     // replaces the substring with first nCount chars of sz
-  wxStringBase& replace(size_t nStart, size_t nLen,
-                        const wxChar* sz, size_t nCount);
-  wxStringBase& replace(iterator first, iterator last, const_pointer s)
+  wxStringImpl& replace(size_t nStart, size_t nLen,
+                        const wxStringCharType* sz, size_t nCount);
+  wxStringImpl& replace(iterator first, iterator last, const_pointer s)
     { return replace(first - begin(), last - first, s); }
-  wxStringBase& replace(iterator first, iterator last, const_pointer s,
+  wxStringImpl& replace(iterator first, iterator last, const_pointer s,
                         size_type n)
     { return replace(first - begin(), last - first, s, n); }
-  wxStringBase& replace(iterator first, iterator last, const wxStringBase& s)
+  wxStringImpl& replace(iterator first, iterator last, const wxStringImpl& s)
     { return replace(first - begin(), last - first, s); }
-  wxStringBase& replace(iterator first, iterator last, size_type n, wxUniChar c)
+  wxStringImpl& replace(iterator first, iterator last, size_type n, wxStringCharType c)
     { return replace(first - begin(), last - first, n, c); }
-  wxStringBase& replace(iterator first, iterator last,
+  wxStringImpl& replace(iterator first, iterator last,
                         const_iterator first1, const_iterator last1)
     { return replace(first - begin(), last - first, first1, last1 - first1); }
 
     // swap two strings
-  void swap(wxStringBase& str);
+  void swap(wxStringImpl& str);
 
     // All find() functions take the nStart argument which specifies the
     // position to start the search on, the default value is 0. All functions
     // return npos if there were no match.
 
     // find a substring
-  size_t find(const wxStringBase& str, size_t nStart = 0) const;
+  size_t find(const wxStringImpl& str, size_t nStart = 0) const;
 
     // find first n characters of sz
-  size_t find(const wxChar* sz, size_t nStart = 0, size_t n = npos) const;
+  size_t find(const wxStringCharType* sz, size_t nStart = 0, size_t n = npos) const;
 
     // find the first occurence of character ch after nStart
-  size_t find(wxUniChar ch, size_t nStart = 0) const;
+  size_t find(wxStringCharType ch, size_t nStart = 0) const;
 
     // rfind() family is exactly like find() but works right to left
 
     // as find, but from the end
-  size_t rfind(const wxStringBase& str, size_t nStart = npos) const;
+  size_t rfind(const wxStringImpl& str, size_t nStart = npos) const;
 
     // as find, but from the end
-  size_t rfind(const wxChar* sz, size_t nStart = npos,
+  size_t rfind(const wxStringCharType* sz, size_t nStart = npos,
                size_t n = npos) const;
     // as find, but from the end
-  size_t rfind(wxUniChar ch, size_t nStart = npos) const;
-
-    // find first/last occurence of any character in the set
-
-    // as strpbrk() but starts at nStart, returns npos if not found
-  size_t find_first_of(const wxStringBase& str, size_t nStart = 0) const
-    { return find_first_of(str.c_str(), nStart); }
-    // same as above
-  size_t find_first_of(const wxChar* sz, size_t nStart = 0) const;
-  size_t find_first_of(const wxChar* sz, size_t nStart, size_t n) const;
-    // same as find(char, size_t)
-  size_t find_first_of(wxUniChar c, size_t nStart = 0) const
-    { return find(c, nStart); }
-    // find the last (starting from nStart) char from str in this string
-  size_t find_last_of (const wxStringBase& str, size_t nStart = npos) const
-    { return find_last_of(str.c_str(), nStart); }
-    // same as above
-  size_t find_last_of (const wxChar* sz, size_t nStart = npos) const;
-  size_t find_last_of(const wxChar* sz, size_t nStart, size_t n) const;
-    // same as above
-  size_t find_last_of(wxUniChar c, size_t nStart = npos) const
-    { return rfind(c, nStart); }
+  size_t rfind(wxStringCharType ch, size_t nStart = npos) const;
 
-    // find first/last occurence of any character not in the set
-
-    // as strspn() (starting from nStart), returns npos on failure
-  size_t find_first_not_of(const wxStringBase& str, size_t nStart = 0) const
-    { return find_first_not_of(str.c_str(), nStart); }
-    // same as above
-  size_t find_first_not_of(const wxChar* sz, size_t nStart = 0) const;
-  size_t find_first_not_of(const wxChar* sz, size_t nStart, size_t n) const;
-    // same as above
-  size_t find_first_not_of(wxUniChar ch, size_t nStart = 0) const;
-    //  as strcspn()
-  size_t find_last_not_of(const wxStringBase& str, size_t nStart = npos) const
-    { return find_last_not_of(str.c_str(), nStart); }
-    // same as above
-  size_t find_last_not_of(const wxChar* sz, size_t nStart = npos) const;
-  size_t find_last_not_of(const wxChar* sz, size_t nStart, size_t n) const;
-    // same as above
-  size_t find_last_not_of(wxUniChar ch, size_t nStart = npos) const;
-
-    // All compare functions return -1, 0 or 1 if the [sub]string is less,
-    // equal or greater than the compare() argument.
-
-    // comparison with another string
-  int compare(const wxStringBase& str) const;
-    // comparison with a substring
-  int compare(size_t nStart, size_t nLen, const wxStringBase& str) const;
-    // comparison of 2 substrings
-  int compare(size_t nStart, size_t nLen,
-              const wxStringBase& str, size_t nStart2, size_t nLen2) const;
-    // comparison with a c string
-  int compare(const wxChar* sz) const;
-    // substring comparison with first nCount characters of sz
-  int compare(size_t nStart, size_t nLen,
-              const wxChar* sz, size_t nCount = npos) const;
-
-  size_type copy(wxChar* s, size_type n, size_type pos = 0);
+  size_type copy(wxStringCharType* s, size_type n, size_type pos = 0);
 
   // substring extraction
-  wxStringBase substr(size_t nStart = 0, size_t nLen = npos) const;
+  wxStringImpl substr(size_t nStart = 0, size_t nLen = npos) const;
 
       // string += string
-  wxStringBase& operator+=(const wxStringBase& s) { return append(s); }
+  wxStringImpl& operator+=(const wxStringImpl& s) { return append(s); }
       // string += C string
-  wxStringBase& operator+=(const wxChar *psz) { return append(psz); }
+  wxStringImpl& operator+=(const wxStringCharType *psz) { return append(psz); }
       // string += char
-  wxStringBase& operator+=(wxUniChar ch) { return append(1, ch); }
-  wxStringBase& operator+=(wxUniCharRef ch) { return append(1, ch); }
-  wxStringBase& operator+=(char ch) { return append(1, ch); }
-  wxStringBase& operator+=(wchar_t ch) { return append(1, ch); }
+  wxStringImpl& operator+=(wxStringCharType ch) { return append(1, ch); }
+
+#if !wxUSE_UNICODE_UTF8
+  // helpers for wxStringBuffer and wxStringBufferLength
+  wxStringCharType *DoGetWriteBuf(size_t nLen);
+  void DoUngetWriteBuf();
+  void DoUngetWriteBuf(size_t nLen);
+#endif
+
+  friend class WXDLLIMPEXP_BASE wxString;
 };
 
+#endif // !wxUSE_STL_BASED_WXSTRING
+
 // don't pollute the library user's name space
 #undef wxASSERT_VALID_INDEX
 
-#endif // !wxUSE_STL_BASED_WXSTRING
+// wx/unichar.h needs wxStringImpl to be declared, so it can only be included
+// here (unichar.h includes string.h itself when not included from string.h):
+#include "wx/unichar.h"
 
 // ----------------------------------------------------------------------------
 // wxCStrData
@@ -938,14 +726,20 @@ protected:
     #pragma warning (disable:4275)
 #endif
 
-class WXDLLIMPEXP_BASE wxString : public wxStringBase
+class WXDLLIMPEXP_BASE wxString
 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
-                                 ,public wxStringPrintfMixin
+                                : public wxStringPrintfMixin
 #endif
 {
   // NB: special care was taken in arranging the member functions in such order
   //     that all inline functions can be effectively inlined, verify that all
   //     performance critical functions are still inlined if you change order!
+public:
+#if !wxUSE_STL_BASED_WXSTRING
+  // an 'invalid' value for string index, moved to this place due to a CW bug
+  static const size_t npos;
+#endif
+
 private:
   // if we hadn't made these operators private, it would be possible to
   // compile "wxString s; s = 17;" without any warnings as 17 is implicitly
@@ -956,94 +750,461 @@ private:
   //     ambiguity between operator=(char) and operator=(int)
   wxString& operator=(int);
 
-  // these methods are not implemented - there is _no_ conversion from int to
-  // string, you're doing something wrong if the compiler wants to call it!
-  //
-  // try `s << i' or `s.Printf("%d", i)' instead
-  wxString(int);
+  // these methods are not implemented - there is _no_ conversion from int to
+  // string, you're doing something wrong if the compiler wants to call it!
+  //
+  // try `s << i' or `s.Printf("%d", i)' instead
+  wxString(int);
+
+
+  // buffer for holding temporary substring when using any of the methods
+  // that take (char*,size_t) or (wchar_t*,size_t) arguments:
+  // FIXME-UTF8: This will need changes when UTF8 build is introduced
+  template<typename T>
+  struct SubstrBufFromType
+  {
+      T data;
+      size_t len;
+
+      SubstrBufFromType() {}
+      SubstrBufFromType(const T& data_, size_t len_)
+          : data(data_), len(len_) {}
+  };
+
+#if wxUSE_UNICODE_UTF8
+  // FIXME-UTF8: this will have to use slightly different type
+#elif wxUSE_UNICODE_WCHAR
+  typedef SubstrBufFromType<const wchar_t*>  SubstrBufFromWC;
+  typedef SubstrBufFromType<wxWCharBuffer>   SubstrBufFromMB;
+  typedef SubstrBufFromWC SubstrBufFrom;
+#else
+  typedef SubstrBufFromType<const char*>     SubstrBufFromMB;
+  typedef SubstrBufFromType<wxCharBuffer>    SubstrBufFromWC;
+  typedef SubstrBufFromMB SubstrBufFrom;
+#endif
+
+
+  // Functions implementing primitive operations on string data; wxString
+  // methods and iterators are implemented in terms of it. The differences
+  // between UTF-8 and wchar_t* representations of the string are mostly
+  // contained here.
+
+#if wxUSE_UNICODE
+  // FIXME-UTF8: This will need changes when UTF8 build is introduced
+  static SubstrBufFromMB ConvertStr(const char *psz, size_t nLength,
+                                const wxMBConv& conv);
+#else
+  static SubstrBufFromWC ConvertStr(const wchar_t *pwz, size_t nLength,
+                                const wxMBConv& conv);
+#endif
+
+#if !wxUSE_UNICODE_UTF8 // wxUSE_UNICODE_WCHAR or !wxUSE_UNICODE
+  // returns C string encoded as the implementation expects (version for
+  // the same char type as used internally)
+  static const wxStringCharType* ImplStr(const wxStringCharType* str)
+    { return str; }
+  static const SubstrBufFrom ImplStr(const wxStringCharType* str, size_t n)
+    { return SubstrBufFrom(str, n); }
+  #if wxUSE_UNICODE
+  // returns C string encoded as the implementation expects (version for
+  // the other char type than the one used internally)
+  static wxWCharBuffer ImplStr(const char* str)
+    { return ConvertStr(str, npos, wxConvLibc).data; }
+  static SubstrBufFromMB ImplStr(const char* str, size_t n)
+    { return ConvertStr(str, n, wxConvLibc); }
+  #else
+  static wxCharBuffer ImplStr(const wchar_t* str)
+    { return ConvertStr(str, npos, wxConvLibc).data; }
+  static SubstrBufFromWC ImplStr(const wchar_t* str, size_t n)
+    { return ConvertStr(str, n, wxConvLibc); }
+  #endif
+
+  // moves the iterator to the next Unicode character
+  static void IncIter(wxStringImpl::iterator& i) { ++i; }
+  static void IncIter(wxStringImpl::const_iterator& i) { ++i; }
+  // moves the iterator to the previous Unicode character
+  static void DecIter(wxStringImpl::iterator& i) { --i; }
+  static void DecIter(wxStringImpl::const_iterator& i) { --i; }
+  // moves the iterator by n Unicode characters
+  static wxStringImpl::iterator AddToIter(wxStringImpl::iterator i, int n)
+    { return i + n; }
+  static wxStringImpl::const_iterator AddToIter(wxStringImpl::const_iterator i, int n)
+    { return i + n; }
+  // returns distance of the two iterators in Unicode characters
+  static int DiffIters(wxStringImpl::iterator i1, wxStringImpl::iterator i2)
+    { return i1 - i2; }
+  static int DiffIters(wxStringImpl::const_iterator i1, wxStringImpl::const_iterator i2)
+    { return i1 - i2; }
+
+  // encodes the character to a form used to represent it in internal
+  // representation (returns a string in UTF8 version)
+  static wxChar EncodeChar(wxUniChar ch) { return (wxChar)ch; }
+
+  // translates position index in wxString to/from index in underlying
+  // wxStringImpl:
+  static size_t PosToImpl(size_t pos) { return pos; }
+  static void PosLenToImpl(size_t pos, size_t len,
+                           size_t *implPos, size_t *implLen)
+    { *implPos = pos; *implLen = len; }
+  static size_t PosFromImpl(size_t pos) { return pos; }
+
+#else // wxUSE_UNICODE_UTF8
+
+  typedef char Utf8CharBuffer[5];
+  static Utf8CharBuffer EncodeChar(wxUniChar ch);
+  // returns n copies of ch encoded in UTF-8 string
+  static wxCharBuffer EncodeNChars(size_t n, wxUniChar ch);
+
+  size_t PosToImpl(size_t pos) const
+  {
+      if ( pos == 0 || pos == npos )
+          return pos;
+      else
+          return wxStringImpl::const_iterator(begin() + pos) - m_impl.begin();
+  }
+
+  size_t PosFromImpl(size_t pos) const
+  {
+      if ( pos == 0 || pos == npos )
+          return pos;
+      else
+          return const_iterator(m_impl.begin() + pos) - begin();
+  }
+
+  // FIXME: return as-is without copying under UTF8 locale, return
+  //        converted string under other locales - needs wxCharBuffer
+  //        changes
+  static wxCharBuffer ImplStr(const char* str);
+
+  static wxCharBuffer ImplStr(const wchar_t* str)
+      { return wxConvUTF8.cWC2MB(str); }
+#endif // !wxUSE_UNICODE_UTF8/wxUSE_UNICODE_UTF8
+
+
+public:
+  // constructors and destructor
+    // ctor for an empty string
+  wxString() {}
+    // copy ctor
+  wxString(const wxStringImpl& stringSrc) : m_impl(stringSrc) { }
+  wxString(const wxString& stringSrc) : m_impl(stringSrc) { }
+    // string containing nRepeat copies of ch
+  wxString(wxUniChar ch, size_t nRepeat = 1)
+      : m_impl(nRepeat, ch) { }
+  wxString(size_t nRepeat, wxUniChar ch)
+      : m_impl(nRepeat, ch) { }
+  wxString(wxUniCharRef ch, size_t nRepeat = 1)
+      : m_impl(nRepeat, ch) { }
+  wxString(size_t nRepeat, wxUniCharRef ch)
+      : m_impl(nRepeat, ch) { }
+  wxString(char ch, size_t nRepeat = 1)
+      : m_impl(nRepeat, ch) { }
+  wxString(size_t nRepeat, char ch)
+      : m_impl(nRepeat, ch) { }
+  wxString(wchar_t ch, size_t nRepeat = 1)
+      : m_impl(nRepeat, ch) { }
+  wxString(size_t nRepeat, wchar_t ch)
+      : m_impl(nRepeat, ch) { }
+    // ctor takes first nLength characters from C string
+    // (default value of npos means take all the string)
+  wxString(const wxChar *psz)
+      : m_impl(psz ? psz : wxT("")) { }
+  wxString(const wxChar *psz, size_t nLength)
+      : m_impl(psz, nLength) { }
+  wxString(const wxChar *psz,
+           const wxMBConv& WXUNUSED(conv),
+           size_t nLength = npos)
+      : m_impl(psz, nLength == npos ? wxStrlen(psz) : nLength) { }
+
+  // even if we're not built with wxUSE_STL == 1 it is very convenient to allow
+  // implicit conversions from std::string to wxString as this allows to use
+  // the same strings in non-GUI and GUI code, however we don't want to
+  // unconditionally add this ctor as it would make wx lib dependent on
+  // libstdc++ on some Linux versions which is bad, so instead we ask the
+  // client code to define this wxUSE_STD_STRING symbol if they need it
+#if wxUSE_STD_STRING
+  wxString(const wxStdString& s)
+      : m_impl(s.c_str()) { }
+#endif // wxUSE_STD_STRING
+
+#if wxUSE_UNICODE
+    // from multibyte string
+  wxString(const char *psz,
+           const wxMBConv& conv = wxConvLibc,
+           size_t nLength = npos);
+    // from multibyte string for ANSI compatibility, with wxConvLibc
+  wxString(const char *psz, size_t nLength);
+    // from wxWCharBuffer (i.e. return from wxGetString)
+  wxString(const wxWCharBuffer& psz) : m_impl(psz.data()) { }
+#else // ANSI
+    // from C string (for compilers using unsigned char)
+  wxString(const unsigned char* psz)
+      : m_impl((const char*)psz) { }
+    // from part of C string (for compilers using unsigned char)
+  wxString(const unsigned char* psz, size_t nLength)
+      : m_impl((const char*)psz, nLength) { }
+
+#if wxUSE_WCHAR_T
+    // from wide (Unicode) string
+  wxString(const wchar_t *pwz,
+           const wxMBConv& conv = wxConvLibc,
+           size_t nLength = npos);
+    // from wide string for Unicode compatibility, with wxConvLibc
+  wxString(const wchar_t *pwz, size_t nLength);
+#endif // wxUSE_WCHAR_T
+
+    // from wxCharBuffer
+  wxString(const wxCharBuffer& psz)
+      : m_impl(psz) { }
+#endif // Unicode/ANSI
+
+    // as we provide both ctors with this signature for both char and unsigned
+    // char string, we need to provide one for wxCStrData to resolve ambiguity
+  wxString(const wxCStrData& cstr, size_t nLength)
+    { assign(cstr.AsString(), nLength); }
+
+    // and because wxString is convertible to wxCStrData and const wxChar *
+    // we also need to provide this one
+  wxString(const wxString& str, size_t nLength)
+    { assign(str, nLength); }
+
+public:
+  // standard types
+  typedef wxUniChar value_type;
+  typedef wxUniChar char_type;
+  typedef wxUniCharRef reference;
+  typedef wxChar* pointer;
+  typedef const wxChar* const_pointer;
+
+  typedef size_t size_type;
+  typedef wxUniChar const_reference;
+
+  #define WX_STR_ITERATOR_IMPL(iterator_name, pointer_type,                 \
+                               reference_type, reference_ctor)              \
+      private:                                                              \
+          typedef wxStringImpl::iterator_name underlying_iterator;          \
+      public:                                                               \
+          typedef wxUniChar value_type;                                     \
+          typedef reference_type reference;                                 \
+          typedef pointer_type pointer;                                     \
+                                                                            \
+          iterator_name(const iterator_name& i) : m_cur(i.m_cur) {}         \
+                                                                            \
+          reference operator*() const { return reference_ctor; }            \
+                                                                            \
+          iterator_name& operator++()                                       \
+            { wxString::IncIter(m_cur); return *this; }                     \
+          iterator_name& operator--()                                       \
+            { wxString::DecIter(m_cur); return *this; }                     \
+          iterator_name operator++(int)                                     \
+          {                                                                 \
+              iterator_name tmp = *this;                                    \
+              wxString::IncIter(m_cur);                                     \
+              return tmp;                                                   \
+          }                                                                 \
+          iterator_name operator--(int)                                     \
+          {                                                                 \
+              iterator_name tmp = *this;                                    \
+              wxString::DecIter(m_cur);                                     \
+              return tmp;                                                   \
+          }                                                                 \
+                                                                            \
+          iterator_name operator+(int n) const                              \
+            { return iterator_name(wxString::AddToIter(m_cur, n)); }        \
+          iterator_name operator+(size_t n) const                           \
+            { return iterator_name(wxString::AddToIter(m_cur, (int)n)); }   \
+          iterator_name operator-(int n) const                              \
+            { return iterator_name(wxString::AddToIter(m_cur, -n)); }       \
+          iterator_name operator-(size_t n) const                           \
+            { return iterator_name(wxString::AddToIter(m_cur, -(int)n)); }  \
+          iterator_name& operator+=(int n) /* returns *this, not a copy */  \
+            { m_cur = wxString::AddToIter(m_cur, n); return *this; }        \
+          iterator_name& operator+=(size_t n)                               \
+            { m_cur = wxString::AddToIter(m_cur, (int)n); return *this; }   \
+          iterator_name& operator-=(int n)                                  \
+            { m_cur = wxString::AddToIter(m_cur, -n); return *this; }       \
+          iterator_name& operator-=(size_t n)                               \
+            { m_cur = wxString::AddToIter(m_cur, -(int)n); return *this; }  \
+                                                                            \
+          unsigned operator-(const iterator_name& i) const                  \
+            { return wxString::DiffIters(m_cur, i.m_cur); }                 \
+                                                                            \
+          bool operator==(const iterator_name&i) const                      \
+            { return m_cur == i.m_cur; }                                    \
+          bool operator!=(const iterator_name& i) const                     \
+            { return m_cur != i.m_cur; }                                    \
+                                                                            \
+          bool operator<(const iterator_name& i) const                      \
+            { return m_cur < i.m_cur; }                                     \
+          bool operator>(const iterator_name& i) const                      \
+            { return m_cur > i.m_cur; }                                     \
+          bool operator<=(const iterator_name& i) const                     \
+            { return m_cur <= i.m_cur; }                                    \
+          bool operator>=(const iterator_name& i) const                     \
+            { return m_cur >= i.m_cur; }                                    \
+                                                                            \
+      private:                                                              \
+          /* for internal wxString use only: */                             \
+          iterator_name(underlying_iterator ptr) : m_cur(ptr) {}            \
+          operator underlying_iterator() const { return m_cur; }            \
+                                                                            \
+          friend class WXDLLIMPEXP_BASE wxString;                           \
+          friend class WXDLLIMPEXP_BASE wxStringImpl;                       \
+          friend class WXDLLIMPEXP_BASE wxCStrData;                         \
+                                                                            \
+      private:                                                              \
+          underlying_iterator m_cur;
+
+  class const_iterator;
+
+  class iterator
+  {
+      WX_STR_ITERATOR_IMPL(iterator, wxChar*, wxUniCharRef,
+                           wxUniCharRef::CreateForString(m_cur))
+
+      friend class const_iterator;
+  };
+
+  class const_iterator
+  {
+      // NB: reference_type is intentionally value, not reference, the character
+      //     may be encoded differently in wxString data:
+      WX_STR_ITERATOR_IMPL(const_iterator, const wxChar*, wxUniChar,
+                           wxUniChar(*m_cur))
+
+  public:
+      const_iterator(const iterator& i) : m_cur(i.m_cur) {}
+  };
+
+  #undef WX_STR_ITERATOR_IMPL
+
+  friend class iterator;
+  friend class const_iterator;
+
+  template <typename T>
+  class reverse_iterator_impl // adapts iterator type T to walk backwards
+  {
+  public:
+      typedef T iterator_type;
+      typedef typename T::value_type value_type;
+      typedef typename T::reference reference;
+      typedef typename T::pointer *pointer; // NOTE(review): extra '*' intended?
+      // m_cur holds the forward iterator one past the element referred to:
+      reverse_iterator_impl(iterator_type i) : m_cur(i) {}
+      reverse_iterator_impl(const reverse_iterator_impl& ri)
+          : m_cur(ri.m_cur) {}
+
+      iterator_type base() const { return m_cur; }
+      // the element referred to is the one just before base():
+      reference operator*() const { return *(m_cur-1); }
+      // advancing in reverse order moves the wrapped iterator backwards:
+      reverse_iterator_impl& operator++()
+        { --m_cur; return *this; }
+      reverse_iterator_impl operator++(int)
+        { reverse_iterator_impl tmp = *this; --m_cur; return tmp; }
+      reverse_iterator_impl& operator--()
+        { ++m_cur; return *this; }
+      reverse_iterator_impl operator--(int)
+        { reverse_iterator_impl tmp = *this; ++m_cur; return tmp; }
+      // arithmetic is mirrored; compound forms return *this by reference:
+      reverse_iterator_impl operator+(int n) const
+        { return reverse_iterator_impl(m_cur - n); }
+      reverse_iterator_impl operator+(size_t n) const
+        { return reverse_iterator_impl(m_cur - n); }
+      reverse_iterator_impl operator-(int n) const
+        { return reverse_iterator_impl(m_cur + n); }
+      reverse_iterator_impl operator-(size_t n) const
+        { return reverse_iterator_impl(m_cur + n); }
+      reverse_iterator_impl& operator+=(int n)
+        { m_cur -= n; return *this; }
+      reverse_iterator_impl& operator+=(size_t n)
+        { m_cur -= n; return *this; }
+      reverse_iterator_impl& operator-=(int n)
+        { m_cur += n; return *this; }
+      reverse_iterator_impl& operator-=(size_t n)
+        { m_cur += n; return *this; }
+
+      unsigned operator-(const reverse_iterator_impl& i) const
+        { return i.m_cur - m_cur; }
+
+      bool operator==(const reverse_iterator_impl& ri) const
+        { return m_cur == ri.m_cur; }
+      bool operator!=(const reverse_iterator_impl& ri) const
+        { return !(*this == ri); }
+
+      bool operator<(const reverse_iterator_impl& i) const
+        { return m_cur > i.m_cur; }
+      bool operator>(const reverse_iterator_impl& i) const
+        { return m_cur < i.m_cur; }
+      bool operator<=(const reverse_iterator_impl& i) const
+        { return m_cur >= i.m_cur; }
+      bool operator>=(const reverse_iterator_impl& i) const
+        { return m_cur <= i.m_cur; }
+
+  private:
+      iterator_type m_cur;
+  };
 
-public:
-  // constructors and destructor
-    // ctor for an empty string
-  wxString() : wxStringBase() { }
-    // copy ctor
-  wxString(const wxStringBase& stringSrc) : wxStringBase(stringSrc) { }
-  wxString(const wxString& stringSrc) : wxStringBase(stringSrc) { }
-    // string containing nRepeat copies of ch
-  wxString(wxUniChar ch, size_t nRepeat = 1)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(size_t nRepeat, wxUniChar ch)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(wxUniCharRef ch, size_t nRepeat = 1)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(size_t nRepeat, wxUniCharRef ch)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(char ch, size_t nRepeat = 1)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(size_t nRepeat, char ch)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(wchar_t ch, size_t nRepeat = 1)
-      : wxStringBase(nRepeat, ch) { }
-  wxString(size_t nRepeat, wchar_t ch)
-      : wxStringBase(nRepeat, ch) { }
-    // ctor takes first nLength characters from C string
-    // (default value of npos means take all the string)
-  wxString(const wxChar *psz)
-      : wxStringBase(psz ? psz : wxT("")) { }
-  wxString(const wxChar *psz, size_t nLength)
-      : wxStringBase(psz, nLength) { }
-  wxString(const wxChar *psz,
-           const wxMBConv& WXUNUSED(conv),
-           size_t nLength = npos)
-      : wxStringBase(psz, nLength == npos ? wxStrlen(psz) : nLength) { }
+  typedef reverse_iterator_impl<iterator> reverse_iterator;
+  typedef reverse_iterator_impl<const_iterator> const_reverse_iterator;
 
-  // even if we're not built with wxUSE_STL == 1 it is very convenient to allow
-  // implicit conversions from std::string to wxString as this allows to use
-  // the same strings in non-GUI and GUI code, however we don't want to
-  // unconditionally add this ctor as it would make wx lib dependent on
-  // libstdc++ on some Linux versions which is bad, so instead we ask the
-  // client code to define this wxUSE_STD_STRING symbol if they need it
-#if wxUSE_STD_STRING
-  wxString(const wxStdString& s)
-      : wxStringBase(s.c_str()) { }
-#endif // wxUSE_STD_STRING
+  // first valid index position
+  const_iterator begin() const { return const_iterator(m_impl.begin()); }
+  iterator begin() { return iterator(m_impl.begin()); }
+  // position one after the last valid one
+  const_iterator end() const { return const_iterator(m_impl.end()); }
+  iterator end() { return iterator(m_impl.end()); }
+
+  // first element of the reversed string
+  const_reverse_iterator rbegin() const
+    { return const_reverse_iterator(end()); }
+  reverse_iterator rbegin()
+    { return reverse_iterator(end()); }
+  // one beyond the end of the reversed string
+  const_reverse_iterator rend() const
+    { return const_reverse_iterator(begin()); }
+  reverse_iterator rend()
+    { return reverse_iterator(begin()); }
+
+  // std::string methods:
+#if wxUSE_UNICODE_UTF8
+  size_t length() const { return end() - begin(); } // FIXME-UTF8: optimize!
+#else
+  size_t length() const { return m_impl.length(); }
+#endif
 
-#if wxUSE_UNICODE
-    // from multibyte string
-  wxString(const char *psz,
-           const wxMBConv& conv = wxConvLibc,
-           size_t nLength = npos);
-    // from wxWCharBuffer (i.e. return from wxGetString)
-  wxString(const wxWCharBuffer& psz) : wxStringBase(psz.data()) { }
-#else // ANSI
-    // from C string (for compilers using unsigned char)
-  wxString(const unsigned char* psz)
-      : wxStringBase((const char*)psz) { }
-    // from part of C string (for compilers using unsigned char)
-  wxString(const unsigned char* psz, size_t nLength)
-      : wxStringBase((const char*)psz, nLength) { }
+  size_type size() const { return length(); }
+  size_type max_size() const { return npos; }
 
-    // as we provide both ctors with this signature for both char and unsigned
-    // char string, we need to provide one for wxCStrData to resolve ambiguity
-  wxString(const wxCStrData& cstr, size_t nLength)
-      : wxStringBase(cstr.AsChar(), nLength) { }
+  bool empty() const { return m_impl.empty(); }
 
-    // and because wxString is convertible to wxCStrData and const wxChar *
-    // we also need to provide this one
-  wxString(const wxString& str, size_t nLength)
-      : wxStringBase(str, 0, nLength) { }
+  size_type capacity() const { return m_impl.capacity(); } // FIXME-UTF8
+  void reserve(size_t sz) { m_impl.reserve(sz); } // FIXME-UTF8
 
-#if wxUSE_WCHAR_T
-    // from wide (Unicode) string
-  wxString(const wchar_t *pwz,
-           const wxMBConv& conv = wxConvLibc,
-           size_t nLength = npos);
-#endif // !wxUSE_WCHAR_T
+  void resize(size_t nSize, wxUniChar ch = wxT('\0'))
+  {
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+    {
+        size_t len = length();
+        if ( nSize == len)
+            return;
+        else if ( nSize < len )
+            erase(nSize);
+        else
+            append(nSize - len, ch);
+    }
+    else
+#endif
+        m_impl.resize(nSize, (wxStringCharType)ch);
+  }
 
-    // from wxCharBuffer
-  wxString(const wxCharBuffer& psz)
-      : wxStringBase(psz) { }
-#endif // Unicode/ANSI
+  wxString substr(size_t nStart = 0, size_t nLen = npos) const
+  {
+    size_t pos, len;
+    PosLenToImpl(nStart, nLen, &pos, &len);
+    return m_impl.substr(pos, len);
+  }
 
   // generic attributes & operations
     // as standard strlen()
@@ -1078,9 +1239,13 @@ public:
 
   // data access (all indexes are 0 based)
     // read access
+    wxUniChar at(size_t n) const
+      { return *(begin() + n); } // FIXME-UTF8: optimize?
     wxUniChar GetChar(size_t n) const
       { return at(n); }
     // read/write access
+    wxUniCharRef at(size_t n)
+      { return *(begin() + n); } // FIXME-UTF8: optimize?
     wxUniCharRef GetWritableChar(size_t n)
       { return at(n); }
     // write access
@@ -1088,7 +1253,7 @@ public:
       { at(n) = ch; }
 
     // get last character
-    wxUniChar  Last() const
+    wxUniChar Last() const
       {
           wxASSERT_MSG( !empty(), _T("wxString: index out of bounds") );
 
@@ -1107,30 +1272,31 @@ public:
        ambiguity when using str[0].
      */
     wxUniChar operator[](int n) const
-      { return wxStringBase::at(n); }
+      { return at(n); }
     wxUniChar operator[](long n) const
-      { return wxStringBase::at(n); }
+      { return at(n); }
     wxUniChar operator[](size_t n) const
-      { return wxStringBase::at(n); }
+      { return at(n); }
 #ifndef wxSIZE_T_IS_UINT
     wxUniChar operator[](unsigned int n) const
-      { return wxStringBase::at(n); }
+      { return at(n); }
 #endif // size_t != unsigned int
 
     // operator versions of GetWriteableChar()
     wxUniCharRef operator[](int n)
-      { return wxStringBase::at(n); }
+      { return at(n); }
     wxUniCharRef operator[](long n)
-      { return wxStringBase::at(n); }
+      { return at(n); }
     wxUniCharRef operator[](size_t n)
-      { return wxStringBase::at(n); }
+      { return at(n); }
 #ifndef wxSIZE_T_IS_UINT
     wxUniCharRef operator[](unsigned int n)
-      { return wxStringBase::at(n); }
+      { return at(n); }
 #endif // size_t != unsigned int
 
     // explicit conversion to C string (use this with printf()!)
     wxCStrData c_str() const { return wxCStrData(this); }
+    wxCStrData data() const { return c_str(); }
 
     // implicit conversion to C string
     operator wxCStrData() const { return c_str(); }
@@ -1141,7 +1307,7 @@ public:
 
     // explicit conversion to C string in internal representation (char*,
     // wchar_t*, UTF-8-encoded char*, depending on the build):
-    const_pointer wx_str() const { return data(); }
+    const_pointer wx_str() const { return m_impl.c_str(); }
 
     // conversion to/from plain (i.e. 7 bit) ASCII: this is useful for
     // converting numbers or strings which are certain not to contain special
@@ -1203,32 +1369,33 @@ public:
 
   // overloaded assignment
     // from another wxString
-  wxString& operator=(const wxStringBase& stringSrc)
-    { return (wxString&)wxStringBase::operator=(stringSrc); }
-  wxString& operator=(const wxCStrData& cstr);
+  wxString& operator=(const wxStringImpl& stringSrc)
+    { m_impl = stringSrc; return *this; }
+  wxString& operator=(const wxCStrData& cstr)
+    { return *this = cstr.AsString(); }
     // from a character
   wxString& operator=(wxUniChar ch)
-    { return (wxString&)wxStringBase::operator=(ch); }
+    { m_impl = EncodeChar(ch); return *this; }
   wxString& operator=(wxUniCharRef ch)
-    { return (wxString&)wxStringBase::operator=((wxUniChar)ch); }
+    { return operator=((wxUniChar)ch); }
   wxString& operator=(char ch)
-    { return (wxString&)wxStringBase::operator=(wxUniChar(ch)); }
+    { return operator=(wxUniChar(ch)); }
   wxString& operator=(wchar_t ch)
-    { return (wxString&)wxStringBase::operator=(wxUniChar(ch)); }
+    { return operator=(wxUniChar(ch)); }
     // from a C string - STL probably will crash on NULL,
     // so we need to compensate in that case
 #if wxUSE_STL_BASED_WXSTRING
   wxString& operator=(const wxChar *psz)
-    { if(psz) wxStringBase::operator=(psz); else Clear(); return *this; }
+    { if(psz) m_impl = psz; else Clear(); return *this; }
 #else
   wxString& operator=(const wxChar *psz)
-    { return (wxString&)wxStringBase::operator=(psz); }
+    { m_impl = psz; return *this; }
 #endif
 
 #if wxUSE_UNICODE
     // from wxWCharBuffer
-  wxString& operator=(const wxWCharBuffer& psz)
-    { (void) operator=((const wchar_t *)psz); return *this; }
+  wxString& operator=(const wxWCharBuffer& s)
+    { (void) operator=((const wchar_t *)s); return *this; }
     // from C string
   wxString& operator=(const char* psz)
     {  return operator=(wxString(psz)); }
@@ -1254,8 +1421,8 @@ public:
       // string += string
   wxString& operator<<(const wxString& s)
   {
-#if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL
-    wxASSERT_MSG( s.GetStringData()->IsValid(),
+#if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
+    wxASSERT_MSG( s.IsValid(),
                   _T("did you forget to call UngetWriteBuf()?") );
 #endif
 
@@ -1263,10 +1430,12 @@ public:
     return *this;
   }
       // string += C string
-  wxString& operator<<(const wxChar *psz)
+  wxString& operator<<(const char *psz)
     { append(psz); return *this; }
+  wxString& operator<<(const wchar_t *pwz)
+    { append(pwz); return *this; }
   wxString& operator<<(const wxCStrData& psz)
-    { append(psz); return *this; }
+    { append(psz.AsString()); return *this; }
       // string += char
   wxString& operator<<(wxUniChar ch) { append(1, ch); return *this; }
   wxString& operator<<(wxUniCharRef ch) { append(1, ch); return *this; }
@@ -1274,25 +1443,15 @@ public:
   wxString& operator<<(wchar_t ch) { append(1, ch); return *this; }
 
       // string += buffer (i.e. from wxGetString)
-#if wxUSE_UNICODE
   wxString& operator<<(const wxWCharBuffer& s)
     { return operator<<((const wchar_t *)s); }
   wxString& operator+=(const wxWCharBuffer& s)
     { return operator<<((const wchar_t *)s); }
-#else // !wxUSE_UNICODE
+
   wxString& operator<<(const wxCharBuffer& s)
     { return operator<<((const char *)s); }
   wxString& operator+=(const wxCharBuffer& s)
     { return operator<<((const char *)s); }
-#endif // wxUSE_UNICODE/!wxUSE_UNICODE
-
-#if wxUSE_UNICODE
-    // string += C string in Unicode build (with conversion)
-  wxString& operator<<(const char *s)
-    { return operator<<(wxString(s)); }
-  wxString& operator+=(const char *s)
-    { return operator+=(wxString(s)); }
-#endif // wxUSE_UNICODE
 
     // string += C string
   wxString& Append(const wxString& s)
@@ -1306,8 +1465,10 @@ public:
     }
   wxString& Append(const wxCStrData& psz)
     { append(psz); return *this; }
-  wxString& Append(const wxChar* psz)
+  wxString& Append(const char* psz)
     { append(psz); return *this; }
+  wxString& Append(const wchar_t* pwz)
+    { append(pwz); return *this; }
     // append count copies of given character
   wxString& Append(wxUniChar ch, size_t count = 1u)
     { append(count, ch); return *this; }
@@ -1317,8 +1478,10 @@ public:
     { append(count, ch); return *this; }
   wxString& Append(wchar_t ch, size_t count = 1u)
     { append(count, ch); return *this; }
-  wxString& Append(const wxChar* psz, size_t nLen)
+  wxString& Append(const char* psz, size_t nLen)
     { append(psz, nLen); return *this; }
+  wxString& Append(const wchar_t* pwz, size_t nLen)
+    { append(pwz, nLen); return *this; }
 
     // prepend a string, return the string itself
   wxString& Prepend(const wxString& str)
@@ -1334,9 +1497,13 @@ public:
   friend wxString WXDLLIMPEXP_BASE operator+(wxUniChar ch, const wxString& string);
       // string with C string
   friend wxString WXDLLIMPEXP_BASE operator+(const wxString& string,
-                                             const wxChar *psz);
+                                             const char *psz);
+  friend wxString WXDLLIMPEXP_BASE operator+(const wxString& string,
+                                             const wchar_t *pwz);
       // C string with string
-  friend wxString WXDLLIMPEXP_BASE operator+(const wxChar *psz,
+  friend wxString WXDLLIMPEXP_BASE operator+(const char *psz,
+                                             const wxString& string);
+  friend wxString WXDLLIMPEXP_BASE operator+(const wchar_t *pwz,
                                              const wxString& string);
 
   // stream-like functions
@@ -1375,15 +1542,24 @@ public:
 
   // string comparison
     // case-sensitive comparison (returns a value < 0, = 0 or > 0)
-  int Cmp(const wxChar *psz) const;
-  int Cmp(const wxString& s) const;
+  int Cmp(const char *psz) const
+    { return compare(psz); }
+  int Cmp(const wchar_t *pwz) const
+    { return compare(pwz); }
+  int Cmp(const wxString& s) const
+    { return compare(s); }
     // same as Cmp() but not case-sensitive
-  int CmpNoCase(const wxChar *psz) const;
   int CmpNoCase(const wxString& s) const;
+  int CmpNoCase(const char *psz) const
+    { return CmpNoCase(wxString(psz)); }
+  int CmpNoCase(const wchar_t *pwz) const
+    { return CmpNoCase(wxString(pwz)); }
     // test for the string equality, either considering case or not
     // (if compareWithCase then the case matters)
-  bool IsSameAs(const wxChar *psz, bool compareWithCase = true) const
+  bool IsSameAs(const char *psz, bool compareWithCase = true) const
     { return (compareWithCase ? Cmp(psz) : CmpNoCase(psz)) == 0; }
+  bool IsSameAs(const wchar_t *pwz, bool compareWithCase = true) const
+    { return (compareWithCase ? Cmp(pwz) : CmpNoCase(pwz)) == 0; }
     // comparison with a single character: returns true if equal
   bool IsSameAs(wxUniChar c, bool compareWithCase = true) const
     {
@@ -1505,7 +1681,7 @@ public:
     // minimize the string's memory
     // only works if the data of this string is not shared
   bool Shrink();
-#if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING
+#if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
     // These are deprecated, use wxStringBuffer or wxStringBufferLength instead
     //
     // get writable buffer of at least nLen bytes. Unget() *must* be called
@@ -1514,7 +1690,7 @@ public:
     // call this immediately after GetWriteBuf() has been used
   wxDEPRECATED( void UngetWriteBuf() );
   wxDEPRECATED( void UngetWriteBuf(size_t nLen) );
-#endif // WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING
+#endif // WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
 
   // wxWidgets version 1 compatibility functions
 
@@ -1537,7 +1713,7 @@ public:
   inline int CompareTo(const wxChar* psz, caseCompare cmp = exact) const
     { return cmp == exact ? Cmp(psz) : CmpNoCase(psz); }
 
-    // use Len
+    // use length()
   size_t Length() const { return length(); }
     // Count the number of characters
   int Freq(wxUniChar ch) const;
@@ -1559,12 +1735,12 @@ public:
       { return (wxString&)erase( nStart, nLen ); }
 
     // use Find()
-  int First( const wxUniChar ch ) const { return Find(ch); }
+  int First( wxUniChar ch ) const { return Find(ch); }
   int First( char ch ) const { return Find(ch); }
   int First( wchar_t ch ) const { return Find(ch); }
   int First( const wxChar* psz ) const { return Find(psz); }
   int First( const wxString &str ) const { return Find(str); }
-  int Last( const wxUniChar ch ) const { return Find(ch, true); }
+  int Last( wxUniChar ch ) const { return Find(ch, true); }
   bool Contains(const wxString& str) const { return Find(str) != wxNOT_FOUND; }
 
     // use empty()
@@ -1574,164 +1750,531 @@ public:
 
     // take nLen chars starting at nPos
   wxString(const wxString& str, size_t nPos, size_t nLen)
-      : wxStringBase(str, nPos, nLen) { }
+      : m_impl(str.m_impl, nPos, nLen) { }
     // take all characters from pStart to pEnd
   wxString(const void *pStart, const void *pEnd)
-      : wxStringBase((const wxChar*)pStart, (const wxChar*)pEnd) { }
+      : m_impl((const wxChar*)pStart, (const wxChar*)pEnd) { }
   wxString(const_iterator first, const_iterator last)
-      : wxStringBase(first, last) { }
+      : m_impl(first, last) { }
   wxString(iterator first, iterator last)
-      : wxStringBase(first, last) { }
+      : m_impl(first, last) { }
 
   // lib.string.modifiers
     // append elements str[pos], ..., str[pos+n]
   wxString& append(const wxString& str, size_t pos, size_t n)
-    { return (wxString&)wxStringBase::append(str, pos, n); }
+  {
+    size_t from, len;
+    str.PosLenToImpl(pos, n, &from, &len);
+    m_impl.append(str.m_impl, from, len);
+    return *this;
+  }
     // append a string
   wxString& append(const wxString& str)
-    { return (wxString&)wxStringBase::append(str); }
+    { m_impl.append(str.m_impl); return *this; }
   wxString& append(const wxCStrData& str)
-    { return (wxString&)wxStringBase::append(str.AsString()); }
+    { m_impl.append(str.AsString().m_impl); return *this; }
     // append first n (or all if n == npos) characters of sz
-  wxString& append(const wxChar *sz)
-    { return (wxString&)wxStringBase::append(sz); }
-  wxString& append(const wxChar *sz, size_t n)
-    { return (wxString&)wxStringBase::append(sz, n); }
+  wxString& append(const char *sz)
+    { m_impl.append(ImplStr(sz)); return *this; }
+  wxString& append(const wchar_t *sz)
+    { m_impl.append(ImplStr(sz)); return *this; }
+  wxString& append(const char *sz, size_t n)
+  {
+    SubstrBufFromMB str(ImplStr(sz, n));
+    m_impl.append(str.data, str.len);
+    return *this;
+  }
+  wxString& append(const wchar_t *sz, size_t n)
+  {
+    SubstrBufFromWC str(ImplStr(sz, n));
+    m_impl.append(str.data, str.len);
+    return *this;
+  }
     // append n copies of ch
   wxString& append(size_t n, wxUniChar ch)
-    { return (wxString&)wxStringBase::append(n, ch); }
+  {
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+        m_impl.append(EncodeNChars(n, ch));
+    else
+#endif
+        m_impl.append(n, (wxStringCharType)ch);
+    return *this;
+  }
     // append from first to last
   wxString& append(const_iterator first, const_iterator last)
-    { return (wxString&)wxStringBase::append(first, last); }
+    { m_impl.append(first, last); return *this; }
 
     // same as `this_string = str'
   wxString& assign(const wxString& str)
-    { return (wxString&)wxStringBase::assign(str); }
+    { m_impl = str.m_impl; return *this; }
     // same as ` = str[pos..pos + n]
   wxString& assign(const wxString& str, size_t pos, size_t n)
-    { return (wxString&)wxStringBase::assign(str, pos, n); }
+  {
+    size_t from, len;
+    str.PosLenToImpl(pos, n, &from, &len);
+    m_impl.assign(str.m_impl, from, len);
+    return *this;
+  }
     // same as `= first n (or all if n == npos) characters of sz'
-  wxString& assign(const wxChar *sz)
-    { return (wxString&)wxStringBase::assign(sz); }
-  wxString& assign(const wxChar *sz, size_t n)
-    { return (wxString&)wxStringBase::assign(sz, n); }
+  wxString& assign(const char *sz)
+    { m_impl.assign(ImplStr(sz)); return *this; }
+  wxString& assign(const wchar_t *sz)
+    { m_impl.assign(ImplStr(sz)); return *this; }
+  wxString& assign(const char *sz, size_t n)
+  {
+    SubstrBufFromMB str(ImplStr(sz, n));
+    m_impl.assign(str.data, str.len);
+    return *this;
+  }
+  wxString& assign(const wchar_t *sz, size_t n)
+  {
+    SubstrBufFromWC str(ImplStr(sz, n));
+    m_impl.assign(str.data, str.len);
+    return *this;
+  }
     // same as `= n copies of ch'
   wxString& assign(size_t n, wxUniChar ch)
-    { return (wxString&)wxStringBase::assign(n, ch); }
+  {
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+        m_impl.assign(EncodeNChars(n, ch));
+    else
+#endif
+        m_impl.assign(n, (wxStringCharType)ch);
+    return *this;
+  }
     // assign from first to last
   wxString& assign(const_iterator first, const_iterator last)
-    { return (wxString&)wxStringBase::assign(first, last); }
+    { m_impl.assign(first, last); return *this; }
 
     // string comparison
-#if !defined(HAVE_STD_STRING_COMPARE)
-  int compare(const wxStringBase& str) const;
+  int compare(const wxString& str) const;
     // comparison with a substring
-  int compare(size_t nStart, size_t nLen, const wxStringBase& str) const;
+  int compare(size_t nStart, size_t nLen, const wxString& str) const;
     // comparison of 2 substrings
   int compare(size_t nStart, size_t nLen,
-              const wxStringBase& str, size_t nStart2, size_t nLen2) const;
+              const wxString& str, size_t nStart2, size_t nLen2) const;
     // just like strcmp()
-  int compare(const wxChar* sz) const;
+  int compare(const char* sz) const;
+  int compare(const wchar_t* sz) const;
     // substring comparison with first nCount characters of sz
   int compare(size_t nStart, size_t nLen,
-              const wxChar* sz, size_t nCount = npos) const;
-#endif // !defined HAVE_STD_STRING_COMPARE
+              const char* sz, size_t nCount = npos) const;
+  int compare(size_t nStart, size_t nLen,
+              const wchar_t* sz, size_t nCount = npos) const;
 
     // insert another string
   wxString& insert(size_t nPos, const wxString& str)
-    { return (wxString&)wxStringBase::insert(nPos, str); }
+    { insert(begin() + nPos, str.begin(), str.end()); return *this; }
     // insert n chars of str starting at nStart (in str)
   wxString& insert(size_t nPos, const wxString& str, size_t nStart, size_t n)
-    { return (wxString&)wxStringBase::insert(nPos, str, nStart, n); }
+  {
+    size_t from, len;
+    str.PosLenToImpl(nStart, n, &from, &len);
+    m_impl.insert(PosToImpl(nPos), str.m_impl, from, len);
+    return *this;
+  }
     // insert first n (or all if n == npos) characters of sz
-  wxString& insert(size_t nPos, const wxChar *sz)
-    { return (wxString&)wxStringBase::insert(nPos, sz); }
-  wxString& insert(size_t nPos, const wxChar *sz, size_t n)
-    { return (wxString&)wxStringBase::insert(nPos, sz, n); }
+  wxString& insert(size_t nPos, const char *sz)
+    { m_impl.insert(PosToImpl(nPos), ImplStr(sz)); return *this; }
+  wxString& insert(size_t nPos, const wchar_t *sz)
+    { m_impl.insert(PosToImpl(nPos), ImplStr(sz)); return *this; }
+  wxString& insert(size_t nPos, const char *sz, size_t n)
+  {
+    SubstrBufFromMB str(ImplStr(sz, n));
+    m_impl.insert(PosToImpl(nPos), str.data, str.len);
+    return *this;
+  }
+  wxString& insert(size_t nPos, const wchar_t *sz, size_t n)
+  {
+    SubstrBufFromWC str(ImplStr(sz, n));
+    m_impl.insert(PosToImpl(nPos), str.data, str.len);
+    return *this;
+  }
     // insert n copies of ch
   wxString& insert(size_t nPos, size_t n, wxUniChar ch)
-    { return (wxString&)wxStringBase::insert(nPos, n, ch); }
+  { // nPos goes through PosToImpl(), like the other index-based insert()s
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+        m_impl.insert(PosToImpl(nPos), EncodeNChars(n, ch));
+    else
+#endif
+        m_impl.insert(PosToImpl(nPos), n, (wxStringCharType)ch);
+    return *this;
+  }
   iterator insert(iterator it, wxUniChar ch)
-    { return wxStringBase::insert(it, ch); }
+    { return iterator(m_impl.insert(it, EncodeChar(ch))); }
   void insert(iterator it, const_iterator first, const_iterator last)
-    { wxStringBase::insert(it, first, last); }
+    { m_impl.insert(it, first, last); }
   void insert(iterator it, size_type n, wxUniChar ch)
-    { wxStringBase::insert(it, n, ch); }
+  {
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+        m_impl.insert(it, EncodeNChars(n, ch));
+    else
+#endif
+        m_impl.insert(it, n, (wxStringCharType)ch);
+  }
 
     // delete characters from nStart to nStart + nLen
   wxString& erase(size_type pos = 0, size_type n = npos)
-    { return (wxString&)wxStringBase::erase(pos, n); }
+  {
+    size_t from, len;
+    PosLenToImpl(pos, n, &from, &len);
+    m_impl.erase(from, len);
+    return *this;
+  }
   iterator erase(iterator first, iterator last)
-    { return wxStringBase::erase(first, last); }
+    { return iterator(m_impl.erase(first, last)); }
   iterator erase(iterator first)
-    { return wxStringBase::erase(first); }
+    { return iterator(m_impl.erase(first)); }
 
 #ifdef wxSTRING_BASE_HASNT_CLEAR
   void clear() { erase(); }
+#else
+  void clear() { m_impl.clear(); }
 #endif
 
     // replaces the substring of length nLen starting at nStart
-  wxString& replace(size_t nStart, size_t nLen, const wxChar* sz)
-    { return (wxString&)wxStringBase::replace(nStart, nLen, sz); }
+  wxString& replace(size_t nStart, size_t nLen, const char* sz)
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+    m_impl.replace(from, len, ImplStr(sz));
+    return *this;
+  }
+  wxString& replace(size_t nStart, size_t nLen, const wchar_t* sz)
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+    m_impl.replace(from, len, ImplStr(sz));
+    return *this;
+  }
     // replaces the substring of length nLen starting at nStart
   wxString& replace(size_t nStart, size_t nLen, const wxString& str)
-    { return (wxString&)wxStringBase::replace(nStart, nLen, str); }
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+    m_impl.replace(from, len, str.m_impl);
+    return *this;
+  }
     // replaces the substring with nCount copies of ch
   wxString& replace(size_t nStart, size_t nLen, size_t nCount, wxUniChar ch)
-    { return (wxString&)wxStringBase::replace(nStart, nLen, nCount, ch); }
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+        m_impl.replace(from, len, EncodeNChars(nCount, ch));
+    else
+#endif
+        m_impl.replace(from, len, nCount, (wxStringCharType)ch);
+    return *this;
+  }
     // replaces a substring with another substring
   wxString& replace(size_t nStart, size_t nLen,
                     const wxString& str, size_t nStart2, size_t nLen2)
-    { return (wxString&)wxStringBase::replace(nStart, nLen, str,
-                                              nStart2, nLen2); }
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+
+    size_t from2, len2;
+    str.PosLenToImpl(nStart2, nLen2, &from2, &len2);
+
+    m_impl.replace(from, len, str.m_impl, from2, len2);
+    return *this;
+  }
      // replaces the substring with first nCount chars of sz
   wxString& replace(size_t nStart, size_t nLen,
-                    const wxChar* sz, size_t nCount)
-    { return (wxString&)wxStringBase::replace(nStart, nLen, sz, nCount); }
-  wxString& replace(iterator first, iterator last, const_pointer s)
-    { return (wxString&)wxStringBase::replace(first, last, s); }
-  wxString& replace(iterator first, iterator last, const_pointer s,
-                    size_type n)
-    { return (wxString&)wxStringBase::replace(first, last, s, n); }
+                    const char* sz, size_t nCount)
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+
+    SubstrBufFromMB str(ImplStr(sz, nCount));
+
+    m_impl.replace(from, len, str.data, str.len);
+    return *this;
+  }
+  wxString& replace(size_t nStart, size_t nLen,
+                    const wchar_t* sz, size_t nCount)
+  {
+    size_t from, len;
+    PosLenToImpl(nStart, nLen, &from, &len);
+
+    SubstrBufFromWC str(ImplStr(sz, nCount));
+
+    m_impl.replace(from, len, str.data, str.len);
+    return *this;
+  }
+  wxString& replace(iterator first, iterator last, const char* s)
+    { m_impl.replace(first, last, ImplStr(s)); return *this; }
+  wxString& replace(iterator first, iterator last, const wchar_t* s)
+    { m_impl.replace(first, last, ImplStr(s)); return *this; }
+  wxString& replace(iterator first, iterator last, const char* s, size_type n)
+  {
+    SubstrBufFromMB str(ImplStr(s, n));
+    m_impl.replace(first, last, str.data, str.len);
+    return *this;
+  }
+  wxString& replace(iterator first, iterator last, const wchar_t* s, size_type n)
+  {
+    SubstrBufFromWC str(ImplStr(s, n));
+    m_impl.replace(first, last, str.data, str.len);
+    return *this;
+  }
   wxString& replace(iterator first, iterator last, const wxString& s)
-    { return (wxString&)wxStringBase::replace(first, last, s); }
-  wxString& replace(iterator first, iterator last, size_type n, wxUniChar c)
-    { return (wxString&)wxStringBase::replace(first, last, n, c); }
+    { m_impl.replace(first, last, s.m_impl); return *this; }
+  wxString& replace(iterator first, iterator last, size_type n, wxUniChar ch)
+  {
+#if wxUSE_UNICODE_UTF8
+    if ( !ch.IsAscii() )
+        m_impl.replace(first, last, EncodeNChars(n, ch));
+    else
+#endif
+        m_impl.replace(first, last, n, (wxStringCharType)ch);
+    return *this;
+  }
   wxString& replace(iterator first, iterator last,
                     const_iterator first1, const_iterator last1)
-    { return (wxString&)wxStringBase::replace(first, last, first1, last1); }
+    { m_impl.replace(first, last, first1, last1); return *this; }
+
+  // swap two strings
+  void swap(wxString& str)
+    { m_impl.swap(str.m_impl); }
+
+    // find a substring
+  size_t find(const wxString& str, size_t nStart = 0) const
+    { return PosFromImpl(m_impl.find(str.m_impl, PosToImpl(nStart))); }
+
+    // find first n characters of sz
+  size_t find(const char* sz, size_t nStart = 0, size_t n = npos) const
+  {
+      SubstrBufFromMB str(ImplStr(sz, n));
+      return PosFromImpl(m_impl.find(str.data, PosToImpl(nStart), str.len));
+  }
+  size_t find(const wchar_t* sz, size_t nStart = 0, size_t n = npos) const
+  {
+      SubstrBufFromWC str(ImplStr(sz, n));
+      return PosFromImpl(m_impl.find(str.data, PosToImpl(nStart), str.len));
+  }
+
+    // find the first occurrence of character ch after nStart
+  size_t find(wxUniChar ch, size_t nStart = 0) const
+    { return PosFromImpl(m_impl.find(EncodeChar(ch), PosToImpl(nStart))); }
+  size_t find(wxUniCharRef ch, size_t nStart = 0) const
+    {  return find(wxUniChar(ch), nStart); }
+  size_t find(char ch, size_t nStart = 0) const
+    {  return find(wxUniChar(ch), nStart); }
+  size_t find(wchar_t ch, size_t nStart = 0) const
+    {  return find(wxUniChar(ch), nStart); }
+
+    // rfind() family is exactly like find() but works right to left
+
+    // as find, but from the end
+  size_t rfind(const wxString& str, size_t nStart = npos) const
+    { return PosFromImpl(m_impl.rfind(str.m_impl, PosToImpl(nStart))); }
+
+    // as find, but from the end
+  size_t rfind(const char* sz, size_t nStart = npos, size_t n = npos) const
+  {
+      SubstrBufFromMB str(ImplStr(sz, n));
+      return PosFromImpl(m_impl.rfind(str.data, PosToImpl(nStart), str.len));
+  }
+  size_t rfind(const wchar_t* sz, size_t nStart = npos, size_t n = npos) const
+  {
+      SubstrBufFromWC str(ImplStr(sz, n));
+      return PosFromImpl(m_impl.rfind(str.data, PosToImpl(nStart), str.len));
+  }
+    // as find, but from the end
+  size_t rfind(wxUniChar ch, size_t nStart = npos) const
+    { return PosFromImpl(m_impl.rfind(EncodeChar(ch), PosToImpl(nStart))); }
+  size_t rfind(wxUniCharRef ch, size_t nStart = npos) const
+    {  return rfind(wxUniChar(ch), nStart); }
+  size_t rfind(char ch, size_t nStart = npos) const
+    {  return rfind(wxUniChar(ch), nStart); }
+  size_t rfind(wchar_t ch, size_t nStart = npos) const
+    {  return rfind(wxUniChar(ch), nStart); }
+
+  // find first/last occurrence of any character (not) in the set:
+#if wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
+  // FIXME-UTF8: this is not entirely correct, because it doesn't work if
+  //             sizeof(wchar_t)==2 and surrogates are present in the string;
+  //             should we care? Probably not.
+  size_t find_first_of(const wxString& str, size_t nStart = 0) const
+    { return m_impl.find_first_of(str.m_impl, nStart); } // set given as wxString
+  size_t find_first_of(const char* sz, size_t nStart = 0) const
+    { return m_impl.find_first_of(ImplStr(sz), nStart); }
+  size_t find_first_of(const wchar_t* sz, size_t nStart = 0) const
+    { return m_impl.find_first_of(ImplStr(sz), nStart); }
+  size_t find_first_of(const char* sz, size_t nStart, size_t n) const
+    { return m_impl.find_first_of(ImplStr(sz), nStart, n); }
+  size_t find_first_of(const wchar_t* sz, size_t nStart, size_t n) const
+    { return m_impl.find_first_of(ImplStr(sz), nStart, n); }
+  size_t find_first_of(wxUniChar c, size_t nStart = 0) const
+    { return m_impl.find_first_of((wxChar)c, nStart); }
+
+  size_t find_last_of(const wxString& str, size_t nStart = npos) const
+    { return m_impl.find_last_of(str.m_impl, nStart); } // set given as wxString
+  size_t find_last_of(const char* sz, size_t nStart = npos) const
+    { return m_impl.find_last_of(ImplStr(sz), nStart); }
+  size_t find_last_of(const wchar_t* sz, size_t nStart = npos) const
+    { return m_impl.find_last_of(ImplStr(sz), nStart); }
+  size_t find_last_of(const char* sz, size_t nStart, size_t n) const
+    { return m_impl.find_last_of(ImplStr(sz), nStart, n); }
+  size_t find_last_of(const wchar_t* sz, size_t nStart, size_t n) const
+    { return m_impl.find_last_of(ImplStr(sz), nStart, n); }
+  size_t find_last_of(wxUniChar c, size_t nStart = npos) const
+    { return m_impl.find_last_of((wxChar)c, nStart); }
+
+  size_t find_first_not_of(const wxString& str, size_t nStart = 0) const
+    { return m_impl.find_first_not_of(str.m_impl, nStart); } // set given as wxString
+  size_t find_first_not_of(const char* sz, size_t nStart = 0) const
+    { return m_impl.find_first_not_of(ImplStr(sz), nStart); }
+  size_t find_first_not_of(const wchar_t* sz, size_t nStart = 0) const
+    { return m_impl.find_first_not_of(ImplStr(sz), nStart); }
+  size_t find_first_not_of(const char* sz, size_t nStart, size_t n) const
+    { return m_impl.find_first_not_of(ImplStr(sz), nStart, n); }
+  size_t find_first_not_of(const wchar_t* sz, size_t nStart, size_t n) const
+    { return m_impl.find_first_not_of(ImplStr(sz), nStart, n); }
+  size_t find_first_not_of(wxUniChar c, size_t nStart = 0) const
+    { return m_impl.find_first_not_of((wxChar)c, nStart); }
+
+  size_t find_last_not_of(const wxString& str, size_t nStart = npos) const
+    { return m_impl.find_last_not_of(str.m_impl, nStart); } // set given as wxString
+  size_t find_last_not_of(const char* sz, size_t nStart = npos) const
+    { return m_impl.find_last_not_of(ImplStr(sz), nStart); }
+  size_t find_last_not_of(const wchar_t* sz, size_t nStart = npos) const
+    { return m_impl.find_last_not_of(ImplStr(sz), nStart); }
+  size_t find_last_not_of(const char* sz, size_t nStart, size_t n) const
+    { return m_impl.find_last_not_of(ImplStr(sz), nStart, n); }
+  size_t find_last_not_of(const wchar_t* sz, size_t nStart, size_t n) const
+    { return m_impl.find_last_not_of(ImplStr(sz), nStart, n); }
+  size_t find_last_not_of(wxUniChar c, size_t nStart = npos) const
+    { return m_impl.find_last_not_of((wxChar)c, nStart); }
+#else
+  // we can't use std::string implementation in UTF-8 build, because the
+  // character sets would be interpreted wrongly:
+
+    // as strpbrk() but starts at nStart, returns npos if not found
+  size_t find_first_of(const wxString& str, size_t nStart = 0) const
+    { return find_first_of((const wxChar*)str.c_str(), nStart); }
+    // same as above
+  size_t find_first_of(const char* sz, size_t nStart = 0) const;
+  size_t find_first_of(const wchar_t* sz, size_t nStart = 0) const;
+  size_t find_first_of(const char* sz, size_t nStart, size_t n) const;
+  size_t find_first_of(const wchar_t* sz, size_t nStart, size_t n) const;
+    // same as find(char, size_t)
+  size_t find_first_of(wxUniChar c, size_t nStart = 0) const
+    { return find(c, nStart); }
+    // find the last (starting from nStart) char from str in this string
+  size_t find_last_of (const wxString& str, size_t nStart = npos) const
+    { return find_last_of((const wxChar*)str.c_str(), nStart); }
+    // same as above
+  size_t find_last_of (const char* sz, size_t nStart = npos) const;
+  size_t find_last_of (const wchar_t* sz, size_t nStart = npos) const;
+  size_t find_last_of(const char* sz, size_t nStart, size_t n) const;
+  size_t find_last_of(const wchar_t* sz, size_t nStart, size_t n) const;
+    // same as above
+  size_t find_last_of(wxUniChar c, size_t nStart = npos) const
+    { return rfind(c, nStart); }
+
+    // find first/last occurrence of any character not in the set
+
+    // as strspn() (starting from nStart), returns npos on failure
+  size_t find_first_not_of(const wxString& str, size_t nStart = 0) const
+    { return find_first_not_of((const wxChar*)str.c_str(), nStart); }
+    // same as above
+  size_t find_first_not_of(const char* sz, size_t nStart = 0) const;
+  size_t find_first_not_of(const wchar_t* sz, size_t nStart = 0) const;
+  size_t find_first_not_of(const char* sz, size_t nStart, size_t n) const;
+  size_t find_first_not_of(const wchar_t* sz, size_t nStart, size_t n) const;
+    // same as above
+  size_t find_first_not_of(wxUniChar ch, size_t nStart = 0) const;
+    //  as strcspn()
+  size_t find_last_not_of(const wxString& str, size_t nStart = npos) const
+    { return find_last_not_of((const wxChar*)str.c_str(), nStart); }
+    // same as above
+  size_t find_last_not_of(const char* sz, size_t nStart = npos) const;
+  size_t find_last_not_of(const wchar_t* sz, size_t nStart = npos) const;
+  size_t find_last_not_of(const char* sz, size_t nStart, size_t n) const;
+  size_t find_last_not_of(const wchar_t* sz, size_t nStart, size_t n) const;
+    // same as above
+  size_t find_last_not_of(wxUniChar ch, size_t nStart = npos) const;
+#endif // wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8 or not
+
+  // provide char/wchar_t/wxUniCharRef overloads for char-finding functions
+  // above to resolve ambiguities:
+  size_t find_first_of(wxUniCharRef ch, size_t nStart = 0) const
+    {  return find_first_of(wxUniChar(ch), nStart); }
+  size_t find_first_of(char ch, size_t nStart = 0) const
+    {  return find_first_of(wxUniChar(ch), nStart); }
+  size_t find_first_of(wchar_t ch, size_t nStart = 0) const
+    {  return find_first_of(wxUniChar(ch), nStart); }
+  size_t find_last_of(wxUniCharRef ch, size_t nStart = npos) const
+    {  return find_last_of(wxUniChar(ch), nStart); }
+  size_t find_last_of(char ch, size_t nStart = npos) const
+    {  return find_last_of(wxUniChar(ch), nStart); }
+  size_t find_last_of(wchar_t ch, size_t nStart = npos) const
+    {  return find_last_of(wxUniChar(ch), nStart); }
+  size_t find_first_not_of(wxUniCharRef ch, size_t nStart = 0) const
+    {  return find_first_not_of(wxUniChar(ch), nStart); }
+  size_t find_first_not_of(char ch, size_t nStart = 0) const
+    {  return find_first_not_of(wxUniChar(ch), nStart); }
+  size_t find_first_not_of(wchar_t ch, size_t nStart = 0) const
+    {  return find_first_not_of(wxUniChar(ch), nStart); }
+  size_t find_last_not_of(wxUniCharRef ch, size_t nStart = npos) const
+    {  return find_last_not_of(wxUniChar(ch), nStart); }
+  size_t find_last_not_of(char ch, size_t nStart = npos) const
+    {  return find_last_not_of(wxUniChar(ch), nStart); }
+  size_t find_last_not_of(wchar_t ch, size_t nStart = npos) const
+    {  return find_last_not_of(wxUniChar(ch), nStart); }
 
       // string += string
   wxString& operator+=(const wxString& s)
-    { return (wxString&)wxStringBase::operator+=(s); }
+    { m_impl += s.m_impl; return *this; }
       // string += C string
-  wxString& operator+=(const wxChar *psz)
-    { return (wxString&)wxStringBase::operator+=(psz); }
+  wxString& operator+=(const char *psz)
+    { m_impl += ImplStr(psz); return *this; }
+  wxString& operator+=(const wchar_t *pwz)
+    { m_impl += ImplStr(pwz); return *this; }
   wxString& operator+=(const wxCStrData& s)
-    { return (wxString&)wxStringBase::operator+=(s.AsString()); }
+    { m_impl += s.AsString().m_impl; return *this; }
       // string += char
   wxString& operator+=(wxUniChar ch)
-    { return (wxString&)wxStringBase::operator+=(ch); }
+    { m_impl += EncodeChar(ch); return *this; }
   wxString& operator+=(wxUniCharRef ch) { return *this += wxUniChar(ch); }
   wxString& operator+=(char ch) { return *this += wxUniChar(ch); }
   wxString& operator+=(unsigned char ch) { return *this += wxUniChar(ch); }
   wxString& operator+=(wchar_t ch) { return *this += wxUniChar(ch); }
 
 private:
-#if !wxUSE_STL_BASED_WXSTRING
+#if !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
   // helpers for wxStringBuffer and wxStringBufferLength
-  wxChar *DoGetWriteBuf(size_t nLen);
-  void DoUngetWriteBuf();
-  void DoUngetWriteBuf(size_t nLen);
+  wxStringCharType *DoGetWriteBuf(size_t nLen)
+    { return m_impl.DoGetWriteBuf(nLen); }
+  void DoUngetWriteBuf()
+    { m_impl.DoUngetWriteBuf(); }
+  void DoUngetWriteBuf(size_t nLen)
+    { m_impl.DoUngetWriteBuf(nLen); }
 
   friend class WXDLLIMPEXP_BASE wxStringBuffer;
   friend class WXDLLIMPEXP_BASE wxStringBufferLength;
-#endif
+#endif // !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
 
 #ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
   int DoPrintf(const wxChar *format, ...) ATTRIBUTE_PRINTF_2;
   static wxString DoFormat(const wxChar *format, ...) ATTRIBUTE_PRINTF_1;
 #endif
+
+#if !wxUSE_STL_BASED_WXSTRING
+  // check string's data validity
+  bool IsValid() const { return m_impl.GetStringData()->IsValid(); }
+#endif
+
+private:
+  wxStringImpl m_impl;
 };
 
 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
@@ -1743,8 +2286,10 @@ private:
 // here as friend ones are not injected in the enclosing namespace and without
 // them the code fails to compile with conforming compilers such as xlC or g++4
 wxString WXDLLIMPEXP_BASE operator+(const wxString& string1, const wxString& string2);
-wxString WXDLLIMPEXP_BASE operator+(const wxString& string, const wxChar *psz);
-wxString WXDLLIMPEXP_BASE operator+(const wxChar *psz, const wxString& string);
+wxString WXDLLIMPEXP_BASE operator+(const wxString& string, const char *psz);
+wxString WXDLLIMPEXP_BASE operator+(const wxString& string, const wchar_t *pwz);
+wxString WXDLLIMPEXP_BASE operator+(const char *psz, const wxString& string);
+wxString WXDLLIMPEXP_BASE operator+(const wchar_t *pwz, const wxString& string);
 
 wxString WXDLLIMPEXP_BASE operator+(const wxString& string, wxUniChar ch);
 wxString WXDLLIMPEXP_BASE operator+(wxUniChar ch, const wxString& string);
@@ -1778,7 +2323,7 @@ inline wxString operator+(wchar_t ch, const wxString& string)
 // wxStringBuffer: a tiny class allowing to get a writable pointer into string
 // ----------------------------------------------------------------------------
 
-#if wxUSE_STL_BASED_WXSTRING
+#if wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8
 
 class WXDLLIMPEXP_BASE wxStringBuffer
 {
@@ -1831,7 +2376,7 @@ private:
     DECLARE_NO_COPY_CLASS(wxStringBufferLength)
 };
 
-#else // if !wxUSE_STL_BASED_WXSTRING
+#else // if !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
 
 class WXDLLIMPEXP_BASE wxStringBuffer
 {
@@ -1879,7 +2424,7 @@ private:
     DECLARE_NO_COPY_CLASS(wxStringBufferLength)
 };
 
-#endif // !wxUSE_STL_BASED_WXSTRING
+#endif // !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
 
 // ---------------------------------------------------------------------------
 // wxString comparison functions: operator versions are always case sensitive
@@ -2030,7 +2575,7 @@ inline const char* wxCStrData::AsChar() const
 #endif
 {
     if ( m_offset == 0 )
-        return m_str->wx_str(); // FIXME
+        return m_str->wx_str(); // FIXME-UTF8
     else
         return (const wxChar*)(m_str->begin() + m_offset);
 }
@@ -2058,15 +2603,6 @@ inline wxUniChar wxCStrData::operator[](size_t n) const
     return m_str->at(m_offset + n);
 }
 
-// ----------------------------------------------------------------------------
-// implementation of wxString inline methods using wxCStrData
-// ----------------------------------------------------------------------------
-
-inline wxString& wxString::operator=(const wxCStrData& cstr)
-{
-    return *this = cstr.AsString();
-}
-
 // ----------------------------------------------------------------------------
 // implementation of wx[W]CharBuffer inline methods using wxCStrData
 // ----------------------------------------------------------------------------
diff --git a/include/wx/strvararg.h b/include/wx/strvararg.h
index 290614c863..2aab05e478 100644
--- a/include/wx/strvararg.h
+++ b/include/wx/strvararg.h
@@ -89,27 +89,11 @@ struct wxArgNormalizer
 
 // special cases for converting strings:
 
-// FIXME-UTF8: move this to chartype.h!
-#if wxUSE_UNICODE
-    /* for now, all Unicode builds are wchar_t* based: */
-    #define wxUSE_UNICODE_WCHAR 1
-#else
-    #define wxUSE_UNICODE_WCHAR 0
-#endif
-
-// FIXME-UTF8: include wx/chartype.h and use wxChar after headers split
-// FIXME-UTF8: this will be char* in UTF-8 build and wchar_t* on Windows
-#if wxUSE_UNICODE_WCHAR
-    typedef wchar_t wxArgNativeCharType;
-#else
-    typedef char wxArgNativeCharType;
-#endif
-
 template<>
 struct WXDLLIMPEXP_BASE wxArgNormalizer<const wxCStrData&>
 {
     wxArgNormalizer(const wxCStrData& value) : m_value(value) {}
-    const wxArgNativeCharType *get() const;
+    const wxStringCharType *get() const;
 
     const wxCStrData& m_value;
 };
@@ -125,7 +109,7 @@ template<>
 struct WXDLLIMPEXP_BASE wxArgNormalizer<const wxString&>
 {
     wxArgNormalizer(const wxString& value) : m_value(value) {}
-    const wxArgNativeCharType *get() const;
+    const wxStringCharType *get() const;
 
     const wxString& m_value;
 };
diff --git a/src/common/string.cpp b/src/common/string.cpp
index 8d39d9ceea..db4b5fe618 100644
--- a/src/common/string.cpp
+++ b/src/common/string.cpp
@@ -52,14 +52,30 @@
 // NB: EXTRA_ALLOC must be >= 0!
 #define EXTRA_ALLOC       (19 - nLen % 16)
 
+
+// string handling functions used by wxString, chosen per build type:
+#if wxUSE_UNICODE_UTF8 // UTF-8 build: map straight to the C library routines
+    #define wxStringMemcpy   memcpy
+    #define wxStringMemcmp   memcmp
+    #define wxStringMemchr   memchr
+    #define wxStringStrlen   strlen
+#else // !wxUSE_UNICODE_UTF8: map to the wxTmem*/wxStrlen helpers instead
+    #define wxStringMemcpy   wxTmemcpy
+    #define wxStringMemcmp   wxTmemcmp
+    #define wxStringMemchr   wxTmemchr
+    #define wxStringStrlen   wxStrlen
+#endif // wxUSE_UNICODE_UTF8/!wxUSE_UNICODE_UTF8
+
+
 // ---------------------------------------------------------------------------
 // static class variables definition
 // ---------------------------------------------------------------------------
 
 #if !wxUSE_STL_BASED_WXSTRING
   //According to STL _must_ be a -1 size_t
-  const size_t wxStringBase::npos = (size_t) -1;
+  const size_t wxStringImpl::npos = (size_t) -1;
 #endif
+const size_t wxString::npos = (size_t) -1;
 
 // ----------------------------------------------------------------------------
 // static data
@@ -153,11 +169,11 @@ void wxStringData::Free()
 #endif
 
 // ===========================================================================
-// wxStringBase
+// wxStringImpl
 // ===========================================================================
 
 // takes nLength elements of psz starting at nPos
-void wxStringBase::InitWith(const wxChar *psz, size_t nPos, size_t nLength)
+void wxStringImpl::InitWith(const wxChar *psz, size_t nPos, size_t nLength)
 {
   Init();
 
@@ -173,15 +189,15 @@ void wxStringBase::InitWith(const wxChar *psz, size_t nPos, size_t nLength)
   if ( nLength > 0 ) {
     // trailing '\0' is written in AllocBuffer()
     if ( !AllocBuffer(nLength) ) {
-      wxFAIL_MSG( _T("out of memory in wxStringBase::InitWith") );
+      wxFAIL_MSG( _T("out of memory in wxStringImpl::InitWith") );
       return;
     }
-    wxTmemcpy(m_pchData, psz + nPos, nLength);
+    wxStringMemcpy(m_pchData, psz + nPos, nLength);
   }
 }
 
 // poor man's iterators are "void *" pointers
-wxStringBase::wxStringBase(const void *pStart, const void *pEnd)
+wxStringImpl::wxStringImpl(const void *pStart, const void *pEnd)
 {
   if ( pEnd >= pStart )
   {
@@ -195,7 +211,7 @@ wxStringBase::wxStringBase(const void *pStart, const void *pEnd)
   }
 }
 
-wxStringBase::wxStringBase(size_type n, wxUniChar ch)
+wxStringImpl::wxStringImpl(size_type n, wxStringCharType ch)
 {
   Init();
   append(n, ch);
@@ -206,7 +222,7 @@ wxStringBase::wxStringBase(size_type n, wxUniChar ch)
 // ---------------------------------------------------------------------------
 
 // allocates memory needed to store a C string of length nLen
-bool wxStringBase::AllocBuffer(size_t nLen)
+bool wxStringImpl::AllocBuffer(size_t nLen)
 {
   // allocating 0 sized buffer doesn't make sense, all empty strings should
   // reuse g_strEmpty
@@ -238,7 +254,7 @@ bool wxStringBase::AllocBuffer(size_t nLen)
 }
 
 // must be called before changing this string
-bool wxStringBase::CopyBeforeWrite()
+bool wxStringImpl::CopyBeforeWrite()
 {
   wxStringData* pData = GetStringData();
 
@@ -249,7 +265,7 @@ bool wxStringBase::CopyBeforeWrite()
       // allocation failures are handled by the caller
       return false;
     }
-    wxTmemcpy(m_pchData, pData->data(), nLen);
+    wxStringMemcpy(m_pchData, pData->data(), nLen);
   }
 
   wxASSERT( !GetStringData()->IsShared() );  // we must be the only owner
@@ -258,7 +274,7 @@ bool wxStringBase::CopyBeforeWrite()
 }
 
 // must be called before replacing contents of this string
-bool wxStringBase::AllocBeforeWrite(size_t nLen)
+bool wxStringImpl::AllocBeforeWrite(size_t nLen)
 {
   wxASSERT( nLen != 0 );  // doesn't make any sense
 
@@ -304,12 +320,12 @@ bool wxStringBase::AllocBeforeWrite(size_t nLen)
   return true;
 }
 
-wxStringBase& wxStringBase::append(size_t n, wxUniChar ch)
+wxStringImpl& wxStringImpl::append(size_t n, wxStringCharType ch)
 {
     size_type len = length();
 
     if ( !Alloc(len + n) || !CopyBeforeWrite() ) {
-      wxFAIL_MSG( _T("out of memory in wxStringBase::append") );
+      wxFAIL_MSG( _T("out of memory in wxStringImpl::append") );
     }
     GetStringData()->nDataLength = len + n;
     m_pchData[len + n] = '\0';
@@ -318,7 +334,7 @@ wxStringBase& wxStringBase::append(size_t n, wxUniChar ch)
     return *this;
 }
 
-void wxStringBase::resize(size_t nSize, wxUniChar ch)
+void wxStringImpl::resize(size_t nSize, wxStringCharType ch)
 {
     size_t len = length();
 
@@ -334,7 +350,7 @@ void wxStringBase::resize(size_t nSize, wxUniChar ch)
 }
 
 // allocate enough memory for nLen characters
-bool wxStringBase::Alloc(size_t nLen)
+bool wxStringImpl::Alloc(size_t nLen)
 {
   wxStringData *pData = GetStringData();
   if ( pData->nAllocLength <= nLen ) {
@@ -388,41 +404,41 @@ bool wxStringBase::Alloc(size_t nLen)
   return true;
 }
 
-wxStringBase::iterator wxStringBase::begin()
+wxStringImpl::iterator wxStringImpl::begin()
 {
     if (length() > 0)
         CopyBeforeWrite();
     return m_pchData;
 }
 
-wxStringBase::iterator wxStringBase::end()
+wxStringImpl::iterator wxStringImpl::end()
 {
     if (length() > 0)
         CopyBeforeWrite();
     return m_pchData + length();
 }
 
-wxStringBase::iterator wxStringBase::erase(iterator it)
+wxStringImpl::iterator wxStringImpl::erase(iterator it)
 {
     size_type idx = it - begin();
     erase(idx, 1);
     return begin() + idx;
 }
 
-wxStringBase& wxStringBase::erase(size_t nStart, size_t nLen)
+wxStringImpl& wxStringImpl::erase(size_t nStart, size_t nLen)
 {
     wxASSERT(nStart <= length());
     size_t strLen = length() - nStart;
     // delete nLen or up to the end of the string characters
     nLen = strLen < nLen ? strLen : nLen;
-    wxString strTmp(c_str(), nStart);
+    wxStringImpl strTmp(c_str(), nStart);
     strTmp.append(c_str() + nStart + nLen, length() - nStart - nLen);
 
     swap(strTmp);
     return *this;
 }
 
-wxStringBase& wxStringBase::insert(size_t nPos, const wxChar *sz, size_t n)
+wxStringImpl& wxStringImpl::insert(size_t nPos, const wxChar *sz, size_t n)
 {
     wxASSERT( nPos <= length() );
 
@@ -430,7 +446,7 @@ wxStringBase& wxStringBase::insert(size_t nPos, const wxChar *sz, size_t n)
     if ( n == 0 ) return *this;
 
     if ( !Alloc(length() + n) || !CopyBeforeWrite() ) {
-        wxFAIL_MSG( _T("out of memory in wxStringBase::insert") );
+        wxFAIL_MSG( _T("out of memory in wxStringImpl::insert") );
     }
 
     memmove(m_pchData + nPos + n, m_pchData + nPos,
@@ -442,14 +458,14 @@ wxStringBase& wxStringBase::insert(size_t nPos, const wxChar *sz, size_t n)
     return *this;
 }
 
-void wxStringBase::swap(wxStringBase& str)
+void wxStringImpl::swap(wxStringImpl& str)
 {
-    wxChar* tmp = str.m_pchData;
+    wxStringCharType* tmp = str.m_pchData;
     str.m_pchData = m_pchData;
     m_pchData = tmp;
 }
 
-size_t wxStringBase::find(const wxStringBase& str, size_t nStart) const
+size_t wxStringImpl::find(const wxStringImpl& str, size_t nStart) const
 {
     // deal with the special case of empty string first
     const size_t nLen = length();
@@ -470,22 +486,25 @@ size_t wxStringBase::find(const wxStringBase& str, size_t nStart) const
     wxASSERT( str.GetStringData()->IsValid() );
     wxASSERT( nStart <= nLen );
 
-    const wxChar * const other = str.c_str();
+    const wxStringCharType * const other = str.c_str();
 
     // anchor
-    const wxChar* p = (const wxChar*)wxTmemchr(c_str() + nStart,
-                                               *other,
-                                               nLen - nStart);
+    const wxStringCharType* p =
+        (const wxStringCharType*)wxStringMemchr(c_str() + nStart,
+                                                *other,
+                                                nLen - nStart);
 
     if ( !p )
         return npos;
 
-    while ( p - c_str() + nLenOther <= nLen && wxTmemcmp(p, other, nLenOther) )
+    while ( p - c_str() + nLenOther <= nLen &&
+            wxStringMemcmp(p, other, nLenOther) )
     {
         p++;
 
         // anchor again
-        p = (const wxChar*)wxTmemchr(p, *other, nLen - (p - c_str()));
+        p = (const wxStringCharType*)
+                wxStringMemchr(p, *other, nLen - (p - c_str()));
 
         if ( !p )
             return npos;
@@ -494,21 +513,22 @@ size_t wxStringBase::find(const wxStringBase& str, size_t nStart) const
     return p - c_str() + nLenOther <= nLen ? p - c_str() : npos;
 }
 
-size_t wxStringBase::find(const wxChar* sz, size_t nStart, size_t n) const
+size_t wxStringImpl::find(const wxChar* sz, size_t nStart, size_t n) const
 {
-    return find(wxStringBase(sz, n), nStart);
+    return find(wxStringImpl(sz, n), nStart);
 }
 
-size_t wxStringBase::find(wxUniChar ch, size_t nStart) const
+size_t wxStringImpl::find(wxStringCharType ch, size_t nStart) const
 {
     wxASSERT( nStart <= length() );
 
-    const wxChar *p = (const wxChar*)wxTmemchr(c_str() + nStart, ch, length() - nStart);
+    const wxStringCharType *p = (const wxStringCharType*)
+        wxStringMemchr(c_str() + nStart, ch, length() - nStart);
 
     return p == NULL ? npos : p - c_str();
 }
 
-size_t wxStringBase::rfind(const wxStringBase& str, size_t nStart) const
+size_t wxStringImpl::rfind(const wxStringImpl& str, size_t nStart) const
 {
     wxASSERT( str.GetStringData()->IsValid() );
     wxASSERT( nStart == npos || nStart <= length() );
@@ -527,11 +547,10 @@ size_t wxStringBase::rfind(const wxStringBase& str, size_t nStart) const
         if ( nStart < top )
             top = nStart;
 
-        const wxChar *cursor = c_str() + top;
+        const wxStringCharType *cursor = c_str() + top;
         do
         {
-            if ( wxTmemcmp(cursor, str.c_str(),
-                        str.length()) == 0 )
+            if ( wxStringMemcmp(cursor, str.c_str(), str.length()) == 0 )
             {
                 return cursor - c_str();
             }
@@ -541,12 +560,12 @@ size_t wxStringBase::rfind(const wxStringBase& str, size_t nStart) const
     return npos;
 }
 
-size_t wxStringBase::rfind(const wxChar* sz, size_t nStart, size_t n) const
+size_t wxStringImpl::rfind(const wxChar* sz, size_t nStart, size_t n) const
 {
-    return rfind(wxStringBase(sz, n), nStart);
+    return rfind(wxStringImpl(sz, n), nStart);
 }
 
-size_t wxStringBase::rfind(wxUniChar ch, size_t nStart) const
+size_t wxStringImpl::rfind(wxStringCharType ch, size_t nStart) const
 {
     if ( nStart == npos )
     {
@@ -557,7 +576,7 @@ size_t wxStringBase::rfind(wxUniChar ch, size_t nStart) const
         wxASSERT( nStart <= length() );
     }
 
-    const wxChar *actual;
+    const wxStringCharType *actual;
     for ( actual = c_str() + ( nStart == npos ? length() : nStart + 1 );
           actual > c_str(); --actual )
     {
@@ -568,162 +587,15 @@ size_t wxStringBase::rfind(wxUniChar ch, size_t nStart) const
     return npos;
 }
 
-size_t wxStringBase::find_first_of(const wxChar* sz, size_t nStart) const
-{
-    wxASSERT(nStart <= length());
-
-    size_t len = wxStrlen(sz);
-
-    size_t i;
-    for(i = nStart; i < this->length(); ++i)
-    {
-        if (wxTmemchr(sz, *(c_str() + i), len))
-            break;
-    }
-
-    if(i == this->length())
-        return npos;
-    else
-        return i;
-}
-
-size_t wxStringBase::find_first_of(const wxChar* sz, size_t nStart,
-                                   size_t n) const
-{
-    return find_first_of(wxStringBase(sz, n), nStart);
-}
-
-size_t wxStringBase::find_last_of(const wxChar* sz, size_t nStart) const
-{
-    if ( nStart == npos )
-    {
-        nStart = length() - 1;
-    }
-    else
-    {
-        wxASSERT_MSG( nStart <= length(),
-                        _T("invalid index in find_last_of()") );
-    }
-
-    size_t len = wxStrlen(sz);
-
-    for ( const wxChar *p = c_str() + nStart; p >= c_str(); --p )
-    {
-        if ( wxTmemchr(sz, *p, len) )
-            return p - c_str();
-    }
-
-    return npos;
-}
-
-size_t wxStringBase::find_last_of(const wxChar* sz, size_t nStart,
-                                   size_t n) const
-{
-    return find_last_of(wxStringBase(sz, n), nStart);
-}
-
-size_t wxStringBase::find_first_not_of(const wxChar* sz, size_t nStart) const
-{
-    if ( nStart == npos )
-    {
-        nStart = length();
-    }
-    else
-    {
-        wxASSERT( nStart <= length() );
-    }
-
-    size_t len = wxStrlen(sz);
-
-    size_t i;
-    for(i = nStart; i < this->length(); ++i)
-    {
-        if (!wxTmemchr(sz, *(c_str() + i), len))
-            break;
-    }
-
-    if(i == this->length())
-         return npos;
-     else
-        return i;
-}
-
-size_t wxStringBase::find_first_not_of(const wxChar* sz, size_t nStart,
-                                       size_t n) const
-{
-    return find_first_not_of(wxStringBase(sz, n), nStart);
-}
-
-size_t wxStringBase::find_first_not_of(wxUniChar ch, size_t nStart) const
-{
-    wxASSERT( nStart <= length() );
-
-    for ( const_iterator p = begin() + nStart; (bool)*p; ++p ) // FIXME-DMARS
-    {
-        if ( *p != ch )
-            return p - begin();
-    }
-
-    return npos;
-}
-
-size_t wxStringBase::find_last_not_of(const wxChar* sz, size_t nStart) const
-{
-    if ( nStart == npos )
-    {
-        nStart = length() - 1;
-    }
-    else
-    {
-        wxASSERT( nStart <= length() );
-    }
-
-    size_t len = wxStrlen(sz);
-
-    for ( const wxChar *p = c_str() + nStart; p >= c_str(); --p )
-    {
-        if ( !wxTmemchr(sz, *p,len) )
-             return p - c_str();
-    }
-
-    return npos;
-}
-
-size_t wxStringBase::find_last_not_of(const wxChar* sz, size_t nStart,
-                                      size_t n) const
-{
-    return find_last_not_of(wxStringBase(sz, n), nStart);
-}
-
-size_t wxStringBase::find_last_not_of(wxUniChar ch, size_t nStart) const
-{
-    if ( nStart == npos )
-    {
-        nStart = length() - 1;
-    }
-    else
-    {
-        wxASSERT( nStart <= length() );
-    }
-
-    for ( const_iterator p = begin() + nStart; p != begin(); --p )
-    {
-        if ( *p != ch )
-            return p - begin();
-    }
-
-    return npos;
-}
-
-wxStringBase& wxStringBase::replace(size_t nStart, size_t nLen,
+wxStringImpl& wxStringImpl::replace(size_t nStart, size_t nLen,
                                     const wxChar *sz)
 {
   wxASSERT_MSG( nStart <= length(),
-                _T("index out of bounds in wxStringBase::replace") );
+                _T("index out of bounds in wxStringImpl::replace") );
   size_t strLen = length() - nStart;
   nLen = strLen < nLen ? strLen : nLen;
 
-  wxStringBase strTmp;
+  wxStringImpl strTmp;
   strTmp.reserve(length()); // micro optimisation to avoid multiple mem allocs
 
   //This is kind of inefficient, but its pretty good considering...
@@ -747,34 +619,34 @@ wxStringBase& wxStringBase::replace(size_t nStart, size_t nLen,
   return *this;
 }
 
-wxStringBase& wxStringBase::replace(size_t nStart, size_t nLen,
-                                    size_t nCount, wxUniChar ch)
+wxStringImpl& wxStringImpl::replace(size_t nStart, size_t nLen,
+                                    size_t nCount, wxStringCharType ch)
 {
-  return replace(nStart, nLen, wxStringBase(nCount, ch).c_str());
+  return replace(nStart, nLen, wxStringImpl(nCount, ch).c_str());
 }
 
-wxStringBase& wxStringBase::replace(size_t nStart, size_t nLen,
-                                    const wxStringBase& str,
+wxStringImpl& wxStringImpl::replace(size_t nStart, size_t nLen,
+                                    const wxStringImpl& str,
                                     size_t nStart2, size_t nLen2)
 {
   return replace(nStart, nLen, str.substr(nStart2, nLen2));
 }
 
-wxStringBase& wxStringBase::replace(size_t nStart, size_t nLen,
+wxStringImpl& wxStringImpl::replace(size_t nStart, size_t nLen,
                                     const wxChar* sz, size_t nCount)
 {
-  return replace(nStart, nLen, wxStringBase(sz, nCount).c_str());
+  return replace(nStart, nLen, wxStringImpl(sz, nCount).c_str());
 }
 
-wxStringBase wxStringBase::substr(size_t nStart, size_t nLen) const
+wxStringImpl wxStringImpl::substr(size_t nStart, size_t nLen) const
 {
   if ( nLen == npos )
     nLen = length() - nStart;
-  return wxStringBase(*this, nStart, nLen);
+  return wxStringImpl(*this, nStart, nLen);
 }
 
 // assigns one string to another
-wxStringBase& wxStringBase::operator=(const wxStringBase& stringSrc)
+wxStringImpl& wxStringImpl::operator=(const wxStringImpl& stringSrc)
 {
   wxASSERT( stringSrc.GetStringData()->IsValid() );
 
@@ -795,26 +667,26 @@ wxStringBase& wxStringBase::operator=(const wxStringBase& stringSrc)
 }
 
 // assigns a single character
-wxStringBase& wxStringBase::operator=(wxUniChar ch)
+wxStringImpl& wxStringImpl::operator=(wxStringCharType ch)
 {
   wxChar c(ch);
   if ( !AssignCopy(1, &c) ) {
-    wxFAIL_MSG( _T("out of memory in wxStringBase::operator=(wxChar)") );
+    wxFAIL_MSG( _T("out of memory in wxStringImpl::operator=(wxChar)") );
   }
   return *this;
 }
 
 // assigns C string
-wxStringBase& wxStringBase::operator=(const wxChar *psz)
+wxStringImpl& wxStringImpl::operator=(const wxChar *psz)
 {
   if ( !AssignCopy(wxStrlen(psz), psz) ) {
-    wxFAIL_MSG( _T("out of memory in wxStringBase::operator=(const wxChar *)") );
+    wxFAIL_MSG( _T("out of memory in wxStringImpl::operator=(const wxChar *)") );
   }
   return *this;
 }
 
 // helper function: does real copy
-bool wxStringBase::AssignCopy(size_t nSrcLen, const wxChar *pszSrcData)
+bool wxStringImpl::AssignCopy(size_t nSrcLen, const wxChar *pszSrcData)
 {
   if ( nSrcLen == 0 ) {
     Reinit();
@@ -836,7 +708,7 @@ bool wxStringBase::AssignCopy(size_t nSrcLen, const wxChar *pszSrcData)
 // ---------------------------------------------------------------------------
 
 // add something to this string
-bool wxStringBase::ConcatSelf(size_t nSrcLen, const wxChar *pszSrcData,
+bool wxStringImpl::ConcatSelf(size_t nSrcLen, const wxChar *pszSrcData,
                               size_t nMaxLen)
 {
   STATISTICS_ADD(SummandLength, nSrcLen);
@@ -893,48 +765,113 @@ bool wxStringBase::ConcatSelf(size_t nSrcLen, const wxChar *pszSrcData,
 
 #endif // !wxUSE_STL_BASED_WXSTRING
 
-#if !wxUSE_STL_BASED_WXSTRING || !defined(HAVE_STD_STRING_COMPARE)
+#ifdef HAVE_STD_STRING_COMPARE
 
-#if !wxUSE_STL_BASED_WXSTRING
-    #define STRINGCLASS wxStringBase
-#else
-    #define STRINGCLASS wxString
-#endif
+// NB: Comparison code (both with and without HAVE_STD_STRING_COMPARE) works
+//     with UTF-8 encoded strings too, thanks to UTF-8's design, which lets us
+//     sort strings in code point order simply by comparing their byte
+//     sequences by byte value (i.e. what strcmp() and memcmp() do).
+
+int wxString::compare(const wxString& str) const
+{   // whole-string comparison, delegated to the implementation strings
+    return m_impl.compare(str.m_impl);
+}
+
+int wxString::compare(size_t nStart, size_t nLen,
+                      const wxString& str) const
+{   // compares the (nStart, nLen) range of this string against all of str
+    size_t pos, len; // range as passed on to m_impl, filled in just below
+    PosLenToImpl(nStart, nLen, &pos, &len); // presumably maps to m_impl units
+    return m_impl.compare(pos, len, str.m_impl);
+}
+
+int wxString::compare(size_t nStart, size_t nLen,
+                      const wxString& str,
+                      size_t nStart2, size_t nLen2) const
+{   // compares a range of this string against a range of str
+    size_t pos, len; // this string's range, as handed to m_impl
+    PosLenToImpl(nStart, nLen, &pos, &len);
+
+    size_t pos2, len2; // str's range; translated by str itself, not by *this
+    str.PosLenToImpl(nStart2, nLen2, &pos2, &len2);
+
+    return m_impl.compare(pos, len, str.m_impl, pos2, len2);
+}
+
+int wxString::compare(const char* sz) const
+{   // sz is passed through ImplStr() before m_impl compares against it
+    return m_impl.compare(ImplStr(sz));
+}
+
+int wxString::compare(const wchar_t* sz) const
+{   // sz is passed through ImplStr() before m_impl compares against it
+    return m_impl.compare(ImplStr(sz));
+}
+
+int wxString::compare(size_t nStart, size_t nLen,
+                      const char* sz, size_t nCount) const
+{   // compares the (nStart, nLen) range of this string with nCount chars of sz
+    size_t pos, len; // range as passed on to m_impl
+    PosLenToImpl(nStart, nLen, &pos, &len);
+
+    SubstrBufFromMB str(ImplStr(sz, nCount)); // via ImplStr(), as in the #else
 
-static inline int wxDoCmp(const wxChar* s1, size_t l1,
-                          const wxChar* s2, size_t l2)
+    return m_impl.compare(pos, len, str.data, str.len);
+}
+
+int wxString::compare(size_t nStart, size_t nLen,
+                      const wchar_t* sz, size_t nCount) const
+{   // compares the (nStart, nLen) range of this string with nCount chars of sz
+    size_t pos, len; // range as passed on to m_impl
+    PosLenToImpl(nStart, nLen, &pos, &len);
+
+    SubstrBufFromWC str(ImplStr(sz, nCount)); // via ImplStr(), as in the #else
+
+    return m_impl.compare(pos, len, str.data, str.len);
+}
+
+#else // !HAVE_STD_STRING_COMPARE
+
+static inline int wxDoCmp(const wxStringCharType* s1, size_t l1,
+                          const wxStringCharType* s2, size_t l2) // ptr+length
 {
     if( l1 == l2 )
-        return wxTmemcmp(s1, s2, l1);
+        return wxStringMemcmp(s1, s2, l1); // equal lengths: result used as is
     else if( l1 < l2 )
     {
-        int ret = wxTmemcmp(s1, s2, l1);
+        int ret = wxStringMemcmp(s1, s2, l1); // s1 shorter: a tie yields -1
         return ret == 0 ? -1 : ret;
     }
     else
     {
-        int ret = wxTmemcmp(s1, s2, l2);
+        int ret = wxStringMemcmp(s1, s2, l2); // s2 shorter: a tie yields +1
         return ret == 0 ? +1 : ret;
     }
 }
 
-int STRINGCLASS::compare(const wxStringBase& str) const
+int wxString::compare(const wxString& str) const
 {
-    return ::wxDoCmp(data(), length(), str.data(), str.length());
+    return ::wxDoCmp(m_impl.data(), m_impl.length(), // whole of this string
+                     str.m_impl.data(), str.m_impl.length()); // whole of str
 }
 
-int STRINGCLASS::compare(size_t nStart, size_t nLen,
-                         const wxStringBase& str) const
+int wxString::compare(size_t nStart, size_t nLen,
+                      const wxString& str) const
 {
     wxASSERT(nStart <= length());
     size_type strLen = length() - nStart;
     nLen = strLen < nLen ? strLen : nLen;
-    return ::wxDoCmp(data() + nStart, nLen, str.data(), str.length());
+
+    size_t pos, len; // the (already clamped) range, as used with m_impl below
+    PosLenToImpl(nStart, nLen, &pos, &len); // presumably maps to m_impl units
+
+    return ::wxDoCmp(m_impl.data() + pos,  len,
+                     str.m_impl.data(), str.m_impl.length()); // all of str
 }
 
-int STRINGCLASS::compare(size_t nStart, size_t nLen,
-                         const wxStringBase& str,
-                         size_t nStart2, size_t nLen2) const
+int wxString::compare(size_t nStart, size_t nLen,
+                      const wxString& str,
+                      size_t nStart2, size_t nLen2) const
 {
     wxASSERT(nStart <= length());
     wxASSERT(nStart2 <= str.length());
@@ -942,30 +879,67 @@ int STRINGCLASS::compare(size_t nStart, size_t nLen,
               strLen2 = str.length() - nStart2;
     nLen  = strLen  < nLen  ? strLen  : nLen;
     nLen2 = strLen2 < nLen2 ? strLen2 : nLen2;
-    return ::wxDoCmp(data() + nStart, nLen, str.data() + nStart2, nLen2);
+
+    size_t pos, len;
+    PosLenToImpl(nStart, nLen, &pos, &len);
+    size_t pos2, len2;
+    str.PosLenToImpl(nStart2, nLen2, &pos2, &len2);
+
+    return ::wxDoCmp(m_impl.data() + pos, len,
+                     str.m_impl.data() + pos2, len2);
+}
+
+int wxString::compare(const char* sz) const
+{   // whole-string comparison against sz
+    SubstrBufFromMB str(ImplStr(sz, npos)); // npos: no explicit length given
+    if ( str.len == npos ) // length still unknown after ImplStr(): measure it
+        str.len = wxStringStrlen(str.data);
+    return ::wxDoCmp(m_impl.data(), m_impl.length(), str.data, str.len);
+}
 
-int STRINGCLASS::compare(const wxChar* sz) const
+int wxString::compare(const wchar_t* sz) const
 {
-    size_t nLen = wxStrlen(sz);
-    return ::wxDoCmp(data(), length(), sz, nLen);
+    SubstrBufFromWC str(ImplStr(sz, npos)); // npos: no explicit length given
+    if ( str.len == npos ) // length still unknown after ImplStr(): measure it
+        str.len = wxStringStrlen(str.data);
+    return ::wxDoCmp(m_impl.data(), m_impl.length(), str.data, str.len);
 }
 
-int STRINGCLASS::compare(size_t nStart, size_t nLen,
-                         const wxChar* sz, size_t nCount) const
+int wxString::compare(size_t nStart, size_t nLen,
+                      const char* sz, size_t nCount) const
 {
     wxASSERT(nStart <= length());
     size_type strLen = length() - nStart;
     nLen = strLen < nLen ? strLen : nLen;
-    if( nCount == npos )
-        nCount = wxStrlen(sz);
 
-    return ::wxDoCmp(data() + nStart, nLen, sz, nCount);
+    size_t pos, len; // the (already clamped) range, as used with m_impl below
+    PosLenToImpl(nStart, nLen, &pos, &len);
+
+    SubstrBufFromMB str(ImplStr(sz, nCount));
+    if ( str.len == npos ) // length still unknown after ImplStr(): measure it
+        str.len = wxStringStrlen(str.data);
+
+    return ::wxDoCmp(m_impl.data() + pos, len, str.data, str.len);
 }
 
-#undef STRINGCLASS
+int wxString::compare(size_t nStart, size_t nLen,
+                      const wchar_t* sz, size_t nCount) const
+{   // compares the (nStart, nLen) range of this string with nCount chars of sz
+    wxASSERT(nStart <= length());
+    size_type strLen = length() - nStart; // what is left after nStart
+    nLen = strLen < nLen ? strLen : nLen; // clamp nLen to the end of the string
+
+    size_t pos, len; // the clamped range, as used with m_impl.data() below
+    PosLenToImpl(nStart, nLen, &pos, &len);
+
+    SubstrBufFromWC str(ImplStr(sz, nCount));
+    if ( str.len == npos ) // length still unknown after ImplStr(): measure it
+        str.len = wxStringStrlen(str.data);
+
+    return ::wxDoCmp(m_impl.data() + pos, len, str.data, str.len);
+}
 
-#endif // !wxUSE_STL_BASED_WXSTRING || !defined(HAVE_STD_STRING_COMPARE)
+#endif // HAVE_STD_STRING_COMPARE/!HAVE_STD_STRING_COMPARE
 
 // ===========================================================================
 // wxString class core
@@ -975,11 +949,54 @@ int STRINGCLASS::compare(size_t nStart, size_t nLen,
 // construction and conversion
 // ---------------------------------------------------------------------------
 
+#if wxUSE_UNICODE
+/* static: char* input variant, compiled only when wxUSE_UNICODE is set */
+wxString::SubstrBufFromMB wxString::ConvertStr(const char *psz, size_t nLength,
+                                           const wxMBConv& conv)
+{
+    // nothing to convert for a NULL pointer or a zero length
+    if ( !psz || nLength == 0 )
+        return SubstrBufFromMB();
+
+    if ( nLength == npos ) // map the npos sentinel to wxNO_LEN for conv
+        nLength = wxNO_LEN;
+
+    size_t wcLen; // passed to cMB2WC() as its output-length argument
+    wxWCharBuffer wcBuf(conv.cMB2WC(psz, nLength, &wcLen));
+    if ( !wcLen ) // zero-length result: hand back an empty buffer
+        return SubstrBufFromMB();
+    else
+        return SubstrBufFromMB(wcBuf, wcLen);
+}
+#else
+/* static: wchar_t* input variant, compiled only without wxUSE_UNICODE */
+wxString::SubstrBufFromWC wxString::ConvertStr(const wchar_t *pwz, size_t nLength,
+                                           const wxMBConv& conv)
+{
+    // nothing to convert for a NULL pointer or a zero length
+    if ( !pwz || nLength == 0 )
+        return SubstrBufFromWC();
+
+    if ( nLength == npos ) // map the npos sentinel to wxNO_LEN for conv
+        nLength = wxNO_LEN;
+
+    size_t mbLen; // passed to cWC2MB() as its output-length argument
+    wxCharBuffer mbBuf(conv.cWC2MB(pwz, nLength, &mbLen));
+    if ( !mbLen ) // zero-length result: hand back an empty buffer
+        return SubstrBufFromWC();
+    else
+        return SubstrBufFromWC(mbBuf, mbLen);
+}
+#endif
+
+
 #if wxUSE_UNICODE
 
 // from multibyte string
 wxString::wxString(const char *psz, const wxMBConv& conv, size_t nLength)
 {
+    // FIXME-UTF8: this will need changes
+
     // anything to do?
     if ( psz && nLength != 0 )
     {
@@ -996,6 +1013,11 @@ wxString::wxString(const char *psz, const wxMBConv& conv, size_t nLength)
     }
 }
 
+wxString::wxString(const char *psz, size_t nLength)
+{   // forwards both arguments unchanged to assign()
+    assign(psz, nLength);
+}
+
 //Convert wxString in Unicode mode to a multi-byte string
 const wxCharBuffer wxString::mb_str(const wxMBConv& conv) const
 {
@@ -1009,6 +1031,8 @@ const wxCharBuffer wxString::mb_str(const wxMBConv& conv) const
 // from wide string
 wxString::wxString(const wchar_t *pwz, const wxMBConv& conv, size_t nLength)
 {
+    // FIXME-UTF8: this will need changes
+
     // anything to do?
     if ( pwz && nLength != 0 )
     {
@@ -1023,6 +1047,12 @@ wxString::wxString(const wchar_t *pwz, const wxMBConv& conv, size_t nLength)
         if ( nLenMB )
             assign(buf, nLenMB);
     }
+
+}
+
+wxString::wxString(const wchar_t *pwz, size_t nLength)
+{   // forwards both arguments unchanged to assign()
+    assign(pwz, nLength);
 }
 
 //Converts this string to a wide character string if unicode
@@ -1044,9 +1074,9 @@ bool wxString::Shrink()
   return tmp.length() == length();
 }
 
-#if !wxUSE_STL_BASED_WXSTRING
+#if !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
 // get the pointer to writable buffer of (at least) nLen bytes
-wxChar *wxString::DoGetWriteBuf(size_t nLen)
+wxChar *wxStringImpl::DoGetWriteBuf(size_t nLen)
 {
   if ( !AllocBeforeWrite(nLen) ) {
     // allocation failure handled by caller
@@ -1060,12 +1090,12 @@ wxChar *wxString::DoGetWriteBuf(size_t nLen)
 }
 
 // put string back in a reasonable state after GetWriteBuf
-void wxString::DoUngetWriteBuf()
+void wxStringImpl::DoUngetWriteBuf()
 {
   DoUngetWriteBuf(wxStrlen(m_pchData));
 }
 
-void wxString::DoUngetWriteBuf(size_t nLen)
+void wxStringImpl::DoUngetWriteBuf(size_t nLen)
 {
   wxStringData * const pData = GetStringData();
 
@@ -1095,7 +1125,7 @@ void wxString::UngetWriteBuf(size_t nLen)
 }
 #endif // WXWIN_COMPATIBILITY_2_8
 
-#endif // !wxUSE_STL_BASED_WXSTRING
+#endif // !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
 
 
 // ---------------------------------------------------------------------------
@@ -1138,8 +1168,8 @@ wxString& wxString::operator=(const wchar_t *pwz)
 wxString operator+(const wxString& str1, const wxString& str2)
 {
 #if !wxUSE_STL_BASED_WXSTRING
-    wxASSERT( str1.GetStringData()->IsValid() );
-    wxASSERT( str2.GetStringData()->IsValid() );
+    wxASSERT( str1.IsValid() );
+    wxASSERT( str2.IsValid() );
 #endif
 
     wxString s = str1;
@@ -1151,7 +1181,7 @@ wxString operator+(const wxString& str1, const wxString& str2)
 wxString operator+(const wxString& str, wxUniChar ch)
 {
 #if !wxUSE_STL_BASED_WXSTRING
-    wxASSERT( str.GetStringData()->IsValid() );
+    wxASSERT( str.IsValid() );
 #endif
 
     wxString s = str;
@@ -1163,7 +1193,7 @@ wxString operator+(const wxString& str, wxUniChar ch)
 wxString operator+(wxUniChar ch, const wxString& str)
 {
 #if !wxUSE_STL_BASED_WXSTRING
-    wxASSERT( str.GetStringData()->IsValid() );
+    wxASSERT( str.IsValid() );
 #endif
 
     wxString s = ch;
@@ -1172,14 +1202,14 @@ wxString operator+(wxUniChar ch, const wxString& str)
     return s;
 }
 
-wxString operator+(const wxString& str, const wxChar *psz)
+wxString operator+(const wxString& str, const char *psz)
 {
 #if !wxUSE_STL_BASED_WXSTRING
-    wxASSERT( str.GetStringData()->IsValid() );
+    wxASSERT( str.IsValid() );
 #endif
 
     wxString s;
-    if ( !s.Alloc(wxStrlen(psz) + str.length()) ) {
+    if ( !s.Alloc(strlen(psz) + str.length()) ) {
         wxFAIL_MSG( _T("out of memory in wxString::operator+") );
     }
     s += str;
@@ -1188,14 +1218,30 @@ wxString operator+(const wxString& str, const wxChar *psz)
     return s;
 }
 
-wxString operator+(const wxChar *psz, const wxString& str)
+wxString operator+(const wxString& str, const wchar_t *pwz)
 {
 #if !wxUSE_STL_BASED_WXSTRING
-    wxASSERT( str.GetStringData()->IsValid() );
+    wxASSERT( str.IsValid() );
+#endif
+
+    wxString s;
+    if ( !s.Alloc(wxWcslen(pwz) + str.length()) ) {
+        wxFAIL_MSG( _T("out of memory in wxString::operator+") );
+    }
+    s += str;
+    s += pwz;
+
+    return s;
+}
+
+wxString operator+(const char *psz, const wxString& str)
+{
+#if !wxUSE_STL_BASED_WXSTRING
+    wxASSERT( str.IsValid() );
 #endif
 
     wxString s;
-    if ( !s.Alloc(wxStrlen(psz) + str.length()) ) {
+    if ( !s.Alloc(strlen(psz) + str.length()) ) {
         wxFAIL_MSG( _T("out of memory in wxString::operator+") );
     }
     s = psz;
@@ -1204,64 +1250,236 @@ wxString operator+(const wxChar *psz, const wxString& str)
     return s;
 }
 
-// ===========================================================================
-// other common string functions
-// ===========================================================================
+wxString operator+(const wchar_t *pwz, const wxString& str)
+{
+#if !wxUSE_STL_BASED_WXSTRING
+    wxASSERT( str.IsValid() );
+#endif
+
+    wxString s;
+    if ( !s.Alloc(wxWcslen(pwz) + str.length()) ) {
+        wxFAIL_MSG( _T("out of memory in wxString::operator+") );
+    }
+    s = pwz;
+    s += str;
+
+    return s;
+}
+
+// ---------------------------------------------------------------------------
+// find_{first,last}_[not]_of functions
+// ---------------------------------------------------------------------------
 
-int wxString::Cmp(const wxString& s) const
+#if !wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8
+
+// NB: All these functions are implemented with the argument being wxChar*,
+//     i.e. a wide character string in any Unicode build, even though the
+//     native string representation is char* in the UTF-8 build. This is because
+//     we couldn't use memchr() to test if a character is in a UTF-8 encoded set.
+
+size_t wxString::find_first_of(const wxChar* sz, size_t nStart) const
 {
-    return compare(s);
+    return find_first_of(sz, nStart, wxStrlen(sz));
 }
 
-int wxString::Cmp(const wxChar* psz) const
+size_t wxString::find_first_not_of(const wxChar* sz, size_t nStart) const
 {
-    return compare(psz);
+    return find_first_not_of(sz, nStart, wxStrlen(sz));
 }
 
-static inline int wxDoCmpNoCase(const wxChar* s1, size_t l1,
-                                const wxChar* s2, size_t l2)
+size_t wxString::find_first_of(const wxChar* sz, size_t nStart, size_t n) const
 {
-    size_t i;
+    wxASSERT_MSG( nStart <= length(),  _T("invalid index") );
 
-    if( l1 == l2 )
+    size_t idx = nStart;
+    for ( const_iterator i = begin() + nStart; i != end(); ++idx, ++i )
     {
-        for(i = 0; i < l1; ++i)
-        {
-            if(wxTolower(s1[i]) != wxTolower(s2[i]))
-                break;
-        }
-        return i == l1 ? 0 : wxTolower(s1[i]) < wxTolower(s2[i]) ? -1 : 1;
+        if ( wxTmemchr(sz, *i, n) )
+            return idx;
     }
-    else if( l1 < l2 )
+
+    return npos;
+}
+
+size_t wxString::find_first_not_of(const wxChar* sz, size_t nStart, size_t n) const
+{
+    wxASSERT_MSG( nStart <= length(),  _T("invalid index") );
+
+    size_t idx = nStart;
+    for ( const_iterator i = begin() + nStart; i != end(); ++idx, ++i )
     {
-        for(i = 0; i < l1; ++i)
-        {
-            if(wxTolower(s1[i]) != wxTolower(s2[i]))
-                break;
-        }
-        return i == l1 ? -1 : wxTolower(s1[i]) < wxTolower(s2[i]) ? -1 : 1;
+        if ( !wxTmemchr(sz, *i, n) )
+            return idx;
+    }
+
+    return npos;
+}
+
+
+size_t wxString::find_last_of(const wxChar* sz, size_t nStart) const
+{
+    return find_last_of(sz, nStart, wxStrlen(sz));
+}
+
+size_t wxString::find_last_not_of(const wxChar* sz, size_t nStart) const
+{
+    return find_last_not_of(sz, nStart, wxStrlen(sz));
+}
+
+size_t wxString::find_last_of(const wxChar* sz, size_t nStart, size_t n) const
+{
+    // nStart is the last index examined; npos or length() start from the end
+    const size_t len = length();
+    if ( len == 0 )
+    {
+        return npos; // nothing to search and len - 1 below would wrap
     }
     else
     {
-        for(i = 0; i < l2; ++i)
-        {
-            if(wxTolower(s1[i]) != wxTolower(s2[i]))
-                break;
-        }
-        return i == l2 ? 1 : wxTolower(s1[i]) < wxTolower(s2[i]) ? -1 : 1;
+        wxASSERT_MSG( nStart == npos || nStart <= len, _T("invalid index") );
+        if ( nStart >= len )
+            nStart = len - 1; // clamp: the iterator offset below must be valid
+    }
+    for ( const_reverse_iterator i = rbegin() + (len - nStart - 1);
+          i != rend(); --nStart, ++i )
+    {
+        if ( wxTmemchr(sz, *i, n) )
+            return nStart; // nStart tracks the index of the character *i
     }
+
+    return npos;
 }
 
-int wxString::CmpNoCase(const wxString& s) const
+size_t wxString::find_last_not_of(const wxChar* sz, size_t nStart, size_t n) const
+{
+    // Returns the index of the last character at or before nStart which is
+    // not among the first n characters of sz, or npos if there is none.
+    // As with std::string, nStart == npos or length() starts from the end.
+    const size_t len = length();
+    if ( len == 0 )
+        return npos;
+
+    wxASSERT_MSG( nStart == npos || nStart <= len, _T("invalid index") );
+    if ( nStart >= len )
+        nStart = len - 1; // clamp so that the iterator offset below is valid
+
+    size_t idx = nStart;
+    for ( const_reverse_iterator i = rbegin() + (len - nStart - 1);
+          i != rend(); --idx, ++i )
+    {
+        if ( !wxTmemchr(sz, *i, n) )
+            return idx;
+    }
+
+    return npos;
+}
+
+size_t wxString::find_first_not_of(wxUniChar ch, size_t nStart) const
 {
-    return wxDoCmpNoCase(data(), length(), s.data(), s.length());
+    wxASSERT_MSG( nStart <= length(),  _T("invalid index") );
+
+    size_t idx = nStart;
+    for ( const_iterator i = begin() + nStart; i != end(); ++idx, ++i )
+    {
+        if ( *i != ch )
+            return idx;
+    }
+
+    return npos;
 }
 
-int wxString::CmpNoCase(const wxChar* psz) const
+size_t wxString::find_last_not_of(wxUniChar ch, size_t nStart) const
 {
-    int nLen = wxStrlen(psz);
+    // Returns the index of the last character at or before nStart which is
+    // different from ch, or npos if there is none. nStart == npos or length()
+    // means that the search starts from the last character.
+    const size_t len = length();
+    if ( len == 0 )
+        return npos;
+
+    wxASSERT_MSG( nStart == npos || nStart <= len, _T("invalid index") );
+    if ( nStart >= len )
+        nStart = len - 1; // clamp so that the iterator offset below is valid
+
+    size_t idx = nStart;
+    for ( const_reverse_iterator i = rbegin() + (len - nStart - 1);
+          i != rend(); --idx, ++i )
+    {
+        if ( *i != ch )
+            return idx;
+    }
+
+    return npos;
+}
+
+// The functions above take wchar_t* arguments in Unicode build and char*
+// ones in ANSI build; the overloads below accept the other character type
+// and convert the argument using wxConvLibc before forwarding to them:
+#if wxUSE_UNICODE
+    #define wxOtherCharType char
+    #define STRCONV         (const wxChar*)wxConvLibc.cMB2WC
+#else
+    #define wxOtherCharType wchar_t
+    #define STRCONV         (const wxChar*)wxConvLibc.cWC2MB
+#endif
+
+size_t wxString::find_first_of(const wxOtherCharType* sz, size_t nStart) const
+    { return find_first_of(STRCONV(sz), nStart); }
+
+size_t wxString::find_first_of(const wxOtherCharType* sz, size_t nStart,
+                               size_t n) const
+    { return find_first_of(STRCONV(sz, n, NULL), nStart, n); }
+size_t wxString::find_last_of(const wxOtherCharType* sz, size_t nStart) const
+    { return find_last_of(STRCONV(sz), nStart); }
+size_t wxString::find_last_of(const wxOtherCharType* sz, size_t nStart,
+                              size_t n) const
+    { return find_last_of(STRCONV(sz, n, NULL), nStart, n); }
+size_t wxString::find_first_not_of(const wxOtherCharType* sz, size_t nStart) const
+    { return find_first_not_of(STRCONV(sz), nStart); }
+size_t wxString::find_first_not_of(const wxOtherCharType* sz, size_t nStart,
+                                   size_t n) const
+    { return find_first_not_of(STRCONV(sz, n, NULL), nStart, n); }
+size_t wxString::find_last_not_of(const wxOtherCharType* sz, size_t nStart) const
+    { return find_last_not_of(STRCONV(sz), nStart); }
+size_t wxString::find_last_not_of(const wxOtherCharType* sz, size_t nStart,
+                                  size_t n) const
+    { return find_last_not_of(STRCONV(sz, n, NULL), nStart, n); }
+
+#undef wxOtherCharType
+#undef STRCONV
+
+#endif // !wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8
+
+// ===========================================================================
+// other common string functions
+// ===========================================================================
+
+int wxString::CmpNoCase(const wxString& s) const
+{
+    // case-insensitive compare: returns -1 if *this < s, 1 if *this > s, else 0
+    // FIXME-UTF8: use wxUniChar::ToLower/ToUpper once added
+
+    const_iterator i1 = begin();
+    const_iterator end1 = end();
+    const_iterator i2 = s.begin();
+    const_iterator end2 = s.end();
+
+    for ( ; i1 != end1 && i2 != end2; ++i1, ++i2 )
+    {
+        wxUniChar lower1 = (wxChar)wxTolower(*i1);
+        wxUniChar lower2 = (wxChar)wxTolower(*i2);
+        if ( lower1 != lower2 )
+            return lower1 < lower2 ? -1 : 1;
+    }
+
+    size_t len1 = length();
+    size_t len2 = s.length();
 
-    return wxDoCmpNoCase(data(), length(), psz, nLen);
+    if ( len1 < len2 )
+        return -1;
+    else if ( len1 > len2 )
+        return 1;
+    return 0;
 }
 
 
@@ -2041,10 +2259,9 @@ match:
 int wxString::Freq(wxUniChar ch) const
 {
     int count = 0;
-    int len = length();
-    for (int i = 0; i < len; i++)
+    for ( const_iterator i = begin(); i != end(); ++i )
     {
-        if (GetChar(i) == ch)
+        if ( *i == ch )
             count ++;
     }
     return count;
diff --git a/src/common/strvararg.cpp b/src/common/strvararg.cpp
index e3435e6713..00e30cbf84 100644
--- a/src/common/strvararg.cpp
+++ b/src/common/strvararg.cpp
@@ -32,14 +32,14 @@
 // implementation
 // ============================================================================
 
-const wxArgNativeCharType *wxArgNormalizer<const wxCStrData&>::get() const
+const wxStringCharType *wxArgNormalizer<const wxCStrData&>::get() const
 {
     return m_value;
 }
 
-const wxArgNativeCharType *wxArgNormalizer<const wxString&>::get() const
+const wxStringCharType *wxArgNormalizer<const wxString&>::get() const
 {
-    return m_value.c_str();
+    return m_value.wx_str();
 }
 
 #if wxUSE_UNICODE_WCHAR
-- 
2.50.0