include/wx/string.h

   1 ///////////////////////////////////////////////////////////////////////////////
   2 // Name:        wx/string.h
   3 // Purpose:     wxString class
   4 // Author:      Vadim Zeitlin
   5 // Modified by:
   6 // Created:     29/01/98
   7 // RCS-ID:      $Id$
   8 // Copyright:   (c) 1998 Vadim Zeitlin <zeitlin@dptmaths.ens-cachan.fr>
   9 // Licence:     wxWindows licence
  10 ///////////////////////////////////////////////////////////////////////////////
  11
  12 /*
  13     Efficient string class [more or less] compatible with MFC CString,
  14     wxWidgets version 1 wxString and std::string and some handy functions
  15     missing from string.h.
  16 */
  17
  18 #ifndef _WX_WXSTRING_H__
  19 #define _WX_WXSTRING_H__
  20
  21 // ----------------------------------------------------------------------------
  22 // headers
  23 // ----------------------------------------------------------------------------
  24
  25 #include "wx/defs.h"        // everybody should include this
  26
  27 #ifndef __WXPALMOS5__
  28 #if defined(__WXMAC__) || defined(__VISAGECPP__)
  29     #include <ctype.h>
  30 #endif
  31
  32 #if defined(__VISAGECPP__) && __IBMCPP__ >= 400
  33    // problem in VACPP V4 with including stdlib.h multiple times
  34    // strconv includes it anyway
  35 #  include <stdio.h>
  36 #  include <string.h>
  37 #  include <stdarg.h>
  38 #  include <limits.h>
  39 #else
  40 #  include <string.h>
  41 #  include <stdio.h>
  42 #  include <stdarg.h>
  43 #  include <limits.h>
  44 #  include <stdlib.h>
  45 #endif
  46
  47 #ifdef HAVE_STRCASECMP_IN_STRINGS_H
  48     #include <strings.h>    // for strcasecmp()
  49 #endif // HAVE_STRCASECMP_IN_STRINGS_H
  50 #endif // ! __WXPALMOS5__
  51
  52 #include "wx/wxcrtbase.h"   // for wxChar, wxStrlen() etc.
  53 #include "wx/strvararg.h"
  54 #include "wx/buffer.h"      // for wxCharBuffer
  55 #include "wx/strconv.h"     // for wxConvertXXX() macros and wxMBConv classes
  56 #include "wx/stringimpl.h"
  57 #include "wx/stringops.h"
  58 #include "wx/unichar.h"
  59
  60 // by default we cache the mapping of the positions in UTF-8 string to the byte
  61 // offset as this results in noticeable performance improvements for loops over
  62 // strings using indices; comment out this line to disable this
  63 //
  64 // notice that this optimization is well worth using even in debug builds as it
  65 // changes asymptotic complexity of algorithms using indices to iterate over
  66 // wxString back to expected linear from quadratic
  67 //
  68 // also notice that wxTLS_TYPE() (__declspec(thread) in this case) is unsafe to
  69 // use in DLL build under pre-Vista Windows so we disable this code for now, if
  70 // anybody really needs to use UTF-8 build under Windows with this optimization
  71 // it would have to be re-tested and probably corrected
  72 #if wxUSE_UNICODE_UTF8 && !defined(__WXMSW__)
  73     #define wxUSE_STRING_POS_CACHE 1
  74 #else
  75     #define wxUSE_STRING_POS_CACHE 0
  76 #endif
  77
  78 #if wxUSE_STRING_POS_CACHE
  79     #include "wx/tls.h"
  80
  81     // change this 0 to 1 to enable additional (very expensive) asserts
  82     // verifying that string caching logic works as expected
  83     #if 0
  84         #define wxSTRING_CACHE_ASSERT(cond) wxASSERT(cond)
  85     #else
  86         #define wxSTRING_CACHE_ASSERT(cond)
  87     #endif
  88 #endif // wxUSE_STRING_POS_CACHE
  89
  90 class WXDLLIMPEXP_FWD_BASE wxString;
  91
  92 // unless this symbol is predefined to disable the compatibility functions, do
  93 // use them
  94 #ifndef WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
  95     #define WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER 1
  96 #endif
  97
  98 namespace wxPrivate
  99 {
 100     template <typename T> struct wxStringAsBufHelper;
 101 }
 102
 103 // ---------------------------------------------------------------------------
 104 // macros
 105 // ---------------------------------------------------------------------------
 106
 107 // casts [unfortunately!] needed to call some broken functions which require
 108 // "char *" instead of "const char *"
 109 #define   WXSTRINGCAST (wxChar *)(const wxChar *)
 110 #define   wxCSTRINGCAST (wxChar *)(const wxChar *)
 111 #define   wxMBSTRINGCAST (char *)(const char *)
 112 #define   wxWCSTRINGCAST (wchar_t *)(const wchar_t *)
 113
 114 // ----------------------------------------------------------------------------
 115 // constants
 116 // ----------------------------------------------------------------------------
 117
 118 #if WXWIN_COMPATIBILITY_2_6
 119
 120 // deprecated in favour of wxString::npos, don't use in new code
 121 //
 122 // maximum possible length for a string means "take all string" everywhere
 123 #define wxSTRING_MAXLEN wxString::npos
 124
 125 #endif // WXWIN_COMPATIBILITY_2_6
 126
 127 // ---------------------------------------------------------------------------
 128 // global functions complementing the standard C string library: replacements
 129 // for strlen() and a portable strcasecmp()
 130 //---------------------------------------------------------------------------
 131
 132 #if WXWIN_COMPATIBILITY_2_8
 133 // Use wxXXX() functions from wxcrt.h instead! These functions are for
 134 // backwards compatibility only.
 135
 136 // returns true if the passed in pointer is NULL or points to an empty string
 137 wxDEPRECATED( inline bool IsEmpty(const char *p) );
 138 inline bool IsEmpty(const char *p) { return p == NULL || *p == '\0'; }
 139
 140 // NULL-tolerant strlen(): the length of psz, or 0 for a NULL pointer
 141 wxDEPRECATED( inline size_t Strlen(const char *psz) );
 142 inline size_t Strlen(const char *psz)
 143   { if ( !psz ) return 0; return strlen(psz); }
 144
 145 // portable strcasecmp/_stricmp: case-insensitive comparison of C strings
 146 wxDEPRECATED( inline int Stricmp(const char *psz1, const char *psz2) );
 147 inline int Stricmp(const char *psz1, const char *psz2)
 148 {
 149 #if defined(__VISUALC__) && defined(__WXWINCE__)
 150   int c1, c2; // tolower() takes and returns int in unsigned char range
 151   do {
 152     c1 = tolower((unsigned char)*psz1++);
 153     c2 = tolower((unsigned char)*psz2++);
 154   } while ( c1 && (c1 == c2) );
 155
 156   return c1 - c2;
 157 #elif defined(__VISUALC__) || ( defined(__MWERKS__) && defined(__INTEL__) )
 158   return _stricmp(psz1, psz2);
 159 #elif defined(__SC__)
 160   return _stricmp(psz1, psz2);
 161 #elif defined(__BORLANDC__)
 162   return stricmp(psz1, psz2);
 163 #elif defined(__WATCOMC__)
 164   return stricmp(psz1, psz2);
 165 #elif defined(__DJGPP__)
 166   return stricmp(psz1, psz2);
 167 #elif defined(__EMX__)
 168   return stricmp(psz1, psz2);
 169 #elif defined(__WXPM__)
 170   return stricmp(psz1, psz2);
 171 #elif defined(__WXPALMOS__) || \
 172       defined(HAVE_STRCASECMP_IN_STRING_H) || \
 173       defined(HAVE_STRCASECMP_IN_STRINGS_H) || \
 174       defined(__GNUWIN32__)
 175   return strcasecmp(psz1, psz2);
 176 #elif defined(__MWERKS__) && !defined(__INTEL__)
 177   int c1, c2; // see the comment in the first branch about the casts below
 178   do {
 179     c1 = tolower((unsigned char)*psz1++);
 180     c2 = tolower((unsigned char)*psz2++);
 181   } while ( c1 && (c1 == c2) );
 182
 183   return c1 - c2;
 184 #else
 185   // almost all compilers/libraries provide this function (unfortunately under
 186   // different names), that's why we don't implement our own here: theirs will
 187   // surely be more efficient than this code (uncomment to use):
 188   /*
 189     int c1, c2;
 190     do {
 191       c1 = tolower((unsigned char)*psz1++);
 192       c2 = tolower((unsigned char)*psz2++);
 193     } while ( c1 && (c1 == c2) );
 194
 195     return c1 - c2;
 196   */
 197
 198   #error  "Please define string case-insensitive compare for your OS/compiler"
 199 #endif  // OS/compiler
 200 }
 201
 202 #endif // WXWIN_COMPATIBILITY_2_8
 203
 204 // ----------------------------------------------------------------------------
 205 // wxCStrData
 206 // ----------------------------------------------------------------------------
 207
 208 // Lightweight object returned by wxString::c_str() and implicitly convertible
 209 // to either const char* or const wchar_t*.
 210 class WXDLLIMPEXP_BASE wxCStrData
 211 {
 212 private:
 213     // Ctor for internal use by wxString and wxCStrData only
 214     wxCStrData(const wxString *str, size_t offset = 0, bool owned = false)
 215         : m_str(str), m_offset(offset), m_owned(owned) {}
 216
 217 public:
 218     // Ctors constructing the object from a narrow or wide string literal; they
 219     // are needed to make operator?: compile and they intentionally take char*,
 220     inline wxCStrData(char *buf); // not const char*
 221     inline wxCStrData(wchar_t *buf);
 222     inline wxCStrData(const wxCStrData& data);
 223
 224     inline ~wxCStrData();
 225
 226     // methods defined inline below must be declared inline or mingw32 3.4.5
 227     // warns about "<symbol> defined locally after being referenced with
 228     // dllimport linkage"
 229 #if wxUSE_UNICODE_WCHAR
 230     inline
 231 #endif
 232     const wchar_t* AsWChar() const;
 233     operator const wchar_t*() const { return AsWChar(); }
 234
 235 #if !wxUSE_UNICODE || wxUSE_UTF8_LOCALE_ONLY
 236     inline
 237 #endif
 238     const char* AsChar() const;
 239     const unsigned char* AsUnsignedChar() const
 240         { return (const unsigned char *) AsChar(); }
 241     operator const char*() const { return AsChar(); }
 242     operator const unsigned char*() const { return AsUnsignedChar(); }
 243
 244     operator const void*() const { return AsChar(); } // AsChar(), untyped
 245
 246     inline const wxCharBuffer AsCharBuf() const;
 247     inline const wxWCharBuffer AsWCharBuf() const;
 248
 249     inline wxString AsString() const;
 250
 251     // returns the value as C string in internal representation (equivalent
 252     // to AsString().wx_str(), but more efficient)
 253     const wxStringCharType *AsInternal() const;
 254
 255     // allow expressions like "c_str()[0]":
 256     inline wxUniChar operator[](size_t n) const;
 257     wxUniChar operator[](int n) const { return operator[](size_t(n)); }
 258     wxUniChar operator[](long n) const { return operator[](size_t(n)); }
 259 #ifndef wxSIZE_T_IS_UINT
 260     wxUniChar operator[](unsigned int n) const { return operator[](size_t(n)); }
 261 #endif // size_t != unsigned int
 262
 263     // these operators are needed to emulate the pointer semantics of c_str():
 264     // expressions like "wxChar *p = str.c_str() + 1;" should continue to work
 265     // (we need all of these versions to resolve ambiguities):
 266     wxCStrData operator+(int n) const
 267         { return wxCStrData(m_str, m_offset + n, m_owned); }
 268     wxCStrData operator+(long n) const
 269         { return wxCStrData(m_str, m_offset + n, m_owned); }
 270     wxCStrData operator+(size_t n) const
 271         { return wxCStrData(m_str, m_offset + n, m_owned); }
 272
 273     // and this one allows subtracting an offset, e.g. "p - (p2 - p1)"; it
 274     // takes ptrdiff_t and not e.g. int as this is the type of the difference
 275     // between two pointers; going before the string start is asserted against:
 276     wxCStrData operator-(ptrdiff_t n) const
 277     {
 278         wxASSERT_MSG( n <= (ptrdiff_t)m_offset,
 279                       _T("attempt to construct address before the beginning of the string") );
 280         return wxCStrData(m_str, m_offset - n, m_owned);
 281     }
 282
 283     // this operator is needed to make expressions like "*c_str()" or
 284     // "*(c_str() + 2)" work
 285     inline wxUniChar operator*() const;
 286
 287 private:
 288     const wxString *m_str; // the string this object refers to
 289     size_t m_offset;       // offset from the string start, see operator+/-()
 290     bool m_owned;          // NOTE(review): presumably "we own m_str" -- confirm
 291
 292     friend class WXDLLIMPEXP_FWD_BASE wxString;
 293 };
 294
 295 // ----------------------------------------------------------------------------
 296 // wxStringPrintfMixin
 297 // ---------------------------------------------------------------------------
 298
 299 // NB: VC6 has a bug that causes linker errors if you have template methods
 300 //     in a class using __declspec(dllimport). The solution is to split such
 301 //     class into two classes, one that contains the template methods and does
 302 //     *not* use WXDLLIMPEXP_BASE and another class that contains the rest
 303 //     (with DLL linkage).
 304 //
 305 //     We only do this for VC6 here, because the code is less efficient
 306 //     (Printf() has to use dynamic_cast<>) and because OpenWatcom compiler
 307 //     cannot compile this code.
 308
 309 #if defined(__VISUALC__) && __VISUALC__ < 1300
 310     #define wxNEEDS_WXSTRING_PRINTF_MIXIN
 311 #endif
 312
 313 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
 314 // this class contains the implementation of wxString's vararg methods, it's
 315 // exported from wxBase DLL
 316 class WXDLLIMPEXP_BASE wxStringPrintfMixinBase
 317 {
 318 protected:
 319     wxStringPrintfMixinBase() {} // protected: only usable as a base class
 320     // wxChar-based versions, not declared if wxUSE_UTF8_LOCALE_ONLY is set
 321 #if !wxUSE_UTF8_LOCALE_ONLY
 322     int DoPrintfWchar(const wxChar *format, ...);
 323     static wxString DoFormatWchar(const wxChar *format, ...);
 324 #endif // !wxUSE_UTF8_LOCALE_ONLY
 325 #if wxUSE_UNICODE_UTF8
 326     int DoPrintfUtf8(const char *format, ...);
 327     static wxString DoFormatUtf8(const char *format, ...);
 328 #endif // wxUSE_UNICODE_UTF8
 329 };
 330
 331 // this class contains template wrappers for wxString's vararg methods, it's
 332 // intentionally *not* exported from the DLL in order to fix the VC6 bug
 333 // described above
 334 class wxStringPrintfMixin : public wxStringPrintfMixinBase
 335 {
 336 private:
 337     // to further complicate things, we can't return wxString from
 338     // wxStringPrintfMixin::Format() because wxString is not yet defined at
 339     // this point; the solution is to use this fake type trait template - this
 340     // way the compiler won't know the return type until Format() is used
 341     // (this doesn't compile with Watcom, but VC6 compiles it just fine):
 342     template<typename T> struct StringReturnType
 343     {
 344         typedef wxString type;
 345     };
 346
 347 public:
 348     // these are duplicated wxString methods, they're also declared below
 349     // if !wxNEEDS_WXSTRING_PRINTF_MIXIN:
 350
 351     // static wxString Format(const wxString& format, ...) ATTRIBUTE_PRINTF_1;
 352     WX_DEFINE_VARARG_FUNC_SANS_N0(static typename StringReturnType<T1>::type,
 353                                   Format, 1, (const wxFormatString&),
 354                                   DoFormatWchar, DoFormatUtf8)
 355     // We have to implement the version without template arguments manually
 356     // because of the StringReturnType<> hack, although WX_DEFINE_VARARG_FUNC
 357     // normally does it itself. It has to be a template so that we can use
 358     // the hack, even though there's no real template parameter. We can't move
 359     // it to wxString, because it would shadow these versions of Format() then.
 360     template<typename T>
 361     inline static typename StringReturnType<T>::type
 362     Format(const T& fmt)
 363     {
 364         // NB: this doesn't compile if T is not (some form of) a string;
 365         //     this makes Format's prototype equivalent to
 366         //     Format(const wxFormatString& fmt)
 367         return DoFormatWchar(wxFormatString(fmt));
 368     }
 369
 370     // int Printf(const wxString& format, ...);
 371     WX_DEFINE_VARARG_FUNC(int, Printf, 1, (const wxFormatString&),
 372                           DoPrintfWchar, DoPrintfUtf8)
 373     // int sprintf(const wxString& format, ...) ATTRIBUTE_PRINTF_2;
 374     WX_DEFINE_VARARG_FUNC(int, sprintf, 1, (const wxFormatString&),
 375                           DoPrintfWchar, DoPrintfUtf8)
 376
 377 protected:
 378     wxStringPrintfMixin() : wxStringPrintfMixinBase() {}
 379 };
 380 #endif // wxNEEDS_WXSTRING_PRINTF_MIXIN
 381
 382
 383 // ----------------------------------------------------------------------------
 384 // wxString: string class trying to be compatible with std::string, MFC
 385 //           CString and wxWindows 1.x wxString all at once
 386 // ---------------------------------------------------------------------------
 387
 388 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
 389     // "non dll-interface class 'wxStringPrintfMixin' used as base interface
 390     // for dll-interface class 'wxString'" -- this is OK in our case
 391     #pragma warning (disable:4275)
 392 #endif
 393
 394 #if wxUSE_UNICODE_UTF8
 395 // see the comment near wxString::iterator for why we need this
 396 class WXDLLIMPEXP_BASE wxStringIteratorNode
 397 {
 398 public:
 399     wxStringIteratorNode()
 400         : m_str(NULL), m_citer(NULL), m_iter(NULL), m_prev(NULL), m_next(NULL) {}
 401     wxStringIteratorNode(const wxString *str,
 402                           wxStringImpl::const_iterator *citer)
 403         { DoSet(str, citer, NULL); }
 404     wxStringIteratorNode(const wxString *str, wxStringImpl::iterator *iter)
 405         { DoSet(str, NULL, iter); }
 406     ~wxStringIteratorNode()
 407         { clear(); }
 408     // re-target the node: clear() the old association, then DoSet() the new
 409     inline void set(const wxString *str, wxStringImpl::const_iterator *citer)
 410         { clear(); DoSet(str, citer, NULL); }
 411     inline void set(const wxString *str, wxStringImpl::iterator *iter)
 412         { clear(); DoSet(str, NULL, iter); }
 413     // public data; only one of the const and non-const iterators is passed
 414     const wxString *m_str; // to DoSet(), NULL is passed for the other one
 415     wxStringImpl::const_iterator *m_citer;
 416     wxStringImpl::iterator *m_iter;
 417     wxStringIteratorNode *m_prev, *m_next; // NOTE(review): list links? confirm
 418
 419 private:
 420     inline void clear();
 421     inline void DoSet(const wxString *str,
 422                       wxStringImpl::const_iterator *citer,
 423                       wxStringImpl::iterator *iter);
 424
 425     // the node belongs to a particular iterator instance, it's not copied
 426     // when a copy of the iterator is made
 427     DECLARE_NO_COPY_CLASS(wxStringIteratorNode)
 428 };
 429 #endif // wxUSE_UNICODE_UTF8
 430
 431 class WXDLLIMPEXP_BASE wxString
 432 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
 433                                 : public wxStringPrintfMixin
 434 #endif
 435 {
 436   // NB: special care was taken in arranging the member functions in such order
 437   //     that all inline functions can be effectively inlined, verify that all
 438   //     performance critical functions are still inlined if you change order!
 439 public:
 440   // an 'invalid' value for string index, moved to this place due to a CW bug
 441   static const size_t npos;
 442
 443 private:
 444   // if we hadn't made these operators private, it would be possible to
 445   // compile "wxString s; s = 17;" without any warnings as 17 is implicitly
 446   // converted to char in C and we do have operator=(char)
 447   //
 448   // NB: we don't need other versions (short/long and unsigned) as attempt
 449   //     to assign another numeric type to wxString will now result in
 450   //     ambiguity between operator=(char) and operator=(int)
 451   wxString& operator=(int);
 452
 453   // these methods are not implemented - there is _no_ conversion from int to
 454   // string, you're doing something wrong if the compiler wants to call it!
 455   //
 456   // try `s << i' or `s.Printf("%d", i)' instead
 457   wxString(int);
 458
 459
 460   // buffer holding a temporary substring as a (data, length) pair; used by
 461   // the methods that take (char*,size_t) or (wchar_t*,size_t) arguments:
 462   template<typename T>
 463   struct SubstrBufFromType
 464   {
 465       T data;     // the characters, in whatever form T stores them
 466       size_t len; // their length, never npos (see the assert in the ctor)
 467
 468       SubstrBufFromType(const T& data_, size_t len_)
 469           : data(data_), len(len_)
 470       {
 471           wxASSERT_MSG( len != npos, "must have real length" );
 472       }
 473   };
 474
 475 #if wxUSE_UNICODE_UTF8
 476   // even char* -> char* needs conversion, from locale charset to UTF-8
 477   typedef SubstrBufFromType<wxCharBuffer>    SubstrBufFromWC;
 478   typedef SubstrBufFromType<wxCharBuffer>    SubstrBufFromMB;
 479 #elif wxUSE_UNICODE_WCHAR
 480   typedef SubstrBufFromType<const wchar_t*>  SubstrBufFromWC;
 481   typedef SubstrBufFromType<wxWCharBuffer>   SubstrBufFromMB;
 482 #else
 483   typedef SubstrBufFromType<const char*>     SubstrBufFromMB;
 484   typedef SubstrBufFromType<wxCharBuffer>    SubstrBufFromWC;
 485 #endif
 486
 487
 488   // Functions implementing primitive operations on string data; wxString
 489   // methods and iterators are implemented in terms of it. The differences
 490   // between UTF-8 and wchar_t* representations of the string are mostly
 491   // contained here.
 492
 493 #if wxUSE_UNICODE_UTF8
 494   static SubstrBufFromMB ConvertStr(const char *psz, size_t nLength,
 495                                     const wxMBConv& conv);
 496   static SubstrBufFromWC ConvertStr(const wchar_t *pwz, size_t nLength,
 497                                     const wxMBConv& conv);
 498 #elif wxUSE_UNICODE_WCHAR
 499   static SubstrBufFromMB ConvertStr(const char *psz, size_t nLength,
 500                                     const wxMBConv& conv);
 501 #else
 502   static SubstrBufFromWC ConvertStr(const wchar_t *pwz, size_t nLength,
 503                                     const wxMBConv& conv);
 504 #endif
 505
 506 #if !wxUSE_UNICODE_UTF8 // wxUSE_UNICODE_WCHAR or !wxUSE_UNICODE
 507   // returns C string encoded as the implementation expects:
 508   #if wxUSE_UNICODE
 509   static const wchar_t* ImplStr(const wchar_t* str)
 510     { if ( !str ) return wxT(""); return str; }
 511   static const SubstrBufFromWC ImplStr(const wchar_t* str, size_t n)
 512     { if ( str && n == npos ) n = wxWcslen(str); return SubstrBufFromWC(str, n); }
 513   static wxWCharBuffer ImplStr(const char* str,
 514                                const wxMBConv& conv = wxConvLibc)
 515     { return ConvertStr(str, npos, conv).data; }
 516   static SubstrBufFromMB ImplStr(const char* str, size_t n,
 517                                  const wxMBConv& conv = wxConvLibc)
 518     { return ConvertStr(str, n, conv); }
 519   #else
 520   static const char* ImplStr(const char* str,
 521                              const wxMBConv& WXUNUSED(conv) = wxConvLibc)
 522     { if ( !str ) return ""; return str; }
 523   static const SubstrBufFromMB ImplStr(const char* str, size_t n,
 524                                        const wxMBConv& WXUNUSED(conv) = wxConvLibc)
 525     { if ( str && n == npos ) n = wxStrlen(str); return SubstrBufFromMB(str, n); }
 526   static wxCharBuffer ImplStr(const wchar_t* str)
 527     { return ConvertStr(str, npos, wxConvLibc).data; }
 528   static SubstrBufFromWC ImplStr(const wchar_t* str, size_t n)
 529     { return ConvertStr(str, n, wxConvLibc); }
 530   #endif
 531
 532   // translate positions/lengths in wxString to/from those in the underlying
 533   // wxStringImpl; these versions simply return their arguments unchanged:
 534   static size_t PosToImpl(size_t pos) { return pos; }
 535   static void PosLenToImpl(size_t pos, size_t len,
 536                            size_t *implPos, size_t *implLen)
 537     { *implPos = pos; *implLen = len; }
 538   static size_t LenToImpl(size_t len) { return len; }
 539   static size_t PosFromImpl(size_t pos) { return pos; }
 540
 541   // we don't want to define these as empty inline functions as it could
 542   // result in noticeable (and quite unnecessary in non-UTF-8 build) slowdown
 543   // in debug build where the inline functions are not effectively inlined
 544   #define wxSTRING_INVALIDATE_CACHE()
 545   #define wxSTRING_INVALIDATE_CACHED_LENGTH()
 546   #define wxSTRING_UPDATE_CACHED_LENGTH(n)
 547   #define wxSTRING_SET_CACHED_LENGTH(n)
 548
 549 #else // wxUSE_UNICODE_UTF8
 550
 551   static wxCharBuffer ImplStr(const char* str,
 552                               const wxMBConv& conv = wxConvLibc)
 553     { return ConvertStr(str, npos, conv).data; }
 554   static SubstrBufFromMB ImplStr(const char* str, size_t n,
 555                                  const wxMBConv& conv = wxConvLibc)
 556     { return ConvertStr(str, n, conv); }
 557   // wide strings are converted using a temporary wxMBConvUTF8 object
 558   static wxCharBuffer ImplStr(const wchar_t* str)
 559     { return ConvertStr(str, npos, wxMBConvUTF8()).data; }
 560   static SubstrBufFromWC ImplStr(const wchar_t* str, size_t n)
 561     { return ConvertStr(str, n, wxMBConvUTF8()); }
 562
 563 #if wxUSE_STRING_POS_CACHE
 564   // this is an extremely simple cache used by PosToImpl(): each cache element
 565   // contains the string it applies to and the index corresponding to the last
 566   // used position in this wxString in its m_impl string
 567   //
 568   // NB: notice that this struct (and nested Element one) must be a POD or we
 569   //     wouldn't be able to use a thread-local variable of this type, in
 570   //     particular it should have no ctor -- we rely on statics being
 571   //     initialized to 0 instead
 572   struct Cache
 573   {
 574       enum { SIZE = 8 }; // number of elements in the cached array below
 575
 576       struct Element
 577       {
 578           const wxString *str;  // the string to which this element applies
 579           size_t pos,           // the cached index in this string
 580                  impl,          // the corresponding position in its m_impl
 581                  len;           // cached length or npos if unknown
 582
 583           // reset the cached index and the corresponding m_impl position to 0
 584           void ResetPos() { pos = impl = 0; }
 585
 586           // reset the position and mark the length as unknown
 587           void Reset() { ResetPos(); len = npos; }
 588       };
 589
 590       // cache the indices mapping for the last few strings used
 591       Element cached[SIZE];
 592
 593       // index of the last used element of the cached array
 594       unsigned lastUsed;
 595   };
 596
 597   static wxTLS_TYPE(Cache) ms_cache;
 598
 599   friend struct wxStrCacheDumper;
 600
 601   // uncomment this to have access to some profiling statistics on program
 602   // termination
 603   //#define wxPROFILE_STRING_CACHE
 604
 605 #ifdef wxPROFILE_STRING_CACHE
 606   static struct PosToImplCacheStats
 607   {
 608       unsigned postot,  // total non-trivial calls to PosToImpl()
 609                poshits, // cache hits from PosToImpl()
 610                mishits, // cached position beyond the needed one
 611                sumpos,  // sum of all positions, used to compute the
 612                         // average position after dividing by postot
 613                sumofs,  // sum of all offsets after using the cache, used to
 614                         // compute the average after dividing by hits
 615                lentot,  // total number of calls to length()
 616                lenhits; // number of cache hits in length()
 617   } ms_cacheStats;
 618
 619   friend struct ShowCacheStats;
 620
 621   #define wxCACHE_PROFILE_FIELD_INC(field) ms_cacheStats.field++
 622   #define wxCACHE_PROFILE_FIELD_ADD(field, val) ms_cacheStats.field += (val)
 623 #else // !wxPROFILE_STRING_CACHE
 624   #define wxCACHE_PROFILE_FIELD_INC(field)
 625   #define wxCACHE_PROFILE_FIELD_ADD(field, val)
 626 #endif // wxPROFILE_STRING_CACHE/!wxPROFILE_STRING_CACHE
 627
 628   // note: it could seem that the functions below shouldn't be inline because
 629   // they are big, contain loops and so the compiler shouldn't be able to
 630   // inline them anyhow, however moving them into string.cpp does decrease the
 631   // code performance by ~5%, at least when using g++ 4.1 so do keep them here
 632   // unless tests show that it's not advantageous any more
 633
 634   // look up this string in the cache: returns its cache element or NULL if
 635   // the string is not cached
 636   Cache::Element *FindCacheElement() const
 637   {
 638       // a plain linear scan over all the entries: according to profiling it
 639       // is slightly but consistently faster than starting from the last used
 640       // element (there are a lot of misses in this function...)
 641       Cache::Element * const entriesBegin = ms_cache.cached;
 642       Cache::Element * const entriesEnd = entriesBegin + Cache::SIZE;
 643
 644       Cache::Element *entry = entriesBegin;
 645       while ( entry != entriesEnd && entry->str != this )
 646           ++entry;
 647
 648       // we either stopped at the matching entry or exhausted all of them
 649       return entry != entriesEnd ? entry : NULL;
 650   }
 651
 652   // same as FindCacheElement() but never returns NULL: if this string is
 653   // not in the cache yet, an entry is claimed (and reset) for it, so the
 654   // returned element may or may not hold a valid cached position
 655   Cache::Element *GetCacheElement() const
 656   {
 657       Cache::Element * const first = ms_cache.cached;
 658       Cache::Element * const last = first + ms_cache.lastUsed;
 659
 660       // fast path: try the last used entry first, this does no (measurable)
 661       // harm for a miss but does help for simple loops addressing the same
 662       // string all the time
 663       if ( last->str == this )
 664           return last;
 665
 666       // notice that the last used entry is checked again inside this call
 667       // but profiling shows that the simple loop of FindCacheElement() is
 668       // still faster than manually looping with wrapping starting from the
 669       // cache entry after it
 670       Cache::Element * const found = FindCacheElement();
 671       if ( found )
 672           return found;
 673
 674       // not cached yet: claim the next entry, wrapping around at the end
 675       Cache::Element *claimed = last + 1;
 676       if ( claimed == first + Cache::SIZE )
 677           claimed = first;
 678
 679       claimed->str = this;
 680       claimed->Reset();
 681
 682       // and remember it as the last used element
 683       ms_cache.lastUsed = claimed - first;
 684
 685       return claimed;
 686   }
 687
 688   size_t DoPosToImpl(size_t pos) const
 689   {
 690       wxCACHE_PROFILE_FIELD_INC(postot);
 691       // (this function maps the index pos in this string to one in m_impl)
 692       // NB: although the case of pos == 1 (and offset from cached position
 693       //     equal to 1) are common, nothing is gained by writing special code
 694       //     for handling them, the compiler (at least g++ 4.1 used) seems to
 695       //     optimize the code well enough on its own
 696
 697       wxCACHE_PROFILE_FIELD_ADD(sumpos, pos);
 698
 699       Cache::Element * const cache = GetCacheElement();
 700
 701       // a valid cached position can't be 0 so if it is, it means that this
 702       // entry was used for length caching only so far (or was just reset),
 703       // i.e. it doesn't count as a hit from our point of view
 704       if ( cache->pos )
 705           wxCACHE_PROFILE_FIELD_INC(poshits);
 706
 707       if ( pos == cache->pos )
 708           return cache->impl;
 709
 710       // the cached position is beyond the requested one: this seems to happen
 711       // only rarely so just restart from the beginning in this case instead
 712       // of complicating the code even further by seeking backwards
 713       if ( cache->pos > pos )
 714       {
 715           wxCACHE_PROFILE_FIELD_INC(mishits);
 716
 717           cache->ResetPos();
 718       }
 719
 720       wxCACHE_PROFILE_FIELD_ADD(sumofs, pos - cache->pos);
 721       // advance from the cached (or just reset) position to the requested
 722       // one, calling IncIter() once for each index in between
 723       wxStringImpl::const_iterator i(m_impl.begin() + cache->impl);
 724       for ( size_t n = cache->pos; n < pos; n++ )
 725           wxStringOperations::IncIter(i);
 726       // remember the new position and its m_impl offset in the cache entry
 727       cache->pos = pos;
 728       cache->impl = i - m_impl.begin();
 729
 730       wxSTRING_CACHE_ASSERT(
 731           (int)cache->impl == (begin() + pos).impl() - m_impl.begin() );
 732
 733       return cache->impl;
 734   }
 735
 736   void InvalidateCache()
 737   {
 738       // reset the cache element of this string, if it has one at all
 739       if ( Cache::Element * const entry = FindCacheElement() )
 740           entry->Reset();
 741   }
 742
 743   void InvalidateCachedLength()
 744   {
 745       // only the length is forgotten, the cached position is left alone
 746       if ( Cache::Element * const entry = FindCacheElement() )
 747           entry->len = npos;
 748   }
 749
 750   void SetCachedLength(size_t len)
 751   {
 752       // the length is cached optimistically, even if the string wasn't in
 753       // the cache before: this seems to do no harm and the potential for
 754       // avoiding length recomputation for long strings looks interesting
 755       Cache::Element * const entry = GetCacheElement();
 756       entry->len = len;
 757   }
 758
 759   void UpdateCachedLength(ptrdiff_t delta)
 760   {
 761       Cache::Element * const cache = FindCacheElement();
 762       if ( !cache || cache->len == npos )
 763           return; // no length cached for this string, nothing to adjust
 764
 765       wxSTRING_CACHE_ASSERT( (ptrdiff_t)cache->len + delta >= 0 );
 766
 767       cache->len += delta;
 768   }
 769
 770   #define wxSTRING_INVALIDATE_CACHE() InvalidateCache()
 771   #define wxSTRING_INVALIDATE_CACHED_LENGTH() InvalidateCachedLength()
 772   #define wxSTRING_UPDATE_CACHED_LENGTH(n) UpdateCachedLength(n)
 773   #define wxSTRING_SET_CACHED_LENGTH(n) SetCachedLength(n)
 774 #else // !wxUSE_STRING_POS_CACHE
 775   size_t DoPosToImpl(size_t pos) const
 776   {
 777       return (begin() + pos).impl() - m_impl.begin();
 778   }
 779
 780   #define wxSTRING_INVALIDATE_CACHE()
 781   #define wxSTRING_INVALIDATE_CACHED_LENGTH()
 782   #define wxSTRING_UPDATE_CACHED_LENGTH(n)
 783   #define wxSTRING_SET_CACHED_LENGTH(n)
 784 #endif // wxUSE_STRING_POS_CACHE/!wxUSE_STRING_POS_CACHE
 785
 786   size_t PosToImpl(size_t pos) const
 787   {
 788       return pos == 0 || pos == npos ? pos : DoPosToImpl(pos);
 789   }
 790
 791   void PosLenToImpl(size_t pos, size_t len, size_t *implPos, size_t *implLen) const;
 792
 793   size_t LenToImpl(size_t len) const
 794   {
 795       size_t pos, len2;
 796       PosLenToImpl(0, len, &pos, &len2);
 797       return len2;
 798   }
 799
 800   size_t PosFromImpl(size_t pos) const
 801   {
 802       if ( pos == 0 || pos == npos )
 803           return pos;
 804       else
 805           return const_iterator(this, m_impl.begin() + pos) - begin();
 806   }
 807 #endif // !wxUSE_UNICODE_UTF8/wxUSE_UNICODE_UTF8
 808
 809 public:
 810   // standard types
 811   typedef wxUniChar value_type;
 812   typedef wxUniChar char_type;
 813   typedef wxUniCharRef reference;
 814   typedef wxChar* pointer;
 815   typedef const wxChar* const_pointer;
 816
 817   typedef size_t size_type;
 818   typedef wxUniChar const_reference;
 819
 820 #if wxUSE_STL
 821   #if wxUSE_UNICODE_UTF8
 822     // random access is not O(1), as required by Random Access Iterator
 823     #define WX_STR_ITERATOR_TAG std::bidirectional_iterator_tag
 824   #else
 825     #define WX_STR_ITERATOR_TAG std::random_access_iterator_tag
 826   #endif
 827 #else
 828   #define WX_STR_ITERATOR_TAG void /* dummy type */
 829 #endif
 830
 831   #define WX_STR_ITERATOR_IMPL(iterator_name, pointer_type, reference_type) \
 832       private:                                                              \
 833           typedef wxStringImpl::iterator_name underlying_iterator;          \
 834       public:                                                               \
 835           typedef WX_STR_ITERATOR_TAG iterator_category;                    \
 836           typedef wxUniChar value_type;                                     \
 837           typedef int difference_type;                                      \
 838           typedef reference_type reference;                                 \
 839           typedef pointer_type pointer;                                     \
 840                                                                             \
 841           reference operator[](size_t n) const { return *(*this + n); }     \
 842                                                                             \
 843           iterator_name& operator++()                                       \
 844             { wxStringOperations::IncIter(m_cur); return *this; }           \
 845           iterator_name& operator--()                                       \
 846             { wxStringOperations::DecIter(m_cur); return *this; }           \
 847           iterator_name operator++(int)                                     \
 848           {                                                                 \
 849               iterator_name tmp = *this;                                    \
 850               wxStringOperations::IncIter(m_cur);                           \
 851               return tmp;                                                   \
 852           }                                                                 \
 853           iterator_name operator--(int)                                     \
 854           {                                                                 \
 855               iterator_name tmp = *this;                                    \
 856               wxStringOperations::DecIter(m_cur);                           \
 857               return tmp;                                                   \
 858           }                                                                 \
 859                                                                             \
 860           iterator_name& operator+=(ptrdiff_t n)                            \
 861           {                                                                 \
 862               m_cur = wxStringOperations::AddToIter(m_cur, n);              \
 863               return *this;                                                 \
 864           }                                                                 \
 865           iterator_name& operator-=(ptrdiff_t n)                            \
 866           {                                                                 \
 867               m_cur = wxStringOperations::AddToIter(m_cur, -n);             \
 868               return *this;                                                 \
 869           }                                                                 \
 870                                                                             \
 871           difference_type operator-(const iterator_name& i) const           \
 872             { return wxStringOperations::DiffIters(m_cur, i.m_cur); }       \
 873                                                                             \
 874           bool operator==(const iterator_name& i) const                     \
 875             { return m_cur == i.m_cur; }                                    \
 876           bool operator!=(const iterator_name& i) const                     \
 877             { return m_cur != i.m_cur; }                                    \
 878                                                                             \
 879           bool operator<(const iterator_name& i) const                      \
 880             { return m_cur < i.m_cur; }                                     \
 881           bool operator>(const iterator_name& i) const                      \
 882             { return m_cur > i.m_cur; }                                     \
 883           bool operator<=(const iterator_name& i) const                     \
 884             { return m_cur <= i.m_cur; }                                    \
 885           bool operator>=(const iterator_name& i) const                     \
 886             { return m_cur >= i.m_cur; }                                    \
 887                                                                             \
 888       private:                                                              \
 889           /* for internal wxString use only: */                             \
 890           underlying_iterator impl() const { return m_cur; }                \
 891                                                                             \
 892           friend class wxString;                                            \
 893           friend class wxCStrData;                                          \
 894                                                                             \
 895       private:                                                              \
 896           underlying_iterator m_cur
 897
 898   class WXDLLIMPEXP_FWD_BASE const_iterator;
 899
 900 #if wxUSE_UNICODE_UTF8
 901   // NB: In UTF-8 build, (non-const) iterator needs to keep reference
 902   //     to the underlying wxStringImpl, because UTF-8 is variable-length
 903   //     encoding and changing the value pointed to by an iterator (using
 904   //     its operator*) requires calling wxStringImpl::replace() if the old
 905   //     and new values differ in their encoding's length.
 906   //
 907   //     Furthermore, the replace() call may invalidate all iterators for the
 908   //     string, so we have to keep track of outstanding iterators and update
 909   //     them if replace() happens.
 910   //
 911   //     This is implemented by maintaining linked list of iterators for every
 912   //     string and traversing it in wxUniCharRef::operator=(). Head of the
 913   //     list is stored in wxString. (FIXME-UTF8)
 914
 915   class WXDLLIMPEXP_BASE iterator
 916   {
 917       WX_STR_ITERATOR_IMPL(iterator, wxChar*, wxUniCharRef);
 918
 919   public:
 920       iterator() {}
 921       iterator(const iterator& i)
 922           : m_cur(i.m_cur), m_node(i.str(), &m_cur) {}
 923       iterator& operator=(const iterator& i)
 924       {
 925           if (&i != this)
 926           {
 927               m_cur = i.m_cur;
 928               m_node.set(i.str(), &m_cur);
 929           }
 930           return *this;
 931       }
 932
 933       reference operator*()
 934         { return wxUniCharRef::CreateForString(*str(), m_cur); }
 935
 936       iterator operator+(ptrdiff_t n) const
 937         { return iterator(str(), wxStringOperations::AddToIter(m_cur, n)); }
 938       iterator operator-(ptrdiff_t n) const
 939         { return iterator(str(), wxStringOperations::AddToIter(m_cur, -n)); }
 940
 941   private:
 942       iterator(wxString *str, underlying_iterator ptr)
 943           : m_cur(ptr), m_node(str, &m_cur) {}
 944
 945       wxString* str() const { return wx_const_cast(wxString*, m_node.m_str); }
 946
 947       wxStringIteratorNode m_node;
 948
 949       friend class const_iterator;
 950   };
 951
 952   class WXDLLIMPEXP_BASE const_iterator
 953   {
 954       // NB: reference_type is intentionally value, not reference, the character
 955       //     may be encoded differently in wxString data:
 956       WX_STR_ITERATOR_IMPL(const_iterator, const wxChar*, wxUniChar);
 957
 958   public:
 959       const_iterator() {}
 960       const_iterator(const const_iterator& i)
 961           : m_cur(i.m_cur), m_node(i.str(), &m_cur) {}
 962       const_iterator(const iterator& i)
 963           : m_cur(i.m_cur), m_node(i.str(), &m_cur) {}
 964
 965       const_iterator& operator=(const const_iterator& i)
 966       {
 967           if (&i != this)
 968           {
 969               m_cur = i.m_cur;
 970               m_node.set(i.str(), &m_cur);
 971           }
 972           return *this;
 973       }
 974       const_iterator& operator=(const iterator& i)
 975         { m_cur = i.m_cur; m_node.set(i.str(), &m_cur); return *this; }
 976
 977       reference operator*() const
 978         { return wxStringOperations::DecodeChar(m_cur); }
 979
 980       const_iterator operator+(ptrdiff_t n) const
 981         { return const_iterator(str(), wxStringOperations::AddToIter(m_cur, n)); }
 982       const_iterator operator-(ptrdiff_t n) const
 983         { return const_iterator(str(), wxStringOperations::AddToIter(m_cur, -n)); }
 984
 985   private:
 986       // for internal wxString use only:
 987       const_iterator(const wxString *str, underlying_iterator ptr)
 988           : m_cur(ptr), m_node(str, &m_cur) {}
 989
 990       const wxString* str() const { return m_node.m_str; }
 991
 992       wxStringIteratorNode m_node;
 993   };
 994
 995   size_t IterToImplPos(wxString::iterator i) const
 996     { return wxStringImpl::const_iterator(i.impl()) - m_impl.begin(); }
 997
 998   iterator GetIterForNthChar(size_t n)
 999     { return iterator(this, m_impl.begin() + PosToImpl(n)); }
1000   const_iterator GetIterForNthChar(size_t n) const
1001     { return const_iterator(this, m_impl.begin() + PosToImpl(n)); }
1002 #else // !wxUSE_UNICODE_UTF8
1003
1004   class WXDLLIMPEXP_BASE iterator
1005   {
1006       WX_STR_ITERATOR_IMPL(iterator, wxChar*, wxUniCharRef);
1007
1008   public:
1009       iterator() {}
1010       iterator(const iterator& i) : m_cur(i.m_cur) {}
1011
1012       reference operator*()
1013         { return wxUniCharRef::CreateForString(m_cur); }
1014
1015       iterator operator+(ptrdiff_t n) const
1016         { return iterator(wxStringOperations::AddToIter(m_cur, n)); }
1017       iterator operator-(ptrdiff_t n) const
1018         { return iterator(wxStringOperations::AddToIter(m_cur, -n)); }
1019
1020   private:
1021       // for internal wxString use only:
1022       iterator(underlying_iterator ptr) : m_cur(ptr) {}
1023       iterator(wxString *WXUNUSED(str), underlying_iterator ptr) : m_cur(ptr) {}
1024
1025       friend class const_iterator;
1026   };
1027
1028   class WXDLLIMPEXP_BASE const_iterator
1029   {
1030       // NB: reference_type is intentionally value, not reference, the character
1031       //     may be encoded differently in wxString data:
1032       WX_STR_ITERATOR_IMPL(const_iterator, const wxChar*, wxUniChar);
1033
1034   public:
1035       const_iterator() {}
1036       const_iterator(const const_iterator& i) : m_cur(i.m_cur) {}
1037       const_iterator(const iterator& i) : m_cur(i.m_cur) {}
1038
1039       reference operator*() const
1040         { return wxStringOperations::DecodeChar(m_cur); }
1041
1042       const_iterator operator+(ptrdiff_t n) const
1043         { return const_iterator(wxStringOperations::AddToIter(m_cur, n)); }
1044       const_iterator operator-(ptrdiff_t n) const
1045         { return const_iterator(wxStringOperations::AddToIter(m_cur, -n)); }
1046
1047   private:
1048       // for internal wxString use only:
1049       const_iterator(underlying_iterator ptr) : m_cur(ptr) {}
1050       const_iterator(const wxString *WXUNUSED(str), underlying_iterator ptr)
1051           : m_cur(ptr) {}
1052   };
1053
1054   iterator GetIterForNthChar(size_t n) { return begin() + n; }
1055   const_iterator GetIterForNthChar(size_t n) const { return begin() + n; }
1056 #endif // wxUSE_UNICODE_UTF8/!wxUSE_UNICODE_UTF8
1057
1058   #undef WX_STR_ITERATOR_TAG
1059   #undef WX_STR_ITERATOR_IMPL
1060
1061   friend class iterator;
1062   friend class const_iterator;
1063
1064   template <typename T>
1065   class reverse_iterator_impl
1066   {
1067   public:
1068       typedef T iterator_type;
1069
1070       typedef typename T::iterator_category iterator_category;
1071       typedef typename T::value_type value_type;
1072       typedef typename T::difference_type difference_type;
1073       typedef typename T::reference reference;
1074       typedef typename T::pointer *pointer;
1075
1076       reverse_iterator_impl() {}
1077       reverse_iterator_impl(iterator_type i) : m_cur(i) {}
1078       reverse_iterator_impl(const reverse_iterator_impl& ri)
1079           : m_cur(ri.m_cur) {}
1080
1081       iterator_type base() const { return m_cur; }
1082
1083       reference operator*() const { return *(m_cur-1); }
1084       reference operator[](size_t n) const { return *(*this + n); }
1085
1086       reverse_iterator_impl& operator++()
1087         { --m_cur; return *this; }
1088       reverse_iterator_impl operator++(int)
1089         { reverse_iterator_impl tmp = *this; --m_cur; return tmp; }
1090       reverse_iterator_impl& operator--()
1091         { ++m_cur; return *this; }
1092       reverse_iterator_impl operator--(int)
1093         { reverse_iterator_impl tmp = *this; ++m_cur; return tmp; }
1094
1095       // NB: explicit <T> in the functions below is to keep BCC 5.5 happy
1096       reverse_iterator_impl operator+(ptrdiff_t n) const
1097         { return reverse_iterator_impl<T>(m_cur - n); }
1098       reverse_iterator_impl operator-(ptrdiff_t n) const
1099         { return reverse_iterator_impl<T>(m_cur + n); }
1100       reverse_iterator_impl operator+=(ptrdiff_t n)
1101         { m_cur -= n; return *this; }
1102       reverse_iterator_impl operator-=(ptrdiff_t n)
1103         { m_cur += n; return *this; }
1104
1105       unsigned operator-(const reverse_iterator_impl& i) const
1106         { return i.m_cur - m_cur; }
1107
1108       bool operator==(const reverse_iterator_impl& ri) const
1109         { return m_cur == ri.m_cur; }
1110       bool operator!=(const reverse_iterator_impl& ri) const
1111         { return !(*this == ri); }
1112
1113       bool operator<(const reverse_iterator_impl& i) const
1114         { return m_cur > i.m_cur; }
1115       bool operator>(const reverse_iterator_impl& i) const
1116         { return m_cur < i.m_cur; }
1117       bool operator<=(const reverse_iterator_impl& i) const
1118         { return m_cur >= i.m_cur; }
1119       bool operator>=(const reverse_iterator_impl& i) const
1120         { return m_cur <= i.m_cur; }
1121
1122   private:
1123       iterator_type m_cur;
1124   };
1125
1126   typedef reverse_iterator_impl<iterator> reverse_iterator;
1127   typedef reverse_iterator_impl<const_iterator> const_reverse_iterator;
1128
1129 private:
1130   // used to transform an expression built using c_str() (and hence of type
1131   // wxCStrData) to an iterator into the string
1132   static const_iterator CreateConstIterator(const wxCStrData& data)
1133   {
1134       return const_iterator(data.m_str,
1135                             (data.m_str->begin() + data.m_offset).impl());
1136   }
1137
1138   // in UTF-8 STL build, creation from std::string requires conversion under
1139   // non-UTF8 locales, so we can't have and use wxString(wxStringImpl) ctor;
1140   // instead we define dummy type that lets us have wxString ctor for creation
1141   // from wxStringImpl that couldn't be used by user code (in all other builds,
1142   // "standard" ctors can be used):
1143 #if wxUSE_UNICODE_UTF8 && wxUSE_STL_BASED_WXSTRING
1144   struct CtorFromStringImplTag {};
1145
1146   wxString(CtorFromStringImplTag* WXUNUSED(dummy), const wxStringImpl& src)
1147       : m_impl(src) {}
1148
1149   static wxString FromImpl(const wxStringImpl& src)
1150       { return wxString((CtorFromStringImplTag*)NULL, src); }
1151 #else
1152   #if !wxUSE_STL_BASED_WXSTRING
1153   wxString(const wxStringImpl& src) : m_impl(src) { }
1154   // else: already defined as wxString(wxStdString) below
1155   #endif
1156   static wxString FromImpl(const wxStringImpl& src) { return wxString(src); }
1157 #endif
1158
1159 public:
1160   // constructors and destructor
1161     // ctor for an empty string
1162   wxString() {}
1163
1164     // copy ctor
1165   wxString(const wxString& stringSrc) : m_impl(stringSrc.m_impl) { }
1166
1167     // string containing nRepeat copies of ch
1168   wxString(wxUniChar ch, size_t nRepeat = 1 )
1169     { assign(nRepeat, ch); }
1170   wxString(size_t nRepeat, wxUniChar ch)
1171     { assign(nRepeat, ch); }
1172   wxString(wxUniCharRef ch, size_t nRepeat = 1)
1173     { assign(nRepeat, ch); }
1174   wxString(size_t nRepeat, wxUniCharRef ch)
1175     { assign(nRepeat, ch); }
1176   wxString(char ch, size_t nRepeat = 1)
1177     { assign(nRepeat, ch); }
1178   wxString(size_t nRepeat, char ch)
1179     { assign(nRepeat, ch); }
1180   wxString(wchar_t ch, size_t nRepeat = 1)
1181     { assign(nRepeat, ch); }
1182   wxString(size_t nRepeat, wchar_t ch)
1183     { assign(nRepeat, ch); }
1184
1185     // ctors from char* strings:
1186   wxString(const char *psz)
1187     : m_impl(ImplStr(psz)) {}
1188   wxString(const char *psz, const wxMBConv& conv)
1189     : m_impl(ImplStr(psz, conv)) {}
1190   wxString(const char *psz, size_t nLength)
1191     { assign(psz, nLength); }
1192   wxString(const char *psz, const wxMBConv& conv, size_t nLength)
1193   {
1194     SubstrBufFromMB str(ImplStr(psz, nLength, conv));
1195     m_impl.assign(str.data, str.len);
1196   }
1197
1198     // and unsigned char*:
1199   wxString(const unsigned char *psz)
1200     : m_impl(ImplStr((const char*)psz)) {}
1201   wxString(const unsigned char *psz, const wxMBConv& conv)
1202     : m_impl(ImplStr((const char*)psz, conv)) {}
1203   wxString(const unsigned char *psz, size_t nLength)
1204     { assign((const char*)psz, nLength); }
1205   wxString(const unsigned char *psz, const wxMBConv& conv, size_t nLength)
1206   {
1207     SubstrBufFromMB str(ImplStr((const char*)psz, nLength, conv));
1208     m_impl.assign(str.data, str.len);
1209   }
1210
1211     // ctors from wchar_t* strings:
1212   wxString(const wchar_t *pwz)
1213     : m_impl(ImplStr(pwz)) {}
1214   wxString(const wchar_t *pwz, const wxMBConv& WXUNUSED(conv))
1215     : m_impl(ImplStr(pwz)) {}
1216   wxString(const wchar_t *pwz, size_t nLength)
1217     { assign(pwz, nLength); }
1218   wxString(const wchar_t *pwz, const wxMBConv& WXUNUSED(conv), size_t nLength)
1219     { assign(pwz, nLength); }
1220
1221   wxString(const wxCharBuffer& buf)
1222     { assign(buf.data()); } // FIXME-UTF8: fix for embedded NUL and buffer length
1223   wxString(const wxWCharBuffer& buf)
1224     { assign(buf.data()); } // FIXME-UTF8: fix for embedded NUL and buffer length
1225
1226     // NB: this version uses m_impl.c_str() to force making a copy of the
1227     //     string, so that "wxString(str.c_str())" idiom for passing strings
1228     //     between threads works
1229   wxString(const wxCStrData& cstr)
1230       : m_impl(cstr.AsString().m_impl.c_str()) { }
1231
1232     // as we provide both ctors with this signature for both char and unsigned
1233     // char string, we need to provide one for wxCStrData to resolve ambiguity
1234   wxString(const wxCStrData& cstr, size_t nLength)
1235       : m_impl(cstr.AsString().Mid(0, nLength).m_impl) {}
1236
1237     // and because wxString is convertible to wxCStrData and const wxChar *
1238     // we also need to provide this one
1239   wxString(const wxString& str, size_t nLength)
1240     { assign(str, nLength); }
1241
1242
#if wxUSE_STRING_POS_CACHE
  ~wxString()
  {
      // the cache entry of this string must not outlive it: another string
      // could be created at the same address later (this is unlikely, although
      // possible, for the strings allocated on the heap but is perfectly
      // common for the strings allocated on the stack)
      wxSTRING_INVALIDATE_CACHE();
  }
#endif // wxUSE_STRING_POS_CACHE
1252
1253   // even if we're not built with wxUSE_STL == 1 it is very convenient to allow
1254   // implicit conversions from std::string to wxString and vice versa as this
1255   // allows to use the same strings in non-GUI and GUI code, however we don't
1256   // want to unconditionally add this ctor as it would make wx lib dependent on
1257   // libstdc++ on some Linux versions which is bad, so instead we ask the
1258   // client code to define this wxUSE_STD_STRING symbol if they need it
#if wxUSE_STD_STRING
  // ctor from wide standard string
  #if wxUSE_UNICODE_WCHAR
    // the internal representation can be initialized from it directly
    wxString(const wxStdWideString& str)
        : m_impl(str)
    {
    }
  #else // UTF-8 or ANSI
    // the data and the length of the string are passed to assign()
    wxString(const wxStdWideString& str)
    {
        assign(str.c_str(), str.length());
    }
  #endif

  // ctor from narrow standard string
  #if !wxUSE_UNICODE // ANSI build
    // FIXME-UTF8: do this in UTF8 build #if wxUSE_UTF8_LOCALE_ONLY, too
    wxString(const std::string& str)
        : m_impl(str)
    {
    }
  #else // Unicode
    // the data and the length of the string are passed to assign()
    wxString(const std::string& str)
    {
        assign(str.c_str(), str.length());
    }
  #endif
#endif // wxUSE_STD_STRING
1275
1276   // Unlike ctor from std::string, we provide conversion to std::string only
1277   // if wxUSE_STL and not merely wxUSE_STD_STRING (which is on by default),
1278   // because it conflicts with operator const char/wchar_t*:
#if wxUSE_STL
  // conversion to wide standard string
  #if wxUSE_UNICODE_WCHAR && wxUSE_STL_BASED_WXSTRING
    // wxStringImpl already is the standard string in the encoding we want,
    // so just return a reference to it
    operator const wxStdWideString&() const
    {
        return m_impl;
    }
  #else
    // wxStringImpl is either not a standard string or needs conversion
    //
    // FIXME-UTF8: broken for embedded NULs
    operator wxStdWideString() const
    {
        return wxStdWideString(wc_str());
    }
  #endif

  // conversion to narrow standard string
  #if (!wxUSE_UNICODE || wxUSE_UTF8_LOCALE_ONLY) && wxUSE_STL_BASED_WXSTRING
    // wxStringImpl already is the standard string in the encoding we want,
    // so just return a reference to it
    operator const std::string&() const
    {
        return m_impl;
    }
  #else
    // wxStringImpl is either not a standard string or needs conversion
    //
    // FIXME-UTF8: broken for embedded NULs
    operator std::string() const
    {
        return std::string(mb_str());
    }
  #endif
#endif // wxUSE_STL
1300
1301   wxString Clone() const
1302   {
1303       // make a deep copy of the string, i.e. the returned string will have
1304       // ref count = 1 with refcounted implementation
1305       return wxString::FromImpl(wxStringImpl(m_impl.c_str(), m_impl.length()));
1306   }
1307
1308   // first valid index position
1309   const_iterator begin() const { return const_iterator(this, m_impl.begin()); }
1310   iterator begin() { return iterator(this, m_impl.begin()); }
1311   // position one after the last valid one
1312   const_iterator end() const { return const_iterator(this, m_impl.end()); }
1313   iterator end() { return iterator(this, m_impl.end()); }
1314
1315   // first element of the reversed string
1316   const_reverse_iterator rbegin() const
1317     { return const_reverse_iterator(end()); }
1318   reverse_iterator rbegin()
1319     { return reverse_iterator(end()); }
1320   // one beyond the end of the reversed string
1321   const_reverse_iterator rend() const
1322     { return const_reverse_iterator(begin()); }
1323   reverse_iterator rend()
1324     { return reverse_iterator(begin()); }
1325
1326   // std::string methods:
1327 #if wxUSE_UNICODE_UTF8
1328   size_t length() const
1329   {
1330 #if wxUSE_STRING_POS_CACHE
1331       wxCACHE_PROFILE_FIELD_INC(lentot);
1332
1333       Cache::Element * const cache = GetCacheElement();
1334
1335       if ( cache->len == npos )
1336       {
1337           // it's probably not worth trying to be clever and using cache->pos
1338           // here as it's probably 0 anyhow -- you usually call length() before
1339           // starting to index the string
1340           cache->len = end() - begin();
1341       }
1342       else
1343       {
1344           wxCACHE_PROFILE_FIELD_INC(lenhits);
1345
1346           wxSTRING_CACHE_ASSERT( (int)cache->len == end() - begin() );
1347       }
1348
1349       return cache->len;
1350 #else // !wxUSE_STRING_POS_CACHE
1351       return end() - begin();
1352 #endif // wxUSE_STRING_POS_CACHE/!wxUSE_STRING_POS_CACHE
1353   }
1354 #else
1355   size_t length() const { return m_impl.length(); }
1356 #endif
1357
1358   size_type size() const { return length(); }
1359   size_type max_size() const { return npos; }
1360
1361   bool empty() const { return m_impl.empty(); }
1362
1363   // NB: these methods don't have a well-defined meaning in UTF-8 case
1364   size_type capacity() const { return m_impl.capacity(); }
1365   void reserve(size_t sz) { m_impl.reserve(sz); }
1366
1367   void resize(size_t nSize, wxUniChar ch = wxT('\0'))
1368   {
1369     const size_t len = length();
1370     if ( nSize == len)
1371         return;
1372
1373 #if wxUSE_UNICODE_UTF8
1374     if ( nSize < len )
1375     {
1376         wxSTRING_INVALIDATE_CACHE();
1377
1378         // we can't use wxStringImpl::resize() for truncating the string as it
1379         // counts in bytes, not characters
1380         erase(nSize);
1381         return;
1382     }
1383
1384     // we also can't use (presumably more efficient) resize() if we have to
1385     // append characters taking more than one byte
1386     if ( !ch.IsAscii() )
1387     {
1388         append(nSize - len, ch);
1389     }
1390     else // can use (presumably faster) resize() version
1391 #endif // wxUSE_UNICODE_UTF8
1392     {
1393         wxSTRING_INVALIDATE_CACHED_LENGTH();
1394
1395         m_impl.resize(nSize, (wxStringCharType)ch);
1396     }
1397   }
1398
1399   wxString substr(size_t nStart = 0, size_t nLen = npos) const
1400   {
1401     size_t pos, len;
1402     PosLenToImpl(nStart, nLen, &pos, &len);
1403     return FromImpl(m_impl.substr(pos, len));
1404   }
1405
1406   // generic attributes & operations
1407     // as standard strlen()
1408   size_t Len() const { return length(); }
1409     // string contains any characters?
1410   bool IsEmpty() const { return empty(); }
1411     // empty string is "false", so !str will return true
1412   bool operator!() const { return empty(); }
1413     // truncate the string to given length
1414   wxString& Truncate(size_t uiLen);
1415     // empty string contents
1416   void Empty()
1417   {
1418     Truncate(0);
1419
1420     wxASSERT_MSG( empty(), _T("string not empty after call to Empty()?") );
1421   }
1422     // empty the string and free memory
1423   void Clear() { clear(); }
1424
1425   // contents test
1426     // Is an ascii value
1427   bool IsAscii() const;
1428     // Is a number
1429   bool IsNumber() const;
1430     // Is a word
1431   bool IsWord() const;
1432
1433   // data access (all indexes are 0 based)
1434     // read access
1435     wxUniChar at(size_t n) const
1436       { return wxStringOperations::DecodeChar(m_impl.begin() + PosToImpl(n)); }
1437     wxUniChar GetChar(size_t n) const
1438       { return at(n); }
1439     // read/write access
1440     wxUniCharRef at(size_t n)
1441       { return *GetIterForNthChar(n); }
1442     wxUniCharRef GetWritableChar(size_t n)
1443       { return at(n); }
1444     // write access
1445     void SetChar(size_t n, wxUniChar ch)
1446       { at(n) = ch; }
1447
1448     // get last character
1449     wxUniChar Last() const
1450     {
1451       wxASSERT_MSG( !empty(), _T("wxString: index out of bounds") );
1452       return *rbegin();
1453     }
1454
1455     // get writable last character
1456     wxUniCharRef Last()
1457     {
1458       wxASSERT_MSG( !empty(), _T("wxString: index out of bounds") );
1459       return *rbegin();
1460     }
1461
1462     /*
1463        Note that we must define all of the overloads below to avoid
1464        ambiguity when using str[0].
1465      */
1466     wxUniChar operator[](int n) const
1467       { return at(n); }
1468     wxUniChar operator[](long n) const
1469       { return at(n); }
1470     wxUniChar operator[](size_t n) const
1471       { return at(n); }
1472 #ifndef wxSIZE_T_IS_UINT
1473     wxUniChar operator[](unsigned int n) const
1474       { return at(n); }
1475 #endif // size_t != unsigned int
1476
1477     // operator versions of GetWriteableChar()
1478     wxUniCharRef operator[](int n)
1479       { return at(n); }
1480     wxUniCharRef operator[](long n)
1481       { return at(n); }
1482     wxUniCharRef operator[](size_t n)
1483       { return at(n); }
1484 #ifndef wxSIZE_T_IS_UINT
1485     wxUniCharRef operator[](unsigned int n)
1486       { return at(n); }
1487 #endif // size_t != unsigned int
1488
1489     // explicit conversion to C string (use this with printf()!)
1490     wxCStrData c_str() const { return wxCStrData(this); }
1491     wxCStrData data() const { return c_str(); }
1492
1493     // implicit conversion to C string
1494     operator wxCStrData() const { return c_str(); }
1495
1496     // the first two operators conflict with operators for conversion to
1497     // std::string and they must be disabled in STL build; the next one only
1498     // makes sense if conversions to char* are also defined and not defining it
1499     // in STL build also helps us to get more clear error messages for the code
1500     // which relies on implicit conversion to char* in STL build
1501 #if !wxUSE_STL
1502     operator const char*() const { return c_str(); }
1503     operator const wchar_t*() const { return c_str(); }
1504
1505     // implicit conversion to untyped pointer for compatibility with previous
1506     // wxWidgets versions: this is the same as conversion to const char * so it
1507     // may fail!
1508     operator const void*() const { return c_str(); }
1509 #endif // wxUSE_STL
1510
1511     // identical to c_str(), for MFC compatibility
1512     const wxCStrData GetData() const { return c_str(); }
1513
1514     // explicit conversion to C string in internal representation (char*,
1515     // wchar_t*, UTF-8-encoded char*, depending on the build):
1516     const wxStringCharType *wx_str() const { return m_impl.c_str(); }
1517
1518     // conversion to *non-const* multibyte or widestring buffer; modifying
1519     // returned buffer won't affect the string, these methods are only useful
1520     // for passing values to const-incorrect functions
1521     wxWritableCharBuffer char_str(const wxMBConv& conv = wxConvLibc) const
1522         { return mb_str(conv); }
1523     wxWritableWCharBuffer wchar_str() const { return wc_str(); }
1524
1525     // conversion to the buffer of the given type T (= char or wchar_t) and
1526     // also optionally return the buffer length
1527     //
1528     // this is mostly/only useful for the template functions
1529     //
1530     // FIXME-VC6: the second argument only exists for VC6 which doesn't support
1531     //            explicit template function selection, do not use it unless
1532     //            you must support VC6!
1533     template <typename T>
1534     wxCharTypeBuffer<T> tchar_str(size_t *len = NULL,
1535                                   T * WXUNUSED(dummy) = NULL) const
1536     {
1537 #if wxUSE_UNICODE
1538         // we need a helper dispatcher depending on type
1539         return wxPrivate::wxStringAsBufHelper<T>::Get(*this, len);
1540 #else // ANSI
1541         // T can only be char in ANSI build
1542         if ( len )
1543             *len = length();
1544
1545         return wxCharTypeBuffer<T>::CreateNonOwned(wx_str());
1546 #endif // Unicode build kind
1547     }
1548
1549     // conversion to/from plain (i.e. 7 bit) ASCII: this is useful for
1550     // converting numbers or strings which are certain not to contain special
1551     // chars (typically system functions, X atoms, environment variables etc.)
1552     //
1553     // the behaviour of these functions with the strings containing anything
1554     // else than 7 bit ASCII characters is undefined, use at your own risk.
1555 #if wxUSE_UNICODE
1556     static wxString FromAscii(const char *ascii, size_t len);
1557     static wxString FromAscii(const char *ascii);
1558     static wxString FromAscii(char ascii);
1559     const wxCharBuffer ToAscii() const;
1560 #else // ANSI
1561     static wxString FromAscii(const char *ascii) { return wxString( ascii ); }
1562     static wxString FromAscii(const char *ascii, size_t len)
1563         { return wxString( ascii, len ); }
1564     static wxString FromAscii(char ascii) { return wxString( ascii ); }
1565     const char *ToAscii() const { return c_str(); }
1566 #endif // Unicode/!Unicode
1567
1568     // also provide unsigned char overloads as signed/unsigned doesn't matter
1569     // for 7 bit ASCII characters
1570     static wxString FromAscii(const unsigned char *ascii)
1571         { return FromAscii((const char *)ascii); }
1572     static wxString FromAscii(const unsigned char *ascii, size_t len)
1573         { return FromAscii((const char *)ascii, len); }
1574
1575     // conversion to/from UTF-8:
1576 #if wxUSE_UNICODE_UTF8
1577     static wxString FromUTF8Unchecked(const char *utf8)
1578     {
1579       if ( !utf8 )
1580           return wxEmptyString;
1581
1582       wxASSERT( wxStringOperations::IsValidUtf8String(utf8) );
1583       return FromImpl(wxStringImpl(utf8));
1584     }
1585     static wxString FromUTF8Unchecked(const char *utf8, size_t len)
1586     {
1587       if ( !utf8 )
1588           return wxEmptyString;
1589       if ( len == npos )
1590           return FromUTF8Unchecked(utf8);
1591
1592       wxASSERT( wxStringOperations::IsValidUtf8String(utf8, len) );
1593       return FromImpl(wxStringImpl(utf8, len));
1594     }
1595
1596     static wxString FromUTF8(const char *utf8)
1597     {
1598         if ( !utf8 || !wxStringOperations::IsValidUtf8String(utf8) )
1599             return "";
1600
1601         return FromImpl(wxStringImpl(utf8));
1602     }
1603     static wxString FromUTF8(const char *utf8, size_t len)
1604     {
1605         if ( len == npos )
1606             return FromUTF8(utf8);
1607
1608         if ( !utf8 || !wxStringOperations::IsValidUtf8String(utf8, len) )
1609             return "";
1610
1611         return FromImpl(wxStringImpl(utf8, len));
1612     }
1613
1614     const char* utf8_str() const { return wx_str(); }
1615     const char* ToUTF8() const { return wx_str(); }
1616
1617     // this function exists in UTF-8 build only and returns the length of the
1618     // internal UTF-8 representation
1619     size_t utf8_length() const { return m_impl.length(); }
1620 #elif wxUSE_UNICODE_WCHAR
1621     static wxString FromUTF8(const char *utf8, size_t len = npos)
1622       { return wxString(utf8, wxMBConvUTF8(), len); }
1623     static wxString FromUTF8Unchecked(const char *utf8, size_t len = npos)
1624     {
1625         const wxString s(utf8, wxMBConvUTF8(), len);
1626         wxASSERT_MSG( !utf8 || !*utf8 || !s.empty(),
1627                       "string must be valid UTF-8" );
1628         return s;
1629     }
1630     const wxCharBuffer utf8_str() const { return mb_str(wxMBConvUTF8()); }
1631     const wxCharBuffer ToUTF8() const { return utf8_str(); }
1632 #else // ANSI
1633     static wxString FromUTF8(const char *utf8)
1634       { return wxString(wxMBConvUTF8().cMB2WC(utf8)); }
1635     static wxString FromUTF8(const char *utf8, size_t len)
1636     {
1637         size_t wlen;
1638         wxWCharBuffer buf(wxMBConvUTF8().cMB2WC(utf8, len == npos ? wxNO_LEN : len, &wlen));
1639         return wxString(buf.data(), wlen);
1640     }
1641     static wxString FromUTF8Unchecked(const char *utf8, size_t len = npos)
1642     {
1643         size_t wlen;
1644         wxWCharBuffer buf(wxMBConvUTF8().cMB2WC(utf8,
1645                                                 len == npos ? wxNO_LEN : len,
1646                                                 &wlen));
1647         wxASSERT_MSG( !utf8 || !*utf8 || wlen,
1648                       "string must be valid UTF-8" );
1649
1650         return wxString(buf.data(), wlen);
1651     }
1652     const wxCharBuffer utf8_str() const
1653       { return wxMBConvUTF8().cWC2MB(wc_str()); }
1654     const wxCharBuffer ToUTF8() const { return utf8_str(); }
1655 #endif
1656
1657     // functions for storing binary data in wxString:
1658 #if wxUSE_UNICODE
1659     static wxString From8BitData(const char *data, size_t len)
1660       { return wxString(data, wxConvISO8859_1, len); }
1661     // version for NUL-terminated data:
1662     static wxString From8BitData(const char *data)
1663       { return wxString(data, wxConvISO8859_1); }
1664     const wxCharBuffer To8BitData() const { return mb_str(wxConvISO8859_1); }
1665 #else // ANSI
1666     static wxString From8BitData(const char *data, size_t len)
1667       { return wxString(data, len); }
1668     // version for NUL-terminated data:
1669     static wxString From8BitData(const char *data)
1670       { return wxString(data); }
1671     const char *To8BitData() const { return c_str(); }
1672 #endif // Unicode/ANSI
1673
1674     // conversions with (possible) format conversions: have to return a
1675     // buffer with temporary data
1676     //
1677     // the functions defined (in either Unicode or ANSI) mode are mb_str() to
1678     // return an ANSI (multibyte) string, wc_str() to return a wide string and
1679     // fn_str() to return a string which should be used with the OS APIs
1680     // accepting the file names. The return value is always the same, but the
1681     // type differs because a function may either return pointer to the buffer
1682     // directly or have to use intermediate buffer for translation.
1683 #if wxUSE_UNICODE
1684
1685 #if wxUSE_UTF8_LOCALE_ONLY
1686     const char* mb_str() const { return wx_str(); }
1687     const wxCharBuffer mb_str(const wxMBConv& conv) const;
1688 #else
1689     const wxCharBuffer mb_str(const wxMBConv& conv = wxConvLibc) const;
1690 #endif
1691
1692     const wxWX2MBbuf mbc_str() const { return mb_str(*wxConvCurrent); }
1693
#if wxUSE_UNICODE_WCHAR
    // the internal representation is already wchar_t: return it directly
    const wchar_t* wc_str() const
    {
        return wx_str();
    }
#elif wxUSE_UNICODE_UTF8
    // returns a buffer instead of a raw pointer; implemented out of line
    const wxWCharBuffer wc_str() const;
#endif
1699     // for compatibility with !wxUSE_UNICODE version
1700     const wxWX2WCbuf wc_str(const wxMBConv& WXUNUSED(conv)) const
1701       { return wc_str(); }
1702
1703 #if wxMBFILES
1704     const wxCharBuffer fn_str() const { return mb_str(wxConvFile); }
1705 #else // !wxMBFILES
1706     const wxWX2WCbuf fn_str() const { return wc_str(); }
1707 #endif // wxMBFILES/!wxMBFILES
1708
1709 #else // ANSI
1710     const wxChar* mb_str() const { return wx_str(); }
1711
1712     // for compatibility with wxUSE_UNICODE version
1713     const char* mb_str(const wxMBConv& WXUNUSED(conv)) const { return wx_str(); }
1714
1715     const wxWX2MBbuf mbc_str() const { return mb_str(); }
1716
#if wxUSE_WCHAR_T
    // conversion to a wide character buffer using the given wxMBConv
    // (wxConvLibc by default); only declared if wxUSE_WCHAR_T is set,
    // the definition is not in this header section
    const wxWCharBuffer wc_str(const wxMBConv& conv = wxConvLibc) const;
#endif // wxUSE_WCHAR_T
1720     const wxCharBuffer fn_str() const { return wxConvFile.cWC2WX( wc_str( wxConvLibc ) ); }
1721 #endif // Unicode/ANSI
1722
1723 #if wxUSE_UNICODE_UTF8
1724     const wxWCharBuffer t_str() const { return wc_str(); }
1725 #elif wxUSE_UNICODE_WCHAR
1726     const wchar_t* t_str() const { return wx_str(); }
1727 #else
1728     const char* t_str() const { return wx_str(); }
1729 #endif
1730
1731
1732   // overloaded assignment
1733     // from another wxString
1734   wxString& operator=(const wxString& stringSrc)
1735   {
1736     if ( this != &stringSrc )
1737     {
1738         wxSTRING_INVALIDATE_CACHE();
1739
1740         m_impl = stringSrc.m_impl;
1741     }
1742
1743     return *this;
1744   }
1745
1746   wxString& operator=(const wxCStrData& cstr)
1747     { return *this = cstr.AsString(); }
1748     // from a character
1749   wxString& operator=(wxUniChar ch)
1750   {
1751     wxSTRING_INVALIDATE_CACHE();
1752
1753 #if wxUSE_UNICODE_UTF8
1754     if ( !ch.IsAscii() )
1755         m_impl = wxStringOperations::EncodeChar(ch);
1756     else
1757 #endif // wxUSE_UNICODE_UTF8
1758         m_impl = (wxStringCharType)ch;
1759     return *this;
1760   }
1761
1762   wxString& operator=(wxUniCharRef ch)
1763     { return operator=((wxUniChar)ch); }
1764   wxString& operator=(char ch)
1765     { return operator=(wxUniChar(ch)); }
1766   wxString& operator=(unsigned char ch)
1767     { return operator=(wxUniChar(ch)); }
1768   wxString& operator=(wchar_t ch)
1769     { return operator=(wxUniChar(ch)); }
1770     // from a C string - STL probably will crash on NULL,
1771     // so we need to compensate in that case
1772 #if wxUSE_STL_BASED_WXSTRING
1773   wxString& operator=(const char *psz)
1774   {
1775       wxSTRING_INVALIDATE_CACHE();
1776
1777       if ( psz )
1778           m_impl = ImplStr(psz);
1779       else
1780           clear();
1781
1782       return *this;
1783   }
1784
1785   wxString& operator=(const wchar_t *pwz)
1786   {
1787       wxSTRING_INVALIDATE_CACHE();
1788
1789       if ( pwz )
1790           m_impl = ImplStr(pwz);
1791       else
1792           clear();
1793
1794       return *this;
1795   }
1796 #else // !wxUSE_STL_BASED_WXSTRING
1797   wxString& operator=(const char *psz)
1798   {
1799       wxSTRING_INVALIDATE_CACHE();
1800
1801       m_impl = ImplStr(psz);
1802
1803       return *this;
1804   }
1805
1806   wxString& operator=(const wchar_t *pwz)
1807   {
1808       wxSTRING_INVALIDATE_CACHE();
1809
1810       m_impl = ImplStr(pwz);
1811
1812       return *this;
1813   }
1814 #endif // wxUSE_STL_BASED_WXSTRING/!wxUSE_STL_BASED_WXSTRING
1815
1816   wxString& operator=(const unsigned char *psz)
1817     { return operator=((const char*)psz); }
1818
1819     // from wxWCharBuffer
1820   wxString& operator=(const wxWCharBuffer& s)
1821     { return operator=(s.data()); } // FIXME-UTF8: fix for embedded NULs
1822     // from wxCharBuffer
1823   wxString& operator=(const wxCharBuffer& s)
1824     { return operator=(s.data()); } // FIXME-UTF8: fix for embedded NULs
1825
1826   // string concatenation
1827     // in place concatenation
1828     /*
1829         Concatenate and return the result. Note that the left to right
1830         associativity of << allows to write things like "str << str1 << str2
1831         << ..." (unlike with +=)
1832      */
1833       // string += string
1834   wxString& operator<<(const wxString& s)
1835   {
1836 #if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
1837     wxASSERT_MSG( s.IsValid(),
1838                   _T("did you forget to call UngetWriteBuf()?") );
1839 #endif
1840
1841     append(s);
1842     return *this;
1843   }
1844       // string += C string
1845   wxString& operator<<(const char *psz)
1846     { append(psz); return *this; }
1847   wxString& operator<<(const wchar_t *pwz)
1848     { append(pwz); return *this; }
1849   wxString& operator<<(const wxCStrData& psz)
1850     { append(psz.AsString()); return *this; }
1851       // string += char
1852   wxString& operator<<(wxUniChar ch) { append(1, ch); return *this; }
1853   wxString& operator<<(wxUniCharRef ch) { append(1, ch); return *this; }
1854   wxString& operator<<(char ch) { append(1, ch); return *this; }
1855   wxString& operator<<(unsigned char ch) { append(1, ch); return *this; }
1856   wxString& operator<<(wchar_t ch) { append(1, ch); return *this; }
1857
1858       // string += buffer (i.e. from wxGetString)
1859   wxString& operator<<(const wxWCharBuffer& s)
1860     { return operator<<((const wchar_t *)s); }
1861   wxString& operator<<(const wxCharBuffer& s)
1862     { return operator<<((const char *)s); }
1863
1864     // string += C string
1865   wxString& Append(const wxString& s)
1866     {
1867         // test for empty() to share the string if possible
1868         if ( empty() )
1869             *this = s;
1870         else
1871             append(s);
1872         return *this;
1873     }
1874   wxString& Append(const char* psz)
1875     { append(psz); return *this; }
1876   wxString& Append(const wchar_t* pwz)
1877     { append(pwz); return *this; }
1878   wxString& Append(const wxCStrData& psz)
1879     { append(psz); return *this; }
1880   wxString& Append(const wxCharBuffer& psz)
1881     { append(psz); return *this; }
1882   wxString& Append(const wxWCharBuffer& psz)
1883     { append(psz); return *this; }
1884   wxString& Append(const char* psz, size_t nLen)
1885     { append(psz, nLen); return *this; }
1886   wxString& Append(const wchar_t* pwz, size_t nLen)
1887     { append(pwz, nLen); return *this; }
1888   wxString& Append(const wxCStrData& psz, size_t nLen)
1889     { append(psz, nLen); return *this; }
1890   wxString& Append(const wxCharBuffer& psz, size_t nLen)
1891     { append(psz, nLen); return *this; }
1892   wxString& Append(const wxWCharBuffer& psz, size_t nLen)
1893     { append(psz, nLen); return *this; }
1894     // append count copies of given character
1895   wxString& Append(wxUniChar ch, size_t count = 1u)
1896     { append(count, ch); return *this; }
1897   wxString& Append(wxUniCharRef ch, size_t count = 1u)
1898     { append(count, ch); return *this; }
1899   wxString& Append(char ch, size_t count = 1u)
1900     { append(count, ch); return *this; }
1901   wxString& Append(unsigned char ch, size_t count = 1u)
1902     { append(count, ch); return *this; }
1903   wxString& Append(wchar_t ch, size_t count = 1u)
1904     { append(count, ch); return *this; }
1905
1906     // prepend a string, return the string itself
1907   wxString& Prepend(const wxString& str)
1908     { *this = str + *this; return *this; }
1909
    // non-destructive concatenation: all overloads below return the result as
    // a new wxString and are declared as friends of the class
      // two strings
  friend wxString WXDLLIMPEXP_BASE operator+(const wxString& string1,
                                             const wxString& string2);
      // string with a single char
  friend wxString WXDLLIMPEXP_BASE operator+(const wxString& string, wxUniChar ch);
      // char with a string
  friend wxString WXDLLIMPEXP_BASE operator+(wxUniChar ch, const wxString& string);
      // string with C string (narrow or wide)
  friend wxString WXDLLIMPEXP_BASE operator+(const wxString& string,
                                             const char *psz);
  friend wxString WXDLLIMPEXP_BASE operator+(const wxString& string,
                                             const wchar_t *pwz);
      // C string (narrow or wide) with string
  friend wxString WXDLLIMPEXP_BASE operator+(const char *psz,
                                             const wxString& string);
  friend wxString WXDLLIMPEXP_BASE operator+(const wchar_t *pwz,
                                             const wxString& string);
1928
1929   // stream-like functions
1930       // insert an int into string
1931   wxString& operator<<(int i)
1932     { return (*this) << Format(_T("%d"), i); }
1933       // insert an unsigned int into string
1934   wxString& operator<<(unsigned int ui)
1935     { return (*this) << Format(_T("%u"), ui); }
1936       // insert a long into string
1937   wxString& operator<<(long l)
1938     { return (*this) << Format(_T("%ld"), l); }
1939       // insert an unsigned long into string
1940   wxString& operator<<(unsigned long ul)
1941     { return (*this) << Format(_T("%lu"), ul); }
#if defined wxLongLong_t && !defined wxLongLongIsLong
      // insert a long long if they exist and aren't longs; the format is
      // assembled from "%", wxLongLongFmtSpec and the conversion letter
  wxString& operator<<(wxLongLong_t ll)
    {
      const wxChar *spec = _T("%") wxLongLongFmtSpec _T("d");

      return (*this) << Format(spec, ll);
    }

      // insert an unsigned long long
  wxString& operator<<(wxULongLong_t ull)
    {
      const wxChar *spec = _T("%") wxLongLongFmtSpec _T("u");

      return (*this) << Format(spec, ull);
    }
#endif // wxLongLong_t && !wxLongLongIsLong
1956       // insert a float into string
1957   wxString& operator<<(float f)
1958     { return (*this) << Format(_T("%f"), f); }
1959       // insert a double into string
1960   wxString& operator<<(double d)
1961     { return (*this) << Format(_T("%g"), d); }
1962
1963   // string comparison
1964     // case-sensitive comparison (returns a value < 0, = 0 or > 0)
1965   int Cmp(const char *psz) const
1966     { return compare(psz); }
1967   int Cmp(const wchar_t *pwz) const
1968     { return compare(pwz); }
1969   int Cmp(const wxString& s) const
1970     { return compare(s); }
1971   int Cmp(const wxCStrData& s) const
1972     { return compare(s); }
1973   int Cmp(const wxCharBuffer& s) const
1974     { return compare(s); }
1975   int Cmp(const wxWCharBuffer& s) const
1976     { return compare(s); }
1977     // same as Cmp() but not case-sensitive
1978   int CmpNoCase(const wxString& s) const;
1979
1980     // test for the string equality, either considering case or not
1981     // (if compareWithCase then the case matters)
1982   bool IsSameAs(const wxString& str, bool compareWithCase = true) const
1983   {
1984 #if !wxUSE_UNICODE_UTF8
1985       // in UTF-8 build, length() is O(n) and doing this would be _slower_
1986       if ( length() != str.length() )
1987           return false;
1988 #endif
1989       return (compareWithCase ? Cmp(str) : CmpNoCase(str)) == 0;
1990   }
1991   bool IsSameAs(const char *str, bool compareWithCase = true) const
1992     { return (compareWithCase ? Cmp(str) : CmpNoCase(str)) == 0; }
1993   bool IsSameAs(const wchar_t *str, bool compareWithCase = true) const
1994     { return (compareWithCase ? Cmp(str) : CmpNoCase(str)) == 0; }
1995
1996   bool IsSameAs(const wxCStrData& str, bool compareWithCase = true) const
1997     { return IsSameAs(str.AsString(), compareWithCase); }
1998   bool IsSameAs(const wxCharBuffer& str, bool compareWithCase = true) const
1999     { return IsSameAs(str.data(), compareWithCase); }
2000   bool IsSameAs(const wxWCharBuffer& str, bool compareWithCase = true) const
2001     { return IsSameAs(str.data(), compareWithCase); }
2002     // comparison with a single character: returns true if equal
2003   bool IsSameAs(wxUniChar c, bool compareWithCase = true) const;
2004   // FIXME-UTF8: remove these overloads
2005   bool IsSameAs(wxUniCharRef c, bool compareWithCase = true) const
2006     { return IsSameAs(wxUniChar(c), compareWithCase); }
2007   bool IsSameAs(char c, bool compareWithCase = true) const
2008     { return IsSameAs(wxUniChar(c), compareWithCase); }
2009   bool IsSameAs(unsigned char c, bool compareWithCase = true) const
2010     { return IsSameAs(wxUniChar(c), compareWithCase); }
2011   bool IsSameAs(wchar_t c, bool compareWithCase = true) const
2012     { return IsSameAs(wxUniChar(c), compareWithCase); }
2013   bool IsSameAs(int c, bool compareWithCase = true) const
2014     { return IsSameAs(wxUniChar(c), compareWithCase); }
2015
  // simple sub-string extraction
      // return the substring starting at nFirst of length nCount (or till the
      // end of the string if nCount is left at its default value of npos)
  wxString Mid(size_t nFirst, size_t nCount = npos) const;
2020
2021       // operator version of Mid()
2022   wxString  operator()(size_t start, size_t len) const
2023     { return Mid(start, len); }
2024
      // check if the string starts with the given prefix and return the rest
      // of the string in the provided pointer if it is not NULL; otherwise
      // return false
  bool StartsWith(const wxString& prefix, wxString *rest = NULL) const;
      // check if the string ends with the given suffix and return the
      // beginning of the string before the suffix in the provided pointer if
      // it is not NULL; otherwise return false
  bool EndsWith(const wxString& suffix, wxString *rest = NULL) const;

      // get first nCount characters
  wxString Left(size_t nCount) const;
      // get last nCount characters
  wxString Right(size_t nCount) const;
      // get all characters before the first occurrence of ch
      // (returns the whole string if ch not found)
  wxString BeforeFirst(wxUniChar ch) const;
      // get all characters before the last occurrence of ch
      // (returns empty string if ch not found)
  wxString BeforeLast(wxUniChar ch) const;
      // get all characters after the first occurrence of ch
      // (returns empty string if ch not found)
  wxString AfterFirst(wxUniChar ch) const;
      // get all characters after the last occurrence of ch
      // (returns the whole string if ch not found)
  wxString AfterLast(wxUniChar ch) const;
2050
2051     // for compatibility only, use more explicitly named functions above
2052   wxString Before(wxUniChar ch) const { return BeforeLast(ch); }
2053   wxString After(wxUniChar ch) const { return AfterFirst(ch); }
2054
2055   // case conversion
2056       // convert to upper case in place, return the string itself
2057   wxString& MakeUpper();
2058       // convert to upper case, return the copy of the string
2059   wxString Upper() const { return wxString(*this).MakeUpper(); }
2060       // convert to lower case in place, return the string itself
2061   wxString& MakeLower();
2062       // convert to lower case, return the copy of the string
2063   wxString Lower() const { return wxString(*this).MakeLower(); }
2064       // convert the first character to the upper case and the rest to the
2065       // lower one, return the modified string itself
2066   wxString& MakeCapitalized();
2067       // convert the first character to the upper case and the rest to the
2068       // lower one, return the copy of the string
2069   wxString Capitalize() const { return wxString(*this).MakeCapitalized(); }
2070
  // trimming/padding whitespace (either side) and truncating
      // remove spaces from the left or from the right (default) side
  wxString& Trim(bool bFromRight = true);
      // add nCount copies of chPad (a space by default) at the beginning or
      // at the end (default) of the string
  wxString& Pad(size_t nCount, wxUniChar chPad = wxT(' '), bool bFromRight = true);
2076
2077   // searching and replacing
2078       // searching (return starting index, or -1 if not found)
2079   int Find(wxUniChar ch, bool bFromEnd = false) const;   // like strchr/strrchr
2080   int Find(wxUniCharRef ch, bool bFromEnd = false) const
2081     { return Find(wxUniChar(ch), bFromEnd); }
2082   int Find(char ch, bool bFromEnd = false) const
2083     { return Find(wxUniChar(ch), bFromEnd); }
2084   int Find(unsigned char ch, bool bFromEnd = false) const
2085     { return Find(wxUniChar(ch), bFromEnd); }
2086   int Find(wchar_t ch, bool bFromEnd = false) const
2087     { return Find(wxUniChar(ch), bFromEnd); }
2088       // searching (return starting index, or -1 if not found)
2089   int Find(const wxString& sub) const               // like strstr
2090   {
2091     size_type idx = find(sub);
2092     return (idx == npos) ? wxNOT_FOUND : (int)idx;
2093   }
2094   int Find(const char *sub) const               // like strstr
2095   {
2096     size_type idx = find(sub);
2097     return (idx == npos) ? wxNOT_FOUND : (int)idx;
2098   }
2099   int Find(const wchar_t *sub) const               // like strstr
2100   {
2101     size_type idx = find(sub);
2102     return (idx == npos) ? wxNOT_FOUND : (int)idx;
2103   }
2104
2105   int Find(const wxCStrData& sub) const
2106     { return Find(sub.AsString()); }
2107   int Find(const wxCharBuffer& sub) const
2108     { return Find(sub.data()); }
2109   int Find(const wxWCharBuffer& sub) const
2110     { return Find(sub.data()); }
2111
      // replace first (or all if bReplaceAll) occurrences of substring with
      // another string, returns the number of replacements made
  size_t Replace(const wxString& strOld,
                 const wxString& strNew,
                 bool bReplaceAll = true);

    // check if the string contents matches a mask containing '*' and '?'
  bool Matches(const wxString& mask) const;
2120
    // conversion to numbers: all functions return true only if the whole
    // string is a number and put the value of this number into the pointer
    // provided; base is the numeric base in which the conversion should be
    // done and must be between 2 and 36 inclusive or be 0, in which case the
    // standard C rules apply (leading '0' => octal, "0x" => hex)
        // convert to a signed integer
    bool ToLong(long *val, int base = 10) const;
        // convert to an unsigned integer
    bool ToULong(unsigned long *val, int base = 10) const;
        // convert to wxLongLong (only available if wxLongLong_t is defined)
#if defined(wxLongLong_t)
    bool ToLongLong(wxLongLong_t *val, int base = 10) const;
        // convert to wxULongLong
    bool ToULongLong(wxULongLong_t *val, int base = 10) const;
#endif // wxLongLong_t
        // convert to a double
    bool ToDouble(double *val) const;
2138
2139
#ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
  // formatted input/output
    // as sprintf(), returns the number of characters written or < 0 on error
    // (take 'this' into account in attribute parameter count)
    //
    // the function is generated by the macro below; the commented out
    // declaration shows its conceptual signature
  // int Printf(const wxString& format, ...);
  WX_DEFINE_VARARG_FUNC(int, Printf, 1, (const wxFormatString&),
                        DoPrintfWchar, DoPrintfUtf8)
#ifdef __WATCOMC__
  // workaround for http://bugzilla.openwatcom.org/show_bug.cgi?id=351:
  // extra overloads for each supported format argument type, each wrapping
  // the argument in wxFormatString explicitly
  WX_VARARG_WATCOM_WORKAROUND(int, Printf, 1, (const wxString&),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(int, Printf, 1, (const wxCStrData&),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(int, Printf, 1, (const char*),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(int, Printf, 1, (const wchar_t*),
                              (wxFormatString(f1)));
#endif
#endif // !wxNEEDS_WXSTRING_PRINTF_MIXIN
    // as vprintf(), returns the number of characters written or < 0 on error
  int PrintfV(const wxString& format, va_list argptr);
2161
#ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
    // returns the string containing the result of Printf() to it
    //
    // the function is generated by the macro below; the commented out
    // declaration shows its conceptual signature
  // static wxString Format(const wxString& format, ...) ATTRIBUTE_PRINTF_1;
  WX_DEFINE_VARARG_FUNC(static wxString, Format, 1, (const wxFormatString&),
                        DoFormatWchar, DoFormatUtf8)
#ifdef __WATCOMC__
  // workaround for http://bugzilla.openwatcom.org/show_bug.cgi?id=351:
  // extra overloads for each supported format argument type, each wrapping
  // the argument in wxFormatString explicitly
  WX_VARARG_WATCOM_WORKAROUND(static wxString, Format, 1, (const wxString&),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(static wxString, Format, 1, (const wxCStrData&),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(static wxString, Format, 1, (const char*),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(static wxString, Format, 1, (const wchar_t*),
                              (wxFormatString(f1)));
#endif
#endif
    // the same as above, but takes a va_list
  static wxString FormatV(const wxString& format, va_list argptr);
2181
2182   // raw access to string memory
2183     // ensure that string has space for at least nLen characters
2184     // only works if the data of this string is not shared
2185   bool Alloc(size_t nLen) { reserve(nLen); return capacity() >= nLen; }
    // minimize the string's memory
    // only works if the data of this string is not shared
    // (declared here only, the definition is not in this header section)
  bool Shrink();
#if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
    // These are deprecated, use wxStringBuffer or wxStringBufferLength instead
    //
    // get writable buffer of at least nLen bytes. Unget() *must* be called
    // a.s.a.p. to put string back in a reasonable state!
  wxDEPRECATED( wxStringCharType *GetWriteBuf(size_t nLen) );
    // call this immediately after GetWriteBuf() has been used
  wxDEPRECATED( void UngetWriteBuf() );
  wxDEPRECATED( void UngetWriteBuf(size_t nLen) );
#endif // WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
2199
2200   // wxWidgets version 1 compatibility functions
2201
2202   // use Mid()
2203   wxString SubString(size_t from, size_t to) const
2204       { return Mid(from, (to - from + 1)); }
    // values for second parameter of CompareTo function
  enum caseCompare {exact, ignoreCase};
    // values for first parameter of Strip function; the values are bit
    // flags, with both being the combination of leading and trailing
  enum stripType {leading = 0x1, trailing = 0x2, both = 0x3};
2209
#ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
  // use Printf()
  // (take 'this' into account in attribute parameter count)
  //
  // generated with the same DoPrintfWchar/DoPrintfUtf8 implementation
  // functions as Printf(); the commented out declaration shows the
  // conceptual signature
  // int sprintf(const wxString& format, ...) ATTRIBUTE_PRINTF_2;
  WX_DEFINE_VARARG_FUNC(int, sprintf, 1, (const wxFormatString&),
                        DoPrintfWchar, DoPrintfUtf8)
#ifdef __WATCOMC__
  // workaround for http://bugzilla.openwatcom.org/show_bug.cgi?id=351
  WX_VARARG_WATCOM_WORKAROUND(int, sprintf, 1, (const wxString&),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(int, sprintf, 1, (const wxCStrData&),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(int, sprintf, 1, (const char*),
                              (wxFormatString(f1)));
  WX_VARARG_WATCOM_WORKAROUND(int, sprintf, 1, (const wchar_t*),
                              (wxFormatString(f1)));
#endif
#endif // wxNEEDS_WXSTRING_PRINTF_MIXIN
2228
2229     // use Cmp()
2230   int CompareTo(const wxChar* psz, caseCompare cmp = exact) const
2231     { return cmp == exact ? Cmp(psz) : CmpNoCase(psz); }
2232
2233     // use length()
2234   size_t Length() const { return length(); }
2235     // Count the number of characters
2236   int Freq(wxUniChar ch) const;
2237     // use MakeLower
2238   void LowerCase() { MakeLower(); }
2239     // use MakeUpper
2240   void UpperCase() { MakeUpper(); }
2241     // use Trim except that it doesn't change this string
2242   wxString Strip(stripType w = trailing) const;
2243
2244     // use Find (more general variants not yet supported)
2245   size_t Index(const wxChar* psz) const { return Find(psz); }
2246   size_t Index(wxUniChar ch)         const { return Find(ch);  }
2247     // use Truncate
2248   wxString& Remove(size_t pos) { return Truncate(pos); }
2249   wxString& RemoveLast(size_t n = 1) { return Truncate(length() - n); }
2250
2251   wxString& Remove(size_t nStart, size_t nLen)
2252       { return (wxString&)erase( nStart, nLen ); }
2253
2254     // use Find()
2255   int First( wxUniChar ch ) const { return Find(ch); }
2256   int First( wxUniCharRef ch ) const { return Find(ch); }
2257   int First( char ch ) const { return Find(ch); }
2258   int First( unsigned char ch ) const { return Find(ch); }
2259   int First( wchar_t ch ) const { return Find(ch); }
2260   int First( const wxString& str ) const { return Find(str); }
2261   int Last( wxUniChar ch ) const { return Find(ch, true); }
2262   bool Contains(const wxString& str) const { return Find(str) != wxNOT_FOUND; }
2263
2264     // use empty()
2265   bool IsNull() const { return empty(); }
2266
2267   // std::string compatibility functions
2268
2269     // take nLen chars starting at nPos
2270   wxString(const wxString& str, size_t nPos, size_t nLen)
2271       { assign(str, nPos, nLen); }
2272     // take all characters from first to last
2273   wxString(const_iterator first, const_iterator last)
2274       : m_impl(first.impl(), last.impl()) { }
#if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
    // the two constructors taking raw pointers exist for compatibility with
    // the existing code using pointers instead of iterators
  wxString(const char *first, const char *last)
  {
      SubstrBufFromMB buf(ImplStr(first, last - first));
      m_impl.assign(buf.data, buf.len);
  }
  wxString(const wchar_t *first, const wchar_t *last)
  {
      SubstrBufFromWC buf(ImplStr(first, last - first));
      m_impl.assign(buf.data, buf.len);
  }
    // this overload is needed to compile code adding offsets to c_str()
    // result; both arguments must refer to the same string
  wxString(const wxCStrData& first, const wxCStrData& last)
      : m_impl(CreateConstIterator(first).impl(),
               CreateConstIterator(last).impl())
  {
      wxASSERT_MSG( first.m_str == last.m_str,
                    _T("pointers must be into the same string") );
  }
#endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2297
2298   // lib.string.modifiers
    // append elements str[pos], ..., str[pos+n-1]
2300   wxString& append(const wxString& str, size_t pos, size_t n)
2301   {
2302       wxSTRING_UPDATE_CACHED_LENGTH(n);
2303
2304       size_t from, len;
2305       str.PosLenToImpl(pos, n, &from, &len);
2306       m_impl.append(str.m_impl, from, len);
2307       return *this;
2308   }
2309     // append a string
2310   wxString& append(const wxString& str)
2311   {
2312       wxSTRING_UPDATE_CACHED_LENGTH(str.length());
2313
2314       m_impl.append(str.m_impl);
2315       return *this;
2316   }
2317
2318     // append first n (or all if n == npos) characters of sz
2319   wxString& append(const char *sz)
2320   {
2321       wxSTRING_INVALIDATE_CACHED_LENGTH();
2322
2323       m_impl.append(ImplStr(sz));
2324       return *this;
2325   }
2326
2327   wxString& append(const wchar_t *sz)
2328   {
2329       wxSTRING_INVALIDATE_CACHED_LENGTH();
2330
2331       m_impl.append(ImplStr(sz));
2332       return *this;
2333   }
2334
2335   wxString& append(const char *sz, size_t n)
2336   {
2337       wxSTRING_INVALIDATE_CACHED_LENGTH();
2338
2339       SubstrBufFromMB str(ImplStr(sz, n));
2340       m_impl.append(str.data, str.len);
2341       return *this;
2342   }
2343   wxString& append(const wchar_t *sz, size_t n)
2344   {
2345       wxSTRING_UPDATE_CACHED_LENGTH(n);
2346
2347       SubstrBufFromWC str(ImplStr(sz, n));
2348       m_impl.append(str.data, str.len);
2349       return *this;
2350   }
2351
2352   wxString& append(const wxCStrData& str)
2353     { return append(str.AsString()); }
2354   wxString& append(const wxCharBuffer& str)
2355     { return append(str.data()); }
2356   wxString& append(const wxWCharBuffer& str)
2357     { return append(str.data()); }
2358   wxString& append(const wxCStrData& str, size_t n)
2359     { return append(str.AsString(), 0, n); }
2360   wxString& append(const wxCharBuffer& str, size_t n)
2361     { return append(str.data(), n); }
2362   wxString& append(const wxWCharBuffer& str, size_t n)
2363     { return append(str.data(), n); }
2364
2365     // append n copies of ch
2366   wxString& append(size_t n, wxUniChar ch)
2367   {
2368 #if wxUSE_UNICODE_UTF8
2369       if ( !ch.IsAscii() )
2370       {
2371           wxSTRING_INVALIDATE_CACHED_LENGTH();
2372
2373           m_impl.append(wxStringOperations::EncodeNChars(n, ch));
2374       }
2375       else // ASCII
2376 #endif
2377       {
2378           wxSTRING_UPDATE_CACHED_LENGTH(n);
2379
2380           m_impl.append(n, (wxStringCharType)ch);
2381       }
2382
2383       return *this;
2384   }
2385
2386   wxString& append(size_t n, wxUniCharRef ch)
2387     { return append(n, wxUniChar(ch)); }
2388   wxString& append(size_t n, char ch)
2389     { return append(n, wxUniChar(ch)); }
2390   wxString& append(size_t n, unsigned char ch)
2391     { return append(n, wxUniChar(ch)); }
2392   wxString& append(size_t n, wchar_t ch)
2393     { return append(n, wxUniChar(ch)); }
2394
2395     // append from first to last
2396   wxString& append(const_iterator first, const_iterator last)
2397   {
2398       wxSTRING_INVALIDATE_CACHED_LENGTH();
2399
2400       m_impl.append(first.impl(), last.impl());
2401       return *this;
2402   }
#if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
    // pointer ranges are converted to (pointer, count) pairs
  wxString& append(const char *first, const char *last)
  {
      return append(first, last - first);
  }
  wxString& append(const wchar_t *first, const wchar_t *last)
  {
      return append(first, last - first);
  }
  wxString& append(const wxCStrData& first, const wxCStrData& last)
  {
      return append(CreateConstIterator(first), CreateConstIterator(last));
  }
#endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2411
2412     // same as `this_string = str'
2413   wxString& assign(const wxString& str)
2414   {
2415       wxSTRING_SET_CACHED_LENGTH(str.length());
2416
2417       m_impl = str.m_impl;
2418
2419       return *this;
2420   }
2421
2422   wxString& assign(const wxString& str, size_t len)
2423   {
2424       wxSTRING_SET_CACHED_LENGTH(len);
2425
2426       m_impl.assign(str.m_impl, 0, str.LenToImpl(len));
2427
2428       return *this;
2429   }
2430
    // same as `= str[pos..pos + n - 1]'
2432   wxString& assign(const wxString& str, size_t pos, size_t n)
2433   {
2434       size_t from, len;
2435       str.PosLenToImpl(pos, n, &from, &len);
2436       m_impl.assign(str.m_impl, from, len);
2437
2438       // it's important to call this after PosLenToImpl() above in case str is
2439       // the same string as this one
2440       wxSTRING_SET_CACHED_LENGTH(n);
2441
2442       return *this;
2443   }
2444
2445     // same as `= first n (or all if n == npos) characters of sz'
2446   wxString& assign(const char *sz)
2447   {
2448       wxSTRING_INVALIDATE_CACHE();
2449
2450       m_impl.assign(ImplStr(sz));
2451
2452       return *this;
2453   }
2454
2455   wxString& assign(const wchar_t *sz)
2456   {
2457       wxSTRING_INVALIDATE_CACHE();
2458
2459       m_impl.assign(ImplStr(sz));
2460
2461       return *this;
2462   }
2463
2464   wxString& assign(const char *sz, size_t n)
2465   {
2466       wxSTRING_SET_CACHED_LENGTH(n);
2467
2468       SubstrBufFromMB str(ImplStr(sz, n));
2469       m_impl.assign(str.data, str.len);
2470
2471       return *this;
2472   }
2473
2474   wxString& assign(const wchar_t *sz, size_t n)
2475   {
2476       wxSTRING_SET_CACHED_LENGTH(n);
2477
2478       SubstrBufFromWC str(ImplStr(sz, n));
2479       m_impl.assign(str.data, str.len);
2480
2481       return *this;
2482   }
2483
2484   wxString& assign(const wxCStrData& str)
2485     { return assign(str.AsString()); }
2486   wxString& assign(const wxCharBuffer& str)
2487     { return assign(str.data()); }
2488   wxString& assign(const wxWCharBuffer& str)
2489     { return assign(str.data()); }
2490   wxString& assign(const wxCStrData& str, size_t len)
2491     { return assign(str.AsString(), len); }
2492   wxString& assign(const wxCharBuffer& str, size_t len)
2493     { return assign(str.data(), len); }
2494   wxString& assign(const wxWCharBuffer& str, size_t len)
2495     { return assign(str.data(), len); }
2496
2497     // same as `= n copies of ch'
2498   wxString& assign(size_t n, wxUniChar ch)
2499   {
2500       wxSTRING_SET_CACHED_LENGTH(n);
2501
2502 #if wxUSE_UNICODE_UTF8
2503       if ( !ch.IsAscii() )
2504           m_impl.assign(wxStringOperations::EncodeNChars(n, ch));
2505       else
2506 #endif
2507           m_impl.assign(n, (wxStringCharType)ch);
2508
2509       return *this;
2510   }
2511
2512   wxString& assign(size_t n, wxUniCharRef ch)
2513     { return assign(n, wxUniChar(ch)); }
2514   wxString& assign(size_t n, char ch)
2515     { return assign(n, wxUniChar(ch)); }
2516   wxString& assign(size_t n, unsigned char ch)
2517     { return assign(n, wxUniChar(ch)); }
2518   wxString& assign(size_t n, wchar_t ch)
2519     { return assign(n, wxUniChar(ch)); }
2520
2521     // assign from first to last
2522   wxString& assign(const_iterator first, const_iterator last)
2523   {
2524       wxSTRING_INVALIDATE_CACHE();
2525
2526       m_impl.assign(first.impl(), last.impl());
2527
2528       return *this;
2529   }
#if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
    // pointer ranges are converted to (pointer, count) pairs
  wxString& assign(const char *first, const char *last)
  {
      return assign(first, last - first);
  }
  wxString& assign(const wchar_t *first, const wchar_t *last)
  {
      return assign(first, last - first);
  }
  wxString& assign(const wxCStrData& first, const wxCStrData& last)
  {
      return assign(CreateConstIterator(first), CreateConstIterator(last));
  }
#endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2538
2539     // string comparison
  int compare(const wxString& str) const;
    // comparison with narrow and wide C strings; like the overload above,
    // these are only declared here
  int compare(const char* sz) const;
  int compare(const wchar_t* sz) const;
2543   int compare(const wxCStrData& str) const
2544     { return compare(str.AsString()); }
2545   int compare(const wxCharBuffer& str) const
2546     { return compare(str.data()); }
2547   int compare(const wxWCharBuffer& str) const
2548     { return compare(str.data()); }
2549     // comparison with a substring
  int compare(size_t nStart, size_t nLen, const wxString& str) const;
    // comparison of 2 substrings
    // NOTE(review): presumably nStart/nLen select the part of this string and
    // nStart2/nLen2 the part of str, as in std::string::compare() -- confirm
  int compare(size_t nStart, size_t nLen,
              const wxString& str, size_t nStart2, size_t nLen2) const;
    // substring comparison with first nCount characters of sz; nCount
    // defaults to npos
  int compare(size_t nStart, size_t nLen,
              const char* sz, size_t nCount = npos) const;
  int compare(size_t nStart, size_t nLen,
              const wchar_t* sz, size_t nCount = npos) const;
2559
2560     // insert another string
2561   wxString& insert(size_t nPos, const wxString& str)
2562     { insert(GetIterForNthChar(nPos), str.begin(), str.end()); return *this; }
2563     // insert n chars of str starting at nStart (in str)
2564   wxString& insert(size_t nPos, const wxString& str, size_t nStart, size_t n)
2565   {
2566       wxSTRING_UPDATE_CACHED_LENGTH(n);
2567
2568       size_t from, len;
2569       str.PosLenToImpl(nStart, n, &from, &len);
2570       m_impl.insert(PosToImpl(nPos), str.m_impl, from, len);
2571
2572       return *this;
2573   }
2574
2575     // insert first n (or all if n == npos) characters of sz
2576   wxString& insert(size_t nPos, const char *sz)
2577   {
2578       wxSTRING_INVALIDATE_CACHE();
2579
2580       m_impl.insert(PosToImpl(nPos), ImplStr(sz));
2581
2582       return *this;
2583   }
2584
2585   wxString& insert(size_t nPos, const wchar_t *sz)
2586   {
2587       wxSTRING_INVALIDATE_CACHE();
2588
2589       m_impl.insert(PosToImpl(nPos), ImplStr(sz)); return *this;
2590   }
2591
2592   wxString& insert(size_t nPos, const char *sz, size_t n)
2593   {
2594       wxSTRING_UPDATE_CACHED_LENGTH(n);
2595
2596       SubstrBufFromMB str(ImplStr(sz, n));
2597       m_impl.insert(PosToImpl(nPos), str.data, str.len);
2598
2599       return *this;
2600   }
2601
2602   wxString& insert(size_t nPos, const wchar_t *sz, size_t n)
2603   {
2604       wxSTRING_UPDATE_CACHED_LENGTH(n);
2605
2606       SubstrBufFromWC str(ImplStr(sz, n));
2607       m_impl.insert(PosToImpl(nPos), str.data, str.len);
2608
2609       return *this;
2610   }
2611
2612     // insert n copies of ch
2613   wxString& insert(size_t nPos, size_t n, wxUniChar ch)
2614   {
2615       wxSTRING_UPDATE_CACHED_LENGTH(n);
2616
2617 #if wxUSE_UNICODE_UTF8
2618       if ( !ch.IsAscii() )
2619           m_impl.insert(PosToImpl(nPos), wxStringOperations::EncodeNChars(n, ch));
2620       else
2621 #endif
2622           m_impl.insert(PosToImpl(nPos), n, (wxStringCharType)ch);
2623       return *this;
2624   }
2625
2626   iterator insert(iterator it, wxUniChar ch)
2627   {
2628       wxSTRING_UPDATE_CACHED_LENGTH(1);
2629
2630 #if wxUSE_UNICODE_UTF8
2631       if ( !ch.IsAscii() )
2632       {
2633           size_t pos = IterToImplPos(it);
2634           m_impl.insert(pos, wxStringOperations::EncodeChar(ch));
2635           return iterator(this, m_impl.begin() + pos);
2636       }
2637       else
2638 #endif
2639           return iterator(this, m_impl.insert(it.impl(), (wxStringCharType)ch));
2640   }
2641
2642   void insert(iterator it, const_iterator first, const_iterator last)
2643   {
2644       wxSTRING_INVALIDATE_CACHE();
2645
2646       m_impl.insert(it.impl(), first.impl(), last.impl());
2647   }
2648
#if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
    // the iterator is converted to a position and the pointer range to a
    // (pointer, count) pair
  void insert(iterator it, const char *first, const char *last)
  {
      insert(it - begin(), first, last - first);
  }
  void insert(iterator it, const wchar_t *first, const wchar_t *last)
  {
      insert(it - begin(), first, last - first);
  }
  void insert(iterator it, const wxCStrData& first, const wxCStrData& last)
  {
      insert(it, CreateConstIterator(first), CreateConstIterator(last));
  }
#endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2657
2658   void insert(iterator it, size_type n, wxUniChar ch)
2659   {
2660       wxSTRING_UPDATE_CACHED_LENGTH(n);
2661
2662 #if wxUSE_UNICODE_UTF8
2663       if ( !ch.IsAscii() )
2664           m_impl.insert(IterToImplPos(it), wxStringOperations::EncodeNChars(n, ch));
2665       else
2666 #endif
2667           m_impl.insert(it.impl(), n, (wxStringCharType)ch);
2668   }
2669
    // delete n characters starting from pos
2671   wxString& erase(size_type pos = 0, size_type n = npos)
2672   {
2673       wxSTRING_INVALIDATE_CACHE();
2674
2675       size_t from, len;
2676       PosLenToImpl(pos, n, &from, &len);
2677       m_impl.erase(from, len);
2678
2679       return *this;
2680   }
2681
2682     // delete characters from first up to last
2683   iterator erase(iterator first, iterator last)
2684   {
2685       wxSTRING_INVALIDATE_CACHE();
2686
2687       return iterator(this, m_impl.erase(first.impl(), last.impl()));
2688   }
2689
2690   iterator erase(iterator first)
2691   {
2692       wxSTRING_UPDATE_CACHED_LENGTH(-1);
2693
2694       return iterator(this, m_impl.erase(first.impl()));
2695   }
2696
2697 #ifdef wxSTRING_BASE_HASNT_CLEAR
2698   void clear() { erase(); }
2699 #else
2700   void clear()
2701   {
2702       wxSTRING_SET_CACHED_LENGTH(0);
2703
2704       m_impl.clear();
2705   }
2706 #endif
2707
2708     // replaces the substring of length nLen starting at nStart
2709   wxString& replace(size_t nStart, size_t nLen, const char* sz)
2710   {
2711       wxSTRING_INVALIDATE_CACHE();
2712
2713       size_t from, len;
2714       PosLenToImpl(nStart, nLen, &from, &len);
2715       m_impl.replace(from, len, ImplStr(sz));
2716
2717       return *this;
2718   }
2719
2720   wxString& replace(size_t nStart, size_t nLen, const wchar_t* sz)
2721   {
2722       wxSTRING_INVALIDATE_CACHE();
2723
2724       size_t from, len;
2725       PosLenToImpl(nStart, nLen, &from, &len);
2726       m_impl.replace(from, len, ImplStr(sz));
2727
2728       return *this;
2729   }
2730
2731     // replaces the substring of length nLen starting at nStart
2732   wxString& replace(size_t nStart, size_t nLen, const wxString& str)
2733   {
2734       wxSTRING_INVALIDATE_CACHE();
2735
2736       size_t from, len;
2737       PosLenToImpl(nStart, nLen, &from, &len);
2738       m_impl.replace(from, len, str.m_impl);
2739
2740       return *this;
2741   }
2742
2743     // replaces the substring with nCount copies of ch
2744   wxString& replace(size_t nStart, size_t nLen, size_t nCount, wxUniChar ch)
2745   {
2746       wxSTRING_INVALIDATE_CACHE();
2747
2748       size_t from, len;
2749       PosLenToImpl(nStart, nLen, &from, &len);
2750 #if wxUSE_UNICODE_UTF8
2751       if ( !ch.IsAscii() )
2752           m_impl.replace(from, len, wxStringOperations::EncodeNChars(nCount, ch));
2753       else
2754 #endif
2755           m_impl.replace(from, len, nCount, (wxStringCharType)ch);
2756
2757       return *this;
2758   }
2759
2760     // replaces a substring with another substring
2761   wxString& replace(size_t nStart, size_t nLen,
2762                     const wxString& str, size_t nStart2, size_t nLen2)
2763   {
2764       wxSTRING_INVALIDATE_CACHE();
2765
2766       size_t from, len;
2767       PosLenToImpl(nStart, nLen, &from, &len);
2768
2769       size_t from2, len2;
2770       str.PosLenToImpl(nStart2, nLen2, &from2, &len2);
2771
2772       m_impl.replace(from, len, str.m_impl, from2, len2);
2773
2774       return *this;
2775   }
2776
2777      // replaces the substring with first nCount chars of sz
2778   wxString& replace(size_t nStart, size_t nLen,
2779                     const char* sz, size_t nCount)
2780   {
2781       wxSTRING_INVALIDATE_CACHE();
2782
2783       size_t from, len;
2784       PosLenToImpl(nStart, nLen, &from, &len);
2785
2786       SubstrBufFromMB str(ImplStr(sz, nCount));
2787
2788       m_impl.replace(from, len, str.data, str.len);
2789
2790       return *this;
2791   }
2792
2793   wxString& replace(size_t nStart, size_t nLen,
2794                     const wchar_t* sz, size_t nCount)
2795   {
2796       wxSTRING_INVALIDATE_CACHE();
2797
2798       size_t from, len;
2799       PosLenToImpl(nStart, nLen, &from, &len);
2800
2801       SubstrBufFromWC str(ImplStr(sz, nCount));
2802
2803       m_impl.replace(from, len, str.data, str.len);
2804
2805       return *this;
2806   }
2807
2808   wxString& replace(size_t nStart, size_t nLen,
2809                     const wxString& s, size_t nCount)
2810   {
2811       wxSTRING_INVALIDATE_CACHE();
2812
2813       size_t from, len;
2814       PosLenToImpl(nStart, nLen, &from, &len);
2815       m_impl.replace(from, len, s.m_impl.c_str(), s.LenToImpl(nCount));
2816
2817       return *this;
2818   }
2819
2820   wxString& replace(iterator first, iterator last, const char* s)
2821   {
2822       wxSTRING_INVALIDATE_CACHE();
2823
2824       m_impl.replace(first.impl(), last.impl(), ImplStr(s));
2825
2826       return *this;
2827   }
2828
2829   wxString& replace(iterator first, iterator last, const wchar_t* s)
2830   {
2831       wxSTRING_INVALIDATE_CACHE();
2832
2833       m_impl.replace(first.impl(), last.impl(), ImplStr(s));
2834
2835       return *this;
2836   }
2837
2838   wxString& replace(iterator first, iterator last, const char* s, size_type n)
2839   {
2840       wxSTRING_INVALIDATE_CACHE();
2841
2842       SubstrBufFromMB str(ImplStr(s, n));
2843       m_impl.replace(first.impl(), last.impl(), str.data, str.len);
2844
2845       return *this;
2846   }
2847
2848   wxString& replace(iterator first, iterator last, const wchar_t* s, size_type n)
2849   {
2850       wxSTRING_INVALIDATE_CACHE();
2851
2852       SubstrBufFromWC str(ImplStr(s, n));
2853       m_impl.replace(first.impl(), last.impl(), str.data, str.len);
2854
2855       return *this;
2856   }
2857
2858   wxString& replace(iterator first, iterator last, const wxString& s)
2859   {
2860       wxSTRING_INVALIDATE_CACHE();
2861
2862       m_impl.replace(first.impl(), last.impl(), s.m_impl);
2863
2864       return *this;
2865   }
2866
2867   wxString& replace(iterator first, iterator last, size_type n, wxUniChar ch)
2868   {
2869       wxSTRING_INVALIDATE_CACHE();
2870
2871 #if wxUSE_UNICODE_UTF8
2872       if ( !ch.IsAscii() )
2873           m_impl.replace(first.impl(), last.impl(),
2874                   wxStringOperations::EncodeNChars(n, ch));
2875       else
2876 #endif
2877           m_impl.replace(first.impl(), last.impl(), n, (wxStringCharType)ch);
2878
2879       return *this;
2880   }
2881
2882   wxString& replace(iterator first, iterator last,
2883                     const_iterator first1, const_iterator last1)
2884   {
2885       wxSTRING_INVALIDATE_CACHE();
2886
2887       m_impl.replace(first.impl(), last.impl(), first1.impl(), last1.impl());
2888
2889       return *this;
2890   }
2891
2892   wxString& replace(iterator first, iterator last,
2893                     const char *first1, const char *last1)
2894     { replace(first, last, first1, last1 - first1); return *this; }
2895   wxString& replace(iterator first, iterator last,
2896                     const wchar_t *first1, const wchar_t *last1)
2897     { replace(first, last, first1, last1 - first1); return *this; }
2898
2899   // swap two strings
2900   void swap(wxString& str)
2901   {
2902 #if wxUSE_STRING_POS_CACHE
2903       // we modify not only this string but also the other one directly so we
2904       // need to invalidate cache for both of them (we could also try to
2905       // exchange their cache entries but it seems unlikely to be worth it)
2906       InvalidateCache();
2907       str.InvalidateCache();
2908 #endif // wxUSE_STRING_POS_CACHE
2909
2910       m_impl.swap(str.m_impl);
2911   }
2912
2913     // find a substring
2914   size_t find(const wxString& str, size_t nStart = 0) const
2915     { return PosFromImpl(m_impl.find(str.m_impl, PosToImpl(nStart))); }
2916
2917     // find first n characters of sz
2918   size_t find(const char* sz, size_t nStart = 0, size_t n = npos) const
2919   {
2920       SubstrBufFromMB str(ImplStr(sz, n));
2921       return PosFromImpl(m_impl.find(str.data, PosToImpl(nStart), str.len));
2922   }
2923   size_t find(const wchar_t* sz, size_t nStart = 0, size_t n = npos) const
2924   {
2925       SubstrBufFromWC str(ImplStr(sz, n));
2926       return PosFromImpl(m_impl.find(str.data, PosToImpl(nStart), str.len));
2927   }
2928   size_t find(const wxCharBuffer& s, size_t nStart = 0, size_t n = npos) const
2929     { return find(s.data(), nStart, n); }
2930   size_t find(const wxWCharBuffer& s, size_t nStart = 0, size_t n = npos) const
2931     { return find(s.data(), nStart, n); }
2932   size_t find(const wxCStrData& s, size_t nStart = 0, size_t n = npos) const
2933     { return find(s.AsWChar(), nStart, n); }
2934
    // find the first occurrence of character ch after nStart
2936   size_t find(wxUniChar ch, size_t nStart = 0) const
2937   {
2938 #if wxUSE_UNICODE_UTF8
2939     if ( !ch.IsAscii() )
2940         return PosFromImpl(m_impl.find(wxStringOperations::EncodeChar(ch),
2941                                        PosToImpl(nStart)));
2942     else
2943 #endif
2944         return PosFromImpl(m_impl.find((wxStringCharType)ch,
2945                                        PosToImpl(nStart)));
2946
2947   }
2948   size_t find(wxUniCharRef ch, size_t nStart = 0) const
2949     {  return find(wxUniChar(ch), nStart); }
2950   size_t find(char ch, size_t nStart = 0) const
2951     {  return find(wxUniChar(ch), nStart); }
2952   size_t find(unsigned char ch, size_t nStart = 0) const
2953     {  return find(wxUniChar(ch), nStart); }
2954   size_t find(wchar_t ch, size_t nStart = 0) const
2955     {  return find(wxUniChar(ch), nStart); }
2956
2957     // rfind() family is exactly like find() but works right to left
2958
2959     // as find, but from the end
2960   size_t rfind(const wxString& str, size_t nStart = npos) const
2961     { return PosFromImpl(m_impl.rfind(str.m_impl, PosToImpl(nStart))); }
2962
2963     // as find, but from the end
2964   size_t rfind(const char* sz, size_t nStart = npos, size_t n = npos) const
2965   {
2966       SubstrBufFromMB str(ImplStr(sz, n));
2967       return PosFromImpl(m_impl.rfind(str.data, PosToImpl(nStart), str.len));
2968   }
2969   size_t rfind(const wchar_t* sz, size_t nStart = npos, size_t n = npos) const
2970   {
2971       SubstrBufFromWC str(ImplStr(sz, n));
2972       return PosFromImpl(m_impl.rfind(str.data, PosToImpl(nStart), str.len));
2973   }
2974   size_t rfind(const wxCharBuffer& s, size_t nStart = npos, size_t n = npos) const
2975     { return rfind(s.data(), nStart, n); }
2976   size_t rfind(const wxWCharBuffer& s, size_t nStart = npos, size_t n = npos) const
2977     { return rfind(s.data(), nStart, n); }
2978   size_t rfind(const wxCStrData& s, size_t nStart = npos, size_t n = npos) const
2979     { return rfind(s.AsWChar(), nStart, n); }
2980     // as find, but from the end
2981   size_t rfind(wxUniChar ch, size_t nStart = npos) const
2982   {
2983 #if wxUSE_UNICODE_UTF8
2984     if ( !ch.IsAscii() )
2985         return PosFromImpl(m_impl.rfind(wxStringOperations::EncodeChar(ch),
2986                                         PosToImpl(nStart)));
2987     else
2988 #endif
2989         return PosFromImpl(m_impl.rfind((wxStringCharType)ch,
2990                                         PosToImpl(nStart)));
2991   }
2992   size_t rfind(wxUniCharRef ch, size_t nStart = npos) const
2993     {  return rfind(wxUniChar(ch), nStart); }
2994   size_t rfind(char ch, size_t nStart = npos) const
2995     {  return rfind(wxUniChar(ch), nStart); }
2996   size_t rfind(unsigned char ch, size_t nStart = npos) const
2997     {  return rfind(wxUniChar(ch), nStart); }
2998   size_t rfind(wchar_t ch, size_t nStart = npos) const
2999     {  return rfind(wxUniChar(ch), nStart); }
3000
  // find first/last occurrence of any character (not) in the set:
3002 #if wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
3003   // FIXME-UTF8: this is not entirely correct, because it doesn't work if
3004   //             sizeof(wchar_t)==2 and surrogates are present in the string;
3005   //             should we care? Probably not.
3006   size_t find_first_of(const wxString& str, size_t nStart = 0) const
3007     { return m_impl.find_first_of(str.m_impl, nStart); }
3008   size_t find_first_of(const char* sz, size_t nStart = 0) const
3009     { return m_impl.find_first_of(ImplStr(sz), nStart); }
3010   size_t find_first_of(const wchar_t* sz, size_t nStart = 0) const
3011     { return m_impl.find_first_of(ImplStr(sz), nStart); }
3012   size_t find_first_of(const char* sz, size_t nStart, size_t n) const
3013     { return m_impl.find_first_of(ImplStr(sz), nStart, n); }
3014   size_t find_first_of(const wchar_t* sz, size_t nStart, size_t n) const
3015     { return m_impl.find_first_of(ImplStr(sz), nStart, n); }
3016   size_t find_first_of(wxUniChar c, size_t nStart = 0) const
3017     { return m_impl.find_first_of((wxChar)c, nStart); }
3018
3019   size_t find_last_of(const wxString& str, size_t nStart = npos) const
3020     { return m_impl.find_last_of(str.m_impl, nStart); }
3021   size_t find_last_of(const char* sz, size_t nStart = npos) const
3022     { return m_impl.find_last_of(ImplStr(sz), nStart); }
3023   size_t find_last_of(const wchar_t* sz, size_t nStart = npos) const
3024     { return m_impl.find_last_of(ImplStr(sz), nStart); }
3025   size_t find_last_of(const char* sz, size_t nStart, size_t n) const
3026     { return m_impl.find_last_of(ImplStr(sz), nStart, n); }
3027   size_t find_last_of(const wchar_t* sz, size_t nStart, size_t n) const
3028     { return m_impl.find_last_of(ImplStr(sz), nStart, n); }
3029   size_t find_last_of(wxUniChar c, size_t nStart = npos) const
3030     { return m_impl.find_last_of((wxChar)c, nStart); }
3031
3032   size_t find_first_not_of(const wxString& str, size_t nStart = 0) const
3033     { return m_impl.find_first_not_of(str.m_impl, nStart); }
3034   size_t find_first_not_of(const char* sz, size_t nStart = 0) const
3035     { return m_impl.find_first_not_of(ImplStr(sz), nStart); }
3036   size_t find_first_not_of(const wchar_t* sz, size_t nStart = 0) const
3037     { return m_impl.find_first_not_of(ImplStr(sz), nStart); }
3038   size_t find_first_not_of(const char* sz, size_t nStart, size_t n) const
3039     { return m_impl.find_first_not_of(ImplStr(sz), nStart, n); }
3040   size_t find_first_not_of(const wchar_t* sz, size_t nStart, size_t n) const
3041     { return m_impl.find_first_not_of(ImplStr(sz), nStart, n); }
3042   size_t find_first_not_of(wxUniChar c, size_t nStart = 0) const
3043     { return m_impl.find_first_not_of((wxChar)c, nStart); }
3044
3045   size_t find_last_not_of(const wxString& str, size_t nStart = npos) const
3046     { return m_impl.find_last_not_of(str.m_impl, nStart); }
3047   size_t find_last_not_of(const char* sz, size_t nStart = npos) const
3048     { return m_impl.find_last_not_of(ImplStr(sz), nStart); }
3049   size_t find_last_not_of(const wchar_t* sz, size_t nStart = npos) const
3050     { return m_impl.find_last_not_of(ImplStr(sz), nStart); }
3051   size_t find_last_not_of(const char* sz, size_t nStart, size_t n) const
3052     { return m_impl.find_last_not_of(ImplStr(sz), nStart, n); }
3053   size_t find_last_not_of(const wchar_t* sz, size_t nStart, size_t n) const
3054     { return m_impl.find_last_not_of(ImplStr(sz), nStart, n); }
3055   size_t find_last_not_of(wxUniChar c, size_t nStart = npos) const
3056     { return m_impl.find_last_not_of((wxChar)c, nStart); }
3057 #else
3058   // we can't use std::string implementation in UTF-8 build, because the
3059   // character sets would be interpreted wrongly:
3060
3061     // as strpbrk() but starts at nStart, returns npos if not found
3062   size_t find_first_of(const wxString& str, size_t nStart = 0) const
3063 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3064     { return find_first_of(str.wc_str(), nStart); }
3065 #else
3066     { return find_first_of(str.mb_str(), nStart); }
3067 #endif
3068     // same as above
3069   size_t find_first_of(const char* sz, size_t nStart = 0) const;
3070   size_t find_first_of(const wchar_t* sz, size_t nStart = 0) const;
3071   size_t find_first_of(const char* sz, size_t nStart, size_t n) const;
3072   size_t find_first_of(const wchar_t* sz, size_t nStart, size_t n) const;
3073     // same as find(char, size_t)
3074   size_t find_first_of(wxUniChar c, size_t nStart = 0) const
3075     { return find(c, nStart); }
3076     // find the last (starting from nStart) char from str in this string
3077   size_t find_last_of (const wxString& str, size_t nStart = npos) const
3078 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3079     { return find_last_of(str.wc_str(), nStart); }
3080 #else
3081     { return find_last_of(str.mb_str(), nStart); }
3082 #endif
3083     // same as above
3084   size_t find_last_of (const char* sz, size_t nStart = npos) const;
3085   size_t find_last_of (const wchar_t* sz, size_t nStart = npos) const;
3086   size_t find_last_of(const char* sz, size_t nStart, size_t n) const;
3087   size_t find_last_of(const wchar_t* sz, size_t nStart, size_t n) const;
3088     // same as above
3089   size_t find_last_of(wxUniChar c, size_t nStart = npos) const
3090     { return rfind(c, nStart); }
3091
3092     // find first/last occurence of any character not in the set
3093
3094     // as strspn() (starting from nStart), returns npos on failure
3095   size_t find_first_not_of(const wxString& str, size_t nStart = 0) const
3096 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3097     { return find_first_not_of(str.wc_str(), nStart); }
3098 #else
3099     { return find_first_not_of(str.mb_str(), nStart); }
3100 #endif
3101     // same as above
3102   size_t find_first_not_of(const char* sz, size_t nStart = 0) const;
3103   size_t find_first_not_of(const wchar_t* sz, size_t nStart = 0) const;
3104   size_t find_first_not_of(const char* sz, size_t nStart, size_t n) const;
3105   size_t find_first_not_of(const wchar_t* sz, size_t nStart, size_t n) const;
3106     // same as above
3107   size_t find_first_not_of(wxUniChar ch, size_t nStart = 0) const;
3108     //  as strcspn()
3109   size_t find_last_not_of(const wxString& str, size_t nStart = npos) const
3110 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3111     { return find_last_not_of(str.wc_str(), nStart); }
3112 #else
3113     { return find_last_not_of(str.mb_str(), nStart); }
3114 #endif
3115     // same as above
3116   size_t find_last_not_of(const char* sz, size_t nStart = npos) const;
3117   size_t find_last_not_of(const wchar_t* sz, size_t nStart = npos) const;
3118   size_t find_last_not_of(const char* sz, size_t nStart, size_t n) const;
3119   size_t find_last_not_of(const wchar_t* sz, size_t nStart, size_t n) const;
3120     // same as above
3121   size_t find_last_not_of(wxUniChar ch, size_t nStart = npos) const;
3122 #endif // wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8 or not
3123
3124   // provide char/wchar_t/wxUniCharRef overloads for char-finding functions
3125   // above to resolve ambiguities:
3126   size_t find_first_of(wxUniCharRef ch, size_t nStart = 0) const
3127     {  return find_first_of(wxUniChar(ch), nStart); }
3128   size_t find_first_of(char ch, size_t nStart = 0) const
3129     {  return find_first_of(wxUniChar(ch), nStart); }
3130   size_t find_first_of(unsigned char ch, size_t nStart = 0) const
3131     {  return find_first_of(wxUniChar(ch), nStart); }
3132   size_t find_first_of(wchar_t ch, size_t nStart = 0) const
3133     {  return find_first_of(wxUniChar(ch), nStart); }
3134   size_t find_last_of(wxUniCharRef ch, size_t nStart = npos) const
3135     {  return find_last_of(wxUniChar(ch), nStart); }
3136   size_t find_last_of(char ch, size_t nStart = npos) const
3137     {  return find_last_of(wxUniChar(ch), nStart); }
3138   size_t find_last_of(unsigned char ch, size_t nStart = npos) const
3139     {  return find_last_of(wxUniChar(ch), nStart); }
3140   size_t find_last_of(wchar_t ch, size_t nStart = npos) const
3141     {  return find_last_of(wxUniChar(ch), nStart); }
3142   size_t find_first_not_of(wxUniCharRef ch, size_t nStart = 0) const
3143     {  return find_first_not_of(wxUniChar(ch), nStart); }
3144   size_t find_first_not_of(char ch, size_t nStart = 0) const
3145     {  return find_first_not_of(wxUniChar(ch), nStart); }
3146   size_t find_first_not_of(unsigned char ch, size_t nStart = 0) const
3147     {  return find_first_not_of(wxUniChar(ch), nStart); }
3148   size_t find_first_not_of(wchar_t ch, size_t nStart = 0) const
3149     {  return find_first_not_of(wxUniChar(ch), nStart); }
3150   size_t find_last_not_of(wxUniCharRef ch, size_t nStart = npos) const
3151     {  return find_last_not_of(wxUniChar(ch), nStart); }
3152   size_t find_last_not_of(char ch, size_t nStart = npos) const
3153     {  return find_last_not_of(wxUniChar(ch), nStart); }
3154   size_t find_last_not_of(unsigned char ch, size_t nStart = npos) const
3155     {  return find_last_not_of(wxUniChar(ch), nStart); }
3156   size_t find_last_not_of(wchar_t ch, size_t nStart = npos) const
3157     {  return find_last_not_of(wxUniChar(ch), nStart); }
3158
3159   // and additional overloads for the versions taking strings:
3160   size_t find_first_of(const wxCStrData& sz, size_t nStart = 0) const
3161     { return find_first_of(sz.AsString(), nStart); }
3162   size_t find_first_of(const wxCharBuffer& sz, size_t nStart = 0) const
3163     { return find_first_of(sz.data(), nStart); }
3164   size_t find_first_of(const wxWCharBuffer& sz, size_t nStart = 0) const
3165     { return find_first_of(sz.data(), nStart); }
3166   size_t find_first_of(const wxCStrData& sz, size_t nStart, size_t n) const
3167     { return find_first_of(sz.AsWChar(), nStart, n); }
3168   size_t find_first_of(const wxCharBuffer& sz, size_t nStart, size_t n) const
3169     { return find_first_of(sz.data(), nStart, n); }
3170   size_t find_first_of(const wxWCharBuffer& sz, size_t nStart, size_t n) const
3171     { return find_first_of(sz.data(), nStart, n); }
3172
3173   size_t find_last_of(const wxCStrData& sz, size_t nStart = 0) const
3174     { return find_last_of(sz.AsString(), nStart); }
3175   size_t find_last_of(const wxCharBuffer& sz, size_t nStart = 0) const
3176     { return find_last_of(sz.data(), nStart); }
3177   size_t find_last_of(const wxWCharBuffer& sz, size_t nStart = 0) const
3178     { return find_last_of(sz.data(), nStart); }
3179   size_t find_last_of(const wxCStrData& sz, size_t nStart, size_t n) const
3180     { return find_last_of(sz.AsWChar(), nStart, n); }
3181   size_t find_last_of(const wxCharBuffer& sz, size_t nStart, size_t n) const
3182     { return find_last_of(sz.data(), nStart, n); }
3183   size_t find_last_of(const wxWCharBuffer& sz, size_t nStart, size_t n) const
3184     { return find_last_of(sz.data(), nStart, n); }
3185
3186   size_t find_first_not_of(const wxCStrData& sz, size_t nStart = 0) const
3187     { return find_first_not_of(sz.AsString(), nStart); }
3188   size_t find_first_not_of(const wxCharBuffer& sz, size_t nStart = 0) const
3189     { return find_first_not_of(sz.data(), nStart); }
3190   size_t find_first_not_of(const wxWCharBuffer& sz, size_t nStart = 0) const
3191     { return find_first_not_of(sz.data(), nStart); }
3192   size_t find_first_not_of(const wxCStrData& sz, size_t nStart, size_t n) const
3193     { return find_first_not_of(sz.AsWChar(), nStart, n); }
3194   size_t find_first_not_of(const wxCharBuffer& sz, size_t nStart, size_t n) const
3195     { return find_first_not_of(sz.data(), nStart, n); }
3196   size_t find_first_not_of(const wxWCharBuffer& sz, size_t nStart, size_t n) const
3197     { return find_first_not_of(sz.data(), nStart, n); }
3198
3199   size_t find_last_not_of(const wxCStrData& sz, size_t nStart = 0) const
3200     { return find_last_not_of(sz.AsString(), nStart); }
3201   size_t find_last_not_of(const wxCharBuffer& sz, size_t nStart = 0) const
3202     { return find_last_not_of(sz.data(), nStart); }
3203   size_t find_last_not_of(const wxWCharBuffer& sz, size_t nStart = 0) const
3204     { return find_last_not_of(sz.data(), nStart); }
3205   size_t find_last_not_of(const wxCStrData& sz, size_t nStart, size_t n) const
3206     { return find_last_not_of(sz.AsWChar(), nStart, n); }
3207   size_t find_last_not_of(const wxCharBuffer& sz, size_t nStart, size_t n) const
3208     { return find_last_not_of(sz.data(), nStart, n); }
3209   size_t find_last_not_of(const wxWCharBuffer& sz, size_t nStart, size_t n) const
3210     { return find_last_not_of(sz.data(), nStart, n); }
3211
3212       // string += string
3213   wxString& operator+=(const wxString& s)
3214   {
3215       wxSTRING_INVALIDATE_CACHED_LENGTH();
3216
3217       m_impl += s.m_impl;
3218       return *this;
3219   }
3220       // string += C string
3221   wxString& operator+=(const char *psz)
3222   {
3223       wxSTRING_INVALIDATE_CACHED_LENGTH();
3224
3225       m_impl += ImplStr(psz);
3226       return *this;
3227   }
3228   wxString& operator+=(const wchar_t *pwz)
3229   {
3230       wxSTRING_INVALIDATE_CACHED_LENGTH();
3231
3232       m_impl += ImplStr(pwz);
3233       return *this;
3234   }
3235   wxString& operator+=(const wxCStrData& s)
3236   {
3237       wxSTRING_INVALIDATE_CACHED_LENGTH();
3238
3239       m_impl += s.AsString().m_impl;
3240       return *this;
3241   }
3242   wxString& operator+=(const wxCharBuffer& s)
3243     { return operator+=(s.data()); }
3244   wxString& operator+=(const wxWCharBuffer& s)
3245     { return operator+=(s.data()); }
3246       // string += char
3247   wxString& operator+=(wxUniChar ch)
3248   {
3249       wxSTRING_UPDATE_CACHED_LENGTH(1);
3250
3251 #if wxUSE_UNICODE_UTF8
3252       if ( !ch.IsAscii() )
3253           m_impl += wxStringOperations::EncodeChar(ch);
3254       else
3255 #endif
3256           m_impl += (wxStringCharType)ch;
3257       return *this;
3258   }
3259   wxString& operator+=(wxUniCharRef ch) { return *this += wxUniChar(ch); }
3260   wxString& operator+=(int ch) { return *this += wxUniChar(ch); }
3261   wxString& operator+=(char ch) { return *this += wxUniChar(ch); }
3262   wxString& operator+=(unsigned char ch) { return *this += wxUniChar(ch); }
3263   wxString& operator+=(wchar_t ch) { return *this += wxUniChar(ch); }
3264
3265 private:
3266 #if !wxUSE_STL_BASED_WXSTRING
3267   // helpers for wxStringBuffer and wxStringBufferLength
3268   wxStringCharType *DoGetWriteBuf(size_t nLen)
3269   {
3270       return m_impl.DoGetWriteBuf(nLen);
3271   }
3272
3273   void DoUngetWriteBuf()
3274   {
3275       wxSTRING_INVALIDATE_CACHE();
3276
3277       m_impl.DoUngetWriteBuf();
3278   }
3279
3280   void DoUngetWriteBuf(size_t nLen)
3281   {
3282       wxSTRING_SET_CACHED_LENGTH(nLen);
3283
3284       m_impl.DoUngetWriteBuf(nLen);
3285   }
3286 #endif // !wxUSE_STL_BASED_WXSTRING
3287
#ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
  // variadic functions taking a wxChar format string, declared in all
  // builds except the UTF-8 locale only one
  // NOTE(review): presumably the implementations of Printf() and Format() --
  //               confirm in string.cpp
  #if !wxUSE_UTF8_LOCALE_ONLY
  int DoPrintfWchar(const wxChar *format, ...);
  static wxString DoFormatWchar(const wxChar *format, ...);
  #endif
  // variants of the above taking a char format string, declared in UTF-8
  // build only
  #if wxUSE_UNICODE_UTF8
  int DoPrintfUtf8(const char *format, ...);
  static wxString DoFormatUtf8(const char *format, ...);
  #endif
#endif
3298
3299 #if !wxUSE_STL_BASED_WXSTRING
3300   // check string's data validity
3301   bool IsValid() const { return m_impl.GetStringData()->IsValid(); }
3302 #endif
3303
3304 private:
3305   wxStringImpl m_impl;
3306
3307   // buffers for compatibility conversion from (char*)c_str() and
3308   // (wchar_t*)c_str():
3309   // FIXME-UTF8: bechmark various approaches to keeping compatibility buffers
3310   template<typename T>
3311   struct ConvertedBuffer
3312   {
3313       ConvertedBuffer() : m_buf(NULL) {}
3314       ~ConvertedBuffer()
3315           { free(m_buf); }
3316
3317       operator T*() const { return m_buf; }
3318
3319       ConvertedBuffer& operator=(T *str)
3320       {
3321           free(m_buf);
3322           m_buf = str;
3323           return *this;
3324       }
3325
3326       T *m_buf;
3327   };
3328 #if wxUSE_UNICODE && !wxUSE_UTF8_LOCALE_ONLY
3329   ConvertedBuffer<char> m_convertedToChar;
3330 #endif
3331 #if !wxUSE_UNICODE_WCHAR
3332   ConvertedBuffer<wchar_t> m_convertedToWChar;
3333 #endif
3334
3335 #if wxUSE_UNICODE_UTF8
3336   // FIXME-UTF8: (try to) move this elsewhere (TLS) or solve differently
3337   //             assigning to character pointer to by wxString::interator may
3338   //             change the underlying wxStringImpl iterator, so we have to
3339   //             keep track of all iterators and update them as necessary:
3340   struct wxStringIteratorNodeHead
3341   {
3342       wxStringIteratorNodeHead() : ptr(NULL) {}
3343       wxStringIteratorNode *ptr;
3344
3345       // copying is disallowed as it would result in more than one pointer into
3346       // the same linked list
3347       DECLARE_NO_COPY_CLASS(wxStringIteratorNodeHead)
3348   };
3349
3350   wxStringIteratorNodeHead m_iterators;
3351
3352   friend class WXDLLIMPEXP_FWD_BASE wxStringIteratorNode;
3353   friend class WXDLLIMPEXP_FWD_BASE wxUniCharRef;
3354 #endif // wxUSE_UNICODE_UTF8
3355
3356   friend class WXDLLIMPEXP_FWD_BASE wxCStrData;
3357   friend class wxStringInternalBuffer;
3358   friend class wxStringInternalBufferLength;
3359 };
3360
3361 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
3362     #pragma warning (default:4275)
3363 #endif
3364
3365 // string iterator operators that satisfy STL Random Access Iterator
3366 // requirements:
3367 inline wxString::iterator operator+(ptrdiff_t n, wxString::iterator i)
3368   { return i + n; }
3369 inline wxString::const_iterator operator+(ptrdiff_t n, wxString::const_iterator i)
3370   { return i + n; }
3371 inline wxString::reverse_iterator operator+(ptrdiff_t n, wxString::reverse_iterator i)
3372   { return i + n; }
3373 inline wxString::const_reverse_iterator operator+(ptrdiff_t n, wxString::const_reverse_iterator i)
3374   { return i + n; }
3375
3376 // notice that even though for many compilers the friend declarations above are
3377 // enough, from the point of view of C++ standard we must have the declarations
3378 // here as friend ones are not injected in the enclosing namespace and without
3379 // them the code fails to compile with conforming compilers such as xlC or g++4
3380 wxString WXDLLIMPEXP_BASE operator+(const wxString& string1, const wxString& string2);
3381 wxString WXDLLIMPEXP_BASE operator+(const wxString& string, const char *psz);
3382 wxString WXDLLIMPEXP_BASE operator+(const wxString& string, const wchar_t *pwz);
3383 wxString WXDLLIMPEXP_BASE operator+(const char *psz, const wxString& string);
3384 wxString WXDLLIMPEXP_BASE operator+(const wchar_t *pwz, const wxString& string);
3385
3386 wxString WXDLLIMPEXP_BASE operator+(const wxString& string, wxUniChar ch);
3387 wxString WXDLLIMPEXP_BASE operator+(wxUniChar ch, const wxString& string);
3388
3389 inline wxString operator+(const wxString& string, wxUniCharRef ch)
3390     { return string + (wxUniChar)ch; }
3391 inline wxString operator+(const wxString& string, char ch)
3392     { return string + wxUniChar(ch); }
3393 inline wxString operator+(const wxString& string, wchar_t ch)
3394     { return string + wxUniChar(ch); }
3395 inline wxString operator+(wxUniCharRef ch, const wxString& string)
3396     { return (wxUniChar)ch + string; }
3397 inline wxString operator+(char ch, const wxString& string)
3398     { return wxUniChar(ch) + string; }
3399 inline wxString operator+(wchar_t ch, const wxString& string)
3400     { return wxUniChar(ch) + string; }
3401
3402
3403 #define wxGetEmptyString() wxString()
3404
3405 // ----------------------------------------------------------------------------
3406 // helper functions which couldn't be defined inline
3407 // ----------------------------------------------------------------------------
3408
namespace wxPrivate
{

// Specializations of wxStringAsBufHelper for char and wchar_t.
//
// Get() returns the contents of the string s as a buffer of the given
// character type and, if len is not NULL, stores the length of the returned
// buffer in *len. For the character type which is the native one in the
// current build the buffer is a non-owning one created from s.wx_str(); for
// the other type it is the result of a conversion (mb_str() or wc_str()).

#if wxUSE_UNICODE_WCHAR

template <>
struct wxStringAsBufHelper<char>
{
    static wxCharBuffer Get(const wxString& s, size_t *len)
    {
        wxCharBuffer buf(s.mb_str());
        if ( len )
        {
            // the buffer may be NULL, don't pass it to strlen() then
            *len = buf ? strlen(buf) : 0;
        }
        return buf;
    }
};

template <>
struct wxStringAsBufHelper<wchar_t>
{
    static wxWCharBuffer Get(const wxString& s, size_t *len)
    {
        if ( len )
            *len = s.length();
        return wxWCharBuffer::CreateNonOwned(s.wx_str());
    }
};

#elif wxUSE_UNICODE_UTF8

template <>
struct wxStringAsBufHelper<char>
{
    static wxCharBuffer Get(const wxString& s, size_t *len)
    {
        if ( len )
            *len = s.utf8_length();
        return wxCharBuffer::CreateNonOwned(s.wx_str());
    }
};

template <>
struct wxStringAsBufHelper<wchar_t>
{
    static wxWCharBuffer Get(const wxString& s, size_t *len)
    {
        wxWCharBuffer wbuf(s.wc_str());
        if ( len )
        {
            // guard against a NULL buffer in the same way as the char helper
            // of the wchar_t build does instead of passing it to wxWcslen()
            *len = wbuf ? wxWcslen(wbuf) : 0;
        }
        return wbuf;
    }
};

#endif // Unicode build kind

} // namespace wxPrivate
3465
3466 // ----------------------------------------------------------------------------
3467 // wxStringBuffer: a tiny class allowing to get a writable pointer into string
3468 // ----------------------------------------------------------------------------
3469
3470 #if !wxUSE_STL_BASED_WXSTRING
3471 // string buffer for direct access to string data in their native
3472 // representation:
3473 class wxStringInternalBuffer
3474 {
3475 public:
3476     typedef wxStringCharType CharType;
3477
3478     wxStringInternalBuffer(wxString& str, size_t lenWanted = 1024)
3479         : m_str(str), m_buf(NULL)
3480         { m_buf = m_str.DoGetWriteBuf(lenWanted); }
3481
3482     ~wxStringInternalBuffer() { m_str.DoUngetWriteBuf(); }
3483
3484     operator wxStringCharType*() const { return m_buf; }
3485
3486 private:
3487     wxString&         m_str;
3488     wxStringCharType *m_buf;
3489
3490     DECLARE_NO_COPY_CLASS(wxStringInternalBuffer)
3491 };
3492
3493 class wxStringInternalBufferLength
3494 {
3495 public:
3496     typedef wxStringCharType CharType;
3497
3498     wxStringInternalBufferLength(wxString& str, size_t lenWanted = 1024)
3499         : m_str(str), m_buf(NULL), m_len(0), m_lenSet(false)
3500     {
3501         m_buf = m_str.DoGetWriteBuf(lenWanted);
3502         wxASSERT(m_buf != NULL);
3503     }
3504
3505     ~wxStringInternalBufferLength()
3506     {
3507         wxASSERT(m_lenSet);
3508         m_str.DoUngetWriteBuf(m_len);
3509     }
3510
3511     operator wxStringCharType*() const { return m_buf; }
3512     void SetLength(size_t length) { m_len = length; m_lenSet = true; }
3513
3514 private:
3515     wxString&         m_str;
3516     wxStringCharType *m_buf;
3517     size_t            m_len;
3518     bool              m_lenSet;
3519
3520     DECLARE_NO_COPY_CLASS(wxStringInternalBufferLength)
3521 };
3522
3523 #endif // !wxUSE_STL_BASED_WXSTRING
3524
3525 template<typename T>
3526 class WXDLLIMPEXP_BASE wxStringTypeBufferBase
3527 {
3528 public:
3529     typedef T CharType;
3530
3531     wxStringTypeBufferBase(wxString& str, size_t lenWanted = 1024)
3532         : m_str(str), m_buf(lenWanted)
3533     {
3534         // for compatibility with old wxStringBuffer which provided direct
3535         // access to wxString internal buffer, initialize ourselves with the
3536         // string initial contents
3537
3538         // FIXME-VC6: remove the ugly (CharType *)NULL and use normal
3539         //            tchar_str<CharType>
3540         size_t len;
3541         const wxCharTypeBuffer<CharType> buf(str.tchar_str(&len, (CharType *)NULL));
3542         if ( buf )
3543         {
3544             if ( len > lenWanted )
3545             {
3546                 // in this case there is not enough space for terminating NUL,
3547                 // ensure that we still put it there
3548                 m_buf.data()[lenWanted] = 0;
3549                 len = lenWanted - 1;
3550             }
3551
3552             memcpy(m_buf.data(), buf, (len + 1)*sizeof(CharType));
3553         }
3554         //else: conversion failed, this can happen when trying to get Unicode
3555         //      string contents into a char string
3556     }
3557
3558     operator CharType*() { return m_buf.data(); }
3559
3560 protected:
3561     wxString& m_str;
3562     wxCharTypeBuffer<CharType> m_buf;
3563 };
3564
3565 template<typename T>
3566 class WXDLLIMPEXP_BASE wxStringTypeBufferLengthBase
3567     : public wxStringTypeBufferBase<T>
3568 {
3569 public:
3570     wxStringTypeBufferLengthBase(wxString& str, size_t lenWanted = 1024)
3571         : wxStringTypeBufferBase<T>(str, lenWanted),
3572           m_len(0),
3573           m_lenSet(false)
3574         { }
3575
3576     ~wxStringTypeBufferLengthBase()
3577     {
3578         wxASSERT_MSG( this->m_lenSet, "forgot to call SetLength()" );
3579     }
3580
3581     void SetLength(size_t length) { m_len = length; m_lenSet = true; }
3582
3583 protected:
3584     size_t m_len;
3585     bool m_lenSet;
3586 };
3587
3588 template<typename T>
3589 class wxStringTypeBuffer : public wxStringTypeBufferBase<T>
3590 {
3591 public:
3592     wxStringTypeBuffer(wxString& str, size_t lenWanted = 1024)
3593         : wxStringTypeBufferBase<T>(str, lenWanted)
3594         { }
3595
3596     ~wxStringTypeBuffer()
3597     {
3598         this->m_str.assign(this->m_buf.data());
3599     }
3600
3601     DECLARE_NO_COPY_CLASS(wxStringTypeBuffer)
3602 };
3603
3604 template<typename T>
3605 class wxStringTypeBufferLength : public wxStringTypeBufferLengthBase<T>
3606 {
3607 public:
3608     wxStringTypeBufferLength(wxString& str, size_t lenWanted = 1024)
3609         : wxStringTypeBufferLengthBase<T>(str, lenWanted)
3610         { }
3611
3612     ~wxStringTypeBufferLength()
3613     {
3614         this->m_str.assign(this->m_buf.data(), this->m_len);
3615     }
3616
3617     DECLARE_NO_COPY_CLASS(wxStringTypeBufferLength)
3618 };
3619
3620 #if wxUSE_STL_BASED_WXSTRING
3621
3622 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE( wxStringTypeBufferBase<wxStringCharType> )
3623
3624 class wxStringInternalBuffer : public wxStringTypeBufferBase<wxStringCharType>
3625 {
3626 public:
3627     wxStringInternalBuffer(wxString& str, size_t lenWanted = 1024)
3628         : wxStringTypeBufferBase<wxStringCharType>(str, lenWanted) {}
3629     ~wxStringInternalBuffer()
3630         { m_str.m_impl.assign(m_buf.data()); }
3631
3632     DECLARE_NO_COPY_CLASS(wxStringInternalBuffer)
3633 };
3634
3635 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE(
3636     wxStringTypeBufferLengthBase<wxStringCharType> )
3637
3638 class wxStringInternalBufferLength
3639     : public wxStringTypeBufferLengthBase<wxStringCharType>
3640 {
3641 public:
3642     wxStringInternalBufferLength(wxString& str, size_t lenWanted = 1024)
3643         : wxStringTypeBufferLengthBase<wxStringCharType>(str, lenWanted) {}
3644
3645     ~wxStringInternalBufferLength()
3646     {
3647         m_str.m_impl.assign(m_buf.data(), m_len);
3648     }
3649
3650     DECLARE_NO_COPY_CLASS(wxStringInternalBufferLength)
3651 };
3652
3653 #endif // wxUSE_STL_BASED_WXSTRING
3654
3655
3656 #if wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8
3657 typedef wxStringTypeBuffer<wxChar>        wxStringBuffer;
3658 typedef wxStringTypeBufferLength<wxChar>  wxStringBufferLength;
3659 #else // if !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
3660 typedef wxStringInternalBuffer                wxStringBuffer;
3661 typedef wxStringInternalBufferLength          wxStringBufferLength;
3662 #endif // !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
3663
3664 #if wxUSE_UNICODE_UTF8
3665 typedef wxStringInternalBuffer                wxUTF8StringBuffer;
3666 typedef wxStringInternalBufferLength          wxUTF8StringBufferLength;
3667 #elif wxUSE_UNICODE_WCHAR
3668
3669 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE( wxStringTypeBufferBase<char> )
3670
3671 class WXDLLIMPEXP_BASE wxUTF8StringBuffer : public wxStringTypeBufferBase<char>
3672 {
3673 public:
3674     wxUTF8StringBuffer(wxString& str, size_t lenWanted = 1024)
3675         : wxStringTypeBufferBase<char>(str, lenWanted) {}
3676     ~wxUTF8StringBuffer();
3677
3678     DECLARE_NO_COPY_CLASS(wxUTF8StringBuffer)
3679 };
3680
3681 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE( wxStringTypeBufferLengthBase<char> )
3682
3683 class WXDLLIMPEXP_BASE wxUTF8StringBufferLength
3684     : public wxStringTypeBufferLengthBase<char>
3685 {
3686 public:
3687     wxUTF8StringBufferLength(wxString& str, size_t lenWanted = 1024)
3688         : wxStringTypeBufferLengthBase<char>(str, lenWanted) {}
3689     ~wxUTF8StringBufferLength();
3690
3691     DECLARE_NO_COPY_CLASS(wxUTF8StringBufferLength)
3692 };
3693 #endif // wxUSE_UNICODE_UTF8/wxUSE_UNICODE_WCHAR
3694
3695
3696 // ---------------------------------------------------------------------------
3697 // wxString comparison functions: operator versions are always case sensitive
3698 // ---------------------------------------------------------------------------
3699
3700 #define wxCMP_WXCHAR_STRING(p, s, op) 0 op s.Cmp(p)
3701
3702 wxDEFINE_ALL_COMPARISONS(const wxChar *, const wxString&, wxCMP_WXCHAR_STRING)
3703
3704 #undef wxCMP_WXCHAR_STRING
3705
3706 inline bool operator==(const wxString& s1, const wxString& s2)
3707     { return s1.IsSameAs(s2); }
3708 inline bool operator!=(const wxString& s1, const wxString& s2)
3709     { return !s1.IsSameAs(s2); }
3710 inline bool operator< (const wxString& s1, const wxString& s2)
3711     { return s1.Cmp(s2) < 0; }
3712 inline bool operator> (const wxString& s1, const wxString& s2)
3713     { return s1.Cmp(s2) >  0; }
3714 inline bool operator<=(const wxString& s1, const wxString& s2)
3715     { return s1.Cmp(s2) <= 0; }
3716 inline bool operator>=(const wxString& s1, const wxString& s2)
3717     { return s1.Cmp(s2) >= 0; }
3718
3719 inline bool operator==(const wxString& s1, const wxCStrData& s2)
3720     { return s1 == s2.AsString(); }
3721 inline bool operator==(const wxCStrData& s1, const wxString& s2)
3722     { return s1.AsString() == s2; }
3723 inline bool operator!=(const wxString& s1, const wxCStrData& s2)
3724     { return s1 != s2.AsString(); }
3725 inline bool operator!=(const wxCStrData& s1, const wxString& s2)
3726     { return s1.AsString() != s2; }
3727
3728 inline bool operator==(const wxString& s1, const wxWCharBuffer& s2)
3729     { return (s1.Cmp((const wchar_t *)s2) == 0); }
3730 inline bool operator==(const wxWCharBuffer& s1, const wxString& s2)
3731     { return (s2.Cmp((const wchar_t *)s1) == 0); }
3732 inline bool operator!=(const wxString& s1, const wxWCharBuffer& s2)
3733     { return (s1.Cmp((const wchar_t *)s2) != 0); }
3734 inline bool operator!=(const wxWCharBuffer& s1, const wxString& s2)
3735     { return (s2.Cmp((const wchar_t *)s1) != 0); }
3736
3737 inline bool operator==(const wxString& s1, const wxCharBuffer& s2)
3738     { return (s1.Cmp((const char *)s2) == 0); }
3739 inline bool operator==(const wxCharBuffer& s1, const wxString& s2)
3740     { return (s2.Cmp((const char *)s1) == 0); }
3741 inline bool operator!=(const wxString& s1, const wxCharBuffer& s2)
3742     { return (s1.Cmp((const char *)s2) != 0); }
3743 inline bool operator!=(const wxCharBuffer& s1, const wxString& s2)
3744     { return (s2.Cmp((const char *)s1) != 0); }
3745
3746 inline wxString operator+(const wxString& string, const wxWCharBuffer& buf)
3747     { return string + (const wchar_t *)buf; }
3748 inline wxString operator+(const wxWCharBuffer& buf, const wxString& string)
3749     { return (const wchar_t *)buf + string; }
3750
3751 inline wxString operator+(const wxString& string, const wxCharBuffer& buf)
3752     { return string + (const char *)buf; }
3753 inline wxString operator+(const wxCharBuffer& buf, const wxString& string)
3754     { return (const char *)buf + string; }
3755
3756 // comparison with char
3757 inline bool operator==(const wxUniChar& c, const wxString& s) { return s.IsSameAs(c); }
3758 inline bool operator==(const wxUniCharRef& c, const wxString& s) { return s.IsSameAs(c); }
3759 inline bool operator==(char c, const wxString& s) { return s.IsSameAs(c); }
3760 inline bool operator==(wchar_t c, const wxString& s) { return s.IsSameAs(c); }
3761 inline bool operator==(int c, const wxString& s) { return s.IsSameAs(c); }
3762 inline bool operator==(const wxString& s, const wxUniChar& c) { return s.IsSameAs(c); }
3763 inline bool operator==(const wxString& s, const wxUniCharRef& c) { return s.IsSameAs(c); }
3764 inline bool operator==(const wxString& s, char c) { return s.IsSameAs(c); }
3765 inline bool operator==(const wxString& s, wchar_t c) { return s.IsSameAs(c); }
3766 inline bool operator!=(const wxUniChar& c, const wxString& s) { return !s.IsSameAs(c); }
3767 inline bool operator!=(const wxUniCharRef& c, const wxString& s) { return !s.IsSameAs(c); }
3768 inline bool operator!=(char c, const wxString& s) { return !s.IsSameAs(c); }
3769 inline bool operator!=(wchar_t c, const wxString& s) { return !s.IsSameAs(c); }
3770 inline bool operator!=(int c, const wxString& s) { return !s.IsSameAs(c); }
3771 inline bool operator!=(const wxString& s, const wxUniChar& c) { return !s.IsSameAs(c); }
3772 inline bool operator!=(const wxString& s, const wxUniCharRef& c) { return !s.IsSameAs(c); }
3773 inline bool operator!=(const wxString& s, char c) { return !s.IsSameAs(c); }
3774 inline bool operator!=(const wxString& s, wchar_t c) { return !s.IsSameAs(c); }
3775
3776 // comparison with C string in Unicode build
3777 #if wxUSE_UNICODE
3778
3779 #define wxCMP_CHAR_STRING(p, s, op) wxString(p) op s
3780
3781 wxDEFINE_ALL_COMPARISONS(const char *, const wxString&, wxCMP_CHAR_STRING)
3782
3783 #undef wxCMP_CHAR_STRING
3784
3785 #endif // wxUSE_UNICODE
3786
3787 // we also need to provide the operators for comparison with wxCStrData to
3788 // resolve ambiguity between operator(const wxChar *,const wxString &) and
3789 // operator(const wxChar *, const wxChar *) for "p == s.c_str()"
3790 //
3791 // notice that these are (shallow) pointer comparisons, not (deep) string ones
3792 #define wxCMP_CHAR_CSTRDATA(p, s, op) p op s.AsChar()
3793 #define wxCMP_WCHAR_CSTRDATA(p, s, op) p op s.AsWChar()
3794
3795 wxDEFINE_ALL_COMPARISONS(const wchar_t *, const wxCStrData&, wxCMP_WCHAR_CSTRDATA)
3796 wxDEFINE_ALL_COMPARISONS(const char *, const wxCStrData&, wxCMP_CHAR_CSTRDATA)
3797
3798 #undef wxCMP_CHAR_CSTRDATA
3799 #undef wxCMP_WCHAR_CSTRDATA
3800
3801 // ---------------------------------------------------------------------------
3802 // Implementation only from here until the end of file
3803 // ---------------------------------------------------------------------------
3804
3805 #if wxUSE_STD_IOSTREAM
3806
3807 #include "wx/iosfwrap.h"
3808
3809 WXDLLIMPEXP_BASE wxSTD ostream& operator<<(wxSTD ostream&, const wxString&);
3810 WXDLLIMPEXP_BASE wxSTD ostream& operator<<(wxSTD ostream&, const wxCStrData&);
3811 WXDLLIMPEXP_BASE wxSTD ostream& operator<<(wxSTD ostream&, const wxCharBuffer&);
3812 #ifndef __BORLANDC__
3813 WXDLLIMPEXP_BASE wxSTD ostream& operator<<(wxSTD ostream&, const wxWCharBuffer&);
3814 #endif
3815
3816 #if wxUSE_UNICODE && defined(HAVE_WOSTREAM)
3817
3818 WXDLLIMPEXP_BASE wxSTD wostream& operator<<(wxSTD wostream&, const wxString&);
3819 WXDLLIMPEXP_BASE wxSTD wostream& operator<<(wxSTD wostream&, const wxCStrData&);
3820 WXDLLIMPEXP_BASE wxSTD wostream& operator<<(wxSTD wostream&, const wxWCharBuffer&);
3821
3822 #endif  // wxUSE_UNICODE && defined(HAVE_WOSTREAM)
3823
3824 #endif  // wxUSE_STD_IOSTREAM
3825
3826 // ---------------------------------------------------------------------------
3827 // wxCStrData implementation
3828 // ---------------------------------------------------------------------------
3829
3830 inline wxCStrData::wxCStrData(char *buf)
3831     : m_str(new wxString(buf)), m_offset(0), m_owned(true) {}
3832 inline wxCStrData::wxCStrData(wchar_t *buf)
3833     : m_str(new wxString(buf)), m_offset(0), m_owned(true) {}
3834
3835 inline wxCStrData::wxCStrData(const wxCStrData& data)
3836     : m_str(data.m_owned ? new wxString(*data.m_str) : data.m_str),
3837       m_offset(data.m_offset),
3838       m_owned(data.m_owned)
3839 {
3840 }
3841
3842 inline wxCStrData::~wxCStrData()
3843 {
3844     if ( m_owned )
3845         delete wx_const_cast(wxString*, m_str); // cast to silence warnings
3846 }
3847
3848 // simple cases for AsChar() and AsWChar(), the complicated ones are
3849 // in string.cpp
3850 #if wxUSE_UNICODE_WCHAR
3851 inline const wchar_t* wxCStrData::AsWChar() const
3852 {
3853     return m_str->wx_str() + m_offset;
3854 }
3855 #endif // wxUSE_UNICODE_WCHAR
3856
3857 #if !wxUSE_UNICODE
3858 inline const char* wxCStrData::AsChar() const
3859 {
3860     return m_str->wx_str() + m_offset;
3861 }
3862 #endif // !wxUSE_UNICODE
3863
#if wxUSE_UTF8_LOCALE_ONLY
// Returns a pointer into the string's wx_str() buffer; the offset is applied
// using wxStringOperations::AddToIter() instead of raw pointer arithmetic.
inline const char* wxCStrData::AsChar() const
{
    const char * const start = m_str->wx_str();

    return wxStringOperations::AddToIter(start, m_offset);
}
#endif // wxUSE_UTF8_LOCALE_ONLY
3870
3871 inline const wxCharBuffer wxCStrData::AsCharBuf() const
3872 {
3873 #if !wxUSE_UNICODE
3874     return wxCharBuffer::CreateNonOwned(AsChar());
3875 #else
3876     return AsString().mb_str();
3877 #endif
3878 }
3879
3880 inline const wxWCharBuffer wxCStrData::AsWCharBuf() const
3881 {
3882 #if wxUSE_UNICODE_WCHAR
3883     return wxWCharBuffer::CreateNonOwned(AsWChar());
3884 #else
3885     return AsString().wc_str();
3886 #endif
3887 }
3888
3889 inline wxString wxCStrData::AsString() const
3890 {
3891     if ( m_offset == 0 )
3892         return *m_str;
3893     else
3894         return m_str->Mid(m_offset);
3895 }
3896
3897 inline const wxStringCharType *wxCStrData::AsInternal() const
3898 {
3899 #if wxUSE_UNICODE_UTF8
3900     return wxStringOperations::AddToIter(m_str->wx_str(), m_offset);
3901 #else
3902     return m_str->wx_str() + m_offset;
3903 #endif
3904 }
3905
3906 inline wxUniChar wxCStrData::operator*() const
3907 {
3908     if ( m_str->empty() )
3909         return wxUniChar(_T('\0'));
3910     else
3911         return (*m_str)[m_offset];
3912 }
3913
3914 inline wxUniChar wxCStrData::operator[](size_t n) const
3915 {
3916     // NB: we intentionally use operator[] and not at() here because the former
3917     //     works for the terminating NUL while the latter does not
3918     return (*m_str)[m_offset + n];
3919 }
3920
3921 // ----------------------------------------------------------------------------
3922 // more wxCStrData operators
3923 // ----------------------------------------------------------------------------
3924
3925 // we need to define those to allow "size_t pos = p - s.c_str()" where p is
3926 // some pointer into the string
3927 inline size_t operator-(const char *p, const wxCStrData& cs)
3928 {
3929     return p - cs.AsChar();
3930 }
3931
3932 inline size_t operator-(const wchar_t *p, const wxCStrData& cs)
3933 {
3934     return p - cs.AsWChar();
3935 }
3936
3937 // ----------------------------------------------------------------------------
3938 // implementation of wx[W]CharBuffer inline methods using wxCStrData
3939 // ----------------------------------------------------------------------------
3940
3941 // FIXME-UTF8: move this to buffer.h
3942 inline wxCharBuffer::wxCharBuffer(const wxCStrData& cstr)
3943                     : wxCharTypeBufferBase(cstr.AsCharBuf())
3944 {
3945 }
3946
3947 inline wxWCharBuffer::wxWCharBuffer(const wxCStrData& cstr)
3948                     : wxCharTypeBufferBase(cstr.AsWCharBuf())
3949 {
3950 }
3951
3952 #if wxUSE_UNICODE_UTF8
3953 // ----------------------------------------------------------------------------
3954 // implementation of wxStringIteratorNode inline methods
3955 // ----------------------------------------------------------------------------
3956
3957 void wxStringIteratorNode::DoSet(const wxString *str,
3958                                  wxStringImpl::const_iterator *citer,
3959                                  wxStringImpl::iterator *iter)
3960 {
3961     m_prev = NULL;
3962     m_iter = iter;
3963     m_citer = citer;
3964     m_str = str;
3965     if ( str )
3966     {
3967         m_next = str->m_iterators.ptr;
3968         wx_const_cast(wxString*, m_str)->m_iterators.ptr = this;
3969         if ( m_next )
3970             m_next->m_prev = this;
3971     }
3972     else
3973     {
3974         m_next = NULL;
3975     }
3976 }
3977
3978 void wxStringIteratorNode::clear()
3979 {
3980     if ( m_next )
3981         m_next->m_prev = m_prev;
3982     if ( m_prev )
3983         m_prev->m_next = m_next;
3984     else if ( m_str ) // first in the list
3985         wx_const_cast(wxString*, m_str)->m_iterators.ptr = m_next;
3986
3987     m_next = m_prev = NULL;
3988     m_citer = NULL;
3989     m_iter = NULL;
3990     m_str = NULL;
3991 }
3992 #endif // wxUSE_UNICODE_UTF8
3993
3994 #if WXWIN_COMPATIBILITY_2_8
    // a lot of code out there doesn't explicitly include wx/crt.h but uses
    // the CRT wrappers that are now declared in wx/wxcrt.h and
    // wx/wxcrtvararg.h, so include this header here, now that wxString is
    // defined and it is safe to do so:
3999     #include "wx/crt.h"
4000 #endif
4001
#endif  // _WX_WXSTRING_H__