1 ///////////////////////////////////////////////////////////////////////////////
3 // Purpose: wxString class
4 // Author: Vadim Zeitlin
8 // Copyright: (c) 1998 Vadim Zeitlin <zeitlin@dptmaths.ens-cachan.fr>
9 // Licence: wxWindows licence
10 ///////////////////////////////////////////////////////////////////////////////
13 Efficient string class [more or less] compatible with MFC CString,
14 wxWidgets version 1 wxString and std::string and some handy functions
15 missing from string.h.
18 #ifndef _WX_WXSTRING_H__
19 #define _WX_WXSTRING_H__
21 // ----------------------------------------------------------------------------
23 // ----------------------------------------------------------------------------
25 #include "wx/defs.h" // everybody should include this
28 #if defined(__WXMAC__) || defined(__VISAGECPP__)
32 #if defined(__VISAGECPP__) && __IBMCPP__ >= 400
33 // problem in VACPP V4 with including stdlib.h multiple times
34 // strconv includes it anyway
47 #ifdef HAVE_STRCASECMP_IN_STRINGS_H
48 #include <strings.h> // for strcasecmp()
49 #endif // HAVE_STRCASECMP_IN_STRINGS_H
50 #endif // ! __WXPALMOS5__
52 #include "wx/wxcrtbase.h" // for wxChar, wxStrlen() etc.
53 #include "wx/strvararg.h"
54 #include "wx/buffer.h" // for wxCharBuffer
55 #include "wx/strconv.h" // for wxConvertXXX() macros and wxMBConv classes
56 #include "wx/stringimpl.h"
57 #include "wx/stringops.h"
58 #include "wx/unichar.h"
60 // by default we cache the mapping of the positions in UTF-8 string to the byte
61 // offset as this results in noticeable performance improvements for loops over
62 // strings using indices; comment out this line to disable this
64 // notice that this optimization is well worth using even in debug builds as it
65 // changes asymptotic complexity of algorithms using indices to iterate over
66 // wxString back to expected linear from quadratic
68 // also notice that wxTLS_TYPE() (__declspec(thread) in this case) is unsafe to
69 // use in DLL build under pre-Vista Windows so we disable this code for now, if
70 // anybody really needs to use UTF-8 build under Windows with this optimization
71 // it would have to be re-tested and probably corrected
72 // CS: under OSX release builds the string destructor/cache cleanup sometimes
73 // crashes, disable until we find the true reason or a better workaround
74 #if wxUSE_UNICODE_UTF8 && !defined(__WXMSW__) && !defined(__WXOSX__)
75 #define wxUSE_STRING_POS_CACHE 1
77 #define wxUSE_STRING_POS_CACHE 0
80 #if wxUSE_STRING_POS_CACHE
83 // change this 0 to 1 to enable additional (very expensive) asserts
84 // verifying that string caching logic works as expected
86 #define wxSTRING_CACHE_ASSERT(cond) wxASSERT(cond)
88 #define wxSTRING_CACHE_ASSERT(cond)
90 #endif // wxUSE_STRING_POS_CACHE
92 class WXDLLIMPEXP_FWD_BASE wxString
;
94 // unless this symbol is predefined to disable the compatibility functions, do
96 #ifndef WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
97 #define WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER 1
102 template <typename T
> struct wxStringAsBufHelper
;
105 // ---------------------------------------------------------------------------
107 // ---------------------------------------------------------------------------
109 // casts [unfortunately!] needed to call some broken functions which require
110 // "char *" instead of "const char *"
111 #define WXSTRINGCAST (wxChar *)(const wxChar *)
112 #define wxCSTRINGCAST (wxChar *)(const wxChar *)
113 #define wxMBSTRINGCAST (char *)(const char *)
114 #define wxWCSTRINGCAST (wchar_t *)(const wchar_t *)
116 // ----------------------------------------------------------------------------
118 // ----------------------------------------------------------------------------
120 #if WXWIN_COMPATIBILITY_2_6
122 // deprecated in favour of wxString::npos, don't use in new code
124 // maximum possible length for a string means "take all string" everywhere
125 #define wxSTRING_MAXLEN wxString::npos
127 #endif // WXWIN_COMPATIBILITY_2_6
129 // ---------------------------------------------------------------------------
130 // global functions complementing standard C string library replacements for
131 // strlen() and portable strcasecmp()
132 //---------------------------------------------------------------------------
134 #if WXWIN_COMPATIBILITY_2_8
135 // Use wxXXX() functions from wxcrt.h instead! These functions are for
136 // backwards compatibility only.
138 // checks whether the passed in pointer is NULL or the string is empty
139 wxDEPRECATED( inline bool IsEmpty(const char *p
) );
// Returns true when p is a null pointer or points at an empty C string,
// false as soon as there is at least one character to read.
inline bool IsEmpty(const char *p)
{
    if ( !p )
        return true;

    return *p == '\0';
}
142 // safe version of strlen() (returns 0 if passed NULL pointer)
143 wxDEPRECATED( inline size_t Strlen(const char *psz
) );
// NULL-tolerant strlen(): a null pointer is reported as having length 0,
// anything else is measured with the standard strlen().
inline size_t Strlen(const char *psz)
{
    if ( !psz )
        return 0;

    return strlen(psz);
}
147 // portable strcasecmp/_stricmp
148 wxDEPRECATED( inline int Stricmp(const char *psz1
, const char *psz2
) );
149 inline int Stricmp(const char *psz1
, const char *psz2
)
151 #if defined(__VISUALC__) && defined(__WXWINCE__)
152 register char c1
, c2
;
154 c1
= tolower(*psz1
++);
155 c2
= tolower(*psz2
++);
156 } while ( c1
&& (c1
== c2
) );
159 #elif defined(__VISUALC__) || ( defined(__MWERKS__) && defined(__INTEL__) )
160 return _stricmp(psz1
, psz2
);
161 #elif defined(__SC__)
162 return _stricmp(psz1
, psz2
);
163 #elif defined(__BORLANDC__)
164 return stricmp(psz1
, psz2
);
165 #elif defined(__WATCOMC__)
166 return stricmp(psz1
, psz2
);
167 #elif defined(__DJGPP__)
168 return stricmp(psz1
, psz2
);
169 #elif defined(__EMX__)
170 return stricmp(psz1
, psz2
);
171 #elif defined(__WXPM__)
172 return stricmp(psz1
, psz2
);
173 #elif defined(__WXPALMOS__) || \
174 defined(HAVE_STRCASECMP_IN_STRING_H) || \
175 defined(HAVE_STRCASECMP_IN_STRINGS_H) || \
176 defined(__GNUWIN32__)
177 return strcasecmp(psz1
, psz2
);
178 #elif defined(__MWERKS__) && !defined(__INTEL__)
179 register char c1
, c2
;
181 c1
= tolower(*psz1
++);
182 c2
= tolower(*psz2
++);
183 } while ( c1
&& (c1
== c2
) );
187 // almost all compilers/libraries provide this function (unfortunately under
188 // different names), that's why we don't implement our own which will surely
189 // be more efficient than this code (uncomment to use):
191 register char c1, c2;
193 c1 = tolower(*psz1++);
194 c2 = tolower(*psz2++);
195 } while ( c1 && (c1 == c2) );
200 #error "Please define string case-insensitive compare for your OS/compiler"
201 #endif // OS/compiler
204 #endif // WXWIN_COMPATIBILITY_2_8
206 // ----------------------------------------------------------------------------
208 // ----------------------------------------------------------------------------
210 // Lightweight object returned by wxString::c_str() and implicitly convertible
211 // to either const char* or const wchar_t*.
215 // Ctors; for internal use by wxString and wxCStrData only
216 wxCStrData(const wxString
*str
, size_t offset
= 0, bool owned
= false)
217 : m_str(str
), m_offset(offset
), m_owned(owned
) {}
220 // Ctor constructs the object from char literal; they are needed to make
221 // operator?: compile and they intentionally take char*, not const char*
222 inline wxCStrData(char *buf
);
223 inline wxCStrData(wchar_t *buf
);
224 inline wxCStrData(const wxCStrData
& data
);
226 inline ~wxCStrData();
228 // AsWChar() and AsChar() can't be defined here as they use wxString and so
229 // must come after it and because of this won't be inlined when called from
230 // wxString methods (without a lot of work to extract these wxString methods
231 // from inside the class itself). But we still define them being inline
232 // below to let compiler inline them from elsewhere. And because of this we
233 // must declare them as inline here because otherwise some compilers give
234 // warnings about them, e.g. mingw32 3.4.5 warns about "<symbol> defined
235 // locally after being referenced with dllimport linkage" while IRIX
236 // mipsPro 7.4 warns about "function declared inline after being called".
237 inline const wchar_t* AsWChar() const;
238 operator const wchar_t*() const { return AsWChar(); }
240 inline const char* AsChar() const;
241 const unsigned char* AsUnsignedChar() const
242 { return (const unsigned char *) AsChar(); }
243 operator const char*() const { return AsChar(); }
244 operator const unsigned char*() const { return AsUnsignedChar(); }
246 operator const void*() const { return AsChar(); }
248 // returns buffers that are valid as long as the associated wxString exists
249 const wxScopedCharBuffer
AsCharBuf() const
251 return wxScopedCharBuffer::CreateNonOwned(AsChar());
254 const wxScopedWCharBuffer
AsWCharBuf() const
256 return wxScopedWCharBuffer::CreateNonOwned(AsWChar());
259 inline wxString
AsString() const;
261 // returns the value as C string in internal representation (equivalent
262 // to AsString().wx_str(), but more efficient)
263 const wxStringCharType
*AsInternal() const;
265 // allow expressions like "c_str()[0]":
266 inline wxUniChar
operator[](size_t n
) const;
267 wxUniChar
operator[](int n
) const { return operator[](size_t(n
)); }
268 wxUniChar
operator[](long n
) const { return operator[](size_t(n
)); }
269 #ifndef wxSIZE_T_IS_UINT
270 wxUniChar
operator[](unsigned int n
) const { return operator[](size_t(n
)); }
271 #endif // size_t != unsigned int
273 // These operators are needed to emulate the pointer semantics of c_str():
274 // expressions like "wxChar *p = str.c_str() + 1;" should continue to work
275 // (we need both versions to resolve ambiguities). Note that this means
276 // the 'n' value is interpreted as addition to char*/wchar_t* pointer, it
277 // is *not* number of Unicode characters in wxString.
278 wxCStrData
operator+(int n
) const
279 { return wxCStrData(m_str
, m_offset
+ n
, m_owned
); }
280 wxCStrData
operator+(long n
) const
281 { return wxCStrData(m_str
, m_offset
+ n
, m_owned
); }
282 wxCStrData
operator+(size_t n
) const
283 { return wxCStrData(m_str
, m_offset
+ n
, m_owned
); }
285 // and these for "str.c_str() + (p2 - p1)" (it also works for any integer
286 // expression but it must be ptrdiff_t and not e.g. int to work in this
288 wxCStrData
operator-(ptrdiff_t n
) const
290 wxASSERT_MSG( n
<= (ptrdiff_t)m_offset
,
291 wxT("attempt to construct address before the beginning of the string") );
292 return wxCStrData(m_str
, m_offset
- n
, m_owned
);
295 // this operator is needed to make expressions like "*c_str()" or
296 // "*(c_str() + 2)" work
297 inline wxUniChar
operator*() const;
300 // the wxString this object was returned for
301 const wxString
*m_str
;
302 // Offset into c_str() return value. Note that this is *not* offset in
303 // m_str in Unicode characters. Instead, it is index into the
304 // char*/wchar_t* buffer returned by c_str(). Its interpretation depends
305 // on how the wxCStrData instance is used: if it is eventually cast to
306 // const char*, m_offset will be in bytes from the string's start; if it is
307 // cast to const wchar_t*, it will be in wchar_t values.
309 // should m_str be deleted, i.e. is it owned by us?
312 friend class WXDLLIMPEXP_FWD_BASE wxString
;
315 // ----------------------------------------------------------------------------
316 // wxStringPrintfMixin
317 // ---------------------------------------------------------------------------
319 // NB: VC6 has a bug that causes linker errors if you have template methods
320 // in a class using __declspec(dllimport). The solution is to split such
321 // class into two classes, one that contains the template methods and does
322 // *not* use WXDLLIMPEXP_BASE and another class that contains the rest
323 // (with DLL linkage).
325 // We only do this for VC6 here, because the code is less efficient
326 // (Printf() has to use dynamic_cast<>) and because OpenWatcom compiler
327 // cannot compile this code.
329 #if defined(__VISUALC__) && __VISUALC__ < 1300
330 #define wxNEEDS_WXSTRING_PRINTF_MIXIN
333 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
334 // this class contains implementation of wxString's vararg methods, it's
335 // exported from wxBase DLL
336 class WXDLLIMPEXP_BASE wxStringPrintfMixinBase
339 wxStringPrintfMixinBase() {}
341 #if !wxUSE_UTF8_LOCALE_ONLY
342 int DoPrintfWchar(const wxChar
*format
, ...);
343 static wxString
DoFormatWchar(const wxChar
*format
, ...);
345 #if wxUSE_UNICODE_UTF8
346 int DoPrintfUtf8(const char *format
, ...);
347 static wxString
DoFormatUtf8(const char *format
, ...);
351 // this class contains template wrappers for wxString's vararg methods, it's
352 // intentionally *not* exported from the DLL in order to fix the VC6 bug
354 class wxStringPrintfMixin
: public wxStringPrintfMixinBase
357 // to further complicate things, we can't return wxString from
358 // wxStringPrintfMixin::Format() because wxString is not yet declared at
359 // this point; the solution is to use this fake type trait template - this
360 // way the compiler won't know the return type until Format() is used
361 // (this doesn't compile with Watcom, but VC6 compiles it just fine):
362 template<typename T
> struct StringReturnType
364 typedef wxString type
;
368 // these are duplicated wxString methods, they're also declared below
369 // if !wxNEEDS_WXSTRING_PRINTF_MIXIN:
371 // static wxString Format(const wxString& format, ...) WX_ATTRIBUTE_PRINTF_1;
372 WX_DEFINE_VARARG_FUNC_SANS_N0(static typename StringReturnType
<T1
>::type
,
373 Format
, 1, (const wxFormatString
&),
374 DoFormatWchar
, DoFormatUtf8
)
375 // We have to implement the version without template arguments manually
376 // because of the StringReturnType<> hack, although WX_DEFINE_VARARG_FUNC
377 // normally does it itself. It has to be a template so that we can use
378 // the hack, even though there's no real template parameter. We can't move
379 // it to wxString, because it would shadow these versions of Format() then.
381 inline static typename StringReturnType
<T
>::type
384 // NB: this doesn't compile if T is not (some form of) a string;
385 // this makes Format's prototype equivalent to
386 // Format(const wxFormatString& fmt)
387 return DoFormatWchar(wxFormatString(fmt
));
390 // int Printf(const wxString& format, ...);
391 WX_DEFINE_VARARG_FUNC(int, Printf
, 1, (const wxFormatString
&),
392 DoPrintfWchar
, DoPrintfUtf8
)
393 // int sprintf(const wxString& format, ...) WX_ATTRIBUTE_PRINTF_2;
394 WX_DEFINE_VARARG_FUNC(int, sprintf
, 1, (const wxFormatString
&),
395 DoPrintfWchar
, DoPrintfUtf8
)
398 wxStringPrintfMixin() : wxStringPrintfMixinBase() {}
400 #endif // wxNEEDS_WXSTRING_PRINTF_MIXIN
403 // ----------------------------------------------------------------------------
404 // wxString: string class trying to be compatible with std::string, MFC
405 // CString and wxWindows 1.x wxString all at once
406 // ---------------------------------------------------------------------------
408 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
409 // "non dll-interface class 'wxStringPrintfMixin' used as base interface
410 // for dll-interface class 'wxString'" -- this is OK in our case
411 #pragma warning (push)
412 #pragma warning (disable:4275)
415 #if wxUSE_UNICODE_UTF8
416 // see the comment near wxString::iterator for why we need this
417 class WXDLLIMPEXP_BASE wxStringIteratorNode
420 wxStringIteratorNode()
421 : m_str(NULL
), m_citer(NULL
), m_iter(NULL
), m_prev(NULL
), m_next(NULL
) {}
422 wxStringIteratorNode(const wxString
*str
,
423 wxStringImpl::const_iterator
*citer
)
424 { DoSet(str
, citer
, NULL
); }
425 wxStringIteratorNode(const wxString
*str
, wxStringImpl::iterator
*iter
)
426 { DoSet(str
, NULL
, iter
); }
427 ~wxStringIteratorNode()
430 inline void set(const wxString
*str
, wxStringImpl::const_iterator
*citer
)
431 { clear(); DoSet(str
, citer
, NULL
); }
432 inline void set(const wxString
*str
, wxStringImpl::iterator
*iter
)
433 { clear(); DoSet(str
, NULL
, iter
); }
435 const wxString
*m_str
;
436 wxStringImpl::const_iterator
*m_citer
;
437 wxStringImpl::iterator
*m_iter
;
438 wxStringIteratorNode
*m_prev
, *m_next
;
442 inline void DoSet(const wxString
*str
,
443 wxStringImpl::const_iterator
*citer
,
444 wxStringImpl::iterator
*iter
);
446 // the node belongs to a particular iterator instance, it's not copied
447 // when a copy of the iterator is made
448 wxDECLARE_NO_COPY_CLASS(wxStringIteratorNode
);
450 #endif // wxUSE_UNICODE_UTF8
452 class WXDLLIMPEXP_BASE wxString
453 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
454 : public wxStringPrintfMixin
457 // NB: special care was taken in arranging the member functions in such order
458 // that all inline functions can be effectively inlined, verify that all
459 // performance critical functions are still inlined if you change order!
461 // an 'invalid' value for string index, moved to this place due to a CW bug
462 static const size_t npos
;
465 // if we hadn't made these operators private, it would be possible to
466 // compile "wxString s; s = 17;" without any warnings as 17 is implicitly
467 // converted to char in C and we do have operator=(char)
469 // NB: we don't need other versions (short/long and unsigned) as attempt
470 // to assign another numeric type to wxString will now result in
471 // ambiguity between operator=(char) and operator=(int)
472 wxString
& operator=(int);
474 // these methods are not implemented - there is _no_ conversion from int to
475 // string, you're doing something wrong if the compiler wants to call it!
477 // try `s << i' or `s.Printf("%d", i)' instead
481 // buffer for holding temporary substring when using any of the methods
482 // that take (char*,size_t) or (wchar_t*,size_t) arguments:
484 struct SubstrBufFromType
489 SubstrBufFromType(const T
& data_
, size_t len_
)
490 : data(data_
), len(len_
)
492 wxASSERT_MSG( len
!= npos
, "must have real length" );
496 #if wxUSE_UNICODE_UTF8
497 // even char* -> char* needs conversion, from locale charset to UTF-8
498 typedef SubstrBufFromType
<wxScopedCharBuffer
> SubstrBufFromWC
;
499 typedef SubstrBufFromType
<wxScopedCharBuffer
> SubstrBufFromMB
;
500 #elif wxUSE_UNICODE_WCHAR
501 typedef SubstrBufFromType
<const wchar_t*> SubstrBufFromWC
;
502 typedef SubstrBufFromType
<wxScopedWCharBuffer
> SubstrBufFromMB
;
504 typedef SubstrBufFromType
<const char*> SubstrBufFromMB
;
505 typedef SubstrBufFromType
<wxScopedCharBuffer
> SubstrBufFromWC
;
509 // Functions implementing primitive operations on string data; wxString
510 // methods and iterators are implemented in terms of it. The differences
511 // between UTF-8 and wchar_t* representations of the string are mostly
514 #if wxUSE_UNICODE_UTF8
515 static SubstrBufFromMB
ConvertStr(const char *psz
, size_t nLength
,
516 const wxMBConv
& conv
);
517 static SubstrBufFromWC
ConvertStr(const wchar_t *pwz
, size_t nLength
,
518 const wxMBConv
& conv
);
519 #elif wxUSE_UNICODE_WCHAR
520 static SubstrBufFromMB
ConvertStr(const char *psz
, size_t nLength
,
521 const wxMBConv
& conv
);
523 static SubstrBufFromWC
ConvertStr(const wchar_t *pwz
, size_t nLength
,
524 const wxMBConv
& conv
);
527 #if !wxUSE_UNICODE_UTF8 // wxUSE_UNICODE_WCHAR or !wxUSE_UNICODE
528 // returns C string encoded as the implementation expects:
530 static const wchar_t* ImplStr(const wchar_t* str
)
531 { return str
? str
: wxT(""); }
532 static const SubstrBufFromWC
ImplStr(const wchar_t* str
, size_t n
)
533 { return SubstrBufFromWC(str
, (str
&& n
== npos
) ? wxWcslen(str
) : n
); }
534 static wxScopedWCharBuffer
ImplStr(const char* str
,
535 const wxMBConv
& conv
= wxConvLibc
)
536 { return ConvertStr(str
, npos
, conv
).data
; }
537 static SubstrBufFromMB
ImplStr(const char* str
, size_t n
,
538 const wxMBConv
& conv
= wxConvLibc
)
539 { return ConvertStr(str
, n
, conv
); }
541 static const char* ImplStr(const char* str
,
542 const wxMBConv
& WXUNUSED(conv
) = wxConvLibc
)
543 { return str
? str
: ""; }
544 static const SubstrBufFromMB
ImplStr(const char* str
, size_t n
,
545 const wxMBConv
& WXUNUSED(conv
) = wxConvLibc
)
546 { return SubstrBufFromMB(str
, (str
&& n
== npos
) ? wxStrlen(str
) : n
); }
547 static wxScopedCharBuffer
ImplStr(const wchar_t* str
)
548 { return ConvertStr(str
, npos
, wxConvLibc
).data
; }
549 static SubstrBufFromWC
ImplStr(const wchar_t* str
, size_t n
)
550 { return ConvertStr(str
, n
, wxConvLibc
); }
553 // translates position index in wxString to/from index in underlying
// Identity mapping: in this branch the position is returned unchanged.
static size_t PosToImpl(size_t pos)
{
    return pos;
}
// Identity mapping for a (position, length) pair: both values are copied
// unchanged into the caller-supplied output locations.
static void PosLenToImpl(size_t pos, size_t len,
                         size_t *implPos, size_t *implLen)
{
    *implPos = pos;
    *implLen = len;
}
// Identity mapping: in this branch the length is returned unchanged.
static size_t LenToImpl(size_t len)
{
    return len;
}
// Identity mapping: in this branch the position is returned unchanged.
static size_t PosFromImpl(size_t pos)
{
    return pos;
}
562 // we don't want to define these as empty inline functions as it could
563 // result in noticeable (and quite unnecessary in non-UTF-8 build) slowdown
564 // in debug build where the inline functions are not effectively inlined
565 #define wxSTRING_INVALIDATE_CACHE()
566 #define wxSTRING_INVALIDATE_CACHED_LENGTH()
567 #define wxSTRING_UPDATE_CACHED_LENGTH(n)
568 #define wxSTRING_SET_CACHED_LENGTH(n)
570 #else // wxUSE_UNICODE_UTF8
572 static wxScopedCharBuffer
ImplStr(const char* str
,
573 const wxMBConv
& conv
= wxConvLibc
)
574 { return ConvertStr(str
, npos
, conv
).data
; }
575 static SubstrBufFromMB
ImplStr(const char* str
, size_t n
,
576 const wxMBConv
& conv
= wxConvLibc
)
577 { return ConvertStr(str
, n
, conv
); }
579 static wxScopedCharBuffer
ImplStr(const wchar_t* str
)
580 { return ConvertStr(str
, npos
, wxMBConvUTF8()).data
; }
581 static SubstrBufFromWC
ImplStr(const wchar_t* str
, size_t n
)
582 { return ConvertStr(str
, n
, wxMBConvUTF8()); }
584 #if wxUSE_STRING_POS_CACHE
585 // this is an extremely simple cache used by PosToImpl(): each cache element
586 // contains the string it applies to and the index corresponding to the last
587 // used position in this wxString in its m_impl string
589 // NB: notice that this struct (and nested Element one) must be a POD or we
590 // wouldn't be able to use a thread-local variable of this type, in
591 // particular it should have no ctor -- we rely on statics being
592 // initialized to 0 instead
599 const wxString
*str
; // the string to which this element applies
600 size_t pos
, // the cached index in this string
601 impl
, // the corresponding position in its m_impl
602 len
; // cached length or npos if unknown
604 // reset cached index to 0
605 void ResetPos() { pos
= impl
= 0; }
607 // reset position and length
608 void Reset() { ResetPos(); len
= npos
; }
611 // cache the indices mapping for the last few strings used
612 Element cached
[SIZE
];
614 // the last used index
618 #ifndef wxHAS_COMPILER_TLS
619 // we must use an accessor function and not a static variable when the TLS
620 // variables support is implemented in the library (and not by the compiler)
621 // because the global s_cache variable could be not yet initialized when a
622 // ctor of another global object is executed and if that ctor uses any
623 // wxString methods, bad things happen
625 // however notice that this approach does not work when compiler TLS is used,
626 // at least not with g++ 4.1.2 under amd64 as it apparently compiles code
627 // using this accessor incorrectly when optimizations are enabled (-O2 is
628 // enough) -- luckily we don't need it then either as static __thread
629 // variables are initialized by 0 anyhow then and so we can use the variable
631 WXEXPORT
static Cache
& GetCache()
633 static wxTLS_TYPE(Cache
) s_cache
;
635 return wxTLS_VALUE(s_cache
);
638 // this helper struct is used to ensure that GetCache() is called during
639 // static initialization time, i.e. before any threads creation, as otherwise
640 // the static s_cache construction inside GetCache() wouldn't be MT-safe
641 friend struct wxStrCacheInitializer
;
642 #else // wxHAS_COMPILER_TLS
643 static wxTLS_TYPE(Cache
) ms_cache
;
644 static Cache
& GetCache() { return wxTLS_VALUE(ms_cache
); }
645 #endif // !wxHAS_COMPILER_TLS/wxHAS_COMPILER_TLS
647 static Cache::Element
*GetCacheBegin() { return GetCache().cached
; }
648 static Cache::Element
*GetCacheEnd() { return GetCacheBegin() + Cache::SIZE
; }
649 static unsigned& LastUsedCacheElement() { return GetCache().lastUsed
; }
651 // this is used in debug builds only to provide a convenient function,
652 // callable from a debugger, to show the cache contents
653 friend struct wxStrCacheDumper
;
655 // uncomment this to have access to some profiling statistics on program
657 //#define wxPROFILE_STRING_CACHE
659 #ifdef wxPROFILE_STRING_CACHE
660 static struct PosToImplCacheStats
662 unsigned postot
, // total non-trivial calls to PosToImpl
663 poshits
, // cache hits from PosToImpl()
664 mishits
, // cached position beyond the needed one
665 sumpos
, // sum of all positions, used to compute the
666 // average position after dividing by postot
667 sumofs
, // sum of all offsets after using the cache, used to
668 // compute the average after dividing by hits
669 lentot
, // number of total calls to length()
670 lenhits
; // number of cache hits in length()
673 friend struct wxStrCacheStatsDumper
;
675 #define wxCACHE_PROFILE_FIELD_INC(field) ms_cacheStats.field++
676 #define wxCACHE_PROFILE_FIELD_ADD(field, val) ms_cacheStats.field += (val)
677 #else // !wxPROFILE_STRING_CACHE
678 #define wxCACHE_PROFILE_FIELD_INC(field)
679 #define wxCACHE_PROFILE_FIELD_ADD(field, val)
680 #endif // wxPROFILE_STRING_CACHE/!wxPROFILE_STRING_CACHE
682 // note: it could seem that the functions below shouldn't be inline because
683 // they are big, contain loops and so the compiler shouldn't be able to
684 // inline them anyhow, however moving them into string.cpp does decrease the
685 // code performance by ~5%, at least when using g++ 4.1 so do keep them here
686 // unless tests show that it's not advantageous any more
688 // return the pointer to the cache element for this string or NULL if not
690 Cache::Element
*FindCacheElement() const
692 // profiling seems to show a small but consistent gain if we use this
693 // simple loop instead of starting from the last used element (there are
694 // a lot of misses in this function...)
695 Cache::Element
* const cacheBegin
= GetCacheBegin();
696 #ifndef wxHAS_COMPILER_TLS
697 // during destruction tls calls may return NULL, in this case return NULL
698 // immediately without accessing anything else
699 if ( cacheBegin
== NULL
)
702 Cache::Element
* const cacheEnd
= GetCacheEnd();
703 for ( Cache::Element
*c
= cacheBegin
; c
!= cacheEnd
; c
++ )
705 if ( c
->str
== this )
712 // unlike FindCacheElement(), this one always returns a valid pointer to the
713 // cache element for this string, it may have valid last cached position and
714 // its corresponding index in the byte string or not
715 Cache::Element
*GetCacheElement() const
717 Cache::Element
* const cacheBegin
= GetCacheBegin();
718 Cache::Element
* const cacheEnd
= GetCacheEnd();
719 Cache::Element
* const cacheStart
= cacheBegin
+ LastUsedCacheElement();
721 // check the last used first, this does no (measurable) harm for a miss
722 // but does help for simple loops addressing the same string all the time
723 if ( cacheStart
->str
== this )
726 // notice that we're going to check cacheStart again inside this call but
727 // profiling shows that it's still faster to use a simple loop like
728 // inside FindCacheElement() than manually looping with wrapping starting
729 // from the cache entry after the start one
730 Cache::Element
*c
= FindCacheElement();
733 // claim the next cache entry for this string
735 if ( ++c
== cacheEnd
)
741 // and remember the last used element
742 LastUsedCacheElement() = c
- cacheBegin
;
748 size_t DoPosToImpl(size_t pos
) const
750 wxCACHE_PROFILE_FIELD_INC(postot
);
752 // NB: although the case of pos == 1 (and offset from cached position
753 // equal to 1) are common, nothing is gained by writing special code
754 // for handling them, the compiler (at least g++ 4.1 used) seems to
755 // optimize the code well enough on its own
757 wxCACHE_PROFILE_FIELD_ADD(sumpos
, pos
);
759 Cache::Element
* const cache
= GetCacheElement();
761 // cached position can't be 0 so if it is, it means that this entry was
762 // used for length caching only so far, i.e. it doesn't count as a hit
763 // from our point of view
766 wxCACHE_PROFILE_FIELD_INC(poshits
);
769 if ( pos
== cache
->pos
)
772 // this seems to happen only rarely so just reset the cache in this case
773 // instead of complicating code even further by seeking backwards in this
775 if ( cache
->pos
> pos
)
777 wxCACHE_PROFILE_FIELD_INC(mishits
);
782 wxCACHE_PROFILE_FIELD_ADD(sumofs
, pos
- cache
->pos
);
785 wxStringImpl::const_iterator
i(m_impl
.begin() + cache
->impl
);
786 for ( size_t n
= cache
->pos
; n
< pos
; n
++ )
787 wxStringOperations::IncIter(i
);
790 cache
->impl
= i
- m_impl
.begin();
792 wxSTRING_CACHE_ASSERT(
793 (int)cache
->impl
== (begin() + pos
).impl() - m_impl
.begin() );
798 void InvalidateCache()
800 Cache::Element
* const cache
= FindCacheElement();
805 void InvalidateCachedLength()
807 Cache::Element
* const cache
= FindCacheElement();
812 void SetCachedLength(size_t len
)
814 // we optimistically cache the length here even if the string wasn't
815 // present in the cache before, this seems to do no harm and the
816 // potential for avoiding length recomputation for long strings looks
818 GetCacheElement()->len
= len
;
821 void UpdateCachedLength(ptrdiff_t delta
)
823 Cache::Element
* const cache
= FindCacheElement();
824 if ( cache
&& cache
->len
!= npos
)
826 wxSTRING_CACHE_ASSERT( (ptrdiff_t)cache
->len
+ delta
>= 0 );
832 #define wxSTRING_INVALIDATE_CACHE() InvalidateCache()
833 #define wxSTRING_INVALIDATE_CACHED_LENGTH() InvalidateCachedLength()
834 #define wxSTRING_UPDATE_CACHED_LENGTH(n) UpdateCachedLength(n)
835 #define wxSTRING_SET_CACHED_LENGTH(n) SetCachedLength(n)
836 #else // !wxUSE_STRING_POS_CACHE
837 size_t DoPosToImpl(size_t pos
) const
839 return (begin() + pos
).impl() - m_impl
.begin();
842 #define wxSTRING_INVALIDATE_CACHE()
843 #define wxSTRING_INVALIDATE_CACHED_LENGTH()
844 #define wxSTRING_UPDATE_CACHED_LENGTH(n)
845 #define wxSTRING_SET_CACHED_LENGTH(n)
846 #endif // wxUSE_STRING_POS_CACHE/!wxUSE_STRING_POS_CACHE
848 size_t PosToImpl(size_t pos
) const
850 return pos
== 0 || pos
== npos
? pos
: DoPosToImpl(pos
);
853 void PosLenToImpl(size_t pos
, size_t len
, size_t *implPos
, size_t *implLen
) const;
855 size_t LenToImpl(size_t len
) const
858 PosLenToImpl(0, len
, &pos
, &len2
);
862 size_t PosFromImpl(size_t pos
) const
864 if ( pos
== 0 || pos
== npos
)
867 return const_iterator(this, m_impl
.begin() + pos
) - begin();
869 #endif // !wxUSE_UNICODE_UTF8/wxUSE_UNICODE_UTF8
873 typedef wxUniChar value_type
;
874 typedef wxUniChar char_type
;
875 typedef wxUniCharRef reference
;
876 typedef wxChar
* pointer
;
877 typedef const wxChar
* const_pointer
;
879 typedef size_t size_type
;
880 typedef wxUniChar const_reference
;
883 #if wxUSE_UNICODE_UTF8
884 // random access is not O(1), as required by Random Access Iterator
885 #define WX_STR_ITERATOR_TAG std::bidirectional_iterator_tag
887 #define WX_STR_ITERATOR_TAG std::random_access_iterator_tag
889 #define WX_DEFINE_ITERATOR_CATEGORY(cat) typedef cat iterator_category;
891 // not defining iterator_category at all in this case is better than defining
892 // it as some dummy type -- at least it results in more intelligible error
894 #define WX_DEFINE_ITERATOR_CATEGORY(cat)
// Defines the members shared by wxString::iterator and
// wxString::const_iterator: the standard iterator typedefs and the
// increment, decrement, arithmetic, difference and comparison operators, all
// implemented by applying wxStringOperations to the underlying wxStringImpl
// iterator m_cur.
//
// iterator_name   name of the class being defined (iterator/const_iterator),
//                 also used to select wxStringImpl::iterator_name
// pointer_type    type exposed as the "pointer" typedef
// reference_type  type exposed as the "reference" typedef
//
// difference_type is ptrdiff_t, the same type that operator+=() and
// operator-=() accept, so that the distance between two iterators is not
// truncated to int on platforms where ptrdiff_t is wider.
//
// The macro intentionally ends without a semicolon after m_cur: it is
// supplied at the point of use.
#define WX_STR_ITERATOR_IMPL(iterator_name, pointer_type, reference_type) \
    private:                                                              \
        typedef wxStringImpl::iterator_name underlying_iterator;          \
    public:                                                               \
        WX_DEFINE_ITERATOR_CATEGORY(WX_STR_ITERATOR_TAG)                  \
        typedef wxUniChar value_type;                                     \
        typedef ptrdiff_t difference_type;                                \
        typedef reference_type reference;                                 \
        typedef pointer_type pointer;                                     \
                                                                          \
        reference operator[](size_t n) const { return *(*this + n); }     \
                                                                          \
        iterator_name& operator++()                                       \
          { wxStringOperations::IncIter(m_cur); return *this; }           \
        iterator_name& operator--()                                       \
          { wxStringOperations::DecIter(m_cur); return *this; }           \
        iterator_name operator++(int)                                     \
        {                                                                 \
            iterator_name tmp = *this;                                    \
            wxStringOperations::IncIter(m_cur);                           \
            return tmp;                                                   \
        }                                                                 \
        iterator_name operator--(int)                                     \
        {                                                                 \
            iterator_name tmp = *this;                                    \
            wxStringOperations::DecIter(m_cur);                           \
            return tmp;                                                   \
        }                                                                 \
                                                                          \
        iterator_name& operator+=(ptrdiff_t n)                            \
        {                                                                 \
            m_cur = wxStringOperations::AddToIter(m_cur, n);              \
            return *this;                                                 \
        }                                                                 \
        iterator_name& operator-=(ptrdiff_t n)                            \
        {                                                                 \
            m_cur = wxStringOperations::AddToIter(m_cur, -n);             \
            return *this;                                                 \
        }                                                                 \
                                                                          \
        difference_type operator-(const iterator_name& i) const           \
          { return wxStringOperations::DiffIters(m_cur, i.m_cur); }       \
                                                                          \
        bool operator==(const iterator_name& i) const                     \
          { return m_cur == i.m_cur; }                                    \
        bool operator!=(const iterator_name& i) const                     \
          { return m_cur != i.m_cur; }                                    \
                                                                          \
        bool operator<(const iterator_name& i) const                      \
          { return m_cur < i.m_cur; }                                     \
        bool operator>(const iterator_name& i) const                      \
          { return m_cur > i.m_cur; }                                     \
        bool operator<=(const iterator_name& i) const                     \
          { return m_cur <= i.m_cur; }                                    \
        bool operator>=(const iterator_name& i) const                     \
          { return m_cur >= i.m_cur; }                                    \
                                                                          \
    private:                                                              \
        /* for internal wxString use only: */                             \
        underlying_iterator impl() const { return m_cur; }                \
                                                                          \
        friend class wxString;                                            \
        friend class wxCStrData;                                          \
                                                                          \
    private:                                                              \
        underlying_iterator m_cur
964 class WXDLLIMPEXP_FWD_BASE const_iterator
;
966 #if wxUSE_UNICODE_UTF8
967 // NB: In UTF-8 build, (non-const) iterator needs to keep reference
968 // to the underlying wxStringImpl, because UTF-8 is variable-length
969 // encoding and changing the value pointed to by an iterator (using
970 // its operator*) requires calling wxStringImpl::replace() if the old
971 // and new values differ in their encoding's length.
973 // Furthermore, the replace() call may invalidate all iterators for the
974 // string, so we have to keep track of outstanding iterators and update
975 // them if replace() happens.
977 // This is implemented by maintaining linked list of iterators for every
978 // string and traversing it in wxUniCharRef::operator=(). Head of the
979 // list is stored in wxString. (FIXME-UTF8)
981 class WXDLLIMPEXP_BASE iterator
983 WX_STR_ITERATOR_IMPL(iterator
, wxChar
*, wxUniCharRef
);
987 iterator(const iterator
& i
)
988 : m_cur(i
.m_cur
), m_node(i
.str(), &m_cur
) {}
989 iterator
& operator=(const iterator
& i
)
994 m_node
.set(i
.str(), &m_cur
);
999 reference
operator*()
1000 { return wxUniCharRef::CreateForString(*str(), m_cur
); }
1002 iterator
operator+(ptrdiff_t n
) const
1003 { return iterator(str(), wxStringOperations::AddToIter(m_cur
, n
)); }
1004 iterator
operator-(ptrdiff_t n
) const
1005 { return iterator(str(), wxStringOperations::AddToIter(m_cur
, -n
)); }
1007 // Normal iterators need to be comparable with the const_iterators so
1008 // declare the comparison operators and implement them below after the
1009 // full const_iterator declaration.
1010 bool operator==(const const_iterator
& i
) const;
1011 bool operator!=(const const_iterator
& i
) const;
1012 bool operator<(const const_iterator
& i
) const;
1013 bool operator>(const const_iterator
& i
) const;
1014 bool operator<=(const const_iterator
& i
) const;
1015 bool operator>=(const const_iterator
& i
) const;
1018 iterator(wxString
*wxstr
, underlying_iterator ptr
)
1019 : m_cur(ptr
), m_node(wxstr
, &m_cur
) {}
1021 wxString
* str() const { return const_cast<wxString
*>(m_node
.m_str
); }
1023 wxStringIteratorNode m_node
;
1025 friend class const_iterator
;
1028 class WXDLLIMPEXP_BASE const_iterator
1030 // NB: reference_type is intentionally value, not reference, the character
1031 // may be encoded differently in wxString data:
1032 WX_STR_ITERATOR_IMPL(const_iterator
, const wxChar
*, wxUniChar
);
1036 const_iterator(const const_iterator
& i
)
1037 : m_cur(i
.m_cur
), m_node(i
.str(), &m_cur
) {}
1038 const_iterator(const iterator
& i
)
1039 : m_cur(i
.m_cur
), m_node(i
.str(), &m_cur
) {}
1041 const_iterator
& operator=(const const_iterator
& i
)
1046 m_node
.set(i
.str(), &m_cur
);
1050 const_iterator
& operator=(const iterator
& i
)
1051 { m_cur
= i
.m_cur
; m_node
.set(i
.str(), &m_cur
); return *this; }
1053 reference
operator*() const
1054 { return wxStringOperations::DecodeChar(m_cur
); }
1056 const_iterator
operator+(ptrdiff_t n
) const
1057 { return const_iterator(str(), wxStringOperations::AddToIter(m_cur
, n
)); }
1058 const_iterator
operator-(ptrdiff_t n
) const
1059 { return const_iterator(str(), wxStringOperations::AddToIter(m_cur
, -n
)); }
1061 // Notice that comparison operators taking non-const iterator are not
1062 // needed here because the implicit conversion from non-const iterators
1063 // to const ones ensures that the versions for const_iterator declared
1064 // inside WX_STR_ITERATOR_IMPL can be used.
1067 // for internal wxString use only:
1068 const_iterator(const wxString
*wxstr
, underlying_iterator ptr
)
1069 : m_cur(ptr
), m_node(wxstr
, &m_cur
) {}
1071 const wxString
* str() const { return m_node
.m_str
; }
1073 wxStringIteratorNode m_node
;
1076 size_t IterToImplPos(wxString::iterator i
) const
1077 { return wxStringImpl::const_iterator(i
.impl()) - m_impl
.begin(); }
1079 iterator
GetIterForNthChar(size_t n
)
1080 { return iterator(this, m_impl
.begin() + PosToImpl(n
)); }
1081 const_iterator
GetIterForNthChar(size_t n
) const
1082 { return const_iterator(this, m_impl
.begin() + PosToImpl(n
)); }
1083 #else // !wxUSE_UNICODE_UTF8
1085 class WXDLLIMPEXP_BASE iterator
1087 WX_STR_ITERATOR_IMPL(iterator
, wxChar
*, wxUniCharRef
);
1091 iterator(const iterator
& i
) : m_cur(i
.m_cur
) {}
1093 reference
operator*()
1094 { return wxUniCharRef::CreateForString(m_cur
); }
1096 iterator
operator+(ptrdiff_t n
) const
1097 { return iterator(wxStringOperations::AddToIter(m_cur
, n
)); }
1098 iterator
operator-(ptrdiff_t n
) const
1099 { return iterator(wxStringOperations::AddToIter(m_cur
, -n
)); }
1101 // As in UTF-8 case above, define comparison operators taking
1102 // const_iterator too.
1103 bool operator==(const const_iterator
& i
) const;
1104 bool operator!=(const const_iterator
& i
) const;
1105 bool operator<(const const_iterator
& i
) const;
1106 bool operator>(const const_iterator
& i
) const;
1107 bool operator<=(const const_iterator
& i
) const;
1108 bool operator>=(const const_iterator
& i
) const;
1111 // for internal wxString use only:
1112 iterator(underlying_iterator ptr
) : m_cur(ptr
) {}
1113 iterator(wxString
*WXUNUSED(str
), underlying_iterator ptr
) : m_cur(ptr
) {}
1115 friend class const_iterator
;
1118 class WXDLLIMPEXP_BASE const_iterator
1120 // NB: reference_type is intentionally value, not reference, the character
1121 // may be encoded differently in wxString data:
1122 WX_STR_ITERATOR_IMPL(const_iterator
, const wxChar
*, wxUniChar
);
1126 const_iterator(const const_iterator
& i
) : m_cur(i
.m_cur
) {}
1127 const_iterator(const iterator
& i
) : m_cur(i
.m_cur
) {}
1129 reference
operator*() const
1130 { return wxStringOperations::DecodeChar(m_cur
); }
1132 const_iterator
operator+(ptrdiff_t n
) const
1133 { return const_iterator(wxStringOperations::AddToIter(m_cur
, n
)); }
1134 const_iterator
operator-(ptrdiff_t n
) const
1135 { return const_iterator(wxStringOperations::AddToIter(m_cur
, -n
)); }
1137 // As in UTF-8 case above, we don't need comparison operators taking
1138 // iterator because we have an implicit conversion from iterator to
1139 // const_iterator so the operators declared by WX_STR_ITERATOR_IMPL will
1143 // for internal wxString use only:
1144 const_iterator(underlying_iterator ptr
) : m_cur(ptr
) {}
1145 const_iterator(const wxString
*WXUNUSED(str
), underlying_iterator ptr
)
1149 iterator
GetIterForNthChar(size_t n
) { return begin() + n
; }
1150 const_iterator
GetIterForNthChar(size_t n
) const { return begin() + n
; }
1151 #endif // wxUSE_UNICODE_UTF8/!wxUSE_UNICODE_UTF8
1153 #undef WX_STR_ITERATOR_TAG
1154 #undef WX_STR_ITERATOR_IMPL
1156 friend class iterator
;
1157 friend class const_iterator
;
1159 template <typename T
>
1160 class reverse_iterator_impl
1163 typedef T iterator_type
;
1165 WX_DEFINE_ITERATOR_CATEGORY(typename
T::iterator_category
)
1166 typedef typename
T::value_type value_type
;
1167 typedef typename
T::difference_type difference_type
;
1168 typedef typename
T::reference reference
;
1169 typedef typename
T::pointer
*pointer
;
1171 reverse_iterator_impl() {}
1172 reverse_iterator_impl(iterator_type i
) : m_cur(i
) {}
1173 reverse_iterator_impl(const reverse_iterator_impl
& ri
)
1174 : m_cur(ri
.m_cur
) {}
1176 iterator_type
base() const { return m_cur
; }
1178 reference
operator*() const { return *(m_cur
-1); }
1179 reference
operator[](size_t n
) const { return *(*this + n
); }
1181 reverse_iterator_impl
& operator++()
1182 { --m_cur
; return *this; }
1183 reverse_iterator_impl
operator++(int)
1184 { reverse_iterator_impl tmp
= *this; --m_cur
; return tmp
; }
1185 reverse_iterator_impl
& operator--()
1186 { ++m_cur
; return *this; }
1187 reverse_iterator_impl
operator--(int)
1188 { reverse_iterator_impl tmp
= *this; ++m_cur
; return tmp
; }
1190 // NB: explicit <T> in the functions below is to keep BCC 5.5 happy
1191 reverse_iterator_impl
operator+(ptrdiff_t n
) const
1192 { return reverse_iterator_impl
<T
>(m_cur
- n
); }
1193 reverse_iterator_impl
operator-(ptrdiff_t n
) const
1194 { return reverse_iterator_impl
<T
>(m_cur
+ n
); }
1195 reverse_iterator_impl
operator+=(ptrdiff_t n
)
1196 { m_cur
-= n
; return *this; }
1197 reverse_iterator_impl
operator-=(ptrdiff_t n
)
1198 { m_cur
+= n
; return *this; }
1200 unsigned operator-(const reverse_iterator_impl
& i
) const
1201 { return i
.m_cur
- m_cur
; }
1203 bool operator==(const reverse_iterator_impl
& ri
) const
1204 { return m_cur
== ri
.m_cur
; }
1205 bool operator!=(const reverse_iterator_impl
& ri
) const
1206 { return !(*this == ri
); }
1208 bool operator<(const reverse_iterator_impl
& i
) const
1209 { return m_cur
> i
.m_cur
; }
1210 bool operator>(const reverse_iterator_impl
& i
) const
1211 { return m_cur
< i
.m_cur
; }
1212 bool operator<=(const reverse_iterator_impl
& i
) const
1213 { return m_cur
>= i
.m_cur
; }
1214 bool operator>=(const reverse_iterator_impl
& i
) const
1215 { return m_cur
<= i
.m_cur
; }
1218 iterator_type m_cur
;
1221 typedef reverse_iterator_impl
<iterator
> reverse_iterator
;
1222 typedef reverse_iterator_impl
<const_iterator
> const_reverse_iterator
;
1225 // used to transform an expression built using c_str() (and hence of type
1226 // wxCStrData) to an iterator into the string
1227 static const_iterator
CreateConstIterator(const wxCStrData
& data
)
1229 return const_iterator(data
.m_str
,
1230 (data
.m_str
->begin() + data
.m_offset
).impl());
1233 // in UTF-8 STL build, creation from std::string requires conversion under
1234 // non-UTF8 locales, so we can't have and use wxString(wxStringImpl) ctor;
1235 // instead we define dummy type that lets us have wxString ctor for creation
1236 // from wxStringImpl that couldn't be used by user code (in all other builds,
1237 // "standard" ctors can be used):
1238 #if wxUSE_UNICODE_UTF8 && wxUSE_STL_BASED_WXSTRING
1239 struct CtorFromStringImplTag
{};
1241 wxString(CtorFromStringImplTag
* WXUNUSED(dummy
), const wxStringImpl
& src
)
1244 static wxString
FromImpl(const wxStringImpl
& src
)
1245 { return wxString((CtorFromStringImplTag
*)NULL
, src
); }
1247 #if !wxUSE_STL_BASED_WXSTRING
1248 wxString(const wxStringImpl
& src
) : m_impl(src
) { }
1249 // else: already defined as wxString(wxStdString) below
1251 static wxString
FromImpl(const wxStringImpl
& src
) { return wxString(src
); }
1255 // constructors and destructor
1256 // ctor for an empty string
1260 wxString(const wxString
& stringSrc
) : m_impl(stringSrc
.m_impl
) { }
1262 // string containing nRepeat copies of ch
1263 wxString(wxUniChar ch
, size_t nRepeat
= 1 )
1264 { assign(nRepeat
, ch
); }
1265 wxString(size_t nRepeat
, wxUniChar ch
)
1266 { assign(nRepeat
, ch
); }
1267 wxString(wxUniCharRef ch
, size_t nRepeat
= 1)
1268 { assign(nRepeat
, ch
); }
1269 wxString(size_t nRepeat
, wxUniCharRef ch
)
1270 { assign(nRepeat
, ch
); }
1271 wxString(char ch
, size_t nRepeat
= 1)
1272 { assign(nRepeat
, ch
); }
1273 wxString(size_t nRepeat
, char ch
)
1274 { assign(nRepeat
, ch
); }
1275 wxString(wchar_t ch
, size_t nRepeat
= 1)
1276 { assign(nRepeat
, ch
); }
1277 wxString(size_t nRepeat
, wchar_t ch
)
1278 { assign(nRepeat
, ch
); }
1280 // ctors from char* strings:
1281 wxString(const char *psz
)
1282 : m_impl(ImplStr(psz
)) {}
1283 wxString(const char *psz
, const wxMBConv
& conv
)
1284 : m_impl(ImplStr(psz
, conv
)) {}
1285 wxString(const char *psz
, size_t nLength
)
1286 { assign(psz
, nLength
); }
1287 wxString(const char *psz
, const wxMBConv
& conv
, size_t nLength
)
1289 SubstrBufFromMB
str(ImplStr(psz
, nLength
, conv
));
1290 m_impl
.assign(str
.data
, str
.len
);
1293 // and unsigned char*:
1294 wxString(const unsigned char *psz
)
1295 : m_impl(ImplStr((const char*)psz
)) {}
1296 wxString(const unsigned char *psz
, const wxMBConv
& conv
)
1297 : m_impl(ImplStr((const char*)psz
, conv
)) {}
1298 wxString(const unsigned char *psz
, size_t nLength
)
1299 { assign((const char*)psz
, nLength
); }
1300 wxString(const unsigned char *psz
, const wxMBConv
& conv
, size_t nLength
)
1302 SubstrBufFromMB
str(ImplStr((const char*)psz
, nLength
, conv
));
1303 m_impl
.assign(str
.data
, str
.len
);
1306 // ctors from wchar_t* strings:
1307 wxString(const wchar_t *pwz
)
1308 : m_impl(ImplStr(pwz
)) {}
1309 wxString(const wchar_t *pwz
, const wxMBConv
& WXUNUSED(conv
))
1310 : m_impl(ImplStr(pwz
)) {}
1311 wxString(const wchar_t *pwz
, size_t nLength
)
1312 { assign(pwz
, nLength
); }
1313 wxString(const wchar_t *pwz
, const wxMBConv
& WXUNUSED(conv
), size_t nLength
)
1314 { assign(pwz
, nLength
); }
1316 wxString(const wxScopedCharBuffer
& buf
)
1317 { assign(buf
.data(), buf
.length()); }
1318 wxString(const wxScopedWCharBuffer
& buf
)
1319 { assign(buf
.data(), buf
.length()); }
1321 // NB: this version uses m_impl.c_str() to force making a copy of the
1322 // string, so that "wxString(str.c_str())" idiom for passing strings
1323 // between threads works
1324 wxString(const wxCStrData
& cstr
)
1325 : m_impl(cstr
.AsString().m_impl
.c_str()) { }
1327 // as we provide both ctors with this signature for both char and unsigned
1328 // char string, we need to provide one for wxCStrData to resolve ambiguity
1329 wxString(const wxCStrData
& cstr
, size_t nLength
)
1330 : m_impl(cstr
.AsString().Mid(0, nLength
).m_impl
) {}
1332 // and because wxString is convertible to wxCStrData and const wxChar *
1333 // we also need to provide this one
1334 wxString(const wxString
& str
, size_t nLength
)
1335 { assign(str
, nLength
); }
1338 #if wxUSE_STRING_POS_CACHE
1341 // we need to invalidate our cache entry as another string could be
1342 // recreated at the same address (unlikely, but still possible, with the
1343 // heap-allocated strings but perfectly common with stack-allocated ones)
1346 #endif // wxUSE_STRING_POS_CACHE
1348 // even if we're not built with wxUSE_STL == 1 it is very convenient to allow
1349 // implicit conversions from std::string to wxString and vice versa as this
1350 // allows using the same strings in non-GUI and GUI code, however we don't
1351 // want to unconditionally add this ctor as it would make wx lib dependent on
1352 // libstdc++ on some Linux versions which is bad, so instead we ask the
1353 // client code to define this wxUSE_STD_STRING symbol if they need it
1354 #if wxUSE_STD_STRING
1355 #if wxUSE_UNICODE_WCHAR
1356 wxString(const wxStdWideString
& str
) : m_impl(str
) {}
1357 #else // UTF-8 or ANSI
1358 wxString(const wxStdWideString
& str
)
1359 { assign(str
.c_str(), str
.length()); }
1362 #if !wxUSE_UNICODE // ANSI build
1363 // FIXME-UTF8: do this in UTF8 build #if wxUSE_UTF8_LOCALE_ONLY, too
1364 wxString(const std::string
& str
) : m_impl(str
) {}
1366 wxString(const std::string
& str
)
1367 { assign(str
.c_str(), str
.length()); }
1369 #endif // wxUSE_STD_STRING
1371 // Unlike ctor from std::string, we provide conversion to std::string only
1372 // if wxUSE_STL and not merely wxUSE_STD_STRING (which is on by default),
1373 // because it conflicts with operator const char/wchar_t* but we still
1374 // provide explicit conversions to std::[w]string for convenience in any case
1375 #if wxUSE_STD_STRING
1376 // We can avoid a copy if we already use this string type internally,
1377 // otherwise we create a copy on the fly:
1378 #if wxUSE_UNICODE_WCHAR && wxUSE_STL_BASED_WXSTRING
1379 #define wxStringToStdWstringRetType const wxStdWideString&
1380 const wxStdWideString
& ToStdWstring() const { return m_impl
; }
1382 // wxStringImpl is either not std::string or needs conversion
1383 #define wxStringToStdWstringRetType wxStdWideString
1384 wxStdWideString
ToStdWstring() const
1386 #if wxUSE_UNICODE_WCHAR
1387 wxScopedWCharBuffer buf
=
1388 wxScopedWCharBuffer::CreateNonOwned(m_impl
.c_str(), m_impl
.length());
1389 #else // !wxUSE_UNICODE_WCHAR
1390 wxScopedWCharBuffer
buf(wc_str());
1393 return wxStdWideString(buf
.data(), buf
.length());
1397 #if (!wxUSE_UNICODE || wxUSE_UTF8_LOCALE_ONLY) && wxUSE_STL_BASED_WXSTRING
1398 // wxStringImpl is std::string in the encoding we want
1399 #define wxStringToStdStringRetType const std::string&
1400 const std::string
& ToStdString() const { return m_impl
; }
1402 // wxStringImpl is either not std::string or needs conversion
1403 #define wxStringToStdStringRetType std::string
1404 std::string
ToStdString() const
1406 wxScopedCharBuffer
buf(mb_str());
1407 return std::string(buf
.data(), buf
.length());
1412 // In wxUSE_STL case we also provide implicit conversions as there is no
1413 // ambiguity with the const char/wchar_t* ones as they are disabled in this
1414 // build (for consistency with std::basic_string<>)
1415 operator wxStringToStdStringRetType() const { return ToStdString(); }
1416 operator wxStringToStdWstringRetType() const { return ToStdWstring(); }
1419 #undef wxStringToStdStringRetType
1420 #undef wxStringToStdWstringRetType
1422 #endif // wxUSE_STD_STRING
1424 wxString
Clone() const
1426 // make a deep copy of the string, i.e. the returned string will have
1427 // ref count = 1 with refcounted implementation
1428 return wxString::FromImpl(wxStringImpl(m_impl
.c_str(), m_impl
.length()));
1431 // first valid index position
1432 const_iterator
begin() const { return const_iterator(this, m_impl
.begin()); }
1433 iterator
begin() { return iterator(this, m_impl
.begin()); }
1434 // position one after the last valid one
1435 const_iterator
end() const { return const_iterator(this, m_impl
.end()); }
1436 iterator
end() { return iterator(this, m_impl
.end()); }
1438 // first element of the reversed string
1439 const_reverse_iterator
rbegin() const
1440 { return const_reverse_iterator(end()); }
1441 reverse_iterator
rbegin()
1442 { return reverse_iterator(end()); }
1443 // one beyond the end of the reversed string
1444 const_reverse_iterator
rend() const
1445 { return const_reverse_iterator(begin()); }
1446 reverse_iterator
rend()
1447 { return reverse_iterator(begin()); }
1449 // std::string methods:
1450 #if wxUSE_UNICODE_UTF8
1451 size_t length() const
1453 #if wxUSE_STRING_POS_CACHE
1454 wxCACHE_PROFILE_FIELD_INC(lentot
);
1456 Cache::Element
* const cache
= GetCacheElement();
1458 if ( cache
->len
== npos
)
1460 // it's probably not worth trying to be clever and using cache->pos
1461 // here as it's probably 0 anyhow -- you usually call length() before
1462 // starting to index the string
1463 cache
->len
= end() - begin();
1467 wxCACHE_PROFILE_FIELD_INC(lenhits
);
1469 wxSTRING_CACHE_ASSERT( (int)cache
->len
== end() - begin() );
1473 #else // !wxUSE_STRING_POS_CACHE
1474 return end() - begin();
1475 #endif // wxUSE_STRING_POS_CACHE/!wxUSE_STRING_POS_CACHE
1478 size_t length() const { return m_impl
.length(); }
1481 size_type
size() const { return length(); }
1482 size_type
max_size() const { return npos
; }
1484 bool empty() const { return m_impl
.empty(); }
1486 // NB: these methods don't have a well-defined meaning in UTF-8 case
1487 size_type
capacity() const { return m_impl
.capacity(); }
1488 void reserve(size_t sz
) { m_impl
.reserve(sz
); }
1490 void resize(size_t nSize
, wxUniChar ch
= wxT('\0'))
1492 const size_t len
= length();
1496 #if wxUSE_UNICODE_UTF8
1499 wxSTRING_INVALIDATE_CACHE();
1501 // we can't use wxStringImpl::resize() for truncating the string as it
1502 // counts in bytes, not characters
1507 // we also can't use (presumably more efficient) resize() if we have to
1508 // append characters taking more than one byte
1509 if ( !ch
.IsAscii() )
1511 append(nSize
- len
, ch
);
1513 else // can use (presumably faster) resize() version
1514 #endif // wxUSE_UNICODE_UTF8
1516 wxSTRING_INVALIDATE_CACHED_LENGTH();
1518 m_impl
.resize(nSize
, (wxStringCharType
)ch
);
1522 wxString
substr(size_t nStart
= 0, size_t nLen
= npos
) const
1525 PosLenToImpl(nStart
, nLen
, &pos
, &len
);
1526 return FromImpl(m_impl
.substr(pos
, len
));
1529 // generic attributes & operations
1530 // as standard strlen()
1531 size_t Len() const { return length(); }
1532 // string contains any characters?
1533 bool IsEmpty() const { return empty(); }
1534 // empty string is "false", so !str will return true
1535 bool operator!() const { return empty(); }
1536 // truncate the string to given length
1537 wxString
& Truncate(size_t uiLen
);
1538 // empty string contents
1539 void Empty() { clear(); }
1540 // empty the string and free memory
1541 void Clear() { clear(); }
1544 // Is an ascii value
1545 bool IsAscii() const;
1547 bool IsNumber() const;
1549 bool IsWord() const;
1551 // data access (all indexes are 0 based)
1553 wxUniChar
at(size_t n
) const
1554 { return wxStringOperations::DecodeChar(m_impl
.begin() + PosToImpl(n
)); }
1555 wxUniChar
GetChar(size_t n
) const
1557 // read/write access
1558 wxUniCharRef
at(size_t n
)
1559 { return *GetIterForNthChar(n
); }
1560 wxUniCharRef
GetWritableChar(size_t n
)
1563 void SetChar(size_t n
, wxUniChar ch
)
1566 // get last character
1567 wxUniChar
Last() const
1569 wxASSERT_MSG( !empty(), wxT("wxString: index out of bounds") );
1573 // get writable last character
1576 wxASSERT_MSG( !empty(), wxT("wxString: index out of bounds") );
1581 Note that we must define all of the overloads below to avoid
1582 ambiguity when using str[0].
1584 wxUniChar
operator[](int n
) const
1586 wxUniChar
operator[](long n
) const
1588 wxUniChar
operator[](size_t n
) const
1590 #ifndef wxSIZE_T_IS_UINT
1591 wxUniChar
operator[](unsigned int n
) const
1593 #endif // size_t != unsigned int
1595 // operator versions of GetWritableChar()
1596 wxUniCharRef
operator[](int n
)
1598 wxUniCharRef
operator[](long n
)
1600 wxUniCharRef
operator[](size_t n
)
1602 #ifndef wxSIZE_T_IS_UINT
1603 wxUniCharRef
operator[](unsigned int n
)
1605 #endif // size_t != unsigned int
1609 Overview of wxString conversions, implicit and explicit:
1611 - wxString has a std::[w]string-like c_str() method, however it does
1612 not return a C-style string directly but instead returns wxCStrData
1613 helper object which is convertible to either "char *" narrow string
1614 or "wchar_t *" wide string. Usually the correct conversion will be
1615 applied by the compiler automatically but if this doesn't happen you
1616 need to explicitly choose one using wxCStrData::AsChar() or AsWChar()
1617 methods or another wxString conversion function.
1619 - One of the places where the conversion does *NOT* happen correctly is
1620 when c_str() is passed to a vararg function such as printf() so you
1621 must *NOT* use c_str() with them. Either use wxPrintf() (all wx
1622 functions do handle c_str() correctly, even if they appear to be
1623 vararg (but they're not, really)) or add an explicit AsChar() or, if
1624 compatibility with previous wxWidgets versions is important, add a
1625 cast to "const char *".
1627 - In non-STL mode only, wxString is also implicitly convertible to
1628 wxCStrData. The same warning as above applies.
1630 - c_str() is polymorphic as it can be converted to either narrow or
1631 wide string. If you explicitly need one or the other, choose to use
1632 mb_str() (for narrow) or wc_str() (for wide) instead. Notice that
1633 these functions can return either the pointer to string directly (if
1634 this is what the string uses internally) or a temporary buffer
1635 containing the string and convertible to it. Again, conversion will
1636 usually be done automatically by the compiler but beware of the
1637 vararg functions: you need an explicit cast when using them.
1639 - There are also non-const versions of mb_str() and wc_str() called
1640 char_str() and wchar_str(). They are only meant to be used with
1641 non-const-correct functions and they always return buffers.
1643 - Finally wx_str() returns whatever string representation is used by
1644 wxString internally. It may be either a narrow or wide string
1645 depending on wxWidgets build mode but it will always be a raw pointer
1649 // explicit conversion to wxCStrData
1650 wxCStrData
c_str() const { return wxCStrData(this); }
1651 wxCStrData
data() const { return c_str(); }
1653 // implicit conversion to wxCStrData
1654 operator wxCStrData() const { return c_str(); }
1656 // the first two operators conflict with operators for conversion to
1657 // std::string and they must be disabled in STL build; the next one only
1658 // makes sense if conversions to char* are also defined and not defining it
1659 // in STL build also helps us to get more clear error messages for the code
1660 // which relies on implicit conversion to char* in STL build
1662 operator const char*() const { return c_str(); }
1663 operator const wchar_t*() const { return c_str(); }
1665 // implicit conversion to untyped pointer for compatibility with previous
1666 // wxWidgets versions: this is the same as conversion to const char * so it
1668 operator const void*() const { return c_str(); }
1671 // identical to c_str(), for MFC compatibility
1672 const wxCStrData
GetData() const { return c_str(); }
1674 // explicit conversion to C string in internal representation (char*,
1675 // wchar_t*, UTF-8-encoded char*, depending on the build):
1676 const wxStringCharType
*wx_str() const { return m_impl
.c_str(); }
1678 // conversion to *non-const* multibyte or widestring buffer; modifying
1679 // returned buffer won't affect the string, these methods are only useful
1680 // for passing values to const-incorrect functions
1681 wxWritableCharBuffer
char_str(const wxMBConv
& conv
= wxConvLibc
) const
1682 { return mb_str(conv
); }
1683 wxWritableWCharBuffer
wchar_str() const { return wc_str(); }
1685 // conversion to the buffer of the given type T (= char or wchar_t) and
1686 // also optionally return the buffer length
1688 // this is mostly/only useful for the template functions
1690 // FIXME-VC6: the second argument only exists for VC6 which doesn't support
1691 // explicit template function selection, do not use it unless
1692 // you must support VC6!
1693 template <typename T
>
1694 wxCharTypeBuffer
<T
> tchar_str(size_t *len
= NULL
,
1695 T
* WXUNUSED(dummy
) = NULL
) const
1698 // we need a helper dispatcher depending on type
1699 return wxPrivate::wxStringAsBufHelper
<T
>::Get(*this, len
);
1701 // T can only be char in ANSI build
1705 return wxCharTypeBuffer
<T
>::CreateNonOwned(wx_str(), length());
1706 #endif // Unicode build kind
1709 // conversion to/from plain (i.e. 7 bit) ASCII: this is useful for
1710 // converting numbers or strings which are certain not to contain special
1711 // chars (typically system functions, X atoms, environment variables etc.)
1713 // the behaviour of these functions with the strings containing anything
1714 // else than 7 bit ASCII characters is undefined, use at your own risk.
1716 static wxString
FromAscii(const char *ascii
, size_t len
);
1717 static wxString
FromAscii(const char *ascii
);
1718 static wxString
FromAscii(char ascii
);
1719 const wxScopedCharBuffer
ToAscii() const;
1721 static wxString
FromAscii(const char *ascii
) { return wxString( ascii
); }
1722 static wxString
FromAscii(const char *ascii
, size_t len
)
1723 { return wxString( ascii
, len
); }
1724 static wxString
FromAscii(char ascii
) { return wxString( ascii
); }
1725 const char *ToAscii() const { return c_str(); }
1726 #endif // Unicode/!Unicode
1728 // also provide unsigned char overloads as signed/unsigned doesn't matter
1729 // for 7 bit ASCII characters
1730 static wxString
FromAscii(const unsigned char *ascii
)
1731 { return FromAscii((const char *)ascii
); }
1732 static wxString
FromAscii(const unsigned char *ascii
, size_t len
)
1733 { return FromAscii((const char *)ascii
, len
); }
1735 // conversion to/from UTF-8:
1736 #if wxUSE_UNICODE_UTF8
1737 static wxString
FromUTF8Unchecked(const char *utf8
)
1740 return wxEmptyString
;
1742 wxASSERT( wxStringOperations::IsValidUtf8String(utf8
) );
1743 return FromImpl(wxStringImpl(utf8
));
1745 static wxString
FromUTF8Unchecked(const char *utf8
, size_t len
)
1748 return wxEmptyString
;
1750 return FromUTF8Unchecked(utf8
);
1752 wxASSERT( wxStringOperations::IsValidUtf8String(utf8
, len
) );
1753 return FromImpl(wxStringImpl(utf8
, len
));
1756 static wxString
FromUTF8(const char *utf8
)
1758 if ( !utf8
|| !wxStringOperations::IsValidUtf8String(utf8
) )
1761 return FromImpl(wxStringImpl(utf8
));
1763 static wxString
FromUTF8(const char *utf8
, size_t len
)
1766 return FromUTF8(utf8
);
1768 if ( !utf8
|| !wxStringOperations::IsValidUtf8String(utf8
, len
) )
1771 return FromImpl(wxStringImpl(utf8
, len
));
1774 const wxScopedCharBuffer
utf8_str() const
1775 { return wxCharBuffer::CreateNonOwned(m_impl
.c_str(), m_impl
.length()); }
1777 // this function exists in UTF-8 build only and returns the length of the
1778 // internal UTF-8 representation
1779 size_t utf8_length() const { return m_impl
.length(); }
1780 #elif wxUSE_UNICODE_WCHAR
1781 static wxString
FromUTF8(const char *utf8
, size_t len
= npos
)
1782 { return wxString(utf8
, wxMBConvUTF8(), len
); }
1783 static wxString
FromUTF8Unchecked(const char *utf8
, size_t len
= npos
)
1785 const wxString
s(utf8
, wxMBConvUTF8(), len
);
1786 wxASSERT_MSG( !utf8
|| !*utf8
|| !s
.empty(),
1787 "string must be valid UTF-8" );
1790 const wxScopedCharBuffer
utf8_str() const { return mb_str(wxMBConvUTF8()); }
1792 static wxString
FromUTF8(const char *utf8
)
1793 { return wxString(wxMBConvUTF8().cMB2WC(utf8
)); }
1794 static wxString
FromUTF8(const char *utf8
, size_t len
)
1797 wxScopedWCharBuffer
buf(wxMBConvUTF8().cMB2WC(utf8
, len
== npos
? wxNO_LEN
: len
, &wlen
));
1798 return wxString(buf
.data(), wlen
);
1800 static wxString
FromUTF8Unchecked(const char *utf8
, size_t len
= npos
)
1803 wxScopedWCharBuffer buf
1805 wxMBConvUTF8().cMB2WC
1808 len
== npos
? wxNO_LEN
: len
,
1812 wxASSERT_MSG( !utf8
|| !*utf8
|| wlen
,
1813 "string must be valid UTF-8" );
1815 return wxString(buf
.data(), wlen
);
1817 const wxScopedCharBuffer
utf8_str() const
1818 { return wxMBConvUTF8().cWC2MB(wc_str()); }
1821 const wxScopedCharBuffer
ToUTF8() const { return utf8_str(); }
1823 // functions for storing binary data in wxString:
1825 static wxString
From8BitData(const char *data
, size_t len
)
1826 { return wxString(data
, wxConvISO8859_1
, len
); }
1827 // version for NUL-terminated data:
1828 static wxString
From8BitData(const char *data
)
1829 { return wxString(data
, wxConvISO8859_1
); }
1830 const wxScopedCharBuffer
To8BitData() const
1831 { return mb_str(wxConvISO8859_1
); }
1833 static wxString
From8BitData(const char *data
, size_t len
)
1834 { return wxString(data
, len
); }
1835 // version for NUL-terminated data:
1836 static wxString
From8BitData(const char *data
)
1837 { return wxString(data
); }
1838 const wxScopedCharBuffer
To8BitData() const
1839 { return wxScopedCharBuffer::CreateNonOwned(wx_str(), length()); }
1840 #endif // Unicode/ANSI
1842 // conversions with (possible) format conversions: have to return a
1843 // buffer with temporary data
1845 // the functions defined (in either Unicode or ANSI mode) are mb_str() to
1846 // return an ANSI (multibyte) string, wc_str() to return a wide string and
1847 // fn_str() to return a string which should be used with the OS APIs
1848 // accepting the file names. The return value is always the same, but the
1849 // type differs because a function may either return pointer to the buffer
1850 // directly or have to use intermediate buffer for translation.
1854 // this is an optimization: even though using mb_str(wxConvLibc) does the
1855 // same thing (i.e. returns pointer to internal representation as locale is
1856 // always an UTF-8 one) in wxUSE_UTF8_LOCALE_ONLY case, we can avoid the
1857 // extra checks and the temporary buffer construction by providing a
1858 // separate mb_str() overload
1859 #if wxUSE_UTF8_LOCALE_ONLY
1860 const char* mb_str() const { return wx_str(); }
1861 const wxScopedCharBuffer
mb_str(const wxMBConv
& conv
) const
1863 return AsCharBuf(conv
);
1865 #else // !wxUSE_UTF8_LOCALE_ONLY
1866 const wxScopedCharBuffer
mb_str(const wxMBConv
& conv
= wxConvLibc
) const
1868 return AsCharBuf(conv
);
1870 #endif // wxUSE_UTF8_LOCALE_ONLY/!wxUSE_UTF8_LOCALE_ONLY
1872 const wxWX2MBbuf
mbc_str() const { return mb_str(*wxConvCurrent
); }
1874 #if wxUSE_UNICODE_WCHAR
1875 const wchar_t* wc_str() const { return wx_str(); }
1876 #elif wxUSE_UNICODE_UTF8
1877 const wxScopedWCharBuffer
wc_str() const
1878 { return AsWCharBuf(wxMBConvStrictUTF8()); }
1880 // for compatibility with !wxUSE_UNICODE version
1881 const wxWX2WCbuf
wc_str(const wxMBConv
& WXUNUSED(conv
)) const
1882 { return wc_str(); }
1885 const wxScopedCharBuffer
fn_str() const { return mb_str(wxConvFile
); }
1887 const wxWX2WCbuf
fn_str() const { return wc_str(); }
1888 #endif // wxMBFILES/!wxMBFILES
1891 const char* mb_str() const { return wx_str(); }
1893 // for compatibility with wxUSE_UNICODE version
1894 const char* mb_str(const wxMBConv
& WXUNUSED(conv
)) const { return wx_str(); }
1896 const wxWX2MBbuf
mbc_str() const { return mb_str(); }
1898 const wxScopedWCharBuffer
wc_str(const wxMBConv
& conv
= wxConvLibc
) const
1899 { return AsWCharBuf(conv
); }
1901 const wxScopedCharBuffer
fn_str() const
1902 { return wxConvFile
.cWC2WX( wc_str( wxConvLibc
) ); }
1903 #endif // Unicode/ANSI
1905 #if wxUSE_UNICODE_UTF8
1906 const wxScopedWCharBuffer
t_str() const { return wc_str(); }
1907 #elif wxUSE_UNICODE_WCHAR
1908 const wchar_t* t_str() const { return wx_str(); }
1910 const char* t_str() const { return wx_str(); }
1914 // overloaded assignment
1915 // from another wxString
1916 wxString
& operator=(const wxString
& stringSrc
)
1918 if ( this != &stringSrc
)
1920 wxSTRING_INVALIDATE_CACHE();
1922 m_impl
= stringSrc
.m_impl
;
1928 wxString
& operator=(const wxCStrData
& cstr
)
1929 { return *this = cstr
.AsString(); }
1931 wxString
& operator=(wxUniChar ch
)
1933 wxSTRING_INVALIDATE_CACHE();
1935 #if wxUSE_UNICODE_UTF8
1936 if ( !ch
.IsAscii() )
1937 m_impl
= wxStringOperations::EncodeChar(ch
);
1939 #endif // wxUSE_UNICODE_UTF8
1940 m_impl
= (wxStringCharType
)ch
;
1944 wxString
& operator=(wxUniCharRef ch
)
1945 { return operator=((wxUniChar
)ch
); }
1946 wxString
& operator=(char ch
)
1947 { return operator=(wxUniChar(ch
)); }
1948 wxString
& operator=(unsigned char ch
)
1949 { return operator=(wxUniChar(ch
)); }
1950 wxString
& operator=(wchar_t ch
)
1951 { return operator=(wxUniChar(ch
)); }
1952 // from a C string - STL probably will crash on NULL,
1953 // so we need to compensate in that case
1954 #if wxUSE_STL_BASED_WXSTRING
1955 wxString
& operator=(const char *psz
)
1957 wxSTRING_INVALIDATE_CACHE();
1960 m_impl
= ImplStr(psz
);
1967 wxString
& operator=(const wchar_t *pwz
)
1969 wxSTRING_INVALIDATE_CACHE();
1972 m_impl
= ImplStr(pwz
);
1978 #else // !wxUSE_STL_BASED_WXSTRING
1979 wxString
& operator=(const char *psz
)
1981 wxSTRING_INVALIDATE_CACHE();
1983 m_impl
= ImplStr(psz
);
1988 wxString
& operator=(const wchar_t *pwz
)
1990 wxSTRING_INVALIDATE_CACHE();
1992 m_impl
= ImplStr(pwz
);
1996 #endif // wxUSE_STL_BASED_WXSTRING/!wxUSE_STL_BASED_WXSTRING
1998 wxString
& operator=(const unsigned char *psz
)
1999 { return operator=((const char*)psz
); }
2001 // from wxScopedWCharBuffer
2002 wxString
& operator=(const wxScopedWCharBuffer
& s
)
2003 { return assign(s
); }
2004 // from wxScopedCharBuffer
2005 wxString
& operator=(const wxScopedCharBuffer
& s
)
2006 { return assign(s
); }
2008 // string concatenation
2009 // in place concatenation
2011 Concatenate and return the result. Note that the left to right
2012 associativity of << allows to write things like "str << str1 << str2
2013 << ..." (unlike with +=)
2016 wxString
& operator<<(const wxString
& s
)
2018 #if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
2019 wxASSERT_MSG( s
.IsValid(),
2020 wxT("did you forget to call UngetWriteBuf()?") );
2026 // string += C string
2027 wxString
& operator<<(const char *psz
)
2028 { append(psz
); return *this; }
2029 wxString
& operator<<(const wchar_t *pwz
)
2030 { append(pwz
); return *this; }
2031 wxString
& operator<<(const wxCStrData
& psz
)
2032 { append(psz
.AsString()); return *this; }
2034 wxString
& operator<<(wxUniChar ch
) { append(1, ch
); return *this; }
2035 wxString
& operator<<(wxUniCharRef ch
) { append(1, ch
); return *this; }
2036 wxString
& operator<<(char ch
) { append(1, ch
); return *this; }
2037 wxString
& operator<<(unsigned char ch
) { append(1, ch
); return *this; }
2038 wxString
& operator<<(wchar_t ch
) { append(1, ch
); return *this; }
2040 // string += buffer (i.e. from wxGetString)
2041 wxString
& operator<<(const wxScopedWCharBuffer
& s
)
2042 { return append(s
); }
2043 wxString
& operator<<(const wxScopedCharBuffer
& s
)
2044 { return append(s
); }
2046 // string += C string
2047 wxString
& Append(const wxString
& s
)
2049 // test for empty() to share the string if possible
2056 wxString
& Append(const char* psz
)
2057 { append(psz
); return *this; }
2058 wxString
& Append(const wchar_t* pwz
)
2059 { append(pwz
); return *this; }
2060 wxString
& Append(const wxCStrData
& psz
)
2061 { append(psz
); return *this; }
2062 wxString
& Append(const wxScopedCharBuffer
& psz
)
2063 { append(psz
); return *this; }
2064 wxString
& Append(const wxScopedWCharBuffer
& psz
)
2065 { append(psz
); return *this; }
2066 wxString
& Append(const char* psz
, size_t nLen
)
2067 { append(psz
, nLen
); return *this; }
2068 wxString
& Append(const wchar_t* pwz
, size_t nLen
)
2069 { append(pwz
, nLen
); return *this; }
2070 wxString
& Append(const wxCStrData
& psz
, size_t nLen
)
2071 { append(psz
, nLen
); return *this; }
2072 wxString
& Append(const wxScopedCharBuffer
& psz
, size_t nLen
)
2073 { append(psz
, nLen
); return *this; }
2074 wxString
& Append(const wxScopedWCharBuffer
& psz
, size_t nLen
)
2075 { append(psz
, nLen
); return *this; }
2076 // append count copies of given character
2077 wxString
& Append(wxUniChar ch
, size_t count
= 1u)
2078 { append(count
, ch
); return *this; }
2079 wxString
& Append(wxUniCharRef ch
, size_t count
= 1u)
2080 { append(count
, ch
); return *this; }
2081 wxString
& Append(char ch
, size_t count
= 1u)
2082 { append(count
, ch
); return *this; }
2083 wxString
& Append(unsigned char ch
, size_t count
= 1u)
2084 { append(count
, ch
); return *this; }
2085 wxString
& Append(wchar_t ch
, size_t count
= 1u)
2086 { append(count
, ch
); return *this; }
2088 // prepend a string, return the string itself
2089 wxString
& Prepend(const wxString
& str
)
2090 { *this = str
+ *this; return *this; }
2092 // non-destructive concatenation
2094 friend wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string1
,
2095 const wxString
& string2
);
2096 // string with a single char
2097 friend wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string
, wxUniChar ch
);
2098 // char with a string
2099 friend wxString WXDLLIMPEXP_BASE
operator+(wxUniChar ch
, const wxString
& string
);
2100 // string with C string
2101 friend wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string
,
2103 friend wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string
,
2104 const wchar_t *pwz
);
2105 // C string with string
2106 friend wxString WXDLLIMPEXP_BASE
operator+(const char *psz
,
2107 const wxString
& string
);
2108 friend wxString WXDLLIMPEXP_BASE
operator+(const wchar_t *pwz
,
2109 const wxString
& string
);
2111 // stream-like functions
2112 // insert an int into string
2113 wxString
& operator<<(int i
)
2114 { return (*this) << Format(wxT("%d"), i
); }
2115 // insert an unsigned int into string
2116 wxString
& operator<<(unsigned int ui
)
2117 { return (*this) << Format(wxT("%u"), ui
); }
2118 // insert a long into string
2119 wxString
& operator<<(long l
)
2120 { return (*this) << Format(wxT("%ld"), l
); }
2121 // insert an unsigned long into string
2122 wxString
& operator<<(unsigned long ul
)
2123 { return (*this) << Format(wxT("%lu"), ul
); }
2124 #ifdef wxHAS_LONG_LONG_T_DIFFERENT_FROM_LONG
2125 // insert a long long if they exist and aren't longs
2126 wxString
& operator<<(wxLongLong_t ll
)
2128 return (*this) << Format("%" wxLongLongFmtSpec
"d", ll
);
2130 // insert an unsigned long long
2131 wxString
& operator<<(wxULongLong_t ull
)
2133 return (*this) << Format("%" wxLongLongFmtSpec
"u" , ull
);
2135 #endif // wxHAS_LONG_LONG_T_DIFFERENT_FROM_LONG
2136 // insert a float into string
2137 wxString
& operator<<(float f
)
2138 { return (*this) << Format(wxT("%f"), f
); }
2139 // insert a double into string
2140 wxString
& operator<<(double d
)
2141 { return (*this) << Format(wxT("%g"), d
); }
2143 // string comparison
2144 // case-sensitive comparison (returns a value < 0, = 0 or > 0)
2145 int Cmp(const char *psz
) const
2146 { return compare(psz
); }
2147 int Cmp(const wchar_t *pwz
) const
2148 { return compare(pwz
); }
2149 int Cmp(const wxString
& s
) const
2150 { return compare(s
); }
2151 int Cmp(const wxCStrData
& s
) const
2152 { return compare(s
); }
2153 int Cmp(const wxScopedCharBuffer
& s
) const
2154 { return compare(s
); }
2155 int Cmp(const wxScopedWCharBuffer
& s
) const
2156 { return compare(s
); }
2157 // same as Cmp() but not case-sensitive
2158 int CmpNoCase(const wxString
& s
) const;
2160 // test for the string equality, either considering case or not
2161 // (if compareWithCase then the case matters)
2162 bool IsSameAs(const wxString
& str
, bool compareWithCase
= true) const
2164 #if !wxUSE_UNICODE_UTF8
2165 // in UTF-8 build, length() is O(n) and doing this would be _slower_
2166 if ( length() != str
.length() )
2169 return (compareWithCase
? Cmp(str
) : CmpNoCase(str
)) == 0;
2171 bool IsSameAs(const char *str
, bool compareWithCase
= true) const
2172 { return (compareWithCase
? Cmp(str
) : CmpNoCase(str
)) == 0; }
2173 bool IsSameAs(const wchar_t *str
, bool compareWithCase
= true) const
2174 { return (compareWithCase
? Cmp(str
) : CmpNoCase(str
)) == 0; }
2176 bool IsSameAs(const wxCStrData
& str
, bool compareWithCase
= true) const
2177 { return IsSameAs(str
.AsString(), compareWithCase
); }
2178 bool IsSameAs(const wxScopedCharBuffer
& str
, bool compareWithCase
= true) const
2179 { return IsSameAs(str
.data(), compareWithCase
); }
2180 bool IsSameAs(const wxScopedWCharBuffer
& str
, bool compareWithCase
= true) const
2181 { return IsSameAs(str
.data(), compareWithCase
); }
2182 // comparison with a single character: returns true if equal
2183 bool IsSameAs(wxUniChar c
, bool compareWithCase
= true) const;
2184 // FIXME-UTF8: remove these overloads
2185 bool IsSameAs(wxUniCharRef c
, bool compareWithCase
= true) const
2186 { return IsSameAs(wxUniChar(c
), compareWithCase
); }
2187 bool IsSameAs(char c
, bool compareWithCase
= true) const
2188 { return IsSameAs(wxUniChar(c
), compareWithCase
); }
2189 bool IsSameAs(unsigned char c
, bool compareWithCase
= true) const
2190 { return IsSameAs(wxUniChar(c
), compareWithCase
); }
2191 bool IsSameAs(wchar_t c
, bool compareWithCase
= true) const
2192 { return IsSameAs(wxUniChar(c
), compareWithCase
); }
2193 bool IsSameAs(int c
, bool compareWithCase
= true) const
2194 { return IsSameAs(wxUniChar(c
), compareWithCase
); }
2196 // simple sub-string extraction
2197 // return substring starting at nFirst of length nCount (or till the end
2198 // if nCount = default value)
2199 wxString
Mid(size_t nFirst
, size_t nCount
= npos
) const;
2201 // operator version of Mid()
2202 wxString
operator()(size_t start
, size_t len
) const
2203 { return Mid(start
, len
); }
2205 // check if the string starts with the given prefix and return the rest
2206 // of the string in the provided pointer if it is not NULL; otherwise return false
2208 bool StartsWith(const wxString
& prefix
, wxString
*rest
= NULL
) const;
2209 // check if the string ends with the given suffix and return the
2210 // beginning of the string before the suffix in the provided pointer if
2211 // it is not NULL; otherwise return false
2212 bool EndsWith(const wxString
& suffix
, wxString
*rest
= NULL
) const;
2214 // get first nCount characters
2215 wxString
Left(size_t nCount
) const;
2216 // get last nCount characters
2217 wxString
Right(size_t nCount
) const;
2218 // get all characters before the first occurrence of ch
2219 // (returns the whole string if ch not found) and also put everything
2220 // following the first occurrence of ch into rest if it's non-NULL
2221 wxString
BeforeFirst(wxUniChar ch
, wxString
*rest
= NULL
) const;
2222 // get all characters before the last occurrence of ch
2223 // (returns empty string if ch not found) and also put everything
2224 // following the last occurrence of ch into rest if it's non-NULL
2225 wxString
BeforeLast(wxUniChar ch
, wxString
*rest
= NULL
) const;
2226 // get all characters after the first occurrence of ch
2227 // (returns empty string if ch not found)
2228 wxString
AfterFirst(wxUniChar ch
) const;
2229 // get all characters after the last occurrence of ch
2230 // (returns the whole string if ch not found)
2231 wxString
AfterLast(wxUniChar ch
) const;
2233 // for compatibility only, use more explicitly named functions above
2234 wxString
Before(wxUniChar ch
) const { return BeforeLast(ch
); }
2235 wxString
After(wxUniChar ch
) const { return AfterFirst(ch
); }
2238 // convert to upper case in place, return the string itself
2239 wxString
& MakeUpper();
2240 // convert to upper case, return the copy of the string
2241 wxString
Upper() const { return wxString(*this).MakeUpper(); }
2242 // convert to lower case in place, return the string itself
2243 wxString
& MakeLower();
2244 // convert to lower case, return the copy of the string
2245 wxString
Lower() const { return wxString(*this).MakeLower(); }
2246 // convert the first character to the upper case and the rest to the
2247 // lower one, return the modified string itself
2248 wxString
& MakeCapitalized();
2249 // convert the first character to the upper case and the rest to the
2250 // lower one, return the copy of the string
2251 wxString
Capitalize() const { return wxString(*this).MakeCapitalized(); }
2253 // trimming/padding whitespace (either side) and truncating
2254 // remove spaces from left or from right (default) side
2255 wxString
& Trim(bool bFromRight
= true);
2256 // add nCount copies chPad in the beginning or at the end (default)
2257 wxString
& Pad(size_t nCount
, wxUniChar chPad
= wxT(' '), bool bFromRight
= true);
2259 // searching and replacing
2260 // searching (return starting index, or -1 if not found)
2261 int Find(wxUniChar ch
, bool bFromEnd
= false) const; // like strchr/strrchr
2262 int Find(wxUniCharRef ch
, bool bFromEnd
= false) const
2263 { return Find(wxUniChar(ch
), bFromEnd
); }
2264 int Find(char ch
, bool bFromEnd
= false) const
2265 { return Find(wxUniChar(ch
), bFromEnd
); }
2266 int Find(unsigned char ch
, bool bFromEnd
= false) const
2267 { return Find(wxUniChar(ch
), bFromEnd
); }
2268 int Find(wchar_t ch
, bool bFromEnd
= false) const
2269 { return Find(wxUniChar(ch
), bFromEnd
); }
2270 // searching (return starting index, or -1 if not found)
2271 int Find(const wxString
& sub
) const // like strstr
2273 size_type idx
= find(sub
);
2274 return (idx
== npos
) ? wxNOT_FOUND
: (int)idx
;
2276 int Find(const char *sub
) const // like strstr
2278 size_type idx
= find(sub
);
2279 return (idx
== npos
) ? wxNOT_FOUND
: (int)idx
;
2281 int Find(const wchar_t *sub
) const // like strstr
2283 size_type idx
= find(sub
);
2284 return (idx
== npos
) ? wxNOT_FOUND
: (int)idx
;
2287 int Find(const wxCStrData
& sub
) const
2288 { return Find(sub
.AsString()); }
2289 int Find(const wxScopedCharBuffer
& sub
) const
2290 { return Find(sub
.data()); }
2291 int Find(const wxScopedWCharBuffer
& sub
) const
2292 { return Find(sub
.data()); }
2294 // replace first (or all of bReplaceAll) occurrences of substring with
2295 // another string, returns the number of replacements made
2296 size_t Replace(const wxString
& strOld
,
2297 const wxString
& strNew
,
2298 bool bReplaceAll
= true);
2300 // check if the string contents matches a mask containing '*' and '?'
2301 bool Matches(const wxString
& mask
) const;
2303 // conversion to numbers: all functions return true only if the whole
2304 // string is a number and put the value of this number into the pointer
2305 // provided, the base is the numeric base in which the conversion should be
2306 // done and must be comprised between 2 and 36 or be 0 in which case the
2307 // standard C rules apply (leading '0' => octal, "0x" => hex)
2308 // convert to a signed integer
2309 bool ToLong(long *val
, int base
= 10) const;
2310 // convert to an unsigned integer
2311 bool ToULong(unsigned long *val
, int base
= 10) const;
2312 // convert to wxLongLong
2313 #if defined(wxLongLong_t)
2314 bool ToLongLong(wxLongLong_t
*val
, int base
= 10) const;
2315 // convert to wxULongLong
2316 bool ToULongLong(wxULongLong_t
*val
, int base
= 10) const;
2317 #endif // wxLongLong_t
2318 // convert to a double
2319 bool ToDouble(double *val
) const;
2321 // conversions to numbers using C locale
2322 // convert to a signed integer
2323 bool ToCLong(long *val
, int base
= 10) const;
2324 // convert to an unsigned integer
2325 bool ToCULong(unsigned long *val
, int base
= 10) const;
2326 // convert to a double
2327 bool ToCDouble(double *val
) const;
2329 // create a string representing the given floating point number
2330 // in the current locale
2331 static wxString
FromDouble(double val
)
2332 { return wxString::Format(wxS("%g"), val
); }
2334 static wxString
FromCDouble(double val
);
2336 #ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
2337 // formatted input/output
2338 // as sprintf(), returns the number of characters written or < 0 on error
2339 // (take 'this' into account in attribute parameter count)
2340 // int Printf(const wxString& format, ...);
2341 WX_DEFINE_VARARG_FUNC(int, Printf
, 1, (const wxFormatString
&),
2342 DoPrintfWchar
, DoPrintfUtf8
)
2344 // workaround for http://bugzilla.openwatcom.org/show_bug.cgi?id=351
2345 WX_VARARG_WATCOM_WORKAROUND(int, Printf
, 1, (const wxString
&),
2346 (wxFormatString(f1
)));
2347 WX_VARARG_WATCOM_WORKAROUND(int, Printf
, 1, (const wxCStrData
&),
2348 (wxFormatString(f1
)));
2349 WX_VARARG_WATCOM_WORKAROUND(int, Printf
, 1, (const char*),
2350 (wxFormatString(f1
)));
2351 WX_VARARG_WATCOM_WORKAROUND(int, Printf
, 1, (const wchar_t*),
2352 (wxFormatString(f1
)));
2354 #endif // !wxNEEDS_WXSTRING_PRINTF_MIXIN
2355 // as vprintf(), returns the number of characters written or < 0 on error
2356 int PrintfV(const wxString
& format
, va_list argptr
);
2358 #ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
2359 // returns the string containing the result of Printf() to it
2360 // static wxString Format(const wxString& format, ...) WX_ATTRIBUTE_PRINTF_1;
2361 WX_DEFINE_VARARG_FUNC(static wxString
, Format
, 1, (const wxFormatString
&),
2362 DoFormatWchar
, DoFormatUtf8
)
2364 // workaround for http://bugzilla.openwatcom.org/show_bug.cgi?id=351
2365 WX_VARARG_WATCOM_WORKAROUND(static wxString
, Format
, 1, (const wxString
&),
2366 (wxFormatString(f1
)));
2367 WX_VARARG_WATCOM_WORKAROUND(static wxString
, Format
, 1, (const wxCStrData
&),
2368 (wxFormatString(f1
)));
2369 WX_VARARG_WATCOM_WORKAROUND(static wxString
, Format
, 1, (const char*),
2370 (wxFormatString(f1
)));
2371 WX_VARARG_WATCOM_WORKAROUND(static wxString
, Format
, 1, (const wchar_t*),
2372 (wxFormatString(f1
)));
2375 // the same as above, but takes a va_list
2376 static wxString
FormatV(const wxString
& format
, va_list argptr
);
2378 // raw access to string memory
2379 // ensure that string has space for at least nLen characters
2380 // only works if the data of this string is not shared
2381 bool Alloc(size_t nLen
) { reserve(nLen
); return capacity() >= nLen
; }
2382 // minimize the string's memory
2383 // only works if the data of this string is not shared
2385 #if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
2386 // These are deprecated, use wxStringBuffer or wxStringBufferLength instead
2388 // get writable buffer of at least nLen bytes. Unget() *must* be called
2389 // a.s.a.p. to put string back in a reasonable state!
2390 wxDEPRECATED( wxStringCharType
*GetWriteBuf(size_t nLen
) );
2391 // call this immediately after GetWriteBuf() has been used
2392 wxDEPRECATED( void UngetWriteBuf() );
2393 wxDEPRECATED( void UngetWriteBuf(size_t nLen
) );
2394 #endif // WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
2396 // wxWidgets version 1 compatibility functions
2399 wxString
SubString(size_t from
, size_t to
) const
2400 { return Mid(from
, (to
- from
+ 1)); }
// values for second parameter of CompareTo function
enum caseCompare
{
    exact,
    ignoreCase
};

// values for first parameter of Strip function; both is the combination of
// the leading and trailing bits
enum stripType
{
    leading = 0x1,
    trailing = 0x2,
    both = 0x3
};
2406 #ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
2408 // (take 'this' into account in attribute parameter count)
2409 // int sprintf(const wxString& format, ...) WX_ATTRIBUTE_PRINTF_2;
2410 WX_DEFINE_VARARG_FUNC(int, sprintf
, 1, (const wxFormatString
&),
2411 DoPrintfWchar
, DoPrintfUtf8
)
2413 // workaround for http://bugzilla.openwatcom.org/show_bug.cgi?id=351
2414 WX_VARARG_WATCOM_WORKAROUND(int, sprintf
, 1, (const wxString
&),
2415 (wxFormatString(f1
)));
2416 WX_VARARG_WATCOM_WORKAROUND(int, sprintf
, 1, (const wxCStrData
&),
2417 (wxFormatString(f1
)));
2418 WX_VARARG_WATCOM_WORKAROUND(int, sprintf
, 1, (const char*),
2419 (wxFormatString(f1
)));
2420 WX_VARARG_WATCOM_WORKAROUND(int, sprintf
, 1, (const wchar_t*),
2421 (wxFormatString(f1
)));
2423 #endif // wxNEEDS_WXSTRING_PRINTF_MIXIN
2426 int CompareTo(const wxChar
* psz
, caseCompare cmp
= exact
) const
2427 { return cmp
== exact
? Cmp(psz
) : CmpNoCase(psz
); }
2430 size_t Length() const { return length(); }
2431 // Count the number of characters
2432 int Freq(wxUniChar ch
) const;
2434 void LowerCase() { MakeLower(); }
2436 void UpperCase() { MakeUpper(); }
2437 // use Trim except that it doesn't change this string
2438 wxString
Strip(stripType w
= trailing
) const;
2440 // use Find (more general variants not yet supported)
2441 size_t Index(const wxChar
* psz
) const { return Find(psz
); }
2442 size_t Index(wxUniChar ch
) const { return Find(ch
); }
2444 wxString
& Remove(size_t pos
) { return Truncate(pos
); }
2445 wxString
& RemoveLast(size_t n
= 1) { return Truncate(length() - n
); }
2447 wxString
& Remove(size_t nStart
, size_t nLen
)
2448 { return (wxString
&)erase( nStart
, nLen
); }
2451 int First( wxUniChar ch
) const { return Find(ch
); }
2452 int First( wxUniCharRef ch
) const { return Find(ch
); }
2453 int First( char ch
) const { return Find(ch
); }
2454 int First( unsigned char ch
) const { return Find(ch
); }
2455 int First( wchar_t ch
) const { return Find(ch
); }
2456 int First( const wxString
& str
) const { return Find(str
); }
2457 int Last( wxUniChar ch
) const { return Find(ch
, true); }
2458 bool Contains(const wxString
& str
) const { return Find(str
) != wxNOT_FOUND
; }
2461 bool IsNull() const { return empty(); }
2463 // std::string compatibility functions
2465 // take nLen chars starting at nPos
2466 wxString(const wxString
& str
, size_t nPos
, size_t nLen
)
2467 { assign(str
, nPos
, nLen
); }
2468 // take all characters from first to last
2469 wxString(const_iterator first
, const_iterator last
)
2470 : m_impl(first
.impl(), last
.impl()) { }
2471 #if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2472 // the 2 overloads below are for compatibility with the existing code using
2473 // pointers instead of iterators
2474 wxString(const char *first
, const char *last
)
2476 SubstrBufFromMB
str(ImplStr(first
, last
- first
));
2477 m_impl
.assign(str
.data
, str
.len
);
2479 wxString(const wchar_t *first
, const wchar_t *last
)
2481 SubstrBufFromWC
str(ImplStr(first
, last
- first
));
2482 m_impl
.assign(str
.data
, str
.len
);
2484 // and this one is needed to compile code adding offsets to c_str() result
2485 wxString(const wxCStrData
& first
, const wxCStrData
& last
)
2486 : m_impl(CreateConstIterator(first
).impl(),
2487 CreateConstIterator(last
).impl())
2489 wxASSERT_MSG( first
.m_str
== last
.m_str
,
2490 wxT("pointers must be into the same string") );
2492 #endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2494 // lib.string.modifiers
2495 // append elements str[pos], ..., str[pos+n]
2496 wxString
& append(const wxString
& str
, size_t pos
, size_t n
)
2498 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2501 str
.PosLenToImpl(pos
, n
, &from
, &len
);
2502 m_impl
.append(str
.m_impl
, from
, len
);
2506 wxString
& append(const wxString
& str
)
2508 wxSTRING_UPDATE_CACHED_LENGTH(str
.length());
2510 m_impl
.append(str
.m_impl
);
2514 // append first n (or all if n == npos) characters of sz
2515 wxString
& append(const char *sz
)
2517 wxSTRING_INVALIDATE_CACHED_LENGTH();
2519 m_impl
.append(ImplStr(sz
));
2523 wxString
& append(const wchar_t *sz
)
2525 wxSTRING_INVALIDATE_CACHED_LENGTH();
2527 m_impl
.append(ImplStr(sz
));
2531 wxString
& append(const char *sz
, size_t n
)
2533 wxSTRING_INVALIDATE_CACHED_LENGTH();
2535 SubstrBufFromMB
str(ImplStr(sz
, n
));
2536 m_impl
.append(str
.data
, str
.len
);
2539 wxString
& append(const wchar_t *sz
, size_t n
)
2541 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2543 SubstrBufFromWC
str(ImplStr(sz
, n
));
2544 m_impl
.append(str
.data
, str
.len
);
2548 wxString
& append(const wxCStrData
& str
)
2549 { return append(str
.AsString()); }
2550 wxString
& append(const wxScopedCharBuffer
& str
)
2551 { return append(str
.data(), str
.length()); }
2552 wxString
& append(const wxScopedWCharBuffer
& str
)
2553 { return append(str
.data(), str
.length()); }
2554 wxString
& append(const wxCStrData
& str
, size_t n
)
2555 { return append(str
.AsString(), 0, n
); }
2556 wxString
& append(const wxScopedCharBuffer
& str
, size_t n
)
2557 { return append(str
.data(), n
); }
2558 wxString
& append(const wxScopedWCharBuffer
& str
, size_t n
)
2559 { return append(str
.data(), n
); }
2561 // append n copies of ch
2562 wxString
& append(size_t n
, wxUniChar ch
)
2564 #if wxUSE_UNICODE_UTF8
2565 if ( !ch
.IsAscii() )
2567 wxSTRING_INVALIDATE_CACHED_LENGTH();
2569 m_impl
.append(wxStringOperations::EncodeNChars(n
, ch
));
2574 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2576 m_impl
.append(n
, (wxStringCharType
)ch
);
2582 wxString
& append(size_t n
, wxUniCharRef ch
)
2583 { return append(n
, wxUniChar(ch
)); }
2584 wxString
& append(size_t n
, char ch
)
2585 { return append(n
, wxUniChar(ch
)); }
2586 wxString
& append(size_t n
, unsigned char ch
)
2587 { return append(n
, wxUniChar(ch
)); }
2588 wxString
& append(size_t n
, wchar_t ch
)
2589 { return append(n
, wxUniChar(ch
)); }
2591 // append from first to last
2592 wxString
& append(const_iterator first
, const_iterator last
)
2594 wxSTRING_INVALIDATE_CACHED_LENGTH();
2596 m_impl
.append(first
.impl(), last
.impl());
2599 #if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2600 wxString
& append(const char *first
, const char *last
)
2601 { return append(first
, last
- first
); }
2602 wxString
& append(const wchar_t *first
, const wchar_t *last
)
2603 { return append(first
, last
- first
); }
2604 wxString
& append(const wxCStrData
& first
, const wxCStrData
& last
)
2605 { return append(CreateConstIterator(first
), CreateConstIterator(last
)); }
2606 #endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2608 // same as `this_string = str'
2609 wxString
& assign(const wxString
& str
)
2611 wxSTRING_SET_CACHED_LENGTH(str
.length());
2613 m_impl
= str
.m_impl
;
2618 wxString
& assign(const wxString
& str
, size_t len
)
2620 wxSTRING_SET_CACHED_LENGTH(len
);
2622 m_impl
.assign(str
.m_impl
, 0, str
.LenToImpl(len
));
2627 // same as ` = str[pos..pos + n]
2628 wxString
& assign(const wxString
& str
, size_t pos
, size_t n
)
2631 str
.PosLenToImpl(pos
, n
, &from
, &len
);
2632 m_impl
.assign(str
.m_impl
, from
, len
);
2634 // it's important to call this after PosLenToImpl() above in case str is
2635 // the same string as this one
2636 wxSTRING_SET_CACHED_LENGTH(n
);
2641 // same as `= first n (or all if n == npos) characters of sz'
2642 wxString
& assign(const char *sz
)
2644 wxSTRING_INVALIDATE_CACHE();
2646 m_impl
.assign(ImplStr(sz
));
2651 wxString
& assign(const wchar_t *sz
)
2653 wxSTRING_INVALIDATE_CACHE();
2655 m_impl
.assign(ImplStr(sz
));
2660 wxString
& assign(const char *sz
, size_t n
)
2662 wxSTRING_SET_CACHED_LENGTH(n
);
2664 SubstrBufFromMB
str(ImplStr(sz
, n
));
2665 m_impl
.assign(str
.data
, str
.len
);
2670 wxString
& assign(const wchar_t *sz
, size_t n
)
2672 wxSTRING_SET_CACHED_LENGTH(n
);
2674 SubstrBufFromWC
str(ImplStr(sz
, n
));
2675 m_impl
.assign(str
.data
, str
.len
);
2680 wxString
& assign(const wxCStrData
& str
)
2681 { return assign(str
.AsString()); }
2682 wxString
& assign(const wxScopedCharBuffer
& str
)
2683 { return assign(str
.data(), str
.length()); }
2684 wxString
& assign(const wxScopedWCharBuffer
& str
)
2685 { return assign(str
.data(), str
.length()); }
2686 wxString
& assign(const wxCStrData
& str
, size_t len
)
2687 { return assign(str
.AsString(), len
); }
2688 wxString
& assign(const wxScopedCharBuffer
& str
, size_t len
)
2689 { return assign(str
.data(), len
); }
2690 wxString
& assign(const wxScopedWCharBuffer
& str
, size_t len
)
2691 { return assign(str
.data(), len
); }
2693 // same as `= n copies of ch'
2694 wxString
& assign(size_t n
, wxUniChar ch
)
2696 wxSTRING_SET_CACHED_LENGTH(n
);
2698 #if wxUSE_UNICODE_UTF8
2699 if ( !ch
.IsAscii() )
2700 m_impl
.assign(wxStringOperations::EncodeNChars(n
, ch
));
2703 m_impl
.assign(n
, (wxStringCharType
)ch
);
2708 wxString
& assign(size_t n
, wxUniCharRef ch
)
2709 { return assign(n
, wxUniChar(ch
)); }
2710 wxString
& assign(size_t n
, char ch
)
2711 { return assign(n
, wxUniChar(ch
)); }
2712 wxString
& assign(size_t n
, unsigned char ch
)
2713 { return assign(n
, wxUniChar(ch
)); }
2714 wxString
& assign(size_t n
, wchar_t ch
)
2715 { return assign(n
, wxUniChar(ch
)); }
2717 // assign from first to last
2718 wxString
& assign(const_iterator first
, const_iterator last
)
2720 wxSTRING_INVALIDATE_CACHE();
2722 m_impl
.assign(first
.impl(), last
.impl());
2726 #if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2727 wxString
& assign(const char *first
, const char *last
)
2728 { return assign(first
, last
- first
); }
2729 wxString
& assign(const wchar_t *first
, const wchar_t *last
)
2730 { return assign(first
, last
- first
); }
2731 wxString
& assign(const wxCStrData
& first
, const wxCStrData
& last
)
2732 { return assign(CreateConstIterator(first
), CreateConstIterator(last
)); }
2733 #endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2735 // string comparison
2736 int compare(const wxString
& str
) const;
2737 int compare(const char* sz
) const;
2738 int compare(const wchar_t* sz
) const;
2739 int compare(const wxCStrData
& str
) const
2740 { return compare(str
.AsString()); }
2741 int compare(const wxScopedCharBuffer
& str
) const
2742 { return compare(str
.data()); }
2743 int compare(const wxScopedWCharBuffer
& str
) const
2744 { return compare(str
.data()); }
2745 // comparison with a substring
2746 int compare(size_t nStart
, size_t nLen
, const wxString
& str
) const;
2747 // comparison of 2 substrings
2748 int compare(size_t nStart
, size_t nLen
,
2749 const wxString
& str
, size_t nStart2
, size_t nLen2
) const;
2750 // substring comparison with first nCount characters of sz
2751 int compare(size_t nStart
, size_t nLen
,
2752 const char* sz
, size_t nCount
= npos
) const;
2753 int compare(size_t nStart
, size_t nLen
,
2754 const wchar_t* sz
, size_t nCount
= npos
) const;
2756 // insert another string
2757 wxString
& insert(size_t nPos
, const wxString
& str
)
2758 { insert(GetIterForNthChar(nPos
), str
.begin(), str
.end()); return *this; }
2759 // insert n chars of str starting at nStart (in str)
// Inserts at nPos the n characters of str that start at nStart.
//
// Calls wxSTRING_UPDATE_CACHED_LENGTH(n), asks str to translate
// (nStart, n) into implementation units via PosLenToImpl() and passes the
// result (from, len) to m_impl.insert() at PosToImpl(nPos).
// NOTE(review): the braces, the declaration of from/len and the return
// statement are not visible in this excerpt.
2760 wxString
& insert(size_t nPos
, const wxString
& str
, size_t nStart
, size_t n
)
2762 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2765 str
.PosLenToImpl(nStart
, n
, &from
, &len
);
2766 m_impl
.insert(PosToImpl(nPos
), str
.m_impl
, from
, len
);
2771 // insert first n (or all if n == npos) characters of sz
// Inserts a C string (narrow and wide variants) at nPos: both overloads call
// wxSTRING_INVALIDATE_CACHE() and insert ImplStr(sz) into m_impl at
// PosToImpl(nPos).
// NOTE(review): the braces (and, for the char* overload, the return
// statement) are not visible in this excerpt.
2772 wxString
& insert(size_t nPos
, const char *sz
)
2774 wxSTRING_INVALIDATE_CACHE();
2776 m_impl
.insert(PosToImpl(nPos
), ImplStr(sz
));
2781 wxString
& insert(size_t nPos
, const wchar_t *sz
)
2783 wxSTRING_INVALIDATE_CACHE();
2785 m_impl
.insert(PosToImpl(nPos
), ImplStr(sz
)); return *this;
// Inserts at nPos a C string together with a count n (narrow and wide
// variants).
//
// Both overloads call wxSTRING_UPDATE_CACHED_LENGTH(n), build a
// SubstrBufFromMB / SubstrBufFromWC from ImplStr(sz, n) and insert its
// data/len pair into m_impl at PosToImpl(nPos).
// NOTE(review): the braces and return statements are not visible in this
// excerpt.
2788 wxString
& insert(size_t nPos
, const char *sz
, size_t n
)
2790 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2792 SubstrBufFromMB
str(ImplStr(sz
, n
));
2793 m_impl
.insert(PosToImpl(nPos
), str
.data
, str
.len
);
2798 wxString
& insert(size_t nPos
, const wchar_t *sz
, size_t n
)
2800 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2802 SubstrBufFromWC
str(ImplStr(sz
, n
));
2803 m_impl
.insert(PosToImpl(nPos
), str
.data
, str
.len
);
2808 // insert n copies of ch
// Inserts n copies of ch at nPos.
//
// Calls wxSTRING_UPDATE_CACHED_LENGTH(n); under wxUSE_UNICODE_UTF8 a
// non-ASCII ch is inserted as wxStringOperations::EncodeNChars(n, ch), and
// the other visible call inserts n copies of ch cast to wxStringCharType.
// NOTE(review): the braces, the else/#endif separating the two calls and the
// return statement are not visible in this excerpt.
2809 wxString
& insert(size_t nPos
, size_t n
, wxUniChar ch
)
2811 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2813 #if wxUSE_UNICODE_UTF8
2814 if ( !ch
.IsAscii() )
2815 m_impl
.insert(PosToImpl(nPos
), wxStringOperations::EncodeNChars(n
, ch
));
2818 m_impl
.insert(PosToImpl(nPos
), n
, (wxStringCharType
)ch
);
// Inserts the single character ch at iterator it and returns an iterator
// built from the result.
//
// Calls wxSTRING_UPDATE_CACHED_LENGTH(1). Under wxUSE_UNICODE_UTF8 a
// non-ASCII ch is inserted by implementation position (IterToImplPos(it)) as
// wxStringOperations::EncodeChar(ch), and the returned iterator is rebuilt
// from m_impl.begin() + pos. The other visible path wraps the iterator
// returned by m_impl.insert(it.impl(), ch).
// NOTE(review): the braces and the else/#endif lines are not visible in this
// excerpt.
2822 iterator
insert(iterator it
, wxUniChar ch
)
2824 wxSTRING_UPDATE_CACHED_LENGTH(1);
2826 #if wxUSE_UNICODE_UTF8
2827 if ( !ch
.IsAscii() )
2829 size_t pos
= IterToImplPos(it
);
2830 m_impl
.insert(pos
, wxStringOperations::EncodeChar(ch
));
2831 return iterator(this, m_impl
.begin() + pos
);
2835 return iterator(this, m_impl
.insert(it
.impl(), (wxStringCharType
)ch
));
// Inserts the range [first, last) at iterator it: calls
// wxSTRING_INVALIDATE_CACHE() and forwards the three underlying
// implementation iterators to m_impl.insert().
// NOTE(review): the braces are not visible in this excerpt.
2838 void insert(iterator it
, const_iterator first
, const_iterator last
)
2840 wxSTRING_INVALIDATE_CACHE();
2842 m_impl
.insert(it
.impl(), first
.impl(), last
.impl());
2845 #if WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
2846 void insert(iterator it
, const char *first
, const char *last
)
2847 { insert(it
- begin(), first
, last
- first
); }
2848 void insert(iterator it
, const wchar_t *first
, const wchar_t *last
)
2849 { insert(it
- begin(), first
, last
- first
); }
2850 void insert(iterator it
, const wxCStrData
& first
, const wxCStrData
& last
)
2851 { insert(it
, CreateConstIterator(first
), CreateConstIterator(last
)); }
2852 #endif // WXWIN_COMPATIBILITY_STRING_PTR_AS_ITER
// Inserts n copies of ch at iterator it.
//
// Calls wxSTRING_UPDATE_CACHED_LENGTH(n); under wxUSE_UNICODE_UTF8 a
// non-ASCII ch is inserted at IterToImplPos(it) as
// wxStringOperations::EncodeNChars(n, ch), and the other visible call inserts
// n copies of ch cast to wxStringCharType at it.impl().
// NOTE(review): the braces and the else/#endif lines are not visible in this
// excerpt.
2854 void insert(iterator it
, size_type n
, wxUniChar ch
)
2856 wxSTRING_UPDATE_CACHED_LENGTH(n
);
2858 #if wxUSE_UNICODE_UTF8
2859 if ( !ch
.IsAscii() )
2860 m_impl
.insert(IterToImplPos(it
), wxStringOperations::EncodeNChars(n
, ch
));
2863 m_impl
.insert(it
.impl(), n
, (wxStringCharType
)ch
);
2866 // delete n characters starting at position pos
// Erases by position and count: calls wxSTRING_INVALIDATE_CACHE(), converts
// (pos, n) to implementation units with PosLenToImpl() and passes the result
// (from, len) to m_impl.erase().
// NOTE(review): the braces, the declaration of from/len and the return
// statement are not visible in this excerpt.
2867 wxString
& erase(size_type pos
= 0, size_type n
= npos
)
2869 wxSTRING_INVALIDATE_CACHE();
2872 PosLenToImpl(pos
, n
, &from
, &len
);
2873 m_impl
.erase(from
, len
);
2878 // delete characters from first up to last
// Erases the iterator range given by first and last: calls
// wxSTRING_INVALIDATE_CACHE() and wraps the iterator returned by
// m_impl.erase() in a wxString iterator.
// NOTE(review): the braces are not visible in this excerpt.
2879 iterator
erase(iterator first
, iterator last
)
2881 wxSTRING_INVALIDATE_CACHE();
2883 return iterator(this, m_impl
.erase(first
.impl(), last
.impl()));
// Erases at the single iterator first: calls
// wxSTRING_UPDATE_CACHED_LENGTH(-1) and wraps the iterator returned by
// m_impl.erase() in a wxString iterator.
// NOTE(review): the braces are not visible in this excerpt.
2886 iterator
erase(iterator first
)
2888 wxSTRING_UPDATE_CACHED_LENGTH(-1);
2890 return iterator(this, m_impl
.erase(first
.impl()));
2893 #ifdef wxSTRING_BASE_HASNT_CLEAR
2894 void clear() { erase(); }
2898 wxSTRING_SET_CACHED_LENGTH(0);
2904 // replaces the substring of length nLen starting at nStart
// Replaces the substring (nStart, nLen) with a C string (narrow and wide
// variants).
//
// Both overloads call wxSTRING_INVALIDATE_CACHE(), convert (nStart, nLen) to
// implementation units with PosLenToImpl() and call
// m_impl.replace(from, len, ImplStr(sz)).
// NOTE(review): the braces, the declaration of from/len and the return
// statements are not visible in this excerpt.
2905 wxString
& replace(size_t nStart
, size_t nLen
, const char* sz
)
2907 wxSTRING_INVALIDATE_CACHE();
2910 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2911 m_impl
.replace(from
, len
, ImplStr(sz
));
2916 wxString
& replace(size_t nStart
, size_t nLen
, const wchar_t* sz
)
2918 wxSTRING_INVALIDATE_CACHE();
2921 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2922 m_impl
.replace(from
, len
, ImplStr(sz
));
2927 // replaces the substring of length nLen starting at nStart
// Replaces the substring (nStart, nLen) with the whole of str: calls
// wxSTRING_INVALIDATE_CACHE(), converts (nStart, nLen) with PosLenToImpl()
// and calls m_impl.replace(from, len, str.m_impl).
// NOTE(review): the braces, the declaration of from/len and the return
// statement are not visible in this excerpt.
2928 wxString
& replace(size_t nStart
, size_t nLen
, const wxString
& str
)
2930 wxSTRING_INVALIDATE_CACHE();
2933 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2934 m_impl
.replace(from
, len
, str
.m_impl
);
2939 // replaces the substring with nCount copies of ch
// Replaces the substring (nStart, nLen) with nCount copies of ch.
//
// Calls wxSTRING_INVALIDATE_CACHE() and PosLenToImpl(); under
// wxUSE_UNICODE_UTF8 a non-ASCII ch is substituted as
// wxStringOperations::EncodeNChars(nCount, ch), and the other visible call
// passes nCount and ch cast to wxStringCharType to m_impl.replace().
// NOTE(review): the braces, the declaration of from/len, the else/#endif
// lines and the return statement are not visible in this excerpt.
2940 wxString
& replace(size_t nStart
, size_t nLen
, size_t nCount
, wxUniChar ch
)
2942 wxSTRING_INVALIDATE_CACHE();
2945 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2946 #if wxUSE_UNICODE_UTF8
2947 if ( !ch
.IsAscii() )
2948 m_impl
.replace(from
, len
, wxStringOperations::EncodeNChars(nCount
, ch
));
2951 m_impl
.replace(from
, len
, nCount
, (wxStringCharType
)ch
);
2956 // replaces a substring with another substring
// Replaces the substring (nStart, nLen) of this string with the substring
// (nStart2, nLen2) of str.
//
// Calls wxSTRING_INVALIDATE_CACHE(), converts both position/length pairs to
// implementation units (this->PosLenToImpl() and str.PosLenToImpl()) and
// calls m_impl.replace(from, len, str.m_impl, from2, len2).
// NOTE(review): the braces, the declarations of from/len/from2/len2 and the
// return statement are not visible in this excerpt.
2957 wxString
& replace(size_t nStart
, size_t nLen
,
2958 const wxString
& str
, size_t nStart2
, size_t nLen2
)
2960 wxSTRING_INVALIDATE_CACHE();
2963 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2966 str
.PosLenToImpl(nStart2
, nLen2
, &from2
, &len2
);
2968 m_impl
.replace(from
, len
, str
.m_impl
, from2
, len2
);
2973 // replaces the substring with first nCount chars of sz
// Replaces the substring (nStart, nLen) with a C string and a count nCount
// (narrow and wide variants).
//
// Both overloads call wxSTRING_INVALIDATE_CACHE(), convert (nStart, nLen)
// with PosLenToImpl(), build a SubstrBufFromMB / SubstrBufFromWC from
// ImplStr(sz, nCount) and pass its data/len pair to m_impl.replace().
// NOTE(review): the braces, the declaration of from/len and the return
// statements are not visible in this excerpt.
2974 wxString
& replace(size_t nStart
, size_t nLen
,
2975 const char* sz
, size_t nCount
)
2977 wxSTRING_INVALIDATE_CACHE();
2980 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2982 SubstrBufFromMB
str(ImplStr(sz
, nCount
));
2984 m_impl
.replace(from
, len
, str
.data
, str
.len
);
2989 wxString
& replace(size_t nStart
, size_t nLen
,
2990 const wchar_t* sz
, size_t nCount
)
2992 wxSTRING_INVALIDATE_CACHE();
2995 PosLenToImpl(nStart
, nLen
, &from
, &len
);
2997 SubstrBufFromWC
str(ImplStr(sz
, nCount
));
2999 m_impl
.replace(from
, len
, str
.data
, str
.len
);
// Replaces the substring (nStart, nLen) using a count nCount applied to s.
//
// Calls wxSTRING_INVALIDATE_CACHE() and PosLenToImpl(), then passes
// s.m_impl.c_str() together with s.LenToImpl(nCount) to m_impl.replace().
// NOTE(review): the braces, the declaration of from/len and the return
// statement are not visible in this excerpt.
3004 wxString
& replace(size_t nStart
, size_t nLen
,
3005 const wxString
& s
, size_t nCount
)
3007 wxSTRING_INVALIDATE_CACHE();
3010 PosLenToImpl(nStart
, nLen
, &from
, &len
);
3011 m_impl
.replace(from
, len
, s
.m_impl
.c_str(), s
.LenToImpl(nCount
));
// Replaces the iterator range (first, last) with a C string (narrow and wide
// variants): both overloads call wxSTRING_INVALIDATE_CACHE() and pass the
// implementation iterators plus ImplStr(s) to m_impl.replace().
// NOTE(review): the braces and return statements are not visible in this
// excerpt.
3016 wxString
& replace(iterator first
, iterator last
, const char* s
)
3018 wxSTRING_INVALIDATE_CACHE();
3020 m_impl
.replace(first
.impl(), last
.impl(), ImplStr(s
));
3025 wxString
& replace(iterator first
, iterator last
, const wchar_t* s
)
3027 wxSTRING_INVALIDATE_CACHE();
3029 m_impl
.replace(first
.impl(), last
.impl(), ImplStr(s
));
// Replaces the iterator range (first, last) with a C string and a count n
// (narrow and wide variants).
//
// Both overloads call wxSTRING_INVALIDATE_CACHE(), build a SubstrBufFromMB /
// SubstrBufFromWC from ImplStr(s, n) and pass its data/len pair to
// m_impl.replace() along with the implementation iterators.
// NOTE(review): the braces and return statements are not visible in this
// excerpt.
3034 wxString
& replace(iterator first
, iterator last
, const char* s
, size_type n
)
3036 wxSTRING_INVALIDATE_CACHE();
3038 SubstrBufFromMB
str(ImplStr(s
, n
));
3039 m_impl
.replace(first
.impl(), last
.impl(), str
.data
, str
.len
);
3044 wxString
& replace(iterator first
, iterator last
, const wchar_t* s
, size_type n
)
3046 wxSTRING_INVALIDATE_CACHE();
3048 SubstrBufFromWC
str(ImplStr(s
, n
));
3049 m_impl
.replace(first
.impl(), last
.impl(), str
.data
, str
.len
);
// Replaces the iterator range (first, last) with the whole of s: calls
// wxSTRING_INVALIDATE_CACHE() and passes the implementation iterators and
// s.m_impl to m_impl.replace().
// NOTE(review): the braces and the return statement are not visible in this
// excerpt.
3054 wxString
& replace(iterator first
, iterator last
, const wxString
& s
)
3056 wxSTRING_INVALIDATE_CACHE();
3058 m_impl
.replace(first
.impl(), last
.impl(), s
.m_impl
);
// Replaces the iterator range (first, last) with n copies of ch.
//
// Calls wxSTRING_INVALIDATE_CACHE(); under wxUSE_UNICODE_UTF8 a non-ASCII ch
// is substituted as wxStringOperations::EncodeNChars(n, ch), and the other
// visible call passes n and ch cast to wxStringCharType to m_impl.replace().
// NOTE(review): the braces, the else/#endif lines and the return statement
// are not visible in this excerpt.
3063 wxString
& replace(iterator first
, iterator last
, size_type n
, wxUniChar ch
)
3065 wxSTRING_INVALIDATE_CACHE();
3067 #if wxUSE_UNICODE_UTF8
3068 if ( !ch
.IsAscii() )
3069 m_impl
.replace(first
.impl(), last
.impl(),
3070 wxStringOperations::EncodeNChars(n
, ch
));
3073 m_impl
.replace(first
.impl(), last
.impl(), n
, (wxStringCharType
)ch
);
// Replaces the iterator range (first, last) with the range (first1, last1):
// calls wxSTRING_INVALIDATE_CACHE() and passes all four implementation
// iterators to m_impl.replace().
// NOTE(review): the braces and the return statement are not visible in this
// excerpt.
3078 wxString
& replace(iterator first
, iterator last
,
3079 const_iterator first1
, const_iterator last1
)
3081 wxSTRING_INVALIDATE_CACHE();
3083 m_impl
.replace(first
.impl(), last
.impl(), first1
.impl(), last1
.impl());
3088 wxString
& replace(iterator first
, iterator last
,
3089 const char *first1
, const char *last1
)
3090 { replace(first
, last
, first1
, last1
- first1
); return *this; }
3091 wxString
& replace(iterator first
, iterator last
,
3092 const wchar_t *first1
, const wchar_t *last1
)
3093 { replace(first
, last
, first1
, last1
- first1
); return *this; }
// Exchanges the contents of this string and str by swapping the two m_impl
// members. When wxUSE_STRING_POS_CACHE is enabled, str.InvalidateCache() is
// called first (see the comment below for why).
// NOTE(review): the braces and the line between the comment and
// str.InvalidateCache() are not visible in this excerpt.
3096 void swap(wxString
& str
)
3098 #if wxUSE_STRING_POS_CACHE
3099 // we modify not only this string but also the other one directly so we
3100 // need to invalidate cache for both of them (we could also try to
3101 // exchange their cache entries but it seems unlikely to be worth it)
3103 str
.InvalidateCache();
3104 #endif // wxUSE_STRING_POS_CACHE
3106 m_impl
.swap(str
.m_impl
);
3110 size_t find(const wxString
& str
, size_t nStart
= 0) const
3111 { return PosFromImpl(m_impl
.find(str
.m_impl
, PosToImpl(nStart
))); }
3113 // find first n characters of sz
// Searches for a C string with an optional count n (narrow and wide
// variants).
//
// Both overloads build a SubstrBufFromMB / SubstrBufFromWC from
// ImplStr(sz, n), call m_impl.find() with its data/len pair starting at
// PosToImpl(nStart), and convert the result back with PosFromImpl().
// NOTE(review): the braces are not visible in this excerpt.
3114 size_t find(const char* sz
, size_t nStart
= 0, size_t n
= npos
) const
3116 SubstrBufFromMB
str(ImplStr(sz
, n
));
3117 return PosFromImpl(m_impl
.find(str
.data
, PosToImpl(nStart
), str
.len
));
3119 size_t find(const wchar_t* sz
, size_t nStart
= 0, size_t n
= npos
) const
3121 SubstrBufFromWC
str(ImplStr(sz
, n
));
3122 return PosFromImpl(m_impl
.find(str
.data
, PosToImpl(nStart
), str
.len
));
3124 size_t find(const wxScopedCharBuffer
& s
, size_t nStart
= 0, size_t n
= npos
) const
3125 { return find(s
.data(), nStart
, n
); }
3126 size_t find(const wxScopedWCharBuffer
& s
, size_t nStart
= 0, size_t n
= npos
) const
3127 { return find(s
.data(), nStart
, n
); }
3128 size_t find(const wxCStrData
& s
, size_t nStart
= 0, size_t n
= npos
) const
3129 { return find(s
.AsWChar(), nStart
, n
); }
3131 // find the first occurrence of character ch after nStart
// Searches for the character ch starting at nStart.
//
// Under wxUSE_UNICODE_UTF8 a non-ASCII ch is searched for as
// wxStringOperations::EncodeChar(ch); the other visible call searches for ch
// cast to wxStringCharType. Both convert nStart with PosToImpl() and the
// result with PosFromImpl().
// NOTE(review): the braces and the else/#endif lines are not visible in this
// excerpt.
3132 size_t find(wxUniChar ch
, size_t nStart
= 0) const
3134 #if wxUSE_UNICODE_UTF8
3135 if ( !ch
.IsAscii() )
3136 return PosFromImpl(m_impl
.find(wxStringOperations::EncodeChar(ch
),
3137 PosToImpl(nStart
)));
3140 return PosFromImpl(m_impl
.find((wxStringCharType
)ch
,
3141 PosToImpl(nStart
)));
3144 size_t find(wxUniCharRef ch
, size_t nStart
= 0) const
3145 { return find(wxUniChar(ch
), nStart
); }
3146 size_t find(char ch
, size_t nStart
= 0) const
3147 { return find(wxUniChar(ch
), nStart
); }
3148 size_t find(unsigned char ch
, size_t nStart
= 0) const
3149 { return find(wxUniChar(ch
), nStart
); }
3150 size_t find(wchar_t ch
, size_t nStart
= 0) const
3151 { return find(wxUniChar(ch
), nStart
); }
3153 // rfind() family is exactly like find() but works right to left
3155 // as find, but from the end
3156 size_t rfind(const wxString
& str
, size_t nStart
= npos
) const
3157 { return PosFromImpl(m_impl
.rfind(str
.m_impl
, PosToImpl(nStart
))); }
3159 // as find, but from the end
// Reverse search for a C string with an optional count n (narrow and wide
// variants).
//
// Both overloads build a SubstrBufFromMB / SubstrBufFromWC from
// ImplStr(sz, n), call m_impl.rfind() with its data/len pair and
// PosToImpl(nStart), and convert the result back with PosFromImpl().
// NOTE(review): the braces are not visible in this excerpt.
3160 size_t rfind(const char* sz
, size_t nStart
= npos
, size_t n
= npos
) const
3162 SubstrBufFromMB
str(ImplStr(sz
, n
));
3163 return PosFromImpl(m_impl
.rfind(str
.data
, PosToImpl(nStart
), str
.len
));
3165 size_t rfind(const wchar_t* sz
, size_t nStart
= npos
, size_t n
= npos
) const
3167 SubstrBufFromWC
str(ImplStr(sz
, n
));
3168 return PosFromImpl(m_impl
.rfind(str
.data
, PosToImpl(nStart
), str
.len
));
3170 size_t rfind(const wxScopedCharBuffer
& s
, size_t nStart
= npos
, size_t n
= npos
) const
3171 { return rfind(s
.data(), nStart
, n
); }
3172 size_t rfind(const wxScopedWCharBuffer
& s
, size_t nStart
= npos
, size_t n
= npos
) const
3173 { return rfind(s
.data(), nStart
, n
); }
3174 size_t rfind(const wxCStrData
& s
, size_t nStart
= npos
, size_t n
= npos
) const
3175 { return rfind(s
.AsWChar(), nStart
, n
); }
3176 // as find, but from the end
// Reverse search for the character ch.
//
// Under wxUSE_UNICODE_UTF8 a non-ASCII ch is searched for as
// wxStringOperations::EncodeChar(ch); the other visible call searches for ch
// cast to wxStringCharType. Both convert nStart with PosToImpl() and the
// result with PosFromImpl().
// NOTE(review): the braces and the else/#endif lines are not visible in this
// excerpt.
3177 size_t rfind(wxUniChar ch
, size_t nStart
= npos
) const
3179 #if wxUSE_UNICODE_UTF8
3180 if ( !ch
.IsAscii() )
3181 return PosFromImpl(m_impl
.rfind(wxStringOperations::EncodeChar(ch
),
3182 PosToImpl(nStart
)));
3185 return PosFromImpl(m_impl
.rfind((wxStringCharType
)ch
,
3186 PosToImpl(nStart
)));
3188 size_t rfind(wxUniCharRef ch
, size_t nStart
= npos
) const
3189 { return rfind(wxUniChar(ch
), nStart
); }
3190 size_t rfind(char ch
, size_t nStart
= npos
) const
3191 { return rfind(wxUniChar(ch
), nStart
); }
3192 size_t rfind(unsigned char ch
, size_t nStart
= npos
) const
3193 { return rfind(wxUniChar(ch
), nStart
); }
3194 size_t rfind(wchar_t ch
, size_t nStart
= npos
) const
3195 { return rfind(wxUniChar(ch
), nStart
); }
3197 // find first/last occurrence of any character (not) in the set:
3198 #if wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
3199 // FIXME-UTF8: this is not entirely correct, because it doesn't work if
3200 // sizeof(wchar_t)==2 and surrogates are present in the string;
3201 // should we care? Probably not.
3202 size_t find_first_of(const wxString
& str
, size_t nStart
= 0) const
3203 { return m_impl
.find_first_of(str
.m_impl
, nStart
); }
3204 size_t find_first_of(const char* sz
, size_t nStart
= 0) const
3205 { return m_impl
.find_first_of(ImplStr(sz
), nStart
); }
3206 size_t find_first_of(const wchar_t* sz
, size_t nStart
= 0) const
3207 { return m_impl
.find_first_of(ImplStr(sz
), nStart
); }
3208 size_t find_first_of(const char* sz
, size_t nStart
, size_t n
) const
3209 { return m_impl
.find_first_of(ImplStr(sz
), nStart
, n
); }
3210 size_t find_first_of(const wchar_t* sz
, size_t nStart
, size_t n
) const
3211 { return m_impl
.find_first_of(ImplStr(sz
), nStart
, n
); }
3212 size_t find_first_of(wxUniChar c
, size_t nStart
= 0) const
3213 { return m_impl
.find_first_of((wxChar
)c
, nStart
); }
3215 size_t find_last_of(const wxString
& str
, size_t nStart
= npos
) const
3216 { return m_impl
.find_last_of(str
.m_impl
, nStart
); }
3217 size_t find_last_of(const char* sz
, size_t nStart
= npos
) const
3218 { return m_impl
.find_last_of(ImplStr(sz
), nStart
); }
3219 size_t find_last_of(const wchar_t* sz
, size_t nStart
= npos
) const
3220 { return m_impl
.find_last_of(ImplStr(sz
), nStart
); }
3221 size_t find_last_of(const char* sz
, size_t nStart
, size_t n
) const
3222 { return m_impl
.find_last_of(ImplStr(sz
), nStart
, n
); }
3223 size_t find_last_of(const wchar_t* sz
, size_t nStart
, size_t n
) const
3224 { return m_impl
.find_last_of(ImplStr(sz
), nStart
, n
); }
3225 size_t find_last_of(wxUniChar c
, size_t nStart
= npos
) const
3226 { return m_impl
.find_last_of((wxChar
)c
, nStart
); }
3228 size_t find_first_not_of(const wxString
& str
, size_t nStart
= 0) const
3229 { return m_impl
.find_first_not_of(str
.m_impl
, nStart
); }
3230 size_t find_first_not_of(const char* sz
, size_t nStart
= 0) const
3231 { return m_impl
.find_first_not_of(ImplStr(sz
), nStart
); }
3232 size_t find_first_not_of(const wchar_t* sz
, size_t nStart
= 0) const
3233 { return m_impl
.find_first_not_of(ImplStr(sz
), nStart
); }
3234 size_t find_first_not_of(const char* sz
, size_t nStart
, size_t n
) const
3235 { return m_impl
.find_first_not_of(ImplStr(sz
), nStart
, n
); }
3236 size_t find_first_not_of(const wchar_t* sz
, size_t nStart
, size_t n
) const
3237 { return m_impl
.find_first_not_of(ImplStr(sz
), nStart
, n
); }
3238 size_t find_first_not_of(wxUniChar c
, size_t nStart
= 0) const
3239 { return m_impl
.find_first_not_of((wxChar
)c
, nStart
); }
3241 size_t find_last_not_of(const wxString
& str
, size_t nStart
= npos
) const
3242 { return m_impl
.find_last_not_of(str
.m_impl
, nStart
); }
3243 size_t find_last_not_of(const char* sz
, size_t nStart
= npos
) const
3244 { return m_impl
.find_last_not_of(ImplStr(sz
), nStart
); }
3245 size_t find_last_not_of(const wchar_t* sz
, size_t nStart
= npos
) const
3246 { return m_impl
.find_last_not_of(ImplStr(sz
), nStart
); }
3247 size_t find_last_not_of(const char* sz
, size_t nStart
, size_t n
) const
3248 { return m_impl
.find_last_not_of(ImplStr(sz
), nStart
, n
); }
3249 size_t find_last_not_of(const wchar_t* sz
, size_t nStart
, size_t n
) const
3250 { return m_impl
.find_last_not_of(ImplStr(sz
), nStart
, n
); }
3251 size_t find_last_not_of(wxUniChar c
, size_t nStart
= npos
) const
3252 { return m_impl
.find_last_not_of((wxChar
)c
, nStart
); }
3254 // we can't use std::string implementation in UTF-8 build, because the
3255 // character sets would be interpreted wrongly:
3257 // as strpbrk() but starts at nStart, returns npos if not found
// wxString overload: forwards to a C string overload of find_first_of(),
// using str.wc_str() when wxUSE_UNICODE is set; the second visible body uses
// str.mb_str().
// NOTE(review): the #else/#endif lines separating the two bodies are not
// visible in this excerpt.
3258 size_t find_first_of(const wxString
& str
, size_t nStart
= 0) const
3259 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3260 { return find_first_of(str
.wc_str(), nStart
); }
3262 { return find_first_of(str
.mb_str(), nStart
); }
3265 size_t find_first_of(const char* sz
, size_t nStart
= 0) const;
3266 size_t find_first_of(const wchar_t* sz
, size_t nStart
= 0) const;
3267 size_t find_first_of(const char* sz
, size_t nStart
, size_t n
) const;
3268 size_t find_first_of(const wchar_t* sz
, size_t nStart
, size_t n
) const;
3269 // same as find(char, size_t)
3270 size_t find_first_of(wxUniChar c
, size_t nStart
= 0) const
3271 { return find(c
, nStart
); }
3272 // find the last (starting from nStart) char from str in this string
// wxString overload: forwards to a C string overload of find_last_of(),
// using str.wc_str() when wxUSE_UNICODE is set; the second visible body uses
// str.mb_str().
// NOTE(review): the #else/#endif lines separating the two bodies are not
// visible in this excerpt.
3273 size_t find_last_of (const wxString
& str
, size_t nStart
= npos
) const
3274 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3275 { return find_last_of(str
.wc_str(), nStart
); }
3277 { return find_last_of(str
.mb_str(), nStart
); }
3280 size_t find_last_of (const char* sz
, size_t nStart
= npos
) const;
3281 size_t find_last_of (const wchar_t* sz
, size_t nStart
= npos
) const;
3282 size_t find_last_of(const char* sz
, size_t nStart
, size_t n
) const;
3283 size_t find_last_of(const wchar_t* sz
, size_t nStart
, size_t n
) const;
3285 size_t find_last_of(wxUniChar c
, size_t nStart
= npos
) const
3286 { return rfind(c
, nStart
); }
3288 // find first/last occurrence of any character not in the set
3290 // as strspn() (starting from nStart), returns npos on failure
// wxString overload: forwards to a C string overload of find_first_not_of(),
// using str.wc_str() when wxUSE_UNICODE is set; the second visible body uses
// str.mb_str().
// NOTE(review): the #else/#endif lines separating the two bodies are not
// visible in this excerpt.
3291 size_t find_first_not_of(const wxString
& str
, size_t nStart
= 0) const
3292 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3293 { return find_first_not_of(str
.wc_str(), nStart
); }
3295 { return find_first_not_of(str
.mb_str(), nStart
); }
3298 size_t find_first_not_of(const char* sz
, size_t nStart
= 0) const;
3299 size_t find_first_not_of(const wchar_t* sz
, size_t nStart
= 0) const;
3300 size_t find_first_not_of(const char* sz
, size_t nStart
, size_t n
) const;
3301 size_t find_first_not_of(const wchar_t* sz
, size_t nStart
, size_t n
) const;
3303 size_t find_first_not_of(wxUniChar ch
, size_t nStart
= 0) const;
// wxString overload: forwards to a C string overload of find_last_not_of(),
// using str.wc_str() when wxUSE_UNICODE is set; the second visible body uses
// str.mb_str().
// NOTE(review): the #else/#endif lines separating the two bodies are not
// visible in this excerpt.
3305 size_t find_last_not_of(const wxString
& str
, size_t nStart
= npos
) const
3306 #if wxUSE_UNICODE // FIXME-UTF8: temporary
3307 { return find_last_not_of(str
.wc_str(), nStart
); }
3309 { return find_last_not_of(str
.mb_str(), nStart
); }
3312 size_t find_last_not_of(const char* sz
, size_t nStart
= npos
) const;
3313 size_t find_last_not_of(const wchar_t* sz
, size_t nStart
= npos
) const;
3314 size_t find_last_not_of(const char* sz
, size_t nStart
, size_t n
) const;
3315 size_t find_last_not_of(const wchar_t* sz
, size_t nStart
, size_t n
) const;
3317 size_t find_last_not_of(wxUniChar ch
, size_t nStart
= npos
) const;
3318 #endif // wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8 or not
3320 // provide char/wchar_t/wxUniCharRef overloads for char-finding functions
3321 // above to resolve ambiguities:
3322 size_t find_first_of(wxUniCharRef ch
, size_t nStart
= 0) const
3323 { return find_first_of(wxUniChar(ch
), nStart
); }
3324 size_t find_first_of(char ch
, size_t nStart
= 0) const
3325 { return find_first_of(wxUniChar(ch
), nStart
); }
3326 size_t find_first_of(unsigned char ch
, size_t nStart
= 0) const
3327 { return find_first_of(wxUniChar(ch
), nStart
); }
3328 size_t find_first_of(wchar_t ch
, size_t nStart
= 0) const
3329 { return find_first_of(wxUniChar(ch
), nStart
); }
3330 size_t find_last_of(wxUniCharRef ch
, size_t nStart
= npos
) const
3331 { return find_last_of(wxUniChar(ch
), nStart
); }
3332 size_t find_last_of(char ch
, size_t nStart
= npos
) const
3333 { return find_last_of(wxUniChar(ch
), nStart
); }
3334 size_t find_last_of(unsigned char ch
, size_t nStart
= npos
) const
3335 { return find_last_of(wxUniChar(ch
), nStart
); }
3336 size_t find_last_of(wchar_t ch
, size_t nStart
= npos
) const
3337 { return find_last_of(wxUniChar(ch
), nStart
); }
3338 size_t find_first_not_of(wxUniCharRef ch
, size_t nStart
= 0) const
3339 { return find_first_not_of(wxUniChar(ch
), nStart
); }
3340 size_t find_first_not_of(char ch
, size_t nStart
= 0) const
3341 { return find_first_not_of(wxUniChar(ch
), nStart
); }
3342 size_t find_first_not_of(unsigned char ch
, size_t nStart
= 0) const
3343 { return find_first_not_of(wxUniChar(ch
), nStart
); }
3344 size_t find_first_not_of(wchar_t ch
, size_t nStart
= 0) const
3345 { return find_first_not_of(wxUniChar(ch
), nStart
); }
3346 size_t find_last_not_of(wxUniCharRef ch
, size_t nStart
= npos
) const
3347 { return find_last_not_of(wxUniChar(ch
), nStart
); }
3348 size_t find_last_not_of(char ch
, size_t nStart
= npos
) const
3349 { return find_last_not_of(wxUniChar(ch
), nStart
); }
3350 size_t find_last_not_of(unsigned char ch
, size_t nStart
= npos
) const
3351 { return find_last_not_of(wxUniChar(ch
), nStart
); }
3352 size_t find_last_not_of(wchar_t ch
, size_t nStart
= npos
) const
3353 { return find_last_not_of(wxUniChar(ch
), nStart
); }
3355 // and additional overloads for the versions taking strings:
3356 size_t find_first_of(const wxCStrData
& sz
, size_t nStart
= 0) const
3357 { return find_first_of(sz
.AsString(), nStart
); }
3358 size_t find_first_of(const wxScopedCharBuffer
& sz
, size_t nStart
= 0) const
3359 { return find_first_of(sz
.data(), nStart
); }
3360 size_t find_first_of(const wxScopedWCharBuffer
& sz
, size_t nStart
= 0) const
3361 { return find_first_of(sz
.data(), nStart
); }
3362 size_t find_first_of(const wxCStrData
& sz
, size_t nStart
, size_t n
) const
3363 { return find_first_of(sz
.AsWChar(), nStart
, n
); }
3364 size_t find_first_of(const wxScopedCharBuffer
& sz
, size_t nStart
, size_t n
) const
3365 { return find_first_of(sz
.data(), nStart
, n
); }
3366 size_t find_first_of(const wxScopedWCharBuffer
& sz
, size_t nStart
, size_t n
) const
3367 { return find_first_of(sz
.data(), nStart
, n
); }
3369 size_t find_last_of(const wxCStrData
& sz
, size_t nStart
= 0) const
3370 { return find_last_of(sz
.AsString(), nStart
); }
3371 size_t find_last_of(const wxScopedCharBuffer
& sz
, size_t nStart
= 0) const
3372 { return find_last_of(sz
.data(), nStart
); }
3373 size_t find_last_of(const wxScopedWCharBuffer
& sz
, size_t nStart
= 0) const
3374 { return find_last_of(sz
.data(), nStart
); }
3375 size_t find_last_of(const wxCStrData
& sz
, size_t nStart
, size_t n
) const
3376 { return find_last_of(sz
.AsWChar(), nStart
, n
); }
3377 size_t find_last_of(const wxScopedCharBuffer
& sz
, size_t nStart
, size_t n
) const
3378 { return find_last_of(sz
.data(), nStart
, n
); }
3379 size_t find_last_of(const wxScopedWCharBuffer
& sz
, size_t nStart
, size_t n
) const
3380 { return find_last_of(sz
.data(), nStart
, n
); }
3382 size_t find_first_not_of(const wxCStrData
& sz
, size_t nStart
= 0) const
3383 { return find_first_not_of(sz
.AsString(), nStart
); }
3384 size_t find_first_not_of(const wxScopedCharBuffer
& sz
, size_t nStart
= 0) const
3385 { return find_first_not_of(sz
.data(), nStart
); }
3386 size_t find_first_not_of(const wxScopedWCharBuffer
& sz
, size_t nStart
= 0) const
3387 { return find_first_not_of(sz
.data(), nStart
); }
3388 size_t find_first_not_of(const wxCStrData
& sz
, size_t nStart
, size_t n
) const
3389 { return find_first_not_of(sz
.AsWChar(), nStart
, n
); }
3390 size_t find_first_not_of(const wxScopedCharBuffer
& sz
, size_t nStart
, size_t n
) const
3391 { return find_first_not_of(sz
.data(), nStart
, n
); }
3392 size_t find_first_not_of(const wxScopedWCharBuffer
& sz
, size_t nStart
, size_t n
) const
3393 { return find_first_not_of(sz
.data(), nStart
, n
); }
3395 size_t find_last_not_of(const wxCStrData
& sz
, size_t nStart
= 0) const
3396 { return find_last_not_of(sz
.AsString(), nStart
); }
3397 size_t find_last_not_of(const wxScopedCharBuffer
& sz
, size_t nStart
= 0) const
3398 { return find_last_not_of(sz
.data(), nStart
); }
3399 size_t find_last_not_of(const wxScopedWCharBuffer
& sz
, size_t nStart
= 0) const
3400 { return find_last_not_of(sz
.data(), nStart
); }
3401 size_t find_last_not_of(const wxCStrData
& sz
, size_t nStart
, size_t n
) const
3402 { return find_last_not_of(sz
.AsWChar(), nStart
, n
); }
3403 size_t find_last_not_of(const wxScopedCharBuffer
& sz
, size_t nStart
, size_t n
) const
3404 { return find_last_not_of(sz
.data(), nStart
, n
); }
3405 size_t find_last_not_of(const wxScopedWCharBuffer
& sz
, size_t nStart
, size_t n
) const
3406 { return find_last_not_of(sz
.data(), nStart
, n
); }
// string += string. The only visible statement calls
// wxSTRING_INVALIDATE_CACHED_LENGTH().
// NOTE(review): the braces, the actual append and the return statement are
// not visible in this excerpt.
3409 wxString
& operator+=(const wxString
& s
)
3411 wxSTRING_INVALIDATE_CACHED_LENGTH();
3416 // string += C string
// Appends a C string (narrow and wide variants): both overloads call
// wxSTRING_INVALIDATE_CACHED_LENGTH() and append ImplStr() of the argument
// to m_impl.
// NOTE(review): the braces and return statements are not visible in this
// excerpt.
3417 wxString
& operator+=(const char *psz
)
3419 wxSTRING_INVALIDATE_CACHED_LENGTH();
3421 m_impl
+= ImplStr(psz
);
3424 wxString
& operator+=(const wchar_t *pwz
)
3426 wxSTRING_INVALIDATE_CACHED_LENGTH();
3428 m_impl
+= ImplStr(pwz
);
// Appends a c_str() result: calls wxSTRING_INVALIDATE_CACHED_LENGTH() and
// appends the m_impl of s.AsString() to this string's m_impl.
// NOTE(review): the braces and the return statement are not visible in this
// excerpt.
3431 wxString
& operator+=(const wxCStrData
& s
)
3433 wxSTRING_INVALIDATE_CACHED_LENGTH();
3435 m_impl
+= s
.AsString().m_impl
;
3438 wxString
& operator+=(const wxScopedCharBuffer
& s
)
3439 { return append(s
); }
3440 wxString
& operator+=(const wxScopedWCharBuffer
& s
)
3441 { return append(s
); }
// Appends a single character.
//
// Calls wxSTRING_UPDATE_CACHED_LENGTH(1); under wxUSE_UNICODE_UTF8 a
// non-ASCII ch is appended as wxStringOperations::EncodeChar(ch), and the
// other visible statement appends ch cast to wxStringCharType.
// NOTE(review): the braces, the else/#endif lines and the return statement
// are not visible in this excerpt.
3443 wxString
& operator+=(wxUniChar ch
)
3445 wxSTRING_UPDATE_CACHED_LENGTH(1);
3447 #if wxUSE_UNICODE_UTF8
3448 if ( !ch
.IsAscii() )
3449 m_impl
+= wxStringOperations::EncodeChar(ch
);
3452 m_impl
+= (wxStringCharType
)ch
;
3455 wxString
& operator+=(wxUniCharRef ch
) { return *this += wxUniChar(ch
); }
3456 wxString
& operator+=(int ch
) { return *this += wxUniChar(ch
); }
3457 wxString
& operator+=(char ch
) { return *this += wxUniChar(ch
); }
3458 wxString
& operator+=(unsigned char ch
) { return *this += wxUniChar(ch
); }
3459 wxString
& operator+=(wchar_t ch
) { return *this += wxUniChar(ch
); }
3462 #if !wxUSE_STL_BASED_WXSTRING
3463 // helpers for wxStringBuffer and wxStringBufferLength
// Helper for wxStringBuffer / wxStringBufferLength: returns the result of
// m_impl.DoGetWriteBuf(nLen).
// NOTE(review): the braces (and any other statements) are not visible in
// this excerpt.
3464 wxStringCharType
*DoGetWriteBuf(size_t nLen
)
3466 return m_impl
.DoGetWriteBuf(nLen
);
// Counterparts of DoGetWriteBuf(). The version without arguments calls
// wxSTRING_INVALIDATE_CACHE() before m_impl.DoUngetWriteBuf(); the version
// taking nLen calls wxSTRING_SET_CACHED_LENGTH(nLen) before
// m_impl.DoUngetWriteBuf(nLen).
// NOTE(review): the braces are not visible in this excerpt.
3469 void DoUngetWriteBuf()
3471 wxSTRING_INVALIDATE_CACHE();
3473 m_impl
.DoUngetWriteBuf();
3476 void DoUngetWriteBuf(size_t nLen
)
3478 wxSTRING_SET_CACHED_LENGTH(nLen
);
3480 m_impl
.DoUngetWriteBuf(nLen
);
3482 #endif // !wxUSE_STL_BASED_WXSTRING
3484 #ifndef wxNEEDS_WXSTRING_PRINTF_MIXIN
3485 #if !wxUSE_UTF8_LOCALE_ONLY
3486 int DoPrintfWchar(const wxChar
*format
, ...);
3487 static wxString
DoFormatWchar(const wxChar
*format
, ...);
3489 #if wxUSE_UNICODE_UTF8
3490 int DoPrintfUtf8(const char *format
, ...);
3491 static wxString
DoFormatUtf8(const char *format
, ...);
3495 #if !wxUSE_STL_BASED_WXSTRING
3496 // check string's data validity
3497 bool IsValid() const { return m_impl
.GetStringData()->IsValid(); }
3501 wxStringImpl m_impl
;
3503 // buffers for compatibility conversion from (char*)c_str() and
3504 // (wchar_t*)c_str(): the pointers returned by these functions should remain
3505 // valid until the string itself is modified for compatibility with the
3506 // existing code and consistency with std::string::c_str() so returning a
3507 // temporary buffer won't do and we need to cache the conversion results
3509 // TODO-UTF8: benchmark various approaches to keeping compatibility buffers
// Cache for a converted copy of the string, holding a T* buffer (m_str) and
// its length in characters (m_len).
//
// Extend(len) reallocates m_str with realloc() to hold len + 1 elements of T
// and stores the resulting pointer; AsScopedBuffer() exposes the cached data
// as a non-owning wxScopedCharTypeBuffer<T>.
// NOTE(review): several lines of this struct (braces, the checks and return
// statements in Extend(), and anything between the constructor and Extend())
// are not visible in this excerpt, so error handling and buffer release
// cannot be described from here.
3510 template<typename T
>
3511 struct ConvertedBuffer
3513 // notice that there is no need to initialize m_len here as it's unused
3514 // as long as m_str is NULL
3515 ConvertedBuffer() : m_str(NULL
) {}
3519 bool Extend(size_t len
)
3521 // add extra 1 for the trailing NUL
3522 void * const str
= realloc(m_str
, sizeof(T
)*(len
+ 1));
3526 m_str
= static_cast<T
*>(str
);
3532 const wxScopedCharTypeBuffer
<T
> AsScopedBuffer() const
3534 return wxScopedCharTypeBuffer
<T
>::CreateNonOwned(m_str
, m_len
);
3537 T
*m_str
; // pointer to the string data
3538 size_t m_len
; // length, not size, i.e. in chars and without last NUL
3543 // common mb_str() and wxCStrData::AsChar() helper: performs the conversion
3544 // and returns either m_convertedToChar.m_str (in which case its m_len is
3545 // also updated) or NULL if it failed
3547 // there is an important exception: in wxUSE_UNICODE_UTF8 build if conv is a
3548 // UTF-8 one, we return m_impl.c_str() directly, without doing any conversion
3549 // as optimization and so the caller needs to check for this before using
3550 // m_convertedToChar
3552 // NB: AsChar() returns char* in any build, unlike mb_str()
3553 const char *AsChar(const wxMBConv
& conv
) const;
3555 // mb_str() implementation helper
// Returns the string converted with conv as a non-owning wxScopedCharBuffer.
//
// Three visible outcomes: under wxUSE_UNICODE_UTF8 with a UTF-8 conv, a
// buffer over m_impl.c_str() is returned directly; if AsChar(conv) fails, an
// empty non-owned buffer is returned; otherwise the buffer cached in
// m_convertedToChar is returned.
// NOTE(review): the braces and the second argument of the first
// CreateNonOwned() call are not visible in this excerpt.
3556 wxScopedCharBuffer
AsCharBuf(const wxMBConv
& conv
) const
3558 #if wxUSE_UNICODE_UTF8
3559 // avoid conversion if we can
3560 if ( conv
.IsUTF8() )
3562 return wxScopedCharBuffer::CreateNonOwned(m_impl
.c_str(),
3565 #endif // wxUSE_UNICODE_UTF8
3567 // call this solely in order to fill in m_convertedToChar as AsChar()
3568 // updates it as a side effect: this is a bit ugly but it's a completely
3569 // internal function so the users of this class shouldn't care or know
3570 // about it and doing it like this, i.e. having a separate AsChar(),
3571 // allows us to avoid the creation and destruction of a temporary buffer
3572 // when using wxCStrData without duplicating any code
3573 if ( !AsChar(conv
) )
3575 // although it would be probably more correct to return NULL buffer
3576 // from here if the conversion fails, a lot of existing code doesn't
3577 // expect mb_str() (or wc_str()) to ever return NULL so return an
3578 // empty string otherwise to avoid crashes in it
3580 // also, some existing code does check for the conversion success and
3581 // so asserting here would be bad too -- even if it does mean that
3582 // silently losing data is possible for badly written code
3583 return wxScopedCharBuffer::CreateNonOwned("", 0);
3586 return m_convertedToChar
.AsScopedBuffer();
3589 ConvertedBuffer
<char> m_convertedToChar
;
3590 #endif // !wxUSE_UNICODE
3592 #if !wxUSE_UNICODE_WCHAR
3593 // common wc_str() and wxCStrData::AsWChar() helper for both UTF-8 and ANSI
3594 // builds: converts the string contents into m_convertedToWChar and returns
3595 // NULL if the conversion failed (this can only happen in ANSI build)
3597 // NB: AsWChar() returns wchar_t* in any build, unlike wc_str()
3598 const wchar_t *AsWChar(const wxMBConv
& conv
) const;
3600 // wc_str() implementation helper
// Returns the string converted with conv as a non-owning
// wxScopedWCharBuffer: an empty buffer if AsWChar(conv) fails, otherwise the
// buffer cached in m_convertedToWChar (which AsWChar() fills in, per the
// comment on its declaration).
// NOTE(review): the braces are not visible in this excerpt.
3601 wxScopedWCharBuffer
AsWCharBuf(const wxMBConv
& conv
) const
3603 if ( !AsWChar(conv
) )
3604 return wxScopedWCharBuffer::CreateNonOwned(L
"", 0);
3606 return m_convertedToWChar
.AsScopedBuffer();
3609 ConvertedBuffer
<wchar_t> m_convertedToWChar
;
3610 #endif // !wxUSE_UNICODE_WCHAR
3612 #if wxUSE_UNICODE_UTF8
3613 // FIXME-UTF8: (try to) move this elsewhere (TLS) or solve differently
3614 // assigning to character pointed to by wxString::iterator may
3615 // change the underlying wxStringImpl iterator, so we have to
3616 // keep track of all iterators and update them as necessary:
// Head of the linked list of iterator nodes for this string: a single
// wxStringIteratorNode pointer, initialised to NULL, with copying disabled
// through wxDECLARE_NO_COPY_CLASS.
// NOTE(review): the braces of the struct are not visible in this excerpt.
3617 struct wxStringIteratorNodeHead
3619 wxStringIteratorNodeHead() : ptr(NULL
) {}
3620 wxStringIteratorNode
*ptr
;
3622 // copying is disallowed as it would result in more than one pointer into
3623 // the same linked list
3624 wxDECLARE_NO_COPY_CLASS(wxStringIteratorNodeHead
);
3627 wxStringIteratorNodeHead m_iterators
;
3629 friend class WXDLLIMPEXP_FWD_BASE wxStringIteratorNode
;
3630 friend class WXDLLIMPEXP_FWD_BASE wxUniCharRef
;
3631 #endif // wxUSE_UNICODE_UTF8
3633 friend class WXDLLIMPEXP_FWD_BASE wxCStrData
;
3634 friend class wxStringInternalBuffer
;
3635 friend class wxStringInternalBufferLength
;
3638 #ifdef wxNEEDS_WXSTRING_PRINTF_MIXIN
3639 #pragma warning (pop)
3642 // string iterator operators that satisfy STL Random Access Iterator
3644 inline wxString::iterator
operator+(ptrdiff_t n
, wxString::iterator i
)
3646 inline wxString::const_iterator
operator+(ptrdiff_t n
, wxString::const_iterator i
)
3648 inline wxString::reverse_iterator
operator+(ptrdiff_t n
, wxString::reverse_iterator i
)
3650 inline wxString::const_reverse_iterator
operator+(ptrdiff_t n
, wxString::const_reverse_iterator i
)
3653 // notice that even though for many compilers the friend declarations above are
3654 // enough, from the point of view of C++ standard we must have the declarations
3655 // here as friend ones are not injected in the enclosing namespace and without
3656 // them the code fails to compile with conforming compilers such as xlC or g++4
3657 wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string1
, const wxString
& string2
);
3658 wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string
, const char *psz
);
3659 wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string
, const wchar_t *pwz
);
3660 wxString WXDLLIMPEXP_BASE
operator+(const char *psz
, const wxString
& string
);
3661 wxString WXDLLIMPEXP_BASE
operator+(const wchar_t *pwz
, const wxString
& string
);
3663 wxString WXDLLIMPEXP_BASE
operator+(const wxString
& string
, wxUniChar ch
);
3664 wxString WXDLLIMPEXP_BASE
operator+(wxUniChar ch
, const wxString
& string
);
3666 inline wxString
operator+(const wxString
& string
, wxUniCharRef ch
)
3667 { return string
+ (wxUniChar
)ch
; }
3668 inline wxString
operator+(const wxString
& string
, char ch
)
3669 { return string
+ wxUniChar(ch
); }
3670 inline wxString
operator+(const wxString
& string
, wchar_t ch
)
3671 { return string
+ wxUniChar(ch
); }
3672 inline wxString
operator+(wxUniCharRef ch
, const wxString
& string
)
3673 { return (wxUniChar
)ch
+ string
; }
3674 inline wxString
operator+(char ch
, const wxString
& string
)
3675 { return wxUniChar(ch
) + string
; }
3676 inline wxString
operator+(wchar_t ch
, const wxString
& string
)
3677 { return wxUniChar(ch
) + string
; }
3680 #define wxGetEmptyString() wxString()
3682 // ----------------------------------------------------------------------------
3683 // helper functions which couldn't be defined inline
3684 // ----------------------------------------------------------------------------
3689 #if wxUSE_UNICODE_WCHAR
3692 struct wxStringAsBufHelper
<char>
3694 static wxScopedCharBuffer
Get(const wxString
& s
, size_t *len
)
3696 wxScopedCharBuffer
buf(s
.mb_str());
3698 *len
= buf
? strlen(buf
) : 0;
3704 struct wxStringAsBufHelper
<wchar_t>
3706 static wxScopedWCharBuffer
Get(const wxString
& s
, size_t *len
)
3708 const size_t length
= s
.length();
3711 return wxScopedWCharBuffer::CreateNonOwned(s
.wx_str(), length
);
3715 #elif wxUSE_UNICODE_UTF8
3718 struct wxStringAsBufHelper
<char>
3720 static wxScopedCharBuffer
Get(const wxString
& s
, size_t *len
)
3722 const size_t length
= s
.utf8_length();
3725 return wxScopedCharBuffer::CreateNonOwned(s
.wx_str(), length
);
3730 struct wxStringAsBufHelper
<wchar_t>
3732 static wxScopedWCharBuffer
Get(const wxString
& s
, size_t *len
)
3734 wxScopedWCharBuffer
wbuf(s
.wc_str());
3736 *len
= wxWcslen(wbuf
);
3741 #endif // Unicode build kind
3743 } // namespace wxPrivate
3745 // ----------------------------------------------------------------------------
3746 // wxStringBuffer: a tiny class allowing to get a writable pointer into string
3747 // ----------------------------------------------------------------------------
3749 #if !wxUSE_STL_BASED_WXSTRING
3750 // string buffer for direct access to string data in their native
3752 class wxStringInternalBuffer
3755 typedef wxStringCharType CharType
;
3757 wxStringInternalBuffer(wxString
& str
, size_t lenWanted
= 1024)
3758 : m_str(str
), m_buf(NULL
)
3759 { m_buf
= m_str
.DoGetWriteBuf(lenWanted
); }
3761 ~wxStringInternalBuffer() { m_str
.DoUngetWriteBuf(); }
3763 operator wxStringCharType
*() const { return m_buf
; }
3767 wxStringCharType
*m_buf
;
3769 wxDECLARE_NO_COPY_CLASS(wxStringInternalBuffer
);
3772 class wxStringInternalBufferLength
3775 typedef wxStringCharType CharType
;
3777 wxStringInternalBufferLength(wxString
& str
, size_t lenWanted
= 1024)
3778 : m_str(str
), m_buf(NULL
), m_len(0), m_lenSet(false)
3780 m_buf
= m_str
.DoGetWriteBuf(lenWanted
);
3781 wxASSERT(m_buf
!= NULL
);
3784 ~wxStringInternalBufferLength()
3787 m_str
.DoUngetWriteBuf(m_len
);
3790 operator wxStringCharType
*() const { return m_buf
; }
3791 void SetLength(size_t length
) { m_len
= length
; m_lenSet
= true; }
3795 wxStringCharType
*m_buf
;
3799 wxDECLARE_NO_COPY_CLASS(wxStringInternalBufferLength
);
3802 #endif // !wxUSE_STL_BASED_WXSTRING
3804 template<typename T
>
3805 class wxStringTypeBufferBase
3810 wxStringTypeBufferBase(wxString
& str
, size_t lenWanted
= 1024)
3811 : m_str(str
), m_buf(lenWanted
)
3813 // for compatibility with old wxStringBuffer which provided direct
3814 // access to wxString internal buffer, initialize ourselves with the
3815 // string initial contents
3817 // FIXME-VC6: remove the ugly (CharType *)NULL and use normal
3818 // tchar_str<CharType>
3820 const wxCharTypeBuffer
<CharType
> buf(str
.tchar_str(&len
, (CharType
*)NULL
));
3823 if ( len
> lenWanted
)
3825 // in this case there is not enough space for terminating NUL,
3826 // ensure that we still put it there
3827 m_buf
.data()[lenWanted
] = 0;
3828 len
= lenWanted
- 1;
3831 memcpy(m_buf
.data(), buf
, (len
+ 1)*sizeof(CharType
));
3833 //else: conversion failed, this can happen when trying to get Unicode
3834 // string contents into a char string
3837 operator CharType
*() { return m_buf
.data(); }
3841 wxCharTypeBuffer
<CharType
> m_buf
;
3844 template<typename T
>
3845 class wxStringTypeBufferLengthBase
: public wxStringTypeBufferBase
<T
>
3848 wxStringTypeBufferLengthBase(wxString
& str
, size_t lenWanted
= 1024)
3849 : wxStringTypeBufferBase
<T
>(str
, lenWanted
),
3854 ~wxStringTypeBufferLengthBase()
3856 wxASSERT_MSG( this->m_lenSet
, "forgot to call SetLength()" );
3859 void SetLength(size_t length
) { m_len
= length
; m_lenSet
= true; }
3866 template<typename T
>
3867 class wxStringTypeBuffer
: public wxStringTypeBufferBase
<T
>
3870 wxStringTypeBuffer(wxString
& str
, size_t lenWanted
= 1024)
3871 : wxStringTypeBufferBase
<T
>(str
, lenWanted
)
3874 ~wxStringTypeBuffer()
3876 this->m_str
.assign(this->m_buf
.data());
3879 wxDECLARE_NO_COPY_CLASS(wxStringTypeBuffer
);
3882 template<typename T
>
3883 class wxStringTypeBufferLength
: public wxStringTypeBufferLengthBase
<T
>
3886 wxStringTypeBufferLength(wxString
& str
, size_t lenWanted
= 1024)
3887 : wxStringTypeBufferLengthBase
<T
>(str
, lenWanted
)
3890 ~wxStringTypeBufferLength()
3892 this->m_str
.assign(this->m_buf
.data(), this->m_len
);
3895 wxDECLARE_NO_COPY_CLASS(wxStringTypeBufferLength
);
3898 #if wxUSE_STL_BASED_WXSTRING
3900 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE( wxStringTypeBufferBase
<wxStringCharType
> )
3902 class wxStringInternalBuffer
: public wxStringTypeBufferBase
<wxStringCharType
>
3905 wxStringInternalBuffer(wxString
& str
, size_t lenWanted
= 1024)
3906 : wxStringTypeBufferBase
<wxStringCharType
>(str
, lenWanted
) {}
3907 ~wxStringInternalBuffer()
3908 { m_str
.m_impl
.assign(m_buf
.data()); }
3910 wxDECLARE_NO_COPY_CLASS(wxStringInternalBuffer
);
3913 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE(
3914 wxStringTypeBufferLengthBase
<wxStringCharType
> )
3916 class wxStringInternalBufferLength
3917 : public wxStringTypeBufferLengthBase
<wxStringCharType
>
3920 wxStringInternalBufferLength(wxString
& str
, size_t lenWanted
= 1024)
3921 : wxStringTypeBufferLengthBase
<wxStringCharType
>(str
, lenWanted
) {}
3923 ~wxStringInternalBufferLength()
3925 m_str
.m_impl
.assign(m_buf
.data(), m_len
);
3928 wxDECLARE_NO_COPY_CLASS(wxStringInternalBufferLength
);
3931 #endif // wxUSE_STL_BASED_WXSTRING
3934 #if wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8
3935 typedef wxStringTypeBuffer
<wxChar
> wxStringBuffer
;
3936 typedef wxStringTypeBufferLength
<wxChar
> wxStringBufferLength
;
3937 #else // if !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
3938 typedef wxStringInternalBuffer wxStringBuffer
;
3939 typedef wxStringInternalBufferLength wxStringBufferLength
;
3940 #endif // !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8
3942 #if wxUSE_UNICODE_UTF8
3943 typedef wxStringInternalBuffer wxUTF8StringBuffer
;
3944 typedef wxStringInternalBufferLength wxUTF8StringBufferLength
;
3945 #elif wxUSE_UNICODE_WCHAR
3947 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE( wxStringTypeBufferBase
<char> )
3949 // Note about inlined dtors in the classes below: this is done not for
3950 // performance reasons but just to avoid linking errors in the MSVC DLL build
3951 // under Windows: if a class has non-inline methods it must be declared as
3952 // being DLL-exported but, due to an extremely interesting feature of MSVC 7
3953 // and later, any template class which is used as a base of a DLL-exported
3954 // class is implicitly made DLL-exported too, as explained at the bottom of
3955 // http://msdn.microsoft.com/en-us/library/twa2aw10.aspx (just to confirm: yes,
3956 // _inheriting_ from a class can change whether it is being exported from DLL)
3958 // But this results in link errors because the base template class is not DLL-
3959 // exported, whether it is declared with WXDLLIMPEXP_BASE or not, because it
3960 // does have only inline functions. So the simplest fix is to just make all the
3961 // functions of these classes inline too.
3963 class wxUTF8StringBuffer
: public wxStringTypeBufferBase
<char>
3966 wxUTF8StringBuffer(wxString
& str
, size_t lenWanted
= 1024)
3967 : wxStringTypeBufferBase
<char>(str
, lenWanted
) {}
3968 ~wxUTF8StringBuffer()
3970 wxMBConvStrictUTF8 conv
;
3971 size_t wlen
= conv
.ToWChar(NULL
, 0, m_buf
);
3972 wxCHECK_RET( wlen
!= wxCONV_FAILED
, "invalid UTF-8 data in string buffer?" );
3974 wxStringInternalBuffer
wbuf(m_str
, wlen
);
3975 conv
.ToWChar(wbuf
, wlen
, m_buf
);
3978 wxDECLARE_NO_COPY_CLASS(wxUTF8StringBuffer
);
3981 WXDLLIMPEXP_TEMPLATE_INSTANCE_BASE( wxStringTypeBufferLengthBase
<char> )
3983 class wxUTF8StringBufferLength
: public wxStringTypeBufferLengthBase
<char>
3986 wxUTF8StringBufferLength(wxString
& str
, size_t lenWanted
= 1024)
3987 : wxStringTypeBufferLengthBase
<char>(str
, lenWanted
) {}
3988 ~wxUTF8StringBufferLength()
3990 wxCHECK_RET(m_lenSet
, "length not set");
3992 wxMBConvStrictUTF8 conv
;
3993 size_t wlen
= conv
.ToWChar(NULL
, 0, m_buf
, m_len
);
3994 wxCHECK_RET( wlen
!= wxCONV_FAILED
, "invalid UTF-8 data in string buffer?" );
3996 wxStringInternalBufferLength
wbuf(m_str
, wlen
);
3997 conv
.ToWChar(wbuf
, wlen
, m_buf
, m_len
);
3998 wbuf
.SetLength(wlen
);
4001 wxDECLARE_NO_COPY_CLASS(wxUTF8StringBufferLength
);
4003 #endif // wxUSE_UNICODE_UTF8/wxUSE_UNICODE_WCHAR
4006 // ---------------------------------------------------------------------------
4007 // wxString comparison functions: operator versions are always case sensitive
4008 // ---------------------------------------------------------------------------
4010 #define wxCMP_WXCHAR_STRING(p, s, op) 0 op s.Cmp(p)
4012 wxDEFINE_ALL_COMPARISONS(const wxChar
*, const wxString
&, wxCMP_WXCHAR_STRING
)
4014 #undef wxCMP_WXCHAR_STRING
4016 inline bool operator==(const wxString
& s1
, const wxString
& s2
)
4017 { return s1
.IsSameAs(s2
); }
4018 inline bool operator!=(const wxString
& s1
, const wxString
& s2
)
4019 { return !s1
.IsSameAs(s2
); }
4020 inline bool operator< (const wxString
& s1
, const wxString
& s2
)
4021 { return s1
.Cmp(s2
) < 0; }
4022 inline bool operator> (const wxString
& s1
, const wxString
& s2
)
4023 { return s1
.Cmp(s2
) > 0; }
4024 inline bool operator<=(const wxString
& s1
, const wxString
& s2
)
4025 { return s1
.Cmp(s2
) <= 0; }
4026 inline bool operator>=(const wxString
& s1
, const wxString
& s2
)
4027 { return s1
.Cmp(s2
) >= 0; }
4029 inline bool operator==(const wxString
& s1
, const wxCStrData
& s2
)
4030 { return s1
== s2
.AsString(); }
4031 inline bool operator==(const wxCStrData
& s1
, const wxString
& s2
)
4032 { return s1
.AsString() == s2
; }
4033 inline bool operator!=(const wxString
& s1
, const wxCStrData
& s2
)
4034 { return s1
!= s2
.AsString(); }
4035 inline bool operator!=(const wxCStrData
& s1
, const wxString
& s2
)
4036 { return s1
.AsString() != s2
; }
4038 inline bool operator==(const wxString
& s1
, const wxScopedWCharBuffer
& s2
)
4039 { return (s1
.Cmp((const wchar_t *)s2
) == 0); }
4040 inline bool operator==(const wxScopedWCharBuffer
& s1
, const wxString
& s2
)
4041 { return (s2
.Cmp((const wchar_t *)s1
) == 0); }
4042 inline bool operator!=(const wxString
& s1
, const wxScopedWCharBuffer
& s2
)
4043 { return (s1
.Cmp((const wchar_t *)s2
) != 0); }
4044 inline bool operator!=(const wxScopedWCharBuffer
& s1
, const wxString
& s2
)
4045 { return (s2
.Cmp((const wchar_t *)s1
) != 0); }
4047 inline bool operator==(const wxString
& s1
, const wxScopedCharBuffer
& s2
)
4048 { return (s1
.Cmp((const char *)s2
) == 0); }
4049 inline bool operator==(const wxScopedCharBuffer
& s1
, const wxString
& s2
)
4050 { return (s2
.Cmp((const char *)s1
) == 0); }
4051 inline bool operator!=(const wxString
& s1
, const wxScopedCharBuffer
& s2
)
4052 { return (s1
.Cmp((const char *)s2
) != 0); }
4053 inline bool operator!=(const wxScopedCharBuffer
& s1
, const wxString
& s2
)
4054 { return (s2
.Cmp((const char *)s1
) != 0); }
4056 inline wxString
operator+(const wxString
& string
, const wxScopedWCharBuffer
& buf
)
4057 { return string
+ (const wchar_t *)buf
; }
4058 inline wxString
operator+(const wxScopedWCharBuffer
& buf
, const wxString
& string
)
4059 { return (const wchar_t *)buf
+ string
; }
4061 inline wxString
operator+(const wxString
& string
, const wxScopedCharBuffer
& buf
)
4062 { return string
+ (const char *)buf
; }
4063 inline wxString
operator+(const wxScopedCharBuffer
& buf
, const wxString
& string
)
4064 { return (const char *)buf
+ string
; }
4066 // comparison with char
4067 inline bool operator==(const wxUniChar
& c
, const wxString
& s
) { return s
.IsSameAs(c
); }
4068 inline bool operator==(const wxUniCharRef
& c
, const wxString
& s
) { return s
.IsSameAs(c
); }
4069 inline bool operator==(char c
, const wxString
& s
) { return s
.IsSameAs(c
); }
4070 inline bool operator==(wchar_t c
, const wxString
& s
) { return s
.IsSameAs(c
); }
4071 inline bool operator==(int c
, const wxString
& s
) { return s
.IsSameAs(c
); }
4072 inline bool operator==(const wxString
& s
, const wxUniChar
& c
) { return s
.IsSameAs(c
); }
4073 inline bool operator==(const wxString
& s
, const wxUniCharRef
& c
) { return s
.IsSameAs(c
); }
4074 inline bool operator==(const wxString
& s
, char c
) { return s
.IsSameAs(c
); }
4075 inline bool operator==(const wxString
& s
, wchar_t c
) { return s
.IsSameAs(c
); }
4076 inline bool operator!=(const wxUniChar
& c
, const wxString
& s
) { return !s
.IsSameAs(c
); }
4077 inline bool operator!=(const wxUniCharRef
& c
, const wxString
& s
) { return !s
.IsSameAs(c
); }
4078 inline bool operator!=(char c
, const wxString
& s
) { return !s
.IsSameAs(c
); }
4079 inline bool operator!=(wchar_t c
, const wxString
& s
) { return !s
.IsSameAs(c
); }
4080 inline bool operator!=(int c
, const wxString
& s
) { return !s
.IsSameAs(c
); }
4081 inline bool operator!=(const wxString
& s
, const wxUniChar
& c
) { return !s
.IsSameAs(c
); }
4082 inline bool operator!=(const wxString
& s
, const wxUniCharRef
& c
) { return !s
.IsSameAs(c
); }
4083 inline bool operator!=(const wxString
& s
, char c
) { return !s
.IsSameAs(c
); }
4084 inline bool operator!=(const wxString
& s
, wchar_t c
) { return !s
.IsSameAs(c
); }
4087 // wxString iterators comparisons
4088 inline bool wxString::iterator::operator==(const const_iterator
& i
) const
4089 { return i
== *this; }
4090 inline bool wxString::iterator::operator!=(const const_iterator
& i
) const
4091 { return i
!= *this; }
4092 inline bool wxString::iterator::operator<(const const_iterator
& i
) const
4093 { return i
> *this; }
4094 inline bool wxString::iterator::operator>(const const_iterator
& i
) const
4095 { return i
< *this; }
4096 inline bool wxString::iterator::operator<=(const const_iterator
& i
) const
4097 { return i
>= *this; }
4098 inline bool wxString::iterator::operator>=(const const_iterator
& i
) const
4099 { return i
<= *this; }
4101 // comparison with C string in Unicode build
4104 #define wxCMP_CHAR_STRING(p, s, op) wxString(p) op s
4106 wxDEFINE_ALL_COMPARISONS(const char *, const wxString
&, wxCMP_CHAR_STRING
)
4108 #undef wxCMP_CHAR_STRING
4110 #endif // wxUSE_UNICODE
4112 // we also need to provide the operators for comparison with wxCStrData to
4113 // resolve ambiguity between operator(const wxChar *,const wxString &) and
4114 // operator(const wxChar *, const wxChar *) for "p == s.c_str()"
4116 // notice that these are (shallow) pointer comparisons, not (deep) string ones
4117 #define wxCMP_CHAR_CSTRDATA(p, s, op) p op s.AsChar()
4118 #define wxCMP_WCHAR_CSTRDATA(p, s, op) p op s.AsWChar()
4120 wxDEFINE_ALL_COMPARISONS(const wchar_t *, const wxCStrData
&, wxCMP_WCHAR_CSTRDATA
)
4121 wxDEFINE_ALL_COMPARISONS(const char *, const wxCStrData
&, wxCMP_CHAR_CSTRDATA
)
4123 #undef wxCMP_CHAR_CSTRDATA
4124 #undef wxCMP_WCHAR_CSTRDATA
4126 // ---------------------------------------------------------------------------
4127 // Implementation only from here until the end of file
4128 // ---------------------------------------------------------------------------
4130 #if wxUSE_STD_IOSTREAM
4132 #include "wx/iosfwrap.h"
4134 WXDLLIMPEXP_BASE wxSTD ostream
& operator<<(wxSTD ostream
&, const wxString
&);
4135 WXDLLIMPEXP_BASE wxSTD ostream
& operator<<(wxSTD ostream
&, const wxCStrData
&);
4136 WXDLLIMPEXP_BASE wxSTD ostream
& operator<<(wxSTD ostream
&, const wxScopedCharBuffer
&);
4137 #ifndef __BORLANDC__
4138 WXDLLIMPEXP_BASE wxSTD ostream
& operator<<(wxSTD ostream
&, const wxScopedWCharBuffer
&);
4141 #if wxUSE_UNICODE && defined(HAVE_WOSTREAM)
4143 WXDLLIMPEXP_BASE wxSTD wostream
& operator<<(wxSTD wostream
&, const wxString
&);
4144 WXDLLIMPEXP_BASE wxSTD wostream
& operator<<(wxSTD wostream
&, const wxCStrData
&);
4145 WXDLLIMPEXP_BASE wxSTD wostream
& operator<<(wxSTD wostream
&, const wxScopedWCharBuffer
&);
4147 #endif // wxUSE_UNICODE && defined(HAVE_WOSTREAM)
4149 #endif // wxUSE_STD_IOSTREAM
4151 // ---------------------------------------------------------------------------
4152 // wxCStrData implementation
4153 // ---------------------------------------------------------------------------
4155 inline wxCStrData::wxCStrData(char *buf
)
4156 : m_str(new wxString(buf
)), m_offset(0), m_owned(true) {}
4157 inline wxCStrData::wxCStrData(wchar_t *buf
)
4158 : m_str(new wxString(buf
)), m_offset(0), m_owned(true) {}
4160 inline wxCStrData::wxCStrData(const wxCStrData
& data
)
4161 : m_str(data
.m_owned
? new wxString(*data
.m_str
) : data
.m_str
),
4162 m_offset(data
.m_offset
),
4163 m_owned(data
.m_owned
)
4167 inline wxCStrData::~wxCStrData()
4170 delete const_cast<wxString
*>(m_str
); // cast to silence warnings
4173 // AsChar() and AsWChar() implementations simply forward to wxString methods
4175 inline const wchar_t* wxCStrData::AsWChar() const
4177 const wchar_t * const p
=
4178 #if wxUSE_UNICODE_WCHAR
4180 #elif wxUSE_UNICODE_UTF8
4181 m_str
->AsWChar(wxMBConvStrictUTF8());
4183 m_str
->AsWChar(wxConvLibc
);
4186 // in Unicode build the string always has a valid Unicode representation
4187 // and even if a conversion is needed (as in UTF8 case) it can't fail
4189 // but in ANSI build the string contents might be not convertible to
4190 // Unicode using the current locale encoding so we do need to check for
4195 // if conversion fails, return empty string and not NULL to avoid
4196 // crashes in code written with either wxWidgets 2 wxString or
4197 // std::string behaviour in mind: neither of them ever returns NULL
4198 // from its c_str() and so we shouldn't either
4200 // notice that the same is done in AsChar() below and
4201 // wxString::wc_str() and mb_str() for the same reasons
4204 #endif // !wxUSE_UNICODE
4206 return p
+ m_offset
;
4209 inline const char* wxCStrData::AsChar() const
4211 #if wxUSE_UNICODE && !wxUSE_UTF8_LOCALE_ONLY
4212 const char * const p
= m_str
->AsChar(wxConvLibc
);
4215 #else // !wxUSE_UNICODE || wxUSE_UTF8_LOCALE_ONLY
4216 const char * const p
= m_str
->mb_str();
4217 #endif // wxUSE_UNICODE && !wxUSE_UTF8_LOCALE_ONLY
4219 return p
+ m_offset
;
4222 inline wxString
wxCStrData::AsString() const
4224 if ( m_offset
== 0 )
4227 return m_str
->Mid(m_offset
);
4230 inline const wxStringCharType
*wxCStrData::AsInternal() const
4232 #if wxUSE_UNICODE_UTF8
4233 return wxStringOperations::AddToIter(m_str
->wx_str(), m_offset
);
4235 return m_str
->wx_str() + m_offset
;
4239 inline wxUniChar
wxCStrData::operator*() const
4241 if ( m_str
->empty() )
4242 return wxUniChar(wxT('\0'));
4244 return (*m_str
)[m_offset
];
4247 inline wxUniChar
wxCStrData::operator[](size_t n
) const
4249 // NB: we intentionally use operator[] and not at() here because the former
4250 // works for the terminating NUL while the latter does not
4251 return (*m_str
)[m_offset
+ n
];
4254 // ----------------------------------------------------------------------------
4255 // more wxCStrData operators
4256 // ----------------------------------------------------------------------------
4258 // we need to define those to allow "size_t pos = p - s.c_str()" where p is
4259 // some pointer into the string
4260 inline size_t operator-(const char *p
, const wxCStrData
& cs
)
4262 return p
- cs
.AsChar();
4265 inline size_t operator-(const wchar_t *p
, const wxCStrData
& cs
)
4267 return p
- cs
.AsWChar();
4270 // ----------------------------------------------------------------------------
4271 // implementation of wx[W]CharBuffer inline methods using wxCStrData
4272 // ----------------------------------------------------------------------------
4274 // FIXME-UTF8: move this to buffer.h
4275 inline wxCharBuffer::wxCharBuffer(const wxCStrData
& cstr
)
4276 : wxCharTypeBufferBase(cstr
.AsCharBuf())
4280 inline wxWCharBuffer::wxWCharBuffer(const wxCStrData
& cstr
)
4281 : wxCharTypeBufferBase(cstr
.AsWCharBuf())
4285 #if wxUSE_UNICODE_UTF8
4286 // ----------------------------------------------------------------------------
4287 // implementation of wxStringIteratorNode inline methods
4288 // ----------------------------------------------------------------------------
4290 void wxStringIteratorNode::DoSet(const wxString
*str
,
4291 wxStringImpl::const_iterator
*citer
,
4292 wxStringImpl::iterator
*iter
)
4300 m_next
= str
->m_iterators
.ptr
;
4301 const_cast<wxString
*>(m_str
)->m_iterators
.ptr
= this;
4303 m_next
->m_prev
= this;
4311 void wxStringIteratorNode::clear()
4314 m_next
->m_prev
= m_prev
;
4316 m_prev
->m_next
= m_next
;
4317 else if ( m_str
) // first in the list
4318 const_cast<wxString
*>(m_str
)->m_iterators
.ptr
= m_next
;
4320 m_next
= m_prev
= NULL
;
4325 #endif // wxUSE_UNICODE_UTF8
4327 #if WXWIN_COMPATIBILITY_2_8
4328 // a lot of code out there doesn't explicitly include wx/crt.h, but uses
4329 // CRT wrappers that are now declared in wx/wxcrt.h and wx/wxcrtvararg.h,
4330 // so let's include this header now that wxString is defined and it's safe
4335 // ----------------------------------------------------------------------------
4336 // Checks on wxString characters
4337 // ----------------------------------------------------------------------------
4339 template<bool (T
)(const wxUniChar
& c
)>
4340 inline bool wxStringCheck(const wxString
& val
)
4342 for ( wxString::const_iterator i
= val
.begin();
4350 #endif // _WX_WXSTRING_H__