]>
Commit | Line | Data |
---|---|---|
c801d85f | 1 | ///////////////////////////////////////////////////////////////////////////// |
8898456d | 2 | // Name: src/common/string.cpp |
c801d85f | 3 | // Purpose: wxString class |
59059feb | 4 | // Author: Vadim Zeitlin, Ryan Norton |
c801d85f KB |
5 | // Modified by: |
6 | // Created: 29/01/98 | |
7 | // RCS-ID: $Id$ | |
8 | // Copyright: (c) 1998 Vadim Zeitlin <zeitlin@dptmaths.ens-cachan.fr> | |
59059feb | 9 | // (c) 2004 Ryan Norton <wxprojects@comcast.net> |
65571936 | 10 | // Licence: wxWindows licence |
c801d85f KB |
11 | ///////////////////////////////////////////////////////////////////////////// |
12 | ||
c801d85f KB |
13 | // =========================================================================== |
14 | // headers, declarations, constants | |
15 | // =========================================================================== | |
16 | ||
17 | // For compilers that support precompilation, includes "wx.h". | |
18 | #include "wx/wxprec.h" | |
19 | ||
20 | #ifdef __BORLANDC__ | |
8898456d | 21 | #pragma hdrstop |
c801d85f KB |
22 | #endif |
23 | ||
24 | #ifndef WX_PRECOMP | |
8898456d | 25 | #include "wx/string.h" |
2523e9b7 | 26 | #include "wx/wxcrtvararg.h" |
6b769f3d | 27 | #endif |
c801d85f KB |
28 | |
29 | #include <ctype.h> | |
92df97b8 WS |
30 | |
31 | #ifndef __WXWINCE__ | |
32 | #include <errno.h> | |
33 | #endif | |
34 | ||
c801d85f KB |
35 | #include <string.h> |
36 | #include <stdlib.h> | |
9a08c20e | 37 | |
ce3ed50d | 38 | #ifdef __SALFORDC__ |
8898456d | 39 | #include <clib.h> |
ce3ed50d JS |
40 | #endif |
41 | ||
8116a0c5 | 42 | #include "wx/hashmap.h" |
8f93a29f VS |
43 | |
44 | // string handling functions used by wxString: | |
45 | #if wxUSE_UNICODE_UTF8 | |
46 | #define wxStringMemcpy memcpy | |
47 | #define wxStringMemcmp memcmp | |
48 | #define wxStringMemchr memchr | |
49 | #define wxStringStrlen strlen | |
50 | #else | |
51 | #define wxStringMemcpy wxTmemcpy | |
52 | #define wxStringMemcmp wxTmemcmp | |
a7ea63e2 VS |
53 | #define wxStringMemchr wxTmemchr |
54 | #define wxStringStrlen wxStrlen | |
55 | #endif | |
8f93a29f | 56 | |
e87b7833 | 57 | |
a7ea63e2 VS |
58 | // --------------------------------------------------------------------------- |
59 | // static class variables definition | |
60 | // --------------------------------------------------------------------------- | |
e87b7833 | 61 | |
a7ea63e2 VS |
62 | // According to the STL, npos _must_ be (size_t)-1 |
63 | const size_t wxString::npos = (size_t) -1; | |
8f93a29f | 64 | |
a7ea63e2 VS |
65 | // ---------------------------------------------------------------------------- |
66 | // global functions | |
67 | // ---------------------------------------------------------------------------- | |
e87b7833 | 68 | |
a7ea63e2 | 69 | #if wxUSE_STD_IOSTREAM |
8f93a29f | 70 | |
a7ea63e2 | 71 | #include <iostream> |
8f93a29f | 72 | |
a7ea63e2 | 73 | wxSTD ostream& operator<<(wxSTD ostream& os, const wxCStrData& str) |
8f93a29f | 74 | { |
04abe4bc | 75 | // FIXME-UTF8: always, not only if wxUSE_UNICODE |
a7ea63e2 | 76 | #if wxUSE_UNICODE && !defined(__BORLANDC__) |
681e4412 | 77 | return os << (const wchar_t*)str.AsWCharBuf(); |
a7ea63e2 | 78 | #else |
681e4412 | 79 | return os << (const char*)str.AsCharBuf(); |
a7ea63e2 | 80 | #endif |
8f93a29f VS |
81 | } |
82 | ||
04abe4bc VS |
83 | wxSTD ostream& operator<<(wxSTD ostream& os, const wxString& str) |
84 | { | |
85 | return os << str.c_str(); | |
86 | } | |
87 | ||
88 | wxSTD ostream& operator<<(wxSTD ostream& os, const wxCharBuffer& str) | |
89 | { | |
90 | return os << str.data(); | |
91 | } | |
92 | ||
93 | #ifndef __BORLANDC__ | |
94 | wxSTD ostream& operator<<(wxSTD ostream& os, const wxWCharBuffer& str) | |
95 | { | |
96 | return os << str.data(); | |
97 | } | |
98 | #endif | |
99 | ||
a7ea63e2 | 100 | #endif // wxUSE_STD_IOSTREAM |
e87b7833 | 101 | |
81727065 VS |
102 | // =========================================================================== |
103 | // wxString class core | |
104 | // =========================================================================== | |
105 | ||
106 | #if wxUSE_UNICODE_UTF8 | |
107 | ||
81727065 VS |
108 | void wxString::PosLenToImpl(size_t pos, size_t len, |
109 | size_t *implPos, size_t *implLen) const | |
110 | { | |
111 | if ( pos == npos ) | |
112 | *implPos = npos; | |
113 | else | |
114 | { | |
115 | const_iterator i = begin() + pos; | |
cf9a878b | 116 | *implPos = wxStringImpl::const_iterator(i.impl()) - m_impl.begin(); |
81727065 VS |
117 | if ( len == npos ) |
118 | *implLen = npos; | |
119 | else | |
120 | { | |
121 | // too large length is interpreted as "to the end of the string" | |
122 | // FIXME-UTF8: verify this is the case in std::string, assert | |
123 | // otherwise | |
124 | if ( pos + len > length() ) | |
125 | len = length() - pos; | |
126 | ||
cf9a878b | 127 | *implLen = (i + len).impl() - i.impl(); |
81727065 VS |
128 | } |
129 | } | |
130 | } | |
131 | ||
132 | #endif // wxUSE_UNICODE_UTF8 | |
133 | ||
11aac4ba VS |
134 | // ---------------------------------------------------------------------------- |
135 | // wxCStrData converted strings caching | |
136 | // ---------------------------------------------------------------------------- | |
137 | ||
132276cf VS |
138 | // FIXME-UTF8: temporarily disabled because it doesn't work with global |
139 | // string objects; re-enable after fixing this bug and benchmarking | |
140 | // performance to see if using a hash is a good idea at all | |
141 | #if 0 | |
142 | ||
11aac4ba VS |
143 | // For backward compatibility reasons, it must be possible to assign the value |
144 | // returned by wxString::c_str() to a char* or wchar_t* variable and work with | |
145 | // it. Returning wxCharBuffer from (const char*)c_str() wouldn't do the trick, | |
146 | // because the memory would be freed immediately, but it has to be valid as long | |
147 | // as the string is not modified, so that code like this still works: | |
148 | // | |
149 | // const wxChar *s = str.c_str(); | |
150 | // while ( s ) { ... } | |
151 | ||
152 | // FIXME-UTF8: not thread safe! | |
153 | // FIXME-UTF8: we currently clear the cached conversion only when the string is | |
154 | // destroyed, but we should do it when the string is modified, to | |
155 | // keep memory usage down | |
156 | // FIXME-UTF8: we do the conversion every time As[W]Char() is called, but if we | |
157 | // invalidated the cache on every change, we could keep the previous | |
158 | // conversion | |
159 | // FIXME-UTF8: add tracing of usage of these two methods - new code is supposed | |
160 | // to use mb_str() or wc_str() instead of (const [w]char*)c_str() | |
161 | ||
162 | template<typename T> | |
163 | static inline void DeleteStringFromConversionCache(T& hash, const wxString *s) | |
164 | { | |
6c4ebcda | 165 | typename T::iterator i = hash.find(wxConstCast(s, wxString)); |
11aac4ba VS |
166 | if ( i != hash.end() ) |
167 | { | |
168 | free(i->second); | |
169 | hash.erase(i); | |
170 | } | |
171 | } | |
172 | ||
173 | #if wxUSE_UNICODE | |
6c4ebcda VS |
174 | // NB: non-STL implementation doesn't compile with "const wxString*" key type, |
175 | // so we have to use wxString* here and const-cast when used | |
11aac4ba VS |
176 | WX_DECLARE_HASH_MAP(wxString*, char*, wxPointerHash, wxPointerEqual, |
177 | wxStringCharConversionCache); | |
178 | static wxStringCharConversionCache gs_stringsCharCache; | |
179 | ||
180 | const char* wxCStrData::AsChar() const | |
181 | { | |
182 | // remove previously cache value, if any (see FIXMEs above): | |
183 | DeleteStringFromConversionCache(gs_stringsCharCache, m_str); | |
184 | ||
185 | // convert the string and keep it: | |
6c4ebcda VS |
186 | const char *s = gs_stringsCharCache[wxConstCast(m_str, wxString)] = |
187 | m_str->mb_str().release(); | |
11aac4ba VS |
188 | |
189 | return s + m_offset; | |
190 | } | |
191 | #endif // wxUSE_UNICODE | |
192 | ||
193 | #if !wxUSE_UNICODE_WCHAR | |
194 | WX_DECLARE_HASH_MAP(wxString*, wchar_t*, wxPointerHash, wxPointerEqual, | |
195 | wxStringWCharConversionCache); | |
196 | static wxStringWCharConversionCache gs_stringsWCharCache; | |
197 | ||
198 | const wchar_t* wxCStrData::AsWChar() const | |
199 | { | |
200 | // remove previously cache value, if any (see FIXMEs above): | |
201 | DeleteStringFromConversionCache(gs_stringsWCharCache, m_str); | |
202 | ||
203 | // convert the string and keep it: | |
6c4ebcda VS |
204 | const wchar_t *s = gs_stringsWCharCache[wxConstCast(m_str, wxString)] = |
205 | m_str->wc_str().release(); | |
11aac4ba VS |
206 | |
207 | return s + m_offset; | |
208 | } | |
209 | #endif // !wxUSE_UNICODE_WCHAR | |
210 | ||
11aac4ba VS |
211 | wxString::~wxString() |
212 | { | |
213 | #if wxUSE_UNICODE | |
214 | // FIXME-UTF8: do this only if locale is not UTF8 if wxUSE_UNICODE_UTF8 | |
215 | DeleteStringFromConversionCache(gs_stringsCharCache, this); | |
216 | #endif | |
217 | #if !wxUSE_UNICODE_WCHAR | |
218 | DeleteStringFromConversionCache(gs_stringsWCharCache, this); | |
219 | #endif | |
220 | } | |
132276cf VS |
221 | #endif |
222 | ||
111d9948 | 223 | #if wxUSE_UNICODE && !wxUSE_UTF8_LOCALE_ONLY |
132276cf VS |
224 | const char* wxCStrData::AsChar() const |
225 | { | |
111d9948 VS |
226 | #if wxUSE_UNICODE_UTF8 |
227 | if ( wxLocaleIsUtf8 ) | |
228 | return AsInternal(); | |
229 | #endif | |
230 | // under non-UTF8 locales, we have to convert the internal UTF-8 | |
231 | // representation using wxConvLibc and cache the result | |
232 | ||
132276cf | 233 | wxString *str = wxConstCast(m_str, wxString); |
05f32fc3 VS |
234 | |
235 | // convert the string: | |
236 | wxCharBuffer buf(str->mb_str()); | |
237 | ||
238 | // FIXME-UTF8: do the conversion in-place in the existing buffer | |
239 | if ( str->m_convertedToChar && | |
240 | strlen(buf) == strlen(str->m_convertedToChar) ) | |
241 | { | |
242 | // keep the same buffer for as long as possible, so that several calls | |
243 | // to c_str() in a row still work: | |
244 | strcpy(str->m_convertedToChar, buf); | |
245 | } | |
246 | else | |
247 | { | |
248 | str->m_convertedToChar = buf.release(); | |
249 | } | |
250 | ||
251 | // and keep it: | |
132276cf VS |
252 | return str->m_convertedToChar + m_offset; |
253 | } | |
111d9948 | 254 | #endif // wxUSE_UNICODE && !wxUSE_UTF8_LOCALE_ONLY |
132276cf VS |
255 | |
256 | #if !wxUSE_UNICODE_WCHAR | |
257 | const wchar_t* wxCStrData::AsWChar() const | |
258 | { | |
259 | wxString *str = wxConstCast(m_str, wxString); | |
05f32fc3 VS |
260 | |
261 | // convert the string: | |
262 | wxWCharBuffer buf(str->wc_str()); | |
263 | ||
264 | // FIXME-UTF8: do the conversion in-place in the existing buffer | |
265 | if ( str->m_convertedToWChar && | |
266 | wxWcslen(buf) == wxWcslen(str->m_convertedToWChar) ) | |
267 | { | |
268 | // keep the same buffer for as long as possible, so that several calls | |
269 | // to c_str() in a row still work: | |
270 | memcpy(str->m_convertedToWChar, buf, sizeof(wchar_t) * wxWcslen(buf)); | |
271 | } | |
272 | else | |
273 | { | |
274 | str->m_convertedToWChar = buf.release(); | |
275 | } | |
276 | ||
277 | // and keep it: | |
132276cf VS |
278 | return str->m_convertedToWChar + m_offset; |
279 | } | |
280 | #endif // !wxUSE_UNICODE_WCHAR | |
281 | ||
282 | // =========================================================================== | |
283 | // wxString class core | |
284 | // =========================================================================== | |
285 | ||
286 | // --------------------------------------------------------------------------- | |
287 | // construction and conversion | |
288 | // --------------------------------------------------------------------------- | |
11aac4ba | 289 | |
81727065 | 290 | #if wxUSE_UNICODE_WCHAR |
8f93a29f VS |
291 | /* static */ |
292 | wxString::SubstrBufFromMB wxString::ConvertStr(const char *psz, size_t nLength, | |
04abe4bc | 293 | const wxMBConv& conv) |
8f93a29f VS |
294 | { |
295 | // anything to do? | |
296 | if ( !psz || nLength == 0 ) | |
81727065 | 297 | return SubstrBufFromMB(L"", 0); |
8f93a29f VS |
298 | |
299 | if ( nLength == npos ) | |
300 | nLength = wxNO_LEN; | |
301 | ||
302 | size_t wcLen; | |
303 | wxWCharBuffer wcBuf(conv.cMB2WC(psz, nLength, &wcLen)); | |
304 | if ( !wcLen ) | |
81727065 | 305 | return SubstrBufFromMB(_T(""), 0); |
8f93a29f VS |
306 | else |
307 | return SubstrBufFromMB(wcBuf, wcLen); | |
308 | } | |
81727065 VS |
309 | #endif // wxUSE_UNICODE_WCHAR |
310 | ||
311 | #if wxUSE_UNICODE_UTF8 | |
312 | /* static */ | |
313 | wxString::SubstrBufFromMB wxString::ConvertStr(const char *psz, size_t nLength, | |
314 | const wxMBConv& conv) | |
315 | { | |
81727065 VS |
316 | // anything to do? |
317 | if ( !psz || nLength == 0 ) | |
318 | return SubstrBufFromMB("", 0); | |
319 | ||
111d9948 VS |
320 | // if psz is already in UTF-8, we don't have to do the roundtrip to |
321 | // wchar_t* and back: | |
322 | if ( conv.IsUTF8() ) | |
323 | { | |
324 | // we need to validate the input because UTF8 iterators assume valid | |
325 | // UTF-8 sequence and psz may be invalid: | |
326 | if ( wxStringOperations::IsValidUtf8String(psz, nLength) ) | |
327 | { | |
328 | return SubstrBufFromMB(wxCharBuffer::CreateNonOwned(psz), nLength); | |
329 | } | |
330 | // else: do the roundtrip through wchar_t* | |
331 | } | |
332 | ||
81727065 VS |
333 | if ( nLength == npos ) |
334 | nLength = wxNO_LEN; | |
335 | ||
336 | // first convert to wide string: | |
337 | size_t wcLen; | |
338 | wxWCharBuffer wcBuf(conv.cMB2WC(psz, nLength, &wcLen)); | |
339 | if ( !wcLen ) | |
340 | return SubstrBufFromMB("", 0); | |
341 | ||
342 | // and then to UTF-8: | |
5487ff0f | 343 | SubstrBufFromMB buf(ConvertStr(wcBuf, wcLen, wxMBConvUTF8())); |
81727065 VS |
344 | // widechar -> UTF-8 conversion isn't supposed to ever fail: |
345 | wxASSERT_MSG( buf.data, _T("conversion to UTF-8 failed") ); | |
346 | ||
347 | return buf; | |
348 | } | |
349 | #endif // wxUSE_UNICODE_UTF8 | |
350 | ||
351 | #if wxUSE_UNICODE_UTF8 || !wxUSE_UNICODE | |
8f93a29f VS |
352 | /* static */ |
353 | wxString::SubstrBufFromWC wxString::ConvertStr(const wchar_t *pwz, size_t nLength, | |
04abe4bc | 354 | const wxMBConv& conv) |
8f93a29f VS |
355 | { |
356 | // anything to do? | |
357 | if ( !pwz || nLength == 0 ) | |
81727065 | 358 | return SubstrBufFromWC("", 0); |
8f93a29f VS |
359 | |
360 | if ( nLength == npos ) | |
361 | nLength = wxNO_LEN; | |
362 | ||
363 | size_t mbLen; | |
364 | wxCharBuffer mbBuf(conv.cWC2MB(pwz, nLength, &mbLen)); | |
365 | if ( !mbLen ) | |
81727065 | 366 | return SubstrBufFromWC("", 0); |
8f93a29f VS |
367 | else |
368 | return SubstrBufFromWC(mbBuf, mbLen); | |
369 | } | |
81727065 | 370 | #endif // wxUSE_UNICODE_UTF8 || !wxUSE_UNICODE |
8f93a29f VS |
371 | |
372 | ||
81727065 | 373 | #if wxUSE_UNICODE_WCHAR |
e87b7833 | 374 | |
06386448 | 375 | //Convert wxString in Unicode mode to a multi-byte string |
830f8f11 | 376 | const wxCharBuffer wxString::mb_str(const wxMBConv& conv) const |
265d5cce | 377 | { |
81727065 | 378 | return conv.cWC2MB(wx_str(), length() + 1 /* size, not length */, NULL); |
e87b7833 MB |
379 | } |
380 | ||
81727065 | 381 | #elif wxUSE_UNICODE_UTF8 |
e87b7833 | 382 | |
81727065 VS |
383 | const wxWCharBuffer wxString::wc_str() const |
384 | { | |
5487ff0f VS |
385 | return wxMBConvUTF8().cMB2WC(m_impl.c_str(), |
386 | m_impl.length() + 1 /* size, not length */, | |
387 | NULL); | |
81727065 VS |
388 | } |
389 | ||
390 | const wxCharBuffer wxString::mb_str(const wxMBConv& conv) const | |
391 | { | |
111d9948 VS |
392 | if ( conv.IsUTF8() ) |
393 | return wxCharBuffer::CreateNonOwned(m_impl.c_str()); | |
394 | ||
81727065 VS |
395 | // FIXME-UTF8: use wc_str() here once we have buffers with length |
396 | ||
397 | size_t wcLen; | |
398 | wxWCharBuffer wcBuf( | |
5487ff0f VS |
399 | wxMBConvUTF8().cMB2WC(m_impl.c_str(), |
400 | m_impl.length() + 1 /* size, not length */, | |
401 | &wcLen)); | |
81727065 VS |
402 | if ( !wcLen ) |
403 | return wxCharBuffer(""); | |
404 | ||
405 | return conv.cWC2MB(wcBuf, wcLen, NULL); | |
406 | } | |
407 | ||
408 | #else // ANSI | |
eec47cc6 | 409 | |
7663d0d4 | 410 | //Converts this string to a wide character string if unicode |
06386448 | 411 | //mode is not enabled and wxUSE_WCHAR_T is enabled |
830f8f11 | 412 | const wxWCharBuffer wxString::wc_str(const wxMBConv& conv) const |
265d5cce | 413 | { |
81727065 | 414 | return conv.cMB2WC(wx_str(), length() + 1 /* size, not length */, NULL); |
265d5cce | 415 | } |
7663d0d4 | 416 | |
e87b7833 MB |
417 | #endif // Unicode/ANSI |
418 | ||
419 | // shrink to minimal size (releasing extra memory) | |
420 | bool wxString::Shrink() | |
421 | { | |
422 | wxString tmp(begin(), end()); | |
423 | swap(tmp); | |
424 | return tmp.length() == length(); | |
425 | } | |
426 | ||
d8a4b666 | 427 | // deprecated compatibility code: |
a7ea63e2 | 428 | #if WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8 |
c87a0bc8 | 429 | wxStringCharType *wxString::GetWriteBuf(size_t nLen) |
d8a4b666 VS |
430 | { |
431 | return DoGetWriteBuf(nLen); | |
432 | } | |
433 | ||
434 | void wxString::UngetWriteBuf() | |
435 | { | |
436 | DoUngetWriteBuf(); | |
437 | } | |
438 | ||
439 | void wxString::UngetWriteBuf(size_t nLen) | |
440 | { | |
441 | DoUngetWriteBuf(nLen); | |
442 | } | |
a7ea63e2 | 443 | #endif // WXWIN_COMPATIBILITY_2_8 && !wxUSE_STL_BASED_WXSTRING && !wxUSE_UNICODE_UTF8 |
e87b7833 | 444 | |
d8a4b666 | 445 | |
e87b7833 MB |
446 | // --------------------------------------------------------------------------- |
447 | // data access | |
448 | // --------------------------------------------------------------------------- | |
449 | ||
450 | // all functions are inline in string.h | |
451 | ||
452 | // --------------------------------------------------------------------------- | |
e8f59039 | 453 | // concatenation operators |
e87b7833 MB |
454 | // --------------------------------------------------------------------------- |
455 | ||
c801d85f | 456 | /* |
c801d85f KB |
457 | * concatenation functions come in 5 flavours: |
458 | * string + string | |
459 | * char + string and string + char | |
460 | * C str + string and string + C str | |
461 | */ | |
462 | ||
b1801e0e | 463 | wxString operator+(const wxString& str1, const wxString& str2) |
c801d85f | 464 | { |
992527a5 | 465 | #if !wxUSE_STL_BASED_WXSTRING |
8f93a29f VS |
466 | wxASSERT( str1.IsValid() ); |
467 | wxASSERT( str2.IsValid() ); | |
e87b7833 | 468 | #endif |
097c080b | 469 | |
3458e408 WS |
470 | wxString s = str1; |
471 | s += str2; | |
3168a13f | 472 | |
3458e408 | 473 | return s; |
c801d85f KB |
474 | } |
475 | ||
c9f78968 | 476 | wxString operator+(const wxString& str, wxUniChar ch) |
c801d85f | 477 | { |
992527a5 | 478 | #if !wxUSE_STL_BASED_WXSTRING |
8f93a29f | 479 | wxASSERT( str.IsValid() ); |
e87b7833 | 480 | #endif |
3168a13f | 481 | |
3458e408 WS |
482 | wxString s = str; |
483 | s += ch; | |
097c080b | 484 | |
3458e408 | 485 | return s; |
c801d85f KB |
486 | } |
487 | ||
c9f78968 | 488 | wxString operator+(wxUniChar ch, const wxString& str) |
c801d85f | 489 | { |
992527a5 | 490 | #if !wxUSE_STL_BASED_WXSTRING |
8f93a29f | 491 | wxASSERT( str.IsValid() ); |
e87b7833 | 492 | #endif |
097c080b | 493 | |
3458e408 WS |
494 | wxString s = ch; |
495 | s += str; | |
3168a13f | 496 | |
3458e408 | 497 | return s; |
c801d85f KB |
498 | } |
499 | ||
8f93a29f | 500 | wxString operator+(const wxString& str, const char *psz) |
c801d85f | 501 | { |
992527a5 | 502 | #if !wxUSE_STL_BASED_WXSTRING |
8f93a29f | 503 | wxASSERT( str.IsValid() ); |
e87b7833 | 504 | #endif |
097c080b | 505 | |
3458e408 | 506 | wxString s; |
8f93a29f | 507 | if ( !s.Alloc(strlen(psz) + str.length()) ) { |
3458e408 WS |
508 | wxFAIL_MSG( _T("out of memory in wxString::operator+") ); |
509 | } | |
510 | s += str; | |
511 | s += psz; | |
3168a13f | 512 | |
3458e408 | 513 | return s; |
c801d85f KB |
514 | } |
515 | ||
8f93a29f | 516 | wxString operator+(const wxString& str, const wchar_t *pwz) |
c801d85f | 517 | { |
992527a5 | 518 | #if !wxUSE_STL_BASED_WXSTRING |
8f93a29f VS |
519 | wxASSERT( str.IsValid() ); |
520 | #endif | |
521 | ||
522 | wxString s; | |
523 | if ( !s.Alloc(wxWcslen(pwz) + str.length()) ) { | |
524 | wxFAIL_MSG( _T("out of memory in wxString::operator+") ); | |
525 | } | |
526 | s += str; | |
527 | s += pwz; | |
528 | ||
529 | return s; | |
530 | } | |
531 | ||
532 | wxString operator+(const char *psz, const wxString& str) | |
533 | { | |
a7ea63e2 VS |
534 | #if !wxUSE_STL_BASED_WXSTRING |
535 | wxASSERT( str.IsValid() ); | |
536 | #endif | |
537 | ||
538 | wxString s; | |
539 | if ( !s.Alloc(strlen(psz) + str.length()) ) { | |
540 | wxFAIL_MSG( _T("out of memory in wxString::operator+") ); | |
541 | } | |
542 | s = psz; | |
543 | s += str; | |
544 | ||
545 | return s; | |
546 | } | |
547 | ||
548 | wxString operator+(const wchar_t *pwz, const wxString& str) | |
549 | { | |
550 | #if !wxUSE_STL_BASED_WXSTRING | |
551 | wxASSERT( str.IsValid() ); | |
552 | #endif | |
553 | ||
554 | wxString s; | |
555 | if ( !s.Alloc(wxWcslen(pwz) + str.length()) ) { | |
556 | wxFAIL_MSG( _T("out of memory in wxString::operator+") ); | |
557 | } | |
558 | s = pwz; | |
559 | s += str; | |
560 | ||
561 | return s; | |
562 | } | |
563 | ||
564 | // --------------------------------------------------------------------------- | |
565 | // string comparison | |
566 | // --------------------------------------------------------------------------- | |
567 | ||
52de37c7 VS |
568 | bool wxString::IsSameAs(wxUniChar c, bool compareWithCase) const |
569 | { | |
570 | return (length() == 1) && (compareWithCase ? GetChar(0u) == c | |
571 | : wxToupper(GetChar(0u)) == wxToupper(c)); | |
572 | } | |
573 | ||
a7ea63e2 VS |
574 | #ifdef HAVE_STD_STRING_COMPARE |
575 | ||
576 | // NB: Comparison code (both if HAVE_STD_STRING_COMPARE and if not) works with | |
577 | // UTF-8 encoded strings too, thanks to UTF-8's design which allows us to | |
578 | // sort strings in characters code point order by sorting the byte sequence | |
579 | // in byte values order (i.e. what strcmp() and memcmp() do). | |
580 | ||
581 | int wxString::compare(const wxString& str) const | |
582 | { | |
583 | return m_impl.compare(str.m_impl); | |
584 | } | |
585 | ||
586 | int wxString::compare(size_t nStart, size_t nLen, | |
587 | const wxString& str) const | |
588 | { | |
589 | size_t pos, len; | |
590 | PosLenToImpl(nStart, nLen, &pos, &len); | |
591 | return m_impl.compare(pos, len, str.m_impl); | |
592 | } | |
593 | ||
594 | int wxString::compare(size_t nStart, size_t nLen, | |
595 | const wxString& str, | |
596 | size_t nStart2, size_t nLen2) const | |
597 | { | |
598 | size_t pos, len; | |
599 | PosLenToImpl(nStart, nLen, &pos, &len); | |
600 | ||
601 | size_t pos2, len2; | |
602 | str.PosLenToImpl(nStart2, nLen2, &pos2, &len2); | |
603 | ||
604 | return m_impl.compare(pos, len, str.m_impl, pos2, len2); | |
605 | } | |
606 | ||
607 | int wxString::compare(const char* sz) const | |
608 | { | |
609 | return m_impl.compare(ImplStr(sz)); | |
610 | } | |
611 | ||
612 | int wxString::compare(const wchar_t* sz) const | |
613 | { | |
614 | return m_impl.compare(ImplStr(sz)); | |
615 | } | |
616 | ||
617 | int wxString::compare(size_t nStart, size_t nLen, | |
618 | const char* sz, size_t nCount) const | |
619 | { | |
620 | size_t pos, len; | |
621 | PosLenToImpl(nStart, nLen, &pos, &len); | |
622 | ||
623 | SubstrBufFromMB str(ImplStr(sz, nCount)); | |
624 | ||
625 | return m_impl.compare(pos, len, str.data, str.len); | |
626 | } | |
627 | ||
628 | int wxString::compare(size_t nStart, size_t nLen, | |
629 | const wchar_t* sz, size_t nCount) const | |
630 | { | |
631 | size_t pos, len; | |
632 | PosLenToImpl(nStart, nLen, &pos, &len); | |
633 | ||
634 | SubstrBufFromWC str(ImplStr(sz, nCount)); | |
635 | ||
636 | return m_impl.compare(pos, len, str.data, str.len); | |
637 | } | |
638 | ||
639 | #else // !HAVE_STD_STRING_COMPARE | |
640 | ||
641 | static inline int wxDoCmp(const wxStringCharType* s1, size_t l1, | |
642 | const wxStringCharType* s2, size_t l2) | |
643 | { | |
644 | if( l1 == l2 ) | |
645 | return wxStringMemcmp(s1, s2, l1); | |
646 | else if( l1 < l2 ) | |
647 | { | |
648 | int ret = wxStringMemcmp(s1, s2, l1); | |
649 | return ret == 0 ? -1 : ret; | |
650 | } | |
651 | else | |
652 | { | |
653 | int ret = wxStringMemcmp(s1, s2, l2); | |
654 | return ret == 0 ? +1 : ret; | |
655 | } | |
656 | } | |
657 | ||
658 | int wxString::compare(const wxString& str) const | |
659 | { | |
660 | return ::wxDoCmp(m_impl.data(), m_impl.length(), | |
661 | str.m_impl.data(), str.m_impl.length()); | |
662 | } | |
663 | ||
664 | int wxString::compare(size_t nStart, size_t nLen, | |
665 | const wxString& str) const | |
666 | { | |
667 | wxASSERT(nStart <= length()); | |
668 | size_type strLen = length() - nStart; | |
669 | nLen = strLen < nLen ? strLen : nLen; | |
670 | ||
671 | size_t pos, len; | |
672 | PosLenToImpl(nStart, nLen, &pos, &len); | |
673 | ||
674 | return ::wxDoCmp(m_impl.data() + pos, len, | |
675 | str.m_impl.data(), str.m_impl.length()); | |
676 | } | |
677 | ||
678 | int wxString::compare(size_t nStart, size_t nLen, | |
679 | const wxString& str, | |
680 | size_t nStart2, size_t nLen2) const | |
681 | { | |
682 | wxASSERT(nStart <= length()); | |
683 | wxASSERT(nStart2 <= str.length()); | |
684 | size_type strLen = length() - nStart, | |
685 | strLen2 = str.length() - nStart2; | |
686 | nLen = strLen < nLen ? strLen : nLen; | |
687 | nLen2 = strLen2 < nLen2 ? strLen2 : nLen2; | |
688 | ||
689 | size_t pos, len; | |
690 | PosLenToImpl(nStart, nLen, &pos, &len); | |
691 | size_t pos2, len2; | |
692 | str.PosLenToImpl(nStart2, nLen2, &pos2, &len2); | |
693 | ||
694 | return ::wxDoCmp(m_impl.data() + pos, len, | |
695 | str.m_impl.data() + pos2, len2); | |
696 | } | |
697 | ||
698 | int wxString::compare(const char* sz) const | |
699 | { | |
700 | SubstrBufFromMB str(ImplStr(sz, npos)); | |
701 | if ( str.len == npos ) | |
702 | str.len = wxStringStrlen(str.data); | |
703 | return ::wxDoCmp(m_impl.data(), m_impl.length(), str.data, str.len); | |
704 | } | |
705 | ||
706 | int wxString::compare(const wchar_t* sz) const | |
707 | { | |
708 | SubstrBufFromWC str(ImplStr(sz, npos)); | |
709 | if ( str.len == npos ) | |
710 | str.len = wxStringStrlen(str.data); | |
711 | return ::wxDoCmp(m_impl.data(), m_impl.length(), str.data, str.len); | |
712 | } | |
713 | ||
714 | int wxString::compare(size_t nStart, size_t nLen, | |
715 | const char* sz, size_t nCount) const | |
716 | { | |
717 | wxASSERT(nStart <= length()); | |
718 | size_type strLen = length() - nStart; | |
719 | nLen = strLen < nLen ? strLen : nLen; | |
097c080b | 720 | |
a7ea63e2 VS |
721 | size_t pos, len; |
722 | PosLenToImpl(nStart, nLen, &pos, &len); | |
3168a13f | 723 | |
a7ea63e2 VS |
724 | SubstrBufFromMB str(ImplStr(sz, nCount)); |
725 | if ( str.len == npos ) | |
726 | str.len = wxStringStrlen(str.data); | |
727 | ||
728 | return ::wxDoCmp(m_impl.data() + pos, len, str.data, str.len); | |
c801d85f KB |
729 | } |
730 | ||
a7ea63e2 VS |
731 | int wxString::compare(size_t nStart, size_t nLen, |
732 | const wchar_t* sz, size_t nCount) const | |
8f93a29f | 733 | { |
a7ea63e2 VS |
734 | wxASSERT(nStart <= length()); |
735 | size_type strLen = length() - nStart; | |
736 | nLen = strLen < nLen ? strLen : nLen; | |
8f93a29f | 737 | |
a7ea63e2 VS |
738 | size_t pos, len; |
739 | PosLenToImpl(nStart, nLen, &pos, &len); | |
8f93a29f | 740 | |
a7ea63e2 VS |
741 | SubstrBufFromWC str(ImplStr(sz, nCount)); |
742 | if ( str.len == npos ) | |
743 | str.len = wxStringStrlen(str.data); | |
744 | ||
745 | return ::wxDoCmp(m_impl.data() + pos, len, str.data, str.len); | |
8f93a29f VS |
746 | } |
747 | ||
a7ea63e2 VS |
748 | #endif // HAVE_STD_STRING_COMPARE/!HAVE_STD_STRING_COMPARE |
749 | ||
750 | ||
8f93a29f VS |
751 | // --------------------------------------------------------------------------- |
752 | // find_{first,last}_[not]_of functions | |
753 | // --------------------------------------------------------------------------- | |
754 | ||
755 | #if !wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8 | |
c801d85f | 756 | |
8f93a29f VS |
757 | // NB: All these functions are implemented with the argument being wxChar*, |
758 | // i.e. widechar string in any Unicode build, even though native string | |
759 | // representation is char* in the UTF-8 build. This is because we couldn't | |
760 | // use memchr() to determine if a character is in a set encoded as UTF-8. | |
761 | ||
762 | size_t wxString::find_first_of(const wxChar* sz, size_t nStart) const | |
dcb68102 | 763 | { |
8f93a29f | 764 | return find_first_of(sz, nStart, wxStrlen(sz)); |
dcb68102 RN |
765 | } |
766 | ||
8f93a29f | 767 | size_t wxString::find_first_not_of(const wxChar* sz, size_t nStart) const |
dcb68102 | 768 | { |
8f93a29f | 769 | return find_first_not_of(sz, nStart, wxStrlen(sz)); |
dcb68102 RN |
770 | } |
771 | ||
8f93a29f | 772 | size_t wxString::find_first_of(const wxChar* sz, size_t nStart, size_t n) const |
dcb68102 | 773 | { |
8f93a29f | 774 | wxASSERT_MSG( nStart <= length(), _T("invalid index") ); |
dcb68102 | 775 | |
8f93a29f VS |
776 | size_t idx = nStart; |
777 | for ( const_iterator i = begin() + nStart; i != end(); ++idx, ++i ) | |
dcb68102 | 778 | { |
8f93a29f VS |
779 | if ( wxTmemchr(sz, *i, n) ) |
780 | return idx; | |
dcb68102 | 781 | } |
8f93a29f VS |
782 | |
783 | return npos; | |
784 | } | |
785 | ||
786 | size_t wxString::find_first_not_of(const wxChar* sz, size_t nStart, size_t n) const | |
787 | { | |
788 | wxASSERT_MSG( nStart <= length(), _T("invalid index") ); | |
789 | ||
790 | size_t idx = nStart; | |
791 | for ( const_iterator i = begin() + nStart; i != end(); ++idx, ++i ) | |
dcb68102 | 792 | { |
8f93a29f VS |
793 | if ( !wxTmemchr(sz, *i, n) ) |
794 | return idx; | |
795 | } | |
796 | ||
797 | return npos; | |
798 | } | |
799 | ||
800 | ||
801 | size_t wxString::find_last_of(const wxChar* sz, size_t nStart) const | |
802 | { | |
803 | return find_last_of(sz, nStart, wxStrlen(sz)); | |
804 | } | |
805 | ||
806 | size_t wxString::find_last_not_of(const wxChar* sz, size_t nStart) const | |
807 | { | |
808 | return find_last_not_of(sz, nStart, wxStrlen(sz)); | |
809 | } | |
810 | ||
811 | size_t wxString::find_last_of(const wxChar* sz, size_t nStart, size_t n) const | |
812 | { | |
813 | size_t len = length(); | |
814 | ||
815 | if ( nStart == npos ) | |
816 | { | |
817 | nStart = len - 1; | |
dcb68102 | 818 | } |
2c09fb3b | 819 | else |
dcb68102 | 820 | { |
8f93a29f | 821 | wxASSERT_MSG( nStart <= len, _T("invalid index") ); |
dcb68102 | 822 | } |
8f93a29f VS |
823 | |
824 | size_t idx = nStart; | |
825 | for ( const_reverse_iterator i = rbegin() + (len - nStart - 1); | |
826 | i != rend(); --idx, ++i ) | |
827 | { | |
828 | if ( wxTmemchr(sz, *i, n) ) | |
829 | return idx; | |
830 | } | |
831 | ||
832 | return npos; | |
dcb68102 RN |
833 | } |
834 | ||
8f93a29f | 835 | size_t wxString::find_last_not_of(const wxChar* sz, size_t nStart, size_t n) const |
dcb68102 | 836 | { |
8f93a29f VS |
837 | size_t len = length(); |
838 | ||
839 | if ( nStart == npos ) | |
840 | { | |
841 | nStart = len - 1; | |
842 | } | |
843 | else | |
844 | { | |
845 | wxASSERT_MSG( nStart <= len, _T("invalid index") ); | |
846 | } | |
847 | ||
848 | size_t idx = nStart; | |
849 | for ( const_reverse_iterator i = rbegin() + (len - nStart - 1); | |
850 | i != rend(); --idx, ++i ) | |
851 | { | |
852 | if ( !wxTmemchr(sz, *i, n) ) | |
853 | return idx; | |
854 | } | |
855 | ||
856 | return npos; | |
dcb68102 RN |
857 | } |
858 | ||
8f93a29f | 859 | size_t wxString::find_first_not_of(wxUniChar ch, size_t nStart) const |
dcb68102 | 860 | { |
8f93a29f VS |
861 | wxASSERT_MSG( nStart <= length(), _T("invalid index") ); |
862 | ||
863 | size_t idx = nStart; | |
864 | for ( const_iterator i = begin() + nStart; i != end(); ++idx, ++i ) | |
865 | { | |
866 | if ( *i != ch ) | |
867 | return idx; | |
868 | } | |
869 | ||
870 | return npos; | |
871 | } | |
872 | ||
873 | size_t wxString::find_last_not_of(wxUniChar ch, size_t nStart) const | |
874 | { | |
875 | size_t len = length(); | |
876 | ||
877 | if ( nStart == npos ) | |
878 | { | |
879 | nStart = len - 1; | |
880 | } | |
881 | else | |
882 | { | |
883 | wxASSERT_MSG( nStart <= len, _T("invalid index") ); | |
884 | } | |
885 | ||
886 | size_t idx = nStart; | |
887 | for ( const_reverse_iterator i = rbegin() + (len - nStart - 1); | |
888 | i != rend(); --idx, ++i ) | |
889 | { | |
890 | if ( *i != ch ) | |
891 | return idx; | |
892 | } | |
893 | ||
894 | return npos; | |
895 | } | |
896 | ||
897 | // the functions above were implemented for wchar_t* arguments in Unicode | |
898 | // build and char* in ANSI build; below are implementations for the other | |
899 | // version: | |
900 | #if wxUSE_UNICODE | |
901 | #define wxOtherCharType char | |
902 | #define STRCONV (const wxChar*)wxConvLibc.cMB2WC | |
903 | #else | |
904 | #define wxOtherCharType wchar_t | |
905 | #define STRCONV (const wxChar*)wxConvLibc.cWC2MB | |
906 | #endif | |
907 | ||
908 | size_t wxString::find_first_of(const wxOtherCharType* sz, size_t nStart) const | |
909 | { return find_first_of(STRCONV(sz), nStart); } | |
910 | ||
911 | size_t wxString::find_first_of(const wxOtherCharType* sz, size_t nStart, | |
912 | size_t n) const | |
913 | { return find_first_of(STRCONV(sz, n, NULL), nStart, n); } | |
914 | size_t wxString::find_last_of(const wxOtherCharType* sz, size_t nStart) const | |
915 | { return find_last_of(STRCONV(sz), nStart); } | |
916 | size_t wxString::find_last_of(const wxOtherCharType* sz, size_t nStart, | |
917 | size_t n) const | |
918 | { return find_last_of(STRCONV(sz, n, NULL), nStart, n); } | |
919 | size_t wxString::find_first_not_of(const wxOtherCharType* sz, size_t nStart) const | |
920 | { return find_first_not_of(STRCONV(sz), nStart); } | |
921 | size_t wxString::find_first_not_of(const wxOtherCharType* sz, size_t nStart, | |
922 | size_t n) const | |
923 | { return find_first_not_of(STRCONV(sz, n, NULL), nStart, n); } | |
924 | size_t wxString::find_last_not_of(const wxOtherCharType* sz, size_t nStart) const | |
925 | { return find_last_not_of(STRCONV(sz), nStart); } | |
926 | size_t wxString::find_last_not_of(const wxOtherCharType* sz, size_t nStart, | |
927 | size_t n) const | |
928 | { return find_last_not_of(STRCONV(sz, n, NULL), nStart, n); } | |
929 | ||
930 | #undef wxOtherCharType | |
931 | #undef STRCONV | |
932 | ||
933 | #endif // !wxUSE_STL_BASED_WXSTRING || wxUSE_UNICODE_UTF8 | |
934 | ||
935 | // =========================================================================== | |
936 | // other common string functions | |
937 | // =========================================================================== | |
938 | ||
939 | int wxString::CmpNoCase(const wxString& s) const | |
940 | { | |
941 | // FIXME-UTF8: use wxUniChar::ToLower/ToUpper once added | |
942 | ||
943 | size_t idx = 0; | |
944 | const_iterator i1 = begin(); | |
945 | const_iterator end1 = end(); | |
946 | const_iterator i2 = s.begin(); | |
947 | const_iterator end2 = s.end(); | |
948 | ||
949 | for ( ; i1 != end1 && i2 != end2; ++idx, ++i1, ++i2 ) | |
950 | { | |
951 | wxUniChar lower1 = (wxChar)wxTolower(*i1); | |
952 | wxUniChar lower2 = (wxChar)wxTolower(*i2); | |
953 | if ( lower1 != lower2 ) | |
954 | return lower1 < lower2 ? -1 : 1; | |
955 | } | |
956 | ||
957 | size_t len1 = length(); | |
958 | size_t len2 = s.length(); | |
dcb68102 | 959 | |
8f93a29f VS |
960 | if ( len1 < len2 ) |
961 | return -1; | |
962 | else if ( len1 > len2 ) | |
963 | return 1; | |
964 | return 0; | |
dcb68102 RN |
965 | } |
966 | ||
967 | ||
b1ac3b56 | 968 | #if wxUSE_UNICODE |
e015c2a3 | 969 | |
cf6bedce SC |
970 | #ifdef __MWERKS__ |
971 | #ifndef __SCHAR_MAX__ | |
972 | #define __SCHAR_MAX__ 127 | |
973 | #endif | |
974 | #endif | |
975 | ||
e015c2a3 | 976 | wxString wxString::FromAscii(const char *ascii) |
b1ac3b56 RR |
977 | { |
978 | if (!ascii) | |
979 | return wxEmptyString; | |
e015c2a3 | 980 | |
c1eada83 | 981 | size_t len = strlen(ascii); |
b1ac3b56 | 982 | wxString res; |
e015c2a3 VZ |
983 | |
984 | if ( len ) | |
985 | { | |
c1eada83 VS |
986 | wxImplStringBuffer buf(res, len); |
987 | wxStringCharType *dest = buf; | |
e015c2a3 VZ |
988 | |
989 | for ( ;; ) | |
990 | { | |
c1eada83 VS |
991 | unsigned char c = (unsigned char)*ascii++; |
992 | wxASSERT_MSG( c < 0x80, | |
993 | _T("Non-ASCII value passed to FromAscii().") ); | |
994 | ||
995 | *dest++ = (wchar_t)c; | |
996 | ||
997 | if ( c == '\0' ) | |
998 | break; | |
e015c2a3 VZ |
999 | } |
1000 | } | |
1001 | ||
b1ac3b56 RR |
1002 | return res; |
1003 | } | |
1004 | ||
2b5f62a0 VZ |
1005 | wxString wxString::FromAscii(const char ascii) |
1006 | { | |
1007 | // What do we do with '\0' ? | |
1008 | ||
c1eada83 | 1009 | unsigned char c = (unsigned char)ascii; |
8760bc65 | 1010 | |
c1eada83 VS |
1011 | wxASSERT_MSG( c < 0x80, _T("Non-ASCII value passed to FromAscii().") ); |
1012 | ||
1013 | // NB: the cast to wchar_t causes interpretation of 'ascii' as Latin1 value | |
1014 | return wxString(wxUniChar((wchar_t)c)); | |
2b5f62a0 VZ |
1015 | } |
1016 | ||
b1ac3b56 RR |
1017 | const wxCharBuffer wxString::ToAscii() const |
1018 | { | |
e015c2a3 VZ |
1019 | // this will allocate enough space for the terminating NUL too |
1020 | wxCharBuffer buffer(length()); | |
6e394fc6 | 1021 | char *dest = buffer.data(); |
e015c2a3 | 1022 | |
c1eada83 | 1023 | for ( const_iterator i = begin(); i != end(); ++i ) |
b1ac3b56 | 1024 | { |
c1eada83 VS |
1025 | wxUniChar c(*i); |
1026 | // FIXME-UTF8: unify substituted char ('_') with wxUniChar ('?') | |
1027 | *dest++ = c.IsAscii() ? (char)c : '_'; | |
e015c2a3 VZ |
1028 | |
1029 | // the output string can't have embedded NULs anyhow, so we can safely | |
1030 | // stop at first of them even if we do have any | |
c1eada83 | 1031 | if ( !c ) |
e015c2a3 | 1032 | break; |
b1ac3b56 | 1033 | } |
e015c2a3 | 1034 | |
b1ac3b56 RR |
1035 | return buffer; |
1036 | } | |
e015c2a3 | 1037 | |
c1eada83 | 1038 | #endif // wxUSE_UNICODE |
b1ac3b56 | 1039 | |
c801d85f | 1040 | // extract string of length nCount starting at nFirst |
c801d85f KB |
1041 | wxString wxString::Mid(size_t nFirst, size_t nCount) const |
1042 | { | |
73f507f5 | 1043 | size_t nLen = length(); |
30d9011f | 1044 | |
73f507f5 WS |
1045 | // default value of nCount is npos and means "till the end" |
1046 | if ( nCount == npos ) | |
1047 | { | |
1048 | nCount = nLen - nFirst; | |
1049 | } | |
30d9011f | 1050 | |
73f507f5 WS |
1051 | // out-of-bounds requests return sensible things |
1052 | if ( nFirst + nCount > nLen ) | |
1053 | { | |
1054 | nCount = nLen - nFirst; | |
1055 | } | |
c801d85f | 1056 | |
73f507f5 WS |
1057 | if ( nFirst > nLen ) |
1058 | { | |
1059 | // AllocCopy() will return empty string | |
1060 | return wxEmptyString; | |
1061 | } | |
c801d85f | 1062 | |
73f507f5 WS |
1063 | wxString dest(*this, nFirst, nCount); |
1064 | if ( dest.length() != nCount ) | |
1065 | { | |
1066 | wxFAIL_MSG( _T("out of memory in wxString::Mid") ); | |
1067 | } | |
30d9011f | 1068 | |
73f507f5 | 1069 | return dest; |
c801d85f KB |
1070 | } |
1071 | ||
e87b7833 | 1072 | // check that the string starts with prefix and return the rest of the string |
d775fa82 | 1073 | // in the provided pointer if it is not NULL, otherwise return false |
c5e7a7d7 | 1074 | bool wxString::StartsWith(const wxString& prefix, wxString *rest) const |
f6bcfd97 | 1075 | { |
c5e7a7d7 VS |
1076 | if ( compare(0, prefix.length(), prefix) != 0 ) |
1077 | return false; | |
f6bcfd97 BP |
1078 | |
1079 | if ( rest ) | |
1080 | { | |
1081 | // put the rest of the string into provided pointer | |
c5e7a7d7 | 1082 | rest->assign(*this, prefix.length(), npos); |
f6bcfd97 BP |
1083 | } |
1084 | ||
d775fa82 | 1085 | return true; |
f6bcfd97 BP |
1086 | } |
1087 | ||
3affcd07 VZ |
1088 | |
1089 | // check that the string ends with suffix and return the rest of it in the | |
1090 | // provided pointer if it is not NULL, otherwise return false | |
c5e7a7d7 | 1091 | bool wxString::EndsWith(const wxString& suffix, wxString *rest) const |
3affcd07 | 1092 | { |
c5e7a7d7 | 1093 | int start = length() - suffix.length(); |
81727065 VS |
1094 | |
1095 | if ( start < 0 || compare(start, npos, suffix) != 0 ) | |
3affcd07 VZ |
1096 | return false; |
1097 | ||
1098 | if ( rest ) | |
1099 | { | |
1100 | // put the rest of the string into provided pointer | |
1101 | rest->assign(*this, 0, start); | |
1102 | } | |
1103 | ||
1104 | return true; | |
1105 | } | |
1106 | ||
1107 | ||
c801d85f KB |
1108 | // extract nCount last (rightmost) characters |
1109 | wxString wxString::Right(size_t nCount) const | |
1110 | { | |
e87b7833 MB |
1111 | if ( nCount > length() ) |
1112 | nCount = length(); | |
c801d85f | 1113 | |
e87b7833 MB |
1114 | wxString dest(*this, length() - nCount, nCount); |
1115 | if ( dest.length() != nCount ) { | |
b1801e0e GD |
1116 | wxFAIL_MSG( _T("out of memory in wxString::Right") ); |
1117 | } | |
c801d85f KB |
1118 | return dest; |
1119 | } | |
1120 | ||
1121 | // get all characters after the last occurence of ch | |
1122 | // (returns the whole string if ch not found) | |
c9f78968 | 1123 | wxString wxString::AfterLast(wxUniChar ch) const |
c801d85f KB |
1124 | { |
1125 | wxString str; | |
d775fa82 | 1126 | int iPos = Find(ch, true); |
3c67202d | 1127 | if ( iPos == wxNOT_FOUND ) |
c801d85f KB |
1128 | str = *this; |
1129 | else | |
c9f78968 | 1130 | str = wx_str() + iPos + 1; |
c801d85f KB |
1131 | |
1132 | return str; | |
1133 | } | |
1134 | ||
1135 | // extract nCount first (leftmost) characters | |
1136 | wxString wxString::Left(size_t nCount) const | |
1137 | { | |
e87b7833 MB |
1138 | if ( nCount > length() ) |
1139 | nCount = length(); | |
c801d85f | 1140 | |
e87b7833 MB |
1141 | wxString dest(*this, 0, nCount); |
1142 | if ( dest.length() != nCount ) { | |
b1801e0e GD |
1143 | wxFAIL_MSG( _T("out of memory in wxString::Left") ); |
1144 | } | |
c801d85f KB |
1145 | return dest; |
1146 | } | |
1147 | ||
1148 | // get all characters before the first occurence of ch | |
1149 | // (returns the whole string if ch not found) | |
c9f78968 | 1150 | wxString wxString::BeforeFirst(wxUniChar ch) const |
c801d85f | 1151 | { |
e87b7833 MB |
1152 | int iPos = Find(ch); |
1153 | if ( iPos == wxNOT_FOUND ) iPos = length(); | |
1154 | return wxString(*this, 0, iPos); | |
c801d85f KB |
1155 | } |
1156 | ||
1157 | /// get all characters before the last occurence of ch | |
1158 | /// (returns empty string if ch not found) | |
c9f78968 | 1159 | wxString wxString::BeforeLast(wxUniChar ch) const |
c801d85f KB |
1160 | { |
1161 | wxString str; | |
d775fa82 | 1162 | int iPos = Find(ch, true); |
3c67202d | 1163 | if ( iPos != wxNOT_FOUND && iPos != 0 ) |
d1c9bbf6 | 1164 | str = wxString(c_str(), iPos); |
c801d85f KB |
1165 | |
1166 | return str; | |
1167 | } | |
1168 | ||
1169 | /// get all characters after the first occurence of ch | |
1170 | /// (returns empty string if ch not found) | |
c9f78968 | 1171 | wxString wxString::AfterFirst(wxUniChar ch) const |
c801d85f KB |
1172 | { |
1173 | wxString str; | |
1174 | int iPos = Find(ch); | |
3c67202d | 1175 | if ( iPos != wxNOT_FOUND ) |
c9f78968 | 1176 | str = wx_str() + iPos + 1; |
c801d85f KB |
1177 | |
1178 | return str; | |
1179 | } | |
1180 | ||
1181 | // replace first (or all) occurences of some substring with another one | |
8a540c88 VS |
1182 | size_t wxString::Replace(const wxString& strOld, |
1183 | const wxString& strNew, bool bReplaceAll) | |
c801d85f | 1184 | { |
a8f1f1b2 | 1185 | // if we tried to replace an empty string we'd enter an infinite loop below |
8a540c88 | 1186 | wxCHECK_MSG( !strOld.empty(), 0, |
a8f1f1b2 VZ |
1187 | _T("wxString::Replace(): invalid parameter") ); |
1188 | ||
510bb748 | 1189 | size_t uiCount = 0; // count of replacements made |
c801d85f | 1190 | |
8a540c88 VS |
1191 | size_t uiOldLen = strOld.length(); |
1192 | size_t uiNewLen = strNew.length(); | |
c801d85f | 1193 | |
510bb748 | 1194 | size_t dwPos = 0; |
c801d85f | 1195 | |
8a540c88 | 1196 | while ( (*this)[dwPos] != wxT('\0') ) |
510bb748 RN |
1197 | { |
1198 | //DO NOT USE STRSTR HERE | |
1199 | //this string can contain embedded null characters, | |
1200 | //so strstr will function incorrectly | |
8a540c88 | 1201 | dwPos = find(strOld, dwPos); |
ad5bb7d6 | 1202 | if ( dwPos == npos ) |
510bb748 | 1203 | break; // exit the loop |
ad5bb7d6 | 1204 | else |
510bb748 RN |
1205 | { |
1206 | //replace this occurance of the old string with the new one | |
8a540c88 | 1207 | replace(dwPos, uiOldLen, strNew, uiNewLen); |
510bb748 | 1208 | |
2df0258e RN |
1209 | //move up pos past the string that was replaced |
1210 | dwPos += uiNewLen; | |
510bb748 RN |
1211 | |
1212 | //increase replace count | |
1213 | ++uiCount; | |
ad5bb7d6 | 1214 | |
510bb748 | 1215 | // stop now? |
ad5bb7d6 | 1216 | if ( !bReplaceAll ) |
510bb748 RN |
1217 | break; // exit the loop |
1218 | } | |
c801d85f | 1219 | } |
c801d85f | 1220 | |
510bb748 | 1221 | return uiCount; |
c801d85f KB |
1222 | } |
1223 | ||
1224 | bool wxString::IsAscii() const | |
1225 | { | |
a4a44612 VS |
1226 | for ( const_iterator i = begin(); i != end(); ++i ) |
1227 | { | |
1228 | if ( !(*i).IsAscii() ) | |
1229 | return false; | |
1230 | } | |
1231 | ||
1232 | return true; | |
c801d85f | 1233 | } |
dd1eaa89 | 1234 | |
c801d85f KB |
1235 | bool wxString::IsWord() const |
1236 | { | |
a4a44612 VS |
1237 | for ( const_iterator i = begin(); i != end(); ++i ) |
1238 | { | |
1239 | if ( !wxIsalpha(*i) ) | |
1240 | return false; | |
1241 | } | |
1242 | ||
1243 | return true; | |
c801d85f | 1244 | } |
dd1eaa89 | 1245 | |
c801d85f KB |
1246 | bool wxString::IsNumber() const |
1247 | { | |
a4a44612 VS |
1248 | if ( empty() ) |
1249 | return true; | |
1250 | ||
1251 | const_iterator i = begin(); | |
1252 | ||
1253 | if ( *i == _T('-') || *i == _T('+') ) | |
1254 | ++i; | |
1255 | ||
1256 | for ( ; i != end(); ++i ) | |
1257 | { | |
1258 | if ( !wxIsdigit(*i) ) | |
1259 | return false; | |
1260 | } | |
1261 | ||
1262 | return true; | |
c801d85f KB |
1263 | } |
1264 | ||
c801d85f KB |
1265 | wxString wxString::Strip(stripType w) const |
1266 | { | |
1267 | wxString s = *this; | |
d775fa82 WS |
1268 | if ( w & leading ) s.Trim(false); |
1269 | if ( w & trailing ) s.Trim(true); | |
c801d85f KB |
1270 | return s; |
1271 | } | |
1272 | ||
c801d85f KB |
1273 | // --------------------------------------------------------------------------- |
1274 | // case conversion | |
1275 | // --------------------------------------------------------------------------- | |
1276 | ||
1277 | wxString& wxString::MakeUpper() | |
1278 | { | |
e87b7833 MB |
1279 | for ( iterator it = begin(), en = end(); it != en; ++it ) |
1280 | *it = (wxChar)wxToupper(*it); | |
c801d85f KB |
1281 | |
1282 | return *this; | |
1283 | } | |
1284 | ||
1285 | wxString& wxString::MakeLower() | |
1286 | { | |
e87b7833 MB |
1287 | for ( iterator it = begin(), en = end(); it != en; ++it ) |
1288 | *it = (wxChar)wxTolower(*it); | |
c801d85f KB |
1289 | |
1290 | return *this; | |
1291 | } | |
1292 | ||
1293 | // --------------------------------------------------------------------------- | |
1294 | // trimming and padding | |
1295 | // --------------------------------------------------------------------------- | |
1296 | ||
d775fa82 | 1297 | // some compilers (VC++ 6.0 not to name them) return true for a call to |
576c608d VZ |
1298 |