Maybe negative wxWindowId are better than just -1.
[wxWidgets.git] / src / common / string.cpp
1 /////////////////////////////////////////////////////////////////////////////
2 // Name: string.cpp
3 // Purpose: wxString class
4 // Author: Vadim Zeitlin
5 // Modified by:
6 // Created: 29/01/98
7 // RCS-ID: $Id$
8 // Copyright: (c) 1998 Vadim Zeitlin <zeitlin@dptmaths.ens-cachan.fr>
9 // Licence: wxWindows license
10 /////////////////////////////////////////////////////////////////////////////
11
12 #ifdef __GNUG__
13 #pragma implementation "string.h"
14 #endif
15
16 /*
17 * About ref counting:
18 * 1) all empty strings use g_strEmpty, nRefs = -1 (set in Init())
19 * 2) AllocBuffer() sets nRefs to 1, Lock() increments it by one
20 * 3) Unlock() decrements nRefs and frees memory if it goes to 0
21 */
22
23 // ===========================================================================
24 // headers, declarations, constants
25 // ===========================================================================
26
27 // For compilers that support precompilation, includes "wx.h".
28 #include "wx/wxprec.h"
29
30 #ifdef __BORLANDC__
31 #pragma hdrstop
32 #endif
33
34 #ifndef WX_PRECOMP
35 #include "wx/defs.h"
36 #include "wx/string.h"
37 #include "wx/intl.h"
38 #if wxUSE_THREADS
39 #include <wx/thread.h>
40 #endif
41 #endif
42
43 #include <ctype.h>
44 #include <string.h>
45 #include <stdlib.h>
46
47 #ifdef __SALFORDC__
48 #include <clib.h>
49 #endif
50
51 #if wxUSE_WCSRTOMBS
52 #include <wchar.h> // for wcsrtombs(), see comments where it's used
53 #endif // wxUSE_WCSRTOMBS
54
55 #ifdef WXSTRING_IS_WXOBJECT
56 IMPLEMENT_DYNAMIC_CLASS(wxString, wxObject)
57 #endif //WXSTRING_IS_WXOBJECT
58
59 // allocating extra space for each string consumes more memory but speeds up
60 // the concatenation operations (nLen is the current string's length)
61 // NB: EXTRA_ALLOC must be >= 0!
// The macro expands to an expression that reads a variable called nLen, so it
// can only be used where such a variable is in scope. For an unsigned nLen,
// nLen % 16 lies in 0..15, which makes the result range from 4 to 19.
62 #define EXTRA_ALLOC (19 - nLen % 16)
63
64 // ---------------------------------------------------------------------------
65 // static class variables definition
66 // ---------------------------------------------------------------------------
67
// out-of-class definition of the static constant wxString::npos; it is given
// the value wxSTRING_MAXLEN and only exists in std::string compatibility mode
68 #ifdef wxSTD_STRING_COMPATIBILITY
69 const size_t wxString::npos = wxSTRING_MAXLEN;
70 #endif // wxSTD_STRING_COMPATIBILITY
71
72 // ----------------------------------------------------------------------------
73 // static data
74 // ----------------------------------------------------------------------------
75
76 // for an empty string, GetStringData() will return this address: this
77 // structure has the same layout as wxStringData and its data() method will
78 // return the empty string (dummy pointer)
// NOTE(review): the initializer {-1, 0, 0} presumably maps to nRefs = -1,
// nDataLength = 0 and nAllocLength = 0 (see the ref counting notes at the top
// of this file) - confirm against the member order in wxStringData.
79 static const struct
80 {
81 wxStringData data;
82 wxChar dummy;
83 } g_strEmpty = { {-1, 0, 0}, _T('\0') };
84
85 // empty C style string: points to 'string data' byte of g_strEmpty
// (i.e. to the dummy member, which holds the terminating NUL character)
86 extern const wxChar WXDLLEXPORT *g_szNul = &g_strEmpty.dummy;
87
88 // ----------------------------------------------------------------------------
89 // conditional compilation
90 // ----------------------------------------------------------------------------
91
92 // we want to find out if the current platform supports vsnprintf()-like
93 // function: for Unix this is done with configure, for Windows we test the
94 // compiler explicitly.
// Result of this section: wxVsnprintf is always defined afterwards, either as
// an alias for a real bounded function or as the unbounded fallback below.
95 #ifdef __WXMSW__
96 #ifdef __VISUALC__
97 #define wxVsnprintf _vsnprintf
98 #endif
99 #else // !Windows
100 #ifdef HAVE_VSNPRINTF
101 #define wxVsnprintf vsnprintf
102 #endif
103 #endif // Windows/!Windows
104
105 #ifndef wxVsnprintf
106 // in this case we'll use vsprintf() (which is ANSI and thus should be
107 // always available), but it's unsafe because it doesn't check for buffer
108 // size - so give a warning
// note that the 'len' argument is silently dropped by this fallback macro
109 #define wxVsnprintf(buffer,len,format,argptr) vsprintf(buffer,format, argptr)
110
// the warning is only emitted for the compilers tested here
111 #if defined(__VISUALC__)
112 #pragma message("Using sprintf() because no snprintf()-like function defined")
113 #elif defined(__GNUG__) && !defined(__UNIX__)
114 #warning "Using sprintf() because no snprintf()-like function defined"
115 #elif defined(__MWERKS__)
116 #warning "Using sprintf() because no snprintf()-like function defined"
117 #endif //compiler
118 #endif // no vsnprintf
119
120 #ifdef _AIX
121 // AIX has vsnprintf, but there's no prototype in the system headers.
// so declare it here ourselves, with C linkage
122 extern "C" int vsnprintf(char* str, size_t n, const char* format, va_list ap);
123 #endif
124
125 // ----------------------------------------------------------------------------
126 // global functions
127 // ----------------------------------------------------------------------------
128
129 #ifdef wxSTD_STRING_COMPATIBILITY
130
131 // MS Visual C++ version 5.0 provides the new STL headers as well as the old
132 // iostream ones.
133 //
134 // ATTN: you can _not_ use both of these in the same program!
135
// Stream extraction into a wxString. The real implementation below is
// currently compiled out with "#if 0", so this operator does nothing: the
// string parameter is unused (hence WXUNUSED) and the stream is returned
// untouched.
136 istream& operator>>(istream& is, wxString& WXUNUSED(str))
137 {
138 #if 0
// disabled code: reads characters up to EOF, the next whitespace or the
// stream width limit and sets failbit if nothing could be read
139 int w = is.width(0);
140 if ( is.ipfx(0) ) {
141 streambuf *sb = is.rdbuf();
142 str.erase();
143 while ( true ) {
144 int ch = sb->sbumpc ();
145 if ( ch == EOF ) {
146 is.setstate(ios::eofbit);
147 break;
148 }
149 else if ( isspace(ch) ) {
150 sb->sungetc();
151 break;
152 }
153
154 str += ch;
155 if ( --w == 1 )
156 break;
157 }
158 }
159
160 is.isfx();
161 if ( str.length() == 0 )
162 is.setstate(ios::failbit);
163 #endif
164 return is;
165 }
166
167 #endif //std::string compatibility
168
169 // ----------------------------------------------------------------------------
170 // private classes
171 // ----------------------------------------------------------------------------
172
// this small class is used to gather statistics for performance tuning: each
// instance accumulates the values passed to Add() and prints their average
// when it is destroyed (the instances below are globals)
//
// uncomment the following line to enable the statistics
//#define WXSTRING_STATISTICS
#ifdef WXSTRING_STATISTICS
class Averager
{
public:
    // sz is the description printed together with the average, the pointer
    // is stored as is (not copied)
    Averager(const char *sz) { m_sz = sz; m_nTotal = m_nCount = 0; }

    ~Averager()
    {
        // don't divide by zero if nothing was ever recorded
        const float average = m_nCount != 0 ? ((float)m_nTotal)/m_nCount
                                            : 0.0f;
        printf("wxString: average %s = %f\n", m_sz, average);
    }

    // record one more sample
    void Add(size_t n) { m_nTotal += n; m_nCount++; }

private:
    size_t m_nCount, m_nTotal;
    const char *m_sz;
} g_averageLength("allocation size"),
  g_averageSummandLength("summand length"),
  g_averageConcatHit("hit probability in concat"),
  g_averageInitialLength("initial string length");

// STATISTICS_ADD(Foo, val) records val in the global g_averageFoo
#define STATISTICS_ADD(av, val) g_average##av.Add(val)
#else
// statistics disabled: the macro expands to nothing
#define STATISTICS_ADD(av, val)
#endif // WXSTRING_STATISTICS
197
198 // ===========================================================================
199 // wxString class core
200 // ===========================================================================
201
202 // ---------------------------------------------------------------------------
203 // construction
204 // ---------------------------------------------------------------------------
205
206 // constructs string of <nLength> copies of character <ch>
207 wxString::wxString(wxChar ch, size_t nLength)
208 {
209 Init();
210
211 if ( nLength > 0 ) {
212 AllocBuffer(nLength);
213
214 #if wxUSE_UNICODE
215 // memset only works on char
216 for (size_t n=0; n<nLength; n++) m_pchData[n] = ch;
217 #else
218 memset(m_pchData, ch, nLength);
219 #endif
220 }
221 }
222
223 // takes nLength elements of psz starting at nPos
224 void wxString::InitWith(const wxChar *psz, size_t nPos, size_t nLength)
225 {
226 Init();
227
228 wxASSERT( nPos <= wxStrlen(psz) );
229
230 if ( nLength == wxSTRING_MAXLEN )
231 nLength = wxStrlen(psz + nPos);
232
233 STATISTICS_ADD(InitialLength, nLength);
234
235 if ( nLength > 0 ) {
236 // trailing '\0' is written in AllocBuffer()
237 AllocBuffer(nLength);
238 memcpy(m_pchData, psz + nPos, nLength*sizeof(wxChar));
239 }
240 }
241
242 #ifdef wxSTD_STRING_COMPATIBILITY
243
244 // poor man's iterators are "void *" pointers
245 wxString::wxString(const void *pStart, const void *pEnd)
246 {
247 InitWith((const wxChar *)pStart, 0,
248 (const wxChar *)pEnd - (const wxChar *)pStart);
249 }
250
251 #endif //std::string compatibility
252
253 #if wxUSE_UNICODE
254
255 // from multibyte string
256 wxString::wxString(const char *psz, wxMBConv& conv, size_t nLength)
257 {
258 // first get necessary size
259 size_t nLen = psz ? conv.MB2WC((wchar_t *) NULL, psz, 0) : 0;
260
261 // nLength is number of *Unicode* characters here!
262 if ((nLen != (size_t)-1) && (nLen > nLength))
263 nLen = nLength;
264
265 // empty?
266 if ( (nLen != 0) && (nLen != (size_t)-1) ) {
267 AllocBuffer(nLen);
268 conv.MB2WC(m_pchData, psz, nLen);
269 }
270 else {
271 Init();
272 }
273 }
274
275 #else
276
277 #if wxUSE_WCHAR_T
278 // from wide string
279 wxString::wxString(const wchar_t *pwz)
280 {
281 // first get necessary size
282 size_t nLen = pwz ? wxWC2MB((char *) NULL, pwz, 0) : 0;
283
284 // empty?
285 if ( (nLen != 0) && (nLen != (size_t)-1) ) {
286 AllocBuffer(nLen);
287 wxWC2MB(m_pchData, pwz, nLen);
288 }
289 else {
290 Init();
291 }
292 }
293 #endif
294
295 #endif
296
297 // ---------------------------------------------------------------------------
298 // memory allocation
299 // ---------------------------------------------------------------------------
300
301 // allocates memory needed to store a C string of length nLen
302 void wxString::AllocBuffer(size_t nLen)
303 {
304 wxASSERT( nLen > 0 ); //
305 wxASSERT( nLen <= INT_MAX-1 ); // max size (enough room for 1 extra)
306
307 STATISTICS_ADD(Length, nLen);
308
309 // allocate memory:
310 // 1) one extra character for '\0' termination
311 // 2) sizeof(wxStringData) for housekeeping info
312 wxStringData* pData = (wxStringData*)
313 malloc(sizeof(wxStringData) + (nLen + EXTRA_ALLOC + 1)*sizeof(wxChar));
314 pData->nRefs = 1;
315 pData->nDataLength = nLen;
316 pData->nAllocLength = nLen + EXTRA_ALLOC;
317 m_pchData = pData->data(); // data starts after wxStringData
318 m_pchData[nLen] = _T('\0');
319 }
320
321 // must be called before changing this string
322 void wxString::CopyBeforeWrite()
323 {
324 wxStringData* pData = GetStringData();
325
326 if ( pData->IsShared() ) {
327 pData->Unlock(); // memory not freed because shared
328 size_t nLen = pData->nDataLength;
329 AllocBuffer(nLen);
330 memcpy(m_pchData, pData->data(), nLen*sizeof(wxChar));
331 }
332
333 wxASSERT( !GetStringData()->IsShared() ); // we must be the only owner
334 }
335
336 // must be called before replacing contents of this string
337 void wxString::AllocBeforeWrite(size_t nLen)
338 {
339 wxASSERT( nLen != 0 ); // doesn't make any sense
340
341 // must not share string and must have enough space
342 wxStringData* pData = GetStringData();
343 if ( pData->IsShared() || (nLen > pData->nAllocLength) ) {
344 // can't work with old buffer, get new one
345 pData->Unlock();
346 AllocBuffer(nLen);
347 }
348 else {
349 // update the string length
350 pData->nDataLength = nLen;
351 }
352
353 wxASSERT( !GetStringData()->IsShared() ); // we must be the only owner
354 }
355
356 // allocate enough memory for nLen characters
357 void wxString::Alloc(size_t nLen)
358 {
359 wxStringData *pData = GetStringData();
360 if ( pData->nAllocLength <= nLen ) {
361 if ( pData->IsEmpty() ) {
362 nLen += EXTRA_ALLOC;
363
364 wxStringData* pData = (wxStringData*)
365 malloc(sizeof(wxStringData) + (nLen + 1)*sizeof(wxChar));
366 pData->nRefs = 1;
367 pData->nDataLength = 0;
368 pData->nAllocLength = nLen;
369 m_pchData = pData->data(); // data starts after wxStringData
370 m_pchData[0u] = _T('\0');
371 }
372 else if ( pData->IsShared() ) {
373 pData->Unlock(); // memory not freed because shared
374 size_t nOldLen = pData->nDataLength;
375 AllocBuffer(nLen);
376 memcpy(m_pchData, pData->data(), nOldLen*sizeof(wxChar));
377 }
378 else {
379 nLen += EXTRA_ALLOC;
380
381 wxStringData *p = (wxStringData *)
382 realloc(pData, sizeof(wxStringData) + (nLen + 1)*sizeof(wxChar));
383
384 if ( p == NULL ) {
385 // @@@ what to do on memory error?
386 return;
387 }
388
389 // it's not important if the pointer changed or not (the check for this
390 // is not faster than assigning to m_pchData in all cases)
391 p->nAllocLength = nLen;
392 m_pchData = p->data();
393 }
394 }
395 //else: we've already got enough
396 }
397
398 // shrink to minimal size (releasing extra memory)
399 void wxString::Shrink()
400 {
401 wxStringData *pData = GetStringData();
402
403 // this variable is unused in release build, so avoid the compiler warning by
404 // just not declaring it
405 #ifdef __WXDEBUG__
406 void *p =
407 #endif
408 realloc(pData, sizeof(wxStringData) + (pData->nDataLength + 1)*sizeof(wxChar));
409
410 wxASSERT( p != NULL ); // can't free memory?
411 wxASSERT( p == pData ); // we're decrementing the size - block shouldn't move!
412 }
413
414 // get the pointer to writable buffer of (at least) nLen bytes
415 wxChar *wxString::GetWriteBuf(size_t nLen)
416 {
417 AllocBeforeWrite(nLen);
418
419 wxASSERT( GetStringData()->nRefs == 1 );
420 GetStringData()->Validate(FALSE);
421
422 return m_pchData;
423 }
424
425 // put string back in a reasonable state after GetWriteBuf
426 void wxString::UngetWriteBuf()
427 {
428 GetStringData()->nDataLength = wxStrlen(m_pchData);
429 GetStringData()->Validate(TRUE);
430 }
431
432 // ---------------------------------------------------------------------------
433 // data access
434 // ---------------------------------------------------------------------------
435
436 // all functions are inline in string.h
437
438 // ---------------------------------------------------------------------------
439 // assignment operators
440 // ---------------------------------------------------------------------------
441
442 // helper function: does real copy
443 void wxString::AssignCopy(size_t nSrcLen, const wxChar *pszSrcData)
444 {
445 if ( nSrcLen == 0 ) {
446 Reinit();
447 }
448 else {
449 AllocBeforeWrite(nSrcLen);
450 memcpy(m_pchData, pszSrcData, nSrcLen*sizeof(wxChar));
451 GetStringData()->nDataLength = nSrcLen;
452 m_pchData[nSrcLen] = _T('\0');
453 }
454 }
455
456 // assigns one string to another
457 wxString& wxString::operator=(const wxString& stringSrc)
458 {
459 wxASSERT( stringSrc.GetStringData()->IsValid() );
460
461 // don't copy string over itself
462 if ( m_pchData != stringSrc.m_pchData ) {
463 if ( stringSrc.GetStringData()->IsEmpty() ) {
464 Reinit();
465 }
466 else {
467 // adjust references
468 GetStringData()->Unlock();
469 m_pchData = stringSrc.m_pchData;
470 GetStringData()->Lock();
471 }
472 }
473
474 return *this;
475 }
476
477 // assigns a single character
478 wxString& wxString::operator=(wxChar ch)
479 {
480 AssignCopy(1, &ch);
481 return *this;
482 }
483
484 // assigns C string
485 wxString& wxString::operator=(const wxChar *psz)
486 {
487 AssignCopy(wxStrlen(psz), psz);
488 return *this;
489 }
490
491 #if !wxUSE_UNICODE
492
493 // same as 'signed char' variant
494 wxString& wxString::operator=(const unsigned char* psz)
495 {
496 *this = (const char *)psz;
497 return *this;
498 }
499
500 #if wxUSE_WCHAR_T
501 wxString& wxString::operator=(const wchar_t *pwz)
502 {
503 wxString str(pwz);
504 *this = str;
505 return *this;
506 }
507 #endif
508
509 #endif
510
511 // ---------------------------------------------------------------------------
512 // string concatenation
513 // ---------------------------------------------------------------------------
514
515 // add something to this string
516 void wxString::ConcatSelf(int nSrcLen, const wxChar *pszSrcData)
517 {
518 STATISTICS_ADD(SummandLength, nSrcLen);
519
520 // concatenating an empty string is a NOP
521 if ( nSrcLen > 0 ) {
522 wxStringData *pData = GetStringData();
523 size_t nLen = pData->nDataLength;
524 size_t nNewLen = nLen + nSrcLen;
525
526 // alloc new buffer if current is too small
527 if ( pData->IsShared() ) {
528 STATISTICS_ADD(ConcatHit, 0);
529
530 // we have to allocate another buffer
531 wxStringData* pOldData = GetStringData();
532 AllocBuffer(nNewLen);
533 memcpy(m_pchData, pOldData->data(), nLen*sizeof(wxChar));
534 pOldData->Unlock();
535 }
536 else if ( nNewLen > pData->nAllocLength ) {
537 STATISTICS_ADD(ConcatHit, 0);
538
539 // we have to grow the buffer
540 Alloc(nNewLen);
541 }
542 else {
543 STATISTICS_ADD(ConcatHit, 1);
544
545 // the buffer is already big enough
546 }
547
548 // should be enough space
549 wxASSERT( nNewLen <= GetStringData()->nAllocLength );
550
551 // fast concatenation - all is done in our buffer
552 memcpy(m_pchData + nLen, pszSrcData, nSrcLen*sizeof(wxChar));
553
554 m_pchData[nNewLen] = _T('\0'); // put terminating '\0'
555 GetStringData()->nDataLength = nNewLen; // and fix the length
556 }
557 //else: the string to append was empty
558 }
559
560 /*
561 * concatenation functions come in 5 flavours:
562 * string + string
563 * char + string and string + char
564 * C str + string and string + C str
565 */
566
567 wxString operator+(const wxString& string1, const wxString& string2)
568 {
569 wxASSERT( string1.GetStringData()->IsValid() );
570 wxASSERT( string2.GetStringData()->IsValid() );
571
572 wxString s = string1;
573 s += string2;
574
575 return s;
576 }
577
578 wxString operator+(const wxString& string, wxChar ch)
579 {
580 wxASSERT( string.GetStringData()->IsValid() );
581
582 wxString s = string;
583 s += ch;
584
585 return s;
586 }
587
588 wxString operator+(wxChar ch, const wxString& string)
589 {
590 wxASSERT( string.GetStringData()->IsValid() );
591
592 wxString s = ch;
593 s += string;
594
595 return s;
596 }
597
598 wxString operator+(const wxString& string, const wxChar *psz)
599 {
600 wxASSERT( string.GetStringData()->IsValid() );
601
602 wxString s;
603 s.Alloc(wxStrlen(psz) + string.Len());
604 s = string;
605 s += psz;
606
607 return s;
608 }
609
610 wxString operator+(const wxChar *psz, const wxString& string)
611 {
612 wxASSERT( string.GetStringData()->IsValid() );
613
614 wxString s;
615 s.Alloc(wxStrlen(psz) + string.Len());
616 s = psz;
617 s += string;
618
619 return s;
620 }
621
622 // ===========================================================================
623 // other common string functions
624 // ===========================================================================
625
626 // ---------------------------------------------------------------------------
627 // simple sub-string extraction
628 // ---------------------------------------------------------------------------
629
630 // helper function: clone the data attached to this string
631 void wxString::AllocCopy(wxString& dest, int nCopyLen, int nCopyIndex) const
632 {
633 if ( nCopyLen == 0 ) {
634 dest.Init();
635 }
636 else {
637 dest.AllocBuffer(nCopyLen);
638 memcpy(dest.m_pchData, m_pchData + nCopyIndex, nCopyLen*sizeof(wxChar));
639 }
640 }
641
642 // extract string of length nCount starting at nFirst
643 wxString wxString::Mid(size_t nFirst, size_t nCount) const
644 {
645 wxStringData *pData = GetStringData();
646 size_t nLen = pData->nDataLength;
647
648 // default value of nCount is wxSTRING_MAXLEN and means "till the end"
649 if ( nCount == wxSTRING_MAXLEN )
650 {
651 nCount = nLen - nFirst;
652 }
653
654 // out-of-bounds requests return sensible things
655 if ( nFirst + nCount > nLen )
656 {
657 nCount = nLen - nFirst;
658 }
659
660 if ( nFirst > nLen )
661 {
662 // AllocCopy() will return empty string
663 nCount = 0;
664 }
665
666 wxString dest;
667 AllocCopy(dest, nCount, nFirst);
668
669 return dest;
670 }
671
672 // extract nCount last (rightmost) characters
673 wxString wxString::Right(size_t nCount) const
674 {
675 if ( nCount > (size_t)GetStringData()->nDataLength )
676 nCount = GetStringData()->nDataLength;
677
678 wxString dest;
679 AllocCopy(dest, nCount, GetStringData()->nDataLength - nCount);
680 return dest;
681 }
682
683 // get all characters after the last occurence of ch
684 // (returns the whole string if ch not found)
685 wxString wxString::AfterLast(wxChar ch) const
686 {
687 wxString str;
688 int iPos = Find(ch, TRUE);
689 if ( iPos == wxNOT_FOUND )
690 str = *this;
691 else
692 str = c_str() + iPos + 1;
693
694 return str;
695 }
696
697 // extract nCount first (leftmost) characters
698 wxString wxString::Left(size_t nCount) const
699 {
700 if ( nCount > (size_t)GetStringData()->nDataLength )
701 nCount = GetStringData()->nDataLength;
702
703 wxString dest;
704 AllocCopy(dest, nCount, 0);
705 return dest;
706 }
707
708 // get all characters before the first occurence of ch
709 // (returns the whole string if ch not found)
710 wxString wxString::BeforeFirst(wxChar ch) const
711 {
712 wxString str;
713 for ( const wxChar *pc = m_pchData; *pc != _T('\0') && *pc != ch; pc++ )
714 str += *pc;
715
716 return str;
717 }
718
719 /// get all characters before the last occurence of ch
720 /// (returns empty string if ch not found)
721 wxString wxString::BeforeLast(wxChar ch) const
722 {
723 wxString str;
724 int iPos = Find(ch, TRUE);
725 if ( iPos != wxNOT_FOUND && iPos != 0 )
726 str = wxString(c_str(), iPos);
727
728 return str;
729 }
730
731 /// get all characters after the first occurence of ch
732 /// (returns empty string if ch not found)
733 wxString wxString::AfterFirst(wxChar ch) const
734 {
735 wxString str;
736 int iPos = Find(ch);
737 if ( iPos != wxNOT_FOUND )
738 str = c_str() + iPos + 1;
739
740 return str;
741 }
742
743 // replace first (or all) occurences of some substring with another one
744 size_t wxString::Replace(const wxChar *szOld, const wxChar *szNew, bool bReplaceAll)
745 {
746 size_t uiCount = 0; // count of replacements made
747
748 size_t uiOldLen = wxStrlen(szOld);
749
750 wxString strTemp;
751 const wxChar *pCurrent = m_pchData;
752 const wxChar *pSubstr;
753 while ( *pCurrent != _T('\0') ) {
754 pSubstr = wxStrstr(pCurrent, szOld);
755 if ( pSubstr == NULL ) {
756 // strTemp is unused if no replacements were made, so avoid the copy
757 if ( uiCount == 0 )
758 return 0;
759
760 strTemp += pCurrent; // copy the rest
761 break; // exit the loop
762 }
763 else {
764 // take chars before match
765 strTemp.ConcatSelf(pSubstr - pCurrent, pCurrent);
766 strTemp += szNew;
767 pCurrent = pSubstr + uiOldLen; // restart after match
768
769 uiCount++;
770
771 // stop now?
772 if ( !bReplaceAll ) {
773 strTemp += pCurrent; // copy the rest
774 break; // exit the loop
775 }
776 }
777 }
778
779 // only done if there were replacements, otherwise would have returned above
780 *this = strTemp;
781
782 return uiCount;
783 }
784
785 bool wxString::IsAscii() const
786 {
787 const wxChar *s = (const wxChar*) *this;
788 while(*s){
789 if(!isascii(*s)) return(FALSE);
790 s++;
791 }
792 return(TRUE);
793 }
794
795 bool wxString::IsWord() const
796 {
797 const wxChar *s = (const wxChar*) *this;
798 while(*s){
799 if(!wxIsalpha(*s)) return(FALSE);
800 s++;
801 }
802 return(TRUE);
803 }
804
805 bool wxString::IsNumber() const
806 {
807 const wxChar *s = (const wxChar*) *this;
808 while(*s){
809 if(!wxIsdigit(*s)) return(FALSE);
810 s++;
811 }
812 return(TRUE);
813 }
814
815 wxString wxString::Strip(stripType w) const
816 {
817 wxString s = *this;
818 if ( w & leading ) s.Trim(FALSE);
819 if ( w & trailing ) s.Trim(TRUE);
820 return s;
821 }
822
823 // ---------------------------------------------------------------------------
824 // case conversion
825 // ---------------------------------------------------------------------------
826
827 wxString& wxString::MakeUpper()
828 {
829 CopyBeforeWrite();
830
831 for ( wxChar *p = m_pchData; *p; p++ )
832 *p = (wxChar)wxToupper(*p);
833
834 return *this;
835 }
836
837 wxString& wxString::MakeLower()
838 {
839 CopyBeforeWrite();
840
841 for ( wxChar *p = m_pchData; *p; p++ )
842 *p = (wxChar)wxTolower(*p);
843
844 return *this;
845 }
846
847 // ---------------------------------------------------------------------------
848 // trimming and padding
849 // ---------------------------------------------------------------------------
850
851 // trims spaces (in the sense of isspace) from left or right side
852 wxString& wxString::Trim(bool bFromRight)
853 {
854 // first check if we're going to modify the string at all
855 if ( !IsEmpty() &&
856 (
857 (bFromRight && wxIsspace(GetChar(Len() - 1))) ||
858 (!bFromRight && wxIsspace(GetChar(0u)))
859 )
860 )
861 {
862 // ok, there is at least one space to trim
863 CopyBeforeWrite();
864
865 if ( bFromRight )
866 {
867 // find last non-space character
868 wxChar *psz = m_pchData + GetStringData()->nDataLength - 1;
869 while ( wxIsspace(*psz) && (psz >= m_pchData) )
870 psz--;
871
872 // truncate at trailing space start
873 *++psz = _T('\0');
874 GetStringData()->nDataLength = psz - m_pchData;
875 }
876 else
877 {
878 // find first non-space character
879 const wxChar *psz = m_pchData;
880 while ( wxIsspace(*psz) )
881 psz++;
882
883 // fix up data and length
884 int nDataLength = GetStringData()->nDataLength - (psz - (const wxChar*) m_pchData);
885 memmove(m_pchData, psz, (nDataLength + 1)*sizeof(wxChar));
886 GetStringData()->nDataLength = nDataLength;
887 }
888 }
889
890 return *this;
891 }
892
893 // adds nCount characters chPad to the string from either side
894 wxString& wxString::Pad(size_t nCount, wxChar chPad, bool bFromRight)
895 {
896 wxString s(chPad, nCount);
897
898 if ( bFromRight )
899 *this += s;
900 else
901 {
902 s += *this;
903 *this = s;
904 }
905
906 return *this;
907 }
908
909 // truncate the string
910 wxString& wxString::Truncate(size_t uiLen)
911 {
912 if ( uiLen < Len() ) {
913 CopyBeforeWrite();
914
915 *(m_pchData + uiLen) = _T('\0');
916 GetStringData()->nDataLength = uiLen;
917 }
918 //else: nothing to do, string is already short enough
919
920 return *this;
921 }
922
923 // ---------------------------------------------------------------------------
924 // finding (return wxNOT_FOUND if not found and index otherwise)
925 // ---------------------------------------------------------------------------
926
927 // find a character
928 int wxString::Find(wxChar ch, bool bFromEnd) const
929 {
930 const wxChar *psz = bFromEnd ? wxStrrchr(m_pchData, ch) : wxStrchr(m_pchData, ch);
931
932 return (psz == NULL) ? wxNOT_FOUND : psz - (const wxChar*) m_pchData;
933 }
934
935 // find a sub-string (like strstr)
936 int wxString::Find(const wxChar *pszSub) const
937 {
938 const wxChar *psz = wxStrstr(m_pchData, pszSub);
939
940 return (psz == NULL) ? wxNOT_FOUND : psz - (const wxChar*) m_pchData;
941 }
942
943 // ---------------------------------------------------------------------------
944 // stream-like operators
945 // ---------------------------------------------------------------------------
946 wxString& wxString::operator<<(int i)
947 {
948 wxString res;
949 res.Printf(_T("%d"), i);
950
951 return (*this) << res;
952 }
953
954 wxString& wxString::operator<<(float f)
955 {
956 wxString res;
957 res.Printf(_T("%f"), f);
958
959 return (*this) << res;
960 }
961
962 wxString& wxString::operator<<(double d)
963 {
964 wxString res;
965 res.Printf(_T("%g"), d);
966
967 return (*this) << res;
968 }
969
970 // ---------------------------------------------------------------------------
971 // formatted output
972 // ---------------------------------------------------------------------------
973 int wxString::Printf(const wxChar *pszFormat, ...)
974 {
975 va_list argptr;
976 va_start(argptr, pszFormat);
977
978 int iLen = PrintfV(pszFormat, argptr);
979
980 va_end(argptr);
981
982 return iLen;
983 }
984
985 int wxString::PrintfV(const wxChar* pszFormat, va_list argptr)
986 {
987 // static buffer to avoid dynamic memory allocation each time
988 static char s_szScratch[1024];
989 #if wxUSE_THREADS
990 // protect the static buffer
991 static wxCriticalSection critsect;
992 wxCriticalSectionLocker lock(critsect);
993 #endif
994
995 #if 1 // the new implementation
996
997 Reinit();
998 for (size_t n = 0; pszFormat[n]; n++)
999 if (pszFormat[n] == _T('%')) {
1000 static char s_szFlags[256] = "%";
1001 size_t flagofs = 1;
1002 bool adj_left = FALSE, in_prec = FALSE,
1003 prec_dot = FALSE, done = FALSE;
1004 int ilen = 0;
1005 size_t min_width = 0, max_width = wxSTRING_MAXLEN;
1006 do {
1007 #define CHECK_PREC if (in_prec && !prec_dot) { s_szFlags[flagofs++] = '.'; prec_dot = TRUE; }
1008 switch (pszFormat[++n]) {
1009 case _T('\0'):
1010 done = TRUE;
1011 break;
1012 case _T('%'):
1013 *this += _T('%');
1014 done = TRUE;
1015 break;
1016 case _T('#'):
1017 case _T('0'):
1018 case _T(' '):
1019 case _T('+'):
1020 case _T('\''):
1021 CHECK_PREC
1022 s_szFlags[flagofs++] = pszFormat[n];
1023 break;
1024 case _T('-'):
1025 CHECK_PREC
1026 adj_left = TRUE;
1027 s_szFlags[flagofs++] = pszFormat[n];
1028 break;
1029 case _T('.'):
1030 CHECK_PREC
1031 in_prec = TRUE;
1032 prec_dot = FALSE;
1033 max_width = 0;
1034 // dot will be auto-added to s_szFlags if non-negative number follows
1035 break;
1036 case _T('h'):
1037 ilen = -1;
1038 CHECK_PREC
1039 s_szFlags[flagofs++] = pszFormat[n];
1040 break;
1041 case _T('l'):
1042 ilen = 1;
1043 CHECK_PREC
1044 s_szFlags[flagofs++] = pszFormat[n];
1045 break;
1046 case _T('q'):
1047 case _T('L'):
1048 ilen = 2;
1049 CHECK_PREC
1050 s_szFlags[flagofs++] = pszFormat[n];
1051 break;
1052 case _T('Z'):
1053 ilen = 3;
1054 CHECK_PREC
1055 s_szFlags[flagofs++] = pszFormat[n];
1056 break;
1057 case _T('*'):
1058 {
1059 int len = va_arg(argptr, int);
1060 if (in_prec) {
1061 if (len<0) break;
1062 CHECK_PREC
1063 max_width = len;
1064 } else {
1065 if (len<0) {
1066 adj_left = !adj_left;
1067 s_szFlags[flagofs++] = '-';
1068 len = -len;
1069 }
1070 min_width = len;
1071 }
1072 flagofs += ::sprintf(s_szFlags+flagofs,"%d",len);
1073 }
1074 break;
1075 case _T('1'): case _T('2'): case _T('3'):
1076 case _T('4'): case _T('5'): case _T('6'):
1077 case _T('7'): case _T('8'): case _T('9'):
1078 {
1079 int len = 0;
1080 CHECK_PREC
1081 while ((pszFormat[n]>=_T('0')) && (pszFormat[n]<=_T('9'))) {
1082 s_szFlags[flagofs++] = pszFormat[n];
1083 len = len*10 + (pszFormat[n] - _T('0'));
1084 n++;
1085 }
1086 if (in_prec) max_width = len;
1087 else min_width = len;
1088 n--; // the main loop pre-increments n again
1089 }
1090 break;
1091 case _T('d'):
1092 case _T('i'):
1093 case _T('o'):
1094 case _T('u'):
1095 case _T('x'):
1096 case _T('X'):
1097 CHECK_PREC
1098 s_szFlags[flagofs++] = pszFormat[n];
1099 s_szFlags[flagofs] = '\0';
1100 if (ilen == 0 ) {
1101 int val = va_arg(argptr, int);
1102 ::sprintf(s_szScratch, s_szFlags, val);
1103 }
1104 else if (ilen == -1) {
1105 short int val = va_arg(argptr, short int);
1106 ::sprintf(s_szScratch, s_szFlags, val);
1107 }
1108 else if (ilen == 1) {
1109 long int val = va_arg(argptr, long int);
1110 ::sprintf(s_szScratch, s_szFlags, val);
1111 }
1112 else if (ilen == 2) {
1113 #if SIZEOF_LONG_LONG
1114 long long int val = va_arg(argptr, long long int);
1115 ::sprintf(s_szScratch, s_szFlags, val);
1116 #else
1117 long int val = va_arg(argptr, long int);
1118 ::sprintf(s_szScratch, s_szFlags, val);
1119 #endif
1120 }
1121 else if (ilen == 3) {
1122 size_t val = va_arg(argptr, size_t);
1123 ::sprintf(s_szScratch, s_szFlags, val);
1124 }
1125 *this += wxString(s_szScratch);
1126 done = TRUE;
1127 break;
1128 case _T('e'):
1129 case _T('E'):
1130 case _T('f'):
1131 case _T('g'):
1132 case _T('G'):
1133 CHECK_PREC
1134 s_szFlags[flagofs++] = pszFormat[n];
1135 s_szFlags[flagofs] = '\0';
1136 if (ilen == 2) {
1137 long double val = va_arg(argptr, long double);
1138 ::sprintf(s_szScratch, s_szFlags, val);
1139 } else {
1140 double val = va_arg(argptr, double);
1141 ::sprintf(s_szScratch, s_szFlags, val);
1142 }
1143 *this += wxString(s_szScratch);
1144 done = TRUE;
1145 break;
1146 case _T('p'):
1147 {
1148 void *val = va_arg(argptr, void *);
1149 CHECK_PREC
1150 s_szFlags[flagofs++] = pszFormat[n];
1151 s_szFlags[flagofs] = '\0';
1152 ::sprintf(s_szScratch, s_szFlags, val);
1153 *this += wxString(s_szScratch);
1154 done = TRUE;
1155 }
1156 break;
1157 case _T('c'):
1158 {
1159 wxChar val = va_arg(argptr, int);
1160 // we don't need to honor padding here, do we?
1161 *this += val;
1162 done = TRUE;
1163 }
1164 break;
1165 case _T('s'):
1166 if (ilen == -1) {
1167 // wx extension: we'll let %hs mean non-Unicode strings
1168 char *val = va_arg(argptr, char *);
1169 #if wxUSE_UNICODE
1170 // ASCII->Unicode constructor handles max_width right
1171 wxString s(val, wxConvLibc, max_width);
1172 #else
1173 size_t len = wxSTRING_MAXLEN;
1174 if (val) {
1175 for (len = 0; val[len] && (len<max_width); len++);
1176 } else val = _T("(null)");
1177 wxString s(val, len);
1178 #endif
1179 if (s.Len() < min_width)
1180 s.Pad(min_width - s.Len(), _T(' '), adj_left);
1181 *this += s;
1182 } else {
1183 wxChar *val = va_arg(argptr, wxChar *);
1184 size_t len = wxSTRING_MAXLEN;
1185 if (val) {
1186 for (len = 0; val[len] && (len<max_width); len++);
1187 } else val = _T("(null)");
1188 wxString s(val, len);
1189 if (s.Len() < min_width)
1190 s.Pad(min_width - s.Len(), _T(' '), adj_left);
1191 *this += s;
1192 }
1193 done = TRUE;
1194 break;
1195 case _T('n'):
1196 if (ilen == 0) {
1197 int *val = va_arg(argptr, int *);
1198 *val = Len();
1199 }
1200 else if (ilen == -1) {
1201 short int *val = va_arg(argptr, short int *);
1202 *val = Len();
1203 }
1204 else if (ilen >= 1) {
1205 long int *val = va_arg(argptr, long int *);
1206 *val = Len();
1207 }
1208 done = TRUE;
1209 break;
1210 default:
1211 if (wxIsalpha(pszFormat[n]))
1212 // probably some flag not taken care of here yet
1213 s_szFlags[flagofs++] = pszFormat[n];
1214 else {
1215 // bad format
1216 *this += _T('%'); // just to pass the glibc tst-printf.c
1217 n--;
1218 done = TRUE;
1219 }
1220 break;
1221 }
1222 #undef CHECK_PREC
1223 } while (!done);
1224 } else *this += pszFormat[n];
1225
1226 #else
1227 // NB: wxVsnprintf() may return either less than the buffer size or -1 if there
1228 // is not enough place depending on implementation
1229 int iLen = wxVsnprintf(s_szScratch, WXSIZEOF(s_szScratch), pszFormat, argptr);
1230 char *buffer;
1231 if ( iLen < (int)WXSIZEOF(s_szScratch) ) {
1232 buffer = s_szScratch;
1233 }
1234 else {
1235 int size = WXSIZEOF(s_szScratch) * 2;
1236 buffer = (char *)malloc(size);
1237 while ( buffer != NULL ) {
1238 iLen = wxVsnprintf(buffer, WXSIZEOF(s_szScratch), pszFormat, argptr);
1239 if ( iLen < size ) {
1240 // ok, there was enough space
1241 break;
1242 }
1243
1244 // still not enough, double it again
1245 buffer = (char *)realloc(buffer, size *= 2);
1246 }
1247
1248 if ( !buffer ) {
1249 // out of memory
1250 return -1;
1251 }
1252 }
1253
1254 wxString s(buffer);
1255 *this = s;
1256
1257 if ( buffer != s_szScratch )
1258 free(buffer);
1259 #endif
1260
1261 return Len();
1262 }
1263
1264 // ----------------------------------------------------------------------------
1265 // misc other operations
1266 // ----------------------------------------------------------------------------
1267 bool wxString::Matches(const wxChar *pszMask) const
1268 {
1269 // check char by char
1270 const wxChar *pszTxt;
1271 for ( pszTxt = c_str(); *pszMask != _T('\0'); pszMask++, pszTxt++ ) {
1272 switch ( *pszMask ) {
1273 case _T('?'):
1274 if ( *pszTxt == _T('\0') )
1275 return FALSE;
1276
1277 pszTxt++;
1278 pszMask++;
1279 break;
1280
1281 case _T('*'):
1282 {
1283 // ignore special chars immediately following this one
1284 while ( *pszMask == _T('*') || *pszMask == _T('?') )
1285 pszMask++;
1286
1287 // if there is nothing more, match
1288 if ( *pszMask == _T('\0') )
1289 return TRUE;
1290
1291 // are there any other metacharacters in the mask?
1292 size_t uiLenMask;
1293 const wxChar *pEndMask = wxStrpbrk(pszMask, _T("*?"));
1294
1295 if ( pEndMask != NULL ) {
1296 // we have to match the string between two metachars
1297 uiLenMask = pEndMask - pszMask;
1298 }
1299 else {
1300 // we have to match the remainder of the string
1301 uiLenMask = wxStrlen(pszMask);
1302 }
1303
1304 wxString strToMatch(pszMask, uiLenMask);
1305 const wxChar* pMatch = wxStrstr(pszTxt, strToMatch);
1306 if ( pMatch == NULL )
1307 return FALSE;
1308
1309 // -1 to compensate "++" in the loop
1310 pszTxt = pMatch + uiLenMask - 1;
1311 pszMask += uiLenMask - 1;
1312 }
1313 break;
1314
1315 default:
1316 if ( *pszMask != *pszTxt )
1317 return FALSE;
1318 break;
1319 }
1320 }
1321
1322 // match only if nothing left
1323 return *pszTxt == _T('\0');
1324 }
1325
1326 // Count the number of chars
1327 int wxString::Freq(wxChar ch) const
1328 {
1329 int count = 0;
1330 int len = Len();
1331 for (int i = 0; i < len; i++)
1332 {
1333 if (GetChar(i) == ch)
1334 count ++;
1335 }
1336 return count;
1337 }
1338
1339 // convert to upper case, return the copy of the string
1340 wxString wxString::Upper() const
1341 { wxString s(*this); return s.MakeUpper(); }
1342
1343 // convert to lower case, return the copy of the string
1344 wxString wxString::Lower() const { wxString s(*this); return s.MakeLower(); }
1345
1346 int wxString::sprintf(const wxChar *pszFormat, ...)
1347 {
1348 va_list argptr;
1349 va_start(argptr, pszFormat);
1350 int iLen = PrintfV(pszFormat, argptr);
1351 va_end(argptr);
1352 return iLen;
1353 }
1354
1355 // ---------------------------------------------------------------------------
1356 // standard C++ library string functions
1357 // ---------------------------------------------------------------------------
1358 #ifdef wxSTD_STRING_COMPATIBILITY
1359
1360 wxString& wxString::insert(size_t nPos, const wxString& str)
1361 {
1362 wxASSERT( str.GetStringData()->IsValid() );
1363 wxASSERT( nPos <= Len() );
1364
1365 if ( !str.IsEmpty() ) {
1366 wxString strTmp;
1367 wxChar *pc = strTmp.GetWriteBuf(Len() + str.Len());
1368 wxStrncpy(pc, c_str(), nPos);
1369 wxStrcpy(pc + nPos, str);
1370 wxStrcpy(pc + nPos + str.Len(), c_str() + nPos);
1371 strTmp.UngetWriteBuf();
1372 *this = strTmp;
1373 }
1374
1375 return *this;
1376 }
1377
1378 size_t wxString::find(const wxString& str, size_t nStart) const
1379 {
1380 wxASSERT( str.GetStringData()->IsValid() );
1381 wxASSERT( nStart <= Len() );
1382
1383 const wxChar *p = wxStrstr(c_str() + nStart, str);
1384
1385 return p == NULL ? npos : p - c_str();
1386 }
1387
1388 // VC++ 1.5 can't cope with the default argument in the header.
1389 #if !defined(__VISUALC__) || defined(__WIN32__)
1390 size_t wxString::find(const wxChar* sz, size_t nStart, size_t n) const
1391 {
1392 return find(wxString(sz, n == npos ? 0 : n), nStart);
1393 }
1394 #endif // VC++ 1.5
1395
1396 // Gives a duplicate symbol (presumably a case-insensitivity problem)
1397 #if !defined(__BORLANDC__)
1398 size_t wxString::find(wxChar ch, size_t nStart) const
1399 {
1400 wxASSERT( nStart <= Len() );
1401
1402 const wxChar *p = wxStrchr(c_str() + nStart, ch);
1403
1404 return p == NULL ? npos : p - c_str();
1405 }
1406 #endif
1407
1408 size_t wxString::rfind(const wxString& str, size_t nStart) const
1409 {
1410 wxASSERT( str.GetStringData()->IsValid() );
1411 wxASSERT( nStart <= Len() );
1412
1413 // # could be quicker than that
1414 const wxChar *p = c_str() + (nStart == npos ? Len() : nStart);
1415 while ( p >= c_str() + str.Len() ) {
1416 if ( wxStrncmp(p - str.Len(), str, str.Len()) == 0 )
1417 return p - str.Len() - c_str();
1418 p--;
1419 }
1420
1421 return npos;
1422 }
1423
1424 // VC++ 1.5 can't cope with the default argument in the header.
1425 #if !defined(__VISUALC__) || defined(__WIN32__)
1426 size_t wxString::rfind(const wxChar* sz, size_t nStart, size_t n) const
1427 {
1428 return rfind(wxString(sz, n == npos ? 0 : n), nStart);
1429 }
1430
1431 size_t wxString::rfind(wxChar ch, size_t nStart) const
1432 {
1433 wxASSERT( nStart <= Len() );
1434
1435 const wxChar *p = wxStrrchr(c_str() + nStart, ch);
1436
1437 return p == NULL ? npos : p - c_str();
1438 }
1439 #endif // VC++ 1.5
1440
1441 wxString wxString::substr(size_t nStart, size_t nLen) const
1442 {
1443 // npos means 'take all'
1444 if ( nLen == npos )
1445 nLen = 0;
1446
1447 wxASSERT( nStart + nLen <= Len() );
1448
1449 return wxString(c_str() + nStart, nLen == npos ? 0 : nLen);
1450 }
1451
1452 wxString& wxString::erase(size_t nStart, size_t nLen)
1453 {
1454 wxString strTmp(c_str(), nStart);
1455 if ( nLen != npos ) {
1456 wxASSERT( nStart + nLen <= Len() );
1457
1458 strTmp.append(c_str() + nStart + nLen);
1459 }
1460
1461 *this = strTmp;
1462 return *this;
1463 }
1464
1465 wxString& wxString::replace(size_t nStart, size_t nLen, const wxChar *sz)
1466 {
1467 wxASSERT( nStart + nLen <= wxStrlen(sz) );
1468
1469 wxString strTmp;
1470 if ( nStart != 0 )
1471 strTmp.append(c_str(), nStart);
1472 strTmp += sz;
1473 strTmp.append(c_str() + nStart + nLen);
1474
1475 *this = strTmp;
1476 return *this;
1477 }
1478
1479 wxString& wxString::replace(size_t nStart, size_t nLen, size_t nCount, wxChar ch)
1480 {
1481 return replace(nStart, nLen, wxString(ch, nCount));
1482 }
1483
1484 wxString& wxString::replace(size_t nStart, size_t nLen,
1485 const wxString& str, size_t nStart2, size_t nLen2)
1486 {
1487 return replace(nStart, nLen, str.substr(nStart2, nLen2));
1488 }
1489
1490 wxString& wxString::replace(size_t nStart, size_t nLen,
1491 const wxChar* sz, size_t nCount)
1492 {
1493 return replace(nStart, nLen, wxString(sz, nCount));
1494 }
1495
1496 #endif //std::string compatibility
1497
1498 // ============================================================================
1499 // ArrayString
1500 // ============================================================================
1501
1502 // size increment = max(50% of current size, ARRAY_MAXSIZE_INCREMENT)
1503 #define ARRAY_MAXSIZE_INCREMENT 4096
1504 #ifndef ARRAY_DEFAULT_INITIAL_SIZE // also defined in dynarray.h
1505 #define ARRAY_DEFAULT_INITIAL_SIZE (16)
1506 #endif
1507
1508 #define STRING(p) ((wxString *)(&(p)))
1509
1510 // ctor
1511 wxArrayString::wxArrayString()
1512 {
1513 m_nSize =
1514 m_nCount = 0;
1515 m_pItems = (wxChar **) NULL;
1516 }
1517
1518 // copy ctor
1519 wxArrayString::wxArrayString(const wxArrayString& src)
1520 {
1521 m_nSize =
1522 m_nCount = 0;
1523 m_pItems = (wxChar **) NULL;
1524
1525 *this = src;
1526 }
1527
1528 // assignment operator
1529 wxArrayString& wxArrayString::operator=(const wxArrayString& src)
1530 {
1531 if ( m_nSize > 0 )
1532 Clear();
1533
1534 if ( src.m_nCount > ARRAY_DEFAULT_INITIAL_SIZE )
1535 Alloc(src.m_nCount);
1536
1537 // we can't just copy the pointers here because otherwise we would share
1538 // the strings with another array
1539 for ( size_t n = 0; n < src.m_nCount; n++ )
1540 Add(src[n]);
1541
1542 if ( m_nCount != 0 )
1543 memcpy(m_pItems, src.m_pItems, m_nCount*sizeof(wxChar *));
1544
1545 return *this;
1546 }
1547
1548 // grow the array
1549 void wxArrayString::Grow()
1550 {
1551 // only do it if no more place
1552 if( m_nCount == m_nSize ) {
1553 if( m_nSize == 0 ) {
1554 // was empty, alloc some memory
1555 m_nSize = ARRAY_DEFAULT_INITIAL_SIZE;
1556 m_pItems = new wxChar *[m_nSize];
1557 }
1558 else {
1559 // otherwise when it's called for the first time, nIncrement would be 0
1560 // and the array would never be expanded
1561 wxASSERT( ARRAY_DEFAULT_INITIAL_SIZE != 0 );
1562
1563 // add 50% but not too much
1564 size_t nIncrement = m_nSize < ARRAY_DEFAULT_INITIAL_SIZE
1565 ? ARRAY_DEFAULT_INITIAL_SIZE : m_nSize >> 1;
1566 if ( nIncrement > ARRAY_MAXSIZE_INCREMENT )
1567 nIncrement = ARRAY_MAXSIZE_INCREMENT;
1568 m_nSize += nIncrement;
1569 wxChar **pNew = new wxChar *[m_nSize];
1570
1571 // copy data to new location
1572 memcpy(pNew, m_pItems, m_nCount*sizeof(wxChar *));
1573
1574 // delete old memory (but do not release the strings!)
1575 wxDELETEA(m_pItems);
1576
1577 m_pItems = pNew;
1578 }
1579 }
1580 }
1581
1582 void wxArrayString::Free()
1583 {
1584 for ( size_t n = 0; n < m_nCount; n++ ) {
1585 STRING(m_pItems[n])->GetStringData()->Unlock();
1586 }
1587 }
1588
1589 // deletes all the strings from the list
1590 void wxArrayString::Empty()
1591 {
1592 Free();
1593
1594 m_nCount = 0;
1595 }
1596
1597 // as Empty, but also frees memory
1598 void wxArrayString::Clear()
1599 {
1600 Free();
1601
1602 m_nSize =
1603 m_nCount = 0;
1604
1605 wxDELETEA(m_pItems);
1606 }
1607
1608 // dtor
1609 wxArrayString::~wxArrayString()
1610 {
1611 Free();
1612
1613 wxDELETEA(m_pItems);
1614 }
1615
1616 // pre-allocates memory (frees the previous data!)
1617 void wxArrayString::Alloc(size_t nSize)
1618 {
1619 wxASSERT( nSize > 0 );
1620
1621 // only if old buffer was not big enough
1622 if ( nSize > m_nSize ) {
1623 Free();
1624 wxDELETEA(m_pItems);
1625 m_pItems = new wxChar *[nSize];
1626 m_nSize = nSize;
1627 }
1628
1629 m_nCount = 0;
1630 }
1631
1632 // minimizes the memory usage by freeing unused memory
1633 void wxArrayString::Shrink()
1634 {
1635 // only do it if we have some memory to free
1636 if( m_nCount < m_nSize ) {
1637 // allocates exactly as much memory as we need
1638 wxChar **pNew = new wxChar *[m_nCount];
1639
1640 // copy data to new location
1641 memcpy(pNew, m_pItems, m_nCount*sizeof(wxChar *));
1642 delete [] m_pItems;
1643 m_pItems = pNew;
1644 }
1645 }
1646
1647 // searches the array for an item (forward or backwards)
1648 int wxArrayString::Index(const wxChar *sz, bool bCase, bool bFromEnd) const
1649 {
1650 if ( bFromEnd ) {
1651 if ( m_nCount > 0 ) {
1652 size_t ui = m_nCount;
1653 do {
1654 if ( STRING(m_pItems[--ui])->IsSameAs(sz, bCase) )
1655 return ui;
1656 }
1657 while ( ui != 0 );
1658 }
1659 }
1660 else {
1661 for( size_t ui = 0; ui < m_nCount; ui++ ) {
1662 if( STRING(m_pItems[ui])->IsSameAs(sz, bCase) )
1663 return ui;
1664 }
1665 }
1666
1667 return wxNOT_FOUND;
1668 }
1669
1670 // add item at the end
1671 void wxArrayString::Add(const wxString& str)
1672 {
1673 wxASSERT( str.GetStringData()->IsValid() );
1674
1675 Grow();
1676
1677 // the string data must not be deleted!
1678 str.GetStringData()->Lock();
1679 m_pItems[m_nCount++] = (wxChar *)str.c_str();
1680 }
1681
1682 // add item at the given position
1683 void wxArrayString::Insert(const wxString& str, size_t nIndex)
1684 {
1685 wxASSERT( str.GetStringData()->IsValid() );
1686
1687 wxCHECK_RET( nIndex <= m_nCount, _("bad index in wxArrayString::Insert") );
1688
1689 Grow();
1690
1691 memmove(&m_pItems[nIndex + 1], &m_pItems[nIndex],
1692 (m_nCount - nIndex)*sizeof(wxChar *));
1693
1694 str.GetStringData()->Lock();
1695 m_pItems[nIndex] = (wxChar *)str.c_str();
1696
1697 m_nCount++;
1698 }
1699
1700 // removes item from array (by index)
1701 void wxArrayString::Remove(size_t nIndex)
1702 {
1703 wxCHECK_RET( nIndex <= m_nCount, _("bad index in wxArrayString::Remove") );
1704
1705 // release our lock
1706 Item(nIndex).GetStringData()->Unlock();
1707
1708 memmove(&m_pItems[nIndex], &m_pItems[nIndex + 1],
1709 (m_nCount - nIndex - 1)*sizeof(wxChar *));
1710 m_nCount--;
1711 }
1712
1713 // removes item from array (by value)
1714 void wxArrayString::Remove(const wxChar *sz)
1715 {
1716 int iIndex = Index(sz);
1717
1718 wxCHECK_RET( iIndex != wxNOT_FOUND,
1719 _("removing inexistent element in wxArrayString::Remove") );
1720
1721 Remove(iIndex);
1722 }
1723
1724 // ----------------------------------------------------------------------------
1725 // sorting
1726 // ----------------------------------------------------------------------------
1727
1728 // we can only sort one array at a time with the quick-sort based
1729 // implementation
1730 #if wxUSE_THREADS
1731 // need a critical section to protect access to gs_compareFunction and
1732 // gs_sortAscending variables
1733 static wxCriticalSection *gs_critsectStringSort = NULL;
1734
1735 // call this before the value of the global sort vars is changed/after
1736 // you're finished with them
1737 #define START_SORT() wxASSERT( !gs_critsectStringSort ); \
1738 gs_critsectStringSort = new wxCriticalSection; \
1739 gs_critsectStringSort->Enter()
1740 #define END_SORT() gs_critsectStringSort->Leave(); \
1741 delete gs_critsectStringSort; \
1742 gs_critsectStringSort = NULL
1743 #else // !threads
1744 #define START_SORT()
1745 #define END_SORT()
1746 #endif // wxUSE_THREADS
1747
// function to use for string comparison
1749 static wxArrayString::CompareFunction gs_compareFunction = NULL;
1750
1751 // if we don't use the compare function, this flag tells us if we sort the
1752 // array in ascending or descending order
1753 static bool gs_sortAscending = TRUE;
1754
1755 // function which is called by quick sort
1756 static int wxStringCompareFunction(const void *first, const void *second)
1757 {
1758 wxString *strFirst = (wxString *)first;
1759 wxString *strSecond = (wxString *)second;
1760
1761 if ( gs_compareFunction ) {
1762 return gs_compareFunction(*strFirst, *strSecond);
1763 }
1764 else {
1765 // maybe we should use wxStrcoll
1766 int result = wxStrcmp(strFirst->c_str(), strSecond->c_str());
1767
1768 return gs_sortAscending ? result : -result;
1769 }
1770 }
1771
1772 // sort array elements using passed comparaison function
1773 void wxArrayString::Sort(CompareFunction compareFunction)
1774 {
1775 START_SORT();
1776
1777 wxASSERT( !gs_compareFunction ); // must have been reset to NULL
1778 gs_compareFunction = compareFunction;
1779
1780 DoSort();
1781
1782 END_SORT();
1783 }
1784
1785 void wxArrayString::Sort(bool reverseOrder)
1786 {
1787 START_SORT();
1788
1789 wxASSERT( !gs_compareFunction ); // must have been reset to NULL
1790 gs_sortAscending = !reverseOrder;
1791
1792 DoSort();
1793
1794 END_SORT();
1795 }
1796
1797 void wxArrayString::DoSort()
1798 {
1799 // just sort the pointers using qsort() - of course it only works because
1800 // wxString() *is* a pointer to its data
1801 qsort(m_pItems, m_nCount, sizeof(wxChar *), wxStringCompareFunction);
1802 }
1803
1804 // ============================================================================
1805 // MBConv
1806 // ============================================================================
1807
1808 WXDLLEXPORT_DATA(wxMBConv *) wxConvCurrent = &wxConvLibc;
1809 #if !wxUSE_WCHAR_T
1810 WXDLLEXPORT_DATA(wxMBConv) wxConvLibc, wxConvFile;
1811 #endif
1812
1813 #if wxUSE_WCHAR_T
1814
1815 // ----------------------------------------------------------------------------
1816 // standard libc conversion
1817 // ----------------------------------------------------------------------------
1818
1819 WXDLLEXPORT_DATA(wxMBConv) wxConvLibc;
1820
1821 size_t wxMBConv::MB2WC(wchar_t *buf, const char *psz, size_t n) const
1822 {
1823 return wxMB2WC(buf, psz, n);
1824 }
1825
1826 size_t wxMBConv::WC2MB(char *buf, const wchar_t *psz, size_t n) const
1827 {
1828 return wxWC2MB(buf, psz, n);
1829 }
1830
1831 // ----------------------------------------------------------------------------
1832 // standard file conversion
1833 // ----------------------------------------------------------------------------
1834
1835 WXDLLEXPORT_DATA(wxMBConvFile) wxConvFile;
1836
1837 // just use the libc conversion for now
1838 size_t wxMBConvFile::MB2WC(wchar_t *buf, const char *psz, size_t n) const
1839 {
1840 return wxMB2WC(buf, psz, n);
1841 }
1842
1843 size_t wxMBConvFile::WC2MB(char *buf, const wchar_t *psz, size_t n) const
1844 {
1845 return wxWC2MB(buf, psz, n);
1846 }
1847
1848 // ----------------------------------------------------------------------------
1849 // standard gdk conversion
1850 // ----------------------------------------------------------------------------
1851
1852 #ifdef __WXGTK12__
1853 WXDLLEXPORT_DATA(wxMBConvGdk) wxConvGdk;
1854
1855 #include <gdk/gdk.h>
1856
1857 size_t wxMBConvGdk::MB2WC(wchar_t *buf, const char *psz, size_t n) const
1858 {
1859 if (buf) {
1860 return gdk_mbstowcs((GdkWChar *)buf, psz, n);
1861 } else {
1862 GdkWChar *nbuf = new GdkWChar[n=strlen(psz)];
1863 size_t len = gdk_mbstowcs(nbuf, psz, n);
1864 delete [] nbuf;
1865 return len;
1866 }
1867 }
1868
1869 size_t wxMBConvGdk::WC2MB(char *buf, const wchar_t *psz, size_t n) const
1870 {
1871 char *mbstr = gdk_wcstombs((GdkWChar *)psz);
1872 size_t len = mbstr ? strlen(mbstr) : 0;
1873 if (buf) {
1874 if (len > n) len = n;
1875 memcpy(buf, psz, len);
1876 if (len < n) buf[len] = 0;
1877 }
1878 return len;
1879 }
1880 #endif // GTK > 1.0
1881
1882 // ----------------------------------------------------------------------------
1883 // UTF-7
1884 // ----------------------------------------------------------------------------
1885
1886 WXDLLEXPORT_DATA(wxMBConvUTF7) wxConvUTF7;
1887
1888 #if 0
1889 static char utf7_setD[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
1890 "abcdefghijklmnopqrstuvwxyz"
1891 "0123456789'(),-./:?";
1892 static char utf7_setO[]="!\"#$%&*;<=>@[]^_`{|}";
1893 static char utf7_setB[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
1894 "abcdefghijklmnopqrstuvwxyz"
1895 "0123456789+/";
1896 #endif
1897
1898 // TODO: write actual implementations of UTF-7 here
1899 size_t wxMBConvUTF7::MB2WC(wchar_t * WXUNUSED(buf),
1900 const char * WXUNUSED(psz),
1901 size_t WXUNUSED(n)) const
1902 {
1903 return 0;
1904 }
1905
1906 size_t wxMBConvUTF7::WC2MB(char * WXUNUSED(buf),
1907 const wchar_t * WXUNUSED(psz),
1908 size_t WXUNUSED(n)) const
1909 {
1910 return 0;
1911 }
1912
1913 // ----------------------------------------------------------------------------
1914 // UTF-8
1915 // ----------------------------------------------------------------------------
1916
1917 WXDLLEXPORT_DATA(wxMBConvUTF8) wxConvUTF8;
1918
1919 static unsigned long utf8_max[]={0x7f,0x7ff,0xffff,0x1fffff,0x3ffffff,0x7fffffff,0xffffffff};
1920
1921 size_t wxMBConvUTF8::MB2WC(wchar_t *buf, const char *psz, size_t n) const
1922 {
1923 size_t len = 0;
1924
1925 while (*psz && ((!buf) || (len<n))) {
1926 unsigned char cc=*psz++, fc=cc;
1927 unsigned cnt;
1928 for (cnt=0; fc&0x80; cnt++) fc<<=1;
1929 if (!cnt) {
1930 // plain ASCII char
1931 if (buf) *buf++=cc;
1932 len++;
1933 } else {
1934 cnt--;
1935 if (!cnt) {
1936 // invalid UTF-8 sequence
1937 return (size_t)-1;
1938 } else {
1939 unsigned ocnt=cnt-1;
1940 unsigned long res=cc&(0x3f>>cnt);
1941 while (cnt--) {
1942 cc = *psz++;
1943 if ((cc&0xC0)!=0x80) {
1944 // invalid UTF-8 sequence
1945 return (size_t)-1;
1946 }
1947 res=(res<<6)|(cc&0x3f);
1948 }
1949 if (res<=utf8_max[ocnt]) {
1950 // illegal UTF-8 encoding
1951 return (size_t)-1;
1952 }
1953 if (buf) *buf++=res;
1954 len++;
1955 }
1956 }
1957 }
1958 if (buf && (len<n)) *buf = 0;
1959 return len;
1960 }
1961
1962 size_t wxMBConvUTF8::WC2MB(char *buf, const wchar_t *psz, size_t n) const
1963 {
1964 size_t len = 0;
1965
1966 while (*psz && ((!buf) || (len<n))) {
1967 unsigned long cc=(*psz++)&0x7fffffff;
1968 unsigned cnt;
1969 for (cnt=0; cc>utf8_max[cnt]; cnt++);
1970 if (!cnt) {
1971 // plain ASCII char
1972 if (buf) *buf++=cc;
1973 len++;
1974 } else {
1975 len+=cnt+1;
1976 if (buf) {
1977 *buf++=(-128>>cnt)|((cc>>(cnt*6))&(0x3f>>cnt));
1978 while (cnt--)
1979 *buf++=0x80|((cc>>(cnt*6))&0x3f);
1980 }
1981 }
1982 }
1983 if (buf && (len<n)) *buf = 0;
1984 return len;
1985 }
1986
1987 // ----------------------------------------------------------------------------
1988 // specified character set
1989 // ----------------------------------------------------------------------------
1990
1991 class wxCharacterSet
1992 {
1993 public:
1994 wxArrayString names;
1995 wchar_t *data;
1996 };
1997
1998 #ifndef WX_PRECOMP
1999 #include "wx/dynarray.h"
2000 #include "wx/filefn.h"
2001 #include "wx/textfile.h"
2002 #include "wx/tokenzr.h"
2003 #include "wx/utils.h"
2004 #endif
2005
2006 WX_DECLARE_OBJARRAY(wxCharacterSet, wxCSArray);
2007 #include "wx/arrimpl.cpp"
2008 WX_DEFINE_OBJARRAY(wxCSArray);
2009
2010 static wxCSArray wxCharsets;
2011
2012 static void wxLoadCharacterSets(void)
2013 {
2014 static bool already_loaded = FALSE;
2015
2016 if (already_loaded) return;
2017
2018 already_loaded = TRUE;
2019 #if defined(__UNIX__)
2020 // search through files in /usr/share/i18n/charmaps
2021 wxString fname;
2022 for (fname = ::wxFindFirstFile(_T("/usr/share/i18n/charmaps/*"));
2023 !fname.IsEmpty();
2024 fname = ::wxFindNextFile()) {
2025 wxTextFile cmap(fname);
2026 if (cmap.Open()) {
2027 wxCharacterSet *cset = new wxCharacterSet;
2028 wxString comchar,escchar;
2029 bool in_charset = FALSE;
2030
2031 // wxFprintf(stderr,_T("Loaded: %s\n"),fname.c_str());
2032
2033 wxString line;
2034 for (line = cmap.GetFirstLine();
2035 !cmap.Eof();
2036 line = cmap.GetNextLine()) {
2037 // wxFprintf(stderr,_T("line contents: %s\n"),line.c_str());
2038 wxStringTokenizer token(line);
2039 wxString cmd = token.GetNextToken();
2040 if (cmd == comchar) {
2041 if (token.GetNextToken() == _T("alias"))
2042 cset->names.Add(token.GetNextToken());
2043 }
2044 else if (cmd == _T("<code_set_name>"))
2045 cset->names.Add(token.GetNextToken());
2046 else if (cmd == _T("<comment_char>"))
2047 comchar = token.GetNextToken();
2048 else if (cmd == _T("<escape_char>"))
2049 escchar = token.GetNextToken();
2050 else if (cmd == _T("<mb_cur_min>")) {
2051 delete cset;
2052 cset = (wxCharacterSet *) NULL;
2053 break; // we don't support multibyte charsets ourselves (yet)
2054 }
2055 else if (cmd == _T("CHARMAP")) {
2056 cset->data = (wchar_t *)calloc(256, sizeof(wchar_t));
2057 in_charset = TRUE;
2058 }
2059 else if (cmd == _T("END")) {
2060 if (token.GetNextToken() == _T("CHARMAP"))
2061 in_charset = FALSE;
2062 }
2063 else if (in_charset) {
2064 // format: <NUL> /x00 <U0000> NULL (NUL)
2065 // <A> /x41 <U0041> LATIN CAPITAL LETTER A
2066 wxString hex = token.GetNextToken();
2067 // skip whitespace (why doesn't wxStringTokenizer do this?)
2068 while (wxIsEmpty(hex) && token.HasMoreTokens()) hex = token.GetNextToken();
2069 wxString uni = token.GetNextToken();
2070 // skip whitespace again
2071 while (wxIsEmpty(uni) && token.HasMoreTokens()) uni = token.GetNextToken();
2072
2073 if ((hex.Len() > 2) && (hex.GetChar(0) == escchar) && (hex.GetChar(1) == _T('x')) &&
2074 (uni.Left(2) == _T("<U"))) {
2075 hex.MakeUpper(); uni.MakeUpper();
2076 int pos = ::wxHexToDec(hex.Mid(2,2));
2077 if (pos>=0) {
2078 unsigned long uni1 = ::wxHexToDec(uni.Mid(2,2));
2079 unsigned long uni2 = ::wxHexToDec(uni.Mid(4,2));
2080 cset->data[pos] = (uni1 << 16) | uni2;
2081 // wxFprintf(stderr,_T("char %02x mapped to %04x (%c)\n"),pos,cset->data[pos],cset->data[pos]);
2082 }
2083 }
2084 }
2085 }
2086 if (cset) {
2087 cset->names.Shrink();
2088 wxCharsets.Add(cset);
2089 }
2090 }
2091 }
2092 #endif
2093 wxCharsets.Shrink();
2094 }
2095
2096 static wxCharacterSet *wxFindCharacterSet(const wxChar *charset)
2097 {
2098 if (!charset) return (wxCharacterSet *)NULL;
2099 wxLoadCharacterSets();
2100 for (size_t n=0; n<wxCharsets.GetCount(); n++)
2101 if (wxCharsets[n].names.Index(charset) != wxNOT_FOUND)
2102 return &(wxCharsets[n]);
2103 return (wxCharacterSet *)NULL;
2104 }
2105
2106 WXDLLEXPORT_DATA(wxCSConv) wxConvLocal((const wxChar *)NULL);
2107
2108 wxCSConv::wxCSConv(const wxChar *charset)
2109 {
2110 m_name = (wxChar *) NULL;
2111 m_cset = (wxCharacterSet *) NULL;
2112 m_deferred = TRUE;
2113 SetName(charset);
2114 }
2115
2116 wxCSConv::~wxCSConv()
2117 {
2118 if (m_name) free(m_name);
2119 }
2120
2121 void wxCSConv::SetName(const wxChar *charset)
2122 {
2123 if (charset) {
2124 #ifdef __UNIX__
2125 // first, convert the character set name to standard form
2126 wxString codeset;
2127 if (wxString(charset,3).CmpNoCase(_T("ISO")) == 0) {
2128 // make sure it's represented in the standard form: ISO_8859-1
2129 codeset = _T("ISO_");
2130 charset += 3;
2131 if ((*charset == _T('-')) || (*charset == _T('_'))) charset++;
2132 if (wxStrlen(charset)>4) {
2133 if (wxString(charset,4) == _T("8859")) {
2134 codeset << _T("8859-");
2135 if (*charset == _T('-')) charset++;
2136 }
2137 }
2138 }
2139 codeset << charset;
2140 codeset.MakeUpper();
2141 m_name = wxStrdup(codeset.c_str());
2142 m_deferred = TRUE;
2143 #endif
2144 }
2145 }
2146
2147 void wxCSConv::LoadNow()
2148 {
2149 // wxPrintf(_T("Conversion request\n"));
2150 if (m_deferred) {
2151 if (!m_name) {
2152 #ifdef __UNIX__
2153 wxChar *lang = wxGetenv(_T("LANG"));
2154 wxChar *dot = lang ? wxStrchr(lang, _T('.')) : (wxChar *)NULL;
2155 if (dot) SetName(dot+1);
2156 #endif
2157 }
2158 m_cset = wxFindCharacterSet(m_name);
2159 m_deferred = FALSE;
2160 }
2161 }
2162
2163 size_t wxCSConv::MB2WC(wchar_t *buf, const char *psz, size_t n) const
2164 {
2165 ((wxCSConv *)this)->LoadNow(); // discard constness
2166 if (buf) {
2167 if (m_cset) {
2168 for (size_t c=0; c<n; c++)
2169 buf[c] = m_cset->data[(unsigned char)(psz[c])];
2170 } else {
2171 // latin-1 (direct)
2172 for (size_t c=0; c<n; c++)
2173 buf[c] = (unsigned char)(psz[c]);
2174 }
2175 return n;
2176 }
2177 return strlen(psz);
2178 }
2179
2180 size_t wxCSConv::WC2MB(char *buf, const wchar_t *psz, size_t n) const
2181 {
2182 ((wxCSConv *)this)->LoadNow(); // discard constness
2183 if (buf) {
2184 if (m_cset) {
2185 for (size_t c=0; c<n; c++) {
2186 size_t n;
2187 for (n=0; (n<256) && (m_cset->data[n] != psz[c]); n++);
2188 buf[c] = (n>0xff) ? '?' : n;
2189 }
2190 } else {
2191 // latin-1 (direct)
2192 for (size_t c=0; c<n; c++)
2193 buf[c] = (psz[c]>0xff) ? '?' : psz[c];
2194 }
2195 return n;
2196 }
2197 return wcslen(psz);
2198 }
2199
2200 #endif//wxUSE_WCHAR_T
2201
2202 #if wxUSE_WCHAR_T
2203 const wxWCharBuffer wxMBConv::cMB2WC(const char *psz) const
2204 {
2205 if (psz) {
2206 size_t nLen = MB2WC((wchar_t *) NULL, psz, 0);
2207 wxWCharBuffer buf(nLen);
2208 MB2WC(WCSTRINGCAST buf, psz, nLen);
2209 return buf;
2210 } else return wxWCharBuffer((wchar_t *) NULL);
2211 }
2212
2213 const wxCharBuffer wxMBConv::cWC2MB(const wchar_t *psz) const
2214 {
2215 if (psz) {
2216 size_t nLen = WC2MB((char *) NULL, psz, 0);
2217 wxCharBuffer buf(nLen);
2218 WC2MB(MBSTRINGCAST buf, psz, nLen);
2219 return buf;
2220 } else return wxCharBuffer((char *) NULL);
2221 }
2222
2223 #endif//wxUSE_WCHAR_T
2224