]>
git.saurik.com Git - wxWidgets.git/blob - src/common/unichar.cpp
1 /////////////////////////////////////////////////////////////////////////////
2 // Name: src/common/unichar.cpp
3 // Purpose: wxUniChar and wxUniCharRef classes
4 // Author: Vaclav Slavik
7 // Copyright: (c) 2007 REA Elektronik GmbH
8 // Licence: wxWindows licence
9 ///////////////////////////////////////////////////////////////////////////////
11 // ===========================================================================
13 // ===========================================================================
15 // For compilers that support precompilation, includes "wx.h".
16 #include "wx/wxprec.h"
23 #include "wx/strconv.h" // wxConvLibc
27 #include "wx/unichar.h"
28 #include "wx/string.h"
30 // ===========================================================================
32 // ===========================================================================
34 // ---------------------------------------------------------------------------
35 // wxUniChar
36 // ---------------------------------------------------------------------------
// Convert the single char c to a wxUniChar::value_type.
//
// NOTE(review): this listing has lost lines (the braces, the #else/#endif of
// the conditional below and the declaration of buf), so only the statements
// that are actually visible are described here.
39 wxUniChar::value_type
wxUniChar::FromHi8bit(char c
)
41 #if wxUSE_UTF8_LOCALE_ONLY
// UTF-8-only-locale build: report the problem through wxFAIL_MSG and return
// '?' as the failure character.
42 wxFAIL_MSG( "invalid UTF-8 character" );
45 return wxT('?'); // FIXME-UTF8: what to use as failure character?
// Presumably the #else branch: let wxConvLibc convert the one input byte into
// buf (capacity 2). A result other than 2 leads to the failure path below
// (presumably 2 == one converted character plus the terminating NUL -- TODO
// confirm against the wxMBConv::ToWChar() contract).
48 if ( wxConvLibc
.ToWChar(buf
, 2, &c
, 1) != 2 )
50 wxFAIL_MSG( "invalid multibyte character" );
51 return wxT('?'); // FIXME-UTF8: what to use as failure character?
// Convert the wxUniChar::value_type c to a single char.
//
// NOTE(review): this listing has lost lines (the braces, the #else/#endif of
// the conditional below and the declarations of buf and in), so only the
// statements that are actually visible are described here.
58 char wxUniChar::ToHi8bit(wxUniChar::value_type c
)
60 #if wxUSE_UTF8_LOCALE_ONLY
// UTF-8-only-locale build: report the problem through wxFAIL_MSG and return
// '?' as the failure character.
61 wxFAIL_MSG( "character cannot be converted to single UTF-8 byte" );
64 return '?'; // FIXME-UTF8: what to use as failure character?
// Presumably the #else branch: let wxConvLibc convert the one wide character
// at &in into buf (capacity 2). A result other than 2 leads to the failure
// path below (presumably 2 == one output byte plus the terminating NUL --
// TODO confirm against the wxMBConv::FromWChar() contract).
68 if ( wxConvLibc
.FromWChar(buf
, 2, &in
, 1) != 2 )
70 wxFAIL_MSG( "character cannot be converted to single byte" );
71 return '?'; // FIXME-UTF8: what to use as failure character?
78 // ---------------------------------------------------------------------------
79 // wxUniCharRef
80 // ---------------------------------------------------------------------------
82 #if wxUSE_UNICODE_UTF8
// Return the character this reference points at, obtained by passing m_pos to
// wxStringOperations::DecodeChar().
// NOTE(review): the enclosing braces are missing from this listing.
83 wxUniChar
wxUniCharRef::UniChar() const
85 return wxStringOperations::DecodeChar(m_pos
);
// Assign the character c to the position m_pos of the referenced string
// (UTF-8 build only, see the surrounding #if wxUSE_UNICODE_UTF8).
//
// Two cases are handled: the UTF-8 encoding of c has the same length as the
// encoding currently stored at m_pos, or the length differs and the string
// has to be modified with replace(), after which all registered iterators
// are re-pointed into the string.
//
// NOTE(review): this listing has lost lines (all braces, the declarations of
// pos, iterNum and i, several loop bodies and the final return), so comments
// below describe only what is visible and hedge the rest.
88 wxUniCharRef
& wxUniCharRef::operator=(const wxUniChar
& c
)
// Encode the new character as UTF-8.
90 wxStringOperations::Utf8CharBuffer
utf(wxStringOperations::EncodeChar(c
));
// Encoded lengths of the old and the new character, each derived from the
// first byte of the respective encoding.
91 size_t lenOld
= wxStringOperations::GetUtf8CharLength(*m_pos
);
92 size_t lenNew
= wxStringOperations::GetUtf8CharLength(utf
[0]);
94 if ( lenNew
== lenOld
)
96 // this is the simpler case: if the new value's UTF-8 code has the
97 // same length, we can just replace it:
// NOTE(review): the declaration of pos and the loop body are missing from
// this listing; presumably the body copies utf[i] to *pos -- confirm.
100 for ( size_t i
= 0; i
< lenNew
; ++i
, ++pos
)
103 else // length of character encoding in UTF-8 changed
105 // the worse case is when the new value has either longer or shorter
106 // code -- in that case, we have to use wxStringImpl::replace() and
107 // this invalidates all iterators, so we have to update them too:
109 wxStringImpl
& strimpl
= m_str
.m_impl
;
// Difference between the new and the old encoded length; the two lengths
// differ in this branch, so the value is non-zero.
111 int iterDiff
= lenNew
- lenOld
;
// Offset of the character being replaced from the start of the string.
112 size_t posIdx
= m_pos
- strimpl
.begin();
114 // compute positions of outstanding iterators for this string after the
115 // replacement is done (there is only a small number of iterators at
116 // any time, so we use an array on the stack to avoid unneeded
// heap allocation):
118 static const size_t STATIC_SIZE
= 32;
119 size_t indexes_a
[STATIC_SIZE
];
// indexes points at the stack array unless the list turns out to be longer
// than STATIC_SIZE (see below).
120 size_t *indexes
= indexes_a
;
// Walk the linked list of iterator nodes registered with the string, counting
// them in iterNum (its declaration is missing from this listing).
122 wxStringIteratorNode
*it
;
123 for ( it
= m_str
.m_iterators
.ptr
; it
; it
= it
->m_next
, ++iterNum
)
// Every node must carry either a non-const or a const iterator pointer.
125 wxASSERT( it
->m_iter
|| it
->m_citer
);
// The stack array is full: log it, count the remaining nodes and switch to a
// heap array, carrying over the STATIC_SIZE entries recorded so far.
127 if ( iterNum
== STATIC_SIZE
)
129 wxLogTrace( _T("utf8"), _T("unexpectedly many iterators") );
// NOTE(review): the body of the counting loop below is missing from this
// listing; presumably it increments total once per remaining node -- confirm.
131 size_t total
= iterNum
+ 1;
132 for ( wxStringIteratorNode
*it2
= it
; it2
; it2
= it2
->m_next
)
134 indexes
= new size_t[total
];
135 memcpy(indexes
, indexes_a
, sizeof(size_t) * STATIC_SIZE
);
// Offset of this iterator from the start of the string, taken from whichever
// of m_iter / m_citer is set.
138 size_t idx
= it
->m_iter
139 ? (*it
->m_iter
- strimpl
.begin())
140 : (*it
->m_citer
- strimpl
.begin());
// NOTE(review): lines between the computation of idx and the store below are
// missing from this listing; presumably idx is shifted by iterDiff for
// iterators located after posIdx -- confirm against the full file.
145 indexes
[iterNum
] = idx
;
148 // update the string:
149 strimpl
.replace(m_pos
, m_pos
+ lenOld
, utf
, lenNew
);
151 #if wxUSE_STRING_POS_CACHE
152 m_str
.InvalidateCache();
153 #endif // wxUSE_STRING_POS_CACHE
155 // finally, set the iterators to valid values again (note that this
156 // updates m_pos as well):
// Second walk over the same list, in the same order, so indexes[i] belongs to
// the i-th node (the declaration of i is missing from this listing).
158 for ( i
= 0, it
= m_str
.m_iterators
.ptr
; it
; it
= it
->m_next
, ++i
)
160 wxASSERT( i
< iterNum
);
161 wxASSERT( it
->m_iter
|| it
->m_citer
);
// NOTE(review): the condition selecting between the two assignments below is
// missing from this listing; presumably it tests which of m_iter / m_citer is
// set, as in the first loop -- confirm.
164 *it
->m_iter
= strimpl
.begin() + indexes
[i
];
166 *it
->m_citer
= strimpl
.begin() + indexes
[i
];
// NOTE(review): the statement guarded by this test is missing from this
// listing; presumably it releases the heap array allocated with new[] above
// -- confirm.
169 if ( indexes
!= indexes_a
)
175 #endif // wxUSE_UNICODE_UTF8