]> git.saurik.com Git - wxWidgets.git/blame - docs/latex/wx/mbconv.tex
Patches-1851591 ] dataview sample is crashing (under MSW)
[wxWidgets.git] / docs / latex / wx / mbconv.tex
CommitLineData
eec47cc6
VZ
1%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
2%% Name: mbconv.tex
3%% Purpose: wxMBConv documentation
4%% Author: Ove Kaaven, Vadim Zeitlin
5%% Created: 2000-03-25
6%% RCS-ID: $Id$
7%% Copyright: (c) 2000 Ove Kaaven
8%% (c) 2003-2006 Vadim Zeitlin
9%% License: wxWindows license
10%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
11
f6bcfd97
BP
12
13\section{\class{wxMBConv}}\label{wxmbconv}
14
15This class is the base class of a hierarchy of classes capable of converting
eec47cc6
VZ
16text strings between multibyte (SBCS or DBCS) encodings and Unicode.
17
18In the documentation for this and related classes please notice that
19\emph{length} of the string refers to the number of characters in the string
20not counting the terminating \NUL, if any. While the \emph{size} of the string
5e51fb4c 21is the total number of bytes in the string, including any trailing \NUL.
eec47cc6
VZ
22Thus, length of wide character string \texttt{L"foo"} is $3$ while its size can
23be either $8$ or $16$ depending on whether \texttt{wchar\_t} is $2$ bytes (as
24under Windows) or $4$ (Unix).
25
26\wxheading{Global variables}
27
28There are several predefined instances of this class:
29\begin{twocollist}
30\twocolitem{\textbf{wxConvLibc}}{Uses the standard ANSI C \texttt{mbstowcs()} and
31\texttt{wcstombs()} functions to perform the conversions; thus depends on the
32current locale.}
ef95ce41
VZ
33\twocolitem{\textbf{wxConvLocal}}{Another conversion corresponding to the
34current locale but this one uses the best available conversion.}
d5bef0a3
VZ
35\twocolitem{\textbf{wxConvUI}}{The conversion used for hte standard UI elements
36such as menu items and buttons. This is a pointer which is initially set to
37\texttt{wxConvLocal} as the program uses the current locale by default but can
38be set to some specific conversion if the program needs to use a specific
39encoding for its UI.}
ef95ce41
VZ
40\twocolitem{\textbf{wxConvISO8859\_1}}{Conversion to and from ISO-8859-1 (Latin I)
41encoding.}
42\twocolitem{\textbf{wxConvUTF8}}{Conversion to and from UTF-8 encoding.}
eec47cc6
VZ
43\twocolitem{\textbf{wxConvFile}}{The appropriate conversion for the file names,
44depends on the system.}
ef95ce41 45% \twocolitem{\textbf{wxConvCurrent}}{Not really clear what is it for...}
eec47cc6 46\end{twocollist}
f6bcfd97 47
483b0434
VZ
48
49\wxheading{Constants}
50
51\texttt{wxCONV\_FAILED} value is defined as \texttt{(size\_t)$-1$} and is
52returned by the conversion functions instead of the length of the converted
53string if the conversion fails.
54
55
f6bcfd97
BP
56\wxheading{Derived from}
57
58No base class
59
60\wxheading{Include files}
61
62<wx/strconv.h>
63
a7af285d
VZ
64\wxheading{Library}
65
66\helpref{wxBase}{librarieslist}
67
f6bcfd97
BP
68\wxheading{See also}
69
70\helpref{wxCSConv}{wxcsconv},
71\helpref{wxEncodingConverter}{wxencodingconverter},
72\helpref{wxMBConv classes overview}{mbconvclasses}
73
483b0434 74
f6bcfd97
BP
75\latexignore{\rtfignore{\wxheading{Members}}}
76
77
78\membersection{wxMBConv::wxMBConv}\label{wxmbconvwxmbconv}
79
80\func{}{wxMBConv}{\void}
81
483b0434
VZ
82Trivial default constructor.
83
f6bcfd97 84
429e2bb2
VZ
85\membersection{wxMBConv::Clone}\label{wxmbconvclone}
86
87\constfunc{virtual wxMBConv *}{Clone}{\void}
88
89This pure virtual function is overridden in each of the derived classes to
90return a new copy of the object it is called on. It is used for copying the
91conversion objects while preserving their dynamic type.
92
93
f6bcfd97
BP
94\membersection{wxMBConv::MB2WC}\label{wxmbconvmb2wc}
95
eec47cc6
VZ
96\constfunc{virtual size\_t}{MB2WC}{\param{wchar\_t *}{out}, \param{const char *}{in}, \param{size\_t }{outLen}}
97
483b0434
VZ
98\deprecated{\helpref{ToWChar}{wxmbconvtowchar}}
99
eec47cc6
VZ
100Converts from a string \arg{in} in multibyte encoding to Unicode putting up to
101\arg{outLen} characters into the buffer \arg{out}.
f6bcfd97 102
eec47cc6
VZ
103If \arg{out} is \NULL, only the length of the string which would result from
104the conversion is calculated and returned. Note that this is the length and not
105size, i.e. the returned value does \emph{not} include the trailing \NUL. But
106when the function is called with a non-\NULL \arg{out} buffer, the \arg{outLen}
107parameter should be one more to allow to properly \NUL-terminate the string.
2b5f62a0
VZ
108
109\wxheading{Parameters}
110
eec47cc6 111\docparam{out}{The output buffer, may be \NULL if the caller is only
2b5f62a0
VZ
112interested in the length of the resulting string}
113
eec47cc6 114\docparam{in}{The \NUL-terminated input string, cannot be \NULL}
2b5f62a0 115
eec47cc6
VZ
116\docparam{outLen}{The length of the output buffer but \emph{including}
117\NUL, ignored if \arg{out} is \NULL}
2b5f62a0
VZ
118
119\wxheading{Return value}
120
5e51fb4c 121The length of the converted string \emph{excluding} the trailing \NUL.
eec47cc6 122
f6bcfd97
BP
123
124\membersection{wxMBConv::WC2MB}\label{wxmbconvwc2mb}
125
126\constfunc{virtual size\_t}{WC2MB}{\param{char* }{buf}, \param{const wchar\_t* }{psz}, \param{size\_t }{n}}
127
483b0434
VZ
128\deprecated{\helpref{FromWChar}{wxmbconvfromwchar}}
129
2b5f62a0
VZ
130Converts from Unicode to multibyte encoding. The semantics of this function
131(including the return value meaning) is the same as for
132\helpref{MB2WC}{wxmbconvmb2wc}.
133
eec47cc6
VZ
134Notice that when the function is called with a non-\NULL buffer, the
135{\it n} parameter should be the size of the buffer and so it \emph{should} take
5e51fb4c 136into account the trailing \NUL, which might take two or four bytes for some
eec47cc6
VZ
137encodings (UTF-16 and UTF-32) and not one.
138
f6bcfd97
BP
139
140\membersection{wxMBConv::cMB2WC}\label{wxmbconvcmb2wc}
141
eec47cc6
VZ
142\constfunc{const wxWCharBuffer}{cMB2WC}{\param{const char *}{in}}
143
144\constfunc{const wxWCharBuffer}{cMB2WC}{\param{const char *}{in}, \param{size\_t }{inLen}, \param{size\_t }{*outLen}}
145
146Converts from multibyte encoding to Unicode by calling
147\helpref{MB2WC}{wxmbconvmb2wc}, allocating a temporary wxWCharBuffer to hold
148the result.
149
150The first overload takes a \NUL-terminated input string. The second one takes a
151string of exactly the specified length and the string may include or not the
5e51fb4c 152trailing \NUL character(s). If the string is not \NUL-terminated, a temporary
eec47cc6
VZ
153\NUL-terminated copy of it suitable for passing to \helpref{MB2WC}{wxmbconvmb2wc}
154is made, so it is more efficient to ensure that the string is does have the
155appropriate number of \NUL bytes (which is usually $1$ but may be $2$ or $4$
7ef3ab50
VZ
156for UTF-16 or UTF-32, see \helpref{GetMBNulLen}{wxmbconvgetmbnullen}),
157especially for long strings.
eec47cc6
VZ
158
159If \arg{outLen} is not-\NULL, it receives the length of the converted
160string.
f6bcfd97 161
f6bcfd97
BP
162
163\membersection{wxMBConv::cWC2MB}\label{wxmbconvcwc2mb}
164
eec47cc6
VZ
165\constfunc{const wxCharBuffer}{cWC2MB}{\param{const wchar\_t* }{in}}
166
167\constfunc{const wxCharBuffer}{cWC2MB}{\param{const wchar\_t* }{in}, \param{size\_t }{inLen}, \param{size\_t }{*outLen}}
f6bcfd97
BP
168
169Converts from Unicode to multibyte encoding by calling WC2MB,
170allocating a temporary wxCharBuffer to hold the result.
171
eec47cc6
VZ
172The second overload of this function allows to convert a string of the given
173length \arg{inLen}, whether it is \NUL-terminated or not (for wide character
174strings, unlike for the multibyte ones, a single \NUL is always enough).
175But notice that just as with \helpref{cMB2WC}{wxmbconvmb2wc}, it is more
176efficient to pass an already terminated string to this function as otherwise a
177copy is made internally.
178
179If \arg{outLen} is not-\NULL, it receives the length of the converted
180string.
181
182
f6bcfd97
BP
183\membersection{wxMBConv::cMB2WX}\label{wxmbconvcmb2wx}
184
185\constfunc{const char*}{cMB2WX}{\param{const char* }{psz}}
186
187\constfunc{const wxWCharBuffer}{cMB2WX}{\param{const char* }{psz}}
188
189Converts from multibyte encoding to the current wxChar type
190(which depends on whether wxUSE\_UNICODE is set to 1). If wxChar is char,
191it returns the parameter unaltered. If wxChar is wchar\_t, it returns the
192result in a wxWCharBuffer. The macro wxMB2WXbuf is defined as the correct
193return type (without const).
194
eec47cc6 195
f6bcfd97
BP
196\membersection{wxMBConv::cWX2MB}\label{wxmbconvcwx2mb}
197
198\constfunc{const char*}{cWX2MB}{\param{const wxChar* }{psz}}
199
200\constfunc{const wxCharBuffer}{cWX2MB}{\param{const wxChar* }{psz}}
201
202Converts from the current wxChar type to multibyte encoding. If wxChar is char,
203it returns the parameter unaltered. If wxChar is wchar\_t, it returns the
204result in a wxCharBuffer. The macro wxWX2MBbuf is defined as the correct
205return type (without const).
206
eec47cc6 207
f6bcfd97
BP
208\membersection{wxMBConv::cWC2WX}\label{wxmbconvcwc2wx}
209
210\constfunc{const wchar\_t*}{cWC2WX}{\param{const wchar\_t* }{psz}}
211
212\constfunc{const wxCharBuffer}{cWC2WX}{\param{const wchar\_t* }{psz}}
213
214Converts from Unicode to the current wxChar type. If wxChar is wchar\_t,
215it returns the parameter unaltered. If wxChar is char, it returns the
216result in a wxCharBuffer. The macro wxWC2WXbuf is defined as the correct
217return type (without const).
218
eec47cc6 219
f6bcfd97
BP
220\membersection{wxMBConv::cWX2WC}\label{wxmbconvcwx2wc}
221
222\constfunc{const wchar\_t*}{cWX2WC}{\param{const wxChar* }{psz}}
223
224\constfunc{const wxWCharBuffer}{cWX2WC}{\param{const wxChar* }{psz}}
225
226Converts from the current wxChar type to Unicode. If wxChar is wchar\_t,
227it returns the parameter unaltered. If wxChar is char, it returns the
228result in a wxWCharBuffer. The macro wxWX2WCbuf is defined as the correct
229return type (without const).
230
7ef3ab50 231
483b0434
VZ
232\membersection{wxMBConv::FromWChar}\label{wxmbconvfromwchar}
233
13b55525 234\constfunc{virtual size\_t}{FromWChar}{\param{char\_t *}{dst}, \param{size\_t }{dstLen}, \param{const wchar\_t *}{src}, \param{size\_t }{srcLen = wxNO\_LEN}}
483b0434 235
13b55525
JS
236This function has the same semantics as \helpref{ToWChar}{wxmbconvtowchar}
237except that it converts a wide string to multibyte one.
483b0434
VZ
238
239\membersection{wxMBConv::GetMaxMBNulLen}\label{wxmbconvgetmaxmbnullen}
240
241\func{const size\_t}{GetMaxMBNulLen}{\void}
242
243Returns the maximal value which can be returned by
244\helpref{GetMBNulLen}{wxmbconvgetmbnullen} for any conversion object. Currently
245this value is $4$.
246
247This method can be used to allocate the buffer with enough space for the
248trailing \NUL characters for any encoding.
249
250
7ef3ab50
VZ
251\membersection{wxMBConv::GetMBNulLen}\label{wxmbconvgetmbnullen}
252
253\constfunc{size\_t}{GetMBNulLen}{\void}
254
255This function returns $1$ for most of the multibyte encodings in which the
256string is terminated by a single \NUL, $2$ for UTF-16 and $4$ for UTF-32 for
257which the string is terminated with $2$ and $4$ \NUL characters respectively.
21de14b3
VZ
258The other cases are not currently supported and \texttt{wxCONV\_FAILED}
259(defined as $-1$) is returned for them.
7ef3ab50
VZ
260
261
483b0434
VZ
262\membersection{wxMBConv::ToWChar}\label{wxmbconvtowchar}
263
13b55525 264\constfunc{virtual size\_t}{ToWChar}{\param{wchar\_t *}{dst}, \param{size\_t }{dstLen}, \param{const char *}{src}, \param{size\_t }{srcLen = wxNO\_LEN}}
483b0434 265
13b55525
JS
266The most general function for converting a multibyte string to a wide string.
267The main case is when \arg{dst} is not \NULL and \arg{srcLen} is not
268\texttt{wxNO\_LEN} (which is defined as \texttt{(size\_t)$-1$}): then
269the function converts exactly \arg{srcLen} bytes starting at \arg{src} into
270wide string which it output to \arg{dst}. If the length of the resulting wide
271string is greater than \arg{dstLen}, an error is returned. Note that if
272\arg{srcLen} bytes don't include \NUL characters, the resulting wide string is
273not \NUL-terminated neither.
483b0434 274
13b55525
JS
275If \arg{srcLen} is \texttt{wxNO\_LEN}, the function supposes that the string is
276properly (i.e. as necessary for the encoding handled by this conversion)
277\NUL-terminated and converts the entire string, including any trailing \NUL
278bytes. In this case the wide string is also \NUL-terminated.
279
280Finally, if \arg{dst} is \NULL, the function returns the length of the needed
281buffer.
282
283\wxheading{Return value}
284
285The number of characters written to \arg{dst} (or the number of characters
286which would have been written to it if it were non-\NULL) on success or
287\texttt{wxCONV\_FAILED} on error.
483b0434 288
f1e589cd 289