]>
Commit | Line | Data |
---|---|---|
1 | %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% | |
2 | %% Name: mbconv.tex | |
3 | %% Purpose: wxMBConv documentation | |
4 | %% Author: Ove Kaaven, Vadim Zeitlin | |
5 | %% Created: 2000-03-25 | |
6 | %% RCS-ID: $Id$ | |
7 | %% Copyright: (c) 2000 Ove Kaaven | |
8 | %% (c) 2003-2006 Vadim Zeitlin | |
9 | %% License: wxWindows license | |
10 | %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% | |
11 | ||
12 | ||
13 | \section{\class{wxMBConv}}\label{wxmbconv} | |
14 | ||
15 | This class is the base class of a hierarchy of classes capable of converting | |
16 | text strings between multibyte (SBCS or DBCS) encodings and Unicode. | |
17 | ||
18 | In the documentation for this and related classes please notice that | |
19 | \emph{length} of the string refers to the number of characters in the string | |
20 | not counting the terminating \NUL, if any. While the \emph{size} of the string | |
21 | is the total number of bytes in the string, including any trailing \NUL. | |
22 | Thus, length of wide character string \texttt{L"foo"} is $3$ while its size can | |
23 | be either $8$ or $16$ depending on whether \texttt{wchar\_t} is $2$ bytes (as | |
24 | under Windows) or $4$ (Unix). | |
25 | ||
26 | \wxheading{Global variables} | |
27 | ||
28 | There are several predefined instances of this class: | |
29 | \begin{twocollist} | |
30 | \twocolitem{\textbf{wxConvLibc}}{Uses the standard ANSI C \texttt{mbstowcs()} and | |
31 | \texttt{wcstombs()} functions to perform the conversions; thus depends on the | |
32 | current locale.} | |
33 | \twocolitem{\textbf{wxConvLocal}}{Another conversion corresponding to the | |
34 | current locale but this one uses the best available conversion.} | |
35 | \twocolitem{\textbf{wxConvUI}}{The conversion used for hte standard UI elements | |
36 | such as menu items and buttons. This is a pointer which is initially set to | |
37 | \texttt{wxConvLocal} as the program uses the current locale by default but can | |
38 | be set to some specific conversion if the program needs to use a specific | |
39 | encoding for its UI.} | |
40 | \twocolitem{\textbf{wxConvISO8859\_1}}{Conversion to and from ISO-8859-1 (Latin I) | |
41 | encoding.} | |
42 | \twocolitem{\textbf{wxConvUTF8}}{Conversion to and from UTF-8 encoding.} | |
43 | \twocolitem{\textbf{wxConvFile}}{The appropriate conversion for the file names, | |
44 | depends on the system.} | |
45 | % \twocolitem{\textbf{wxConvCurrent}}{Not really clear what is it for...} | |
46 | \end{twocollist} | |
47 | ||
48 | ||
49 | \wxheading{Constants} | |
50 | ||
51 | \texttt{wxCONV\_FAILED} value is defined as \texttt{(size\_t)$-1$} and is | |
52 | returned by the conversion functions instead of the length of the converted | |
53 | string if the conversion fails. | |
54 | ||
55 | ||
56 | \wxheading{Derived from} | |
57 | ||
58 | No base class | |
59 | ||
60 | \wxheading{Include files} | |
61 | ||
62 | <wx/strconv.h> | |
63 | ||
64 | \wxheading{Library} | |
65 | ||
66 | \helpref{wxBase}{librarieslist} | |
67 | ||
68 | \wxheading{See also} | |
69 | ||
70 | \helpref{wxCSConv}{wxcsconv}, | |
71 | \helpref{wxEncodingConverter}{wxencodingconverter}, | |
72 | \helpref{wxMBConv classes overview}{mbconvclasses} | |
73 | ||
74 | ||
75 | \latexignore{\rtfignore{\wxheading{Members}}} | |
76 | ||
77 | ||
78 | \membersection{wxMBConv::wxMBConv}\label{wxmbconvwxmbconv} | |
79 | ||
80 | \func{}{wxMBConv}{\void} | |
81 | ||
82 | Trivial default constructor. | |
83 | ||
84 | ||
85 | \membersection{wxMBConv::MB2WC}\label{wxmbconvmb2wc} | |
86 | ||
87 | \constfunc{virtual size\_t}{MB2WC}{\param{wchar\_t *}{out}, \param{const char *}{in}, \param{size\_t }{outLen}} | |
88 | ||
89 | \deprecated{\helpref{ToWChar}{wxmbconvtowchar}} | |
90 | ||
91 | Converts from a string \arg{in} in multibyte encoding to Unicode putting up to | |
92 | \arg{outLen} characters into the buffer \arg{out}. | |
93 | ||
94 | If \arg{out} is \NULL, only the length of the string which would result from | |
95 | the conversion is calculated and returned. Note that this is the length and not | |
96 | size, i.e. the returned value does \emph{not} include the trailing \NUL. But | |
97 | when the function is called with a non-\NULL \arg{out} buffer, the \arg{outLen} | |
98 | parameter should be one more to allow to properly \NUL-terminate the string. | |
99 | ||
100 | \wxheading{Parameters} | |
101 | ||
102 | \docparam{out}{The output buffer, may be \NULL if the caller is only | |
103 | interested in the length of the resulting string} | |
104 | ||
105 | \docparam{in}{The \NUL-terminated input string, cannot be \NULL} | |
106 | ||
107 | \docparam{outLen}{The length of the output buffer but \emph{including} | |
108 | \NUL, ignored if \arg{out} is \NULL} | |
109 | ||
110 | \wxheading{Return value} | |
111 | ||
112 | The length of the converted string \emph{excluding} the trailing \NUL. | |
113 | ||
114 | ||
115 | \membersection{wxMBConv::WC2MB}\label{wxmbconvwc2mb} | |
116 | ||
117 | \constfunc{virtual size\_t}{WC2MB}{\param{char* }{buf}, \param{const wchar\_t* }{psz}, \param{size\_t }{n}} | |
118 | ||
119 | \deprecated{\helpref{FromWChar}{wxmbconvfromwchar}} | |
120 | ||
121 | Converts from Unicode to multibyte encoding. The semantics of this function | |
122 | (including the return value meaning) is the same as for | |
123 | \helpref{MB2WC}{wxmbconvmb2wc}. | |
124 | ||
125 | Notice that when the function is called with a non-\NULL buffer, the | |
126 | {\it n} parameter should be the size of the buffer and so it \emph{should} take | |
127 | into account the trailing \NUL, which might take two or four bytes for some | |
128 | encodings (UTF-16 and UTF-32) and not one. | |
129 | ||
130 | ||
131 | \membersection{wxMBConv::cMB2WC}\label{wxmbconvcmb2wc} | |
132 | ||
133 | \constfunc{const wxWCharBuffer}{cMB2WC}{\param{const char *}{in}} | |
134 | ||
135 | \constfunc{const wxWCharBuffer}{cMB2WC}{\param{const char *}{in}, \param{size\_t }{inLen}, \param{size\_t }{*outLen}} | |
136 | ||
137 | Converts from multibyte encoding to Unicode by calling | |
138 | \helpref{MB2WC}{wxmbconvmb2wc}, allocating a temporary wxWCharBuffer to hold | |
139 | the result. | |
140 | ||
141 | The first overload takes a \NUL-terminated input string. The second one takes a | |
142 | string of exactly the specified length and the string may include or not the | |
143 | trailing \NUL character(s). If the string is not \NUL-terminated, a temporary | |
144 | \NUL-terminated copy of it suitable for passing to \helpref{MB2WC}{wxmbconvmb2wc} | |
145 | is made, so it is more efficient to ensure that the string is does have the | |
146 | appropriate number of \NUL bytes (which is usually $1$ but may be $2$ or $4$ | |
147 | for UTF-16 or UTF-32, see \helpref{GetMBNulLen}{wxmbconvgetmbnullen}), | |
148 | especially for long strings. | |
149 | ||
150 | If \arg{outLen} is not-\NULL, it receives the length of the converted | |
151 | string. | |
152 | ||
153 | ||
154 | \membersection{wxMBConv::cWC2MB}\label{wxmbconvcwc2mb} | |
155 | ||
156 | \constfunc{const wxCharBuffer}{cWC2MB}{\param{const wchar\_t* }{in}} | |
157 | ||
158 | \constfunc{const wxCharBuffer}{cWC2MB}{\param{const wchar\_t* }{in}, \param{size\_t }{inLen}, \param{size\_t }{*outLen}} | |
159 | ||
160 | Converts from Unicode to multibyte encoding by calling WC2MB, | |
161 | allocating a temporary wxCharBuffer to hold the result. | |
162 | ||
163 | The second overload of this function allows to convert a string of the given | |
164 | length \arg{inLen}, whether it is \NUL-terminated or not (for wide character | |
165 | strings, unlike for the multibyte ones, a single \NUL is always enough). | |
166 | But notice that just as with \helpref{cMB2WC}{wxmbconvmb2wc}, it is more | |
167 | efficient to pass an already terminated string to this function as otherwise a | |
168 | copy is made internally. | |
169 | ||
170 | If \arg{outLen} is not-\NULL, it receives the length of the converted | |
171 | string. | |
172 | ||
173 | ||
174 | \membersection{wxMBConv::cMB2WX}\label{wxmbconvcmb2wx} | |
175 | ||
176 | \constfunc{const char*}{cMB2WX}{\param{const char* }{psz}} | |
177 | ||
178 | \constfunc{const wxWCharBuffer}{cMB2WX}{\param{const char* }{psz}} | |
179 | ||
180 | Converts from multibyte encoding to the current wxChar type | |
181 | (which depends on whether wxUSE\_UNICODE is set to 1). If wxChar is char, | |
182 | it returns the parameter unaltered. If wxChar is wchar\_t, it returns the | |
183 | result in a wxWCharBuffer. The macro wxMB2WXbuf is defined as the correct | |
184 | return type (without const). | |
185 | ||
186 | ||
187 | \membersection{wxMBConv::cWX2MB}\label{wxmbconvcwx2mb} | |
188 | ||
189 | \constfunc{const char*}{cWX2MB}{\param{const wxChar* }{psz}} | |
190 | ||
191 | \constfunc{const wxCharBuffer}{cWX2MB}{\param{const wxChar* }{psz}} | |
192 | ||
193 | Converts from the current wxChar type to multibyte encoding. If wxChar is char, | |
194 | it returns the parameter unaltered. If wxChar is wchar\_t, it returns the | |
195 | result in a wxCharBuffer. The macro wxWX2MBbuf is defined as the correct | |
196 | return type (without const). | |
197 | ||
198 | ||
199 | \membersection{wxMBConv::cWC2WX}\label{wxmbconvcwc2wx} | |
200 | ||
201 | \constfunc{const wchar\_t*}{cWC2WX}{\param{const wchar\_t* }{psz}} | |
202 | ||
203 | \constfunc{const wxCharBuffer}{cWC2WX}{\param{const wchar\_t* }{psz}} | |
204 | ||
205 | Converts from Unicode to the current wxChar type. If wxChar is wchar\_t, | |
206 | it returns the parameter unaltered. If wxChar is char, it returns the | |
207 | result in a wxCharBuffer. The macro wxWC2WXbuf is defined as the correct | |
208 | return type (without const). | |
209 | ||
210 | ||
211 | \membersection{wxMBConv::cWX2WC}\label{wxmbconvcwx2wc} | |
212 | ||
213 | \constfunc{const wchar\_t*}{cWX2WC}{\param{const wxChar* }{psz}} | |
214 | ||
215 | \constfunc{const wxWCharBuffer}{cWX2WC}{\param{const wxChar* }{psz}} | |
216 | ||
217 | Converts from the current wxChar type to Unicode. If wxChar is wchar\_t, | |
218 | it returns the parameter unaltered. If wxChar is char, it returns the | |
219 | result in a wxWCharBuffer. The macro wxWX2WCbuf is defined as the correct | |
220 | return type (without const). | |
221 | ||
222 | ||
223 | \membersection{wxMBConv::FromWChar}\label{wxmbconvfromwchar} | |
224 | ||
225 | \constfunc{virtual size\_t}{FromWChar}{\param{char\_t *}{dst}, \param{size\_t }{dstLen}, \param{const wchar\_t *}{src}, \param{size\_t }{srcLen = wxNO\_LEN}} | |
226 | ||
227 | This function has the same semantics as \helpref{ToWChar}{wxmbconvtowchar} | |
228 | except that it converts a wide string to multibyte one. | |
229 | ||
230 | \membersection{wxMBConv::GetMaxMBNulLen}\label{wxmbconvgetmaxmbnullen} | |
231 | ||
232 | \func{const size\_t}{GetMaxMBNulLen}{\void} | |
233 | ||
234 | Returns the maximal value which can be returned by | |
235 | \helpref{GetMBNulLen}{wxmbconvgetmbnullen} for any conversion object. Currently | |
236 | this value is $4$. | |
237 | ||
238 | This method can be used to allocate the buffer with enough space for the | |
239 | trailing \NUL characters for any encoding. | |
240 | ||
241 | ||
242 | \membersection{wxMBConv::GetMBNulLen}\label{wxmbconvgetmbnullen} | |
243 | ||
244 | \constfunc{size\_t}{GetMBNulLen}{\void} | |
245 | ||
246 | This function returns $1$ for most of the multibyte encodings in which the | |
247 | string is terminated by a single \NUL, $2$ for UTF-16 and $4$ for UTF-32 for | |
248 | which the string is terminated with $2$ and $4$ \NUL characters respectively. | |
249 | The other cases are not currently supported and \texttt{wxCONV\_FAILED} | |
250 | (defined as $-1$) is returned for them. | |
251 | ||
252 | ||
253 | \membersection{wxMBConv::ToWChar}\label{wxmbconvtowchar} | |
254 | ||
255 | \constfunc{virtual size\_t}{ToWChar}{\param{wchar\_t *}{dst}, \param{size\_t }{dstLen}, \param{const char *}{src}, \param{size\_t }{srcLen = wxNO\_LEN}} | |
256 | ||
257 | The most general function for converting a multibyte string to a wide string. | |
258 | The main case is when \arg{dst} is not \NULL and \arg{srcLen} is not | |
259 | \texttt{wxNO\_LEN} (which is defined as \texttt{(size\_t)$-1$}): then | |
260 | the function converts exactly \arg{srcLen} bytes starting at \arg{src} into | |
261 | wide string which it output to \arg{dst}. If the length of the resulting wide | |
262 | string is greater than \arg{dstLen}, an error is returned. Note that if | |
263 | \arg{srcLen} bytes don't include \NUL characters, the resulting wide string is | |
264 | not \NUL-terminated neither. | |
265 | ||
266 | If \arg{srcLen} is \texttt{wxNO\_LEN}, the function supposes that the string is | |
267 | properly (i.e. as necessary for the encoding handled by this conversion) | |
268 | \NUL-terminated and converts the entire string, including any trailing \NUL | |
269 | bytes. In this case the wide string is also \NUL-terminated. | |
270 | ||
271 | Finally, if \arg{dst} is \NULL, the function returns the length of the needed | |
272 | buffer. | |
273 | ||
274 | \wxheading{Return value} | |
275 | ||
276 | The number of characters written to \arg{dst} (or the number of characters | |
277 | which would have been written to it if it were non-\NULL) on success or | |
278 | \texttt{wxCONV\_FAILED} on error. | |
279 | ||
280 |