]> git.saurik.com Git - wxWidgets.git/blame - interface/strconv.h
remove wxTextAttr::CreateFont(); return wxNullFont from GetFont() if we have no font...
[wxWidgets.git] / interface / strconv.h
CommitLineData
23324ae1
FM
1/////////////////////////////////////////////////////////////////////////////
2// Name: strconv.h
3// Purpose: documentation for wxMBConvUTF7 class
4// Author: wxWidgets team
5// RCS-ID: $Id$
6// Licence: wxWindows license
7/////////////////////////////////////////////////////////////////////////////
8
9/**
10 @class wxMBConvUTF7
11 @wxheader{strconv.h}
7c913512 12
23324ae1
FM
13 This class converts between the UTF-7 encoding and Unicode.
14 It has one predefined instance, @b wxConvUTF7.
7c913512 15
23324ae1 16 @b WARNING: this class is not implemented yet.
7c913512 17
23324ae1
FM
18 @library{wxbase}
19 @category{FIXME}
7c913512 20
23324ae1
FM
21 @seealso
22 wxMBConvUTF8, @ref overview_mbconvclasses "wxMBConv classes overview"
23*/
24class wxMBConvUTF7 : public wxMBConv
25{
26public:
27 /**
28 Converts from UTF-7 encoding to Unicode. Returns the size of the destination
29 buffer.
30 */
4cc4bfaf 31 size_t MB2WC(wchar_t* buf, const char* psz, size_t n);
23324ae1
FM
32
33 /**
34 Converts from Unicode to UTF-7 encoding. Returns the size of the destination
35 buffer.
36 */
4cc4bfaf 37 size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
38};
39
40
41/**
42 @class wxMBConvUTF8
43 @wxheader{strconv.h}
7c913512 44
23324ae1
FM
45 This class converts between the UTF-8 encoding and Unicode.
46 It has one predefined instance, @b wxConvUTF8.
7c913512 47
23324ae1
FM
48 @library{wxbase}
49 @category{FIXME}
7c913512 50
23324ae1
FM
51 @seealso
52 wxMBConvUTF7, @ref overview_mbconvclasses "wxMBConv classes overview"
53*/
54class wxMBConvUTF8 : public wxMBConv
55{
56public:
57 /**
58 Converts from UTF-8 encoding to Unicode. Returns the size of the destination
59 buffer.
60 */
4cc4bfaf 61 size_t MB2WC(wchar_t* buf, const char* psz, size_t n);
23324ae1
FM
62
63 /**
64 Converts from Unicode to UTF-8 encoding. Returns the size of the destination
65 buffer.
66 */
4cc4bfaf 67 size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
68};
69
70
71/**
72 @class wxMBConvUTF16
73 @wxheader{strconv.h}
7c913512 74
23324ae1
FM
75 This class is used to convert between multibyte encodings and UTF-16 Unicode
76 encoding (also known as UCS-2). Unlike UTF-8 encoding,
77 UTF-16 uses words and not bytes and hence depends on the byte ordering:
78 big or little endian. Hence this class is provided in two versions:
79 wxMBConvUTF16LE and wxMBConvUTF16BE and wxMBConvUTF16 itself is just a typedef
80 for one of them (native for the given platform, e.g. LE under Windows and BE
81 under Mac).
7c913512 82
23324ae1
FM
83 @library{wxbase}
84 @category{FIXME}
7c913512 85
23324ae1
FM
86 @seealso
87 wxMBConvUTF8, wxMBConvUTF32, @ref overview_mbconvclasses "wxMBConv classes
88 overview"
89*/
90class wxMBConvUTF16 : public wxMBConv
91{
92public:
93 /**
94 Converts from UTF-16 encoding to Unicode. Returns the size of the destination
95 buffer.
96 */
4cc4bfaf 97 size_t MB2WC(wchar_t* buf, const char* psz, size_t n);
23324ae1
FM
98
99 /**
100 Converts from Unicode to UTF-16 encoding. Returns the size of the destination
101 buffer.
102 */
4cc4bfaf 103 size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
104};
105
106
107/**
108 @class wxCSConv
109 @wxheader{strconv.h}
7c913512 110
23324ae1
FM
111 This class converts between any character sets and Unicode.
112 It has one predefined instance, @b wxConvLocal, for the
113 default user character set.
7c913512 114
23324ae1
FM
115 @library{wxbase}
116 @category{FIXME}
7c913512 117
23324ae1
FM
118 @seealso
119 wxMBConv, wxEncodingConverter, @ref overview_mbconvclasses "wxMBConv classes
120 overview"
121*/
122class wxCSConv : public wxMBConv
123{
124public:
125 //@{
126 /**
127 Constructor. You may specify either the name of the character set you want to
128 convert from/to or an encoding constant. If the character set name (or the
129 encoding) is not recognized, ISO 8859-1 is used as fall back.
130 */
131 wxCSConv(const wxChar* charset);
7c913512 132 wxCSConv(wxFontEncoding encoding);
23324ae1
FM
133 //@}
134
135 /**
136 Destructor frees any resources needed to perform the conversion.
137 */
138 ~wxCSConv();
139
140 /**
141 Returns @true if the charset (or the encoding) given at constructor is really
142 available to use. Returns @false if ISO 8859-1 will be used instead.
23324ae1
FM
143 Note this does not mean that a given string will be correctly converted.
144 A malformed string may still make conversion functions return @c wxCONV_FAILED.
23324ae1
FM
145 This function is new since wxWidgets version 2.8.2
146 */
4cc4bfaf 147 bool IsOk();
23324ae1
FM
148
149 /**
150 Converts from the selected character set to Unicode. Returns length of string
151 written to destination buffer.
152 */
4cc4bfaf 153 size_t MB2WC(wchar_t* buf, const char* psz, size_t n);
23324ae1
FM
154
155 /**
156 Converts from Unicode to the selected character set. Returns length of string
157 written to destination buffer.
158 */
4cc4bfaf 159 size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
160};
161
162
163/**
164 @class wxMBConvFile
165 @wxheader{strconv.h}
7c913512
FM
166
167 This class used to define the class instance
23324ae1
FM
168 @b wxConvFileName, but nowadays @b wxConvFileName is
169 either of type wxConvLibc (on most platforms) or wxConvUTF8
7c913512
FM
170 (on MacOS X). @b wxConvFileName converts filenames between
171 filesystem multibyte encoding and Unicode. @b wxConvFileName
172 can also be set to something else at run-time which is used
173 e.g. by wxGTK to use a class which checks the environment
174 variable @b G_FILESYSTEM_ENCODING indicating that filenames
175 should not be interpreted as UTF8 and also for converting
23324ae1 176 invalid UTF8 characters (e.g. if there is a filename in iso8859_1)
7c913512
FM
177 to strings with octal values.
178
23324ae1
FM
179 Since some platforms (such as Win32) use Unicode in the filenames,
180 and others (such as Unix) use multibyte encodings, this class should only
181 be used directly if wxMBFILES is defined to 1. A convenience macro,
182 wxFNCONV, is defined to wxConvFileName->cWX2MB in this case. You could
183 use it like this:
7c913512 184
23324ae1
FM
185 @code
186 wxChar *name = wxT("rawfile.doc");
187 FILE *fil = fopen(wxFNCONV(name), "r");
188 @endcode
7c913512 189
23324ae1 190 (although it would be better to use wxFopen(name, wxT("r")) in this case.)
7c913512 191
23324ae1
FM
192 @library{wxbase}
193 @category{FIXME}
7c913512 194
23324ae1
FM
195 @seealso
196 @ref overview_mbconvclasses "wxMBConv classes overview"
197*/
198class wxMBConvFile : public wxMBConv
199{
200public:
201 /**
202 Converts from multibyte filename encoding to Unicode. Returns the size of the
203 destination buffer.
204 */
4cc4bfaf 205 size_t MB2WC(wchar_t* buf, const char* psz, size_t n);
23324ae1
FM
206
207 /**
208 Converts from Unicode to multibyte filename encoding. Returns the size of the
209 destination buffer.
210 */
4cc4bfaf 211 size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
212};
213
214
215/**
216 @class wxMBConvUTF32
217 @wxheader{strconv.h}
7c913512 218
23324ae1
FM
219 This class is used to convert between multibyte encodings and UTF-32 Unicode
220 encoding (also known as UCS-4). Unlike UTF-8 encoding,
221 UTF-32 uses (double) words and not bytes and hence depends on the byte ordering:
222 big or little endian. Hence this class is provided in two versions:
223 wxMBConvUTF32LE and wxMBConvUTF32BE and wxMBConvUTF32 itself is just a typedef
224 for one of them (native for the given platform, e.g. LE under Windows and BE
225 under Mac).
7c913512 226
23324ae1
FM
227 @library{wxbase}
228 @category{FIXME}
7c913512 229
23324ae1
FM
230 @seealso
231 wxMBConvUTF8, wxMBConvUTF16, @ref overview_mbconvclasses "wxMBConv classes
232 overview"
233*/
234class wxMBConvUTF32 : public wxMBConv
235{
236public:
237 /**
238 Converts from UTF-32 encoding to Unicode. Returns the size of the destination
239 buffer.
240 */
4cc4bfaf 241 size_t MB2WC(wchar_t* buf, const char* psz, size_t n);
23324ae1
FM
242
243 /**
244 Converts from Unicode to UTF-32 encoding. Returns the size of the destination
245 buffer.
246 */
4cc4bfaf 247 size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
248};
249
250
251/**
252 @class wxMBConv
253 @wxheader{strconv.h}
7c913512 254
23324ae1
FM
255 This class is the base class of a hierarchy of classes capable of converting
256 text strings between multibyte (SBCS or DBCS) encodings and Unicode.
7c913512
FM
257
258 In the documentation for this and related classes please notice that
23324ae1
FM
259 length of the string refers to the number of characters in the string
260 not counting the terminating @c NUL, if any. While the size of the string
261 is the total number of bytes in the string, including any trailing @c NUL.
262 Thus, length of wide character string @c L"foo" is 3 while its size can
263 be either 8 or 16 depending on whether @c wchar_t is 2 bytes (as
264 under Windows) or 4 (Unix).
7c913512 265
23324ae1
FM
266 @library{wxbase}
267 @category{FIXME}
7c913512 268
23324ae1
FM
269 @seealso
270 wxCSConv, wxEncodingConverter, @ref overview_mbconvclasses "wxMBConv classes
271 overview"
272*/
7c913512 273class wxMBConv
23324ae1
FM
274{
275public:
276 /**
277 Trivial default constructor.
278 */
279 wxMBConv();
280
281 /**
282 This pure virtual function is overridden in each of the derived classes to
283 return a new copy of the object it is called on. It is used for copying the
284 conversion objects while preserving their dynamic type.
285 */
4cc4bfaf 286 virtual wxMBConv* Clone();
23324ae1
FM
287
288 /**
7c913512 289 This function has the same semantics as ToWChar()
23324ae1
FM
290 except that it converts a wide string to multibyte one.
291 */
4cc4bfaf
FM
292 virtual size_t FromWChar(char* dst, size_t dstLen,
293 const wchar_t* src,
23324ae1
FM
294 size_t srcLen = wxNO_LEN);
295
296 /**
297 This function returns 1 for most of the multibyte encodings in which the
298 string is terminated by a single @c NUL, 2 for UTF-16 and 4 for UTF-32 for
299 which the string is terminated with 2 and 4 @c NUL characters respectively.
7c913512 300 The other cases are not currently supported and @c wxCONV_FAILED
23324ae1
FM
301 (defined as -1) is returned for them.
302 */
303 size_t GetMBNulLen();
304
305 /**
7c913512 306 Returns the maximal value which can be returned by
23324ae1
FM
307 GetMBNulLen() for any conversion object. Currently
308 this value is 4.
23324ae1
FM
309 This method can be used to allocate the buffer with enough space for the
310 trailing @c NUL characters for any encoding.
311 */
312 const size_t GetMaxMBNulLen();
313
314 /**
315 This function is deprecated, please use ToWChar() instead.
4cc4bfaf
FM
316 Converts from a string @a in in multibyte encoding to Unicode putting up to
317 @a outLen characters into the buffer @e out.
318 If @a out is @NULL, only the length of the string which would result from
23324ae1
FM
319 the conversion is calculated and returned. Note that this is the length and not
320 size, i.e. the returned value does not include the trailing @c NUL. But
4cc4bfaf 321 when the function is called with a non-@NULL @a out buffer, the @a outLen
23324ae1
FM
322 parameter should be one more so that the string can be properly @c NUL-terminated.
323
7c913512 324 @param out
4cc4bfaf
FM
325 The output buffer, may be @NULL if the caller is only
326 interested in the length of the resulting string
7c913512 327 @param in
4cc4bfaf 328 The NUL-terminated input string, cannot be @NULL
7c913512 329 @param outLen
4cc4bfaf
FM
330 The length of the output buffer, including the trailing
331 NUL; ignored if out is @NULL
23324ae1
FM
332
333 @returns The length of the converted string excluding the trailing NUL.
334 */
4cc4bfaf
FM
335 virtual size_t MB2WC(wchar_t* out, const char* in,
336 size_t outLen);
23324ae1
FM
337
338 /**
339 The most general function for converting a multibyte string to a wide string.
4cc4bfaf 340 The main case is when @a dst is not @NULL and @a srcLen is not
23324ae1 341 @c wxNO_LEN (which is defined as @c (size_t)-1): then
4cc4bfaf 342 the function converts exactly @a srcLen bytes starting at @a src into
23324ae1 343 wide string which it outputs to @e dst. If the length of the resulting wide
7c913512 344 string is greater than @e dstLen, an error is returned. Note that if
4cc4bfaf 345 @a srcLen bytes don't include @c NUL characters, the resulting wide string is
23324ae1 346 not @c NUL-terminated either.
4cc4bfaf 347 If @a srcLen is @c wxNO_LEN, the function supposes that the string is
7c913512
FM
348 properly (i.e. as necessary for the encoding handled by this conversion)
349 @c NUL-terminated and converts the entire string, including any trailing @c NUL
23324ae1 350 bytes. In this case the wide string is also @c NUL-terminated.
4cc4bfaf 351 Finally, if @a dst is @NULL, the function returns the length of the needed
23324ae1
FM
352 buffer.
353 */
4cc4bfaf
FM
354 virtual size_t ToWChar(wchar_t* dst, size_t dstLen,
355 const char* src,
23324ae1
FM
356 size_t srcLen = wxNO_LEN);
357
358 /**
359 This function is deprecated, please use FromWChar() instead.
23324ae1 360 Converts from Unicode to multibyte encoding. The semantics of this function
7c913512 361 (including the return value meaning) is the same as for
23324ae1 362 wxMBConv::MB2WC.
7c913512 363 Notice that when the function is called with a non-@NULL buffer, the
4cc4bfaf 364 @a n parameter should be the size of the buffer and so it should take
23324ae1
FM
365 into account the trailing @c NUL, which might take two or four bytes for some
366 encodings (UTF-16 and UTF-32) and not one.
367 */
4cc4bfaf 368 virtual size_t WC2MB(char* buf, const wchar_t* psz, size_t n);
23324ae1
FM
369
370 //@{
371 /**
7c913512 372 Converts from multibyte encoding to Unicode by calling
23324ae1
FM
373 wxMBConv::MB2WC, allocating a temporary wxWCharBuffer to hold
374 the result.
23324ae1
FM
375 The first overload takes a @c NUL-terminated input string. The second one takes
376 a
377 string of exactly the specified length and the string may include or not the
378 trailing @c NUL character(s). If the string is not @c NUL-terminated, a
7c913512
FM
379 temporary
380 @c NUL-terminated copy of it suitable for passing to wxMBConv::MB2WC
23324ae1
FM
381 is made, so it is more efficient to ensure that the string does have the
382 appropriate number of @c NUL bytes (which is usually 1 but may be 2 or 4
383 for UTF-16 or UTF-32, see wxMBConv::GetMBNulLen),
384 especially for long strings.
4cc4bfaf 385 If @a outLen is not-@NULL, it receives the length of the converted
23324ae1
FM
386 string.
387 */
4cc4bfaf
FM
388 const wxWCharBuffer cMB2WC(const char* in);
389 const wxWCharBuffer cMB2WC(const char* in, size_t inLen,
7c913512 390 size_t outLen);
23324ae1
FM
391 //@}
392
393 //@{
394 /**
395 Converts from multibyte encoding to the current wxChar type
396 (which depends on whether wxUSE_UNICODE is set to 1). If wxChar is char,
397 it returns the parameter unaltered. If wxChar is wchar_t, it returns the
398 result in a wxWCharBuffer. The macro wxMB2WXbuf is defined as the correct
399 return type (without const).
400 */
401 const char* cMB2WX(const char* psz);
7c913512 402 const wxWCharBuffer cMB2WX(const char* psz);
23324ae1
FM
403 //@}
404
405 //@{
406 /**
407 Converts from Unicode to multibyte encoding by calling WC2MB,
408 allocating a temporary wxCharBuffer to hold the result.
23324ae1
FM
409 The second overload of this function allows converting a string of the given
410 length @e inLen, whether it is @c NUL-terminated or not (for wide character
411 strings, unlike for the multibyte ones, a single @c NUL is always enough).
412 But notice that just as with wxMBConv::cMB2WC, it is more
413 efficient to pass an already terminated string to this function as otherwise a
414 copy is made internally.
4cc4bfaf 415 If @a outLen is not-@NULL, it receives the length of the converted
23324ae1
FM
416 string.
417 */
418 const wxCharBuffer cWC2MB(const wchar_t* in);
7c913512
FM
419 const wxCharBuffer cWC2MB(const wchar_t* in, size_t inLen,
420 size_t outLen);
23324ae1
FM
421 //@}
422
423 //@{
424 /**
425 Converts from Unicode to the current wxChar type. If wxChar is wchar_t,
426 it returns the parameter unaltered. If wxChar is char, it returns the
427 result in a wxCharBuffer. The macro wxWC2WXbuf is defined as the correct
428 return type (without const).
429 */
430 const wchar_t* cWC2WX(const wchar_t* psz);
7c913512 431 const wxCharBuffer cWC2WX(const wchar_t* psz);
23324ae1
FM
432 //@}
433
434 //@{
435 /**
436 Converts from the current wxChar type to multibyte encoding. If wxChar is char,
437 it returns the parameter unaltered. If wxChar is wchar_t, it returns the
438 result in a wxCharBuffer. The macro wxWX2MBbuf is defined as the correct
439 return type (without const).
440 */
441 const char* cWX2MB(const wxChar* psz);
7c913512 442 const wxCharBuffer cWX2MB(const wxChar* psz);
23324ae1
FM
443 //@}
444
445 //@{
446 /**
447 Converts from the current wxChar type to Unicode. If wxChar is wchar_t,
448 it returns the parameter unaltered. If wxChar is char, it returns the
449 result in a wxWCharBuffer. The macro wxWX2WCbuf is defined as the correct
450 return type (without const).
451 */
452 const wchar_t* cWX2WC(const wxChar* psz);
7c913512 453 const wxWCharBuffer cWX2WC(const wxChar* psz);
23324ae1
FM
454 //@}
455};