]>
Commit | Line | Data |
---|---|---|
6001e347 RR |
1 | /////////////////////////////////////////////////////////////////////////////// |
2 | // Name: strconv.h | |
3 | // Purpose: conversion routines for char sets any Unicode | |
4 | // Author: Robert Roebling, Ove Kaaven | |
5 | // Modified by: | |
6 | // Created: 29/01/98 | |
7 | // RCS-ID: $Id$ | |
8 | // Copyright: (c) 1998 Ove Kaaven, Robert Roebling, Vadim Zeitlin | |
65571936 | 9 | // Licence: wxWindows licence |
6001e347 RR |
10 | /////////////////////////////////////////////////////////////////////////////// |
11 | ||
12 | #ifndef _WX_WXSTRCONVH__ | |
13 | #define _WX_WXSTRCONVH__ | |
14 | ||
12028905 | 15 | #if defined(__GNUG__) && !defined(NO_GCC_PRAGMA) |
6001e347 RR |
16 | #pragma interface "strconv.h" |
17 | #endif | |
18 | ||
19 | #include "wx/defs.h" | |
20 | #include "wx/wxchar.h" | |
21 | #include "wx/buffer.h" | |
22 | ||
7db39dd6 CE |
23 | #ifdef __DIGITALMARS__ |
24 | #include "typeinfo.h" | |
25 | #endif | |
26 | ||
9dea36ef DW |
27 | #if defined(__VISAGECPP__) && __IBMCPP__ >= 400 |
28 | # undef __BSEXCPT__ | |
29 | #endif | |
dccce9ea | 30 | |
6001e347 RR |
31 | #include <stdlib.h> |
32 | ||
33 | #if wxUSE_WCHAR_T | |
34 | ||
e90c1d2a | 35 | // ---------------------------------------------------------------------------- |
bde4baac | 36 | // wxMBConv (abstract base class for conversions) |
e90c1d2a | 37 | // ---------------------------------------------------------------------------- |
6001e347 | 38 | |
bddd7a8d | 39 | class WXDLLIMPEXP_BASE wxMBConv |
6001e347 RR |
40 | { |
41 | public: | |
e90c1d2a | 42 | // the actual conversion takes place here |
bde4baac | 43 | // |
e4e3bbb4 | 44 | // note that outputSize is the size of the output buffer, not the length of input |
75736a9c DS |
45 | // (the latter is always supposed to be NUL-terminated) |
46 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const = 0; | |
47 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const = 0; | |
e90c1d2a | 48 | |
bde4baac | 49 | // MB <-> WC |
e90c1d2a VZ |
50 | const wxWCharBuffer cMB2WC(const char *psz) const; |
51 | const wxCharBuffer cWC2MB(const wchar_t *psz) const; | |
6001e347 | 52 | |
f5fb6871 RN |
53 | // MB <-> WC for strings with embedded null characters |
54 | // | |
55 | // pszLen length of the input string | |
56 | // pOutSize gets the final size of the converted string | |
57 | const wxWCharBuffer cMB2WC(const char *psz, size_t pszLen, size_t* pOutSize) const; | |
58 | const wxCharBuffer cWC2MB(const wchar_t *psz, size_t pszLen, size_t* pOutSize) const; | |
59 | ||
bde4baac | 60 | // convenience functions for converting MB or WC to/from wxWin default |
6001e347 | 61 | #if wxUSE_UNICODE |
e90c1d2a VZ |
62 | const wxWCharBuffer cMB2WX(const char *psz) const { return cMB2WC(psz); } |
63 | const wxCharBuffer cWX2MB(const wchar_t *psz) const { return cWC2MB(psz); } | |
64 | const wchar_t* cWC2WX(const wchar_t *psz) const { return psz; } | |
f6bcfd97 | 65 | const wchar_t* cWX2WC(const wchar_t *psz) const { return psz; } |
e90c1d2a VZ |
66 | #else // ANSI |
67 | const char* cMB2WX(const char *psz) const { return psz; } | |
68 | const char* cWX2MB(const char *psz) const { return psz; } | |
69 | const wxCharBuffer cWC2WX(const wchar_t *psz) const { return cWC2MB(psz); } | |
70 | const wxWCharBuffer cWX2WC(const char *psz) const { return cMB2WC(psz); } | |
71 | #endif // Unicode/ANSI | |
2b5f62a0 VZ |
72 | |
73 | // virtual dtor for any base class | |
e4a4a50b | 74 | virtual ~wxMBConv(); |
6001e347 RR |
75 | }; |
76 | ||
bde4baac VZ |
77 | // ---------------------------------------------------------------------------- |
78 | // wxMBConvLibc uses standard mbstowcs() and wcstombs() functions for | |
79 | // conversion (hence it depends on the current locale) | |
80 | // ---------------------------------------------------------------------------- | |
81 | ||
82 | class WXDLLIMPEXP_BASE wxMBConvLibc : public wxMBConv | |
83 | { | |
84 | public: | |
75736a9c DS |
85 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
86 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
bde4baac VZ |
87 | }; |
88 | ||
e90c1d2a | 89 | // ---------------------------------------------------------------------------- |
6001e347 | 90 | // wxMBConvUTF7 (for conversion using UTF7 encoding) |
e90c1d2a | 91 | // ---------------------------------------------------------------------------- |
6001e347 | 92 | |
bddd7a8d | 93 | class WXDLLIMPEXP_BASE wxMBConvUTF7 : public wxMBConv |
6001e347 RR |
94 | { |
95 | public: | |
75736a9c DS |
96 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
97 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
6001e347 RR |
98 | }; |
99 | ||
e90c1d2a | 100 | // ---------------------------------------------------------------------------- |
6001e347 | 101 | // wxMBConvUTF8 (for conversion using UTF8 encoding) |
e90c1d2a | 102 | // ---------------------------------------------------------------------------- |
6001e347 | 103 | |
bddd7a8d | 104 | class WXDLLIMPEXP_BASE wxMBConvUTF8 : public wxMBConv |
6001e347 RR |
105 | { |
106 | public: | |
75736a9c DS |
107 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
108 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
6001e347 RR |
109 | }; |
110 | ||
e90c1d2a | 111 | // ---------------------------------------------------------------------------- |
c91830cb VZ |
112 | // wxMBConvUTF16LE (for conversion using UTF16 Little Endian encoding) |
113 | // ---------------------------------------------------------------------------- | |
114 | ||
115 | class WXDLLIMPEXP_BASE wxMBConvUTF16LE : public wxMBConv | |
116 | { | |
117 | public: | |
75736a9c DS |
118 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
119 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
c91830cb VZ |
120 | }; |
121 | ||
122 | // ---------------------------------------------------------------------------- | |
123 | // wxMBConvUTF16BE (for conversion using UTF16 Big Endian encoding) | |
124 | // ---------------------------------------------------------------------------- | |
125 | ||
126 | class WXDLLIMPEXP_BASE wxMBConvUTF16BE : public wxMBConv | |
127 | { | |
128 | public: | |
75736a9c DS |
129 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
130 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
c91830cb VZ |
131 | }; |
132 | ||
133 | // ---------------------------------------------------------------------------- | |
134 | // wxMBConvUCS4LE (for conversion using UTF32 Little Endian encoding) | |
135 | // ---------------------------------------------------------------------------- | |
136 | ||
137 | class WXDLLIMPEXP_BASE wxMBConvUTF32LE : public wxMBConv | |
138 | { | |
139 | public: | |
75736a9c DS |
140 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
141 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
c91830cb VZ |
142 | }; |
143 | ||
144 | // ---------------------------------------------------------------------------- | |
145 | // wxMBConvUCS4BE (for conversion using UTF32 Big Endian encoding) | |
146 | // ---------------------------------------------------------------------------- | |
147 | ||
148 | class WXDLLIMPEXP_BASE wxMBConvUTF32BE : public wxMBConv | |
149 | { | |
150 | public: | |
75736a9c DS |
151 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
152 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
c91830cb VZ |
153 | }; |
154 | ||
155 | // ---------------------------------------------------------------------------- | |
e90c1d2a VZ |
156 | // wxCSConv (for conversion based on loadable char sets) |
157 | // ---------------------------------------------------------------------------- | |
6001e347 | 158 | |
8b04d4c4 VZ |
159 | #include "wx/fontenc.h" |
160 | ||
bddd7a8d | 161 | class WXDLLIMPEXP_BASE wxCSConv : public wxMBConv |
6001e347 | 162 | { |
6001e347 | 163 | public: |
e95354ec VZ |
164 | // we can be created either from charset name or from an encoding constant |
165 | // but we can't have both at once | |
e90c1d2a | 166 | wxCSConv(const wxChar *charset); |
8b04d4c4 | 167 | wxCSConv(wxFontEncoding encoding); |
e95354ec | 168 | |
54380f29 | 169 | wxCSConv(const wxCSConv& conv); |
e90c1d2a VZ |
170 | virtual ~wxCSConv(); |
171 | ||
54380f29 | 172 | wxCSConv& operator=(const wxCSConv& conv); |
2b5f62a0 | 173 | |
75736a9c DS |
174 | virtual size_t MB2WC(wchar_t *outputBuf, const char *psz, size_t outputSize) const; |
175 | virtual size_t WC2MB(char *outputBuf, const wchar_t *psz, size_t outputSize) const; | |
e90c1d2a | 176 | |
65e50848 JS |
177 | void Clear() ; |
178 | ||
e90c1d2a | 179 | private: |
8b04d4c4 VZ |
180 | // common part of all ctors |
181 | void Init(); | |
182 | ||
e95354ec VZ |
183 | // creates m_convReal if necessary |
184 | void CreateConvIfNeeded() const; | |
185 | ||
186 | // do create m_convReal (unconditionally) | |
187 | wxMBConv *DoCreate() const; | |
188 | ||
bda3d86a VZ |
189 | // set the name (may be only called when m_name == NULL), makes copy of |
190 | // charset string | |
e90c1d2a VZ |
191 | void SetName(const wxChar *charset); |
192 | ||
e95354ec | 193 | |
dccce9ea VZ |
194 | // note that we can't use wxString here because of compilation |
195 | // dependencies: we're included from wx/string.h | |
e90c1d2a | 196 | wxChar *m_name; |
8b04d4c4 | 197 | wxFontEncoding m_encoding; |
e95354ec VZ |
198 | |
199 | // use CreateConvIfNeeded() before accessing m_convReal! | |
200 | wxMBConv *m_convReal; | |
e90c1d2a | 201 | bool m_deferred; |
6001e347 RR |
202 | }; |
203 | ||
f5a1953b VZ |
204 | // ---------------------------------------------------------------------------- |
205 | // declare predefined conversion objects | |
206 | // ---------------------------------------------------------------------------- | |
d5c8817c | 207 | |
f5a1953b VZ |
208 | // conversion to be used with all standard functions affected by locale, e.g. |
209 | // strtol(), strftime(), ... | |
210 | extern WXDLLIMPEXP_DATA_BASE(wxMBConv&) wxConvLibc; | |
211 | ||
212 | // conversion ISO-8859-1/UTF-7/UTF-8 <-> wchar_t | |
16cba29d | 213 | extern WXDLLIMPEXP_DATA_BASE(wxCSConv&) wxConvISO8859_1; |
f5a1953b VZ |
214 | extern WXDLLIMPEXP_DATA_BASE(wxMBConvUTF7&) wxConvUTF7; |
215 | extern WXDLLIMPEXP_DATA_BASE(wxMBConvUTF8&) wxConvUTF8; | |
216 | ||
217 | // conversion used for the file names on the systems where they're not Unicode | |
218 | // (basically anything except Windows) | |
219 | // | |
220 | // this is used by all file functions, can be changed by the application | |
221 | // | |
222 | // by default UTF-8 under Mac OS X and wxConvLibc elsewhere (but it's not used | |
223 | // under Windows normally) | |
224 | extern WXDLLIMPEXP_DATA_BASE(wxMBConv *) wxConvFileName; | |
225 | ||
226 | // backwards compatible define | |
227 | #define wxConvFile (*wxConvFileName) | |
228 | ||
229 | // the current conversion object, may be set to any conversion, is used by | |
230 | // default in a couple of places inside wx (initially same as wxConvLibc) | |
16cba29d | 231 | extern WXDLLIMPEXP_DATA_BASE(wxMBConv *) wxConvCurrent; |
6001e347 | 232 | |
f5a1953b VZ |
233 | // ??? |
234 | extern WXDLLIMPEXP_DATA_BASE(wxCSConv&) wxConvLocal; | |
235 | ||
236 | ||
e95354ec VZ |
237 | // ---------------------------------------------------------------------------- |
238 | // endianness-dependent conversions | |
239 | // ---------------------------------------------------------------------------- | |
240 | ||
241 | #ifdef WORDS_BIGENDIAN | |
242 | typedef wxMBConvUTF16BE wxMBConvUTF16; | |
243 | typedef wxMBConvUTF32BE wxMBConvUTF32; | |
244 | #else | |
245 | typedef wxMBConvUTF16LE wxMBConvUTF16; | |
246 | typedef wxMBConvUTF32LE wxMBConvUTF32; | |
247 | #endif | |
248 | ||
e90c1d2a | 249 | // ---------------------------------------------------------------------------- |
6001e347 | 250 | // filename conversion macros |
e90c1d2a | 251 | // ---------------------------------------------------------------------------- |
6001e347 RR |
252 | |
253 | // filenames are multibyte on Unix and probably widechar on Windows? | |
c4e41ce3 | 254 | #if defined(__UNIX__) || defined(__BORLANDC__) || defined(__WXMAC__ ) |
e90c1d2a | 255 | #define wxMBFILES 1 |
6001e347 | 256 | #else |
e90c1d2a | 257 | #define wxMBFILES 0 |
6001e347 RR |
258 | #endif |
259 | ||
80df4d31 | 260 | #if wxMBFILES && wxUSE_UNICODE |
f5a1953b | 261 | #define wxFNCONV(name) wxConvFileName->cWX2MB(name) |
e90c1d2a | 262 | #define wxFNSTRINGCAST wxMBSTRINGCAST |
d5c8817c SC |
263 | #else |
264 | #if defined( __WXOSX__ ) && wxMBFILES | |
f5a1953b | 265 | #define wxFNCONV(name) wxConvFileName->cWC2MB( wxConvLocal.cWX2WC(name) ) |
6001e347 | 266 | #else |
e90c1d2a | 267 | #define wxFNCONV(name) name |
d5c8817c | 268 | #endif |
e90c1d2a | 269 | #define wxFNSTRINGCAST WXSTRINGCAST |
6001e347 RR |
270 | #endif |
271 | ||
f5a1953b | 272 | #else // !wxUSE_WCHAR_T |
6001e347 | 273 | |
e90c1d2a | 274 | // ---------------------------------------------------------------------------- |
6001e347 | 275 | // stand-ins in absence of wchar_t |
e90c1d2a | 276 | // ---------------------------------------------------------------------------- |
6001e347 | 277 | |
bddd7a8d | 278 | class WXDLLIMPEXP_BASE wxMBConv |
6001e347 RR |
279 | { |
280 | public: | |
e90c1d2a VZ |
281 | const char* cMB2WX(const char *psz) const { return psz; } |
282 | const char* cWX2MB(const char *psz) const { return psz; } | |
6001e347 | 283 | }; |
e90c1d2a | 284 | |
bde4baac VZ |
285 | #define wxConvFile wxConvLocal |
286 | ||
16cba29d | 287 | extern WXDLLIMPEXP_DATA_BASE(wxMBConv) wxConvLibc, |
8b04d4c4 VZ |
288 | wxConvLocal, |
289 | wxConvISO8859_1, | |
290 | wxConvUTF8; | |
16cba29d | 291 | extern WXDLLIMPEXP_DATA_BASE(wxMBConv *) wxConvCurrent; |
6001e347 RR |
292 | |
293 | #define wxFNCONV(name) name | |
e90c1d2a | 294 | #define wxFNSTRINGCAST WXSTRINGCAST |
6001e347 RR |
295 | |
296 | #endif | |
297 | // wxUSE_WCHAR_T | |
298 | ||
e90c1d2a VZ |
299 | // ---------------------------------------------------------------------------- |
300 | // macros for the most common conversions | |
301 | // ---------------------------------------------------------------------------- | |
302 | ||
303 | #if wxUSE_UNICODE | |
304 | #define wxConvertWX2MB(s) wxConvCurrent->cWX2MB(s) | |
305 | #define wxConvertMB2WX(s) wxConvCurrent->cMB2WX(s) | |
306 | #else // ANSI | |
307 | // no conversions to do | |
308 | #define wxConvertWX2MB(s) (s) | |
309 | #define wxConvertMB2WX(s) (s) | |
310 | #endif // Unicode/ANSI | |
311 | ||
312 | #endif | |
6001e347 RR |
313 | // _WX_WXSTRCONVH__ |
314 |