]> git.saurik.com Git - wxWidgets.git/blame - src/common/strconv.cpp
added common imagxpm files
[wxWidgets.git] / src / common / strconv.cpp
CommitLineData
6001e347
RR
1/////////////////////////////////////////////////////////////////////////////
2// Name: strconv.cpp
3// Purpose: Unicode conversion classes
4// Author: Ove Kaaven, Robert Roebling, Vadim Zeitlin
5// Modified by:
6// Created: 29/01/98
7// RCS-ID: $Id$
8// Copyright: (c) 1999 Ove Kaaven, Robert Roebling, Vadim Zeitlin
9// Licence: wxWindows license
10/////////////////////////////////////////////////////////////////////////////
11
f6bcfd97
BP
12// ============================================================================
13// declarations
14// ============================================================================
15
16// ----------------------------------------------------------------------------
17// headers
18// ----------------------------------------------------------------------------
19
6001e347
RR
20#ifdef __GNUG__
21 #pragma implementation "strconv.h"
22#endif
23
24// For compilers that support precompilation, includes "wx.h".
25#include "wx/wxprec.h"
26
27#ifdef __BORLANDC__
28 #pragma hdrstop
29#endif
30
0a1c1e62
GRG
31#ifdef __WXMSW__
32 #include "wx/msw/private.h"
33#endif
34
1cd52418 35#include <errno.h>
6001e347
RR
36#include <ctype.h>
37#include <string.h>
38#include <stdlib.h>
39
40#ifdef __SALFORDC__
41 #include <clib.h>
42#endif
43
1cd52418
OK
44#ifdef HAVE_ICONV_H
45 #include <iconv.h>
46#endif
47#ifdef HAVE_LANGINFO_H
48 #include <langinfo.h>
49#endif
50
3e61dfb0
OK
51#ifdef __WXMSW__
52 #include <windows.h>
53#endif
54
6001e347
RR
55#include "wx/debug.h"
56#include "wx/strconv.h"
57
d43088ee 58#if defined(WORDS_BIGENDIAN) || defined(__STDC_ISO_10646__)
1cd52418
OK
59#define BSWAP_UCS4(str, len)
60#define BSWAP_UCS2(str, len)
61#else
62#define BSWAP_UCS4(str, len) { unsigned _c; for (_c=0; _c<len; _c++) str[_c]=wxUINT32_SWAP_ALWAYS(str[_c]); }
63#define BSWAP_UCS2(str, len) { unsigned _c; for (_c=0; _c<len; _c++) str[_c]=wxUINT16_SWAP_ALWAYS(str[_c]); }
64#define WC_NEED_BSWAP
65#endif
66#define BSWAP_UTF32(str, len) BSWAP_UCS4(str, len)
67#define BSWAP_UTF16(str, len) BSWAP_UCS2(str, len)
68
69#if SIZEOF_WCHAR_T == 4
70#define WC_NAME "UCS4"
71#define WC_BSWAP BSWAP_UCS4
72#elif SIZEOF_WCHAR_T == 2
73#define WC_NAME "UTF16"
74#define WC_BSWAP BSWAP_UTF16
75#define WC_UTF16
76#endif
77
f6bcfd97
BP
78// ----------------------------------------------------------------------------
79// globals
80// ----------------------------------------------------------------------------
6001e347
RR
81
82WXDLLEXPORT_DATA(wxMBConv *) wxConvCurrent = &wxConvLibc;
83
f6bcfd97
BP
84// ============================================================================
85// implementation
86// ============================================================================
6001e347 87
f6bcfd97 88#if wxUSE_WCHAR_T
6001e347 89
b0a6bb75
VZ
90#ifdef WC_UTF16
91
1cd52418
OK
92static size_t encode_utf16(wxUint32 input,wxUint16*output)
93{
94 if (input<=0xffff) {
95 if (output) *output++ = input;
96 return 1;
97 } else
98 if (input>=0x110000) {
99 return (size_t)-1;
100 } else {
101 if (output) {
102 *output++ = (input >> 10)+0xd7c0;
103 *output++ = (input&0x3ff)+0xdc00;
104 }
105 return 2;
106 }
107}
108
109static size_t decode_utf16(wxUint16*input,wxUint32&output)
110{
111 if ((*input<0xd800) || (*input>0xdfff)) {
112 output = *input;
113 return 1;
114 } else
115 if ((input[1]<0xdc00) || (input[1]>=0xdfff)) {
116 output = *input;
117 return (size_t)-1;
118 } else {
119 output = ((input[0] - 0xd7c0) << 10) + (input[1] - 0xdc00);
120 return 2;
121 }
122}
123
b0a6bb75
VZ
124#endif // WC_UTF16
125
f6bcfd97 126// ----------------------------------------------------------------------------
6001e347 127// wxMBConv
f6bcfd97 128// ----------------------------------------------------------------------------
6001e347
RR
129
130WXDLLEXPORT_DATA(wxMBConv) wxConvLibc;
131
132size_t wxMBConv::MB2WC(wchar_t *buf, const char *psz, size_t n) const
133{
134 return wxMB2WC(buf, psz, n);
135}
136
137size_t wxMBConv::WC2MB(char *buf, const wchar_t *psz, size_t n) const
138{
139 return wxWC2MB(buf, psz, n);
140}
141
142const wxWCharBuffer wxMBConv::cMB2WC(const char *psz) const
143{
f6bcfd97 144 if (psz)
6001e347
RR
145 {
146 size_t nLen = MB2WC((wchar_t *) NULL, psz, 0);
f6bcfd97
BP
147 if (nLen == (size_t)-1)
148 return wxWCharBuffer((wchar_t *) NULL);
6001e347
RR
149 wxWCharBuffer buf(nLen);
150 MB2WC((wchar_t *)(const wchar_t *) buf, psz, nLen);
151 return buf;
f6bcfd97
BP
152 }
153 else
6001e347
RR
154 return wxWCharBuffer((wchar_t *) NULL);
155}
156
157const wxCharBuffer wxMBConv::cWC2MB(const wchar_t *psz) const
158{
f6bcfd97 159 if (psz)
6001e347
RR
160 {
161 size_t nLen = WC2MB((char *) NULL, psz, 0);
f6bcfd97
BP
162 if (nLen == (size_t)-1)
163 return wxCharBuffer((char *) NULL);
6001e347
RR
164 wxCharBuffer buf(nLen);
165 WC2MB((char *)(const char *) buf, psz, nLen);
166 return buf;
f6bcfd97
BP
167 }
168 else
6001e347
RR
169 return wxCharBuffer((char *) NULL);
170}
171
f6bcfd97 172// ----------------------------------------------------------------------------
6001e347 173// standard file conversion
f6bcfd97 174// ----------------------------------------------------------------------------
6001e347
RR
175
176WXDLLEXPORT_DATA(wxMBConvFile) wxConvFile;
177
178// just use the libc conversion for now
179size_t wxMBConvFile::MB2WC(wchar_t *buf, const char *psz, size_t n) const
180{
181 return wxMB2WC(buf, psz, n);
182}
183
184size_t wxMBConvFile::WC2MB(char *buf, const wchar_t *psz, size_t n) const
185{
186 return wxWC2MB(buf, psz, n);
187}
188
f6bcfd97 189// ----------------------------------------------------------------------------
6001e347 190// standard gdk conversion
f6bcfd97
BP
191// ----------------------------------------------------------------------------
192
193#ifdef __WXGTK12__
6001e347
RR
194
195WXDLLEXPORT_DATA(wxMBConvGdk) wxConvGdk;
196
197#include <gdk/gdk.h>
198
199size_t wxMBConvGdk::MB2WC(wchar_t *buf, const char *psz, size_t n) const
200{
201 if (buf) {
202 return gdk_mbstowcs((GdkWChar *)buf, psz, n);
203 } else {
204 GdkWChar *nbuf = new GdkWChar[n=strlen(psz)];
205 size_t len = gdk_mbstowcs(nbuf, psz, n);
206 delete [] nbuf;
207 return len;
208 }
209}
210
211size_t wxMBConvGdk::WC2MB(char *buf, const wchar_t *psz, size_t n) const
212{
213 char *mbstr = gdk_wcstombs((GdkWChar *)psz);
214 size_t len = mbstr ? strlen(mbstr) : 0;
215 if (buf) {
216 if (len > n) len = n;
217 memcpy(buf, psz, len);
218 if (len < n) buf[len] = 0;
219 }
220 return len;
221}
f6bcfd97 222
6001e347
RR
223#endif // GTK > 1.0
224
225// ----------------------------------------------------------------------------
226// UTF-7
227// ----------------------------------------------------------------------------
228
229WXDLLEXPORT_DATA(wxMBConvUTF7) wxConvUTF7;
230
231#if 0
232static char utf7_setD[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
233 "abcdefghijklmnopqrstuvwxyz"
234 "0123456789'(),-./:?";
235static char utf7_setO[]="!\"#$%&*;<=>@[]^_`{|}";
236static char utf7_setB[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
237 "abcdefghijklmnopqrstuvwxyz"
238 "0123456789+/";
239#endif
240
241// TODO: write actual implementations of UTF-7 here
242size_t wxMBConvUTF7::MB2WC(wchar_t * WXUNUSED(buf),
243 const char * WXUNUSED(psz),
244 size_t WXUNUSED(n)) const
245{
246 return 0;
247}
248
249size_t wxMBConvUTF7::WC2MB(char * WXUNUSED(buf),
250 const wchar_t * WXUNUSED(psz),
251 size_t WXUNUSED(n)) const
252{
253 return 0;
254}
255
f6bcfd97 256// ----------------------------------------------------------------------------
6001e347 257// UTF-8
f6bcfd97 258// ----------------------------------------------------------------------------
6001e347
RR
259
260WXDLLEXPORT_DATA(wxMBConvUTF8) wxConvUTF8;
261
1cd52418 262static wxUint32 utf8_max[]={0x7f,0x7ff,0xffff,0x1fffff,0x3ffffff,0x7fffffff,0xffffffff};
6001e347
RR
263
264size_t wxMBConvUTF8::MB2WC(wchar_t *buf, const char *psz, size_t n) const
265{
266 size_t len = 0;
267
268 while (*psz && ((!buf) || (len<n))) {
269 unsigned char cc=*psz++, fc=cc;
270 unsigned cnt;
271 for (cnt=0; fc&0x80; cnt++) fc<<=1;
272 if (!cnt) {
273 // plain ASCII char
274 if (buf) *buf++=cc;
275 len++;
276 } else {
277 cnt--;
278 if (!cnt) {
279 // invalid UTF-8 sequence
280 return (size_t)-1;
281 } else {
282 unsigned ocnt=cnt-1;
1cd52418 283 wxUint32 res=cc&(0x3f>>cnt);
6001e347
RR
284 while (cnt--) {
285 cc = *psz++;
286 if ((cc&0xC0)!=0x80) {
287 // invalid UTF-8 sequence
288 return (size_t)-1;
289 }
290 res=(res<<6)|(cc&0x3f);
291 }
292 if (res<=utf8_max[ocnt]) {
293 // illegal UTF-8 encoding
294 return (size_t)-1;
295 }
1cd52418
OK
296#ifdef WC_UTF16
297 size_t pa = encode_utf16(res, buf);
298 if (pa == (size_t)-1)
299 return (size_t)-1;
300 if (buf) buf+=pa;
301 len+=pa;
302#else
6001e347
RR
303 if (buf) *buf++=res;
304 len++;
1cd52418 305#endif
6001e347
RR
306 }
307 }
308 }
309 if (buf && (len<n)) *buf = 0;
310 return len;
311}
312
313size_t wxMBConvUTF8::WC2MB(char *buf, const wchar_t *psz, size_t n) const
314{
315 size_t len = 0;
316
317 while (*psz && ((!buf) || (len<n))) {
1cd52418
OK
318 wxUint32 cc;
319#ifdef WC_UTF16
320 size_t pa = decode_utf16(psz,cc);
321 psz += (pa == (size_t)-1) ? 1 : pa;
322#else
323 cc=(*psz++)&0x7fffffff;
324#endif
6001e347
RR
325 unsigned cnt;
326 for (cnt=0; cc>utf8_max[cnt]; cnt++);
327 if (!cnt) {
328 // plain ASCII char
329 if (buf) *buf++=cc;
330 len++;
331 } else {
332 len+=cnt+1;
333 if (buf) {
334 *buf++=(-128>>cnt)|((cc>>(cnt*6))&(0x3f>>cnt));
335 while (cnt--)
336 *buf++=0x80|((cc>>(cnt*6))&0x3f);
337 }
338 }
339 }
340 if (buf && (len<n)) *buf = 0;
341 return len;
342}
343
344// ----------------------------------------------------------------------------
345// specified character set
346// ----------------------------------------------------------------------------
347
f6bcfd97
BP
348WXDLLEXPORT_DATA(wxCSConv) wxConvLocal((const wxChar *)NULL);
349
350#include "wx/encconv.h"
351#include "wx/fontmap.h"
6001e347 352
1cd52418
OK
353// TODO: add some tables here
354// - perhaps common encodings to common codepages (for Win32)
355// - perhaps common encodings to objects ("UTF8" -> wxConvUTF8)
356// - move wxEncodingConverter meat in here
357
358#ifdef __WIN32__
359#include "wx/msw/registry.h"
360// this should work if M$ Internet Exploiter is installed
361static long CharsetToCodepage(const wxChar *name)
362{
f1339c56
RR
363 if (!name)
364 return GetACP();
365
366 long CP=-1;
367
368 wxString cn(name);
369 do {
370 wxString path( wxT("MIME\\Database\\Charset\\") );
371 path += cn;
372 wxRegKey key( wxRegKey::HKCR, path );
373
374 /* two cases: either there's an AliasForCharset string,
375 * or there are Codepage and InternetEncoding dwords.
376 * The InternetEncoding gives us the actual encoding,
377 * the Codepage just says which Windows character set to
378 * use when displaying the data.
379 */
380 if (key.QueryValue( wxT("InternetEncoding"), &CP )) break;
381
382 // no encoding, see if it's an alias
383 if (!key.QueryValue( wxT("AliasForCharset"), cn )) break;
384 } while (1);
385
386 return CP;
1cd52418
OK
387}
388#endif
389
6001e347
RR
390class wxCharacterSet
391{
1cd52418 392public:
f1339c56
RR
393 wxCharacterSet(const wxChar*name)
394 : cname(name) {}
395 virtual ~wxCharacterSet()
396 {}
397 virtual size_t MB2WC(wchar_t*buf, const char*psz, size_t n)
398 { return (size_t)-1; }
399 virtual size_t WC2MB(char*buf, const wchar_t*psz, size_t n)
400 { return (size_t)-1; }
401 virtual bool usable()
402 { return FALSE; }
403public:
404 const wxChar*cname;
1cd52418
OK
405};
406
407class ID_CharSet : public wxCharacterSet
408{
409public:
f1339c56
RR
410 ID_CharSet(const wxChar*name,wxMBConv*cnv)
411 : wxCharacterSet(name), work(cnv) {}
412
413 size_t MB2WC(wchar_t*buf, const char*psz, size_t n)
414 { return work ? work->MB2WC(buf,psz,n) : (size_t)-1; }
415
416 size_t WC2MB(char*buf, const wchar_t*psz, size_t n)
417 { return work ? work->WC2MB(buf,psz,n) : (size_t)-1; }
418
419 bool usable()
420 { return work!=NULL; }
421public:
422 wxMBConv*work;
1cd52418
OK
423};
424
425#ifdef HAVE_ICONV_H
426class IC_CharSet : public wxCharacterSet
427{
428public:
f1339c56
RR
429 IC_CharSet(const wxChar*name)
430 : wxCharacterSet(name), m2w((iconv_t)-1), w2m((iconv_t)-1) {}
431 ~IC_CharSet()
432 {
433 if (m2w!=(iconv_t)-1) iconv_close(m2w);
434 if (w2m!=(iconv_t)-1) iconv_close(w2m);
1cd52418 435 }
f1339c56
RR
436
437 void LoadM2W()
438 {
439 if (m2w==(iconv_t)-1)
440 m2w=iconv_open(WC_NAME,wxConvLibc.cWX2MB(cname));
441 }
442
443 void LoadW2M()
444 {
445 if (w2m==(iconv_t)-1)
446 w2m=iconv_open(wxConvLibc.cWX2MB(cname),WC_NAME);
447 }
448
449 size_t MB2WC(wchar_t*buf, const char*psz, size_t n)
450 {
451 LoadM2W();
452 size_t inbuf = strlen(psz);
453 size_t outbuf = n*SIZEOF_WCHAR_T;
454 size_t res, cres;
455 fprintf(stderr,"IC Convert to WC using %s\n",(const char*)wxConvLibc.cWX2MB(cname));
456 if (buf)
457 {
458 // have destination buffer, convert there
95c8801c 459#ifdef WX_ICONV_TAKES_CHAR
f1339c56 460 cres = iconv( m2w, (char**)&psz, &inbuf, (char**)&buf, &outbuf );
95c8801c
VS
461#else
462 cres = iconv( m2w, &psz, &inbuf, (char**)&buf, &outbuf );
463#endif
f1339c56
RR
464 res = n-(outbuf/SIZEOF_WCHAR_T);
465 // convert to native endianness
466 WC_BSWAP(buf, res)
467 }
468 else
469 {
470 // no destination buffer... convert using temp buffer
471 // to calculate destination buffer requirement
472 wchar_t tbuf[8];
473 res = 0;
474 do {
475 buf = tbuf; outbuf = 8*SIZEOF_WCHAR_T;
95c8801c 476#ifdef WX_ICONV_TAKES_CHAR
f1339c56 477 cres = iconv( m2w, (char**)&psz, &inbuf, (char**)&buf, &outbuf );
95c8801c
VS
478#else
479 cres = iconv( m2w, &psz, &inbuf, (char**)&buf, &outbuf );
480#endif
f1339c56
RR
481 res += 8-(outbuf/SIZEOF_WCHAR_T);
482 } while ((cres==(size_t)-1) && (errno==E2BIG));
483 }
484
485 if (cres==(size_t)-1)
486 return (size_t)-1;
487
488 return res;
489 }
490
491 size_t WC2MB(char*buf, const wchar_t*psz, size_t n)
492 {
493 LoadW2M();
1cd52418 494#if defined(__BORLANDC__) && (__BORLANDC__ > 0x530)
f1339c56 495 size_t inbuf = std::wcslen(psz);
1cd52418 496#else
f1339c56 497 size_t inbuf = ::wcslen(psz);
1cd52418 498#endif
f1339c56
RR
499 size_t outbuf = n;
500 size_t res, cres;
501 fprintf(stderr,"IC Convert from WC using %s\n",(const char*)wxConvLibc.cWX2MB(cname));
1cd52418 502#ifdef WC_NEED_BSWAP
f1339c56
RR
503 // need to copy to temp buffer to switch endianness
504 // this absolutely doesn't rock!
505 // (no, doing WC_BSWAP twice on the original buffer won't help, as it
506 // could be in read-only memory, or be accessed in some other thread)
507 wchar_t*tmpbuf=(wchar_t*)malloc((inbuf+1)*SIZEOF_WCHAR_T);
508 memcpy(tmpbuf,psz,(inbuf+1)*SIZEOF_WCHAR_T);
509 WC_BSWAP(tmpbuf, inbuf)
510 psz=tmpbuf;
1cd52418 511#endif
f1339c56
RR
512 if (buf)
513 {
514 // have destination buffer, convert there
95c8801c 515#ifdef WX_ICONV_TAKES_CHAR
f1339c56 516 cres = iconv( w2m, (char**)&psz, &inbuf, &buf, &outbuf );
95c8801c
VS
517#else
518 cres = iconv( w2m, (const char**)&psz, &inbuf, &buf, &outbuf );
519#endif
f1339c56
RR
520 res = n-outbuf;
521 }
522 else
523 {
524 // no destination buffer... convert using temp buffer
525 // to calculate destination buffer requirement
526 char tbuf[16];
527 res = 0;
528 do {
529 buf = tbuf; outbuf = 16;
95c8801c 530#ifdef WX_ICONV_TAKES_CHAR
f1339c56 531 cres = iconv( w2m, (char**)&psz, &inbuf, &buf, &outbuf );
95c8801c
VS
532#else
533 cres = iconv( w2m, (const char**)&psz, &inbuf, &buf, &outbuf );
534#endif
f1339c56
RR
535 res += 16 - outbuf;
536 } while ((cres==(size_t)-1) && (errno==E2BIG));
537 }
1cd52418 538#ifdef WC_NEED_BSWAP
f1339c56 539 free(tmpbuf);
1cd52418 540#endif
f1339c56
RR
541 if (cres==(size_t)-1)
542 return (size_t)-1;
543
544 return res;
545 }
546
547 bool usable()
548 { return TRUE; }
549
550public:
551 iconv_t m2w, w2m;
1cd52418
OK
552};
553#endif
554
555#ifdef __WIN32__
556class CP_CharSet : public wxCharacterSet
557{
558public:
f1339c56
RR
559 CP_CharSet(const wxChar*name)
560 : wxCharacterSet(name), CodePage(CharsetToCodepage(name)) {}
561
562 size_t MB2WC(wchar_t*buf, const char*psz, size_t n)
563 {
564 size_t len = MultiByteToWideChar(CodePage,0,psz,-1,buf,buf?n:0);
565 return len ? len : (size_t)-1;
566 }
567
568 size_t WC2MB(char*buf, const wchar_t*psz, size_t n)
569 {
570 size_t len = WideCharToMultiByte(CodePage,0,psz,-1,buf,buf?n:0,NULL,NULL);
571 return len ? len : (size_t)-1;
572 }
573
574 bool usable()
575 { return CodePage!=-1; }
576
577public:
578 long CodePage;
1cd52418
OK
579};
580#endif
581
582class EC_CharSet : public wxCharacterSet
583{
6001e347 584public:
f1339c56
RR
585 // temporarily just use wxEncodingConverter stuff,
586 // so that it works while a better implementation is built
587 EC_CharSet(const wxChar*name) : wxCharacterSet(name), enc(wxFONTENCODING_SYSTEM)
588 {
589 if (name)
590 enc = wxTheFontMapper->CharsetToEncoding(name, FALSE);
591 m2w.Init(enc, wxFONTENCODING_UNICODE);
592 w2m.Init(wxFONTENCODING_UNICODE, enc);
593 }
594
595 size_t MB2WC(wchar_t*buf, const char*psz, size_t n)
596 {
597 size_t inbuf = strlen(psz);
598 fprintf(stderr,"EC Convert to WC using %d\n",enc);
599 if (buf) m2w.Convert(psz,buf);
600 return inbuf;
601 }
602
603 size_t WC2MB(char*buf, const wchar_t*psz, size_t n)
604 {
1cd52418 605#if defined(__BORLANDC__) && (__BORLANDC__ > 0x530)
f1339c56 606 size_t inbuf = std::wcslen(psz);
1cd52418 607#else
f1339c56 608 size_t inbuf = ::wcslen(psz);
1cd52418 609#endif
f1339c56
RR
610 fprintf(stderr,"EC Convert from WC using %d\n",enc);
611 if (buf)
612 w2m.Convert(psz,buf);
613
614 return inbuf;
615 }
616
617 bool usable()
618 { return (enc!=wxFONTENCODING_SYSTEM) && (enc!=wxFONTENCODING_DEFAULT); }
619
620public:
621 wxFontEncoding enc;
622 wxEncodingConverter m2w, w2m;
f6bcfd97 623};
6001e347 624
f6bcfd97 625static wxCharacterSet *wxGetCharacterSet(const wxChar *name)
6001e347 626{
f1339c56
RR
627 wxCharacterSet *cset = NULL;
628 if (name)
629 {
630 if (!wxStricmp(name, wxT("UTF8")) || !wxStricmp(name, wxT("UTF-8")))
631 {
632 cset = new ID_CharSet(name, &wxConvUTF8);
633 }
634 else
635 {
1cd52418 636#ifdef HAVE_ICONV_H
f1339c56 637 cset = new IC_CharSet(name); // may not take NULL
1cd52418 638#endif
f1339c56 639 }
1cd52418 640 }
f1339c56
RR
641
642 if (cset && cset->usable()) return cset;
643 if (cset) delete cset;
1cd52418 644#ifdef __WIN32__
f1339c56
RR
645 cset = new CP_CharSet(name); // may take NULL
646 if (cset->usable()) return cset;
1cd52418 647#endif
f1339c56
RR
648 if (cset) delete cset;
649 cset = new EC_CharSet(name);
650 if (cset->usable()) return cset;
651 delete cset;
652 return NULL;
6001e347
RR
653}
654
6001e347
RR
655wxCSConv::wxCSConv(const wxChar *charset)
656{
f1339c56
RR
657 m_name = (wxChar *) NULL;
658 m_cset = (wxCharacterSet *) NULL;
659 m_deferred = TRUE;
660 SetName(charset);
6001e347
RR
661}
662
663wxCSConv::~wxCSConv()
664{
f1339c56
RR
665 if (m_name) free(m_name);
666 if (m_cset) delete m_cset;
6001e347
RR
667}
668
669void wxCSConv::SetName(const wxChar *charset)
670{
f1339c56
RR
671 if (charset)
672 {
673 m_name = wxStrdup(charset);
674 m_deferred = TRUE;
675 }
6001e347
RR
676}
677
678void wxCSConv::LoadNow()
679{
223d09f6 680// wxPrintf(wxT("Conversion request\n"));
f1339c56
RR
681 if (m_deferred)
682 {
683 if (!m_name)
684 {
6001e347 685#ifdef __UNIX__
1cd52418 686#if defined(HAVE_LANGINFO_H) && defined(CODESET)
f1339c56
RR
687 // GNU libc provides current character set this way
688 char*alang = nl_langinfo(CODESET);
689 if (alang)
690 {
691 SetName(wxConvLibc.cMB2WX(alang));
692 }
693 else
1cd52418 694#endif
f1339c56
RR
695 {
696 // if we can't get at the character set directly,
697 // try to see if it's in the environment variables
698 // (in most cases this won't work, but I was out of ideas)
699 wxChar *lang = wxGetenv(wxT("LC_ALL"));
700 if (!lang) lang = wxGetenv(wxT("LC_CTYPE"));
701 if (!lang) lang = wxGetenv(wxT("LANG"));
702 wxChar *dot = lang ? wxStrchr(lang, wxT('.')) : (wxChar *)NULL;
703 if (dot) SetName(dot+1);
704 }
6001e347 705#endif
f1339c56
RR
706 }
707 m_cset = wxGetCharacterSet(m_name);
708 m_deferred = FALSE;
6001e347 709 }
6001e347
RR
710}
711
712size_t wxCSConv::MB2WC(wchar_t *buf, const char *psz, size_t n) const
713{
f1339c56
RR
714 ((wxCSConv *)this)->LoadNow(); // discard constness
715
716 if (m_cset)
717 return m_cset->MB2WC(buf, psz, n);
718
719 // latin-1 (direct)
720 size_t len=strlen(psz);
721
722 if (buf)
723 {
724 for (size_t c=0; c<=len; c++)
725 buf[c] = (unsigned char)(psz[c]);
726 }
727
728 return len;
6001e347
RR
729}
730
731size_t wxCSConv::WC2MB(char *buf, const wchar_t *psz, size_t n) const
732{
f1339c56
RR
733 ((wxCSConv *)this)->LoadNow(); // discard constness
734
735 if (m_cset)
736 return m_cset->WC2MB(buf, psz, n);
1cd52418 737
f1339c56 738 // latin-1 (direct)
d834f22c 739#if defined(__BORLANDC__) && (__BORLANDC__ > 0x530)
f1339c56 740 size_t len=std::wcslen(psz);
d834f22c 741#else
f1339c56 742 size_t len=::wcslen(psz);
d834f22c 743#endif
f1339c56
RR
744 if (buf)
745 {
746 for (size_t c=0; c<=len; c++)
747 buf[c] = (psz[c]>0xff) ? '?' : psz[c];
748 }
749
750 return len;
6001e347
RR
751}
752
1cd52418
OK
753#ifdef HAVE_ICONV_H
754class IC_CharSetConverter
755{
756public:
f1339c56
RR
757 IC_CharSetConverter(IC_CharSet*from,IC_CharSet*to)
758 { cnv = iconv_open(wxConvLibc.cWX2MB(to->cname),wxConvLibc.cWX2MB(from->cname)); }
759
760 ~IC_CharSetConverter()
761 { if (cnv!=(iconv_t)-1) iconv_close(cnv); }
762
763 size_t Convert(char*buf, const char*psz, size_t n)
764 {
765 size_t inbuf = strlen(psz);
766 size_t outbuf = n;
95c8801c 767#ifdef WX_ICONV_TAKES_CHAR
f1339c56 768 size_t res = iconv( cnv, (char**)&psz, &inbuf, &buf, &outbuf );
95c8801c
VS
769#else
770 size_t res = iconv( cnv, &psz, &inbuf, &buf, &outbuf );
771#endif
f1339c56
RR
772 if (res==(size_t)-1) return (size_t)-1;
773 return n-outbuf;
774 }
775
776public:
777 iconv_t cnv;
1cd52418
OK
778};
779#endif
780
781class EC_CharSetConverter
782{
783public:
f1339c56
RR
784 EC_CharSetConverter(EC_CharSet*from,EC_CharSet*to)
785 { cnv.Init(from->enc,to->enc); }
786
787 size_t Convert(char*buf, const char*psz, size_t n)
788 {
789 size_t inbuf = strlen(psz);
790 if (buf) cnv.Convert(psz,buf);
791 return inbuf;
792 }
793
794public:
795 wxEncodingConverter cnv;
1cd52418
OK
796};
797
f6bcfd97
BP
798#else // !wxUSE_WCHAR_T
799
800// ----------------------------------------------------------------------------
801// stand-ins in absence of wchar_t
802// ----------------------------------------------------------------------------
803
804WXDLLEXPORT_DATA(wxMBConv) wxConvLibc, wxConvFile;
805
806#endif // wxUSE_WCHAR_T
6001e347
RR
807
808