1 /////////////////////////////////////////////////////////////////////////////
3 // Purpose: Unicode conversion classes
4 // Author: Ove Kaaven, Robert Roebling, Vadim Zeitlin, Vaclav Slavik
8 // Copyright: (c) 1999 Ove Kaaven, Robert Roebling, Vadim Zeitlin, Vaclav Slavik
9 // Licence: wxWindows license
10 /////////////////////////////////////////////////////////////////////////////
12 // ============================================================================
14 // ============================================================================
16 // ----------------------------------------------------------------------------
18 // ----------------------------------------------------------------------------
21 #pragma implementation "strconv.h"
24 // For compilers that support precompilation, includes "wx.h".
25 #include "wx/wxprec.h"
32 #include "wx/msw/private.h"
42 #include "wx/strconv.h"
46 // ----------------------------------------------------------------------------
48 // ----------------------------------------------------------------------------
50 WXDLLEXPORT_DATA(wxMBConv
*) wxConvCurrent
= &wxConvLibc
;
53 // ============================================================================
55 // ============================================================================
71 #define BSWAP_UCS4(str, len) { unsigned _c; for (_c=0; _c<len; _c++) str[_c]=wxUINT32_SWAP_ALWAYS(str[_c]); }
72 #define BSWAP_UTF16(str, len) { unsigned _c; for (_c=0; _c<len; _c++) str[_c]=wxUINT16_SWAP_ALWAYS(str[_c]); }
74 // under Unix SIZEOF_WCHAR_T is defined by configure, but on other platforms
75 // it might not be defined, so assume the most common value (2 bytes)
76 #ifndef SIZEOF_WCHAR_T
77 #define SIZEOF_WCHAR_T 2
78 #endif // !defined(SIZEOF_WCHAR_T)
80 #if SIZEOF_WCHAR_T == 4
81 #define WC_NAME "UCS4"
82 #define WC_BSWAP BSWAP_UCS4
83 #ifdef WORDS_BIGENDIAN
84 #define WC_NAME_BEST "UCS-4BE"
86 #define WC_NAME_BEST "UCS-4LE"
88 #elif SIZEOF_WCHAR_T == 2
89 #define WC_NAME "UTF16"
90 #define WC_BSWAP BSWAP_UTF16
92 #ifdef WORDS_BIGENDIAN
93 #define WC_NAME_BEST "UTF-16BE"
95 #define WC_NAME_BEST "UTF-16LE"
97 #else // sizeof(wchar_t) != 2 nor 4
98 // I don't know what to do about this
99 #error "Weird sizeof(wchar_t): please report your platform details to wx-users mailing list"
105 static size_t encode_utf16(wxUint32 input
, wchar_t *output
)
109 if (output
) *output
++ = input
;
112 else if (input
>=0x110000)
120 *output
++ = (input
>> 10)+0xd7c0;
121 *output
++ = (input
&0x3ff)+0xdc00;
127 static size_t decode_utf16(const wchar_t* input
, wxUint32
& output
)
129 if ((*input
<0xd800) || (*input
>0xdfff))
134 else if ((input
[1]<0xdc00) || (input
[1]>=0xdfff))
141 output
= ((input
[0] - 0xd7c0) << 10) + (input
[1] - 0xdc00);
148 // ----------------------------------------------------------------------------
150 // ----------------------------------------------------------------------------
152 WXDLLEXPORT_DATA(wxMBConv
) wxConvLibc
;
154 size_t wxMBConv::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
156 return wxMB2WC(buf
, psz
, n
);
159 size_t wxMBConv::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
161 return wxWC2MB(buf
, psz
, n
);
164 const wxWCharBuffer
wxMBConv::cMB2WC(const char *psz
) const
168 size_t nLen
= MB2WC((wchar_t *) NULL
, psz
, 0);
169 if (nLen
== (size_t)-1)
170 return wxWCharBuffer((wchar_t *) NULL
);
171 wxWCharBuffer
buf(nLen
);
172 MB2WC((wchar_t *)(const wchar_t *) buf
, psz
, nLen
);
176 return wxWCharBuffer((wchar_t *) NULL
);
179 const wxCharBuffer
wxMBConv::cWC2MB(const wchar_t *psz
) const
183 size_t nLen
= WC2MB((char *) NULL
, psz
, 0);
184 if (nLen
== (size_t)-1)
185 return wxCharBuffer((char *) NULL
);
186 wxCharBuffer
buf(nLen
);
187 WC2MB((char *)(const char *) buf
, psz
, nLen
);
191 return wxCharBuffer((char *) NULL
);
194 // ----------------------------------------------------------------------------
195 // standard file conversion
196 // ----------------------------------------------------------------------------
198 WXDLLEXPORT_DATA(wxMBConvFile
) wxConvFile
;
200 // just use the libc conversion for now
201 size_t wxMBConvFile::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
203 return wxMB2WC(buf
, psz
, n
);
206 size_t wxMBConvFile::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
208 return wxWC2MB(buf
, psz
, n
);
211 // ----------------------------------------------------------------------------
212 // standard gdk conversion
213 // ----------------------------------------------------------------------------
217 WXDLLEXPORT_DATA(wxMBConvGdk
) wxConvGdk
;
221 size_t wxMBConvGdk::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
225 return gdk_mbstowcs((GdkWChar
*)buf
, psz
, n
);
229 GdkWChar
*nbuf
= new GdkWChar
[n
=strlen(psz
)];
230 size_t len
= gdk_mbstowcs(nbuf
, psz
, n
);
236 size_t wxMBConvGdk::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
238 char *mbstr
= gdk_wcstombs((GdkWChar
*)psz
);
239 size_t len
= mbstr
? strlen(mbstr
) : 0;
244 memcpy(buf
, psz
, len
);
253 // ----------------------------------------------------------------------------
255 // ----------------------------------------------------------------------------
257 WXDLLEXPORT_DATA(wxMBConvUTF7
) wxConvUTF7
;
260 static char utf7_setD
[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
261 "abcdefghijklmnopqrstuvwxyz"
262 "0123456789'(),-./:?";
263 static char utf7_setO
[]="!\"#$%&*;<=>@[]^_`{|}";
264 static char utf7_setB
[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
265 "abcdefghijklmnopqrstuvwxyz"
269 // TODO: write actual implementations of UTF-7 here
270 size_t wxMBConvUTF7::MB2WC(wchar_t * WXUNUSED(buf
),
271 const char * WXUNUSED(psz
),
272 size_t WXUNUSED(n
)) const
277 size_t wxMBConvUTF7::WC2MB(char * WXUNUSED(buf
),
278 const wchar_t * WXUNUSED(psz
),
279 size_t WXUNUSED(n
)) const
284 // ----------------------------------------------------------------------------
286 // ----------------------------------------------------------------------------
288 WXDLLEXPORT_DATA(wxMBConvUTF8
) wxConvUTF8
;
290 static wxUint32 utf8_max
[]=
291 { 0x7f, 0x7ff, 0xffff, 0x1fffff, 0x3ffffff, 0x7fffffff, 0xffffffff };
293 size_t wxMBConvUTF8::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
297 while (*psz
&& ((!buf
) || (len
< n
)))
299 unsigned char cc
= *psz
++, fc
= cc
;
301 for (cnt
= 0; fc
& 0x80; cnt
++)
315 // invalid UTF-8 sequence
320 unsigned ocnt
= cnt
- 1;
321 wxUint32 res
= cc
& (0x3f >> cnt
);
325 if ((cc
& 0xC0) != 0x80)
327 // invalid UTF-8 sequence
330 res
= (res
<< 6) | (cc
& 0x3f);
332 if (res
<= utf8_max
[ocnt
])
334 // illegal UTF-8 encoding
338 size_t pa
= encode_utf16(res
, buf
);
339 if (pa
== (size_t)-1)
352 if (buf
&& (len
< n
))
357 size_t wxMBConvUTF8::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
361 while (*psz
&& ((!buf
) || (len
< n
)))
365 size_t pa
= decode_utf16(psz
, cc
);
366 psz
+= (pa
== (size_t)-1) ? 1 : pa
;
368 cc
=(*psz
++) & 0x7fffffff;
371 for (cnt
= 0; cc
> utf8_max
[cnt
]; cnt
++) {}
385 *buf
++ = (-128 >> cnt
) | ((cc
>> (cnt
* 6)) & (0x3f >> cnt
));
387 *buf
++ = 0x80 | ((cc
>> (cnt
* 6)) & 0x3f);
392 if (buf
&& (len
<n
)) *buf
= 0;
396 // ----------------------------------------------------------------------------
397 // specified character set
398 // ----------------------------------------------------------------------------
400 WXDLLEXPORT_DATA(wxCSConv
) wxConvLocal((const wxChar
*)NULL
);
402 #include "wx/encconv.h"
403 #include "wx/fontmap.h"
405 // TODO: add some tables here
406 // - perhaps common encodings to common codepages (for Win32)
407 // - perhaps common encodings to objects ("UTF8" -> wxConvUTF8)
408 // - move wxEncodingConverter meat in here
410 #if defined(__WIN32__) && !defined(__WXMICROWIN__)
414 // VZ: the new version of wxCharsetToCodepage() is more politically correct
415 // and should work on other Windows versions as well but the old version is
416 // still needed for !wxUSE_FONTMAP || !wxUSE_GUI case
418 extern long wxEncodingToCodepage(wxFontEncoding encoding
)
420 // translate encoding into the Windows CHARSET
421 wxNativeEncodingInfo natveEncInfo
;
422 if ( !wxGetNativeFontEncoding(encoding
, &natveEncInfo
) )
425 // translate CHARSET to code page
426 CHARSETINFO csetInfo
;
427 if ( !::TranslateCharsetInfo((DWORD
*)(DWORD
)natveEncInfo
.charset
,
431 wxLogLastError(_T("TranslateCharsetInfo(TCI_SRCCHARSET)"));
436 return csetInfo
.ciACP
;
441 extern long wxCharsetToCodepage(const wxChar
*name
)
443 // first get the font encoding for this charset
447 wxFontEncoding enc
= wxTheFontMapper
->CharsetToEncoding(name
, FALSE
);
448 if ( enc
== wxFONTENCODING_SYSTEM
)
451 // then use the helper function
452 return wxEncodingToCodepage(enc
);
455 #endif // wxUSE_FONTMAP
459 // include old wxCharsetToCodepage() by OK if needed
460 #if !wxUSE_GUI || !wxUSE_FONTMAP
462 #include "wx/msw/registry.h"
464 // this should work if Internet Explorer is installed
465 extern long wxCharsetToCodepage(const wxChar
*name
)
474 wxString
path(wxT("MIME\\Database\\Charset\\"));
476 wxRegKey
key(wxRegKey::HKCR
, path
);
478 if (!key
.Exists()) break;
480 // two cases: either there's an AliasForCharset string,
481 // or there are Codepage and InternetEncoding dwords.
482 // The InternetEncoding gives us the actual encoding,
483 // the Codepage just says which Windows character set to
484 // use when displaying the data.
485 if (key
.HasValue(wxT("InternetEncoding")) &&
486 key
.QueryValue(wxT("InternetEncoding"), &CP
)) break;
488 // no encoding, see if it's an alias
489 if (!key
.HasValue(wxT("AliasForCharset")) ||
490 !key
.QueryValue(wxT("AliasForCharset"), cn
)) break;
496 #endif // !wxUSE_GUI || !wxUSE_FONTMAP
500 // ============================================================================
501 // wxCharacterSet and derived classes
502 // ============================================================================
504 // ----------------------------------------------------------------------------
505 // wxCharacterSet is the ABC for the classes below
506 // ----------------------------------------------------------------------------
511 wxCharacterSet(const wxChar
*name
) : cname(name
) {}
512 virtual ~wxCharacterSet() {}
513 virtual size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
) = 0;
514 virtual size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
) = 0;
515 virtual bool usable() const = 0;
520 // ----------------------------------------------------------------------------
521 // ID_CharSet: implementation of wxCharacterSet using an existing wxMBConv
522 // ----------------------------------------------------------------------------
524 class ID_CharSet
: public wxCharacterSet
527 ID_CharSet(const wxChar
*name
, wxMBConv
*cnv
)
528 : wxCharacterSet(name
), work(cnv
) {}
530 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
531 { return work
? work
->MB2WC(buf
,psz
,n
) : (size_t)-1; }
533 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
534 { return work
? work
->WC2MB(buf
,psz
,n
) : (size_t)-1; }
537 { return work
!=NULL
; }
543 // ============================================================================
544 // The classes doing conversion using the iconv_xxx() functions
545 // ============================================================================
549 // VS: glibc 2.1.3 is broken in that iconv() conversion to/from UCS4 fails with E2BIG
550 // if output buffer is _exactly_ as big as needed. Such case is (unless there's
551 // yet another bug in glibc) the only case when iconv() returns with (size_t)-1
552 // (which means error) and says there are 0 bytes left in the input buffer --
553 // when _real_ error occurs, bytes-left-in-input buffer is non-zero. Hence,
554 // this alternative test for iconv() failure.
555 // [This bug does not appear in glibc 2.2.]
556 #if defined(__GLIBC__) && __GLIBC__ == 2 && __GLIBC_MINOR__ <= 1
557 #define ICONV_FAILED(cres, bufLeft) ((cres == (size_t)-1) && \
558 (errno != E2BIG || bufLeft != 0))
560 #define ICONV_FAILED(cres, bufLeft) (cres == (size_t)-1)
563 #define ICONV_CHAR_CAST(x) ((ICONV_CONST char **)(x))
565 // ----------------------------------------------------------------------------
566 // IC_CharSet: encapsulates an iconv character set
567 // ----------------------------------------------------------------------------
569 class IC_CharSet
: public wxCharacterSet
572 IC_CharSet(const wxChar
*name
);
573 virtual ~IC_CharSet();
575 virtual size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
);
576 virtual size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
);
579 { return (m2w
!= (iconv_t
)-1) && (w2m
!= (iconv_t
)-1); }
582 // the iconv handlers used to translate from multibyte to wide char and in
583 // the other direction
588 // the name (for iconv_open()) of a wide char charset - if none is
589 // available on this machine, it will remain NULL
590 static const char *ms_wcCharsetName
;
592 // true if the wide char encoding we use (i.e. ms_wcCharsetName) has
593 // different endian-ness than the native one
594 static bool ms_wcNeedsSwap
;
597 const char *IC_CharSet::ms_wcCharsetName
= NULL
;
598 bool IC_CharSet::ms_wcNeedsSwap
= FALSE
;
600 IC_CharSet::IC_CharSet(const wxChar
*name
)
601 : wxCharacterSet(name
)
603 // check for charset that represents wchar_t:
604 if (ms_wcCharsetName
== NULL
)
606 ms_wcNeedsSwap
= FALSE
;
608 // try charset with explicit bytesex info (e.g. "UCS-4LE"):
609 ms_wcCharsetName
= WC_NAME_BEST
;
610 m2w
= iconv_open(ms_wcCharsetName
, wxConvLibc
.cWX2MB(name
));
612 if (m2w
== (iconv_t
)-1)
614 // try charset w/o bytesex info (e.g. "UCS4")
615 // and check for bytesex ourselves:
616 ms_wcCharsetName
= WC_NAME
;
617 m2w
= iconv_open(ms_wcCharsetName
, wxConvLibc
.cWX2MB(name
));
619 // last resort: check whether iconv knows the WCHAR_T pseudo-charset
620 if (m2w
== (iconv_t
)-1)
622 ms_wcCharsetName
= "WCHAR_T";
623 m2w
= iconv_open(ms_wcCharsetName
, wxConvLibc
.cWX2MB(name
));
626 if (m2w
!= (iconv_t
)-1)
628 char buf
[2], *bufPtr
;
629 wchar_t wbuf
[2], *wbufPtr
;
637 outsz
= SIZEOF_WCHAR_T
* 2;
641 res
= iconv(m2w
, ICONV_CHAR_CAST(&bufPtr
), &insz
,
642 (char**)&wbufPtr
, &outsz
);
644 if (ICONV_FAILED(res
, insz
))
646 ms_wcCharsetName
= NULL
;
647 wxLogLastError(wxT("iconv"));
648 wxLogError(_("Convertion to charset '%s' doesn't work."), name
);
652 ms_wcNeedsSwap
= wbuf
[0] != (wchar_t)buf
[0];
657 ms_wcCharsetName
= NULL
;
659 // VS: we must not output an error here, since wxWindows will safely
660 // fall back to using wxEncodingConverter.
661 wxLogTrace(wxT("strconv"), wxT("Impossible to convert to/from charset '%s' with iconv, falling back to wxEncodingConverter."), name
);
665 wxLogTrace(wxT("strconv"), wxT("wchar_t charset is '%s', needs swap: %i"), ms_wcCharsetName
, ms_wcNeedsSwap
);
667 else // we already have ms_wcCharsetName
669 m2w
= iconv_open(ms_wcCharsetName
, wxConvLibc
.cWX2MB(name
));
672 // NB: don't ever pass NULL to iconv_open(), it may crash!
673 if ( ms_wcCharsetName
)
675 w2m
= iconv_open(wxConvLibc
.cWX2MB(name
), ms_wcCharsetName
);
683 IC_CharSet::~IC_CharSet()
685 if ( m2w
!= (iconv_t
)-1 )
687 if ( w2m
!= (iconv_t
)-1 )
691 size_t IC_CharSet::MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
693 size_t inbuf
= strlen(psz
);
694 size_t outbuf
= n
* SIZEOF_WCHAR_T
;
696 // VS: Use these instead of psz, buf because iconv() modifies its arguments:
697 wchar_t *bufPtr
= buf
;
698 const char *pszPtr
= psz
;
702 // have destination buffer, convert there
704 ICONV_CHAR_CAST(&pszPtr
), &inbuf
,
705 (char**)&bufPtr
, &outbuf
);
706 res
= n
- (outbuf
/ SIZEOF_WCHAR_T
);
710 // convert to native endianness
711 WC_BSWAP(buf
/* _not_ bufPtr */, res
)
716 // no destination buffer... convert using temp buffer
717 // to calculate destination buffer requirement
722 outbuf
= 8*SIZEOF_WCHAR_T
;
725 ICONV_CHAR_CAST(&pszPtr
), &inbuf
,
726 (char**)&bufPtr
, &outbuf
);
728 res
+= 8-(outbuf
/SIZEOF_WCHAR_T
);
729 } while ((cres
==(size_t)-1) && (errno
==E2BIG
));
732 if (ICONV_FAILED(cres
, inbuf
))
734 //VS: it is ok if iconv fails, hence trace only
735 wxLogTrace(wxT("strconv"), wxT("iconv failed: %s"), wxSysErrorMsg(wxSysErrorCode()));
742 size_t IC_CharSet::WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
744 #if defined(__BORLANDC__) && (__BORLANDC__ > 0x530)
745 size_t inbuf
= std::wcslen(psz
) * SIZEOF_WCHAR_T
;
747 size_t inbuf
= ::wcslen(psz
) * SIZEOF_WCHAR_T
;
756 // need to copy to temp buffer to switch endianness
757 // this absolutely doesn't rock!
758 // (no, doing WC_BSWAP twice on the original buffer won't help, as it
759 // could be in read-only memory, or be accessed in some other thread)
760 tmpbuf
=(wchar_t*)malloc((inbuf
+1)*SIZEOF_WCHAR_T
);
761 memcpy(tmpbuf
,psz
,(inbuf
+1)*SIZEOF_WCHAR_T
);
762 WC_BSWAP(tmpbuf
, inbuf
)
768 // have destination buffer, convert there
769 cres
= iconv( w2m
, ICONV_CHAR_CAST(&psz
), &inbuf
, &buf
, &outbuf
);
775 // no destination buffer... convert using temp buffer
776 // to calculate destination buffer requirement
780 buf
= tbuf
; outbuf
= 16;
782 cres
= iconv( w2m
, ICONV_CHAR_CAST(&psz
), &inbuf
, &buf
, &outbuf
);
785 } while ((cres
==(size_t)-1) && (errno
==E2BIG
));
793 if (ICONV_FAILED(cres
, inbuf
))
795 //VS: it is ok if iconv fails, hence trace only
796 wxLogTrace(wxT("strconv"), wxT("iconv failed: %s"), wxSysErrorMsg(wxSysErrorCode()));
805 // ============================================================================
806 // Win32 conversion classes
807 // ============================================================================
809 #if defined(__WIN32__) && !defined(__WXMICROWIN__)
810 class CP_CharSet
: public wxCharacterSet
813 CP_CharSet(const wxChar
* name
)
814 : wxCharacterSet(name
)
816 m_CodePage
= wxCharsetToCodepage(name
);
819 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
822 MultiByteToWideChar(m_CodePage
, 0, psz
, -1, buf
, buf
? n
: 0);
823 //VS: returns # of written chars for buf!=NULL and the *size*
824 // of the needed buffer for buf==NULL
825 return len
? (buf
? len
: len
-1) : (size_t)-1;
828 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
830 size_t len
= WideCharToMultiByte(m_CodePage
, 0, psz
, -1, buf
,
831 buf
? n
: 0, NULL
, NULL
);
832 //VS: returns # of written chars for buf!=NULL and the *size*
833 // of the needed buffer for buf==NULL
834 return len
? (buf
? len
: len
-1) : (size_t)-1;
838 { return m_CodePage
!= -1; }
845 // ============================================================================
846 // wxEncodingConverter based conversion classes
847 // ============================================================================
851 class EC_CharSet
: public wxCharacterSet
854 // temporarily just use wxEncodingConverter stuff,
855 // so that it works while a better implementation is built
856 EC_CharSet(const wxChar
* name
) : wxCharacterSet(name
),
857 enc(wxFONTENCODING_SYSTEM
)
860 enc
= wxTheFontMapper
->CharsetToEncoding(name
, FALSE
);
862 m_ok
= m2w
.Init(enc
, wxFONTENCODING_UNICODE
) &&
863 w2m
.Init(wxFONTENCODING_UNICODE
, enc
);
866 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
868 size_t inbuf
= strlen(psz
);
870 m2w
.Convert(psz
,buf
);
874 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
876 #if ( defined(__BORLANDC__) && (__BORLANDC__ > 0x530) ) \
877 || ( defined(__MWERKS__) && defined(__WXMSW__) )
878 size_t inbuf
= std::wcslen(psz
);
880 size_t inbuf
= ::wcslen(psz
);
883 w2m
.Convert(psz
,buf
);
888 bool usable() const { return m_ok
; }
892 wxEncodingConverter m2w
, w2m
;
894 // were we initialized successfully?
898 #endif // wxUSE_FONTMAP
900 // ----------------------------------------------------------------------------
901 // the function creating the wxCharacterSet for the specified charset on the
902 // current system, trying all possibilities
903 // ----------------------------------------------------------------------------
905 static wxCharacterSet
*wxGetCharacterSet(const wxChar
*name
)
907 // check for the special case of ASCII charset
909 if ( wxTheFontMapper
->CharsetToEncoding(name
) == wxFONTENCODING_DEFAULT
)
910 #else // wxUSE_FONTMAP
912 #endif // wxUSE_FONTMAP/!wxUSE_FONTMAP
914 // don't convert at all
918 // the test above must have taken care of this case
919 wxCHECK_MSG( name
, NULL
, _T("NULL name must be wxFONTENCODING_DEFAULT") );
921 wxCharacterSet
*cset
;
923 if ( wxStricmp(name
, wxT("UTF8")) == 0 || wxStricmp(name
, wxT("UTF-8")) == 0)
925 cset
= new ID_CharSet(name
, &wxConvUTF8
);
930 cset
= new IC_CharSet(name
);
933 #endif // HAVE_ICONV/!HAVE_ICONV
936 if ( cset
->usable() )
942 #if defined(__WIN32__) && !defined(__WXMICROWIN__)
943 cset
= new CP_CharSet(name
);
944 if ( cset
->usable() )
952 cset
= new EC_CharSet(name
);
953 if ( cset
->usable() )
958 #endif // wxUSE_FONTMAP
960 wxLogError(_("Cannot convert from encoding '%s'!"), name
);
965 // ============================================================================
966 // wxCSConv implementation
967 // ============================================================================
969 wxCSConv::wxCSConv(const wxChar
*charset
)
971 m_name
= (wxChar
*)NULL
;
972 m_cset
= (wxCharacterSet
*) NULL
;
978 wxCSConv::~wxCSConv()
984 void wxCSConv::SetName(const wxChar
*charset
)
988 m_name
= wxStrdup(charset
);
993 void wxCSConv::LoadNow()
999 wxString name
= wxLocale::GetSystemEncodingName();
1000 if ( !name
.empty() )
1004 // wxGetCharacterSet() complains about NULL name
1005 m_cset
= m_name
? wxGetCharacterSet(m_name
) : NULL
;
1010 size_t wxCSConv::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
1012 ((wxCSConv
*)this)->LoadNow(); // discard constness
1015 return m_cset
->MB2WC(buf
, psz
, n
);
1018 size_t len
= strlen(psz
);
1022 for (size_t c
= 0; c
<= len
; c
++)
1023 buf
[c
] = (unsigned char)(psz
[c
]);
1029 size_t wxCSConv::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
1031 ((wxCSConv
*)this)->LoadNow(); // discard constness
1034 return m_cset
->WC2MB(buf
, psz
, n
);
1037 #if ( defined(__BORLANDC__) && (__BORLANDC__ > 0x530) ) \
1038 || ( defined(__MWERKS__) && defined(__WXMSW__) )
1039 size_t len
=std::wcslen(psz
);
1041 size_t len
=::wcslen(psz
);
1045 for (size_t c
= 0; c
<= len
; c
++)
1046 buf
[c
] = (psz
[c
] > 0xff) ? '?' : psz
[c
];
1052 #else // !wxUSE_WCHAR_T
1054 // ----------------------------------------------------------------------------
1055 // stand-ins in absence of wchar_t
1056 // ----------------------------------------------------------------------------
1058 WXDLLEXPORT_DATA(wxMBConv
) wxConvLibc
, wxConvFile
;
1060 #endif // wxUSE_WCHAR_T