1 /////////////////////////////////////////////////////////////////////////////
3 // Purpose: Unicode conversion classes
4 // Author: Ove Kaaven, Robert Roebling, Vadim Zeitlin, Vaclav Slavik
8 // Copyright: (c) 1999 Ove Kaaven, Robert Roebling, Vadim Zeitlin, Vaclav Slavik
9 // Licence: wxWindows license
10 /////////////////////////////////////////////////////////////////////////////
12 // ============================================================================
14 // ============================================================================
16 // ----------------------------------------------------------------------------
18 // ----------------------------------------------------------------------------
21 #pragma implementation "strconv.h"
24 // For compilers that support precompilation, includes "wx.h".
25 #include "wx/wxprec.h"
32 #include "wx/msw/private.h"
42 #include "wx/strconv.h"
46 // ----------------------------------------------------------------------------
48 // ----------------------------------------------------------------------------
50 WXDLLEXPORT_DATA(wxMBConv
*) wxConvCurrent
= &wxConvLibc
;
53 // ============================================================================
55 // ============================================================================
71 #define BSWAP_UCS4(str, len) { unsigned _c; for (_c=0; _c<len; _c++) str[_c]=wxUINT32_SWAP_ALWAYS(str[_c]); }
72 #define BSWAP_UTF16(str, len) { unsigned _c; for (_c=0; _c<len; _c++) str[_c]=wxUINT16_SWAP_ALWAYS(str[_c]); }
74 // under Unix SIZEOF_WCHAR_T is defined by configure, but on other platforms
75 // it might not be defined - assume the most common value
76 #ifndef SIZEOF_WCHAR_T
77 #define SIZEOF_WCHAR_T 2
78 #endif // !defined(SIZEOF_WCHAR_T)
80 #if SIZEOF_WCHAR_T == 4
81 #define WC_NAME "UCS4"
82 #define WC_BSWAP BSWAP_UCS4
83 #ifdef WORDS_BIGENDIAN
84 #define WC_NAME_BEST "UCS-4BE"
86 #define WC_NAME_BEST "UCS-4LE"
88 #elif SIZEOF_WCHAR_T == 2
89 #define WC_NAME "UTF16"
90 #define WC_BSWAP BSWAP_UTF16
92 #ifdef WORDS_BIGENDIAN
93 #define WC_NAME_BEST "UTF-16BE"
95 #define WC_NAME_BEST "UTF-16LE"
97 #else // sizeof(wchar_t) != 2 nor 4
98 // I don't know what to do about this
99 #error "Weird sizeof(wchar_t): please report your platform details to wx-users mailing list"
// Writes the Unicode value `input` to `output` as UTF-16 code units.
//
// input  - the 32-bit character value to encode.
// output - destination for the code unit(s); the first store below is guarded
//          by a NULL check on this pointer.
//
// The return statements are not visible in this excerpt. A caller in this
// file compares the result against (size_t)-1, so that value presumably
// signals an unencodable input - TODO confirm.
105 static size_t encode_utf16(wxUint32 input
, wchar_t *output
)
// Single-unit path: store the value unchanged, but only when an output
// buffer was supplied. The condition that selects this path is not visible
// in this excerpt.
109 if (output
) *output
++ = input
;
// 0x110000 is one past the last value a surrogate pair can express
// (0x10FFFF). How this case is handled is not visible here.
112 else if (input
>=0x110000)
// Surrogate pair. Adding 0xd7c0 to (input >> 10) is the same as
// 0xd800 + ((input - 0x10000) >> 10), because 0x10000 >> 10 == 0x40 and
// 0xd800 - 0x40 == 0xd7c0.
120 *output
++ = (input
>> 10)+0xd7c0;
// Second unit: 0xdc00 plus the low ten bits of the value.
121 *output
++ = (input
&0x3ff)+0xdc00;
// Reads one character from the UTF-16 sequence at `input` into `output`.
//
// input  - pointer to the first code unit; input[1] is also read when
//          input[0] lies in the 0xd800..0xdfff range.
// output - receives the decoded 32-bit value.
//
// The return statements are not visible in this excerpt. A caller in this
// file advances its pointer by the result, or by 1 when the result is
// (size_t)-1, so the result is presumably the number of units consumed -
// TODO confirm.
127 static size_t decode_utf16(const wchar_t* input
, wxUint32
& output
)
// First unit outside 0xd800..0xdfff: not a surrogate.
129 if ((*input
<0xd800) || (*input
>0xdfff))
// Second unit is not accepted as the trailing half of a pair.
// NOTE(review): the upper bound is written as >= 0xdfff, so 0xdfff itself is
// rejected even though the UTF-16 low-surrogate range is 0xDC00..0xDFFF
// inclusive - confirm whether "> 0xdfff" was intended.
134 else if ((input
[1]<0xdc00) || (input
[1]>=0xdfff))
// Combine the pair. Subtracting 0xd7c0 (rather than 0xd800) from the first
// unit leaves an extra 0x40, which becomes the 0x10000 offset after the
// shift by 10.
141 output
= ((input
[0] - 0xd7c0) << 10) + (input
[1] - 0xdc00);
148 // ----------------------------------------------------------------------------
150 // ----------------------------------------------------------------------------
152 WXDLLEXPORT_DATA(wxMBConv
) wxConvLibc
;
154 size_t wxMBConv::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
156 return wxMB2WC(buf
, psz
, n
);
159 size_t wxMBConv::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
161 return wxWC2MB(buf
, psz
, n
);
// Converts the multibyte string `psz` and returns the result in a
// wxWCharBuffer. Uses two calls to MB2WC(): one to measure, one to convert.
//
// psz - the multibyte string to convert.
//
// Returns a buffer constructed from a NULL pointer when the measuring call
// reports (size_t)-1.
164 const wxWCharBuffer
wxMBConv::cMB2WC(const char *psz
) const
// First pass: no destination and n == 0, used only to obtain the length.
168 size_t nLen
= MB2WC((wchar_t *) NULL
, psz
, 0);
// (size_t)-1 from MB2WC() means the conversion failed.
169 if (nLen
== (size_t)-1)
170 return wxWCharBuffer((wchar_t *) NULL
);
// Buffer constructed from the measured length.
171 wxWCharBuffer
buf(nLen
);
// Second pass: convert into the buffer. The inner cast obtains the buffer's
// const wchar_t* and the outer cast drops the const so it can be written to.
172 MB2WC((wchar_t *)(const wchar_t *) buf
, psz
, nLen
);
// Fallback returning a NULL buffer; the condition that leads here is not
// visible in this excerpt.
176 return wxWCharBuffer((wchar_t *) NULL
);
// Converts the wide string `psz` and returns the result in a wxCharBuffer.
// Uses two calls to WC2MB(): one to measure, one to convert.
//
// psz - the wide-character string to convert.
//
// Returns a buffer constructed from a NULL pointer when the measuring call
// reports (size_t)-1.
179 const wxCharBuffer
wxMBConv::cWC2MB(const wchar_t *psz
) const
// First pass: no destination and n == 0, used only to obtain the length.
183 size_t nLen
= WC2MB((char *) NULL
, psz
, 0);
// (size_t)-1 from WC2MB() means the conversion failed.
184 if (nLen
== (size_t)-1)
185 return wxCharBuffer((char *) NULL
);
// Buffer constructed from the measured length.
186 wxCharBuffer
buf(nLen
);
// Second pass: convert into the buffer. The inner cast obtains the buffer's
// const char* and the outer cast drops the const so it can be written to.
187 WC2MB((char *)(const char *) buf
, psz
, nLen
);
// Fallback returning a NULL buffer; the condition that leads here is not
// visible in this excerpt.
191 return wxCharBuffer((char *) NULL
);
194 // ----------------------------------------------------------------------------
195 // standard file conversion
196 // ----------------------------------------------------------------------------
198 WXDLLEXPORT_DATA(wxMBConvFile
) wxConvFile
;
200 // just use the libc conversion for now
201 size_t wxMBConvFile::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
203 return wxMB2WC(buf
, psz
, n
);
206 size_t wxMBConvFile::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
208 return wxWC2MB(buf
, psz
, n
);
211 // ----------------------------------------------------------------------------
212 // standard gdk conversion
213 // ----------------------------------------------------------------------------
217 WXDLLEXPORT_DATA(wxMBConvGdk
) wxConvGdk
;
// Multibyte-to-wide conversion implemented with gdk_mbstowcs().
//
// buf - destination, reinterpreted as GdkWChar* for the direct call.
// psz - NUL-terminated multibyte input.
// n   - element limit passed to gdk_mbstowcs(); overwritten with strlen(psz)
//       on the temporary-buffer path below.
//
// The branch that chooses between the two paths is not visible in this
// excerpt.
221 size_t wxMBConvGdk::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
// Direct path: convert straight into the caller's buffer.
// NOTE(review): the cast assumes wchar_t and GdkWChar have the same size -
// confirm.
225 return gdk_mbstowcs((GdkWChar
*)buf
, psz
, n
);
// Temporary-buffer path: allocate strlen(psz) elements (also stored into n)
// and convert there.
// NOTE(review): no delete[] of nbuf is visible in this excerpt - confirm it
// is released on every exit.
229 GdkWChar
*nbuf
= new GdkWChar
[n
=strlen(psz
)];
230 size_t len
= gdk_mbstowcs(nbuf
, psz
, n
);
// Wide-to-multibyte conversion implemented with gdk_wcstombs().
//
// buf - destination of the memcpy() below.
// psz - wide input, reinterpreted as GdkWChar* for the GDK call.
// n   - not used in the lines visible in this excerpt.
236 size_t wxMBConvGdk::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
// gdk_wcstombs() returns the converted string; a NULL result is handled by
// the length computation below.
238 char *mbstr
= gdk_wcstombs((GdkWChar
*)psz
);
// Length of the converted string, or 0 when the conversion returned NULL.
239 size_t len
= mbstr
? strlen(mbstr
) : 0;
// NOTE(review): this copies `len` bytes from psz (the wide *input*) rather
// than from mbstr (the converted result) - this looks like a bug; confirm
// that mbstr was intended as the source. Releasing mbstr is also not visible
// in this excerpt.
244 memcpy(buf
, psz
, len
);
253 // ----------------------------------------------------------------------------
255 // ----------------------------------------------------------------------------
257 WXDLLEXPORT_DATA(wxMBConvUTF7
) wxConvUTF7
;
260 static char utf7_setD
[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
261 "abcdefghijklmnopqrstuvwxyz"
262 "0123456789'(),-./:?";
263 static char utf7_setO
[]="!\"#$%&*;<=>@[]^_`{|}";
264 static char utf7_setB
[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
265 "abcdefghijklmnopqrstuvwxyz"
269 // TODO: write actual implementations of UTF-7 here
270 size_t wxMBConvUTF7::MB2WC(wchar_t * WXUNUSED(buf
),
271 const char * WXUNUSED(psz
),
272 size_t WXUNUSED(n
)) const
277 size_t wxMBConvUTF7::WC2MB(char * WXUNUSED(buf
),
278 const wchar_t * WXUNUSED(psz
),
279 size_t WXUNUSED(n
)) const
284 // ----------------------------------------------------------------------------
286 // ----------------------------------------------------------------------------
288 WXDLLEXPORT_DATA(wxMBConvUTF8
) wxConvUTF8
;
290 static wxUint32 utf8_max
[]=
291 { 0x7f, 0x7ff, 0xffff, 0x1fffff, 0x3ffffff, 0x7fffffff, 0xffffffff };
// Decodes the UTF-8 string `psz` into wide characters.
//
// buf - destination; may be NULL, in which case the loop guard below imposes
//       no output limit.
// psz - NUL-terminated UTF-8 input.
// n   - upper bound for `len` when buf is non-NULL.
//
// Several lines of this function (declarations of len and cnt, returns, and
// the bodies of some branches) are not visible in this excerpt.
293 size_t wxMBConvUTF8::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
// Run until the terminating NUL; with a buffer, also stop once len reaches n.
297 while (*psz
&& ((!buf
) || (len
< n
)))
// cc holds the byte just read; fc is a copy inspected by the loop below.
299 unsigned char cc
= *psz
++, fc
= cc
;
// Loops while the top bit of fc is set, incrementing cnt each time. The loop
// body is not visible here; presumably it shifts fc left so that cnt counts
// the leading 1 bits of the lead byte - TODO confirm.
301 for (cnt
= 0; fc
& 0x80; cnt
++)
315 // invalid UTF-8 sequence
// ocnt remembers cnt - 1 for the utf8_max lookup further down.
320 unsigned ocnt
= cnt
- 1;
// Keep only low bits of the lead byte; the mask 0x3f >> cnt narrows as cnt
// grows.
321 wxUint32 res
= cc
& (0x3f >> cnt
);
// A following byte must have the bit pattern 10xxxxxx.
325 if ((cc
& 0xC0) != 0x80)
327 // invalid UTF-8 sequence
// Append the low six bits of this byte to the accumulated value.
330 res
= (res
<< 6) | (cc
& 0x3f);
// A value at or below utf8_max[ocnt] is rejected (see the comment below).
332 if (res
<= utf8_max
[ocnt
])
334 // illegal UTF-8 encoding
// Emit the decoded value through encode_utf16(); buf is passed as is and may
// be NULL.
338 size_t pa
= encode_utf16(res
, buf
);
// (size_t)-1 from encode_utf16() is checked here; the handling is not visible.
339 if (pa
== (size_t)-1)
// A buffer exists and len is still below n; the guarded statement is not
// visible in this excerpt.
352 if (buf
&& (len
< n
))
// Encodes the wide string `psz` as UTF-8.
//
// buf - destination; may be NULL, in which case the loop guard below imposes
//       no output limit.
// psz - NUL-terminated wide-character input.
// n   - upper bound for `len` when buf is non-NULL.
//
// Several lines of this function (declarations of len, cc and cnt, returns,
// and the control flow around the stores) are not visible in this excerpt.
357 size_t wxMBConvUTF8::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
// Run until the terminating NUL; with a buffer, also stop once len reaches n.
361 while (*psz
&& ((!buf
) || (len
< n
)))
// Variant 1: read one character via decode_utf16(). On (size_t)-1 the input
// pointer still advances by one unit.
365 size_t pa
= decode_utf16(psz
, cc
);
366 psz
+= (pa
== (size_t)-1) ? 1 : pa
;
// Variant 2: take the unit directly, masked to 31 bits. Presumably the two
// variants are selected by a preprocessor conditional that is not visible
// here - TODO confirm.
368 cc
=(*psz
++) & 0x7fffffff;
// Advance cnt to the first utf8_max entry that is not below cc.
371 for (cnt
= 0; cc
> utf8_max
[cnt
]; cnt
++) {}
// Store built from two parts: (-128 >> cnt) supplies the high prefix bits
// (this relies on right-shifting a negative value being an arithmetic shift),
// and the masked shift of cc supplies the top payload bits.
385 *buf
++ = (-128 >> cnt
) | ((cc
>> (cnt
* 6)) & (0x3f >> cnt
));
// Store of the form 10xxxxxx carrying six bits of cc. How cnt changes between
// the two stores is not visible in this excerpt.
387 *buf
++ = 0x80 | ((cc
>> (cnt
* 6)) & 0x3f);
// NUL-terminate only when a buffer exists and len is still below n.
392 if (buf
&& (len
<n
)) *buf
= 0;
396 // ----------------------------------------------------------------------------
397 // specified character set
398 // ----------------------------------------------------------------------------
400 WXDLLEXPORT_DATA(wxCSConv
) wxConvLocal((const wxChar
*)NULL
);
402 #include "wx/encconv.h"
403 #include "wx/fontmap.h"
405 // TODO: add some tables here
406 // - perhaps common encodings to common codepages (for Win32)
407 // - perhaps common encodings to objects ("UTF8" -> wxConvUTF8)
408 // - move wxEncodingConverter meat in here
410 #if defined(__WIN32__) && !defined(__WXMICROWIN__)
414 // VZ: the new version of wxCharsetToCodepage() is more politically correct
415 // and should work on other Windows versions as well but the old version is
416 // still needed for !wxUSE_FONTMAP || !wxUSE_GUI case
418 extern long wxEncodingToCodepage(wxFontEncoding encoding
)
420 // translate encoding into the Windows CHARSET
421 wxNativeEncodingInfo natveEncInfo
;
422 if ( !wxGetNativeFontEncoding(encoding
, &natveEncInfo
) )
425 // translate CHARSET to code page
426 CHARSETINFO csetInfo
;
427 if ( !::TranslateCharsetInfo((DWORD
*)(DWORD
)natveEncInfo
.charset
,
431 wxLogLastError(_T("TranslateCharsetInfo(TCI_SRCCHARSET)"));
436 return csetInfo
.ciACP
;
441 extern long wxCharsetToCodepage(const wxChar
*name
)
443 // first get the font encoding for this charset
447 wxFontEncoding enc
= wxTheFontMapper
->CharsetToEncoding(name
, FALSE
);
448 if ( enc
== wxFONTENCODING_SYSTEM
)
451 // then use the helper function
452 return wxEncodingToCodepage(enc
);
455 #endif // wxUSE_FONTMAP
459 // include old wxCharsetToCodepage() by OK if needed
460 #if !wxUSE_GUI || !wxUSE_FONTMAP
462 #include "wx/msw/registry.h"
464 // this should work if Internet Exploiter is installed
465 extern long wxCharsetToCodepage(const wxChar
*name
)
474 wxString
path(wxT("MIME\\Database\\Charset\\"));
476 wxRegKey
key(wxRegKey::HKCR
, path
);
478 if (!key
.Exists()) break;
480 // two cases: either there's an AliasForCharset string,
481 // or there are Codepage and InternetEncoding dwords.
482 // The InternetEncoding gives us the actual encoding,
483 // the Codepage just says which Windows character set to
484 // use when displaying the data.
485 if (key
.HasValue(wxT("InternetEncoding")) &&
486 key
.QueryValue(wxT("InternetEncoding"), &CP
)) break;
488 // no encoding, see if it's an alias
489 if (!key
.HasValue(wxT("AliasForCharset")) ||
490 !key
.QueryValue(wxT("AliasForCharset"), cn
)) break;
496 #endif // !wxUSE_GUI || !wxUSE_FONTMAP
503 wxCharacterSet(const wxChar
*name
)
505 virtual ~wxCharacterSet()
507 virtual size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
508 { return (size_t)-1; }
509 virtual size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
510 { return (size_t)-1; }
511 virtual bool usable()
517 class ID_CharSet
: public wxCharacterSet
520 ID_CharSet(const wxChar
*name
,wxMBConv
*cnv
)
521 : wxCharacterSet(name
), work(cnv
) {}
523 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
524 { return work
? work
->MB2WC(buf
,psz
,n
) : (size_t)-1; }
526 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
527 { return work
? work
->WC2MB(buf
,psz
,n
) : (size_t)-1; }
530 { return work
!=NULL
; }
538 bool g_wcNeedsSwap
= FALSE
;
539 static const char *g_wcCharset
= NULL
;
541 // VS: glibc 2.1.3 is broken in that iconv() conversion to/from UCS4 fails with E2BIG
542 // if output buffer is _exactly_ as big as needed. Such case is (unless there's
543 // yet another bug in glibc) the only case when iconv() returns with (size_t)-1
544 // (which means error) and says there are 0 bytes left in the input buffer --
545 // when _real_ error occurs, bytes-left-in-input buffer is non-zero. Hence,
546 // this alternative test for iconv() failure.
547 // [This bug does not appear in glibc 2.2.]
548 #if defined(__GLIBC__) && __GLIBC__ == 2 && __GLIBC_MINOR__ <= 1
549 #define ICONV_FAILED(cres, bufLeft) ((cres == (size_t)-1) && \
550 (errno != E2BIG || bufLeft != 0))
552 #define ICONV_FAILED(cres, bufLeft) (cres == (size_t)-1)
555 class IC_CharSet
: public wxCharacterSet
558 IC_CharSet(const wxChar
*name
)
559 : wxCharacterSet(name
)
561 // check for charset that represents wchar_t:
562 if (g_wcCharset
== NULL
)
564 g_wcNeedsSwap
= FALSE
;
566 // try charset with explicit bytesex info (e.g. "UCS-4LE"):
567 g_wcCharset
= WC_NAME_BEST
;
568 m2w
= iconv_open(g_wcCharset
, wxConvLibc
.cWX2MB(name
));
570 if (m2w
== (iconv_t
)-1)
572 // try charset w/o bytesex info (e.g. "UCS4")
573 // and check for bytesex ourselves:
574 g_wcCharset
= WC_NAME
;
575 m2w
= iconv_open(g_wcCharset
, wxConvLibc
.cWX2MB(name
));
577 // last resort: check whether it knows the WCHAR_T pseudo-charset
578 if (m2w
== (iconv_t
)-1)
580 g_wcCharset
= "WCHAR_T";
581 m2w
= iconv_open(g_wcCharset
, wxConvLibc
.cWX2MB(name
));
584 if (m2w
!= (iconv_t
)-1)
586 char buf
[2], *bufPtr
;
587 wchar_t wbuf
[2], *wbufPtr
;
595 outsz
= SIZEOF_WCHAR_T
* 2;
599 #ifdef WX_ICONV_TAKES_CHAR
600 res
= iconv(m2w
, (char**)&bufPtr
, &insz
, (char**)&wbufPtr
, &outsz
);
602 res
= iconv(m2w
, (const char**)&bufPtr
, &insz
, (char**)&wbufPtr
, &outsz
);
604 if (ICONV_FAILED(res
, insz
))
607 wxLogLastError(wxT("iconv"));
608 wxLogError(_("Convertion to charset '%s' doesn't work."), name
);
612 g_wcNeedsSwap
= (wbuf
[0] != (wchar_t)buf
[0]);
618 wxLogError(_("Don't know how to convert to/from charset '%s'."), name
);
621 wxLogTrace(wxT("strconv"), wxT("wchar_t charset is '%s', needs swap: %i"), g_wcCharset
, g_wcNeedsSwap
);
624 m2w
= iconv_open(g_wcCharset
, wxConvLibc
.cWX2MB(name
));
626 w2m
= iconv_open(wxConvLibc
.cWX2MB(name
), g_wcCharset
);
631 if ( m2w
!= (iconv_t
)-1 )
633 if ( w2m
!= (iconv_t
)-1 )
637 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
639 size_t inbuf
= strlen(psz
);
640 size_t outbuf
= n
* SIZEOF_WCHAR_T
;
642 // VS: Use these instead of psz, buf because iconv() modifies its arguments:
643 wchar_t *bufPtr
= buf
;
644 const char *pszPtr
= psz
;
648 // have destination buffer, convert there
649 #ifdef WX_ICONV_TAKES_CHAR
650 cres
= iconv(m2w
, (char**)&pszPtr
, &inbuf
, (char**)&bufPtr
, &outbuf
);
652 cres
= iconv(m2w
, &pszPtr
, &inbuf
, (char**)&bufPtr
, &outbuf
);
654 res
= n
- (outbuf
/ SIZEOF_WCHAR_T
);
658 // convert to native endianness
659 WC_BSWAP(buf
/* _not_ bufPtr */, res
)
664 // no destination buffer... convert using temp buffer
665 // to calculate destination buffer requirement
669 bufPtr
= tbuf
; outbuf
= 8*SIZEOF_WCHAR_T
;
670 #ifdef WX_ICONV_TAKES_CHAR
671 cres
= iconv( m2w
, (char**)&pszPtr
, &inbuf
, (char**)&bufPtr
, &outbuf
);
673 cres
= iconv( m2w
, &pszPtr
, &inbuf
, (char**)&bufPtr
, &outbuf
);
675 res
+= 8-(outbuf
/SIZEOF_WCHAR_T
);
676 } while ((cres
==(size_t)-1) && (errno
==E2BIG
));
679 if (ICONV_FAILED(cres
, inbuf
))
681 //VS: it is ok if iconv fails, hence trace only
682 wxLogTrace(wxT("strconv"), wxT("iconv failed: %s"), wxSysErrorMsg(wxSysErrorCode()));
689 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
691 #if defined(__BORLANDC__) && (__BORLANDC__ > 0x530)
692 size_t inbuf
= std::wcslen(psz
) * SIZEOF_WCHAR_T
;
694 size_t inbuf
= ::wcslen(psz
) * SIZEOF_WCHAR_T
;
703 // need to copy to temp buffer to switch endianness
704 // this absolutely doesn't rock!
705 // (no, doing WC_BSWAP twice on the original buffer won't help, as it
706 // could be in read-only memory, or be accessed in some other thread)
707 tmpbuf
=(wchar_t*)malloc((inbuf
+1)*SIZEOF_WCHAR_T
);
708 memcpy(tmpbuf
,psz
,(inbuf
+1)*SIZEOF_WCHAR_T
);
709 WC_BSWAP(tmpbuf
, inbuf
)
715 // have destination buffer, convert there
716 #ifdef WX_ICONV_TAKES_CHAR
717 cres
= iconv( w2m
, (char**)&psz
, &inbuf
, &buf
, &outbuf
);
719 cres
= iconv( w2m
, (const char**)&psz
, &inbuf
, &buf
, &outbuf
);
725 // no destination buffer... convert using temp buffer
726 // to calculate destination buffer requirement
730 buf
= tbuf
; outbuf
= 16;
731 #ifdef WX_ICONV_TAKES_CHAR
732 cres
= iconv( w2m
, (char**)&psz
, &inbuf
, &buf
, &outbuf
);
734 cres
= iconv( w2m
, (const char**)&psz
, &inbuf
, &buf
, &outbuf
);
737 } while ((cres
==(size_t)-1) && (errno
==E2BIG
));
745 if (ICONV_FAILED(cres
, inbuf
))
747 //VS: it is ok if iconv fails, hence trace only
748 wxLogTrace(wxT("strconv"), wxT("iconv failed: %s"), wxSysErrorMsg(wxSysErrorCode()));
756 { return (m2w
!= (iconv_t
)-1) && (w2m
!= (iconv_t
)-1); }
763 #if defined(__WIN32__) && !defined(__WXMICROWIN__)
764 class CP_CharSet
: public wxCharacterSet
767 CP_CharSet(const wxChar
* name
)
768 : wxCharacterSet(name
)
770 m_CodePage
= wxCharsetToCodepage(name
);
773 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
776 MultiByteToWideChar(m_CodePage
, 0, psz
, -1, buf
, buf
? n
: 0);
777 //VS: returns # of written chars for buf!=NULL and the *size*
778 // of the needed buffer for buf==NULL
779 return len
? (buf
? len
: len
-1) : (size_t)-1;
782 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
784 size_t len
= WideCharToMultiByte(m_CodePage
, 0, psz
, -1, buf
,
785 buf
? n
: 0, NULL
, NULL
);
786 //VS: returns # of written chars for buf!=NULL and the *size*
787 // of the needed buffer for buf==NULL
788 return len
? (buf
? len
: len
-1) : (size_t)-1;
792 { return m_CodePage
!= -1; }
801 class EC_CharSet
: public wxCharacterSet
804 // temporarily just use wxEncodingConverter stuff,
805 // so that it works while a better implementation is built
806 EC_CharSet(const wxChar
* name
) : wxCharacterSet(name
),
807 enc(wxFONTENCODING_SYSTEM
)
810 enc
= wxTheFontMapper
->CharsetToEncoding(name
, FALSE
);
811 m2w
.Init(enc
, wxFONTENCODING_UNICODE
);
812 w2m
.Init(wxFONTENCODING_UNICODE
, enc
);
815 size_t MB2WC(wchar_t *buf
, const char *psz
, size_t n
)
817 size_t inbuf
= strlen(psz
);
819 m2w
.Convert(psz
,buf
);
823 size_t WC2MB(char *buf
, const wchar_t *psz
, size_t n
)
825 #if ( defined(__BORLANDC__) && (__BORLANDC__ > 0x530) ) \
826 || ( defined(__MWERKS__) && defined(__WXMSW__) )
827 size_t inbuf
= std::wcslen(psz
);
829 size_t inbuf
= ::wcslen(psz
);
832 w2m
.Convert(psz
,buf
);
838 { return (enc
!=wxFONTENCODING_SYSTEM
) && (enc
!=wxFONTENCODING_DEFAULT
); }
842 wxEncodingConverter m2w
, w2m
;
845 #endif // wxUSE_FONTMAP
847 static wxCharacterSet
*wxGetCharacterSet(const wxChar
*name
)
849 wxCharacterSet
*cset
= NULL
;
852 if (wxStricmp(name
, wxT("UTF8")) == 0 || wxStricmp(name
, wxT("UTF-8")) == 0)
854 cset
= new ID_CharSet(name
, &wxConvUTF8
);
859 cset
= new IC_CharSet(name
); // may not take NULL
864 if (cset
&& cset
->usable())
873 #if defined(__WIN32__) && !defined(__WXMICROWIN__)
874 cset
= new CP_CharSet(name
); // may take NULL
882 cset
= new EC_CharSet(name
);
885 #endif // wxUSE_FONTMAP
888 wxLogError(_("Unknown encoding '%s'!"), name
);
892 wxCSConv::wxCSConv(const wxChar
*charset
)
894 m_name
= (wxChar
*)NULL
;
895 m_cset
= (wxCharacterSet
*) NULL
;
901 wxCSConv::~wxCSConv()
907 void wxCSConv::SetName(const wxChar
*charset
)
911 m_name
= wxStrdup(charset
);
916 void wxCSConv::LoadNow()
922 wxString name
= wxLocale::GetSystemEncodingName();
927 // wxGetCharacterSet() complains about NULL name
928 m_cset
= m_name
? wxGetCharacterSet(m_name
) : NULL
;
// Multibyte-to-wide conversion for the configured character set.
//
// buf - destination buffer.
// psz - NUL-terminated multibyte input.
// n   - forwarded to the character-set object's MB2WC().
//
// The conditions that choose between delegating to m_cset and the byte-wise
// fallback, and the return of the fallback path, are not visible in this
// excerpt.
933 size_t wxCSConv::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
// LoadNow() is non-const, so the const is cast away from `this` to call it.
935 ((wxCSConv
*)this)->LoadNow(); // discard constness
// Delegate to the character-set object.
938 return m_cset
->MB2WC(buf
, psz
, n
);
// Fallback: widen the input one byte at a time.
941 size_t len
= strlen(psz
);
// The bound is c <= len, so the terminating NUL is copied as well. The cast
// through unsigned char keeps bytes >= 0x80 from being sign-extended.
// NOTE(review): the visible loop is bounded by len, not by n, and writes to
// buf unconditionally - confirm that lines not shown here guard against a
// NULL or too-small buf.
945 for (size_t c
= 0; c
<= len
; c
++)
946 buf
[c
] = (unsigned char)(psz
[c
]);
// Wide-to-multibyte conversion for the configured character set.
//
// buf - destination buffer.
// psz - NUL-terminated wide-character input.
// n   - forwarded to the character-set object's WC2MB().
//
// The conditions that choose between delegating to m_cset and the
// character-wise fallback, and the return of the fallback path, are not
// visible in this excerpt.
952 size_t wxCSConv::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
// LoadNow() is non-const, so the const is cast away from `this` to call it.
954 ((wxCSConv
*)this)->LoadNow(); // discard constness
// Delegate to the character-set object.
957 return m_cset
->WC2MB(buf
, psz
, n
);
// Fallback: the two declarations of len below differ only in how wcslen is
// qualified (std:: for the listed compilers, global namespace otherwise).
960 #if ( defined(__BORLANDC__) && (__BORLANDC__ > 0x530) ) \
961 || ( defined(__MWERKS__) && defined(__WXMSW__) )
962 size_t len
=std::wcslen(psz
);
964 size_t len
=::wcslen(psz
);
// The bound is c <= len, so the terminating NUL is copied as well. Characters
// above 0xff are replaced by '?'.
// NOTE(review): the visible loop is bounded by len, not by n, and writes to
// buf unconditionally - confirm that lines not shown here guard against a
// NULL or too-small buf.
968 for (size_t c
= 0; c
<= len
; c
++)
969 buf
[c
] = (psz
[c
] > 0xff) ? '?' : psz
[c
];
977 class IC_CharSetConverter
980 IC_CharSetConverter(IC_CharSet
*from
, IC_CharSet
*to
)
982 cnv
= iconv_open(wxConvLibc
.cWX2MB(to
->cname
),
983 wxConvLibc
.cWX2MB(from
->cname
));
986 ~IC_CharSetConverter()
988 if (cnv
!= (iconv_t
)-1)
992 size_t Convert(char *buf
, const char *psz
, size_t n
)
994 size_t inbuf
= strlen(psz
);
996 #ifdef WX_ICONV_TAKES_CHAR
997 size_t res
= iconv( cnv
, (char**)&psz
, &inbuf
, &buf
, &outbuf
);
999 size_t res
= iconv( cnv
, &psz
, &inbuf
, &buf
, &outbuf
);
1001 if (res
== (size_t)-1)
1003 return (n
- outbuf
);
1010 #endif // HAVE_ICONV_H
1012 class EC_CharSetConverter
1015 EC_CharSetConverter(EC_CharSet
* from
,EC_CharSet
* to
)
1016 { cnv
.Init(from
->enc
,to
->enc
); }
1018 size_t Convert(char* buf
, const char* psz
, size_t n
)
1020 size_t inbuf
= strlen(psz
);
1021 if (buf
) cnv
.Convert(psz
,buf
);
1026 wxEncodingConverter cnv
;
1029 #else // !wxUSE_WCHAR_T
1031 // ----------------------------------------------------------------------------
1032 // stand-ins in absence of wchar_t
1033 // ----------------------------------------------------------------------------
1035 WXDLLEXPORT_DATA(wxMBConv
) wxConvLibc
, wxConvFile
;
1037 #endif // wxUSE_WCHAR_T