]>
git.saurik.com Git - wxWidgets.git/blob - src/common/strconv.cpp
997899e769822839b58763a49ff0bdb9ed55bad8
1 /////////////////////////////////////////////////////////////////////////////
3 // Purpose: Unicode conversion classes
4 // Author: Ove Kaaven, Robert Roebling, Vadim Zeitlin
8 // Copyright: (c) 1999 Ove Kaaven, Robert Roebling, Vadim Zeitlin
9 // Licence: wxWindows license
10 /////////////////////////////////////////////////////////////////////////////
12 // ============================================================================
14 // ============================================================================
16 // ----------------------------------------------------------------------------
18 // ----------------------------------------------------------------------------
21 #pragma implementation "strconv.h"
24 // For compilers that support precompilation, includes "wx.h".
25 #include "wx/wxprec.h"
40 #include "wx/strconv.h"
42 // ----------------------------------------------------------------------------
44 // ----------------------------------------------------------------------------
46 WXDLLEXPORT_DATA(wxMBConv
*) wxConvCurrent
= &wxConvLibc
;
48 // ============================================================================
50 // ============================================================================
54 // ----------------------------------------------------------------------------
56 // ----------------------------------------------------------------------------
58 WXDLLEXPORT_DATA(wxMBConv
) wxConvLibc
;
60 size_t wxMBConv::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
62 return wxMB2WC(buf
, psz
, n
);
65 size_t wxMBConv::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
67 return wxWC2MB(buf
, psz
, n
);
70 const wxWCharBuffer
wxMBConv::cMB2WC(const char *psz
) const
74 size_t nLen
= MB2WC((wchar_t *) NULL
, psz
, 0);
75 if (nLen
== (size_t)-1)
76 return wxWCharBuffer((wchar_t *) NULL
);
77 wxWCharBuffer
buf(nLen
);
78 MB2WC((wchar_t *)(const wchar_t *) buf
, psz
, nLen
);
82 return wxWCharBuffer((wchar_t *) NULL
);
85 const wxCharBuffer
wxMBConv::cWC2MB(const wchar_t *psz
) const
89 size_t nLen
= WC2MB((char *) NULL
, psz
, 0);
90 if (nLen
== (size_t)-1)
91 return wxCharBuffer((char *) NULL
);
92 wxCharBuffer
buf(nLen
);
93 WC2MB((char *)(const char *) buf
, psz
, nLen
);
97 return wxCharBuffer((char *) NULL
);
100 // ----------------------------------------------------------------------------
101 // standard file conversion
102 // ----------------------------------------------------------------------------
104 WXDLLEXPORT_DATA(wxMBConvFile
) wxConvFile
;
106 // just use the libc conversion for now
107 size_t wxMBConvFile::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
109 return wxMB2WC(buf
, psz
, n
);
112 size_t wxMBConvFile::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
114 return wxWC2MB(buf
, psz
, n
);
117 // ----------------------------------------------------------------------------
118 // standard gdk conversion
119 // ----------------------------------------------------------------------------
123 WXDLLEXPORT_DATA(wxMBConvGdk
) wxConvGdk
;
127 size_t wxMBConvGdk::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
130 return gdk_mbstowcs((GdkWChar
*)buf
, psz
, n
);
132 GdkWChar
*nbuf
= new GdkWChar
[n
=strlen(psz
)];
133 size_t len
= gdk_mbstowcs(nbuf
, psz
, n
);
139 size_t wxMBConvGdk::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
141 char *mbstr
= gdk_wcstombs((GdkWChar
*)psz
);
142 size_t len
= mbstr
? strlen(mbstr
) : 0;
144 if (len
> n
) len
= n
;
145 memcpy(buf
, psz
, len
);
146 if (len
< n
) buf
[len
] = 0;
153 // ----------------------------------------------------------------------------
155 // ----------------------------------------------------------------------------
157 WXDLLEXPORT_DATA(wxMBConvUTF7
) wxConvUTF7
;
160 static char utf7_setD
[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
161 "abcdefghijklmnopqrstuvwxyz"
162 "0123456789'(),-./:?";
163 static char utf7_setO
[]="!\"#$%&*;<=>@[]^_`{|}";
164 static char utf7_setB
[]="ABCDEFGHIJKLMNOPQRSTUVWXYZ"
165 "abcdefghijklmnopqrstuvwxyz"
169 // TODO: write actual implementations of UTF-7 here
170 size_t wxMBConvUTF7::MB2WC(wchar_t * WXUNUSED(buf
),
171 const char * WXUNUSED(psz
),
172 size_t WXUNUSED(n
)) const
177 size_t wxMBConvUTF7::WC2MB(char * WXUNUSED(buf
),
178 const wchar_t * WXUNUSED(psz
),
179 size_t WXUNUSED(n
)) const
184 // ----------------------------------------------------------------------------
186 // ----------------------------------------------------------------------------
188 WXDLLEXPORT_DATA(wxMBConvUTF8
) wxConvUTF8
;
190 static unsigned long utf8_max
[]={0x7f,0x7ff,0xffff,0x1fffff,0x3ffffff,0x7fffffff,0xffffffff};
192 size_t wxMBConvUTF8::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
196 while (*psz
&& ((!buf
) || (len
<n
))) {
197 unsigned char cc
=*psz
++, fc
=cc
;
199 for (cnt
=0; fc
&0x80; cnt
++) fc
<<=1;
207 // invalid UTF-8 sequence
211 unsigned long res
=cc
&(0x3f>>cnt
);
214 if ((cc
&0xC0)!=0x80) {
215 // invalid UTF-8 sequence
218 res
=(res
<<6)|(cc
&0x3f);
220 if (res
<=utf8_max
[ocnt
]) {
221 // illegal UTF-8 encoding
229 if (buf
&& (len
<n
)) *buf
= 0;
233 size_t wxMBConvUTF8::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
237 while (*psz
&& ((!buf
) || (len
<n
))) {
238 unsigned long cc
=(*psz
++)&0x7fffffff;
240 for (cnt
=0; cc
>utf8_max
[cnt
]; cnt
++);
248 *buf
++=(-128>>cnt
)|((cc
>>(cnt
*6))&(0x3f>>cnt
));
250 *buf
++=0x80|((cc
>>(cnt
*6))&0x3f);
254 if (buf
&& (len
<n
)) *buf
= 0;
258 // ----------------------------------------------------------------------------
259 // specified character set
260 // ----------------------------------------------------------------------------
262 WXDLLEXPORT_DATA(wxCSConv
) wxConvLocal((const wxChar
*)NULL
);
264 #include "wx/encconv.h"
265 #include "wx/fontmap.h"
270 // temporarily just use wxEncodingConverter stuff,
271 // so that it works while a better implementation is built
273 wxEncodingConverter m2w
, w2m
;
274 wxCharacterSet(wxFontEncoding e
) : enc(e
)
276 m2w
.Init(enc
, wxFONTENCODING_UNICODE
);
277 w2m
.Init(wxFONTENCODING_UNICODE
, enc
);
281 static wxCharacterSet
*wxGetCharacterSet(const wxChar
*name
)
283 wxFontEncoding enc
= name
? wxTheFontMapper
->CharsetToEncoding(name
, FALSE
)
284 : wxFONTENCODING_SYSTEM
;
285 wxCharacterSet
*cset
= (enc
!= wxFONTENCODING_SYSTEM
) ? new wxCharacterSet(enc
)
286 : (wxCharacterSet
*)NULL
;
290 wxCSConv::wxCSConv(const wxChar
*charset
)
292 m_name
= (wxChar
*) NULL
;
293 m_cset
= (wxCharacterSet
*) NULL
;
298 wxCSConv::~wxCSConv()
300 if (m_name
) free(m_name
);
301 if (m_cset
) delete m_cset
;
304 void wxCSConv::SetName(const wxChar
*charset
)
307 m_name
= wxStrdup(charset
);
312 void wxCSConv::LoadNow()
314 // wxPrintf(wxT("Conversion request\n"));
318 wxChar
*lang
= wxGetenv(wxT("LC_ALL"));
319 if (!lang
) lang
= wxGetenv(wxT("LANG"));
320 wxChar
*dot
= lang
? wxStrchr(lang
, wxT('.')) : (wxChar
*)NULL
;
321 if (dot
) SetName(dot
+1);
324 m_cset
= wxGetCharacterSet(m_name
);
329 size_t wxCSConv::MB2WC(wchar_t *buf
, const char *psz
, size_t n
) const
331 ((wxCSConv
*)this)->LoadNow(); // discard constness
334 m_cset
->m2w
.Convert(psz
, buf
);
337 for (size_t c
=0; c
<n
; c
++)
338 buf
[c
] = (unsigned char)(psz
[c
]);
345 size_t wxCSConv::WC2MB(char *buf
, const wchar_t *psz
, size_t n
) const
347 ((wxCSConv
*)this)->LoadNow(); // discard constness
350 m_cset
->w2m
.Convert(psz
, buf
);
353 for (size_t c
=0; c
<n
; c
++)
354 buf
[c
] = (psz
[c
]>0xff) ? '?' : psz
[c
];
358 #if defined(__BORLANDC__) && (__BORLANDC__ > 0x530)
359 return std::wcslen(psz
);
361 return ::wcslen(psz
);
365 #else // !wxUSE_WCHAR_T
367 // ----------------------------------------------------------------------------
368 // stand-ins in absence of wchar_t
369 // ----------------------------------------------------------------------------
371 WXDLLEXPORT_DATA(wxMBConv
) wxConvLibc
, wxConvFile
;
373 #endif // wxUSE_WCHAR_T