Commit | Line | Data |
---|---|---|
c958260b VS |
1 | % |
2 | % automatically generated by HelpGen from | |
3 | % encconv.h at 30/Dec/99 18:45:16 | |
4 | % | |
5 | ||
c958260b VS |
6 | \section{\class{wxEncodingConverter}}\label{wxencodingconverter} |
7 | ||
a663cce7 | 8 | This class is capable of converting strings between two |
457e6c54 | 9 | 8-bit encodings/charsets. It can also convert from/to Unicode (but only |
1599f54e JS |
10 | if you compiled wxWidgets with wxUSE\_WCHAR\_T set to 1). Only a limited subset |
11 | of encodings is supported by wxEncodingConverter: | |
a663cce7 VS |
12 | {\tt wxFONTENCODING\_ISO8859\_1..15}, {\tt wxFONTENCODING\_CP1250..1257} and |
13 | {\tt wxFONTENCODING\_KOI8}. | |
14 | ||
15 | \wxheading{Note} | |
16 | ||
17 | Please use \helpref{wxMBConv classes}{mbconvclasses} instead | |
18 | if possible. \helpref{wxCSConv}{wxcsconv} has much better support for various | |
19 | encodings than wxEncodingConverter. wxEncodingConverter is useful only | |
20 | if you rely on {\tt wxCONVERT\_SUBSTITUTE} mode of operation (see | |
21 | \helpref{Init}{wxencodingconverterinit}). | |
c958260b | 22 | |
c958260b VS |
23 | \wxheading{Derived from} |
24 | ||
25 | \helpref{wxObject}{wxobject} | |
26 | ||
9704b250 VS |
27 | \wxheading{Include files} |
28 | ||
29 | <wx/encconv.h> | |
30 | ||
04a4a2af VS |
31 | \wxheading{See also} |
32 | ||
33 | \helpref{wxFontMapper}{wxfontmapper}, | |
f6bcfd97 | 34 | \helpref{wxMBConv}{wxmbconv}, |
04a4a2af VS |
35 | \helpref{Writing non-English applications}{nonenglishoverview} |
36 | ||
37 | ||
c958260b VS |
38 | \latexignore{\rtfignore{\wxheading{Members}}} |
39 | ||
5bc97d1b | 40 | |
c958260b VS |
41 | \membersection{wxEncodingConverter::wxEncodingConverter}\label{wxencodingconverterwxencodingconverter} |
42 | ||
43 | \func{}{wxEncodingConverter}{\void} | |
44 | ||
45 | Constructor. | |
46 | ||
5bc97d1b | 47 | |
c958260b VS |
48 | \membersection{wxEncodingConverter::Init}\label{wxencodingconverterinit} |
49 | ||
50 | \func{bool}{Init}{\param{wxFontEncoding }{input\_enc}, \param{wxFontEncoding }{output\_enc}, \param{int }{method = wxCONVERT\_STRICT}} | |
51 | ||
2edb0bde | 52 | Initialize conversion. Both output or input encoding may |
c958260b VS |
53 | be wxFONTENCODING\_UNICODE, but only if wxUSE\_ENCODING is set to 1. |
54 | All subsequent calls to \helpref{Convert()}{wxencodingconverterconvert} | |
457e6c54 JS |
55 | will interpret its argument |
56 | as a string in {\it input\_enc} encoding and will output string in | |
c958260b VS |
57 | {\it output\_enc} encoding. |
58 | You must call this method before calling Convert. You may call | |
59 | it more than once in order to switch to another conversion. | |
60 | {\it Method} affects behaviour of Convert() in case input character | |
61 | cannot be converted because it does not exist in output encoding: | |
62 | ||
457e6c54 | 63 | \begin{twocollist}\itemsep=0pt |
c958260b | 64 | \twocolitem{{\bf wxCONVERT\_STRICT}}{follow behaviour of GNU Recode - |
f6bcfd97 | 65 | just copy unconvertible characters to output and don't change them |
c958260b VS |
66 | (its integer value will stay the same)} |
67 | \twocolitem{{\bf wxCONVERT\_SUBSTITUTE}}{try some (lossy) substitutions | |
f6bcfd97 | 68 | - e.g. replace unconvertible latin capitals with acute by ordinary |
c958260b VS |
69 | capitals, replace en-dash or em-dash by '-' etc.} |
70 | \end{twocollist} | |
71 | ||
f6bcfd97 | 72 | Both modes guarantee that output string will have same length |
c958260b VS |
73 | as input string. |
74 | ||
75 | \wxheading{Return value} | |
76 | ||
cc81d32f | 77 | false if given conversion is impossible, true otherwise |
c958260b | 78 | (conversion may be impossible either if you try to convert |
fc2171bd | 79 | to Unicode with non-Unicode build of wxWidgets or if input |
c958260b VS |
80 | or output encoding is not supported.) |
81 | ||
5bc97d1b VZ |
82 | |
83 | \membersection{wxEncodingConverter::CanConvert}\label{wxencodingconvertercanconvert} | |
84 | ||
1599f54e | 85 | \func{static bool}{CanConvert}{\param{wxFontEncoding }{encIn}, \param{wxFontEncoding }{encOut}} |
5bc97d1b VZ |
86 | |
87 | Return true if (any text in) multibyte encoding \arg{encIn} can be converted to | |
b325f27f | 88 | another one ({\it encOut}) losslessly. |
5bc97d1b VZ |
89 | |
90 | Do not call this method with \texttt{wxFONTENCODING\_UNICODE} as either | |
91 | parameter, it doesn't make sense (always works in one sense and always depends | |
92 | on the text to convert in the other). | |
93 | ||
94 | ||
c958260b VS |
95 | \membersection{wxEncodingConverter::Convert}\label{wxencodingconverterconvert} |
96 | ||
02c92ad9 | 97 | \constfunc{bool}{Convert}{\param{const char* }{input}, \param{char* }{output}} |
7a766dcd | 98 | |
02c92ad9 | 99 | \constfunc{bool}{Convert}{\param{const wchar\_t* }{input}, \param{wchar\_t* }{output}} |
7a766dcd | 100 | |
02c92ad9 | 101 | \constfunc{bool}{Convert}{\param{const char* }{input}, \param{wchar\_t* }{output}} |
7a766dcd | 102 | |
02c92ad9 | 103 | \constfunc{bool}{Convert}{\param{const wchar\_t* }{input}, \param{char* }{output}} |
7a766dcd VS |
104 | |
105 | Convert input string according to settings passed to | |
106 | \helpref{Init}{wxencodingconverterinit} and writes the result to {\it output}. | |
107 | ||
02c92ad9 | 108 | \constfunc{bool}{Convert}{\param{char* }{str}} |
7a766dcd | 109 | |
02c92ad9 | 110 | \constfunc{bool}{Convert}{\param{wchar\_t* }{str}} |
7a766dcd VS |
111 | |
112 | Convert input string according to settings passed to | |
113 | \helpref{Init}{wxencodingconverterinit} in-place, i.e. write the result to the | |
114 | same memory area. | |
115 | ||
02c92ad9 VS |
116 | All of the versions above return \true if the conversion was lossless and |
117 | \false if at least one of the characters couldn't be converted and was replaced | |
118 | with {\tt '?'} in the output. Note that if {\tt wxCONVERT\_SUBSTITUTE} was | |
119 | passed to \helpref{Init}{wxencodingconverterinit}, substitution is considered | |
120 | lossless operation. | |
121 | ||
57c5293e | 122 | \constfunc{wxString}{Convert}{\param{const wxString\& }{input}} |
c958260b | 123 | |
7a766dcd | 124 | Convert wxString and return new wxString object. |
c958260b | 125 | |
7a766dcd | 126 | \wxheading{Notes} |
c958260b | 127 | |
7a766dcd | 128 | You must call \helpref{Init}{wxencodingconverterinit} before using this method! |
5b5d025c | 129 | |
fc2171bd | 130 | {\tt wchar\_t} versions of the method are not available if wxWidgets was compiled |
7a766dcd | 131 | with {\tt wxUSE\_WCHAR\_T} set to 0. |
c958260b | 132 | |
5bc97d1b | 133 | |
c958260b VS |
134 | \membersection{wxEncodingConverter::GetPlatformEquivalents}\label{wxencodingconvertergetplatformequivalents} |
135 | ||
5b5d025c | 136 | \func{static wxFontEncodingArray}{GetPlatformEquivalents}{\param{wxFontEncoding }{enc}, \param{int }{platform = wxPLATFORM\_CURRENT}} |
c958260b VS |
137 | |
138 | Return equivalents for given font that are used | |
139 | under given platform. Supported platforms: | |
140 | ||
457e6c54 | 141 | \begin{itemize}\itemsep=0pt |
c958260b VS |
142 | \item wxPLATFORM\_UNIX |
143 | \item wxPLATFORM\_WINDOWS | |
144 | \item wxPLATFORM\_OS2 | |
145 | \item wxPLATFORM\_MAC | |
146 | \item wxPLATFORM\_CURRENT | |
147 | \end{itemize} | |
148 | ||
2edb0bde | 149 | wxPLATFORM\_CURRENT means the platform this binary was compiled for. |
c958260b VS |
150 | |
151 | Examples: | |
457e6c54 | 152 | |
c958260b VS |
153 | \begin{verbatim} |
154 | current platform enc returned value | |
155 | ---------------------------------------------- | |
156 | unix CP1250 {ISO8859_2} | |
157 | unix ISO8859_2 {ISO8859_2} | |
158 | windows ISO8859_2 {CP1250} | |
159 | unix CP1252 {ISO8859_1,ISO8859_15} | |
160 | \end{verbatim} | |
161 | ||
162 | Equivalence is defined in terms of convertibility: | |
f6bcfd97 BP |
163 | two encodings are equivalent if you can convert text between |
164 | then without losing information (it may - and will - happen | |
165 | that you lose special chars like quotation marks or em-dashes | |
166 | but you shouldn't lose any diacritics and language-specific | |
c958260b VS |
167 | characters when converting between equivalent encodings). |
168 | ||
169 | Remember that this function does {\bf NOT} check for presence of | |
170 | fonts in system. It only tells you what are most suitable | |
171 | encodings. (It usually returns only one encoding.) | |
172 | ||
173 | \wxheading{Notes} | |
174 | ||
457e6c54 JS |
175 | \begin{itemize}\itemsep=0pt |
176 | \item Note that argument {\it enc} itself may be present in the returned array, | |
f6bcfd97 | 177 | so that you can, as a side-effect, detect whether the |
457e6c54 | 178 | encoding is native for this platform or not. |
f6bcfd97 BP |
179 | \item \helpref{Convert}{wxencodingconverterconvert} is not limited to |
180 | converting between equivalent encodings, it can convert between two arbitrary | |
181 | encodings. | |
182 | \item If {\it enc} is present in the returned array, then it is {\bf always} the first | |
5b5d025c | 183 | item of it. |
f6bcfd97 | 184 | \item Please note that the returned array may contain no items at all. |
c958260b VS |
185 | \end{itemize} |
186 | ||
5bc97d1b | 187 | |
c958260b VS |
188 | \membersection{wxEncodingConverter::GetAllEquivalents}\label{wxencodingconvertergetallequivalents} |
189 | ||
5b5d025c | 190 | \func{static wxFontEncodingArray}{GetAllEquivalents}{\param{wxFontEncoding }{enc}} |
c958260b VS |
191 | |
192 | Similar to | |
193 | \helpref{GetPlatformEquivalents}{wxencodingconvertergetplatformequivalents}, | |
194 | but this one will return ALL | |
f6bcfd97 | 195 | equivalent encodings, regardless of the platform, and including itself. |
c958260b | 196 | |
5b5d025c VS |
197 | This platform's encodings are before others in the array. And again, if {\it enc} is in the array, |
198 | it is the very first item in it. | |
457e6c54 | 199 |