git.saurik.com Git - wxWidgets.git/blame_incremental

... / ...

Commit	Line	Data
	1	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
	2	%% Name: mbconv.tex
	3	%% Purpose: wxMBConv documentation
	4	%% Author: Ove Kaaven, Vadim Zeitlin
	5	%% Created: 2000-03-25
	6	%% RCS-ID: $Id$
	7	%% Copyright: (c) 2000 Ove Kaaven
	8	%% (c) 2003-2006 Vadim Zeitlin
	9	%% License: wxWindows license
	10	%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
	11
	12
	13	\section{\class{wxMBConv}}\label{wxmbconv}
	14
	15	This class is the base class of a hierarchy of classes capable of converting
	16	text strings between multibyte (SBCS or DBCS) encodings and Unicode.
	17
	18	In the documentation for this and related classes please notice that the
	19	\emph{length} of the string refers to the number of characters in the string
	20	not counting the terminating \NUL, if any, while the \emph{size} of the string
	21	is the total number of bytes in the string, including any trailing \NUL.
	22	Thus, the length of the wide character string \texttt{L"foo"} is $3$ while its
	23	size can be either $8$ or $16$ depending on whether \texttt{wchar\_t} is $2$
	24	bytes (as under Windows) or $4$ (Unix).
	25
	26	\wxheading{Global variables}
	27
	28	There are several predefined instances of this class:
	29	\begin{twocollist}
	30	\twocolitem{\textbf{wxConvLibc}}{Uses the standard ANSI C \texttt{mbstowcs()} and
	31	\texttt{wcstombs()} functions to perform the conversions; thus depends on the
	32	current locale.}
	33	\twocolitem{\textbf{wxConvLocal}}{Another conversion corresponding to the
	34	current locale but this one uses the best available conversion.}
	35	\twocolitem{\textbf{wxConvUI}}{The conversion used for the standard UI elements
	36	such as menu items and buttons. This is a pointer which is initially set to
	37	\texttt{wxConvLocal} as the program uses the current locale by default but can
	38	be set to some specific conversion if the program needs to use a specific
	39	encoding for its UI.}
	40	\twocolitem{\textbf{wxConvISO8859\_1}}{Conversion to and from ISO-8859-1 (Latin I)
	41	encoding.}
	42	\twocolitem{\textbf{wxConvUTF8}}{Conversion to and from UTF-8 encoding.}
	43	\twocolitem{\textbf{wxConvFile}}{The appropriate conversion for the file names,
	44	depends on the system.}
	45	% \twocolitem{\textbf{wxConvCurrent}}{Not really clear what is it for...}
	46	\end{twocollist}
	47
	48
	49	\wxheading{Constants}
	50
	51	\texttt{wxCONV\_FAILED} value is defined as \texttt{(size\_t)$-1$} and is
	52	returned by the conversion functions instead of the length of the converted
	53	string if the conversion fails.
	54
	55
	56	\wxheading{Derived from}
	57
	58	No base class
	59
	60	\wxheading{Include files}
	61
	62	<wx/strconv.h>
	63
	64	\wxheading{Library}
	65
	66	\helpref{wxBase}{librarieslist}
	67
	68	\wxheading{See also}
	69
	70	\helpref{wxCSConv}{wxcsconv},
	71	\helpref{wxEncodingConverter}{wxencodingconverter},
	72	\helpref{wxMBConv classes overview}{mbconvclasses}
	73
	74
	75	\latexignore{\rtfignore{\wxheading{Members}}}
	76
	77
	78	\membersection{wxMBConv::wxMBConv}\label{wxmbconvwxmbconv}
	79
	80	\func{}{wxMBConv}{\void}
	81
	82	Trivial default constructor.
	83
	84
	85	\membersection{wxMBConv::Clone}\label{wxmbconvclone}
	86
	87	\constfunc{virtual wxMBConv *}{Clone}{\void}
	88
	89	This pure virtual function is overridden in each of the derived classes to
	90	return a new copy of the object it is called on. It is used for copying the
	91	conversion objects while preserving their dynamic type.
	92
	93
	94	\membersection{wxMBConv::MB2WC}\label{wxmbconvmb2wc}
	95
	96	\constfunc{virtual size\_t}{MB2WC}{\param{wchar\_t *}{out}, \param{const char *}{in}, \param{size\_t }{outLen}}
	97
	98	\deprecated{\helpref{ToWChar}{wxmbconvtowchar}}
	99
	100	Converts from a string \arg{in} in multibyte encoding to Unicode putting up to
	101	\arg{outLen} characters into the buffer \arg{out}.
	102
	103	If \arg{out} is \NULL, only the length of the string which would result from
	104	the conversion is calculated and returned. Note that this is the length and not
	105	the size, i.e. the returned value does \emph{not} include the trailing \NUL. But
	106	when the function is called with a non-\NULL \arg{out} buffer, the \arg{outLen}
	107	parameter should be one more than that length so that the string can be properly \NUL-terminated.
	108
	109	\wxheading{Parameters}
	110
	111	\docparam{out}{The output buffer, may be \NULL if the caller is only
	112	interested in the length of the resulting string}
	113
	114	\docparam{in}{The \NUL-terminated input string, cannot be \NULL}
	115
	116	\docparam{outLen}{The length of the output buffer, \emph{including} the
	117	trailing \NUL; ignored if \arg{out} is \NULL}
	118
	119	\wxheading{Return value}
	120
	121	The length of the converted string \emph{excluding} the trailing \NUL.
	122
	123
	124	\membersection{wxMBConv::WC2MB}\label{wxmbconvwc2mb}
	125
	126	\constfunc{virtual size\_t}{WC2MB}{\param{char* }{buf}, \param{const wchar\_t* }{psz}, \param{size\_t }{n}}
	127
	128	\deprecated{\helpref{FromWChar}{wxmbconvfromwchar}}
	129
	130	Converts from Unicode to multibyte encoding. The semantics of this function
	131	(including the return value meaning) is the same as for
	132	\helpref{MB2WC}{wxmbconvmb2wc}.
	133
	134	Notice that when the function is called with a non-\NULL buffer, the
	135	\arg{n} parameter should be the size of the buffer and so it \emph{should} take
	136	into account the trailing \NUL, which might take two or four bytes for some
	137	encodings (UTF-16 and UTF-32) and not one.
	138
	139
	140	\membersection{wxMBConv::cMB2WC}\label{wxmbconvcmb2wc}
	141
	142	\constfunc{const wxWCharBuffer}{cMB2WC}{\param{const char *}{in}}
	143
	144	\constfunc{const wxWCharBuffer}{cMB2WC}{\param{const char *}{in}, \param{size\_t }{inLen}, \param{size\_t }{*outLen}}
	145
	146	Converts from multibyte encoding to Unicode by calling
	147	\helpref{MB2WC}{wxmbconvmb2wc}, allocating a temporary wxWCharBuffer to hold
	148	the result.
	149
	150	The first overload takes a \NUL-terminated input string. The second one takes a
	151	string of exactly the specified length and the string may or may not include the
	152	trailing \NUL character(s). If the string is not \NUL-terminated, a temporary
	153	\NUL-terminated copy of it suitable for passing to \helpref{MB2WC}{wxmbconvmb2wc}
	154	is made, so it is more efficient to ensure that the string does have the
	155	appropriate number of \NUL bytes (which is usually $1$ but may be $2$ or $4$
	156	for UTF-16 or UTF-32, see \helpref{GetMBNulLen}{wxmbconvgetmbnullen}),
	157	especially for long strings.
	158
	159	If \arg{outLen} is not \NULL, it receives the length of the converted
	160	string.
	161
	162
	163	\membersection{wxMBConv::cWC2MB}\label{wxmbconvcwc2mb}
	164
	165	\constfunc{const wxCharBuffer}{cWC2MB}{\param{const wchar\_t* }{in}}
	166
	167	\constfunc{const wxCharBuffer}{cWC2MB}{\param{const wchar\_t* }{in}, \param{size\_t }{inLen}, \param{size\_t }{*outLen}}
	168
	169	Converts from Unicode to multibyte encoding by calling WC2MB,
	170	allocating a temporary wxCharBuffer to hold the result.
	171
	172	The second overload of this function allows converting a string of the given
	173	length \arg{inLen}, whether it is \NUL-terminated or not (for wide character
	174	strings, unlike for the multibyte ones, a single \NUL is always enough).
	175	But notice that just as with \helpref{cMB2WC}{wxmbconvcmb2wc}, it is more
	176	efficient to pass an already terminated string to this function as otherwise a
	177	copy is made internally.
	178
	179	If \arg{outLen} is not \NULL, it receives the length of the converted
	180	string.
	181
	182
	183	\membersection{wxMBConv::cMB2WX}\label{wxmbconvcmb2wx}
	184
	185	\constfunc{const char*}{cMB2WX}{\param{const char* }{psz}}
	186
	187	\constfunc{const wxWCharBuffer}{cMB2WX}{\param{const char* }{psz}}
	188
	189	Converts from multibyte encoding to the current wxChar type
	190	(which depends on whether wxUSE\_UNICODE is set to 1). If wxChar is char,
	191	it returns the parameter unaltered. If wxChar is wchar\_t, it returns the
	192	result in a wxWCharBuffer. The macro wxMB2WXbuf is defined as the correct
	193	return type (without const).
	194
	195
	196	\membersection{wxMBConv::cWX2MB}\label{wxmbconvcwx2mb}
	197
	198	\constfunc{const char*}{cWX2MB}{\param{const wxChar* }{psz}}
	199
	200	\constfunc{const wxCharBuffer}{cWX2MB}{\param{const wxChar* }{psz}}
	201
	202	Converts from the current wxChar type to multibyte encoding. If wxChar is char,
	203	it returns the parameter unaltered. If wxChar is wchar\_t, it returns the
	204	result in a wxCharBuffer. The macro wxWX2MBbuf is defined as the correct
	205	return type (without const).
	206
	207
	208	\membersection{wxMBConv::cWC2WX}\label{wxmbconvcwc2wx}
	209
	210	\constfunc{const wchar\_t*}{cWC2WX}{\param{const wchar\_t* }{psz}}
	211
	212	\constfunc{const wxCharBuffer}{cWC2WX}{\param{const wchar\_t* }{psz}}
	213
	214	Converts from Unicode to the current wxChar type. If wxChar is wchar\_t,
	215	it returns the parameter unaltered. If wxChar is char, it returns the
	216	result in a wxCharBuffer. The macro wxWC2WXbuf is defined as the correct
	217	return type (without const).
	218
	219
	220	\membersection{wxMBConv::cWX2WC}\label{wxmbconvcwx2wc}
	221
	222	\constfunc{const wchar\_t*}{cWX2WC}{\param{const wxChar* }{psz}}
	223
	224	\constfunc{const wxWCharBuffer}{cWX2WC}{\param{const wxChar* }{psz}}
	225
	226	Converts from the current wxChar type to Unicode. If wxChar is wchar\_t,
	227	it returns the parameter unaltered. If wxChar is char, it returns the
	228	result in a wxWCharBuffer. The macro wxWX2WCbuf is defined as the correct
	229	return type (without const).
	230
	231
	232	\membersection{wxMBConv::FromWChar}\label{wxmbconvfromwchar}
	233
	234	\constfunc{virtual size\_t}{FromWChar}{\param{char *}{dst}, \param{size\_t }{dstLen}, \param{const wchar\_t *}{src}, \param{size\_t }{srcLen = wxNO\_LEN}}
	235
	236	This function has the same semantics as \helpref{ToWChar}{wxmbconvtowchar}
	237	except that it converts a wide string to multibyte one.
	238
	239	\membersection{wxMBConv::GetMaxMBNulLen}\label{wxmbconvgetmaxmbnullen}
	240
	241	\func{const size\_t}{GetMaxMBNulLen}{\void}
	242
	243	Returns the maximal value which can be returned by
	244	\helpref{GetMBNulLen}{wxmbconvgetmbnullen} for any conversion object. Currently
	245	this value is $4$.
	246
	247	This method can be used to allocate the buffer with enough space for the
	248	trailing \NUL characters for any encoding.
	249
	250
	251	\membersection{wxMBConv::GetMBNulLen}\label{wxmbconvgetmbnullen}
	252
	253	\constfunc{size\_t}{GetMBNulLen}{\void}
	254
	255	This function returns $1$ for most of the multibyte encodings in which the
	256	string is terminated by a single \NUL, $2$ for UTF-16 and $4$ for UTF-32 for
	257	which the string is terminated with $2$ and $4$ \NUL characters respectively.
	258	The other cases are not currently supported and \texttt{wxCONV\_FAILED}
	259	(defined as \texttt{(size\_t)$-1$}) is returned for them.
	260
	261
	262	\membersection{wxMBConv::ToWChar}\label{wxmbconvtowchar}
	263
	264	\constfunc{virtual size\_t}{ToWChar}{\param{wchar\_t *}{dst}, \param{size\_t }{dstLen}, \param{const char *}{src}, \param{size\_t }{srcLen = wxNO\_LEN}}
	265
	266	The most general function for converting a multibyte string to a wide string.
	267	The main case is when \arg{dst} is not \NULL and \arg{srcLen} is not
	268	\texttt{wxNO\_LEN} (which is defined as \texttt{(size\_t)$-1$}): then
	269	the function converts exactly \arg{srcLen} bytes starting at \arg{src} into
	270	a wide string which it outputs to \arg{dst}. If the length of the resulting wide
	271	string is greater than \arg{dstLen}, an error is returned. Note that if
	272	\arg{srcLen} bytes don't include \NUL characters, the resulting wide string is
	273	not \NUL-terminated either.
	274
	275	If \arg{srcLen} is \texttt{wxNO\_LEN}, the function supposes that the string is
	276	properly (i.e. as necessary for the encoding handled by this conversion)
	277	\NUL-terminated and converts the entire string, including any trailing \NUL
	278	bytes. In this case the wide string is also \NUL-terminated.
	279
	280	Finally, if \arg{dst} is \NULL, the function returns the length of the needed
	281	buffer.
	282
	283	\wxheading{Return value}
	284
	285	The number of characters written to \arg{dst} (or the number of characters
	286	which would have been written to it if it were non-\NULL) on success or
	287	\texttt{wxCONV\_FAILED} on error.
	288
	289