[wxWidgets.git] / interface / strconv.h

/////////////////////////////////////////////////////////////////////////////
// Name:        strconv.h
// Purpose:     interface of wxMBConvUTF7
// Author:      wxWidgets team
// RCS-ID:      $Id$
// Licence:     wxWindows license
/////////////////////////////////////////////////////////////////////////////

/**
    @class wxMBConv
    @wxheader{strconv.h}

    This class is the base class of a hierarchy of classes capable of
    converting text strings between multibyte (SBCS or DBCS) encodings and
    Unicode.

    This is an abstract base class which defines the operations implemented by
    all different conversion classes. The derived classes don't add any new
    operations of their own (except, possibly, some non-default constructors)
    and so you should simply use this class ToWChar() and FromWChar() (or
    cMB2WC() and cWC2MB()) methods with the objects of the derived class.

    In the documentation for this and related classes please notice that
    length of the string refers to the number of characters in the string
    not counting the terminating @c NUL, if any. While the size of the string
    is the total number of bytes in the string, including any trailing @c NUL.
    Thus, length of wide character string @c L"foo" is 3 while its size can
    be either 8 or 16 depending on whether @c wchar_t is 2 bytes (as
    under Windows) or 4 (Unix).

    @library{wxbase}
    @category{conv}

    @see wxCSConv, wxEncodingConverter, @ref overview_mbconv "wxMBConv classes overview"
*/
class wxMBConv
{
public:
    /**
        Trivial default constructor.
    */
    wxMBConv();

    /**
        This pure virtual function is overridden in each of the derived classes
        to return a new copy of the object it is called on.

        It is used for copying the conversion objects while preserving their
        dynamic type.
    */
    virtual wxMBConv* Clone() const = 0;

    /**
        This function returns 1 for most of the multibyte encodings in which the
        string is terminated by a single @c NUL, 2 for UTF-16 and 4 for UTF-32 for
        which the string is terminated with 2 and 4 @c NUL characters respectively.
        The other cases are not currently supported and @c wxCONV_FAILED
        (defined as -1) is returned for them.
    */
    size_t GetMBNulLen() const;

    /**
        Returns the maximal value which can be returned by GetMBNulLen() for
        any conversion object.

        Currently this value is 4.

        This method can be used to allocate the buffer with enough space for the
        trailing @c NUL characters for any encoding.
    */
    const size_t GetMaxMBNulLen();

    /**
        Convert multibyte string to a wide character one.

        This is the most general function for converting a multibyte string to
        a wide string, cMB2WC() may be often more convenient, however this
        function is the most efficient one as it allows to avoid any
        unnecessary copying.

        The main case is when @a dst is not @NULL and @a srcLen is not
        @c wxNO_LEN (which is defined as @c (size_t)-1): then the function
        converts exactly @a srcLen bytes starting at @a src into wide string
        which it output to @e dst. If the length of the resulting wide
        string is greater than @e dstLen, an error is returned. Note that if
        @a srcLen bytes don't include @c NUL characters, the resulting wide
        string is not @c NUL-terminated neither.

        If @a srcLen is @c wxNO_LEN, the function supposes that the string is
        properly (i.e. as necessary for the encoding handled by this
        conversion) @c NUL-terminated and converts the entire string, including
        any trailing @c NUL bytes. In this case the wide string is also @c
        NUL-terminated.

        Finally, if @a dst is @NULL, the function returns the length of the
        needed buffer.

        Example of use of this function:
        @code
        size_t dstLen = conv.ToWChar(NULL, 0, src);
        if ( dstLen == wxCONV_FAILED )
            ... handle error ...
        wchar_t *dst = new wchar_t[dstLen];
        if ( conv.ToWChar(dst, dstLen, src) == wxCONV_FAILED )
            ... handle error ...
        @endcode

        Notice that when passing the explicit source length the output will
        @e not be @c NUL terminated if you pass @c strlen(str) as parameter.
        Either leave @a srcLen as default @c wxNO_LEN or add one to @c strlen
        result if you want the output to be @c NUL terminated.

        @param dst
            Pointer to output buffer of the size of at least @a dstLen or @NULL.
        @param dstLen
            Maximal number of characters to be written to the output buffer if
            @dst is non-@NULL, unused otherwise.
        @param src
            Point to the source string, must not be @NULL.
        @param
            The number of characters of the source string to convert or @c
            wxNO_LEN (default parameter) to convert everything up to and
            including the terminating @c NUL character(s).
        @return
            The number of character written (or which would have been written
            if it were non-@NULL) to @a dst or @c wxCONV_FAILED on error.
    */
    virtual size_t ToWChar(wchar_t* dst, size_t dstLen,
                           const char* src,
                           size_t srcLen = wxNO_LEN) const;

    /**
        Converts wide character string to multibyte.

        This function has the same semantics as ToWChar() except that it
        converts a wide string to multibyte one. As with ToWChar(), it may be
        more convenient to use cWC2MB() when working with @c NUL terminated
        strings.

        @param dst
            Pointer to output buffer of the size of at least @a dstLen or @NULL.
        @param dstLen
            Maximal number of characters to be written to the output buffer if
            @dst is non-@NULL, unused otherwise.
        @param src
            Point to the source string, must not be @NULL.
        @param
            The number of characters of the source string to convert or @c
            wxNO_LEN (default parameter) to convert everything up to and
            including the terminating @c NUL character.
        @return
            The number of character written (or which would have been written
            if it were non-@NULL) to @a dst or @c wxCONV_FAILED on error.
    */
    virtual size_t FromWChar(char* dst, size_t dstLen,
                             const wchar_t* src,
                             size_t srcLen = wxNO_LEN) const;

    //@{
    /**
        Converts from multibyte encoding to Unicode by calling MB2WC() and
        allocating a temporary wxWCharBuffer to hold the result.

        The first overload takes a @c NUL-terminated input string. The second
        one takes a string of exactly the specified length and the string may
        include or not the trailing @c NUL character(s). If the string is not
        @c NUL-terminated, a temporary @c NUL-terminated copy of it suitable
        for passing to wxMBConv::MB2WC is made, so it is more efficient to
        ensure that the string is does have the appropriate number of @c NUL
        bytes (which is usually 1 but may be 2 or 4 for UTF-16 or UTF-32, see
        wxMBConv::GetMBNulLen), especially for long strings.

        If @a outLen is not-@NULL, it receives the length of the converted
        string.
    */
    const wxWCharBuffer cMB2WC(const char* in) const;
    const wxWCharBuffer cMB2WC(const char* in, size_t inLen, size_t *outLen) const;
    //@}

    //@{
    /**
        Converts from multibyte encoding to the current wxChar type (which
        depends on whether wxUSE_UNICODE is set to 1).

        If wxChar is char, it returns the parameter unaltered. If wxChar is
        wchar_t, it returns the result in a wxWCharBuffer. The macro wxMB2WXbuf
        is defined as the correct return type (without const).
    */
    const char* cMB2WX(const char* psz) const;
    const wxWCharBuffer cMB2WX(const char* psz) const;
    //@}

    //@{
    /**
        Converts from Unicode to multibyte encoding by calling WC2MB and
        allocating a temporary wxCharBuffer to hold the result.

        The second overload of this function allows to convert a string of the
        given length @e inLen, whether it is @c NUL-terminated or not (for wide
        character strings, unlike for the multibyte ones, a single @c NUL is
        always enough). But notice that just as with @ref wxMBConv::mb2wc
        cMB2WC, it is more efficient to pass an already terminated string to
        this function as otherwise a copy is made internally. If @a outLen is
        not-@NULL, it receives the length of the converted string.
    */
    const wxCharBuffer cWC2MB(const wchar_t* in) const;
    const wxCharBuffer cWC2MB(const wchar_t* in, size_t inLen, size_t *outLen) const;
    //@}

    //@{
    /**
        Converts from Unicode to the current wxChar type.

        If wxChar is wchar_t, it returns the parameter unaltered. If wxChar is
        char, it returns the result in a wxCharBuffer. The macro wxWC2WXbuf is
        defined as the correct return type (without const).
    */
    const wchar_t* cWC2WX(const wchar_t* psz) const;
    const wxCharBuffer cWC2WX(const wchar_t* psz) const;
    //@}

    //@{
    /**
        Converts from the current wxChar type to multibyte encoding.

        If wxChar is char, it returns the parameter unaltered. If wxChar is
        wchar_t, it returns the result in a wxCharBuffer. The macro wxWX2MBbuf
        is defined as the correct return type (without const).
    */
    const char* cWX2MB(const wxChar* psz) const;
    const wxCharBuffer cWX2MB(const wxChar* psz) const;
    //@}

    //@{
    /**
        Converts from the current wxChar type to Unicode.

        If wxChar is wchar_t, it returns the parameter unaltered. If wxChar is
        char, it returns the result in a wxWCharBuffer. The macro wxWX2WCbuf is
        defined as the correct return type (without const).
    */
    const wchar_t* cWX2WC(const wxChar* psz) const;
    const wxWCharBuffer cWX2WC(const wxChar* psz) const;
    //@}

    /**
        @deprecated This function is deprecated, please use ToWChar() instead.

        Converts from a string @a in in multibyte encoding to Unicode putting up to
        @a outLen characters into the buffer @e out.

        If @a out is @NULL, only the length of the string which would result
        from the conversion is calculated and returned. Note that this is the
        length and not size, i.e. the returned value does not include the
        trailing @c NUL. But when the function is called with a non-@NULL @a
        out buffer, the @a outLen parameter should be one more to allow to
        properly @c NUL-terminate the string.

        @param out
            The output buffer, may be @NULL if the caller is only
            interested in the length of the resulting string
        @param in
            The NUL-terminated input string, cannot be @NULL
        @param outLen
            The length of the output buffer but including
            NUL, ignored if out is @NULL

        @return The length of the converted string excluding the trailing NUL.
    */
    virtual size_t MB2WC(wchar_t* out, const char* in, size_t outLen) const;

    /**
        @deprecated This function is deprecated, please use FromWChar() instead.

        Converts from Unicode to multibyte encoding.
        The semantics of this function (including the return value meaning) is
        the same as for wxMBConv::MB2WC. Notice that when the function is
        called with a non-@NULL buffer, the @a n parameter should be the size
        of the buffer and so it should take into account the trailing @c NUL,
        which might take two or four bytes for some encodings (UTF-16 and
        UTF-32) and not one.
    */
    virtual size_t WC2MB(char* buf, const wchar_t* psz, size_t n) const;
};


/**
    @class wxMBConvUTF7
    @wxheader{strconv.h}

    This class converts between the UTF-7 encoding and Unicode.
    It has one predefined instance, @b wxConvUTF7.

    Notice that, unlike all the other conversion objects, this converter is
    stateful, i.e. it remembers its state from the last call to its ToWChar()
    or FromWChar() and assumes it is called on the continuation of the same
    string when the same method is called again. This assumption is only made
    if an explicit length is specified as parameter to these functions as if an
    entire @c NUL terminated string is processed the state doesn't need to be
    remembered.

    This also means that, unlike the other predefined conversion objects,
    @b wxConvUTF7 is @em not thread-safe.

    @library{wxbase}
    @category{conv}

    @see wxMBConvUTF8, @ref overview_mbconv "wxMBConv classes overview"
*/
class wxMBConvUTF7 : public wxMBConv
{
};


/**
    @class wxMBConvUTF8
    @wxheader{strconv.h}

    This class converts between the UTF-8 encoding and Unicode.
    It has one predefined instance, @b wxConvUTF8.

    @library{wxbase}
    @category{conv}

    @see wxMBConvUTF7, @ref overview_mbconv "wxMBConv classes overview"
*/
class wxMBConvUTF8 : public wxMBConv
{
};


/**
    @class wxMBConvUTF16
    @wxheader{strconv.h}

    This class is used to convert between multibyte encodings and UTF-16 Unicode
    encoding (also known as UCS-2).

    Unlike UTF-8 encoding, UTF-16 uses words and not bytes and hence depends
    on the byte ordering: big or little endian. Hence this class is provided in
    two versions: wxMBConvUTF16LE and wxMBConvUTF16BE and wxMBConvUTF16 itself
    is just a typedef for one of them (native for the given platform, e.g. LE
    under Windows and BE under Mac).

    @library{wxbase}
    @category{conv}

    @see wxMBConvUTF8, wxMBConvUTF32, @ref overview_mbconv "wxMBConv classes overview"
*/
class wxMBConvUTF16 : public wxMBConv
{
};


/**
    @class wxMBConvUTF32
    @wxheader{strconv.h}

    This class is used to convert between multibyte encodings and UTF-32
    Unicode encoding (also known as UCS-4).
    Unlike UTF-8 encoding, UTF-32 uses (double) words and not bytes and hence
    depends on the byte ordering: big or little endian. Hence this class is
    provided in two versions: wxMBConvUTF32LE and wxMBConvUTF32BE and
    wxMBConvUTF32 itself is just a typedef for one of them (native for the
    given platform, e.g. LE under Windows and BE under Mac).

    @library{wxbase}
    @category{conv}

    @see wxMBConvUTF8, wxMBConvUTF16, @ref overview_mbconv "wxMBConv classes overview"
*/
class wxMBConvUTF32 : public wxMBConv
{
};


/**
    @class wxCSConv
    @wxheader{strconv.h}

    This class converts between any character set supported by the system and
    Unicode.

    Please notice that this class uses system-provided conversion functions,
    e.g. @c MultiByteToWideChar() and @c WideCharToMultiByte() under MSW and @c
    iconv(3) under Unix systems and as such may support different encodings and
    different encoding names on different platforms (although all relatively
    common encodings are supported should be supported everywhere).

    It has one predefined instance, @b wxConvLocal, for the default user
    character set.

    @library{wxbase}
    @category{conv}

    @see wxMBConv, wxEncodingConverter, @ref overview_mbconv "wxMBConv classes overview"
*/
class wxCSConv : public wxMBConv
{
public:
    /**
        Constructor.

        You can specify the name of the character set you want to convert
        from/to. If the character set name is not recognized, ISO 8859-1 is
        used as fall back, use IsOk() to test for this.

        @param charset The name of the encoding, shouldn't be empty.
    */
    wxCSConv(const wxString& charset);

    /**
        Constructor.

        You can specify an encoding constant for the character set you want to
        convert from/to. Use IsOk() after construction to check whether the
        encoding is supported by the current system.

        @param encoding Any valid (i.e. not wxFONTENCODING_MAX) font encoding.
    */
    wxCSConv(wxFontEncoding encoding);

    /**
        Returns @true if the charset (or the encoding) given at constructor is
        really available to use.

        Returns @false if ISO 8859-1 will be used instead.

        Note this does not mean that a given string will be correctly
        converted. A malformed string may still make conversion functions
        return @c wxCONV_FAILED.

        @since 2.8.2
    */
    bool IsOk() const;
};


/**
    @class wxMBConvFile
    @wxheader{strconv.h}

    This class used to define the class instance @b wxConvFileName, but
    nowadays @b wxConvFileName is either of type wxConvLibc (on most platforms)
    or wxConvUTF8 (on MacOS X).

    @b wxConvFileName converts filenames between filesystem multibyte encoding
    and Unicode. @b wxConvFileName can also be set to a something else at
    run-time which is used e.g. by wxGTK to use a class which checks the
    environment variable @b G_FILESYSTEM_ENCODING indicating that filenames
    should not be interpreted as UTF8 and also for converting invalid UTF8
    characters (e.g. if there is a filename in iso8859_1) to strings with octal
    values.

    Since some platforms (such as Win32) use Unicode in the filenames,
    and others (such as Unix) use multibyte encodings, this class should only
    be used directly if wxMBFILES is defined to 1. A convenience macro,
    @c wxFNCONV, is defined to @c wxConvFileName->cWX2MB in this case. You
    could use it like this:

    @code
    wxChar *name = wxT("rawfile.doc");
    FILE *fil = fopen(wxFNCONV(name), "r");
    @endcode

    (although it would be better to just use wxFopen(name, "r") in this
    particular case, you only need to use this class for functions taking file
    names not wrapped by wxWidgets.)

    @library{wxbase}
    @category{conv}

    @see @ref overview_mbconv "wxMBConv classes overview"
*/
class wxMBConvFile : public wxMBConv
{
public:
};
Commit	Line	Data
23324ae1 FM	1	/////////////////////////////////////////////////////////////////////////////
23324ae1 FM	2	// Name: strconv.h
e54c96f1	3	// Purpose: interface of wxMBConvUTF7
23324ae1 FM	4	// Author: wxWidgets team
	5	// RCS-ID: $Id$
	6	// Licence: wxWindows license
	7	/////////////////////////////////////////////////////////////////////////////
	8
	9	/**
f501c3a9	10	@class wxMBConv
23324ae1	11	@wxheader{strconv.h}
7c913512	12
f501c3a9 VZ	13	This class is the base class of a hierarchy of classes capable of
	14	converting text strings between multibyte (SBCS or DBCS) encodings and
	15	Unicode.
	16
	17	This is an abstract base class which defines the operations implemented by
	18	all different conversion classes. The derived classes don't add any new
	19	operations of their own (except, possibly, some non-default constructors)
	20	and so you should simply use this class ToWChar() and FromWChar() (or
	21	cMB2WC() and cWC2MB()) methods with the objects of the derived class.
	22
	23	In the documentation for this and related classes please notice that
	24	length of the string refers to the number of characters in the string
	25	not counting the terminating @c NUL, if any. While the size of the string
	26	is the total number of bytes in the string, including any trailing @c NUL.
	27	Thus, length of wide character string @c L"foo" is 3 while its size can
	28	be either 8 or 16 depending on whether @c wchar_t is 2 bytes (as
	29	under Windows) or 4 (Unix).
7c913512	30
23324ae1	31	@library{wxbase}
79b40dcf	32	@category{conv}
7c913512	33
f501c3a9	34	@see wxCSConv, wxEncodingConverter, @ref overview_mbconv "wxMBConv classes overview"
23324ae1	35	*/
f501c3a9	36	class wxMBConv
23324ae1 FM	37	{
	38	public:
	39	/**
f501c3a9	40	Trivial default constructor.
23324ae1	41	*/
f501c3a9	42	wxMBConv();
23324ae1 FM	43
23324ae1 FM	44	/**
f501c3a9 VZ	45	This pure virtual function is overridden in each of the derived classes
f501c3a9 VZ	46	to return a new copy of the object it is called on.
7c913512	47
f501c3a9 VZ	48	It is used for copying the conversion objects while preserving their
	49	dynamic type.
	50	*/
	51	virtual wxMBConv* Clone() const = 0;
7c913512	52
23324ae1	53	/**
f501c3a9 VZ	54	This function returns 1 for most of the multibyte encodings in which the
	55	string is terminated by a single @c NUL, 2 for UTF-16 and 4 for UTF-32 for
	56	which the string is terminated with 2 and 4 @c NUL characters respectively.
	57	The other cases are not currently supported and @c wxCONV_FAILED
	58	(defined as -1) is returned for them.
23324ae1	59	*/
f501c3a9	60	size_t GetMBNulLen() const;
23324ae1 FM	61
23324ae1 FM	62	/**
f501c3a9 VZ	63	Returns the maximal value which can be returned by GetMBNulLen() for
f501c3a9 VZ	64	any conversion object.
23324ae1	65
f501c3a9	66	Currently this value is 4.
23324ae1	67
f501c3a9 VZ	68	This method can be used to allocate the buffer with enough space for the
	69	trailing @c NUL characters for any encoding.
	70	*/
	71	const size_t GetMaxMBNulLen();
e54c96f1	72
f501c3a9 VZ	73	/**
f501c3a9 VZ	74	Convert multibyte string to a wide character one.
7c913512	75
f501c3a9 VZ	76	This is the most general function for converting a multibyte string to
	77	a wide string, cMB2WC() may be often more convenient, however this
	78	function is the most efficient one as it allows to avoid any
	79	unnecessary copying.
7c913512	80
f501c3a9 VZ	81	The main case is when @a dst is not @NULL and @a srcLen is not
	82	@c wxNO_LEN (which is defined as @c (size_t)-1): then the function
	83	converts exactly @a srcLen bytes starting at @a src into wide string
	84	which it output to @e dst. If the length of the resulting wide
	85	string is greater than @e dstLen, an error is returned. Note that if
	86	@a srcLen bytes don't include @c NUL characters, the resulting wide
	87	string is not @c NUL-terminated neither.
7c913512	88
f501c3a9 VZ	89	If @a srcLen is @c wxNO_LEN, the function supposes that the string is
	90	properly (i.e. as necessary for the encoding handled by this
	91	conversion) @c NUL-terminated and converts the entire string, including
	92	any trailing @c NUL bytes. In this case the wide string is also @c
	93	NUL-terminated.
	94
	95	Finally, if @a dst is @NULL, the function returns the length of the
	96	needed buffer.
	97
	98	Example of use of this function:
	99	@code
	100	size_t dstLen = conv.ToWChar(NULL, 0, src);
	101	if ( dstLen == wxCONV_FAILED )
	102	... handle error ...
	103	wchar_t *dst = new wchar_t[dstLen];
	104	if ( conv.ToWChar(dst, dstLen, src) == wxCONV_FAILED )
	105	... handle error ...
	106	@endcode
	107
	108	Notice that when passing the explicit source length the output will
	109	@e not be @c NUL terminated if you pass @c strlen(str) as parameter.
	110	Either leave @a srcLen as default @c wxNO_LEN or add one to @c strlen
	111	result if you want the output to be @c NUL terminated.
	112
	113	@param dst
	114	Pointer to output buffer of the size of at least @a dstLen or @NULL.
	115	@param dstLen
	116	Maximal number of characters to be written to the output buffer if
	117	@dst is non-@NULL, unused otherwise.
	118	@param src
	119	Point to the source string, must not be @NULL.
	120	@param
	121	The number of characters of the source string to convert or @c
	122	wxNO_LEN (default parameter) to convert everything up to and
	123	including the terminating @c NUL character(s).
	124	@return
	125	The number of character written (or which would have been written
	126	if it were non-@NULL) to @a dst or @c wxCONV_FAILED on error.
23324ae1	127	*/
f501c3a9 VZ	128	virtual size_t ToWChar(wchar_t* dst, size_t dstLen,
	129	const char* src,
	130	size_t srcLen = wxNO_LEN) const;
23324ae1 FM	131
23324ae1 FM	132	/**
f501c3a9 VZ	133	Converts wide character string to multibyte.
	134
	135	This function has the same semantics as ToWChar() except that it
	136	converts a wide string to multibyte one. As with ToWChar(), it may be
	137	more convenient to use cWC2MB() when working with @c NUL terminated
	138	strings.
	139
	140	@param dst
	141	Pointer to output buffer of the size of at least @a dstLen or @NULL.
	142	@param dstLen
	143	Maximal number of characters to be written to the output buffer if
	144	@dst is non-@NULL, unused otherwise.
	145	@param src
	146	Point to the source string, must not be @NULL.
	147	@param
	148	The number of characters of the source string to convert or @c
	149	wxNO_LEN (default parameter) to convert everything up to and
	150	including the terminating @c NUL character.
	151	@return
	152	The number of character written (or which would have been written
	153	if it were non-@NULL) to @a dst or @c wxCONV_FAILED on error.
23324ae1	154	*/
f501c3a9 VZ	155	virtual size_t FromWChar(char* dst, size_t dstLen,
	156	const wchar_t* src,
	157	size_t srcLen = wxNO_LEN) const;
23324ae1	158
f501c3a9 VZ	159	//@{
	160	/**
	161	Converts from multibyte encoding to Unicode by calling MB2WC() and
	162	allocating a temporary wxWCharBuffer to hold the result.
	163
	164	The first overload takes a @c NUL-terminated input string. The second
	165	one takes a string of exactly the specified length and the string may
	166	include or not the trailing @c NUL character(s). If the string is not
	167	@c NUL-terminated, a temporary @c NUL-terminated copy of it suitable
	168	for passing to wxMBConv::MB2WC is made, so it is more efficient to
	169	ensure that the string is does have the appropriate number of @c NUL
	170	bytes (which is usually 1 but may be 2 or 4 for UTF-16 or UTF-32, see
	171	wxMBConv::GetMBNulLen), especially for long strings.
e54c96f1	172
f501c3a9 VZ	173	If @a outLen is not-@NULL, it receives the length of the converted
	174	string.
	175	*/
	176	const wxWCharBuffer cMB2WC(const char* in) const;
	177	const wxWCharBuffer cMB2WC(const char* in, size_t inLen, size_t *outLen) const;
	178	//@}
7c913512	179
f501c3a9 VZ	180	//@{
	181	/**
	182	Converts from multibyte encoding to the current wxChar type (which
	183	depends on whether wxUSE_UNICODE is set to 1).
7c913512	184
f501c3a9 VZ	185	If wxChar is char, it returns the parameter unaltered. If wxChar is
	186	wchar_t, it returns the result in a wxWCharBuffer. The macro wxMB2WXbuf
	187	is defined as the correct return type (without const).
	188	*/
	189	const char* cMB2WX(const char* psz) const;
	190	const wxWCharBuffer cMB2WX(const char* psz) const;
	191	//@}
7c913512	192
f501c3a9	193	//@{
23324ae1	194	/**
f501c3a9 VZ	195	Converts from Unicode to multibyte encoding by calling WC2MB and
	196	allocating a temporary wxCharBuffer to hold the result.
	197
	198	The second overload of this function allows to convert a string of the
	199	given length @e inLen, whether it is @c NUL-terminated or not (for wide
	200	character strings, unlike for the multibyte ones, a single @c NUL is
	201	always enough). But notice that just as with @ref wxMBConv::mb2wc
	202	cMB2WC, it is more efficient to pass an already terminated string to
	203	this function as otherwise a copy is made internally. If @a outLen is
	204	not-@NULL, it receives the length of the converted string.
23324ae1	205	*/
f501c3a9 VZ	206	const wxCharBuffer cWC2MB(const wchar_t* in) const;
	207	const wxCharBuffer cWC2MB(const wchar_t* in, size_t inLen, size_t *outLen) const;
	208	//@}
79b40dcf	209
f501c3a9	210	//@{
ee0b7af0	211	/**
f501c3a9 VZ	212	Converts from Unicode to the current wxChar type.
	213
	214	If wxChar is wchar_t, it returns the parameter unaltered. If wxChar is
	215	char, it returns the result in a wxCharBuffer. The macro wxWC2WXbuf is
	216	defined as the correct return type (without const).
ee0b7af0	217	*/
f501c3a9 VZ	218	const wchar_t* cWC2WX(const wchar_t* psz) const;
	219	const wxCharBuffer cWC2WX(const wchar_t* psz) const;
	220	//@}
23324ae1	221
f501c3a9	222	//@{
23324ae1	223	/**
f501c3a9 VZ	224	Converts from the current wxChar type to multibyte encoding.
	225
	226	If wxChar is char, it returns the parameter unaltered. If wxChar is
	227	wchar_t, it returns the result in a wxCharBuffer. The macro wxWX2MBbuf
	228	is defined as the correct return type (without const).
23324ae1	229	*/
f501c3a9 VZ	230	const char* cWX2MB(const wxChar* psz) const;
	231	const wxCharBuffer cWX2MB(const wxChar* psz) const;
	232	//@}
23324ae1	233
f501c3a9	234	//@{
23324ae1	235	/**
f501c3a9	236	Converts from the current wxChar type to Unicode.
3c4f71cc	237
f501c3a9 VZ	238	If wxChar is wchar_t, it returns the parameter unaltered. If wxChar is
	239	char, it returns the result in a wxWCharBuffer. The macro wxWX2WCbuf is
	240	defined as the correct return type (without const).
23324ae1	241	*/
f501c3a9 VZ	242	const wchar_t* cWX2WC(const wxChar* psz) const;
	243	const wxWCharBuffer cWX2WC(const wxChar* psz) const;
	244	//@}
23324ae1 FM	245
23324ae1 FM	246	/**
f501c3a9 VZ	247	@deprecated This function is deprecated, please use ToWChar() instead.
	248
	249	Converts from a string @a in in multibyte encoding to Unicode putting up to
	250	@a outLen characters into the buffer @e out.
	251
	252	If @a out is @NULL, only the length of the string which would result
	253	from the conversion is calculated and returned. Note that this is the
	254	length and not size, i.e. the returned value does not include the
	255	trailing @c NUL. But when the function is called with a non-@NULL @a
	256	out buffer, the @a outLen parameter should be one more to allow to
	257	properly @c NUL-terminate the string.
	258
	259	@param out
	260	The output buffer, may be @NULL if the caller is only
	261	interested in the length of the resulting string
	262	@param in
	263	The NUL-terminated input string, cannot be @NULL
	264	@param outLen
	265	The length of the output buffer but including
	266	NUL, ignored if out is @NULL
	267
	268	@return The length of the converted string excluding the trailing NUL.
23324ae1	269	*/
f501c3a9	270	virtual size_t MB2WC(wchar_t* out, const char* in, size_t outLen) const;
23324ae1 FM	271
23324ae1 FM	272	/**
f501c3a9 VZ	273	@deprecated This function is deprecated, please use FromWChar() instead.
	274
	275	Converts from Unicode to multibyte encoding.
	276	The semantics of this function (including the return value meaning) is
	277	the same as for wxMBConv::MB2WC. Notice that when the function is
	278	called with a non-@NULL buffer, the @a n parameter should be the size
	279	of the buffer and so it should take into account the trailing @c NUL,
	280	which might take two or four bytes for some encodings (UTF-16 and
	281	UTF-32) and not one.
23324ae1	282	*/
f501c3a9	283	virtual size_t WC2MB(char* buf, const wchar_t* psz, size_t n) const;
23324ae1 FM	284	};
	285
	286
	287	/**
f501c3a9	288	@class wxMBConvUTF7
23324ae1	289	@wxheader{strconv.h}
7c913512	290
f501c3a9 VZ	291	This class converts between the UTF-7 encoding and Unicode.
f501c3a9 VZ	292	It has one predefined instance, @b wxConvUTF7.
7c913512	293
9d653e81 VZ	294	Notice that, unlike all the other conversion objects, this converter is
	295	stateful, i.e. it remembers its state from the last call to its ToWChar()
	296	or FromWChar() and assumes it is called on the continuation of the same
	297	string when the same method is called again. This assumption is only made
	298	if an explicit length is specified as parameter to these functions as if an
	299	entire @c NUL terminated string is processed the state doesn't need to be
	300	remembered.
	301
	302	This also means that, unlike the other predefined conversion objects,
	303	@b wxConvUTF7 is @em not thread-safe.
	304
f501c3a9 VZ	305	@library{wxbase}
	306	@category{conv}
	307
	308	@see wxMBConvUTF8, @ref overview_mbconv "wxMBConv classes overview"
	309	*/
	310	class wxMBConvUTF7 : public wxMBConv
	311	{
	312	};
7c913512	313
7c913512	314
f501c3a9 VZ	315
	316	/**
	317	@class wxMBConvUTF8
	318	@wxheader{strconv.h}
	319
	320	This class converts between the UTF-8 encoding and Unicode.
	321	It has one predefined instance, @b wxConvUTF8.
7c913512	322
23324ae1	323	@library{wxbase}
79b40dcf	324	@category{conv}
7c913512	325
f501c3a9	326	@see wxMBConvUTF7, @ref overview_mbconv "wxMBConv classes overview"
23324ae1	327	*/
f501c3a9	328	class wxMBConvUTF8 : public wxMBConv
23324ae1	329	{
23324ae1 FM	330	};
	331
	332
e54c96f1	333
f501c3a9 VZ	334	/**
	335	@class wxMBConvUTF16
	336	@wxheader{strconv.h}
	337
	338	This class is used to convert between multibyte encodings and UTF-16 Unicode
	339	encoding (also known as UCS-2).
	340
	341	Unlike UTF-8 encoding, UTF-16 uses words and not bytes and hence depends
	342	on the byte ordering: big or little endian. Hence this class is provided in
	343	two versions: wxMBConvUTF16LE and wxMBConvUTF16BE and wxMBConvUTF16 itself
	344	is just a typedef for one of them (native for the given platform, e.g. LE
	345	under Windows and BE under Mac).
	346
	347	@library{wxbase}
	348	@category{conv}
	349
	350	@see wxMBConvUTF8, wxMBConvUTF32, @ref overview_mbconv "wxMBConv classes overview"
	351	*/
	352	class wxMBConvUTF16 : public wxMBConv
	353	{
	354	};
	355
	356
23324ae1 FM	357	/**
	358	@class wxMBConvUTF32
	359	@wxheader{strconv.h}
7c913512	360
f501c3a9 VZ	361	This class is used to convert between multibyte encodings and UTF-32
	362	Unicode encoding (also known as UCS-4).
	363	Unlike UTF-8 encoding, UTF-32 uses (double) words and not bytes and hence
	364	depends on the byte ordering: big or little endian. Hence this class is
	365	provided in two versions: wxMBConvUTF32LE and wxMBConvUTF32BE and
	366	wxMBConvUTF32 itself is just a typedef for one of them (native for the
	367	given platform, e.g. LE under Windows and BE under Mac).
7c913512	368
23324ae1	369	@library{wxbase}
79b40dcf	370	@category{conv}
7c913512	371
8c1cd030	372	@see wxMBConvUTF8, wxMBConvUTF16, @ref overview_mbconv "wxMBConv classes overview"
23324ae1 FM	373	*/
	374	class wxMBConvUTF32 : public wxMBConv
	375	{
23324ae1 FM	376	};
	377
	378
e54c96f1	379
f501c3a9	380
23324ae1	381	/**
f501c3a9	382	@class wxCSConv
23324ae1	383	@wxheader{strconv.h}
7c913512	384
f501c3a9 VZ	385	This class converts between any character set supported by the system and
f501c3a9 VZ	386	Unicode.
7c913512	387
f501c3a9 VZ	388	Please notice that this class uses system-provided conversion functions,
	389	e.g. @c MultiByteToWideChar() and @c WideCharToMultiByte() under MSW and @c
	390	iconv(3) under Unix systems and as such may support different encodings and
	391	different encoding names on different platforms (although all relatively
	392	common encodings are supported should be supported everywhere).
	393
	394	It has one predefined instance, @b wxConvLocal, for the default user
	395	character set.
7c913512	396
23324ae1	397	@library{wxbase}
79b40dcf	398	@category{conv}
7c913512	399
f501c3a9	400	@see wxMBConv, wxEncodingConverter, @ref overview_mbconv "wxMBConv classes overview"
23324ae1	401	*/
f501c3a9	402	class wxCSConv : public wxMBConv
23324ae1 FM	403	{
	404	public:
	405	/**
f501c3a9	406	Constructor.
23324ae1	407
f501c3a9 VZ	408	You can specify the name of the character set you want to convert
	409	from/to. If the character set name is not recognized, ISO 8859-1 is
	410	used as fall back, use IsOk() to test for this.
23324ae1	411
f501c3a9	412	@param charset The name of the encoding, shouldn't be empty.
23324ae1	413	*/
f501c3a9	414	wxCSConv(const wxString& charset);
23324ae1 FM	415
23324ae1 FM	416	/**
f501c3a9	417	Constructor.
23324ae1	418
f501c3a9 VZ	419	You can specify an encoding constant for the character set you want to
	420	convert from/to. Use IsOk() after construction to check whether the
	421	encoding is supported by the current system.
	422
	423	@param encoding Any valid (i.e. not wxFONTENCODING_MAX) font encoding.
23324ae1	424	*/
f501c3a9	425	wxCSConv(wxFontEncoding encoding);
23324ae1 FM	426
23324ae1 FM	427	/**
f501c3a9 VZ	428	Returns @true if the charset (or the encoding) given at constructor is
f501c3a9 VZ	429	really available to use.
3c4f71cc	430
f501c3a9	431	Returns @false if ISO 8859-1 will be used instead.
3c4f71cc	432
f501c3a9 VZ	433	Note this does not mean that a given string will be correctly
	434	converted. A malformed string may still make conversion functions
	435	return @c wxCONV_FAILED.
23324ae1	436
f501c3a9	437	@since 2.8.2
23324ae1	438	*/
f501c3a9 VZ	439	bool IsOk() const;
f501c3a9 VZ	440	};
23324ae1	441
23324ae1	442
23324ae1	443
f501c3a9 VZ	444	/**
	445	@class wxMBConvFile
	446	@wxheader{strconv.h}
23324ae1	447
f501c3a9 VZ	448	This class used to define the class instance @b wxConvFileName, but
	449	nowadays @b wxConvFileName is either of type wxConvLibc (on most platforms)
	450	or wxConvUTF8 (on MacOS X).
23324ae1	451
f501c3a9 VZ	452	@b wxConvFileName converts filenames between filesystem multibyte encoding
	453	and Unicode. @b wxConvFileName can also be set to a something else at
	454	run-time which is used e.g. by wxGTK to use a class which checks the
	455	environment variable @b G_FILESYSTEM_ENCODING indicating that filenames
	456	should not be interpreted as UTF8 and also for converting invalid UTF8
	457	characters (e.g. if there is a filename in iso8859_1) to strings with octal
	458	values.
23324ae1	459
f501c3a9 VZ	460	Since some platforms (such as Win32) use Unicode in the filenames,
	461	and others (such as Unix) use multibyte encodings, this class should only
	462	be used directly if wxMBFILES is defined to 1. A convenience macro,
	463	@c wxFNCONV, is defined to @c wxConvFileName->cWX2MB in this case. You
	464	could use it like this:
23324ae1	465
f501c3a9 VZ	466	@code
	467	wxChar *name = wxT("rawfile.doc");
	468	FILE *fil = fopen(wxFNCONV(name), "r");
	469	@endcode
	470
	471	(although it would be better to just use wxFopen(name, "r") in this
	472	particular case, you only need to use this class for functions taking file
	473	names not wrapped by wxWidgets.)
e54c96f1	474
f501c3a9 VZ	475	@library{wxbase}
	476	@category{conv}
	477
	478	@see @ref overview_mbconv "wxMBConv classes overview"
	479	*/
	480	class wxMBConvFile : public wxMBConv
	481	{
	482	public:
	483	};