1999-12-31 00:35:13 +00:00
|
|
|
%
|
|
|
|
% automatically generated by HelpGen from
|
|
|
|
% encconv.h at 30/Dec/99 18:45:16
|
|
|
|
%
|
|
|
|
|
|
|
|
\section{\class{wxEncodingConverter}}\label{wxencodingconverter}
|
|
|
|
|
2003-01-23 19:49:53 +00:00
|
|
|
This class is capable of converting strings between two
|
2000-02-06 19:11:10 +00:00
|
|
|
8-bit encodings/charsets. It can also convert from/to Unicode (but only
|
2005-11-20 15:22:17 +00:00
|
|
|
if you compiled wxWidgets with wxUSE\_WCHAR\_T set to 1). Only a limited subset
|
|
|
|
of encodings is supported by wxEncodingConverter:
|
2003-01-23 19:49:53 +00:00
|
|
|
{\tt wxFONTENCODING\_ISO8859\_1..15}, {\tt wxFONTENCODING\_CP1250..1257} and
|
|
|
|
{\tt wxFONTENCODING\_KOI8}.
|
|
|
|
|
|
|
|
\wxheading{Note}
|
|
|
|
|
|
|
|
Please use \helpref{wxMBConv classes}{mbconvclasses} instead
|
|
|
|
if possible. \helpref{wxCSConv}{wxcsconv} has much better support for various
|
|
|
|
encodings than wxEncodingConverter. wxEncodingConverter is useful only
|
|
|
|
if you rely on {\tt wxCONVERT\_SUBSTITUTE} mode of operation (see
|
|
|
|
\helpref{Init}{wxencodingconverterinit}).
|
1999-12-31 00:35:13 +00:00
|
|
|
|
|
|
|
\wxheading{Derived from}
|
|
|
|
|
|
|
|
\helpref{wxObject}{wxobject}
|
|
|
|
|
2000-02-27 21:06:58 +00:00
|
|
|
\wxheading{Include files}
|
|
|
|
|
|
|
|
<wx/encconv.h>
|
|
|
|
|
2000-03-11 10:05:40 +00:00
|
|
|
\wxheading{See also}
|
|
|
|
|
|
|
|
\helpref{wxFontMapper}{wxfontmapper},
|
2000-07-15 19:51:35 +00:00
|
|
|
\helpref{wxMBConv}{wxmbconv},
|
2000-03-11 10:05:40 +00:00
|
|
|
\helpref{Writing non-English applications}{nonenglishoverview}
|
|
|
|
|
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\latexignore{\rtfignore{\wxheading{Members}}}
|
|
|
|
|
2003-10-13 23:47:22 +00:00
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\membersection{wxEncodingConverter::wxEncodingConverter}\label{wxencodingconverterwxencodingconverter}
|
|
|
|
|
|
|
|
\func{}{wxEncodingConverter}{\void}
|
|
|
|
|
|
|
|
Constructor.
|
|
|
|
|
2003-10-13 23:47:22 +00:00
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\membersection{wxEncodingConverter::Init}\label{wxencodingconverterinit}
|
|
|
|
|
|
|
|
\func{bool}{Init}{\param{wxFontEncoding }{input\_enc}, \param{wxFontEncoding }{output\_enc}, \param{int }{method = wxCONVERT\_STRICT}}
|
|
|
|
|
2002-06-07 20:15:28 +00:00
|
|
|
Initialize conversion. Either the input or the output encoding (or both) may
|
1999-12-31 00:35:13 +00:00
|
|
|
be wxFONTENCODING\_UNICODE, but only if wxUSE\_WCHAR\_T is set to 1.
|
|
|
|
All subsequent calls to \helpref{Convert()}{wxencodingconverterconvert}
|
2000-02-06 19:11:10 +00:00
|
|
|
will interpret its argument
|
|
|
|
as a string in {\it input\_enc} encoding and will output string in
|
1999-12-31 00:35:13 +00:00
|
|
|
{\it output\_enc} encoding.
|
|
|
|
You must call this method before calling Convert. You may call
|
|
|
|
it more than once in order to switch to another conversion.
|
|
|
|
{\it Method} affects behaviour of Convert() in case input character
|
|
|
|
cannot be converted because it does not exist in output encoding:
|
|
|
|
|
2000-02-06 19:11:10 +00:00
|
|
|
\begin{twocollist}\itemsep=0pt
|
1999-12-31 00:35:13 +00:00
|
|
|
\twocolitem{{\bf wxCONVERT\_STRICT}}{follow behaviour of GNU Recode -
|
2000-07-15 19:51:35 +00:00
|
|
|
just copy unconvertible characters to output and don't change them
|
1999-12-31 00:35:13 +00:00
|
|
|
(their integer values will stay the same)}
|
|
|
|
\twocolitem{{\bf wxCONVERT\_SUBSTITUTE}}{try some (lossy) substitutions
|
2000-07-15 19:51:35 +00:00
|
|
|
- e.g. replace unconvertible latin capitals with acute by ordinary
|
1999-12-31 00:35:13 +00:00
|
|
|
capitals, replace en-dash or em-dash by '-' etc.}
|
|
|
|
\end{twocollist}
|
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
Both modes guarantee that the output string will have the same length
|
1999-12-31 00:35:13 +00:00
|
|
|
as input string.
|
|
|
|
|
|
|
|
\wxheading{Return value}
|
|
|
|
|
2003-01-18 00:16:34 +00:00
|
|
|
false if given conversion is impossible, true otherwise
|
1999-12-31 00:35:13 +00:00
|
|
|
(conversion may be impossible either if you try to convert
|
2004-05-04 08:27:20 +00:00
|
|
|
to Unicode with non-Unicode build of wxWidgets or if input
|
1999-12-31 00:35:13 +00:00
|
|
|
or output encoding is not supported.)
|
|
|
|
|
2003-10-13 23:47:22 +00:00
|
|
|
|
|
|
|
\membersection{wxEncodingConverter::CanConvert}\label{wxencodingconvertercanconvert}
|
|
|
|
|
2005-11-20 15:22:17 +00:00
|
|
|
\func{static bool}{CanConvert}{\param{wxFontEncoding }{encIn}, \param{wxFontEncoding }{encOut}}
|
2003-10-13 23:47:22 +00:00
|
|
|
|
|
|
|
Return true if (any text in) multibyte encoding \arg{encIn} can be converted to
|
2004-06-19 07:40:07 +00:00
|
|
|
another one ({\it encOut}) losslessly.
|
2003-10-13 23:47:22 +00:00
|
|
|
|
|
|
|
Do not call this method with \texttt{wxFONTENCODING\_UNICODE} as either
|
|
|
|
parameter; it doesn't make sense (conversion always works in one direction and always depends
|
|
|
|
on the text to convert in the other).
|
|
|
|
|
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\membersection{wxEncodingConverter::Convert}\label{wxencodingconverterconvert}
|
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
\constfunc{bool}{Convert}{\param{const char* }{input}, \param{char* }{output}}
|
2002-04-06 19:07:40 +00:00
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
\constfunc{bool}{Convert}{\param{const wchar\_t* }{input}, \param{wchar\_t* }{output}}
|
2002-04-06 19:07:40 +00:00
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
\constfunc{bool}{Convert}{\param{const char* }{input}, \param{wchar\_t* }{output}}
|
2002-04-06 19:07:40 +00:00
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
\constfunc{bool}{Convert}{\param{const wchar\_t* }{input}, \param{char* }{output}}
|
2002-04-06 19:07:40 +00:00
|
|
|
|
|
|
|
Convert input string according to settings passed to
|
|
|
|
\helpref{Init}{wxencodingconverterinit} and write the result to {\it output}.
|
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
\constfunc{bool}{Convert}{\param{char* }{str}}
|
2002-04-06 19:07:40 +00:00
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
\constfunc{bool}{Convert}{\param{wchar\_t* }{str}}
|
2002-04-06 19:07:40 +00:00
|
|
|
|
|
|
|
Convert input string according to settings passed to
|
|
|
|
\helpref{Init}{wxencodingconverterinit} in-place, i.e. write the result to the
|
|
|
|
same memory area.
|
|
|
|
|
2004-11-16 11:58:24 +00:00
|
|
|
All of the versions above return \true if the conversion was lossless and
|
|
|
|
\false if at least one of the characters couldn't be converted and was replaced
|
|
|
|
with {\tt '?'} in the output. Note that if {\tt wxCONVERT\_SUBSTITUTE} was
|
|
|
|
passed to \helpref{Init}{wxencodingconverterinit}, substitution is considered
|
|
|
|
a lossless operation.
|
|
|
|
|
2003-09-22 20:15:00 +00:00
|
|
|
\constfunc{wxString}{Convert}{\param{const wxString\& }{input}}
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2002-04-06 19:07:40 +00:00
|
|
|
Convert wxString and return new wxString object.
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2002-04-06 19:07:40 +00:00
|
|
|
\wxheading{Notes}
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2002-04-06 19:07:40 +00:00
|
|
|
You must call \helpref{Init}{wxencodingconverterinit} before using this method!
|
2000-01-02 19:51:04 +00:00
|
|
|
|
2004-05-04 08:27:20 +00:00
|
|
|
{\tt wchar\_t} versions of the method are not available if wxWidgets was compiled
|
2002-04-06 19:07:40 +00:00
|
|
|
with {\tt wxUSE\_WCHAR\_T} set to 0.
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2003-10-13 23:47:22 +00:00
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\membersection{wxEncodingConverter::GetPlatformEquivalents}\label{wxencodingconvertergetplatformequivalents}
|
|
|
|
|
2000-01-02 19:51:04 +00:00
|
|
|
\func{static wxFontEncodingArray}{GetPlatformEquivalents}{\param{wxFontEncoding }{enc}, \param{int }{platform = wxPLATFORM\_CURRENT}}
|
1999-12-31 00:35:13 +00:00
|
|
|
|
|
|
|
Return equivalents for the given font encoding that are used
|
|
|
|
under given platform. Supported platforms:
|
|
|
|
|
2000-02-06 19:11:10 +00:00
|
|
|
\begin{itemize}\itemsep=0pt
|
1999-12-31 00:35:13 +00:00
|
|
|
\item wxPLATFORM\_UNIX
|
|
|
|
\item wxPLATFORM\_WINDOWS
|
|
|
|
\item wxPLATFORM\_OS2
|
|
|
|
\item wxPLATFORM\_MAC
|
|
|
|
\item wxPLATFORM\_CURRENT
|
|
|
|
\end{itemize}
|
|
|
|
|
2002-06-07 20:15:28 +00:00
|
|
|
wxPLATFORM\_CURRENT means the platform this binary was compiled for.
|
1999-12-31 00:35:13 +00:00
|
|
|
|
|
|
|
Examples:
|
2000-02-06 19:11:10 +00:00
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\begin{verbatim}
|
|
|
|
current platform enc returned value
|
|
|
|
----------------------------------------------
|
|
|
|
unix CP1250 {ISO8859_2}
|
|
|
|
unix ISO8859_2 {ISO8859_2}
|
|
|
|
windows ISO8859_2 {CP1250}
|
|
|
|
unix CP1252 {ISO8859_1,ISO8859_15}
|
|
|
|
\end{verbatim}
|
|
|
|
|
|
|
|
Equivalence is defined in terms of convertibility:
|
2000-07-15 19:51:35 +00:00
|
|
|
two encodings are equivalent if you can convert text between
|
|
|
|
them without losing information (it may - and will - happen
|
|
|
|
that you lose special chars like quotation marks or em-dashes
|
|
|
|
but you shouldn't lose any diacritics and language-specific
|
1999-12-31 00:35:13 +00:00
|
|
|
characters when converting between equivalent encodings).
|
|
|
|
|
|
|
|
Remember that this function does {\bf NOT} check for presence of
|
|
|
|
fonts in system. It only tells you what are most suitable
|
|
|
|
encodings. (It usually returns only one encoding.)
|
|
|
|
|
|
|
|
\wxheading{Notes}
|
|
|
|
|
2000-02-06 19:11:10 +00:00
|
|
|
\begin{itemize}\itemsep=0pt
|
|
|
|
\item Note that argument {\it enc} itself may be present in the returned array,
|
2000-07-15 19:51:35 +00:00
|
|
|
so that you can, as a side-effect, detect whether the
|
2000-02-06 19:11:10 +00:00
|
|
|
encoding is native for this platform or not.
|
2000-07-15 19:51:35 +00:00
|
|
|
\item \helpref{Convert}{wxencodingconverterconvert} is not limited to
|
|
|
|
converting between equivalent encodings, it can convert between two arbitrary
|
|
|
|
encodings.
|
|
|
|
\item If {\it enc} is present in the returned array, then it is {\bf always} the first
|
2000-01-02 19:51:04 +00:00
|
|
|
item of it.
|
2000-07-15 19:51:35 +00:00
|
|
|
\item Please note that the returned array may contain no items at all.
|
1999-12-31 00:35:13 +00:00
|
|
|
\end{itemize}
|
|
|
|
|
2003-10-13 23:47:22 +00:00
|
|
|
|
1999-12-31 00:35:13 +00:00
|
|
|
\membersection{wxEncodingConverter::GetAllEquivalents}\label{wxencodingconvertergetallequivalents}
|
|
|
|
|
2000-01-02 19:51:04 +00:00
|
|
|
\func{static wxFontEncodingArray}{GetAllEquivalents}{\param{wxFontEncoding }{enc}}
|
1999-12-31 00:35:13 +00:00
|
|
|
|
|
|
|
Similar to
|
|
|
|
\helpref{GetPlatformEquivalents}{wxencodingconvertergetplatformequivalents},
|
|
|
|
but this one will return ALL
|
2000-07-15 19:51:35 +00:00
|
|
|
equivalent encodings, regardless of the platform, and including itself.
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2000-01-02 19:51:04 +00:00
|
|
|
This platform's encodings are before others in the array. And again, if {\it enc} is in the array,
|
|
|
|
it is the very first item in it.
|
2000-02-06 19:11:10 +00:00
|
|
|
|