1999-12-31 00:35:13 +00:00
|
|
|
/////////////////////////////////////////////////////////////////////////////
|
2000-07-15 19:51:35 +00:00
|
|
|
// Name: wx/encconv.h
|
1999-12-31 00:35:13 +00:00
|
|
|
// Purpose: wxEncodingConverter class for converting between different
|
|
|
|
// font encodings
|
|
|
|
// Author: Vaclav Slavik
|
|
|
|
// Copyright: (c) 1999 Vaclav Slavik
|
|
|
|
// Licence: wxWindows Licence
|
|
|
|
/////////////////////////////////////////////////////////////////////////////
|
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
#ifndef _WX_ENCCONV_H_
|
|
|
|
#define _WX_ENCCONV_H_
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2003-08-09 12:38:21 +00:00
|
|
|
#if defined(__GNUG__) && !defined(NO_GCC_PRAGMA)
|
1999-12-31 00:35:13 +00:00
|
|
|
#pragma interface "encconv.h"
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#include "wx/defs.h"
|
2001-06-26 20:59:19 +00:00
|
|
|
|
|
|
|
#if wxUSE_FONTMAP
|
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
#include "wx/object.h"
|
|
|
|
#include "wx/fontenc.h"
|
1999-12-31 00:35:13 +00:00
|
|
|
#include "wx/dynarray.h"
|
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
// constants
|
|
|
|
// ----------------------------------------------------------------------------
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
// Conversion methods accepted by wxEncodingConverter::Init(). They select what
// Convert() does with a character that does not exist in the output encoding.
enum
{
    // Copy unconvertible characters to the output unchanged.
    wxCONVERT_STRICT,

    // Try (lossy) substitutions for unconvertible characters.
    wxCONVERT_SUBSTITUTE
};
|
|
|
|
|
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
// Platform identifiers accepted by wxEncodingConverter::GetPlatformEquivalents().
enum
{
    // The platform this binary was compiled for.
    wxPLATFORM_CURRENT = -1,

    wxPLATFORM_UNIX = 0,
    wxPLATFORM_WINDOWS,
    wxPLATFORM_OS2,
    wxPLATFORM_MAC
};
|
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
// types
|
|
|
|
// ----------------------------------------------------------------------------
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2002-03-06 06:31:34 +00:00
|
|
|
// Declares wxFontEncodingArray, the array type returned by
// wxEncodingConverter::GetPlatformEquivalents() and GetAllEquivalents().
// NOTE(review): presumably a dynamic array of wxFontEncoding values stored as
// integers -- confirm against the macro definition in wx/dynarray.h.
WX_DEFINE_ARRAY_INT(wxFontEncoding, wxFontEncodingArray);
|
1999-12-31 00:35:13 +00:00
|
|
|
|
|
|
|
//--------------------------------------------------------------------------------
|
|
|
|
// wxEncodingConverter
|
|
|
|
// This class is capable of converting strings between any two
|
|
|
|
// 8bit encodings/charsets. It can also convert from/to Unicode
|
|
|
|
//--------------------------------------------------------------------------------
|
|
|
|
|
2003-07-02 01:59:24 +00:00
|
|
|
class WXDLLIMPEXP_BASE wxEncodingConverter : public wxObject
{
public:

    wxEncodingConverter();

    // Frees the conversion table. delete[] on a null pointer is a no-op,
    // so no explicit null check is needed.
    ~wxEncodingConverter() { delete[] m_Table; }

    // Initialize conversion. Both output or input encoding may
    // be wxFONTENCODING_UNICODE, but only if wxUSE_WCHAR_T is set to 1.
    //
    // All subsequent calls to Convert() will interpret its argument
    // as a string in input_enc encoding and will output string in
    // output_enc encoding.
    //
    // You must call this method before calling Convert. You may call
    // it more than once in order to switch to another conversion.
    //
    // Method affects behaviour of Convert() in case input character
    // cannot be converted because it does not exist in output encoding:
    //     wxCONVERT_STRICT --
    //              follow behaviour of GNU Recode - just copy unconvertible
    //              characters to output and don't change them (its integer
    //              value will stay the same)
    //     wxCONVERT_SUBSTITUTE --
    //              try some (lossy) substitutions - e.g. replace
    //              unconvertible latin capitals with acute by ordinary
    //              capitals, replace en-dash or em-dash by '-' etc.
    //     both modes guarantee that output string will have same length
    //     as input string
    //
    // Returns FALSE if given conversion is impossible, TRUE otherwise
    // (conversion may be impossible either if you try to convert
    // to Unicode with non-Unicode build of wxWindows or if input
    // or output encoding is not supported.)
    bool Init(wxFontEncoding input_enc, wxFontEncoding output_enc, int method = wxCONVERT_STRICT);

    // Convert input string according to settings passed to Init.
    // Note that you must call Init before using Convert!
    void Convert(const char* input, char* output);

    // In-place variant: the converted text overwrites str.
    void Convert(char* str) { Convert(str, str); }

    wxString Convert(const wxString& input);

#if wxUSE_WCHAR_T
    void Convert(const char* input, wchar_t* output);
    void Convert(const wchar_t* input, char* output);
    void Convert(const wchar_t* input, wchar_t* output);

    // In-place variant: the converted text overwrites str.
    void Convert(wchar_t* str) { Convert(str, str); }
#endif

    // Return equivalent(s) for given font that are used
    // under given platform. wxPLATFORM_CURRENT means the platform
    // this binary was compiled for
    //
    // Examples:
    //     current platform          enc    returned value
    // -----------------------------------------------------
    //     unix                   CP1250         {ISO8859_2}
    //     unix                ISO8859_2                  {}
    //     windows             ISO8859_2            {CP1250}
    //
    // Equivalence is defined in terms of convertibility:
    // 2 encodings are equivalent if you can convert text between
    // them without losing information (it may - and will - happen
    // that you lose special chars like quotation marks or em-dashes
    // but you shouldn't lose any diacritics and language-specific
    // characters when converting between equivalent encodings).
    //
    // Convert() method is not limited to converting between
    // equivalent encodings, it can convert between arbitrary
    // two encodings!
    //
    // Remember that this function does _NOT_ check for presence of
    // fonts in system. It only tells you what are most suitable
    // encodings. (It usually returns only one encoding)
    //
    // Note that argument enc itself may be present in returned array!
    // (so that you can -- as a side effect -- detect whether the
    // encoding is native for this platform or not)
    static wxFontEncodingArray GetPlatformEquivalents(wxFontEncoding enc, int platform = wxPLATFORM_CURRENT);

    // Similar to GetPlatformEquivalents, but this one will return ALL
    // equivalent encodings, regardless of the platform, including itself.
    static wxFontEncodingArray GetAllEquivalents(wxFontEncoding enc);

private:

    // Conversion table, released with delete[] in the destructor.
    // Its element type is wide only when wxUSE_WCHAR_T is enabled.
#if wxUSE_WCHAR_T
    wchar_t *m_Table;
#else
    char *m_Table;
#endif

    // NOTE(review): presumably record whether the input/output encoding
    // passed to Init() is Unicode -- confirm in the implementation file.
    bool m_UnicodeInput, m_UnicodeOutput;

    // NOTE(review): presumably set when no conversion is needed and Convert()
    // can simply copy its input -- confirm in the implementation file.
    bool m_JustCopy;

    DECLARE_NO_COPY_CLASS(wxEncodingConverter)
};
|
|
|
|
|
2001-06-26 20:59:19 +00:00
|
|
|
#endif // wxUSE_FONTMAP
|
1999-12-31 00:35:13 +00:00
|
|
|
|
2000-07-15 19:51:35 +00:00
|
|
|
#endif // _WX_ENCCONV_H_
|