2011-03-20 18:05:19 +00:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
// Name: wx/convauto.h
|
|
|
|
// Purpose: wxConvAuto class declaration
|
|
|
|
// Author: Vadim Zeitlin
|
|
|
|
// Created: 2006-04-03
|
2012-03-18 01:12:27 +00:00
|
|
|
// RCS-ID: $Id: convauto.h 69675 2011-11-05 11:23:41Z VZ $
|
2011-03-20 18:05:19 +00:00
|
|
|
// Copyright: (c) 2006 Vadim Zeitlin
|
|
|
|
// Licence: wxWindows licence
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
|
|
|
|
#ifndef _WX_CONVAUTO_H_
|
|
|
|
#define _WX_CONVAUTO_H_
|
|
|
|
|
|
|
|
#include "wx/strconv.h"
|
|
|
|
#include "wx/fontenc.h"
|
|
|
|
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
// wxConvAuto: uses BOM to automatically detect input encoding
|
|
|
|
// ----------------------------------------------------------------------------
|
|
|
|
|
2012-03-18 01:12:27 +00:00
|
|
|
// All currently recognized BOM (byte order mark) values.
//
// The enumerators are numbered consecutively starting from wxBOM_Unknown,
// which is -1, so that wxBOM_None is 0.
enum wxBOM
{
    wxBOM_Unknown = -1,     // BOM type not determined (initial state)
    wxBOM_None,             // no BOM
    wxBOM_UTF32BE,          // UTF-32 BOM, big endian
    wxBOM_UTF32LE,          // UTF-32 BOM, little endian
    wxBOM_UTF16BE,          // UTF-16 BOM, big endian
    wxBOM_UTF16LE,          // UTF-16 BOM, little endian
    wxBOM_UTF8              // UTF-8 BOM
};
|
|
|
|
|
2011-03-20 18:05:19 +00:00
|
|
|
// Conversion class which doesn't know the encoding to use when it is
// created: the real conversion object (m_conv) is only set up later, on
// first use, and is NULL until then.
class WXDLLIMPEXP_BASE wxConvAuto : public wxMBConv
{
public:
    // default ctor, the real conversion will be created on demand
    //
    // enc is remembered as the multibyte encoding to use by default if the
    // input isn't Unicode
    wxConvAuto(wxFontEncoding enc = wxFONTENCODING_DEFAULT)
    {
        Init();

        m_encDefault = enc;
    }

    // copy ctor doesn't copy the conversion object either, as the conversion
    // can only be deduced on first use: only the default encoding is taken
    // from the other object
    wxConvAuto(const wxConvAuto& other) : wxMBConv()
    {
        Init();

        m_encDefault = other.m_encDefault;
    }

    virtual ~wxConvAuto()
    {
        // m_conv may point to an existing global conversion object, in
        // which case m_ownsConv is false and it must not be deleted
        if ( m_ownsConv )
            delete m_conv;
    }

    // get/set the fall-back encoding used when the input text doesn't have BOM
    // and isn't UTF-8
    //
    // special values are wxFONTENCODING_MAX meaning not to use any fall back
    // at all (but just fail to convert in this case) and wxFONTENCODING_SYSTEM
    // meaning to use the encoding of the system locale
    static wxFontEncoding GetFallbackEncoding() { return ms_defaultMBEncoding; }
    static void SetFallbackEncoding(wxFontEncoding enc);
    static void DisableFallbackEncoding()
    {
        SetFallbackEncoding(wxFONTENCODING_MAX);
    }


    // override the base class virtual function(s) to use our m_conv
    virtual size_t ToWChar(wchar_t *dst, size_t dstLen,
                           const char *src, size_t srcLen = wxNO_LEN) const;

    virtual size_t FromWChar(char *dst, size_t dstLen,
                             const wchar_t *src, size_t srcLen = wxNO_LEN) const;

    // return the length of the trailing NUL of the conversion really used
    //
    // m_conv is NULL until the first call to ToWChar() or FromWChar(), so it
    // can't be dereferenced unconditionally: while the real conversion is
    // still unknown, fall back to the base class implementation instead of
    // crashing
    virtual size_t GetMBNulLen() const
    {
        return m_conv ? m_conv->GetMBNulLen() : wxMBConv::GetMBNulLen();
    }

    // the clone is created using the copy ctor and so starts without any
    // conversion object, just as a newly created wxConvAuto
    virtual wxMBConv *Clone() const { return new wxConvAuto(*this); }

    // return the BOM type of this buffer
    static wxBOM DetectBOM(const char *src, size_t srcLen);

    // return the characters composing the given BOM.
    //
    // NOTE(review): count presumably receives the number of characters
    // returned -- confirm against the implementation
    static const char* GetBOMChars(wxBOM bomType, size_t* count);

    // return the BOM type stored in this object, this is wxBOM_Unknown after
    // construction
    wxBOM GetBOM() const
    {
        return m_bomType;
    }

private:
    // common part of all ctors
    void Init()
    {
        // We don't initialize m_encDefault here as different ctors do it
        // differently.
        m_conv = NULL;
        m_bomType = wxBOM_Unknown;
        m_ownsConv = false;
        m_consumedBOM = false;
    }

    // initialize m_conv with the UTF-8 conversion
    //
    // wxConvUTF8 is an existing global object and not something allocated
    // here, hence m_ownsConv is reset to prevent the dtor from deleting it
    void InitWithUTF8()
    {
        m_conv = &wxConvUTF8;
        m_ownsConv = false;
    }

    // create the correct conversion object for the given BOM type
    void InitFromBOM(wxBOM bomType);

    // create the correct conversion object for the BOM present in the
    // beginning of the buffer
    //
    // return false if the buffer is too short to allow us to determine if we
    // have BOM or not
    bool InitFromInput(const char *src, size_t len);

    // adjust src and len to skip over the BOM (identified by m_bomType) at the
    // start of the buffer
    void SkipBOM(const char **src, size_t *len) const;


    // fall-back multibyte encoding to use, may be wxFONTENCODING_SYSTEM or
    // wxFONTENCODING_MAX but not wxFONTENCODING_DEFAULT
    static wxFontEncoding ms_defaultMBEncoding;

    // conversion object which we really use, NULL until the first call to
    // either ToWChar() or FromWChar()
    wxMBConv *m_conv;

    // the multibyte encoding to use by default if input isn't Unicode
    wxFontEncoding m_encDefault;

    // our BOM type
    wxBOM m_bomType;

    // true if we allocated m_conv ourselves, false if we just use an existing
    // global conversion
    bool m_ownsConv;

    // true if we already skipped BOM when converting (and not just calculating
    // the size)
    bool m_consumedBOM;


    wxDECLARE_NO_ASSIGN_CLASS(wxConvAuto);
};
|
|
|
|
|
|
|
|
#endif // _WX_CONVAUTO_H_
|
|
|
|
|