On platforms using UTF-16 for wchar_t, we can neither read nor write Unicode data one wchar_t at a time, because a single half of a surrogate pair can't be converted to or from the encoding of the stream. To fix this, wxTextInputStream::NextChar() may need to store the last wchar_t that was already read from the stream but not yet returned, and wxTextOutputStream::PutChar() may need to store, without writing it, the wchar_t passed to it until the second half of the surrogate pair is written. See #17070.
193 lines
6.1 KiB
C++
193 lines
6.1 KiB
C++
/////////////////////////////////////////////////////////////////////////////
// Name: wx/txtstrm.h
// Purpose: Text stream classes
// Author: Guilhem Lavaux
// Modified by:
// Created: 28/06/1998
// Copyright: (c) Guilhem Lavaux
// Licence: wxWindows licence
/////////////////////////////////////////////////////////////////////////////

#ifndef _WX_TXTSTREAM_H_
#define _WX_TXTSTREAM_H_

#include "wx/stream.h"
#include "wx/convauto.h"

#if wxUSE_STREAMS

class WXDLLIMPEXP_FWD_BASE wxTextInputStream;
class WXDLLIMPEXP_FWD_BASE wxTextOutputStream;

// Signatures of text stream manipulators: a function taking a text stream by
// reference and returning a reference to a text stream. The stream classes
// declare operator>> / operator<< overloads accepting these pointers and
// simply call the function with the stream itself.
//
// NOTE(review): identifiers containing a double underscore are reserved for
// the C++ implementation; the names are kept as they are because they are
// part of the existing public interface.
typedef wxTextInputStream& (*__wxTextInputManip)(wxTextInputStream&);
typedef wxTextOutputStream& (*__wxTextOutputManip)(wxTextOutputStream&);

// Function with the __wxTextOutputManip signature, so it can be used as
// "stream << endl".
// NOTE(review): presumably writes an end-of-line sequence to the stream; the
// definition is not part of this header -- confirm against the implementation.
WXDLLIMPEXP_BASE wxTextOutputStream &endl( wxTextOutputStream &stream );

#define wxEOT wxT('\4') // the End-Of-Text control code (used only inside wxTextInputStream)

// If you're scanning through a file using wxTextInputStream, you should check for EOF _before_
|
|
// reading the next item (word / number), because otherwise the last item may get lost.
|
|
// You should however be prepared to receive an empty item (empty string / zero number) at the
|
|
// end of file, especially on Windows systems. This is unavoidable because most (but not all) files end
|
|
// with whitespace (i.e. usually a newline).
|
|
class WXDLLIMPEXP_BASE wxTextInputStream
|
|
{
|
|
public:
|
|
#if wxUSE_UNICODE
|
|
wxTextInputStream(wxInputStream& s,
|
|
const wxString &sep=wxT(" \t"),
|
|
const wxMBConv& conv = wxConvAuto());
|
|
#else
|
|
wxTextInputStream(wxInputStream& s, const wxString &sep=wxT(" \t"));
|
|
#endif
|
|
~wxTextInputStream();
|
|
|
|
const wxInputStream& GetInputStream() const { return m_input; }
|
|
|
|
// base may be between 2 and 36, inclusive, or the special 0 (= C format)
|
|
wxUint64 Read64(int base = 10);
|
|
wxUint32 Read32(int base = 10);
|
|
wxUint16 Read16(int base = 10);
|
|
wxUint8 Read8(int base = 10);
|
|
wxInt64 Read64S(int base = 10);
|
|
wxInt32 Read32S(int base = 10);
|
|
wxInt16 Read16S(int base = 10);
|
|
wxInt8 Read8S(int base = 10);
|
|
double ReadDouble();
|
|
wxString ReadLine();
|
|
wxString ReadWord();
|
|
wxChar GetChar() { wxChar c = NextChar(); return (wxChar)(c != wxEOT ? c : 0); }
|
|
|
|
wxString GetStringSeparators() const { return m_separators; }
|
|
void SetStringSeparators(const wxString &c) { m_separators = c; }
|
|
|
|
// Operators
|
|
wxTextInputStream& operator>>(wxString& word);
|
|
wxTextInputStream& operator>>(char& c);
|
|
#if wxUSE_UNICODE && wxWCHAR_T_IS_REAL_TYPE
|
|
wxTextInputStream& operator>>(wchar_t& wc);
|
|
#endif // wxUSE_UNICODE
|
|
wxTextInputStream& operator>>(wxInt16& i);
|
|
wxTextInputStream& operator>>(wxInt32& i);
|
|
wxTextInputStream& operator>>(wxInt64& i);
|
|
wxTextInputStream& operator>>(wxUint16& i);
|
|
wxTextInputStream& operator>>(wxUint32& i);
|
|
wxTextInputStream& operator>>(wxUint64& i);
|
|
wxTextInputStream& operator>>(double& i);
|
|
wxTextInputStream& operator>>(float& f);
|
|
|
|
wxTextInputStream& operator>>( __wxTextInputManip func) { return func(*this); }
|
|
|
|
protected:
|
|
wxInputStream &m_input;
|
|
wxString m_separators;
|
|
char m_lastBytes[10]; // stores the bytes that were read for the last character
|
|
|
|
#if wxUSE_UNICODE
|
|
wxMBConv *m_conv;
|
|
|
|
// The second half of a surrogate character when using UTF-16 for wchar_t:
|
|
// we can't return it immediately from GetChar() when we read a Unicode
|
|
// code point outside of the BMP, but we can't keep it in m_lastBytes
|
|
// neither because it can't separately decoded, so we have a separate 1
|
|
// wchar_t buffer just for this case.
|
|
#if SIZEOF_WCHAR_T == 2
|
|
wchar_t m_lastWChar;
|
|
#endif // SIZEOF_WCHAR_T == 2
|
|
#endif // wxUSE_UNICODE
|
|
|
|
bool EatEOL(const wxChar &c);
|
|
void UngetLast(); // should be used instead of wxInputStream::Ungetch() because of Unicode issues
|
|
// returns EOT (\4) if there is a stream error, or end of file
|
|
wxChar NextChar(); // this should be used instead of GetC() because of Unicode issues
|
|
wxChar NextNonSeparators();
|
|
|
|
wxDECLARE_NO_COPY_CLASS(wxTextInputStream);
|
|
};
|
|
|
|
// End-of-line mode of wxTextOutputStream: accepted by its constructor and
// SetMode(), returned by GetMode(). wxEOL_NATIVE is the default used there.
// NOTE(review): the enumerator names suggest the platform default, "\n", "\r"
// and "\r\n" respectively -- confirm against the implementation.
//
// Declared as a named enum rather than the C-style "typedef enum { } wxEOL;";
// the type name and the enumerator values (0..3) are unchanged.
enum wxEOL
{
    wxEOL_NATIVE,
    wxEOL_UNIX,
    wxEOL_MAC,
    wxEOL_DOS
};

class WXDLLIMPEXP_BASE wxTextOutputStream
|
|
{
|
|
public:
|
|
#if wxUSE_UNICODE
|
|
wxTextOutputStream(wxOutputStream& s,
|
|
wxEOL mode = wxEOL_NATIVE,
|
|
const wxMBConv& conv = wxConvAuto());
|
|
#else
|
|
wxTextOutputStream(wxOutputStream& s, wxEOL mode = wxEOL_NATIVE);
|
|
#endif
|
|
virtual ~wxTextOutputStream();
|
|
|
|
const wxOutputStream& GetOutputStream() const { return m_output; }
|
|
|
|
void SetMode( wxEOL mode = wxEOL_NATIVE );
|
|
wxEOL GetMode() { return m_mode; }
|
|
|
|
template<typename T>
|
|
void Write(const T& i)
|
|
{
|
|
wxString str;
|
|
str << i;
|
|
|
|
WriteString(str);
|
|
}
|
|
|
|
void Write64(wxUint64 i);
|
|
void Write32(wxUint32 i);
|
|
void Write16(wxUint16 i);
|
|
void Write8(wxUint8 i);
|
|
virtual void WriteDouble(double d);
|
|
virtual void WriteString(const wxString& string);
|
|
|
|
wxTextOutputStream& PutChar(wxChar c);
|
|
|
|
void Flush();
|
|
|
|
wxTextOutputStream& operator<<(const wxString& string);
|
|
wxTextOutputStream& operator<<(char c);
|
|
#if wxUSE_UNICODE && wxWCHAR_T_IS_REAL_TYPE
|
|
wxTextOutputStream& operator<<(wchar_t wc);
|
|
#endif // wxUSE_UNICODE
|
|
wxTextOutputStream& operator<<(wxInt16 c);
|
|
wxTextOutputStream& operator<<(wxInt32 c);
|
|
wxTextOutputStream& operator<<(wxInt64 c);
|
|
wxTextOutputStream& operator<<(wxUint16 c);
|
|
wxTextOutputStream& operator<<(wxUint32 c);
|
|
wxTextOutputStream& operator<<(wxUint64 c);
|
|
wxTextOutputStream& operator<<(double f);
|
|
wxTextOutputStream& operator<<(float f);
|
|
|
|
wxTextOutputStream& operator<<( __wxTextOutputManip func) { return func(*this); }
|
|
|
|
protected:
|
|
wxOutputStream &m_output;
|
|
wxEOL m_mode;
|
|
|
|
#if wxUSE_UNICODE
|
|
wxMBConv *m_conv;
|
|
|
|
#if SIZEOF_WCHAR_T == 2
|
|
// The first half of a surrogate character if one was passed to PutChar()
|
|
// and couldn't be output when it was called the last time.
|
|
wchar_t m_lastWChar;
|
|
#endif // SIZEOF_WCHAR_T == 2
|
|
#endif // wxUSE_UNICODE
|
|
|
|
wxDECLARE_NO_COPY_CLASS(wxTextOutputStream);
|
|
};
|
|
|
|
#endif // wxUSE_STREAMS

#endif // _WX_TXTSTREAM_H_