On the platforms using UTF-16 for wchar_t we can't read nor write Unicode data one wchar_t at a time as a single half of a surrogate character can't be converted to or from the encoding of the stream. To fix this, we may need to store the last wchar_t already read from the stream but not returned yet in wxTextInputStream::NextChar() and store, without writing it, the wchar_t passed to wxTextOutputStream::PutChar() until the second half of the surrogate is written. See #17070.
		
			
				
	
	
		
			193 lines
		
	
	
		
			6.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			193 lines
		
	
	
		
			6.1 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /////////////////////////////////////////////////////////////////////////////
 | |
| // Name:        wx/txtstrm.h
 | |
| // Purpose:     Text stream classes
 | |
| // Author:      Guilhem Lavaux
 | |
| // Modified by:
 | |
| // Created:     28/06/1998
 | |
| // Copyright:   (c) Guilhem Lavaux
 | |
| // Licence:     wxWindows licence
 | |
| /////////////////////////////////////////////////////////////////////////////
 | |
| 
 | |
| #ifndef _WX_TXTSTREAM_H_
 | |
| #define _WX_TXTSTREAM_H_
 | |
| 
 | |
| #include "wx/stream.h"
 | |
| #include "wx/convauto.h"
 | |
| 
 | |
| #if wxUSE_STREAMS
 | |
| 
 | |
| class WXDLLIMPEXP_FWD_BASE wxTextInputStream;
 | |
| class WXDLLIMPEXP_FWD_BASE wxTextOutputStream;
 | |
| 
 | |
| typedef wxTextInputStream& (*__wxTextInputManip)(wxTextInputStream&);
 | |
| typedef wxTextOutputStream& (*__wxTextOutputManip)(wxTextOutputStream&);
 | |
| 
 | |
| WXDLLIMPEXP_BASE wxTextOutputStream &endl( wxTextOutputStream &stream );
 | |
| 
 | |
| 
 | |
| #define wxEOT wxT('\4') // the End-Of-Text control code (used only inside wxTextInputStream)
 | |
| 
 | |
| // If you're scanning through a file using wxTextInputStream, you should check for EOF _before_
 | |
| // reading the next item (word / number), because otherwise the last item may get lost.
 | |
| // You should however be prepared to receive an empty item (empty string / zero number) at the
 | |
| // end of file, especially on Windows systems. This is unavoidable because most (but not all) files end
 | |
| // with whitespace (i.e. usually a newline).
 | |
| class WXDLLIMPEXP_BASE wxTextInputStream
 | |
| {
 | |
| public:
 | |
| #if wxUSE_UNICODE
 | |
|     wxTextInputStream(wxInputStream& s,
 | |
|                       const wxString &sep=wxT(" \t"),
 | |
|                       const wxMBConv& conv = wxConvAuto());
 | |
| #else
 | |
|     wxTextInputStream(wxInputStream& s, const wxString &sep=wxT(" \t"));
 | |
| #endif
 | |
|     ~wxTextInputStream();
 | |
| 
 | |
|     const wxInputStream& GetInputStream() const { return m_input; }
 | |
| 
 | |
|     // base may be between 2 and 36, inclusive, or the special 0 (= C format)
 | |
|     wxUint64 Read64(int base = 10);
 | |
|     wxUint32 Read32(int base = 10);
 | |
|     wxUint16 Read16(int base = 10);
 | |
|     wxUint8  Read8(int base = 10);
 | |
|     wxInt64  Read64S(int base = 10);
 | |
|     wxInt32  Read32S(int base = 10);
 | |
|     wxInt16  Read16S(int base = 10);
 | |
|     wxInt8   Read8S(int base = 10);
 | |
|     double   ReadDouble();
 | |
|     wxString ReadLine();
 | |
|     wxString ReadWord();
 | |
|     wxChar   GetChar() { wxChar c = NextChar(); return (wxChar)(c != wxEOT ? c : 0); }
 | |
| 
 | |
|     wxString GetStringSeparators() const { return m_separators; }
 | |
|     void SetStringSeparators(const wxString &c) { m_separators = c; }
 | |
| 
 | |
|     // Operators
 | |
|     wxTextInputStream& operator>>(wxString& word);
 | |
|     wxTextInputStream& operator>>(char& c);
 | |
| #if wxUSE_UNICODE && wxWCHAR_T_IS_REAL_TYPE
 | |
|     wxTextInputStream& operator>>(wchar_t& wc);
 | |
| #endif // wxUSE_UNICODE
 | |
|     wxTextInputStream& operator>>(wxInt16& i);
 | |
|     wxTextInputStream& operator>>(wxInt32& i);
 | |
|     wxTextInputStream& operator>>(wxInt64& i);
 | |
|     wxTextInputStream& operator>>(wxUint16& i);
 | |
|     wxTextInputStream& operator>>(wxUint32& i);
 | |
|     wxTextInputStream& operator>>(wxUint64& i);
 | |
|     wxTextInputStream& operator>>(double& i);
 | |
|     wxTextInputStream& operator>>(float& f);
 | |
| 
 | |
|     wxTextInputStream& operator>>( __wxTextInputManip func) { return func(*this); }
 | |
| 
 | |
| protected:
 | |
|     wxInputStream &m_input;
 | |
|     wxString m_separators;
 | |
|     char m_lastBytes[10]; // stores the bytes that were read for the last character
 | |
| 
 | |
| #if wxUSE_UNICODE
 | |
|     wxMBConv *m_conv;
 | |
| 
 | |
|     // The second half of a surrogate character when using UTF-16 for wchar_t:
 | |
|     // we can't return it immediately from GetChar() when we read a Unicode
 | |
|     // code point outside of the BMP, but we can't keep it in m_lastBytes
 | |
|     // neither because it can't separately decoded, so we have a separate 1
 | |
|     // wchar_t buffer just for this case.
 | |
| #if SIZEOF_WCHAR_T == 2
 | |
|     wchar_t m_lastWChar;
 | |
| #endif // SIZEOF_WCHAR_T == 2
 | |
| #endif // wxUSE_UNICODE
 | |
| 
 | |
|     bool   EatEOL(const wxChar &c);
 | |
|     void   UngetLast(); // should be used instead of wxInputStream::Ungetch() because of Unicode issues
 | |
|     // returns EOT (\4) if there is a stream error, or end of file
 | |
|     wxChar NextChar();   // this should be used instead of GetC() because of Unicode issues
 | |
|     wxChar NextNonSeparators();
 | |
| 
 | |
|     wxDECLARE_NO_COPY_CLASS(wxTextInputStream);
 | |
| };
 | |
| 
 | |
| typedef enum
 | |
| {
 | |
|   wxEOL_NATIVE,
 | |
|   wxEOL_UNIX,
 | |
|   wxEOL_MAC,
 | |
|   wxEOL_DOS
 | |
| } wxEOL;
 | |
| 
 | |
| class WXDLLIMPEXP_BASE wxTextOutputStream
 | |
| {
 | |
| public:
 | |
| #if wxUSE_UNICODE
 | |
|     wxTextOutputStream(wxOutputStream& s,
 | |
|                        wxEOL mode = wxEOL_NATIVE,
 | |
|                        const wxMBConv& conv = wxConvAuto());
 | |
| #else
 | |
|     wxTextOutputStream(wxOutputStream& s, wxEOL mode = wxEOL_NATIVE);
 | |
| #endif
 | |
|     virtual ~wxTextOutputStream();
 | |
| 
 | |
|     const wxOutputStream& GetOutputStream() const { return m_output; }
 | |
| 
 | |
|     void SetMode( wxEOL mode = wxEOL_NATIVE );
 | |
|     wxEOL GetMode() { return m_mode; }
 | |
| 
 | |
|     template<typename T>
 | |
|     void Write(const T& i)
 | |
|     {
 | |
|         wxString str;
 | |
|         str << i;
 | |
| 
 | |
|         WriteString(str);
 | |
|     }
 | |
| 
 | |
|     void Write64(wxUint64 i);
 | |
|     void Write32(wxUint32 i);
 | |
|     void Write16(wxUint16 i);
 | |
|     void Write8(wxUint8 i);
 | |
|     virtual void WriteDouble(double d);
 | |
|     virtual void WriteString(const wxString& string);
 | |
| 
 | |
|     wxTextOutputStream& PutChar(wxChar c);
 | |
| 
 | |
|     void Flush();
 | |
| 
 | |
|     wxTextOutputStream& operator<<(const wxString& string);
 | |
|     wxTextOutputStream& operator<<(char c);
 | |
| #if wxUSE_UNICODE && wxWCHAR_T_IS_REAL_TYPE
 | |
|     wxTextOutputStream& operator<<(wchar_t wc);
 | |
| #endif // wxUSE_UNICODE
 | |
|     wxTextOutputStream& operator<<(wxInt16 c);
 | |
|     wxTextOutputStream& operator<<(wxInt32 c);
 | |
|     wxTextOutputStream& operator<<(wxInt64 c);
 | |
|     wxTextOutputStream& operator<<(wxUint16 c);
 | |
|     wxTextOutputStream& operator<<(wxUint32 c);
 | |
|     wxTextOutputStream& operator<<(wxUint64 c);
 | |
|     wxTextOutputStream& operator<<(double f);
 | |
|     wxTextOutputStream& operator<<(float f);
 | |
| 
 | |
|     wxTextOutputStream& operator<<( __wxTextOutputManip func) { return func(*this); }
 | |
| 
 | |
| protected:
 | |
|     wxOutputStream &m_output;
 | |
|     wxEOL           m_mode;
 | |
| 
 | |
| #if wxUSE_UNICODE
 | |
|     wxMBConv *m_conv;
 | |
| 
 | |
| #if SIZEOF_WCHAR_T == 2
 | |
|     // The first half of a surrogate character if one was passed to PutChar()
 | |
|     // and couldn't be output when it was called the last time.
 | |
|     wchar_t m_lastWChar;
 | |
| #endif // SIZEOF_WCHAR_T == 2
 | |
| #endif // wxUSE_UNICODE
 | |
| 
 | |
|     wxDECLARE_NO_COPY_CLASS(wxTextOutputStream);
 | |
| };
 | |
| 
 | |
| #endif
 | |
|   // wxUSE_STREAMS
 | |
| 
 | |
| #endif
 | |
|     // _WX_DATSTREAM_H_
 |