/* Copyright 2015-2017 Amebis This file is part of ZRCola. ZRCola is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. ZRCola is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with ZRCola. If not, see . */ #pragma once #include "common.h" #include #include #include #include #include #pragma warning(push) #pragma warning(disable: 4200) #pragma warning(disable: 4251) #pragma warning(disable: 4512) namespace ZRCola { /// /// Language Character Database /// class ZRCOLA_API langchar_db { public: #pragma pack(push) #pragma pack(2) /// /// Character data /// struct langchar { public: langid_t lang; ///< Language ID protected: unsigned __int16 chr_to; ///< Character end in \c data wchar_t data[]; ///< Character private: inline langchar(_In_ const langchar &other); inline langchar& operator=(_In_ const langchar &other); public: /// /// Constructs the language character /// /// \param[in] lang Character language /// \param[in] chr Character /// \param[in] chr_len Number of UTF-16 characters in \p chr /// inline langchar( _In_opt_ langid_t lang = langid_t::blank, _In_opt_z_count_(chr_len) const wchar_t *chr = NULL, _In_opt_ size_t chr_len = 0) { this->lang = lang; this->chr_to = static_cast(chr_len); if (chr_len) memcpy(this->data, chr, sizeof(wchar_t)*chr_len); } inline const wchar_t* chr () const { return data; }; inline wchar_t* chr () { return data; }; inline const wchar_t* chr_end() const { return data + chr_to; }; inline wchar_t* chr_end() { return data + chr_to; }; inline unsigned __int16 chr_len() const { return chr_to; }; }; #pragma pack(pop) /// /// Character index /// class indexChr : public index { public: /// /// Constructs the index /// /// \param[in] h Reference to vector holding the data /// indexChr(_In_ std::vector &h) : index(h) {} /// /// Compares two characters by ID (for searching) /// /// \param[in] a Pointer to first element /// \param[in] b Pointer to second element /// /// \returns /// - <0 when a < b /// - =0 when a == b /// - >0 when a > b /// virtual int compare(_In_ const langchar &a, _In_ const langchar &b) const { int r = ZRCola::CompareString(a.chr(), a.chr_len(), b.chr(), b.chr_len()); if (r != 0) return r; if (a.lang < b.lang) return -1; else if (a.lang > b.lang) return 1; return 0; } } idxChr; ///< Character index #ifdef ZRCOLA_LANGCHAR_LANG_IDX /// /// Language Index /// class indexLang : public index { public: /// /// Constructs the index /// /// \param[in] h Reference to vector holding the data /// indexLang(_In_ std::vector &h) : index(h) {} /// /// Compares two languages by ID (for searching) /// /// \param[in] a Pointer to first element /// \param[in] b Pointer to second element /// /// \returns /// - <0 when a < b /// - =0 when a == b /// - >0 when a > b /// virtual int compare(_In_ const langchar &a, _In_ const langchar &b) const { if (a.lang < b.lang) return -1; else if (a.lang > b.lang) return 1; int r = ZRCola::CompareString(a.chr, a.chr_len(), b.chr(), b.chr_len()); if (r != 0) return r; return 0; } } idxLang; ///< Language index #endif std::vector data; ///< Character data public: /// /// Constructs the database /// inline langchar_db() : idxChr(data) #ifdef ZRCOLA_LANGCHAR_LANG_IDX , idxLang(data) #endif {} /// /// Clears the database /// inline void clear() { idxChr .clear(); #ifdef ZRCOLA_LANGCHAR_LANG_IDX idxLang.clear(); #endif data .clear(); } /// /// Tests presence of character in the given language /// /// \param[in] chr Pointer to character /// \param[in] chr_end Pointer to character end /// \param[in] lang Language /// /// \returns /// - \c true when character is used in language /// - \c false otherwise bool IsLocalCharacter(_In_ const wchar_t *chr, _In_ const wchar_t *chr_end, _In_ langid_t lang) const; }; typedef ZRCOLA_API stdex::idrec::record langchar_rec; /// /// Language database /// class ZRCOLA_API language_db { public: #pragma pack(push) #pragma pack(2) /// /// Language data /// struct language { public: langid_t lang; ///< Language ID protected: unsigned __int16 name_to; ///< Language name end in \c data wchar_t data[]; ///< Language name private: inline language(_In_ const language &other); inline language& operator=(_In_ const language &other); public: /// /// Constructs the language /// /// \param[in] lang Language ID /// \param[in] name Language name /// \param[in] name_len Number of UTF-16 characters in \p name /// inline language( _In_opt_ langid_t lang = langid_t::blank, _In_opt_z_count_(name_len) const wchar_t *name = NULL, _In_opt_ size_t name_len = 0) { this->lang = lang; this->name_to = static_cast(name_len); if (name_len) memcpy(this->data, name, sizeof(wchar_t)*name_len); } inline const wchar_t* name () const { return data; }; inline wchar_t* name () { return data; }; inline const wchar_t* name_end() const { return data + name_to; }; inline wchar_t* name_end() { return data + name_to; }; inline unsigned __int16 name_len() const { return name_to; }; }; #pragma pack(pop) /// /// Language index /// class indexLang : public index { public: /// /// Constructs the index /// /// \param[in] h Reference to vector holding the data /// indexLang(_In_ std::vector &h) : index(h) {} /// /// Compares two languages by ID (for searching) /// /// \param[in] a Pointer to first element /// \param[in] b Pointer to second element /// /// \returns /// - <0 when a < b /// - =0 when a == b /// - >0 when a > b /// virtual int compare(_In_ const language &a, _In_ const language &b) const { if (a.lang < b.lang) return -1; else if (a.lang > b.lang) return 1; return 0; } } idxLang; ///< Language index std::vector data; ///< Language data public: /// /// Constructs the database /// inline language_db() : idxLang(data) {} /// /// Clears the database /// inline void clear() { idxLang.clear(); data .clear(); } }; typedef ZRCOLA_API stdex::idrec::record language_rec; }; const ZRCola::recordid_t ZRCola::langchar_rec::id = *(ZRCola::recordid_t*)"L-C"; const ZRCola::recordid_t ZRCola::language_rec::id = *(ZRCola::recordid_t*)"LNG"; /// /// Writes language character database to a stream /// /// \param[in] stream Output stream /// \param[in] db Language character database /// /// \returns The stream \p stream /// inline std::ostream& operator <<(_In_ std::ostream& stream, _In_ const ZRCola::langchar_db &db) { // Write character index. if (stream.fail()) return stream; stream << db.idxChr; #ifdef ZRCOLA_LANGCHAR_LANG_IDX // Write language index. if (stream.fail()) return stream; stream << db.idxLang; #endif // Write data count. auto data_count = db.data.size(); #if defined(_WIN64) || defined(__x86_64__) || defined(__ppc64__) // 4G check if (data_count > 0xffffffff) { stream.setstate(std::ios_base::failbit); return stream; } #endif if (stream.fail()) return stream; unsigned __int32 count = (unsigned __int32)data_count; stream.write((const char*)&count, sizeof(count)); // Write data. if (stream.fail()) return stream; stream.write((const char*)db.data.data(), sizeof(unsigned __int16)*count); return stream; } /// /// Reads language character database from a stream /// /// \param[in ] stream Input stream /// \param[out] db Language character database /// /// \returns The stream \p stream /// inline std::istream& operator >>(_In_ std::istream& stream, _Out_ ZRCola::langchar_db &db) { // Read character index. stream >> db.idxChr; if (!stream.good()) return stream; #ifdef ZRCOLA_LANGCHAR_LANG_IDX // Read language index. stream >> db.idxLang; if (!stream.good()) return stream; #endif // Read data count. unsigned __int32 count; stream.read((char*)&count, sizeof(count)); if (!stream.good()) return stream; if (count) { // Read data. db.data.resize(count); stream.read((char*)db.data.data(), sizeof(unsigned __int16)*count); } else db.data.clear(); return stream; } /// /// Writes language database to a stream /// /// \param[in] stream Output stream /// \param[in] db Language database /// /// \returns The stream \p stream /// inline std::ostream& operator <<(_In_ std::ostream& stream, _In_ const ZRCola::language_db &db) { // Write language index. if (stream.fail()) return stream; stream << db.idxLang; // Write data count. auto data_count = db.data.size(); #if defined(_WIN64) || defined(__x86_64__) || defined(__ppc64__) // 4G check if (data_count > 0xffffffff) { stream.setstate(std::ios_base::failbit); return stream; } #endif if (stream.fail()) return stream; unsigned __int32 count = (unsigned __int32)data_count; stream.write((const char*)&count, sizeof(count)); // Write data. if (stream.fail()) return stream; stream.write((const char*)db.data.data(), sizeof(unsigned __int16)*count); return stream; } /// /// Reads language database from a stream /// /// \param[in ] stream Input stream /// \param[out] db Language database /// /// \returns The stream \p stream /// inline std::istream& operator >>(_In_ std::istream& stream, _Out_ ZRCola::language_db &db) { // Read language index. stream >> db.idxLang; if (!stream.good()) return stream; // Read data count. unsigned __int32 count; stream.read((char*)&count, sizeof(count)); if (!stream.good()) return stream; if (count) { // Read data. db.data.resize(count); stream.read((char*)db.data.data(), sizeof(unsigned __int16)*count); } else db.data.clear(); return stream; } #pragma warning(pop)