/*
    SPDX-License-Identifier: GPL-3.0-or-later
    Copyright © 2015-2022 Amebis
*/
|
|
|
|
#include "pch.h"
|
|
|
|
using namespace std;
|
|
using namespace stdex;
|
|
using namespace winstd;
|
|
|
|
|
|
///
/// Translation data holder: source sequence rank, destination character rank and normalization footprint
///
/// The class owns no raw resources, so copy/move construction and assignment
/// are intentionally left to the compiler (Rule of Zero). The implicitly
/// generated members copy/move all three fields member-wise.
///
class com_translation
{
public:
    short rank_src;     ///< Source sequence rank
    short rank_dst;     ///< Destination character rank
    std::string norm;   ///< Normalization footprint

    ///
    /// Constructs a translation with both ranks set to zero and an empty normalization footprint
    ///
    com_translation() :
        rank_src(0),
        rank_dst(0)
    {
    }

    ///
    /// Constructs a translation with the given ranks and an empty normalization footprint
    ///
    com_translation(short _rank_src, short _rank_dst) :
        rank_src(_rank_src),
        rank_dst(_rank_dst)
    {
    }

    ///
    /// Constructs a translation with the given ranks and a copy of the zero-terminated normalization footprint
    ///
    /// \param[in] _norm  Zero-terminated normalization footprint. Must not be a null pointer.
    ///
    com_translation(short _rank_src, short _rank_dst, const char *_norm) :
        rank_src(_rank_src),
        rank_dst(_rank_dst),
        norm    (_norm    )
    {
    }

    ///
    /// Constructs a translation with the given ranks, taking over the normalization footprint
    ///
    com_translation(short _rank_src, short _rank_dst, std::string &&_norm) :
        rank_src(_rank_src),
        rank_dst(_rank_dst),
        norm    (std::move(_norm))
    {
    }

    ///
    /// Two translations are equal when both ranks and the normalization footprint match
    ///
    bool operator==(const com_translation &other) const
    {
        return
            rank_src == other.rank_src &&
            rank_dst == other.rank_dst &&
            norm     == other.norm;
    }

    bool operator!=(const com_translation &other) const
    {
        return !(*this == other);
    }

    ///
    /// Lexicographical ordering by (rank_src, rank_dst, norm)
    ///
    bool operator<(const com_translation &other) const
    {
        if (rank_src != other.rank_src) return rank_src < other.rank_src;
        if (rank_dst != other.rank_dst) return rank_dst < other.rank_dst;
        return norm < other.norm;
    }

    bool operator<=(const com_translation &other) const
    {
        return !(other < *this);
    }

    bool operator>(const com_translation &other) const
    {
        return other < *this;
    }

    bool operator>=(const com_translation &other) const
    {
        return !(*this < other);
    }
};
|
|
|
|
|
|
/// Destination string => (source string => translation data) lookup
using translation_db = map<wstring, map<wstring, com_translation>>;

/// Normalization footprint => normalization permutation set lookup
using normperm_db = map<string, ZRCola::DBSource::normperm>;
|
|
|
|
|
|
// Forward declarations: the two functions below call each other recursively.

/// Inverse translates a zero-terminated string; `path` holds the characters currently being expanded.
static set<ZRCola::DBSource::charseq> translate_inv(
    _In_    const translation_db           &db_trans,
    _In_    const normperm_db              &db_np,
    _In_z_  const wchar_t                  *str,
    _Inout_ set<translation_db::key_type>  &path);

/// Inverse translates a zero-terminated string and its permutations registered under `norm`.
static inline set<ZRCola::DBSource::charseq> permutate_and_translate_inv(
    _In_    const translation_db           &db_trans,
    _In_    const normperm_db              &db_np,
    _In_z_  const wchar_t                  *str,
    _In_z_  const char                     *norm,
    _Inout_ set<translation_db::key_type>  &path);
|
|
|
|
|
|
///
/// Inverse translates a string down to non-inverse translatable characters
///
/// \param[in]     db_trans  Translation database (destination => sources)
/// \param[in]     db_np     Normalization permutation database
/// \param[in]     str       Zero-terminated string to inverse translate
/// \param[in,out] path      Characters currently being expanded; used to detect cycles
///
/// \returns Set of (rank, string) candidates. An empty set signals that a cycle was detected.
///
static set<ZRCola::DBSource::charseq> translate_inv(_In_ const translation_db &db_trans, _In_ const normperm_db &db_np, _In_z_ const wchar_t *str, _Inout_ set<translation_db::key_type> &path)
{
    typedef ZRCola::DBSource::charseq charseq;

    set<charseq> result;

    if (*str == 0) {
        // End of string: the only inverse translation is the empty one.
        result.insert(charseq(0, L""));
        return result;
    }

    // Resolve everything after the leading character first.
    const auto tails = translate_inv(db_trans, db_np, str + 1, path);
    if (tails.empty())
        return result;

    const translation_db::key_type head(1, *str);

    // Keeps the leading character as-is and prepends it to every tail.
    const auto keep_head = [&]() {
        for (const auto &tail : tails)
            result.insert(charseq(tail.rank, head + tail.str));
    };

    const auto entry = db_trans.find(head);
    if (entry == db_trans.end()) {
        // Leading character is not inverse translatable.
        keep_head();
        return result;
    }

    // Register the leading character on the path before expanding it.
    const auto visited = path.insert(head);
    if (!visited.second) {
        // The character is already being expanded further up: cycle.
        return result;
    }

    // Combine every inverse translation of the leading character with every tail.
    for (const auto &alt : entry->second) {
        const auto heads = alt.second.norm.empty() ?
            translate_inv(db_trans, db_np, alt.first.c_str(), path) :
            permutate_and_translate_inv(db_trans, db_np, alt.first.c_str(), alt.second.norm.c_str(), path);

        if (heads.empty()) {
            // Expanding this alternative ran into a cycle: leave the character untranslated.
            keep_head();
            continue;
        }

        for (const auto &h : heads) {
            for (const auto &tail : tails)
                result.insert(charseq(alt.second.rank_src + h.rank + tail.rank, h.str + tail.str));
        }
    }

    // Done expanding the leading character.
    path.erase(visited.first);

    return result;
}
|
|
|
|
|
|
///
/// Inverse translates a string and all its permutations registered for the given normalization footprint
///
/// \param[in]     db_trans  Translation database (destination => sources)
/// \param[in]     db_np     Normalization permutation database
/// \param[in]     str       Zero-terminated string to inverse translate
/// \param[in]     norm      Zero-terminated normalization footprint to look up in `db_np`
/// \param[in,out] path      Characters currently being expanded; used to detect cycles
///
/// \returns Results for `str` itself, plus results for every permutation with their rank increased by one
///
static inline set<ZRCola::DBSource::charseq> permutate_and_translate_inv(_In_ const translation_db &db_trans, _In_ const normperm_db &db_np, _In_z_ const wchar_t *str, _In_z_ const char *norm, _Inout_ set<translation_db::key_type> &path)
{
    // The string in its original order is the primary permutation.
    auto result = translate_inv(db_trans, db_np, str, path);

    const auto entry = db_np.find(norm);
    if (entry == db_np.end())
        return result;

    // Secondary permutations.
    for (const auto &order : entry->second) {
        // Reassemble the string in the permutated order.
        // NOTE(review): indices are used unchecked; presumably each one is within `str` - confirm against the database loader.
        translation_db::mapped_type::key_type shuffled;
        for (const auto &pos : order)
            shuffled += str[pos];

        // Secondary permutations rank one below the primary one.
        const auto alternatives = translate_inv(db_trans, db_np, shuffled.c_str(), path);
        for (const auto &seq : alternatives)
            result.insert(ZRCola::DBSource::charseq(seq.rank + 1, seq.str));
    }

    return result;
}
|
|
|
|
|
|
///
|
|
/// Main function
|
|
///
|
|
int _tmain(int argc, _TCHAR *argv[])
|
|
{
|
|
wxApp::CheckBuildOptions(WX_BUILD_OPTIONS_SIGNATURE, "program");
|
|
|
|
// Initialize wxWidgets.
|
|
wxInitializer initializer;
|
|
if (!initializer) {
|
|
_ftprintf(stderr, wxT("Failed to initialize the wxWidgets library, aborting.\n"));
|
|
return -1;
|
|
}
|
|
|
|
// Initialize configuration.
|
|
wxConfigBase *cfgPrev = wxConfigBase::Set(new wxConfig(wxT(PRODUCT_CFG_APPLICATION), wxT(PRODUCT_CFG_VENDOR)));
|
|
if (cfgPrev) wxDELETE(cfgPrev);
|
|
|
|
// Initialize locale.
|
|
wxLocale locale;
|
|
if (wxInitializeLocale(locale))
|
|
wxVERIFY(locale.AddCatalog(wxT("ZRColaCompile")));
|
|
|
|
// Parse command line.
|
|
static const wxCmdLineEntryDesc cmdLineDesc[] =
|
|
{
|
|
{ wxCMD_LINE_SWITCH, "h" , "help" , _("Show this help message"), wxCMD_LINE_VAL_NONE , wxCMD_LINE_OPTION_HELP },
|
|
{ wxCMD_LINE_PARAM , NULL, NULL , _("<Input file>" ), wxCMD_LINE_VAL_STRING, wxCMD_LINE_OPTION_MANDATORY },
|
|
{ wxCMD_LINE_PARAM , NULL, NULL , _("<Output file>" ), wxCMD_LINE_VAL_STRING, wxCMD_LINE_OPTION_MANDATORY },
|
|
{ wxCMD_LINE_OPTION, NULL, "pot-cat", _("Output POT catalog" ), wxCMD_LINE_VAL_STRING, wxCMD_LINE_PARAM_OPTIONAL },
|
|
|
|
{ wxCMD_LINE_NONE }
|
|
};
|
|
wxCmdLineParser parser(cmdLineDesc, argc, argv);
|
|
switch (parser.Parse()) {
|
|
case -1:
|
|
// Help was given, terminating.
|
|
return 0;
|
|
|
|
case 0:
|
|
// everything is ok; proceed
|
|
break;
|
|
|
|
default:
|
|
wxLogMessage(wxT("Syntax error detected, aborting."));
|
|
return -1;
|
|
}
|
|
|
|
// Initialize COM (CoInitialize).
|
|
wxCoInitializer initializerOLE(COINIT_MULTITHREADED | COINIT_SPEED_OVER_MEMORY);
|
|
if (!initializerOLE) {
|
|
_ftprintf(stderr, wxT("Error initializing COM.\n"));
|
|
return -1;
|
|
}
|
|
|
|
ZRCola::DBSource src;
|
|
const wxString& filenameIn = parser.GetParam(0);
|
|
if (!src.Open(filenameIn)) {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0001: Error opening input file.\n"), filenameIn.fn_str());
|
|
return 1;
|
|
}
|
|
|
|
const wxString& filenameOut = parser.GetParam(1);
|
|
fstream dst((LPCTSTR)filenameOut, ios_base::out | ios_base::trunc | ios_base::binary);
|
|
if (dst.fail()) {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0002: Error opening output file.\n"), filenameOut.fn_str());
|
|
return 1;
|
|
}
|
|
|
|
bool has_errors = false;
|
|
|
|
// Set of strings to translate.
|
|
wxString filenamePot;
|
|
bool build_pot = parser.Found("pot-cat", &filenamePot);
|
|
set<wstring> pot;
|
|
|
|
// Open file ID.
|
|
streamoff dst_start = idrec::open<ZRCola::recordid_t, ZRCola::recordsize_t>(dst, ZRCOLA_DB_ID);
|
|
|
|
ZRCola::translation_db db_trans;
|
|
ZRCola::transet_db db_transset;
|
|
normperm_db db_np;
|
|
|
|
{
|
|
// Get normalization permutation sets.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectNormPermSets(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
string norm;
|
|
ZRCola::DBSource::normperm np;
|
|
|
|
// Parse normalization permutation sets.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read normalization permutation set from the database.
|
|
if (src.GetNormPerm(rs, norm, np)) {
|
|
if (!np.empty())
|
|
db_np.insert(pair<string, ZRCola::DBSource::normperm>(norm, std::move(np)));
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0009: Error getting translation set count from database or too many translation sets.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0008: Error getting translation sets from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get translations.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectTranslations(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
// Parse translations and build temporary database.
|
|
translation_db db_temp1;
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read translation from the database.
|
|
ZRCola::DBSource::translation trans;
|
|
if (src.GetTranslation(rs, trans)) {
|
|
// Add translation to temporary database.
|
|
pair<translation_db::mapped_type::key_type, translation_db::mapped_type::mapped_type> ctp(std::move(trans.src.str), translation_db::mapped_type::mapped_type(trans.src.rank, trans.dst.rank, std::move(trans.norm)));
|
|
auto hit = db_temp1.find(trans.dst.str);
|
|
if (hit != db_temp1.end())
|
|
hit->second.insert(std::move(ctp));
|
|
else {
|
|
translation_db::mapped_type t;
|
|
t.insert(std::move(ctp));
|
|
db_temp1.insert(pair<translation_db::key_type, translation_db::mapped_type>(std::move(trans.dst.str), std::move(t)));
|
|
}
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Inverse translate source sequences down to non-inverse translatable characters.
|
|
translation_db db_temp2;
|
|
for (auto t1 = db_temp1.cbegin(), t1_end = db_temp1.cend(); t1 != t1_end; ++t1) {
|
|
auto t2 = db_temp2.insert(pair<translation_db::key_type, translation_db::mapped_type>(t1->first, translation_db::mapped_type())).first;
|
|
|
|
for (auto d1 = t1->second.cbegin(), d1_end = t1->second.cend(); d1 != d1_end; ++d1) {
|
|
set<translation_db::key_type> path;
|
|
path.insert(t1->first);
|
|
auto res = d1->second.norm.empty() ?
|
|
translate_inv(db_temp1, db_np, d1->first.c_str(), path) :
|
|
permutate_and_translate_inv(db_temp1, db_np, d1->first.c_str(), d1->second.norm.c_str(), path);
|
|
assert(!res.empty());
|
|
|
|
// Add translation to temporary database.
|
|
for (auto r = res.cbegin(), r_end = res.cend(); r != r_end; ++r) {
|
|
translation_db::mapped_type::mapped_type ct(d1->second.rank_src + r->rank, d1->second.rank_dst);
|
|
auto hit = t2->second.find(r->str);
|
|
if (hit != t2->second.end()) {
|
|
hit->second.rank_src = std::min<short>(hit->second.rank_src, ct.rank_src);
|
|
hit->second.rank_dst = std::max<short>(hit->second.rank_dst, ct.rank_dst);
|
|
} else
|
|
t2->second.insert(pair<translation_db::mapped_type::key_type, translation_db::mapped_type::mapped_type>(r->str, std::move(ct)));
|
|
}
|
|
}
|
|
}
|
|
|
|
// Preallocate memory.
|
|
db_trans.idxSrc.reserve(count*2);
|
|
db_trans.idxDst.reserve(count*2);
|
|
db_trans.data .reserve(count*2*8);
|
|
|
|
// Parse translations and build index and data.
|
|
ZRCola::DBSource::translation trans;
|
|
for (auto t = db_temp2.cbegin(), t_end = db_temp2.cend(); t != t_end; ++t) {
|
|
// Add translation to index and data.
|
|
trans.dst.str = t->first;
|
|
for (auto d = t->second.cbegin(), d_end = t->second.cend(); d != d_end; ++d) {
|
|
trans.set = (short)ZRCOLA_TRANSETID_DEFAULT;
|
|
trans.dst.rank = d->second.rank_dst;
|
|
trans.src.rank = d->second.rank_src;
|
|
trans.src.str = d->first;
|
|
db_trans << trans;
|
|
|
|
// If destination contains no PUA characters, add it to the ZRCola » Unicode transliteration too.
|
|
bool has_pua = false;
|
|
for (auto ch = trans.dst.str.cbegin(), ch_end = trans.dst.str.cend(); ch != ch_end; ++ch)
|
|
if (ZRCola::ispua(*ch)) {
|
|
has_pua = true;
|
|
break;
|
|
}
|
|
if (!has_pua) {
|
|
trans.set = (short)ZRCOLA_TRANSETID_UNICODE;
|
|
trans.dst.rank += 50;
|
|
db_trans << trans;
|
|
}
|
|
}
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0004: Error getting translation count from database or too many translations.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0003: Error getting translations from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
com_obj<ADORecordset> rs_tran;
|
|
if (src.SelectTranslations(static_cast<short>(ZRCOLA_TRANSETID_UNICODE), rs_tran)) {
|
|
size_t count = src.GetRecordsetCount(rs_tran);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
// Preallocate memory.
|
|
db_trans.idxSrc.reserve(db_trans.idxSrc.size() + count);
|
|
db_trans.idxDst.reserve(db_trans.idxDst.size() + count);
|
|
db_trans.data .reserve(db_trans.data.size() + count*8);
|
|
|
|
// Parse translations and build temporary database.
|
|
ZRCola::DBSource::translation trans;
|
|
trans.set = (short)ZRCOLA_TRANSETID_UNICODE;
|
|
for (; !ZRCola::DBSource::IsEOF(rs_tran); rs_tran->MoveNext()) {
|
|
// Read translation from the database.
|
|
if (src.GetTranslation(rs_tran, trans)) {
|
|
// Add translation to index and data.
|
|
db_trans << trans;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0004: Error getting Unicode translation count from database or too many translations.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0003: Error getting Unicode translations from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get translation sets.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectTranlationSets(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
// Preallocate memory.
|
|
db_transset.idxTranSet.reserve((count+1));
|
|
db_transset.data .reserve((count+1)*4);
|
|
|
|
// Parse translation sets and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read translation set from the database.
|
|
ZRCola::DBSource::transet ts;
|
|
if (src.GetTranslationSet(rs, ts)) {
|
|
if (ts.set <= (short)ZRCOLA_TRANSETID_DEFAULT || (short)ZRCOLA_TRANSETID_UNICODE <= ts.set)
|
|
continue;
|
|
|
|
if (build_pot) {
|
|
pot.insert(ts.src);
|
|
pot.insert(ts.dst);
|
|
}
|
|
|
|
// Add translation set to index and data.
|
|
db_transset << ts;
|
|
|
|
// Get translations.
|
|
com_obj<ADORecordset> rs_tran;
|
|
if (src.SelectTranslations(ts.set, rs_tran)) {
|
|
count = src.GetRecordsetCount(rs_tran);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
// Preallocate memory.
|
|
db_trans.idxSrc.reserve(db_trans.idxSrc.size() + count);
|
|
db_trans.idxDst.reserve(db_trans.idxDst.size() + count);
|
|
db_trans.data .reserve(db_trans.data.size() + count*8);
|
|
|
|
// Parse translations and build temporary database.
|
|
ZRCola::DBSource::translation trans;
|
|
trans.set = ts.set;
|
|
for (; !ZRCola::DBSource::IsEOF(rs_tran); rs_tran->MoveNext()) {
|
|
// Read translation from the database.
|
|
if (src.GetTranslation(rs_tran, trans)) {
|
|
// Add translation to index and data.
|
|
db_trans << trans;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0004: Error getting translation count from database or too many translations.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0003: Error getting translations from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0009: Error getting translation set count from database or too many translation sets.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0008: Error getting translation sets from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
// Write translation sets to file.
|
|
db_transset.idxTranSet.sort();
|
|
dst << ZRCola::transet_rec(db_transset);
|
|
|
|
// Write translations to file.
|
|
db_trans.idxSrc.sort();
|
|
db_trans.idxDst.sort();
|
|
dst << ZRCola::translation_rec(db_trans);
|
|
|
|
{
|
|
// Get translation sequences.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectTranlationSeqs(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::transeq_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxTranSeq.reserve((count+1));
|
|
db.idxRank .reserve((count+1));
|
|
db.data .reserve((count+1)*4);
|
|
|
|
// Parse translation sequences and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read translation sequence from the database.
|
|
ZRCola::DBSource::transeq ts;
|
|
if (src.GetTranslationSeq(rs, ts)) {
|
|
if (build_pot)
|
|
pot.insert(ts.name);
|
|
|
|
// Add translation sequence to index and data.
|
|
db << ts;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write translation sequences to file.
|
|
db.idxTranSeq.sort();
|
|
db.idxRank .sort();
|
|
dst << ZRCola::transeq_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0025: Error getting translation sequence count from database or too many translation sequences.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0024: Error getting translation sequences from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get key sequences.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectKeySequences(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::keyseq ks;
|
|
ZRCola::keyseq_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxChr.reserve(count);
|
|
db.idxKey.reserve(count);
|
|
db.data .reserve(count*4);
|
|
|
|
// Parse key sequences and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read key sequence from the database.
|
|
if (src.GetKeySequence(rs, ks)) {
|
|
// Add key sequence to index and data.
|
|
db << ks;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Sort indices.
|
|
db.idxChr.sort();
|
|
db.idxKey.sort();
|
|
|
|
// Check key sequences.
|
|
for (ZRCola::keyseq_db::indexKey::size_type i = 1, n = db.idxKey.size(); i < n; i++) {
|
|
const ZRCola::keyseq_db::keyseq
|
|
&ks1 = db.idxKey[i - 1],
|
|
&ks2 = db.idxKey[i ];
|
|
|
|
if (ZRCola::keyseq_db::keyseq::CompareSequence(ks1.seq(), ks1.seq_len(), ks2.seq(), ks2.seq_len()) == 0) {
|
|
wxString seq_str;
|
|
ZRCola::keyseq_db::GetSequenceAsText(ks1.seq(), ks1.seq_len(), seq_str);
|
|
_ftprintf(stderr, wxT("%s: warning ZCC0007: Duplicate key sequence (%s => %s or %s). The keyboard behaviour will be unpredictable.\n"),
|
|
(LPCTSTR)filenameIn.c_str(),
|
|
(LPCTSTR)seq_str.c_str(),
|
|
ZRCola::GetUnicodeDump(ks1.chr(), ks1.chr_len()).c_str(),
|
|
ZRCola::GetUnicodeDump(ks2.chr(), ks2.chr_len()).c_str());
|
|
}
|
|
}
|
|
|
|
// Write translations to file.
|
|
dst << ZRCola::keyseq_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0006: Error getting key sequence count from database or too many key sequences.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0005: Error getting key sequences from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get languages.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectLanguages(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::language lang;
|
|
ZRCola::language_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxLang.reserve(count);
|
|
db.data .reserve(count*4);
|
|
|
|
// Parse languages and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read language from the database.
|
|
if (src.GetLanguage(rs, lang)) {
|
|
if (build_pot)
|
|
pot.insert(lang.name);
|
|
|
|
// Add language to index and data.
|
|
db << lang;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write languages to file.
|
|
db.idxLang.sort();
|
|
dst << ZRCola::language_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0009: Error getting language count from database or too many languages.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0008: Error getting languages from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get language characters.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectLanguageCharacters(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::langchar lc;
|
|
ZRCola::langchar_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxChr .reserve(count);
|
|
#ifdef ZRCOLA_LANGCHAR_LANG_IDX
|
|
db.idxLang.reserve(count);
|
|
#endif
|
|
db.data .reserve(count*4);
|
|
|
|
// Parse language characters and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read language characters from the database.
|
|
if (src.GetLanguageCharacter(rs, lc)) {
|
|
// Add language characters to index and data.
|
|
db << lc;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write language characters to file.
|
|
db.idxChr .sort();
|
|
#ifdef ZRCOLA_LANGCHAR_LANG_IDX
|
|
db.idxLang.sort();
|
|
#endif
|
|
dst << ZRCola::langchar_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0011: Error getting language characters count from database or too many langchars.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0010: Error getting language characters from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get character groups.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectCharacterGroups(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::chrgrp cg;
|
|
ZRCola::chrgrp_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxRank.reserve(count);
|
|
db.data .reserve(count*4);
|
|
|
|
// Parse character groups and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read character group from the database.
|
|
if (src.GetCharacterGroup(rs, cg)) {
|
|
if (build_pot)
|
|
pot.insert(cg.name);
|
|
|
|
if (cg.chars.empty()) {
|
|
// Skip empty character groups.
|
|
continue;
|
|
}
|
|
|
|
// Add character group to index and data.
|
|
db << cg;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write character groups to file.
|
|
db.idxRank.sort();
|
|
dst << ZRCola::chrgrp_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0015: Error getting character group count from database or too many character groups.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0014: Error getting character groups from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
set<ZRCola::chrcatid_t> categories_used;
|
|
|
|
{
|
|
// Get characters.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectCharacters(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::character_desc_idx idxChrDsc, idxChrDscSub;
|
|
ZRCola::DBSource::character_bank chrs;
|
|
|
|
// Phase 1: Parse characters and build indexes.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read character from the database.
|
|
ZRCola::DBSource::character chr;
|
|
if (src.GetCharacter(rs, chr))
|
|
chrs[chr.first] = std::move(chr.second);
|
|
else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Phase 2: Build related character lists.
|
|
chrs.build_related();
|
|
|
|
ZRCola::character_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxChr.reserve(count);
|
|
db.data .reserve(count*4);
|
|
|
|
// Phase 3: Parse characters and build index and data.
|
|
for (auto chr = chrs.cbegin(), chr_end = chrs.cend(); chr != chr_end; ++chr) {
|
|
// Add character to index and data.
|
|
db << *chr;
|
|
|
|
// Add description (and keywords) to index.
|
|
idxChrDsc .add_keywords(chr->second.terms, chr->first, 0);
|
|
idxChrDscSub.add_keywords(chr->second.terms, chr->first, 3);
|
|
|
|
// Mark category used.
|
|
categories_used.insert(chr->second.cat);
|
|
}
|
|
|
|
// Write characters to file.
|
|
db.idxChr.sort();
|
|
idxChrDsc .save(db.idxDsc );
|
|
idxChrDscSub.save(db.idxDscSub);
|
|
dst << ZRCola::character_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0017: Error getting character count from database or too many characters.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0016: Error getting characters from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get character categories.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectCharacterCategories(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::chrcat cc;
|
|
ZRCola::chrcat_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxChrCat.reserve(count);
|
|
db.idxRank .reserve(count);
|
|
db.data .reserve(count*4);
|
|
|
|
// Parse character categories and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read character category from the database.
|
|
if (src.GetCharacterCategory(rs, cc)) {
|
|
if (build_pot)
|
|
pot.insert(cc.name);
|
|
|
|
if (categories_used.find(cc.cat) == categories_used.end()) {
|
|
// Skip empty character categories.
|
|
continue;
|
|
}
|
|
|
|
// Add character category to index and data.
|
|
db << cc;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write character categories to file.
|
|
db.idxChrCat.sort();
|
|
db.idxRank .sort();
|
|
dst << ZRCola::chrcat_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0019: Error getting character category count from database or too many character categories.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0018: Error getting character categories from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get characters tags.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectCharacterTags(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::chrtag ct;
|
|
ZRCola::chrtag_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxChr.reserve(count);
|
|
db.idxTag.reserve(count);
|
|
db.data .reserve(count*4);
|
|
|
|
// Parse characters tags and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read characters tags from the database.
|
|
if (src.GetCharacterTag(rs, ct)) {
|
|
// Add characters tags to index and data.
|
|
db << ct;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write characters tags to file.
|
|
db.idxChr.sort();
|
|
db.idxTag.sort();
|
|
dst << ZRCola::chrtag_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0021: Error getting characters tags count from database or too many character tags.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0020: Error getting characters tags from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get tag names.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectTagNames(rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::tagname tn;
|
|
ZRCola::tagname_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxName.reserve(count*3);
|
|
db.idxTag .reserve(count*3);
|
|
db.data .reserve(count*3*4);
|
|
|
|
// Parse tags and build index and data.
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read tag name from the database.
|
|
if (src.GetTagName(rs, tn)) {
|
|
// Add tag name to index and data.
|
|
db << tn;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write tags to file.
|
|
db.idxName.sort();
|
|
db.idxTag .sort();
|
|
dst << ZRCola::tagname_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0023: Error getting tag name count from database or too many tags.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0022: Error getting tags from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
{
|
|
// Get highlights.
|
|
com_obj<ADORecordset> rs;
|
|
if (src.SelectHighlights((short)ZRCOLA_HLGHTSETID_ZRCOLA_UNICODE_COMPOSED_ISSUES, rs)) {
|
|
size_t count = src.GetRecordsetCount(rs);
|
|
if (count < 0xffffffff) { // 4G check (-1 is reserved for error condition)
|
|
ZRCola::DBSource::highlight h;
|
|
ZRCola::highlight_db db;
|
|
|
|
// Preallocate memory.
|
|
db.idxChr.reserve(count);
|
|
db.data .reserve(count*5);
|
|
|
|
// Parse highlights and build index and data.
|
|
h.set = (short)ZRCOLA_HLGHTSETID_ZRCOLA_UNICODE_COMPOSED_ISSUES;
|
|
for (; !ZRCola::DBSource::IsEOF(rs); rs->MoveNext()) {
|
|
// Read tag name from the database.
|
|
if (src.GetHighlight(rs, h)) {
|
|
// Add highlight to index and data.
|
|
db << h;
|
|
} else
|
|
has_errors = true;
|
|
}
|
|
|
|
// Write highlights to file.
|
|
db.idxChr.sort();
|
|
dst << ZRCola::highlight_rec(db);
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0027: Error getting highlight count from database or too many tags.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0026: Error getting highlights from database. Please make sure the file is ZRCola.zrc compatible.\n"), (LPCTSTR)filenameIn.c_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
idrec::close<ZRCola::recordid_t, ZRCola::recordsize_t, ZRCOLA_RECORD_ALIGN>(dst, dst_start);
|
|
|
|
if (dst.fail()) {
|
|
_ftprintf(stderr, wxT("%s: error ZCC1000: Writing to output file failed.\n"), (LPCTSTR)filenameOut.c_str());
|
|
has_errors = true;
|
|
}
|
|
|
|
if (!has_errors && build_pot) {
|
|
fstream dst_pot((LPCTSTR)filenamePot, ios_base::out | ios_base::trunc);
|
|
if (dst_pot.good()) {
|
|
dst_pot << "msgid \"\"" << endl
|
|
<< "msgstr \"\"" << endl
|
|
<< "\"Project-Id-Version: ZRCola.zrcdb\\n\"" << endl
|
|
<< "\"Language: en\\n\"" << endl
|
|
<< "\"MIME-Version: 1.0\\n\"" << endl
|
|
<< "\"Content-Type: text/plain; charset=UTF-8\\n\"" << endl
|
|
<< "\"Content-Transfer-Encoding: 8bit\\n\"" << endl
|
|
<< "\"X-Generator: ZRColaCompile\\n\"" << endl;
|
|
|
|
charset_encoder<wchar_t, char> conv(stdex::wchar_t_charset, charset_id::utf8);
|
|
for (auto p = pot.cbegin(); p != pot.cend(); ++p) {
|
|
// Convert UTF-16 to UTF-8 and escape.
|
|
string t(conv.convert(*p)), u;
|
|
for (size_t i = 0, n = t.size(); i < n; i++) {
|
|
char c = t[i];
|
|
switch (c) {
|
|
case '\'': u += "\\\'"; break;
|
|
case '\"': u += "\\\""; break;
|
|
case '\n': u += "\\\n"; break;
|
|
case '\t': u += "\\\t"; break;
|
|
default : u += c;
|
|
}
|
|
}
|
|
dst_pot << endl
|
|
<< "msgid \"" << u << "\"" << endl
|
|
<< "msgstr \"\"" << endl;
|
|
}
|
|
|
|
if (dst_pot.fail()) {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0013: Writing to POT catalog failed.\n"), (LPCTSTR)filenameOut.c_str());
|
|
has_errors = true;
|
|
}
|
|
|
|
dst_pot.close();
|
|
} else {
|
|
_ftprintf(stderr, wxT("%s: error ZCC0012: Error opening POT catalog.\n"), filenameOut.fn_str());
|
|
has_errors = true;
|
|
}
|
|
}
|
|
|
|
if (has_errors) {
|
|
dst.close();
|
|
wxRemoveFile(filenameOut);
|
|
return 1;
|
|
} else
|
|
return 0;
|
|
}
|