It's useless to continue with testing the given regex if compiling it has unexpectedly succeeded, all the rest of the tests will fail anyhow. Also explain that REQUIRE() can't be used here, which is why we need to use CHECK() and then check the same condition again before returning to avoid the temptation to "simplify" things.
355 lines
9.0 KiB
C++
355 lines
9.0 KiB
C++
///////////////////////////////////////////////////////////////////////////////
|
|
// Name: tests/regex/regex.cpp
|
|
// Purpose: Test the built-in regex lib and wxRegEx
|
|
// Author: Mike Wetherell
|
|
// Copyright: (c) 2004 Mike Wetherell
|
|
// Licence: wxWindows licence
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
//
|
|
// Notes:
|
|
//
|
|
// To run just one section, say wx_1, do this:
|
|
// test regex.wx_1
|
|
//
|
|
// To run all the regex tests:
|
|
// test regex
|
|
//
|
|
// Some tests must be skipped since they use features which we do not make
|
|
// available through wxRegEx. To see the list of tests that have been skipped
|
|
// turn on verbose logging, e.g.:
|
|
// test --verbose regex
|
|
//
|
|
// The tests here are for the builtin library, tests for wxRegEx in general
|
|
// should go in wxregex.cpp
|
|
//
|
|
// The tests are generated from Henry Spencer's reg.test, additional test
|
|
// can be added in wxreg.test. These test files are then turned into a C++
|
|
// include file 'regex.inc' (included below) using a script 'regex.pl'.
|
|
//
|
|
|
|
// For compilers that support precompilation, includes "wx/wx.h".
|
|
#include "testprec.h"
|
|
|
|
|
|
#if wxUSE_REGEX
|
|
|
|
// for all others, include the necessary headers
|
|
#ifndef WX_PRECOMP
|
|
#include "wx/wx.h"
|
|
#endif
|
|
|
|
|
|
// many of the tests are specific to the builtin regex lib, so only attempts
|
|
// to do them when using the builtin regex lib.
|
|
//
|
|
#ifdef wxHAS_REGEX_ADVANCED
|
|
|
|
#include "wx/regex.h"
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
using std::string;
|
|
using std::vector;
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
// The test case - an instance represents a single test
|
|
|
|
class RegExTestCase
|
|
{
|
|
public:
|
|
RegExTestCase(
|
|
const char *mode,
|
|
const char *id,
|
|
const char *flags,
|
|
const char *pattern,
|
|
const char *data,
|
|
const vector<const char *>& expected);
|
|
|
|
private:
|
|
void runTest();
|
|
|
|
// workers
|
|
wxString Conv(const char *str);
|
|
bool parseFlags(const wxString& flags);
|
|
void doTest(int flavor);
|
|
static wxString quote(const wxString& arg);
|
|
|
|
// mode, id, flags, pattern, test data, expected results...
|
|
int m_mode;
|
|
wxString m_id;
|
|
wxString m_flags;
|
|
wxString m_pattern;
|
|
wxString m_data;
|
|
wxArrayString m_expected;
|
|
|
|
// the flag decoded
|
|
int m_compileFlags;
|
|
int m_matchFlags;
|
|
bool m_basic;
|
|
bool m_extended;
|
|
bool m_advanced;
|
|
};
|
|
|
|
// constructor - throws Exception on failure
|
|
//
|
|
RegExTestCase::RegExTestCase(
|
|
const char *mode,
|
|
const char *id,
|
|
const char *flags,
|
|
const char *pattern,
|
|
const char *data,
|
|
const vector<const char *>& expected)
|
|
:
|
|
m_mode(mode[0]),
|
|
m_id(Conv(id)),
|
|
m_flags(Conv(flags)),
|
|
m_pattern(Conv(pattern)),
|
|
m_data(Conv(data)),
|
|
m_compileFlags(0),
|
|
m_matchFlags(0),
|
|
m_basic(false),
|
|
m_extended(false),
|
|
m_advanced(false)
|
|
{
|
|
vector<const char *>::const_iterator it;
|
|
|
|
for (it = expected.begin(); it != expected.end(); ++it) {
|
|
m_expected.push_back(Conv(*it));
|
|
}
|
|
|
|
runTest();
|
|
}
|
|
|
|
int wxWcscmp(const wchar_t* s1, const wchar_t* s2)
|
|
{
|
|
size_t nLen1 = wxWcslen(s1);
|
|
size_t nLen2 = wxWcslen(s2);
|
|
|
|
if (nLen1 != nLen2)
|
|
return nLen1 - nLen2;
|
|
|
|
return memcmp(s1, s2, nLen1*sizeof(wchar_t));
|
|
}
|
|
|
|
// convert a string from UTF8 to the internal encoding
|
|
//
|
|
wxString RegExTestCase::Conv(const char *str)
|
|
{
|
|
const wxWCharBuffer wstr = wxConvUTF8.cMB2WC(str);
|
|
const wxWC2WXbuf buf = wxConvCurrent->cWC2WX(wstr);
|
|
|
|
if (!buf || wxWcscmp(wxConvCurrent->cWX2WC(buf), wstr) != 0)
|
|
{
|
|
FAIL( "Converting string \"" << str << "\" failed" );
|
|
}
|
|
|
|
return buf;
|
|
}
|
|
|
|
// Parse flags
|
|
//
|
|
bool RegExTestCase::parseFlags(const wxString& flags)
|
|
{
|
|
for ( wxString::const_iterator p = flags.begin(); p != flags.end(); ++p )
|
|
{
|
|
switch ( (*p).GetValue() ) {
|
|
// noop
|
|
case '-': break;
|
|
|
|
// we don't fully support these flags, but they don't stop us
|
|
// checking for success of failure of the match, so treat as noop
|
|
case 'A': case 'B': case 'E': case 'H':
|
|
case 'I': case 'L': case 'M': case 'N':
|
|
case 'P': case 'Q': case 'R': case 'S':
|
|
case 'T': case 'U': case '%':
|
|
break;
|
|
|
|
// match options
|
|
case '^': m_matchFlags |= wxRE_NOTBOL; break;
|
|
case '$': m_matchFlags |= wxRE_NOTEOL; break;
|
|
#if wxUSE_UNICODE
|
|
case '*': break;
|
|
#endif
|
|
// compile options
|
|
case '&': m_advanced = m_basic = true; break;
|
|
case 'b': m_basic = true; break;
|
|
case 'e': m_extended = true; break;
|
|
case 'i': m_compileFlags |= wxRE_ICASE; break;
|
|
case 'o': m_compileFlags |= wxRE_NOSUB; break;
|
|
case 'n': m_compileFlags |= wxRE_NEWLINE; break;
|
|
case 't': if (strchr("ep", m_mode)) break; wxFALLTHROUGH;
|
|
|
|
// anything else we must skip the test
|
|
default:
|
|
return false;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
// Try test for all flavours of expression specified
|
|
//
|
|
void RegExTestCase::runTest()
|
|
{
|
|
// the flags need further parsing...
|
|
if (!parseFlags(m_flags)) {
|
|
// we just have to skip the unsupported flags now
|
|
return;
|
|
}
|
|
|
|
// Provide more information about the test case if it fails.
|
|
wxString str;
|
|
wxArrayString::const_iterator it;
|
|
|
|
str << (wxChar)m_mode << wxT(" ") << m_id << wxT(" ") << m_flags << wxT(" ")
|
|
<< quote(m_pattern) << wxT(" ") << quote(m_data);
|
|
|
|
for (it = m_expected.begin(); it != m_expected.end(); ++it)
|
|
str << wxT(" ") << quote(*it);
|
|
|
|
if (str.length() > 77)
|
|
str = str.substr(0, 74) + wxT("...");
|
|
|
|
INFO( str );
|
|
|
|
|
|
if (m_basic)
|
|
doTest(wxRE_BASIC);
|
|
if (m_extended)
|
|
doTest(wxRE_EXTENDED);
|
|
#ifdef wxHAS_REGEX_ADVANCED
|
|
if (m_advanced || (!m_basic && !m_extended))
|
|
doTest(wxRE_ADVANCED);
|
|
#endif
|
|
}
|
|
|
|
// Try the test for a single flavour of expression
|
|
//
|
|
void RegExTestCase::doTest(int flavor)
|
|
{
|
|
wxRegEx re(m_pattern, m_compileFlags | flavor);
|
|
|
|
// 'e' - test that the pattern fails to compile
|
|
if (m_mode == 'e') {
|
|
CHECK( !re.IsValid() );
|
|
|
|
// Never continue with this kind of test.
|
|
return;
|
|
} else {
|
|
// Note: we don't use REQUIRE here because this would abort the entire
|
|
// test case on error instead of skipping just the rest of this regex
|
|
// test.
|
|
CHECK( re.IsValid() );
|
|
|
|
if (!re.IsValid())
|
|
return;
|
|
}
|
|
|
|
bool matches = re.Matches(m_data, m_matchFlags);
|
|
|
|
// 'f' or 'p' - test that the pattern does not match
|
|
if (m_mode == 'f' || m_mode == 'p') {
|
|
CHECK( !matches );
|
|
} else {
|
|
// otherwise 'm' or 'i' - test the pattern does match
|
|
CHECK( matches );
|
|
}
|
|
|
|
if (!matches)
|
|
return;
|
|
|
|
if (m_compileFlags & wxRE_NOSUB)
|
|
return;
|
|
|
|
// check wxRegEx has correctly counted the number of subexpressions
|
|
CHECK( m_expected.size() == re.GetMatchCount() );
|
|
|
|
for (size_t i = 0; i < m_expected.size(); i++) {
|
|
wxString result;
|
|
size_t start, len;
|
|
|
|
INFO( "Match " << i );
|
|
CHECK( re.GetMatch(&start, &len, i) );
|
|
|
|
// m - check the match returns the strings given
|
|
if (m_mode == 'm')
|
|
{
|
|
if (start < INT_MAX)
|
|
result = m_data.substr(start, len);
|
|
else
|
|
result = wxT("");
|
|
}
|
|
|
|
// i - check the match returns the offsets given
|
|
else if (m_mode == 'i')
|
|
{
|
|
if (start > INT_MAX)
|
|
result = wxT("-1 -1");
|
|
else if (start + len > 0)
|
|
result << start << wxT(" ") << start + len - 1;
|
|
else
|
|
result << start << wxT(" -1");
|
|
}
|
|
|
|
CHECK( result == m_expected[i] );
|
|
}
|
|
}
|
|
|
|
// quote a string so that it can be displayed (static)
|
|
//
|
|
wxString RegExTestCase::quote(const wxString& arg)
|
|
{
|
|
const wxChar *needEscape = wxT("\a\b\t\n\v\f\r\"\\");
|
|
const wxChar *escapes = wxT("abtnvfr\"\\");
|
|
wxString str;
|
|
|
|
for (size_t i = 0; i < arg.length(); i++) {
|
|
wxChar ch = (wxChar)arg[i];
|
|
const wxChar *p = wxStrchr(needEscape, ch);
|
|
|
|
if (p)
|
|
str += wxString::Format(wxT("\\%c"), escapes[p - needEscape]);
|
|
else if (wxIscntrl(ch))
|
|
str += wxString::Format(wxT("\\%03o"), ch);
|
|
else
|
|
str += (wxChar)ch;
|
|
}
|
|
|
|
return str.length() == arg.length() && str.find(' ') == wxString::npos ?
|
|
str : wxT("\"") + str + wxT("\"");
|
|
}
|
|
|
|
// The helper function used by the tests in auto-generated regex.inc.
|
|
static void
|
|
CheckRE(
|
|
const char *mode,
|
|
const char *id,
|
|
const char *flags,
|
|
const char *pattern,
|
|
const char *data,
|
|
const char *expected,
|
|
...)
|
|
{
|
|
vector<const char *> expected_results;
|
|
va_list ap;
|
|
|
|
for (va_start(ap, expected); expected; expected = va_arg(ap, const char *))
|
|
expected_results.push_back(expected);
|
|
|
|
va_end(ap);
|
|
|
|
RegExTestCase(mode, id, flags, pattern, data, expected_results);
|
|
}
|
|
|
|
|
|
// Include the generated tests
|
|
//
|
|
#include "regex.inc"
|
|
|
|
|
|
#endif // wxHAS_REGEX_ADVANCED
|
|
|
|
#endif // wxUSE_REGEX
|