// file : libbuild2/script/regex.test.cxx -*- C++ -*- // license : MIT; see accompanying LICENSE file #include <regex> #include <type_traits> // is_* #include <libbuild2/types.hxx> #include <libbuild2/utility.hxx> #include <libbuild2/script/regex.hxx> #undef NDEBUG #include <cassert> using namespace std; using namespace build2::script::regex; int main () { build2::init_process (); using lc = line_char; using ls = line_string; using lr = line_regex; using cf = char_flags; using cr = char_regex; init (); // Initializes the script regex global state. // Test line_char. // { static_assert (is_trivial<lc>::value && is_standard_layout<lc>::value && !is_array<lc>::value, "line_char must be char-like"); // Zero-initialed line_char should be the null-char as required by // char_traits<>::length() specification. // assert (lc () == lc::nul); line_pool p; assert (lc::eof == -1); assert (lc::nul == 0); enum meta {mn = 'n', mp = 'p'}; // Special roundtrip. // assert (lc ('0').special () == '0'); assert (lc (0).special () == 0); assert (lc (-1).special () == -1); assert (lc ('p').special () == 'p'); assert (lc (u'\u2028').special () == u'\u2028'); // Special comparison. // assert (lc ('0') == lc ('0')); assert (lc ('0') == '0'); assert (lc ('n') == mn); assert (mn == static_cast<meta> (lc ('n'))); assert (lc ('0') != lc ('1')); assert (lc ('0') != '1'); assert (lc ('n') != mp); assert (lc ('0') != lc ("0", p)); assert (lc ('0') != lc (cr ("0"), p)); assert (lc ('0') < lc ('1')); assert (lc ('0') < '1'); assert (lc ('1') < lc ("0", p)); assert (lc ('n') < mp); assert (lc ('0') <= '1'); assert (lc ('0') <= lc ('1')); assert (lc ('n') <= mn); assert (lc ('1') <= lc ("0", p)); // Literal roundtrip. // assert (*lc ("abc", p).literal () == "abc"); // Literal comparison. // assert (lc ("a", p) == lc ("a", p)); assert (lc ("a", p).literal () == lc ("a", p).literal ()); assert (char (lc ("a", p)) == '\a'); assert (lc ("a", p) != lc ("b", p)); assert (!(lc ("a", p) != lc (cr ("a"), p))); assert (lc ("a", p) != lc (cr ("b"), p)); assert (lc ("a", p) < lc ("b", p)); assert (!(lc ("a", p) < lc (cr ("a"), p))); assert (lc ("a", p) <= lc ("b", p)); assert (lc ("a", p) <= lc (cr ("a"), p)); assert (lc ("a", p) < lc (cr ("c"), p)); // Regex roundtrip. // assert (regex_match ("abc", *lc (cr ("abc"), p).regex ())); // Regex flags. // // icase // assert (regex_match ("ABC", cr ("abc", cf::icase))); // idot // assert (!regex_match ("a", cr ("[.]", cf::idot))); assert (!regex_match ("a", cr ("[\\.]", cf::idot))); assert (regex_match ("a", cr ("."))); assert (!regex_match ("a", cr (".", cf::idot))); assert (regex_match ("a", cr ("\\.", cf::idot))); assert (!regex_match ("a", cr ("\\."))); // regex::transform() // // The function is static and we can't test it directly. So we will test // it indirectly via regex matches. // // @@ Would be nice to somehow address the inability to test internals (not // exposed via headers). As a part of utility library support? // assert (regex_match (".a[.", cr (".\\.\\[[.]", cf::idot))); assert (regex_match (".a[.", cr (".\\.\\[[\\.]", cf::idot))); assert (!regex_match ("ba[.", cr (".\\.\\[[.]", cf::idot))); assert (!regex_match (".a[b", cr (".\\.\\[[.]", cf::idot))); assert (!regex_match (".a[b", cr (".\\.\\[[\\.]", cf::idot))); // Regex comparison. // assert (lc ("a", p) == lc (cr ("a|b"), p)); assert (lc (cr ("a|b"), p) == lc ("a", p)); } // Test char_traits<line_char>. // { using ct = char_traits<lc>; using vc = vector<lc>; lc c; ct::assign (c, '0'); assert (c == ct::char_type ('0')); assert (ct::to_char_type (c) == c); assert (ct::to_int_type (c) == c); assert (ct::eq_int_type (c, c)); assert (!ct::eq_int_type (c, lc::eof)); assert (ct::eof () == lc::eof); assert (ct::not_eof (c) == c); assert (ct::not_eof (lc::eof) != lc::eof); ct::assign (&c, 1, '1'); assert (c == ct::int_type ('1')); assert (ct::eq (lc ('0'), lc ('0'))); assert (ct::lt (lc ('0'), lc ('1'))); vc v1 ({'0', '1', '2'}); vc v2 (3, lc::nul); assert (ct::find (v1.data (), 3, '1') == v1.data () + 1); ct::copy (v2.data (), v1.data (), 3); assert (v2 == v1); v2.push_back (lc::nul); assert (ct::length (v2.data ()) == 3); // Overlaping ranges. // ct::move (v1.data () + 1, v1.data (), 2); assert (v1 == vc ({'0', '0', '1'})); v1 = vc ({'0', '1', '2'}); ct::move (v1.data (), v1.data () + 1, 2); assert (v1 == vc ({'1', '2', '2'})); } // Test line_char_locale and ctype<line_char> (only non-trivial functions). // { using ct = ctype<lc>; line_char_locale l; // It is better not to create q facet on stack as it is // reference-countable. // const ct& t (use_facet<ct> (l)); line_pool p; assert (t.is (ct::digit, '0')); assert (!t.is (ct::digit, '?')); assert (!t.is (ct::digit, lc ("0", p))); const lc chars[] = { '0', '?' }; ct::mask m[2]; const lc* b (chars); const lc* e (chars + 2); // Cast flag value to mask type and compare to mask. // auto fl = [] (ct::mask m, ct::mask f) {return m == f;}; t.is (b, e, m); assert (fl (m[0], ct::digit) && fl (m[1], 0)); assert (t.scan_is (ct::digit, b, e) == b); assert (t.scan_is (0, b, e) == b + 1); assert (t.scan_not (ct::digit, b, e) == b + 1); assert (t.scan_not (0, b, e) == b); { char nr[] = "0?"; lc wd[2]; t.widen (nr, nr + 2, wd); assert (wd[0] == b[0] && wd[1] == b[1]); } { lc wd[] = {'0', lc ("a", p)}; char nr[2]; t.narrow (wd, wd + 2, '-', nr); assert (nr[0] == '0' && nr[1] == '-'); } } // Test regex_traits<line_char>. Functions other that value() are trivial. // { regex_traits<lc> t; const int radix[] = {8, 10}; // Radix 16 is not supported by line_char. const char digits[] = "0123456789ABCDEF"; for (size_t r (0); r < 2; ++r) { for (int i (0); i < radix[r]; ++i) assert (t.value (digits[i], radix[r]) == i); } } // Test line_regex construction. // { line_pool p; lr r1 ({lc ("foo", p), lc (cr ("ba(r|z)"), p)}, move (p)); lr r2 (move (r1)); assert (regex_match (ls ({lc ("foo", r2.pool), lc ("bar", r2.pool)}), r2)); assert (!regex_match (ls ({lc ("foo", r2.pool), lc ("ba", r2.pool)}), r2)); } // Test line_regex match. // { line_pool p; const lc foo ("foo", p); const lc bar ("bar", p); const lc baz ("baz", p); const lc blank ("", p); assert (regex_match (ls ({foo, bar}), lr ({foo, bar}))); assert (!regex_match (ls ({foo, baz}), lr ({foo, bar}))); assert (regex_match (ls ({bar, foo}), lr ({'(', foo, '|', bar, ')', '+'}))); assert (regex_match (ls ({foo, foo, bar}), lr ({'(', foo, ')', '\\', '1', bar}))); assert (regex_match (ls ({foo}), lr ({lc (cr ("fo+"), p)}))); assert (regex_match (ls ({foo}), lr ({lc (cr (".*"), p)}))); assert (regex_match (ls ({blank}), lr ({lc (cr (".*"), p)}))); assert (regex_match (ls ({blank, blank, foo}), lr ({blank, '*', foo, blank, '*'}))); assert (regex_match (ls ({blank, blank, foo}), lr ({'.', '*'}))); assert (regex_match (ls ({blank, blank}), lr ({blank, '*', foo, '?', blank, '*'}))); assert (regex_match (ls ({foo}), lr ({foo, '{', '1', '}'}))); assert (regex_match (ls ({foo, foo}), lr ({foo, '{', '1', ',', '}'}))); assert (regex_match (ls ({foo, foo}), lr ({foo, '{', '1', ',', '2', '}'}))); assert (!regex_match (ls ({foo, foo}), lr ({foo, '{', '3', ',', '4', '}'}))); assert (regex_match (ls ({foo}), lr ({'(', '?', '=', foo, ')', foo}))); assert (regex_match (ls ({foo}), lr ({'(', '?', '!', bar, ')', foo}))); } }