aboutsummaryrefslogtreecommitdiff
path: root/libbutl/regex.mxx
blob: 84b024f10be636528b8a4cc487460d98475b6788 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
// file      : libbutl/regex.mxx -*- C++ -*-
// license   : MIT; see accompanying LICENSE file

#ifndef __cpp_modules_ts
#pragma once
#endif

// C includes.

#ifndef __cpp_lib_modules_ts
#include <regex>
#include <iosfwd>
#include <string>
#include <utility> // pair

#include <locale>
#include <cstddef> // size_t
#include <utility> // move(), make_pair()
#endif

#if defined(__clang__)
#  if __has_include(<__config>)
#    include <__config>          // _LIBCPP_VERSION
#  endif
#endif

// Other includes.

#ifdef __cpp_modules_ts
export module butl.regex;
#ifdef __cpp_lib_modules_ts
import std.core;
import std.io;
import std.regex; // @@ MOD TODO should probably be re-exported.
#endif
#endif

#include <libbutl/export.hxx>

LIBBUTL_MODEXPORT namespace butl
{
  // The regex semantics of the following functions is that of
  // std::regex_replace(), with the standard ECMA-262 substitution escape
  // sequences extended with a subset of the Perl sequences:
  //
  // \\, \n, \u, \l, \U, \L, \E, \1, ..., \9
  //
  // Notes and limitations:
  //
  // - The only valid regex_constants flags are match_default,
  //   format_first_only and format_no_copy.
  //
  // - If a backslash doesn't start any of the listed sequences, then it is
  //   silently dropped and the following character is copied as is.
  //
  // - The character case conversion is performed according to the global
  //   C++ locale (which, unless changed, is the same as the C locale; both
  //   default to the POSIX locale, aka "C").
  //

  // Call the specified append() function for non-matched substrings and
  // matched substring replacements, returning true if the search succeeded.
  // The arguments are, in order: the string to search in, the regex to
  // search for, the replacement format (fmt), the append() function, and the
  // match/format flags (match_default if omitted; see the list of valid
  // flags above).
  //
  // The append() function must be callable with the following signature:
  //
  // void
  // append(basic_string<C>::iterator begin, basic_string<C>::iterator end);
  //
  // NOTE(review): the string to search in is passed by const reference, so
  // ranges that refer into it are presumably const_iterator rather than
  // iterator -- confirm against the implementation in regex.txx.
  //
  template <typename C, typename F>
  bool
  regex_replace_search (const std::basic_string<C>&,
                        const std::basic_regex<C>&,
                        const std::basic_string<C>& fmt,
                        F&& append,
                        std::regex_constants::match_flag_type =
                        std::regex_constants::match_default);

  // As above, but concatenate the non-matched substrings and matched
  // substring replacements into a string, returning it (first) together with
  // the flag indicating whether the search succeeded (second).
  //
  template <typename C>
  std::pair<std::basic_string<C>, bool>
  regex_replace_search (const std::basic_string<C>&,
                        const std::basic_regex<C>&,
                        const std::basic_string<C>& fmt,
                        std::regex_constants::match_flag_type =
                          std::regex_constants::match_default);

  // Match the entire string and, if it matches, return the string
  // replacement.
  //
  // NOTE(review): the second member of the returned pair presumably
  // indicates whether the string matched (by analogy with the search
  // overload above); the value of the first member on a failed match is not
  // specified here -- confirm against regex.txx.
  //
  template <typename C>
  std::pair<std::basic_string<C>, bool>
  regex_replace_match (const std::basic_string<C>&,
                       const std::basic_regex<C>&,
                       const std::basic_string<C>& fmt);
}

LIBBUTL_MODEXPORT namespace std
{
  // Print the regex error description, but only if it is meaningful (which
  // is also why the leading colon has to be printed by this operator).
  //
  // NOTE(review): presumably declared in namespace std so that it is found
  // via argument-dependent lookup for std::regex_error -- confirm.
  //
  LIBBUTL_SYMEXPORT ostream&
  operator<< (ostream&, const regex_error&);
}

#include <libbutl/regex.ixx>
#include <libbutl/regex.txx>