sl@0
|
1 |
///////////////////////////////////////////////////////////////////////////////
|
sl@0
|
2 |
/// \file regex_constants.hpp
|
sl@0
|
3 |
/// Contains definitions for the syntax_option_type, match_flag_type and
|
sl@0
|
4 |
/// error_type enumerations.
|
sl@0
|
5 |
//
|
sl@0
|
6 |
// Copyright 2004 Eric Niebler. Distributed under the Boost
|
sl@0
|
7 |
// Software License, Version 1.0. (See accompanying file
|
sl@0
|
8 |
// LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
sl@0
|
9 |
|
sl@0
|
10 |
#ifndef BOOST_XPRESSIVE_REGEX_CONSTANTS_HPP_EAN_10_04_2005
|
sl@0
|
11 |
#define BOOST_XPRESSIVE_REGEX_CONSTANTS_HPP_EAN_10_04_2005
|
sl@0
|
12 |
|
sl@0
|
13 |
// MS compatible compilers support #pragma once
|
sl@0
|
14 |
#if defined(_MSC_VER) && (_MSC_VER >= 1020)
|
sl@0
|
15 |
# pragma once
|
sl@0
|
16 |
#endif
|
sl@0
|
17 |
|
sl@0
|
18 |
#include <boost/mpl/identity.hpp>
|
sl@0
|
19 |
|
sl@0
|
20 |
#ifndef BOOST_XPRESSIVE_DOXYGEN_INVOKED
|
sl@0
|
21 |
# define icase icase_
|
sl@0
|
22 |
#endif
|
sl@0
|
23 |
|
sl@0
|
24 |
namespace boost { namespace xpressive { namespace regex_constants
|
sl@0
|
25 |
{
|
sl@0
|
26 |
|
sl@0
|
27 |
/// Flags used to customize the regex syntax
|
sl@0
|
28 |
///
|
sl@0
|
29 |
enum syntax_option_type
|
sl@0
|
30 |
{
|
sl@0
|
31 |
// these flags are required:
|
sl@0
|
32 |
|
sl@0
|
33 |
ECMAScript = 0, ///< Specifies that the grammar recognized by the regular expression
|
sl@0
|
34 |
///< engine uses its normal semantics: that is the same as that given
|
sl@0
|
35 |
///< in the ECMA-262, ECMAScript Language Specification, Chapter 15
|
sl@0
|
36 |
///< part 10, RegExp (Regular Expression) Objects (FWD.1).
|
sl@0
|
37 |
///<
|
sl@0
|
38 |
icase = 1 << 1, ///< Specifies that matching of regular expressions against a character
|
sl@0
|
39 |
///< container sequence shall be performed without regard to case.
|
sl@0
|
40 |
///<
|
sl@0
|
41 |
nosubs = 1 << 2, ///< Specifies that when a regular expression is matched against a
|
sl@0
|
42 |
///< character container sequence, then no sub-expression matches are to
|
sl@0
|
43 |
///< be stored in the supplied match_results structure.
|
sl@0
|
44 |
///<
|
sl@0
|
45 |
optimize = 1 << 3, ///< Specifies that the regular expression engine should pay more
|
sl@0
|
46 |
///< attention to the speed with which regular expressions are matched,
|
sl@0
|
47 |
///< and less to the speed with which regular expression objects are
|
sl@0
|
48 |
///< constructed. Otherwise it has no detectable effect on the program
|
sl@0
|
49 |
///< output.
|
sl@0
|
50 |
///<
|
sl@0
|
51 |
collate = 1 << 4, ///< Specifies that character ranges of the form "[a-b]" should be
|
sl@0
|
52 |
///< locale sensitive.
|
sl@0
|
53 |
///<
|
sl@0
|
54 |
|
sl@0
|
55 |
// These flags are optional. If the functionality is supported
|
sl@0
|
56 |
// then the flags shall take these names.
|
sl@0
|
57 |
|
sl@0
|
58 |
//basic = 1 << 5, ///< Specifies that the grammar recognized by the regular expression
|
sl@0
|
59 |
// ///< engine is the same as that used by POSIX basic regular expressions
|
sl@0
|
60 |
// ///< in IEEE Std 1003.1-2001, Portable Operating System Interface
|
sl@0
|
61 |
// ///< (POSIX), Base Definitions and Headers, Section 9, Regular
|
sl@0
|
62 |
// ///< Expressions (FWD.1).
|
sl@0
|
63 |
// ///<
|
sl@0
|
64 |
//extended = 1 << 6, ///< Specifies that the grammar recognized by the regular expression
|
sl@0
|
65 |
// ///< engine is the same as that used by POSIX extended regular
|
sl@0
|
66 |
// ///< expressions in IEEE Std 1003.1-2001, Portable Operating System
|
sl@0
|
67 |
// ///< Interface (POSIX), Base Definitions and Headers, Section 9,
|
sl@0
|
68 |
// ///< Regular Expressions (FWD.1).
|
sl@0
|
69 |
// ///<
|
sl@0
|
70 |
//awk = 1 << 7, ///< Specifies that the grammar recognized by the regular expression
|
sl@0
|
71 |
// ///< engine is the same as that used by POSIX utility awk in IEEE Std
|
sl@0
|
72 |
// ///< 1003.1-2001, Portable Operating System Interface (POSIX), Shells
|
sl@0
|
73 |
// ///< and Utilities, Section 4, awk (FWD.1).
|
sl@0
|
74 |
// ///<
|
sl@0
|
75 |
//grep = 1 << 8, ///< Specifies that the grammar recognized by the regular expression
|
sl@0
|
76 |
// ///< engine is the same as that used by POSIX utility grep in IEEE Std
|
sl@0
|
77 |
// ///< 1003.1-2001, Portable Operating System Interface (POSIX),
|
sl@0
|
78 |
// ///< Shells and Utilities, Section 4, Utilities, grep (FWD.1).
|
sl@0
|
79 |
// ///<
|
sl@0
|
80 |
//egrep = 1 << 9, ///< Specifies that the grammar recognized by the regular expression
|
sl@0
|
81 |
// ///< engine is the same as that used by POSIX utility grep when given
|
sl@0
|
82 |
// ///< the -E option in IEEE Std 1003.1-2001, Portable Operating System
|
sl@0
|
83 |
// ///< Interface (POSIX), Shells and Utilities, Section 4, Utilities,
|
sl@0
|
84 |
// ///< grep (FWD.1).
|
sl@0
|
85 |
// ///<
|
sl@0
|
86 |
|
sl@0
|
87 |
// these flags are specific to xpressive, and they help with perl compliance.
|
sl@0
|
88 |
|
sl@0
|
89 |
single_line = 1 << 10, ///< Specifies that the ^ and \$ metacharacters DO NOT match at
|
sl@0
|
90 |
///< internal line breaks. Note that this is the opposite of the
|
sl@0
|
91 |
///< perl default. It is the inverse of perl's /m (multi-line)
|
sl@0
|
92 |
///< modifier.
|
sl@0
|
93 |
///<
|
sl@0
|
94 |
not_dot_null = 1 << 11, ///< Specifies that the . metacharacter does not match the null
|
sl@0
|
95 |
///< character \\0.
|
sl@0
|
96 |
///<
|
sl@0
|
97 |
not_dot_newline = 1 << 12, ///< Specifies that the . metacharacter does not match the
|
sl@0
|
98 |
///< newline character \\n.
|
sl@0
|
99 |
///<
|
sl@0
|
100 |
ignore_white_space = 1 << 13 ///< Specifies that non-escaped white-space is not significant.
|
sl@0
|
101 |
///<
|
sl@0
|
102 |
};
|
sl@0
|
103 |
|
sl@0
|
104 |
/// Flags used to customize the behavior of the regex algorithms
|
sl@0
|
105 |
///
|
sl@0
|
106 |
enum match_flag_type
|
sl@0
|
107 |
{
|
sl@0
|
108 |
match_default = 0, ///< Specifies that matching of regular expressions proceeds
|
sl@0
|
109 |
///< without any modification of the normal rules used in
|
sl@0
|
110 |
///< ECMA-262, ECMAScript Language Specification, Chapter 15
|
sl@0
|
111 |
///< part 10, RegExp (Regular Expression) Objects (FWD.1)
|
sl@0
|
112 |
///<
|
sl@0
|
113 |
match_not_bol = 1 << 1, ///< Specifies that the expression "^" should not be matched
|
sl@0
|
114 |
///< against the sub-sequence [first,first).
|
sl@0
|
115 |
///<
|
sl@0
|
116 |
match_not_eol = 1 << 2, ///< Specifies that the expression "\$" should not be
|
sl@0
|
117 |
///< matched against the sub-sequence [last,last).
|
sl@0
|
118 |
///<
|
sl@0
|
119 |
match_not_bow = 1 << 3, ///< Specifies that the expression "\\b" should not be
|
sl@0
|
120 |
///< matched against the sub-sequence [first,first).
|
sl@0
|
121 |
///<
|
sl@0
|
122 |
match_not_eow = 1 << 4, ///< Specifies that the expression "\\b" should not be
|
sl@0
|
123 |
///< matched against the sub-sequence [last,last).
|
sl@0
|
124 |
///<
|
sl@0
|
125 |
match_any = 1 << 7, ///< Specifies that if more than one match is possible then
|
sl@0
|
126 |
///< any match is an acceptable result.
|
sl@0
|
127 |
///<
|
sl@0
|
128 |
match_not_null = 1 << 8, ///< Specifies that the expression can not be matched
|
sl@0
|
129 |
///< against an empty sequence.
|
sl@0
|
130 |
///<
|
sl@0
|
131 |
match_continuous = 1 << 10, ///< Specifies that the expression must match a sub-sequence
|
sl@0
|
132 |
///< that begins at first.
|
sl@0
|
133 |
///<
|
sl@0
|
134 |
match_partial = 1 << 11, ///< Specifies that if no match can be found, then it is
|
sl@0
|
135 |
///< acceptable to return a match [from, last) where
|
sl@0
|
136 |
///< from!=last, if there exists some sequence of characters
|
sl@0
|
137 |
///< [from,to) of which [from,last) is a prefix, and which
|
sl@0
|
138 |
///< would result in a full match.
|
sl@0
|
139 |
///<
|
sl@0
|
140 |
match_prev_avail = 1 << 12, ///< Specifies that --first is a valid iterator position,
|
sl@0
|
141 |
///< when this flag is set then the flags match_not_bol
|
sl@0
|
142 |
///< and match_not_bow are ignored by the regular expression
|
sl@0
|
143 |
///< algorithms (RE.7) and iterators (RE.8).
|
sl@0
|
144 |
///<
|
sl@0
|
145 |
format_default = 0, ///< Specifies that when a regular expression match is to be
|
sl@0
|
146 |
///< replaced by a new string, that the new string is
|
sl@0
|
147 |
///< constructed using the rules used by the ECMAScript
|
sl@0
|
148 |
///< replace function in ECMA-262, ECMAScript Language
|
sl@0
|
149 |
///< Specification, Chapter 15 part 5.4.11
|
sl@0
|
150 |
///< String.prototype.replace. (FWD.1). In addition during
|
sl@0
|
151 |
///< search and replace operations then all non-overlapping
|
sl@0
|
152 |
///< occurrences of the regular expression are located and
|
sl@0
|
153 |
///< replaced, and sections of the input that did not match
|
sl@0
|
154 |
///< the expression, are copied unchanged to the output
|
sl@0
|
155 |
///< string.
|
sl@0
|
156 |
///<
|
sl@0
|
157 |
//format_sed = 1 << 13, ///< Specifies that when a regular expression match is to be
|
sl@0
|
158 |
// ///< replaced by a new string, that the new string is
|
sl@0
|
159 |
// ///< constructed using the rules used by the Unix sed
|
sl@0
|
160 |
// ///< utility in IEEE Std 1003.1-2001, Portable Operating
|
sl@0
|
161 |
// ///< SystemInterface (POSIX), Shells and Utilities.
|
sl@0
|
162 |
// ///<
|
sl@0
|
163 |
//format_perl = 1 << 14, ///< Specifies that when a regular expression match is to be
|
sl@0
|
164 |
// ///< replaced by a new string, that the new string is
|
sl@0
|
165 |
// ///< constructed using an implementation defined superset
|
sl@0
|
166 |
// ///< of the rules used by the ECMAScript replace function in
|
sl@0
|
167 |
// ///< ECMA-262, ECMAScript Language Specification, Chapter 15
|
sl@0
|
168 |
// ///< part 5.4.11 String.prototype.replace (FWD.1).
|
sl@0
|
169 |
// ///<
|
sl@0
|
170 |
format_no_copy = 1 << 15, ///< When specified during a search and replace operation,
|
sl@0
|
171 |
///< then sections of the character container sequence being
|
sl@0
|
172 |
///< searched that do match the regular expression, are not
|
sl@0
|
173 |
///< copied to the output string.
|
sl@0
|
174 |
///<
|
sl@0
|
175 |
format_first_only = 1 << 16, ///< When specified during a search and replace operation,
|
sl@0
|
176 |
///< then only the first occurrence of the regular
|
sl@0
|
177 |
///< expression is replaced.
|
sl@0
|
178 |
///<
|
sl@0
|
179 |
format_literal = 1 << 17 ///< Treat the format string as a literal.
|
sl@0
|
180 |
///<
|
sl@0
|
181 |
};
|
sl@0
|
182 |
|
sl@0
|
183 |
/// Error codes used by the regex_error type
|
sl@0
|
184 |
///
|
sl@0
|
185 |
enum error_type
|
sl@0
|
186 |
{
|
sl@0
|
187 |
error_collate, ///< The expression contained an invalid collating element name.
|
sl@0
|
188 |
///<
|
sl@0
|
189 |
error_ctype, ///< The expression contained an invalid character class name.
|
sl@0
|
190 |
///<
|
sl@0
|
191 |
error_escape, ///< The expression contained an invalid escaped character,
|
sl@0
|
192 |
///< or a trailing escape.
|
sl@0
|
193 |
///<
|
sl@0
|
194 |
error_subreg, ///< The expression contained an invalid back-reference.
|
sl@0
|
195 |
///<
|
sl@0
|
196 |
error_brack, ///< The expression contained mismatched [ and ].
|
sl@0
|
197 |
///<
|
sl@0
|
198 |
error_paren, ///< The expression contained mismatched (and).
|
sl@0
|
199 |
///<
|
sl@0
|
200 |
error_brace, ///< The expression contained mismatched { and }
|
sl@0
|
201 |
///<
|
sl@0
|
202 |
error_badbrace, ///< The expression contained an invalid range in a {} expression.
|
sl@0
|
203 |
///<
|
sl@0
|
204 |
error_range, ///< The expression contained an invalid character range, for
|
sl@0
|
205 |
///< example [b-a].
|
sl@0
|
206 |
///<
|
sl@0
|
207 |
error_space, ///< There was insufficient memory to convert the expression into a
|
sl@0
|
208 |
///< finite state machine.
|
sl@0
|
209 |
///<
|
sl@0
|
210 |
error_badrepeat, ///< One of *?+{ was not preceded by a valid regular expression.
|
sl@0
|
211 |
///<
|
sl@0
|
212 |
error_complexity, ///< The complexity of an attempted match against a regular
|
sl@0
|
213 |
///< expression exceeded a pre-set level.
|
sl@0
|
214 |
///<
|
sl@0
|
215 |
error_stack, ///< There was insufficient memory to determine whether the regular
|
sl@0
|
216 |
///< expression could match the specified character sequence.
|
sl@0
|
217 |
///<
|
sl@0
|
218 |
error_badref, ///< An nested regex is uninitialized.
|
sl@0
|
219 |
///<
|
sl@0
|
220 |
error_badlookbehind, ///< An attempt to create a variable-width look-behind assertion
|
sl@0
|
221 |
///< was detected.
|
sl@0
|
222 |
///<
|
sl@0
|
223 |
error_internal ///< An internal error has occured.
|
sl@0
|
224 |
///<
|
sl@0
|
225 |
};
|
sl@0
|
226 |
|
sl@0
|
227 |
/// INTERNAL ONLY
|
sl@0
|
228 |
inline syntax_option_type operator &(syntax_option_type b1, syntax_option_type b2)
|
sl@0
|
229 |
{
|
sl@0
|
230 |
return static_cast<syntax_option_type>(
|
sl@0
|
231 |
static_cast<int>(b1) & static_cast<int>(b2));
|
sl@0
|
232 |
}
|
sl@0
|
233 |
|
sl@0
|
234 |
/// INTERNAL ONLY
|
sl@0
|
235 |
inline syntax_option_type operator |(syntax_option_type b1, syntax_option_type b2)
|
sl@0
|
236 |
{
|
sl@0
|
237 |
return static_cast<syntax_option_type>(static_cast<int>(b1) | static_cast<int>(b2));
|
sl@0
|
238 |
}
|
sl@0
|
239 |
|
sl@0
|
240 |
/// INTERNAL ONLY
|
sl@0
|
241 |
inline syntax_option_type operator ^(syntax_option_type b1, syntax_option_type b2)
|
sl@0
|
242 |
{
|
sl@0
|
243 |
return static_cast<syntax_option_type>(static_cast<int>(b1) ^ static_cast<int>(b2));
|
sl@0
|
244 |
}
|
sl@0
|
245 |
|
sl@0
|
246 |
/// INTERNAL ONLY
|
sl@0
|
247 |
inline syntax_option_type operator ~(syntax_option_type b)
|
sl@0
|
248 |
{
|
sl@0
|
249 |
return static_cast<syntax_option_type>(~static_cast<int>(b));
|
sl@0
|
250 |
}
|
sl@0
|
251 |
|
sl@0
|
252 |
/// INTERNAL ONLY
|
sl@0
|
253 |
inline match_flag_type operator &(match_flag_type b1, match_flag_type b2)
|
sl@0
|
254 |
{
|
sl@0
|
255 |
return static_cast<match_flag_type>(static_cast<int>(b1) & static_cast<int>(b2));
|
sl@0
|
256 |
}
|
sl@0
|
257 |
|
sl@0
|
258 |
/// INTERNAL ONLY
|
sl@0
|
259 |
inline match_flag_type operator |(match_flag_type b1, match_flag_type b2)
|
sl@0
|
260 |
{
|
sl@0
|
261 |
return static_cast<match_flag_type>(static_cast<int>(b1) | static_cast<int>(b2));
|
sl@0
|
262 |
}
|
sl@0
|
263 |
|
sl@0
|
264 |
/// INTERNAL ONLY
|
sl@0
|
265 |
inline match_flag_type operator ^(match_flag_type b1, match_flag_type b2)
|
sl@0
|
266 |
{
|
sl@0
|
267 |
return static_cast<match_flag_type>(static_cast<int>(b1) ^ static_cast<int>(b2));
|
sl@0
|
268 |
}
|
sl@0
|
269 |
|
sl@0
|
270 |
/// INTERNAL ONLY
|
sl@0
|
271 |
inline match_flag_type operator ~(match_flag_type b)
|
sl@0
|
272 |
{
|
sl@0
|
273 |
return static_cast<match_flag_type>(~static_cast<int>(b));
|
sl@0
|
274 |
}
|
sl@0
|
275 |
|
sl@0
|
276 |
}}} // namespace boost::xpressive::regex_constants
|
sl@0
|
277 |
|
sl@0
|
278 |
#ifndef BOOST_XPRESSIVE_DOXYGEN_INVOKED
|
sl@0
|
279 |
# undef icase
|
sl@0
|
280 |
#endif
|
sl@0
|
281 |
|
sl@0
|
282 |
#endif
|