sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \file regex_primitives.hpp sl@0: /// Contains the syntax elements for writing static regular expressions. sl@0: // sl@0: // Copyright 2004 Eric Niebler. Distributed under the Boost sl@0: // Software License, Version 1.0. (See accompanying file sl@0: // LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) sl@0: sl@0: #ifndef BOOST_XPRESSIVE_REGEX_PRIMITIVES_HPP_EAN_10_04_2005 sl@0: #define BOOST_XPRESSIVE_REGEX_PRIMITIVES_HPP_EAN_10_04_2005 sl@0: sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: #include sl@0: sl@0: namespace boost { namespace xpressive { namespace detail sl@0: { sl@0: sl@0: typedef assert_word_placeholder > assert_word_boundary; sl@0: typedef assert_word_placeholder assert_word_begin; sl@0: typedef assert_word_placeholder assert_word_end; sl@0: sl@0: /* sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// INTERNAL ONLY sl@0: // BOOST_XPRESSIVE_GLOBAL sl@0: // for defining globals that neither violate the One Definition Rule nor sl@0: // lead to undefined behavior due to global object initialization order. sl@0: //#define BOOST_XPRESSIVE_GLOBAL(type, name, init) \ sl@0: // namespace detail \ sl@0: // { \ sl@0: // template \ sl@0: // struct BOOST_PP_CAT(global_pod_, name) \ sl@0: // { \ sl@0: // static type const value; \ sl@0: // private: \ sl@0: // union type_must_be_pod \ sl@0: // { \ sl@0: // type t; \ sl@0: // char ch; \ sl@0: // } u; \ sl@0: // }; \ sl@0: // template \ sl@0: // type const BOOST_PP_CAT(global_pod_, name)::value = init; \ sl@0: // } \ sl@0: // type const &name = detail::BOOST_PP_CAT(global_pod_, name)<0>::value sl@0: */ sl@0: sl@0: } // namespace detail sl@0: sl@0: /// INTERNAL ONLY (for backwards compatibility) sl@0: unsigned int const repeat_max = UINT_MAX-1; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief For infinite repetition of a sub-expression. sl@0: /// sl@0: /// Magic value used with the repeat\<\>() function template sl@0: /// to specify an unbounded repeat. Use as: repeat<17, inf>('a'). sl@0: /// The equivalent in perl is /a{17,}/. sl@0: unsigned int const inf = UINT_MAX-1; sl@0: sl@0: /// INTERNAL ONLY (for backwards compatibility) sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const epsilon = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Successfully matches nothing. sl@0: /// sl@0: /// Successfully matches a zero-width sequence. nil always succeeds and sl@0: /// never consumes any characters. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const nil = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches an alpha-numeric character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are alpha-numeric. sl@0: /// To match any character that is not alpha-numeric, use ~alnum. sl@0: /// sl@0: /// \attention alnum is equivalent to /[[:alnum:]]/ in perl. ~alnum is equivalent sl@0: /// to /[[:^alnum:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const alnum = {"alnum"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches an alphabetic character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are alphabetic. sl@0: /// To match any character that is not alphabetic, use ~alpha. sl@0: /// sl@0: /// \attention alpha is equivalent to /[[:alpha:]]/ in perl. ~alpha is equivalent sl@0: /// to /[[:^alpha:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const alpha = {"alpha"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a blank (horizonal white-space) character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are blank characters. sl@0: /// To match any character that is not blank, use ~blank. sl@0: /// sl@0: /// \attention blank is equivalent to /[[:blank:]]/ in perl. ~blank is equivalent sl@0: /// to /[[:^blank:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const blank = {"blank"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a control character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are control characters. sl@0: /// To match any character that is not a control character, use ~cntrl. sl@0: /// sl@0: /// \attention cntrl is equivalent to /[[:cntrl:]]/ in perl. ~cntrl is equivalent sl@0: /// to /[[:^cntrl:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const cntrl = {"cntrl"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a digit character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are digits. sl@0: /// To match any character that is not a digit, use ~digit. sl@0: /// sl@0: /// \attention digit is equivalent to /[[:digit:]]/ in perl. ~digit is equivalent sl@0: /// to /[[:^digit:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const digit = {"digit"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a graph character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are graphable. sl@0: /// To match any character that is not graphable, use ~graph. sl@0: /// sl@0: /// \attention graph is equivalent to /[[:graph:]]/ in perl. ~graph is equivalent sl@0: /// to /[[:^graph:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const graph = {"graph"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a lower-case character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are lower-case. sl@0: /// To match any character that is not a lower-case character, use ~lower. sl@0: /// sl@0: /// \attention lower is equivalent to /[[:lower:]]/ in perl. ~lower is equivalent sl@0: /// to /[[:^lower:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const lower = {"lower"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a printable character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are printable. sl@0: /// To match any character that is not printable, use ~print. sl@0: /// sl@0: /// \attention print is equivalent to /[[:print:]]/ in perl. ~print is equivalent sl@0: /// to /[[:^print:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const print = {"print"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a punctuation character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are punctuation. sl@0: /// To match any character that is not punctuation, use ~punct. sl@0: /// sl@0: /// \attention punct is equivalent to /[[:punct:]]/ in perl. ~punct is equivalent sl@0: /// to /[[:^punct:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const punct = {"punct"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a space character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are space characters. sl@0: /// To match any character that is not white-space, use ~space. sl@0: /// sl@0: /// \attention space is equivalent to /[[:space:]]/ in perl. ~space is equivalent sl@0: /// to /[[:^space:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const space = {"space"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches an upper-case character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are upper-case. sl@0: /// To match any character that is not upper-case, use ~upper. sl@0: /// sl@0: /// \attention upper is equivalent to /[[:upper:]]/ in perl. ~upper is equivalent sl@0: /// to /[[:^upper:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const upper = {"upper"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a hexadecimal digit character. sl@0: /// sl@0: /// The regex traits are used to determine which characters are hex digits. sl@0: /// To match any character that is not a hex digit, use ~xdigit. sl@0: /// sl@0: /// \attention xdigit is equivalent to /[[:xdigit:]]/ in perl. ~xdigit is equivalent sl@0: /// to /[[:^xdigit:]]/ in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const xdigit = {"xdigit"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Beginning of sequence assertion. sl@0: /// sl@0: /// For the character sequence [begin, end), 'bos' matches the sl@0: /// zero-width sub-sequence [begin, begin). sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const bos = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief End of sequence assertion. sl@0: /// sl@0: /// For the character sequence [begin, end), sl@0: /// 'eos' matches the zero-width sub-sequence [end, end). sl@0: /// sl@0: /// \attention Unlike the perl end of sequence assertion \$, 'eos' will sl@0: /// not match at the position [end-1, end-1) if *(end-1) is '\\n'. To sl@0: /// get that behavior, use (!_n >> eos). sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const eos = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Beginning of line assertion. sl@0: /// sl@0: /// 'bol' matches the zero-width sub-sequence sl@0: /// immediately following a logical newline sequence. The regex traits sl@0: /// is used to determine what constitutes a logical newline sequence. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const bol = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief End of line assertion. sl@0: /// sl@0: /// 'eol' matches the zero-width sub-sequence sl@0: /// immediately preceeding a logical newline sequence. The regex traits sl@0: /// is used to determine what constitutes a logical newline sequence. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const eol = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Beginning of word assertion. sl@0: /// sl@0: /// 'bow' matches the zero-width sub-sequence sl@0: /// immediately following a non-word character and preceeding a word character. sl@0: /// The regex traits are used to determine what constitutes a word character. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const bow = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief End of word assertion. sl@0: /// sl@0: /// 'eow' matches the zero-width sub-sequence sl@0: /// immediately following a word character and preceeding a non-word character. sl@0: /// The regex traits are used to determine what constitutes a word character. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const eow = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Word boundary assertion. sl@0: /// sl@0: /// '_b' matches the zero-width sub-sequence at the beginning or the end of a word. sl@0: /// It is equivalent to (bow | eow). The regex traits are used to determine what sl@0: /// constitutes a word character. To match a non-word boundary, use ~_b. sl@0: /// sl@0: /// \attention _b is like \\b in perl. ~_b is like \\B in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const _b = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a word character. sl@0: /// sl@0: /// '_w' matches a single word character. The regex traits are used to determine which sl@0: /// characters are word characters. Use ~_w to match a character that is not a word sl@0: /// character. sl@0: /// sl@0: /// \attention _w is like \\w in perl. ~_w is like \\W in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const _w = {"w"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a digit character. sl@0: /// sl@0: /// '_d' matches a single digit character. The regex traits are used to determine which sl@0: /// characters are digits. Use ~_d to match a character that is not a digit sl@0: /// character. sl@0: /// sl@0: /// \attention _d is like \\d in perl. ~_d is like \\D in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const _d = {"d"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a space character. sl@0: /// sl@0: /// '_s' matches a single space character. The regex traits are used to determine which sl@0: /// characters are space characters. Use ~_s to match a character that is not a space sl@0: /// character. sl@0: /// sl@0: /// \attention _s is like \\s in perl. ~_s is like \\S in perl. sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: , char const * sl@0: > const _s = {"s"}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a literal newline character, '\\n'. sl@0: /// sl@0: /// '_n' matches a single newline character, '\\n'. Use ~_n to match a character sl@0: /// that is not a newline. sl@0: /// sl@0: /// \attention ~_n is like '.' in perl without the /s modifier. sl@0: proto::op_proxy< sl@0: proto::unary_op, proto::noop_tag> sl@0: , char sl@0: > const _n = {'\n'}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches a logical newline sequence. sl@0: /// sl@0: /// '_ln' matches a logical newline sequence. This can be any character in the sl@0: /// line separator class, as determined by the regex traits, or the '\\r\\n' sequence. sl@0: /// For the purpose of back-tracking, '\\r\\n' is treated as a unit. sl@0: /// To match any one character that is not a logical newline, use ~_ln. sl@0: proto::op_proxy< sl@0: detail::logical_newline_xpression sl@0: > const _ln = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Matches any one character. sl@0: /// sl@0: /// Match any character, similar to '.' in perl syntax with the /s modifier. sl@0: /// '_' matches any one character, including the newline. sl@0: /// sl@0: /// \attention To match any character except the newline, use ~_n sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const _ = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Reference to the current regex object sl@0: /// sl@0: /// Useful when constructing recursive regular expression objects. The 'self' sl@0: /// identifier is a short-hand for the current regex object. For instance, sl@0: /// sregex rx = '(' >> (self | nil) >> ')'; will create a regex object that sl@0: /// matches balanced parens such as "((()))". sl@0: proto::op_proxy< sl@0: proto::unary_op sl@0: > const self = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Used to create character sets. sl@0: /// sl@0: /// There are two ways to create character sets with the 'set' identifier. The sl@0: /// easiest is to create a comma-separated list of the characters in the set, sl@0: /// as in (set= 'a','b','c'). This set will match 'a', 'b', or 'c'. The other sl@0: /// way is to define the set as an argument to the set subscript operator. sl@0: /// For instance, set[ 'a' | range('b','c') | digit ] will match an 'a', 'b', sl@0: /// 'c' or a digit character. sl@0: /// sl@0: /// To complement a set, apply the '~' operator. For instance, ~(set= 'a','b','c') sl@0: /// will match any character that is not an 'a', 'b', or 'c'. sl@0: /// sl@0: /// Sets can be composed of other, possibly complemented, sets. For instance, sl@0: /// set[ ~digit | ~(set= 'a','b','c') ]. sl@0: proto::op_proxy< sl@0: detail::set_initializer_type sl@0: > const set = {}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Sub-match placeholder, like $& in Perl sl@0: proto::op_proxy const s0 = {0}; sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Sub-match placeholder, like $1 in perl. sl@0: /// sl@0: /// To create a sub-match, assign a sub-expression to the sub-match placeholder. sl@0: /// For instance, (s1= _) will match any one character and remember which sl@0: /// character was matched in the 1st sub-match. Later in the pattern, you can sl@0: /// refer back to the sub-match. For instance, (s1= _) >> s1 will match any sl@0: /// character, and then match the same character again. sl@0: /// sl@0: /// After a successful regex_match() or regex_search(), the sub-match placeholders sl@0: /// can be used to index into the match_results\<\> object to retrieve the Nth sl@0: /// sub-match. sl@0: proto::op_proxy const s1 = {1}; sl@0: proto::op_proxy const s2 = {2}; sl@0: proto::op_proxy const s3 = {3}; sl@0: proto::op_proxy const s4 = {4}; sl@0: proto::op_proxy const s5 = {5}; sl@0: proto::op_proxy const s6 = {6}; sl@0: proto::op_proxy const s7 = {7}; sl@0: proto::op_proxy const s8 = {8}; sl@0: proto::op_proxy const s9 = {9}; sl@0: sl@0: // NOTE: For the purpose of xpressive's documentation, make icase() look like an sl@0: // ordinary function. In reality, it is a function object defined in detail/icase.hpp sl@0: // so that it can serve double-duty as regex_constants::icase, the syntax_option_type. sl@0: // Do the same for as_xpr(), which is actually defined in detail/static/as_xpr.hpp sl@0: #ifdef BOOST_XPRESSIVE_DOXYGEN_INVOKED sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Makes a literal into a regular expression. sl@0: /// sl@0: /// Use as_xpr() to turn a literal into a regular expression. For instance, sl@0: /// "foo" >> "bar" will not compile because both operands to the right-shift sl@0: /// operator are const char*, and no such operator exists. Use as_xpr("foo") >> "bar" sl@0: /// instead. sl@0: /// sl@0: /// You can use as_xpr() with character literals in addition to string literals. sl@0: /// For instance, as_xpr('a') will match an 'a'. You can also complement a sl@0: /// character literal, as with ~as_xpr('a'). This will match any one character sl@0: /// that is not an 'a'. sl@0: template sl@0: inline typename detail::as_xpr_type::const_reference sl@0: as_xpr(Literal const &literal) sl@0: { sl@0: return detail::as_xpr_type::call(xpr); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Makes a sub-expression case-insensitive. sl@0: /// sl@0: /// Use icase() to make a sub-expression case-insensitive. For instance, sl@0: /// "foo" >> icase(set['b'] >> "ar") will match "foo" exactly followed by sl@0: /// "bar" irrespective of case. sl@0: template sl@0: inline proto::binary_op::type, modifier_tag> const sl@0: icase(Xpr const &xpr) sl@0: { sl@0: detail::icase_modifier mod; sl@0: return proto::make_op(mod, as_xpr(xpr)); sl@0: } sl@0: #endif sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Embed a regex object by reference. sl@0: /// sl@0: /// \param rex The basic_regex object to embed by reference. sl@0: template sl@0: inline proto::unary_op, proto::noop_tag> const sl@0: by_ref(basic_regex const &rex) sl@0: { sl@0: typedef detail::core_access access; sl@0: shared_ptr > impl = access::get_regex_impl(rex); sl@0: return proto::noop(detail::regex_placeholder(impl)); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Match a range of characters. sl@0: /// sl@0: /// Match any character in the range [ch_min, ch_max]. sl@0: /// sl@0: /// \param ch_min The lower end of the range to match. sl@0: /// \param ch_max The upper end of the range to match. sl@0: template sl@0: inline proto::unary_op, proto::noop_tag> const sl@0: range(Char ch_min, Char ch_max) sl@0: { sl@0: return proto::noop(detail::range_placeholder(ch_min, ch_max)); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Make a sub-expression optional. Equivalent to !as_xpr(xpr). sl@0: /// sl@0: /// \param xpr The sub-expression to make optional. sl@0: template sl@0: inline proto::unary_op sl@0: < sl@0: typename detail::as_xpr_type::type sl@0: , proto::logical_not_tag sl@0: > const sl@0: optional(Xpr const &xpr) sl@0: { sl@0: return !as_xpr(xpr); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Repeat a sub-expression multiple times. sl@0: /// sl@0: /// There are two forms of the repeat\<\>() function template. To match a sl@0: /// sub-expression N times, use repeat\(xpr). To match a sub-expression sl@0: /// from M to N times, use repeat\(xpr). sl@0: /// sl@0: /// The repeat\<\>() function creates a greedy quantifier. To make the quantifier sl@0: /// non-greedy, apply the unary minus operator, as in -repeat\(xpr). sl@0: /// sl@0: /// \param xpr The sub-expression to repeat. sl@0: template sl@0: inline proto::unary_op sl@0: < sl@0: typename detail::as_xpr_type::type sl@0: , detail::generic_quant_tag sl@0: > const sl@0: repeat(Xpr const &xpr) sl@0: { sl@0: return proto::make_op >(as_xpr(xpr)); sl@0: } sl@0: sl@0: /// \overload sl@0: template sl@0: inline proto::unary_op sl@0: < sl@0: typename detail::as_xpr_type::type sl@0: , detail::generic_quant_tag sl@0: > const sl@0: repeat(Xpr2 const &xpr) sl@0: { sl@0: return proto::make_op >(as_xpr(xpr)); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Create an independent sub-expression. sl@0: /// sl@0: /// Turn off back-tracking for a sub-expression. Any branches or repeats within sl@0: /// the sub-expression will match only one way, and no other alternatives are sl@0: /// tried. sl@0: /// sl@0: /// \attention keep(xpr) is equivalent to the perl (?>...) extension. sl@0: /// sl@0: /// \param xpr The sub-expression to modify. sl@0: template sl@0: inline proto::unary_op sl@0: < sl@0: typename detail::as_xpr_type::type sl@0: , detail::keeper_tag sl@0: > const sl@0: keep(Xpr const &xpr) sl@0: { sl@0: return proto::make_op(as_xpr(xpr)); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Look-ahead assertion. sl@0: /// sl@0: /// before(xpr) succeeds if the xpr sub-expression would match at the current sl@0: /// position in the sequence, but xpr is not included in the match. For instance, sl@0: /// before("foo") succeeds if we are before a "foo". Look-ahead assertions can be sl@0: /// negated with the bit-compliment operator. sl@0: /// sl@0: /// \attention before(xpr) is equivalent to the perl (?=...) extension. sl@0: /// ~before(xpr) is a negative look-ahead assertion, equivalent to the sl@0: /// perl (?!...) extension. sl@0: /// sl@0: /// \param xpr The sub-expression to put in the look-ahead assertion. sl@0: template sl@0: inline proto::unary_op sl@0: < sl@0: typename detail::as_xpr_type::type sl@0: , detail::lookahead_tag sl@0: > const sl@0: before(Xpr const &xpr) sl@0: { sl@0: return proto::make_op >(as_xpr(xpr)); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Look-behind assertion. sl@0: /// sl@0: /// after(xpr) succeeds if the xpr sub-expression would match at the current sl@0: /// position minus N in the sequence, where N is the width of xpr. xpr is not included in sl@0: /// the match. For instance, after("foo") succeeds if we are after a "foo". Look-behind sl@0: /// assertions can be negated with the bit-complement operator. sl@0: /// sl@0: /// \attention after(xpr) is equivalent to the perl (?<=...) extension. sl@0: /// ~after(xpr) is a negative look-behind assertion, equivalent to the sl@0: /// perl (? sl@0: inline proto::unary_op sl@0: < sl@0: typename detail::as_xpr_type::type sl@0: , detail::lookbehind_tag sl@0: > const sl@0: after(Xpr const &xpr) sl@0: { sl@0: return proto::make_op >(as_xpr(xpr)); sl@0: } sl@0: sl@0: /////////////////////////////////////////////////////////////////////////////// sl@0: /// \brief Specify a regex traits or a std::locale. sl@0: /// sl@0: /// imbue() instructs the regex engine to use the specified traits or locale sl@0: /// when matching the regex. The entire expression must use the same traits/locale. sl@0: /// For instance, the following specifies a locale for use with a regex: sl@0: /// std::locale loc; sl@0: /// sregex rx = imbue(loc)(+digit); sl@0: /// sl@0: /// \param loc The std::locale or regex traits object. sl@0: template sl@0: inline detail::modifier_op > const sl@0: imbue(Locale const &loc) sl@0: { sl@0: detail::modifier_op > mod = sl@0: { sl@0: detail::locale_modifier(loc) sl@0: , regex_constants::ECMAScript sl@0: }; sl@0: return mod; sl@0: } sl@0: sl@0: }} // namespace boost::xpressive sl@0: sl@0: #endif