You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and dots ('.'), can be up to 35 characters long. Letters must be lowercase.
260 lines
8.6 KiB
260 lines
8.6 KiB
///////////////////////////////////////////////////////////////////////////////
/// \file regex_iterator.hpp
/// Contains the definition of the regex_iterator type, an STL-compatible iterator
/// for stepping through all the matches in a sequence.
//
// Copyright 2008 Eric Niebler. Distributed under the Boost
// Software License, Version 1.0. (See accompanying file
// LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
|
|
#ifndef BOOST_XPRESSIVE_REGEX_ITERATOR_HPP_EAN_10_04_2005 |
|
#define BOOST_XPRESSIVE_REGEX_ITERATOR_HPP_EAN_10_04_2005 |
|
|
|
// MS compatible compilers support #pragma once |
|
#if defined(_MSC_VER) && (_MSC_VER >= 1020) |
|
# pragma once |
|
#endif |
|
|
|
#include <boost/noncopyable.hpp> |
|
#include <boost/intrusive_ptr.hpp> |
|
#include <boost/iterator/iterator_traits.hpp> |
|
#include <boost/xpressive/detail/detail_fwd.hpp> |
|
#include <boost/xpressive/detail/core/access.hpp> |
|
#include <boost/xpressive/detail/utility/counted_base.hpp> |
|
|
|
namespace boost { namespace xpressive { namespace detail |
|
{ |
|
|
|
////////////////////////////////////////////////////////////////////////// |
|
// regex_iterator_impl |
|
// |
|
template<typename BidiIter> |
|
struct regex_iterator_impl |
|
: counted_base<regex_iterator_impl<BidiIter> > |
|
{ |
|
typedef detail::core_access<BidiIter> access; |
|
|
|
regex_iterator_impl |
|
( |
|
BidiIter begin |
|
, BidiIter cur |
|
, BidiIter end |
|
, BidiIter next_search |
|
, basic_regex<BidiIter> const &rex |
|
, regex_constants::match_flag_type flags |
|
, bool not_null = false |
|
) |
|
: rex_(rex) |
|
, what_() |
|
, state_(begin, end, what_, *access::get_regex_impl(rex_), flags) |
|
, flags_(flags) |
|
, not_null_(not_null) |
|
{ |
|
this->state_.cur_ = cur; |
|
this->state_.next_search_ = next_search; |
|
} |
|
|
|
bool next() |
|
{ |
|
this->state_.reset(this->what_, *access::get_regex_impl(this->rex_)); |
|
if(!regex_search_impl(this->state_, this->rex_, this->not_null_)) |
|
{ |
|
return false; |
|
} |
|
|
|
// Report position() correctly by setting the base different from prefix().first |
|
access::set_base(this->what_, this->state_.begin_); |
|
|
|
this->state_.cur_ = this->state_.next_search_ = this->what_[0].second; |
|
this->not_null_ = (0 == this->what_.length()); |
|
|
|
return true; |
|
} |
|
|
|
bool equal_to(regex_iterator_impl<BidiIter> const &that) const |
|
{ |
|
return this->rex_.regex_id() == that.rex_.regex_id() |
|
&& this->state_.begin_ == that.state_.begin_ |
|
&& this->state_.cur_ == that.state_.cur_ |
|
&& this->state_.end_ == that.state_.end_ |
|
&& this->flags_ == that.flags_ |
|
; |
|
} |
|
|
|
basic_regex<BidiIter> rex_; |
|
match_results<BidiIter> what_; |
|
match_state<BidiIter> state_; |
|
regex_constants::match_flag_type const flags_; |
|
bool not_null_; |
|
}; |
|
|
|
} // namespace detail |
|
|
|
////////////////////////////////////////////////////////////////////////// |
|
// regex_iterator |
|
// |
|
template<typename BidiIter> |
|
struct regex_iterator |
|
{ |
|
typedef basic_regex<BidiIter> regex_type; |
|
typedef match_results<BidiIter> value_type; |
|
typedef typename iterator_difference<BidiIter>::type difference_type; |
|
typedef value_type const *pointer; |
|
typedef value_type const &reference; |
|
typedef std::forward_iterator_tag iterator_category; |
|
|
|
/// INTERNAL ONLY |
|
typedef detail::regex_iterator_impl<BidiIter> impl_type_; |
|
|
|
regex_iterator() |
|
: impl_() |
|
{ |
|
} |
|
|
|
regex_iterator |
|
( |
|
BidiIter begin |
|
, BidiIter end |
|
, basic_regex<BidiIter> const &rex |
|
, regex_constants::match_flag_type flags = regex_constants::match_default |
|
) |
|
: impl_() |
|
{ |
|
if(0 != rex.regex_id()) // Empty regexes are guaranteed to match nothing |
|
{ |
|
this->impl_ = new impl_type_(begin, begin, end, begin, rex, flags); |
|
this->next_(); |
|
} |
|
} |
|
|
|
template<typename LetExpr> |
|
regex_iterator |
|
( |
|
BidiIter begin |
|
, BidiIter end |
|
, basic_regex<BidiIter> const &rex |
|
, detail::let_<LetExpr> const &args |
|
, regex_constants::match_flag_type flags = regex_constants::match_default |
|
) |
|
: impl_() |
|
{ |
|
if(0 != rex.regex_id()) // Empty regexes are guaranteed to match nothing |
|
{ |
|
this->impl_ = new impl_type_(begin, begin, end, begin, rex, flags); |
|
detail::bind_args(args, this->impl_->what_); |
|
this->next_(); |
|
} |
|
} |
|
|
|
regex_iterator(regex_iterator<BidiIter> const &that) |
|
: impl_(that.impl_) // COW |
|
{ |
|
} |
|
|
|
regex_iterator<BidiIter> &operator =(regex_iterator<BidiIter> const &that) |
|
{ |
|
this->impl_ = that.impl_; // COW |
|
return *this; |
|
} |
|
|
|
friend bool operator ==(regex_iterator<BidiIter> const &left, regex_iterator<BidiIter> const &right) |
|
{ |
|
if(!left.impl_ || !right.impl_) |
|
{ |
|
return !left.impl_ && !right.impl_; |
|
} |
|
|
|
return left.impl_->equal_to(*right.impl_); |
|
} |
|
|
|
friend bool operator !=(regex_iterator<BidiIter> const &left, regex_iterator<BidiIter> const &right) |
|
{ |
|
return !(left == right); |
|
} |
|
|
|
value_type const &operator *() const |
|
{ |
|
return this->impl_->what_; |
|
} |
|
|
|
value_type const *operator ->() const |
|
{ |
|
return &this->impl_->what_; |
|
} |
|
|
|
/// If what.prefix().first != what[0].second and if the element match_prev_avail is not set in |
|
/// flags then sets it. Then behaves as if by calling regex_search(what[0].second, end, what, *pre, flags), |
|
/// with the following variation: in the event that the previous match found was of zero length |
|
/// (what[0].length() == 0) then attempts to find a non-zero length match starting at what[0].second, |
|
/// only if that fails and provided what[0].second != suffix().second does it look for a (possibly |
|
/// zero length) match starting from what[0].second + 1. If no further match is found then sets |
|
/// *this equal to the end of sequence iterator. |
|
/// \post (*this)-\>size() == pre-\>mark_count() + 1 |
|
/// \post (*this)-\>empty() == false |
|
/// \post (*this)-\>prefix().first == An iterator denoting the end point of the previous match found |
|
/// \post (*this)-\>prefix().last == (**this)[0].first |
|
/// \post (*this)-\>prefix().matched == (*this)-\>prefix().first != (*this)-\>prefix().second |
|
/// \post (*this)-\>suffix().first == (**this)[0].second |
|
/// \post (*this)-\>suffix().last == end |
|
/// \post (*this)-\>suffix().matched == (*this)-\>suffix().first != (*this)-\>suffix().second |
|
/// \post (**this)[0].first == The starting iterator for this match. |
|
/// \post (**this)[0].second == The ending iterator for this match. |
|
/// \post (**this)[0].matched == true if a full match was found, and false if it was a partial match (found as a result of the match_partial flag being set). |
|
/// \post (**this)[n].first == For all integers n \< (*this)-\>size(), the start of the sequence that matched sub-expression n. Alternatively, if sub-expression n did not participate in the match, then end. |
|
/// \post (**this)[n].second == For all integers n \< (*this)-\>size(), the end of the sequence that matched sub-expression n. Alternatively, if sub-expression n did not participate in the match, then end. |
|
/// \post (**this)[n].matched == For all integers n \< (*this)-\>size(), true if sub-expression n participated in the match, false otherwise. |
|
/// \post (*this)-\>position() == The distance from the start of the original sequence being iterated, to the start of this match. |
|
regex_iterator<BidiIter> &operator ++() |
|
{ |
|
this->fork_(); // un-share the implementation |
|
this->next_(); |
|
return *this; |
|
} |
|
|
|
regex_iterator<BidiIter> operator ++(int) |
|
{ |
|
regex_iterator<BidiIter> tmp(*this); |
|
++*this; |
|
return tmp; |
|
} |
|
|
|
private: |
|
|
|
/// INTERNAL ONLY |
|
void fork_() |
|
{ |
|
if(1 != this->impl_->use_count()) |
|
{ |
|
// This is OK, the use_count is > 1 |
|
impl_type_ *that = this->impl_.get(); |
|
this->impl_ = new impl_type_ |
|
( |
|
that->state_.begin_ |
|
, that->state_.cur_ |
|
, that->state_.end_ |
|
, that->state_.next_search_ |
|
, that->rex_ |
|
, that->flags_ |
|
, that->not_null_ |
|
); |
|
detail::core_access<BidiIter>::get_action_args(this->impl_->what_) |
|
= detail::core_access<BidiIter>::get_action_args(that->what_); |
|
} |
|
} |
|
|
|
/// INTERNAL ONLY |
|
void next_() |
|
{ |
|
BOOST_ASSERT(this->impl_ && 1 == this->impl_->use_count()); |
|
if(!this->impl_->next()) |
|
{ |
|
this->impl_ = 0; |
|
} |
|
} |
|
|
|
intrusive_ptr<impl_type_> impl_; |
|
}; |
|
|
|
}} // namespace boost::xpressive |
|
|
|
#endif
|
|
|