// boost/spirit/home/lex/lexer/token_def.hpp
// Copyright (c) 2001-2011 Hartmut Kaiser
//
// Distributed under the Boost Software License, Version 1.0. (See accompanying
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
#if !defined(BOOST_SPIRIT_LEX_TOKEN_DEF_MAR_13_2007_0145PM)
#define BOOST_SPIRIT_LEX_TOKEN_DEF_MAR_13_2007_0145PM
#if defined(_MSC_VER)
#pragma once
#endif
#include <boost/spirit/home/support/unused.hpp>
#include <boost/spirit/home/support/argument.hpp>
#include <boost/spirit/home/support/info.hpp>
#include <boost/spirit/home/support/handles_container.hpp>
#include <boost/spirit/home/qi/parser.hpp>
#include <boost/spirit/home/qi/skip_over.hpp>
#include <boost/spirit/home/qi/detail/construct.hpp>
#include <boost/spirit/home/qi/detail/assign_to.hpp>
#include <boost/spirit/home/lex/reference.hpp>
#include <boost/spirit/home/lex/lexer_type.hpp>
#include <boost/spirit/home/lex/lexer/terminals.hpp>
#include <boost/fusion/include/vector.hpp>
#include <boost/mpl/if.hpp>
#include <boost/proto/extends.hpp>
#include <boost/proto/traits.hpp>
#include <boost/type_traits/is_same.hpp>
#include <boost/variant.hpp>
#include <iterator> // for std::iterator_traits
#include <string>
#include <cstdlib>
#if defined(BOOST_MSVC)
# pragma warning(push)
# pragma warning(disable: 4355) // 'this' : used in base member initializer list warning
#endif
namespace boost { namespace spirit { namespace lex
{
///////////////////////////////////////////////////////////////////////////
// This component represents a token definition
///////////////////////////////////////////////////////////////////////////
template<typename Attribute = unused_type
, typename Char = char
, typename Idtype = std::size_t>
struct token_def
: proto::extends<
typename proto::terminal<
lex::reference<token_def<Attribute, Char, Idtype> const, Idtype>
>::type
, token_def<Attribute, Char, Idtype> >
, qi::parser<token_def<Attribute, Char, Idtype> >
, lex::lexer_type<token_def<Attribute, Char, Idtype> >
{
private:
// initialize proto base class
typedef lex::reference<token_def const, Idtype> reference_;
typedef typename proto::terminal<reference_>::type terminal_type;
typedef proto::extends<terminal_type, token_def> proto_base_type;
static std::size_t const all_states_id = static_cast<std::size_t>(-2);
public:
// Qi interface: meta-function calculating parser return type
template <typename Context, typename Iterator>
struct attribute
{
// The return value of the token_def is either the specified
// attribute type, or the pair of iterators from the match of the
// corresponding token (if no attribute type has been specified),
// or unused_type (if omit has been specified).
typedef typename Iterator::base_iterator_type iterator_type;
typedef typename mpl::if_<
traits::not_is_unused<Attribute>
, typename mpl::if_<
is_same<Attribute, lex::omit>, unused_type, Attribute
>::type
, iterator_range<iterator_type>
>::type type;
};
public:
// Qi interface: parse functionality
template <typename Iterator, typename Context
, typename Skipper, typename Attribute_>
bool parse(Iterator& first, Iterator const& last
, Context& /*context*/, Skipper const& skipper
, Attribute_& attr) const
{
qi::skip_over(first, last, skipper); // always do a pre-skip
if (first != last) {
typedef typename
std::iterator_traits<Iterator>::value_type
token_type;
// If the following assertion fires you probably forgot to
// associate this token definition with a lexer instance.
BOOST_ASSERT(std::size_t(~0) != token_state_);
token_type const& t = *first;
if (token_id_ == t.id() &&
(all_states_id == token_state_ || token_state_ == t.state()))
{
spirit::traits::assign_to(t, attr);
++first;
return true;
}
}
return false;
}
template <typename Context>
info what(Context& /*context*/) const
{
if (0 == def_.which())
return info("token_def", boost::get<string_type>(def_));
return info("token_def", boost::get<char_type>(def_));
}
///////////////////////////////////////////////////////////////////////
// Lex interface: collect token definitions and put it into the
// provided lexer def
template <typename LexerDef, typename String>
void collect(LexerDef& lexdef, String const& state
, String const& targetstate) const
{
std::size_t state_id = lexdef.add_state(state.c_str());
// If the following assertion fires you are probably trying to use
// a single token_def instance in more than one lexer state. This
// is not possible. Please create a separate token_def instance
// from the same regular expression for each lexer state it needs
// to be associated with.
BOOST_ASSERT(
(std::size_t(~0) == token_state_ || state_id == token_state_) &&
"Can't use single token_def with more than one lexer state");
char_type const* target = targetstate.empty() ? 0 : targetstate.c_str();
if (target)
lexdef.add_state(target);
token_state_ = state_id;
if (0 == token_id_)
token_id_ = lexdef.get_next_id();
if (0 == def_.which()) {
unique_id_ = lexdef.add_token(state.c_str()
, boost::get<string_type>(def_), token_id_, target);
}
else {
unique_id_ = lexdef.add_token(state.c_str()
, boost::get<char_type>(def_), token_id_, target);
}
}
template <typename LexerDef>
void add_actions(LexerDef&) const {}
public:
typedef Char char_type;
typedef Idtype id_type;
typedef std::basic_string<char_type> string_type;
// Lex interface: constructing token definitions
token_def()
: proto_base_type(terminal_type::make(reference_(*this)))
, def_('\0'), token_id_()
, unique_id_(std::size_t(~0)), token_state_(std::size_t(~0)) {}
token_def(token_def const& rhs)
: proto_base_type(terminal_type::make(reference_(*this)))
, def_(rhs.def_), token_id_(rhs.token_id_)
, unique_id_(rhs.unique_id_), token_state_(rhs.token_state_) {}
explicit token_def(char_type def_, Idtype id_ = Idtype())
: proto_base_type(terminal_type::make(reference_(*this)))
, def_(def_)
, token_id_(Idtype() == id_ ? Idtype(def_) : id_)
, unique_id_(std::size_t(~0)), token_state_(std::size_t(~0)) {}
explicit token_def(string_type const& def_, Idtype id_ = Idtype())
: proto_base_type(terminal_type::make(reference_(*this)))
, def_(def_), token_id_(id_)
, unique_id_(std::size_t(~0)), token_state_(std::size_t(~0)) {}
template <typename String>
token_def& operator= (String const& definition)
{
def_ = definition;
token_id_ = Idtype();
unique_id_ = std::size_t(~0);
token_state_ = std::size_t(~0);
return *this;
}
token_def& operator= (token_def const& rhs)
{
def_ = rhs.def_;
token_id_ = rhs.token_id_;
unique_id_ = rhs.unique_id_;
token_state_ = rhs.token_state_;
return *this;
}
// general accessors
Idtype const& id() const { return token_id_; }
void id(Idtype const& id) { token_id_ = id; }
std::size_t unique_id() const { return unique_id_; }
string_type definition() const
{
return (0 == def_.which()) ?
boost::get<string_type>(def_) :
string_type(1, boost::get<char_type>(def_));
}
std::size_t state() const { return token_state_; }
private:
variant<string_type, char_type> def_;
mutable Idtype token_id_;
mutable std::size_t unique_id_;
mutable std::size_t token_state_;
};
}}}
namespace boost { namespace spirit { namespace traits
{
///////////////////////////////////////////////////////////////////////////
template<typename Attribute, typename Char, typename Idtype
, typename Attr, typename Context, typename Iterator>
struct handles_container<
lex::token_def<Attribute, Char, Idtype>, Attr, Context, Iterator>
: traits::is_container<
typename attribute_of<
lex::token_def<Attribute, Char, Idtype>, Context, Iterator
>::type>
{};
}}}
#if defined(BOOST_MSVC)
# pragma warning(pop)
#endif
#endif