249 lines
9.1 KiB
C++
249 lines
9.1 KiB
C++
|
// Copyright (c) 2001-2011 Hartmut Kaiser
|
||
|
//
|
||
|
// Distributed under the Boost Software License, Version 1.0. (See accompanying
|
||
|
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
||
|
|
||
|
#if !defined(BOOST_SPIRIT_LEX_TOKEN_DEF_MAR_13_2007_0145PM)
|
||
|
#define BOOST_SPIRIT_LEX_TOKEN_DEF_MAR_13_2007_0145PM
|
||
|
|
||
|
#if defined(_MSC_VER)
|
||
|
#pragma once
|
||
|
#endif
|
||
|
|
||
|
#include <boost/spirit/home/support/unused.hpp>
|
||
|
#include <boost/spirit/home/support/argument.hpp>
|
||
|
#include <boost/spirit/home/support/info.hpp>
|
||
|
#include <boost/spirit/home/support/handles_container.hpp>
|
||
|
#include <boost/spirit/home/qi/parser.hpp>
|
||
|
#include <boost/spirit/home/qi/skip_over.hpp>
|
||
|
#include <boost/spirit/home/qi/detail/construct.hpp>
|
||
|
#include <boost/spirit/home/qi/detail/assign_to.hpp>
|
||
|
#include <boost/spirit/home/lex/reference.hpp>
|
||
|
#include <boost/spirit/home/lex/lexer_type.hpp>
|
||
|
#include <boost/spirit/home/lex/lexer/terminals.hpp>
|
||
|
|
||
|
#include <boost/fusion/include/vector.hpp>
|
||
|
#include <boost/mpl/if.hpp>
|
||
|
#include <boost/proto/extends.hpp>
|
||
|
#include <boost/proto/traits.hpp>
|
||
|
#include <boost/type_traits/is_same.hpp>
|
||
|
#include <boost/variant.hpp>
|
||
|
|
||
|
#include <iterator> // for std::iterator_traits
|
||
|
#include <string>
|
||
|
#include <cstdlib>
|
||
|
|
||
|
#if defined(BOOST_MSVC)
|
||
|
# pragma warning(push)
|
||
|
# pragma warning(disable: 4355) // 'this' : used in base member initializer list warning
|
||
|
#endif
|
||
|
|
||
|
namespace boost { namespace spirit { namespace lex
|
||
|
{
|
||
|
///////////////////////////////////////////////////////////////////////////
|
||
|
// This component represents a token definition
|
||
|
///////////////////////////////////////////////////////////////////////////
|
||
|
template<typename Attribute = unused_type
|
||
|
, typename Char = char
|
||
|
, typename Idtype = std::size_t>
|
||
|
struct token_def
|
||
|
: proto::extends<
|
||
|
typename proto::terminal<
|
||
|
lex::reference<token_def<Attribute, Char, Idtype> const, Idtype>
|
||
|
>::type
|
||
|
, token_def<Attribute, Char, Idtype> >
|
||
|
, qi::parser<token_def<Attribute, Char, Idtype> >
|
||
|
, lex::lexer_type<token_def<Attribute, Char, Idtype> >
|
||
|
{
|
||
|
private:
|
||
|
// initialize proto base class
|
||
|
typedef lex::reference<token_def const, Idtype> reference_;
|
||
|
typedef typename proto::terminal<reference_>::type terminal_type;
|
||
|
typedef proto::extends<terminal_type, token_def> proto_base_type;
|
||
|
|
||
|
static std::size_t const all_states_id = static_cast<std::size_t>(-2);
|
||
|
|
||
|
public:
|
||
|
// Qi interface: meta-function calculating parser return type
|
||
|
template <typename Context, typename Iterator>
|
||
|
struct attribute
|
||
|
{
|
||
|
// The return value of the token_def is either the specified
|
||
|
// attribute type, or the pair of iterators from the match of the
|
||
|
// corresponding token (if no attribute type has been specified),
|
||
|
// or unused_type (if omit has been specified).
|
||
|
typedef typename Iterator::base_iterator_type iterator_type;
|
||
|
typedef typename mpl::if_<
|
||
|
traits::not_is_unused<Attribute>
|
||
|
, typename mpl::if_<
|
||
|
is_same<Attribute, lex::omit>, unused_type, Attribute
|
||
|
>::type
|
||
|
, iterator_range<iterator_type>
|
||
|
>::type type;
|
||
|
};
|
||
|
|
||
|
public:
|
||
|
// Qi interface: parse functionality
|
||
|
template <typename Iterator, typename Context
|
||
|
, typename Skipper, typename Attribute_>
|
||
|
bool parse(Iterator& first, Iterator const& last
|
||
|
, Context& /*context*/, Skipper const& skipper
|
||
|
, Attribute_& attr) const
|
||
|
{
|
||
|
qi::skip_over(first, last, skipper); // always do a pre-skip
|
||
|
|
||
|
if (first != last) {
|
||
|
typedef typename
|
||
|
std::iterator_traits<Iterator>::value_type
|
||
|
token_type;
|
||
|
|
||
|
// If the following assertion fires you probably forgot to
|
||
|
// associate this token definition with a lexer instance.
|
||
|
BOOST_ASSERT(std::size_t(~0) != token_state_);
|
||
|
|
||
|
token_type const& t = *first;
|
||
|
if (token_id_ == t.id() &&
|
||
|
(all_states_id == token_state_ || token_state_ == t.state()))
|
||
|
{
|
||
|
spirit::traits::assign_to(t, attr);
|
||
|
++first;
|
||
|
return true;
|
||
|
}
|
||
|
}
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
template <typename Context>
|
||
|
info what(Context& /*context*/) const
|
||
|
{
|
||
|
if (0 == def_.which())
|
||
|
return info("token_def", boost::get<string_type>(def_));
|
||
|
|
||
|
return info("token_def", boost::get<char_type>(def_));
|
||
|
}
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
// Lex interface: collect token definitions and put it into the
|
||
|
// provided lexer def
|
||
|
template <typename LexerDef, typename String>
|
||
|
void collect(LexerDef& lexdef, String const& state
|
||
|
, String const& targetstate) const
|
||
|
{
|
||
|
std::size_t state_id = lexdef.add_state(state.c_str());
|
||
|
|
||
|
// If the following assertion fires you are probably trying to use
|
||
|
// a single token_def instance in more than one lexer state. This
|
||
|
// is not possible. Please create a separate token_def instance
|
||
|
// from the same regular expression for each lexer state it needs
|
||
|
// to be associated with.
|
||
|
BOOST_ASSERT(
|
||
|
(std::size_t(~0) == token_state_ || state_id == token_state_) &&
|
||
|
"Can't use single token_def with more than one lexer state");
|
||
|
|
||
|
char_type const* target = targetstate.empty() ? 0 : targetstate.c_str();
|
||
|
if (target)
|
||
|
lexdef.add_state(target);
|
||
|
|
||
|
token_state_ = state_id;
|
||
|
if (0 == token_id_)
|
||
|
token_id_ = lexdef.get_next_id();
|
||
|
|
||
|
if (0 == def_.which()) {
|
||
|
unique_id_ = lexdef.add_token(state.c_str()
|
||
|
, boost::get<string_type>(def_), token_id_, target);
|
||
|
}
|
||
|
else {
|
||
|
unique_id_ = lexdef.add_token(state.c_str()
|
||
|
, boost::get<char_type>(def_), token_id_, target);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
template <typename LexerDef>
|
||
|
void add_actions(LexerDef&) const {}
|
||
|
|
||
|
public:
|
||
|
typedef Char char_type;
|
||
|
typedef Idtype id_type;
|
||
|
typedef std::basic_string<char_type> string_type;
|
||
|
|
||
|
// Lex interface: constructing token definitions
|
||
|
token_def()
|
||
|
: proto_base_type(terminal_type::make(reference_(*this)))
|
||
|
, def_('\0'), token_id_()
|
||
|
, unique_id_(std::size_t(~0)), token_state_(std::size_t(~0)) {}
|
||
|
|
||
|
token_def(token_def const& rhs)
|
||
|
: proto_base_type(terminal_type::make(reference_(*this)))
|
||
|
, def_(rhs.def_), token_id_(rhs.token_id_)
|
||
|
, unique_id_(rhs.unique_id_), token_state_(rhs.token_state_) {}
|
||
|
|
||
|
explicit token_def(char_type def_, Idtype id_ = Idtype())
|
||
|
: proto_base_type(terminal_type::make(reference_(*this)))
|
||
|
, def_(def_)
|
||
|
, token_id_(Idtype() == id_ ? Idtype(def_) : id_)
|
||
|
, unique_id_(std::size_t(~0)), token_state_(std::size_t(~0)) {}
|
||
|
|
||
|
explicit token_def(string_type const& def_, Idtype id_ = Idtype())
|
||
|
: proto_base_type(terminal_type::make(reference_(*this)))
|
||
|
, def_(def_), token_id_(id_)
|
||
|
, unique_id_(std::size_t(~0)), token_state_(std::size_t(~0)) {}
|
||
|
|
||
|
template <typename String>
|
||
|
token_def& operator= (String const& definition)
|
||
|
{
|
||
|
def_ = definition;
|
||
|
token_id_ = Idtype();
|
||
|
unique_id_ = std::size_t(~0);
|
||
|
token_state_ = std::size_t(~0);
|
||
|
return *this;
|
||
|
}
|
||
|
token_def& operator= (token_def const& rhs)
|
||
|
{
|
||
|
def_ = rhs.def_;
|
||
|
token_id_ = rhs.token_id_;
|
||
|
unique_id_ = rhs.unique_id_;
|
||
|
token_state_ = rhs.token_state_;
|
||
|
return *this;
|
||
|
}
|
||
|
|
||
|
// general accessors
|
||
|
Idtype const& id() const { return token_id_; }
|
||
|
void id(Idtype const& id) { token_id_ = id; }
|
||
|
std::size_t unique_id() const { return unique_id_; }
|
||
|
|
||
|
string_type definition() const
|
||
|
{
|
||
|
return (0 == def_.which()) ?
|
||
|
boost::get<string_type>(def_) :
|
||
|
string_type(1, boost::get<char_type>(def_));
|
||
|
}
|
||
|
std::size_t state() const { return token_state_; }
|
||
|
|
||
|
private:
|
||
|
variant<string_type, char_type> def_;
|
||
|
mutable Idtype token_id_;
|
||
|
mutable std::size_t unique_id_;
|
||
|
mutable std::size_t token_state_;
|
||
|
};
|
||
|
}}}
|
||
|
|
||
|
namespace boost { namespace spirit { namespace traits
|
||
|
{
|
||
|
///////////////////////////////////////////////////////////////////////////
|
||
|
template<typename Attribute, typename Char, typename Idtype
|
||
|
, typename Attr, typename Context, typename Iterator>
|
||
|
struct handles_container<
|
||
|
lex::token_def<Attribute, Char, Idtype>, Attr, Context, Iterator>
|
||
|
: traits::is_container<
|
||
|
typename attribute_of<
|
||
|
lex::token_def<Attribute, Char, Idtype>, Context, Iterator
|
||
|
>::type>
|
||
|
{};
|
||
|
}}}
|
||
|
|
||
|
#if defined(BOOST_MSVC)
|
||
|
# pragma warning(pop)
|
||
|
#endif
|
||
|
|
||
|
#endif
|