/*
Ousía
Copyright (C) 2014, 2015 Benjamin Paaßen, Andreas Stöckel
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
/**
* @file ParserState.hpp
*
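* Defines the ParserState class used within the ParserStack pushdown
* automaton, the ParserStateBuilder class for convenient construction of
* ParserState instances, and the ParserStateDeductor class which deduces
* possibly active states from a signature of node types.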
*
* @author Andreas Stöckel (astoecke@techfak.uni-bielefeld.de)
*/
#ifndef _OUSIA_PARSER_STATE_HPP_
#define _OUSIA_PARSER_STATE_HPP_
#include <cstddef>
#include <unordered_map>
#include <unordered_set>
#include <vector>

// NOTE(review): the targets of the project includes were lost; the two paths
// below are reconstructed (they must provide Arguments, Rtti and RttiSet) --
// confirm against the source tree.
#include <core/common/Argument.hpp>
#include <core/common/Rtti.hpp>
namespace ousia {
// Forward declarations. ParserState is declared with the "struct" key so the
// declaration agrees with its definition further down in this header.
class ParserStateBuilder;
struct ParserState;
class HandlerData;
class Handler;

/**
 * Type of the factory functions stored in a ParserState: a plain function
 * pointer which receives a HandlerData reference and returns a pointer at a
 * Handler instance.
 */
using HandlerConstructor = Handler *(*)(const HandlerData &handlerData);

/**
 * Set of pointers of parser states -- used for specifying a set of parent
 * states. The set only stores the pointers, it does not own the states.
 */
using ParserStateSet = std::unordered_set<const ParserState *>;
/**
* Class used for the complete specification of a ParserState. Stores possible
* parent states, state handlers and arguments to be passed to that state.
* All members are public; use the ParserStateBuilder class for a more
* convenient construction.
*/
struct ParserState {
/**
* Set containing pointers at all possible parent states.
*/
ParserStateSet parents;
/**
* Descriptor of the arguments that should be passed to the handler.
*/
Arguments arguments;
/**
* Set containing the types of the nodes that may be created in this
* ParserState. This information is needed for Parsers to reconstruct the
* current ParserState from a given ParserScope when a file is included.
*/
RttiSet createdNodeTypes;
/**
* Pointer at a function which creates a new concrete Handler instance for
* the elements described by this state. May be nullptr in which case no
* handler instance is created.
*/
HandlerConstructor elementHandler;
/**
* Pointer at a function which creates a new concrete Handler instance for
* all child elements for which no matching state is defined. May be nullptr
* in which case no such elements are allowed.
*/
HandlerConstructor childHandler;
/**
* Default constructor, initializes the handlers with nullptr.
*/
ParserState();
/**
* Constructor taking values for all fields. Use the ParserStateBuilder
* class for a more convenient construction of ParserState instances.
* All parameters except for "parents" are optional.
*
* @param parents is a set containing all possible parent states.
* @param arguments is a descriptor of arguments that should be passed to
* the handler.
* @param createdNodeTypes is a set containing the types of the nodes that
* may be created in this ParserState. This information is needed for
* Parsers to reconstruct the current ParserState from a given ParserScope
* when a file is included.
* @param elementHandler is a pointer at a function which creates a new
* concrete Handler instance for the elements described by this state. May
* be nullptr in which case no handler instance is created.
* @param childHandler is a pointer at a function which creates a new
* concrete Handler instance for all child elements for which no matching
* state is defined. May be nullptr in which case no such elements are
* allowed.
*/
ParserState(ParserStateSet parents, Arguments arguments = Arguments{},
RttiSet createdNodeTypes = RttiSet{},
HandlerConstructor elementHandler = nullptr,
HandlerConstructor childHandler = nullptr);
/**
* Creates this ParserState from the given ParserStateBuilder instance.
* This constructor is not marked explicit, so a ParserStateBuilder
* expression converts implicitly to a ParserState.
*
* @param builder is the builder holding the state that should be used.
*/
ParserState(const ParserStateBuilder &builder);
};
/**
 * The ParserStateBuilder class is a class used for conveniently building new
 * ParserState instances. Every setter returns a reference at the builder
 * itself, which allows the calls to be chained.
 */
class ParserStateBuilder {
private:
    /**
     * ParserState instance that is currently being built by the
     * ParserStateBuilder.
     */
    ParserState state;

public:
    /**
     * Copies the ParserState instance and uses it as internal state. Overrides
     * all changes made by the ParserStateBuilder.
     *
     * @param state is the state that should be copied.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &copy(const ParserState &state);

    /**
     * Sets the possible parent states to the single given parent element.
     *
     * @param parent is a pointer at the parent ParserState instance that should
     * be the possible parent state.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &parent(const ParserState *parent);

    /**
     * Sets the ParserState instances in the given ParserStateSet as the list of
     * supported parent states.
     *
     * @param parents is a set of pointers at ParserState instances that should
     * be the possible parent states.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &parents(const ParserStateSet &parents);

    /**
     * Sets the arguments that should be passed to the parser state handler to
     * those given as argument.
     *
     * @param arguments is the Arguments instance describing the Arguments that
     * should be passed to a Handler for this ParserState.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &arguments(const Arguments &arguments);

    /**
     * Sets the Node types this state may produce to the given Rtti descriptor.
     *
     * @param type is the Rtti descriptor of the Type that may be produced by
     * this state.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &createdNodeType(const Rtti *type);

    /**
     * Sets the Node types this state may produce to the given Rtti descriptors.
     *
     * @param types is a set of Rtti descriptors of the Types that may be
     * produced by this state.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &createdNodeTypes(const RttiSet &types);

    /**
     * Sets the constructor for the element handler. The constructor creates a
     * new concrete Handler instance for the elements described by this state.
     * May be nullptr in which case no handler instance is created (this is
     * the default value).
     *
     * @param elementHandler is the HandlerConstructor that should create a
     * new Handler instance.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &elementHandler(HandlerConstructor elementHandler);

    /**
     * Sets the constructor for the child handler. The constructor creates a new
     * concrete Handler instance for all child elements for which no matching
     * state is defined. May be nullptr in which case no such elements are
     * allowed.
     *
     * @param childHandler is the HandlerConstructor that should point at the
     * constructor of the Handler instance for child elements.
     * @return a reference at this ParserStateBuilder instance for method
     * chaining.
     */
    ParserStateBuilder &childHandler(HandlerConstructor childHandler);

    /**
     * Returns a reference at the internal ParserState instance that was built
     * using the ParserStateBuilder. As the reference points at a member of the
     * builder, copy the result if it has to outlive the builder.
     *
     * @return the built ParserState.
     */
    const ParserState &build() const;
};
/**
* Class used to deduce the ParserState a Parser is currently in based on the
* types of the Nodes that currently are on the ParserStack. Uses dynamic
* programming in order to solve this problem.
*/
class ParserStateDeductor {
public:
/**
* Type containing the dynamic programming table.
*/
using Table = std::vector>;
private:
/**
* Dynamic programming table.
*/
Table tbl;
/**
* Signature given in the constructor.
*/
const std::vector signature;
/**
* List of states that should be checked for being active.
*/
const std::vector states;
/**
* Used internally to check whether the given parser stack s may have been
* active for signature element d.
*
* @param d is the signature element.
* @param s is the parser state.
* @return true if the the given ParserState may have been active.
*/
bool isActive(size_t d, const ParserState *s);
public:
/**
* Constructor of the ParserStateDeductor class.
*
* @param signature a Node type signature describing the types of the nodes
* which currently reside on e.g. the ParserScope stack.
* @param states is a list of states that should be checked.
*/
ParserStateDeductor(std::vector signature,
std::vector states);
/**
* Selects all active states from the given states. Only considers those
* states that may have produced the last signature element.
*
* @return a list of states that may actually have been active.
*/
std::vector deduce();
};
/**
* The ParserStates namespace contains all the global state constants used
* in the ParserStack class. The constants are only declared here (extern);
* their definitions are not part of this header.
*/
namespace ParserStates {
/**
* State representing all states.
*/
extern const ParserState All;
/**
* State representing the initial state.
*/
extern const ParserState None;
}
}
#endif /* _OUSIA_PARSER_STATE_HPP_ */