summaryrefslogtreecommitdiff
path: root/src/core/parser/generic/ParserState.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/core/parser/generic/ParserState.hpp')
-rw-r--r--src/core/parser/generic/ParserState.hpp284
1 files changed, 284 insertions, 0 deletions
diff --git a/src/core/parser/generic/ParserState.hpp b/src/core/parser/generic/ParserState.hpp
new file mode 100644
index 0000000..6487fdd
--- /dev/null
+++ b/src/core/parser/generic/ParserState.hpp
@@ -0,0 +1,284 @@
+/*
+ Ousía
+ Copyright (C) 2014, 2015 Benjamin Paaßen, Andreas Stöckel
+
+ This program is free software: you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation, either version 3 of the License, or
+ (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program. If not, see <http://www.gnu.org/licenses/>.
+*/
+
+/**
+ * @file ParserState.hpp
+ *
+ * Defines the ParserState class used within the ParserStack pushdown
+ * automaton, the ParserStateBuilder class for convenient construction of
+ * ParserState instances and the ParserStateDeductor class.
+ *
+ * @author Andreas Stöckel (astoecke@techfak.uni-bielefeld.de)
+ */
+
+#ifndef _OUSIA_PARSER_STATE_HPP_
+#define _OUSIA_PARSER_STATE_HPP_
+
+#include <cstddef>
+#include <unordered_map>
+#include <unordered_set>
+#include <vector>
+
+#include <core/common/Rtti.hpp>
+#include <core/common/Argument.hpp>
+
+namespace ousia {
+
+// Forward declarations. ParserState is declared with the "struct" key so that
+// the declaration agrees with its definition further down in this header.
+class ParserStateBuilder;
+struct ParserState;
+class HandlerData;
+class Handler;
+
+/**
+ * Pointer to a function which creates a Handler instance from the given
+ * HandlerData. A value of this type is stored in ParserState::elementHandler.
+ */
+using HandlerConstructor = Handler *(*)(const HandlerData &handlerData);
+
+/**
+ * Set of pointers to parser states -- used for specifying a set of parent
+ * states.
+ */
+using ParserStateSet = std::unordered_set<const ParserState *>;
+
+/**
+ * Complete specification of a single parser state. Stores the set of possible
+ * parent states, the descriptor of the arguments passed to the handler, the
+ * node types that may be created in this state and the function used to
+ * construct the element handler.
+ */
+struct ParserState {
+ /**
+ * Set containing all possible parent states.
+ */
+ ParserStateSet parents;
+
+ /**
+ * Descriptor of the arguments that should be passed to the handler.
+ */
+ Arguments arguments;
+
+ /**
+ * Set containing the types of the nodes that may be created in this
+ * ParserState. This information is needed for Parsers to reconstruct the
+ * current ParserState from a given ParserScope when a file is included.
+ */
+ RttiSet createdNodeTypes;
+
+ /**
+ * Pointer to a function which creates a new concrete Handler instance for
+ * the elements described by this state. May be nullptr in which case no
+ * handler instance is created.
+ */
+ HandlerConstructor elementHandler;
+
+ /**
+ * Default constructor, initializes the element handler with nullptr.
+ */
+ ParserState();
+
+ /**
+ * Constructor taking values for all fields. Only the parent set is
+ * mandatory, all other parameters have default values. Use the
+ * ParserStateBuilder class for a more convenient construction of
+ * ParserState instances.
+ *
+ * @param parents is a set containing all possible parent states.
+ * @param arguments is a descriptor of arguments that should be passed to
+ * the handler. Defaults to an empty Arguments instance.
+ * @param createdNodeTypes is a set containing the types of the nodes that
+ * may be created in this ParserState. This information is needed for
+ * Parsers to reconstruct the current ParserState from a given ParserScope
+ * when a file is included. Defaults to an empty RttiSet.
+ * @param elementHandler is a pointer to a function which creates a new
+ * concrete Handler instance for the elements described by this state. May
+ * be nullptr (the default) in which case no handler instance is created.
+ */
+ ParserState(ParserStateSet parents, Arguments arguments = Arguments{},
+ RttiSet createdNodeTypes = RttiSet{},
+ HandlerConstructor elementHandler = nullptr);
+
+ /**
+ * Creates this ParserState from the given ParserStateBuilder instance.
+ * The constructor is not marked explicit, so a ParserStateBuilder can be
+ * converted implicitly to a ParserState.
+ *
+ * @param builder is the builder the ParserState is created from.
+ */
+ ParserState(const ParserStateBuilder &builder);
+};
+
+/**
+ * The ParserStateBuilder class is used for conveniently building new
+ * ParserState instances. All setters return a reference to the builder so
+ * that calls can be chained; build() provides access to the result.
+ */
+class ParserStateBuilder {
+private:
+ /**
+ * ParserState instance that is currently being built by the
+ * ParserStateBuilder.
+ */
+ ParserState state;
+
+public:
+ /**
+ * Copies the ParserState instance and uses it as internal state. Overrides
+ * all changes previously made through this ParserStateBuilder.
+ *
+ * @param state is the state that should be copied.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &copy(const ParserState &state);
+
+ /**
+ * Sets the possible parent states to the single given parent element.
+ *
+ * @param parent is a pointer to the parent ParserState instance that should
+ * be the possible parent state.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &parent(const ParserState *parent);
+
+ /**
+ * Sets the ParserState instances in the given ParserStateSet as the set of
+ * supported parent states.
+ *
+ * @param parents is a set of pointers to ParserState instances that should
+ * be the possible parent states.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &parents(const ParserStateSet &parents);
+
+ /**
+ * Sets the arguments that should be passed to the parser state handler to
+ * those given as argument.
+ *
+ * @param arguments is the Arguments instance describing the Arguments that
+ * should be passed to a Handler for this ParserState.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &arguments(const Arguments &arguments);
+
+ /**
+ * Sets the Node types this state may produce to the given Rtti descriptor.
+ *
+ * @param type is the Rtti descriptor of the Type that may be produced by
+ * this state.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &createdNodeType(const Rtti *type);
+
+ /**
+ * Sets the Node types this state may produce to the given Rtti descriptors.
+ *
+ * @param types is a set of Rtti descriptors of the Types that may be
+ * produced by this state.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &createdNodeTypes(const RttiSet &types);
+
+ /**
+ * Sets the constructor for the element handler. The constructor creates a
+ * new concrete Handler instance for the elements described by this state.
+ * May be nullptr in which case no handler instance is created (this is
+ * the default value).
+ *
+ * @param elementHandler is the HandlerConstructor that should create a
+ * new Handler instance.
+ * @return a reference to this ParserStateBuilder instance for method
+ * chaining.
+ */
+ ParserStateBuilder &elementHandler(HandlerConstructor elementHandler);
+
+ /**
+ * Returns a reference to the internal ParserState instance that was built
+ * using the ParserStateBuilder. The reference refers to a member of this
+ * builder, so it must not be used after the builder has been destroyed.
+ *
+ * @return the built ParserState.
+ */
+ const ParserState &build() const;
+};
+
+/**
+ * Class used to deduce the ParserState a Parser is currently in based on the
+ * types of the Nodes that currently are on the ParserStack. Uses dynamic
+ * programming in order to solve this problem.
+ */
+class ParserStateDeductor {
+public:
+ /**
+ * Type of the dynamic programming table: a vector of maps, each mapping a
+ * ParserState pointer to a boolean flag.
+ */
+ using Table = std::vector<std::unordered_map<const ParserState *, bool>>;
+
+private:
+ /**
+ * Dynamic programming table.
+ */
+ Table tbl;
+
+ /**
+ * Signature given in the constructor. Declared const, so it cannot be
+ * changed after construction.
+ */
+ const std::vector<const Rtti *> signature;
+
+ /**
+ * List of states that should be checked for being active. Declared const,
+ * so it cannot be changed after construction.
+ */
+ const std::vector<const ParserState *> states;
+
+ /**
+ * Used internally to check whether the given parser state s may have been
+ * active for signature element d.
+ *
+ * @param d is the signature element (passed as a size_t, presumably its
+ * index within the signature -- to be confirmed in the implementation).
+ * @param s is the parser state.
+ * @return true if the given ParserState may have been active.
+ */
+ bool isActive(size_t d, const ParserState *s);
+
+public:
+ /**
+ * Constructor of the ParserStateDeductor class.
+ *
+ * @param signature a Node type signature describing the types of the nodes
+ * which currently reside on e.g. the ParserScope stack.
+ * @param states is a list of states that should be checked.
+ */
+ ParserStateDeductor(std::vector<const Rtti *> signature,
+ std::vector<const ParserState *> states);
+
+ /**
+ * Selects all active states from the states given in the constructor. Only
+ * considers those states that may have produced the last signature element.
+ *
+ * @return a list of states that may actually have been active.
+ */
+ std::vector<const ParserState *> deduce();
+};
+
+/**
+ * The ParserStates namespace contains all the global state constants used
+ * in the ParserStack class. The constants are only declared here (extern);
+ * their definitions are not part of this header.
+ */
+namespace ParserStates {
+/**
+ * State representing all states.
+ */
+extern const ParserState All;
+
+/**
+ * State representing the initial state.
+ */
+extern const ParserState None;
+}
+}
+
+#endif /* _OUSIA_PARSER_STATE_HPP_ */
+