/* Copyright (c) 2012-2017 The ANTLR Project. All rights reserved.
* Use of this file is governed by the BSD 3-clause license that
* can be found in the LICENSE.txt file in the project root.
*/
#pragma once
#include "antlr4-common.h"
#include "atn/ATNConfigSet.h"
namespace antlr4 {
namespace dfa {
///
/// A DFA state represents a set of possible ATN configurations.
/// As Aho, Sethi, Ullman p. 117 says "The DFA uses its state
/// to keep track of all possible states the ATN can be in after
/// reading each input symbol. That is to say, after reading
/// input a1a2..an, the DFA is in a state that represents the
/// subset T of the states of the ATN that are reachable from the
/// ATN's start state along some path labeled a1a2..an."
/// In conventional NFA->DFA conversion, therefore, the subset T
/// would be a bitset representing the set of states the
/// ATN could be in. We need to track the alt predicted by each
/// state as well, however. More importantly, we need to maintain
/// a stack of states, tracking the closure operations as they
/// jump from rule to rule, emulating rule invocations (method calls).
/// I have to add a stack to simulate the proper lookahead sequences for
/// the underlying LL grammar from which the ATN was derived.
///
/// I use a set of ATNConfig objects not simple states. An ATNConfig
/// is both a state (ala normal conversion) and a RuleContext describing
/// the chain of rules (if any) followed to arrive at that state.
///
/// A DFA state may have multiple references to a particular state,
/// but with different ATN contexts (with same or different alts)
/// meaning that state was reached via a different set of rule invocations.
///
class ANTLR4CPP_PUBLIC DFAState final {
public:
struct ANTLR4CPP_PUBLIC PredPrediction final {
public:
Ref pred; // never null; at least SemanticContext.NONE
int alt;
PredPrediction() = delete;
PredPrediction(const PredPrediction&) = default;
PredPrediction(PredPrediction&&) = default;
PredPrediction(Ref pred, int alt) : pred(std::move(pred)), alt(alt) {}
PredPrediction& operator=(const PredPrediction&) = default;
PredPrediction& operator=(PredPrediction&&) = default;
std::string toString() const;
};
std::unique_ptr configs;
/// {@code edges[symbol]} points to target of symbol. Shift up by 1 so (-1)
/// maps to {@code edges[0]}.
// ml: this is a sparse list, so we use a map instead of a vector.
// Watch out: we no longer have the -1 offset, as it isn't needed anymore.
std::unordered_map edges;
/// if accept state, what ttype do we match or alt do we predict?
/// This is set to when {@code !=null} or
/// .
size_t prediction = 0;
Ref lexerActionExecutor;
///
/// During SLL parsing, this is a list of predicates associated with the
/// ATN configurations of the DFA state. When we have predicates,
/// is {@code false} since full context prediction evaluates predicates
/// on-the-fly. If this is not null, then is
/// .
///
/// We only use these for non- but conflicting states. That
/// means we know from the context (it's $ or we don't dip into outer
/// context) that it's an ambiguity not a conflict.
///
/// This list is computed by .
///
std::vector predicates;
int stateNumber = -1;
bool isAcceptState = false;
///
/// Indicates that this state was created during SLL prediction that
/// discovered a conflict between the configurations in the state. Future
/// invocations immediately jumped doing
/// full context prediction if this field is true.
///
bool requiresFullContext = false;
/// Map a predicate to a predicted alternative.
DFAState() = default;
explicit DFAState(int stateNumber) : stateNumber(stateNumber) {}
explicit DFAState(std::unique_ptr configs) : configs(std::move(configs)) {}
///
/// Get the set of all alts mentioned by all ATN configurations in this
/// DFA state.
///
std::set getAltSet() const;
size_t hashCode() const;
/// Two DFAState instances are equal if their ATN configuration sets
/// are the same. This method is used to see if a state already exists.
///
/// Because the number of alternatives and number of ATN configurations are
/// finite, there is a finite number of DFA states that can be processed.
/// This is necessary to show that the algorithm terminates.
///
/// Cannot test the DFA state numbers here because in
/// ParserATNSimulator#addDFAState we need to know if any other state
/// exists that has this exact set of ATN configurations. The
/// stateNumber is irrelevant.
bool equals(const DFAState &other) const;
std::string toString() const;
};
inline bool operator==(const DFAState &lhs, const DFAState &rhs) {
return lhs.equals(rhs);
}
inline bool operator!=(const DFAState &lhs, const DFAState &rhs) {
return !operator==(lhs, rhs);
}
} // namespace dfa
} // namespace antlr4
namespace std {
template <>
struct hash<::antlr4::dfa::DFAState> {
size_t operator()(const ::antlr4::dfa::DFAState &dfaState) const {
return dfaState.hashCode();
}
};
} // namespace std