/* Copyright (c) 2012-2017 The ANTLR Project. All rights reserved. * Use of this file is governed by the BSD 3-clause license that * can be found in the LICENSE.txt file in the project root. */ #pragma once #include "antlr4-common.h" #include "atn/ATNConfigSet.h" namespace antlr4 { namespace dfa { /// /// A DFA state represents a set of possible ATN configurations. /// As Aho, Sethi, Ullman p. 117 says "The DFA uses its state /// to keep track of all possible states the ATN can be in after /// reading each input symbol. That is to say, after reading /// input a1a2..an, the DFA is in a state that represents the /// subset T of the states of the ATN that are reachable from the /// ATN's start state along some path labeled a1a2..an." /// In conventional NFA->DFA conversion, therefore, the subset T /// would be a bitset representing the set of states the /// ATN could be in. We need to track the alt predicted by each /// state as well, however. More importantly, we need to maintain /// a stack of states, tracking the closure operations as they /// jump from rule to rule, emulating rule invocations (method calls). /// I have to add a stack to simulate the proper lookahead sequences for /// the underlying LL grammar from which the ATN was derived. ///

/// I use a set of ATNConfig objects not simple states. An ATNConfig /// is both a state (ala normal conversion) and a RuleContext describing /// the chain of rules (if any) followed to arrive at that state. ///

/// A DFA state may have multiple references to a particular state, /// but with different ATN contexts (with same or different alts) /// meaning that state was reached via a different set of rule invocations. ///

class ANTLR4CPP_PUBLIC DFAState final { public: struct ANTLR4CPP_PUBLIC PredPrediction final { public: Ref pred; // never null; at least SemanticContext.NONE int alt; PredPrediction() = delete; PredPrediction(const PredPrediction&) = default; PredPrediction(PredPrediction&&) = default; PredPrediction(Ref pred, int alt) : pred(std::move(pred)), alt(alt) {} PredPrediction& operator=(const PredPrediction&) = default; PredPrediction& operator=(PredPrediction&&) = default; std::string toString() const; }; std::unique_ptr configs; /// {@code edges[symbol]} points to target of symbol. Shift up by 1 so (-1) /// maps to {@code edges[0]}. // ml: this is a sparse list, so we use a map instead of a vector. // Watch out: we no longer have the -1 offset, as it isn't needed anymore. std::unordered_map edges; /// if accept state, what ttype do we match or alt do we predict? /// This is set to when {@code !=null} or /// . size_t prediction = 0; Ref lexerActionExecutor; /// /// During SLL parsing, this is a list of predicates associated with the /// ATN configurations of the DFA state. When we have predicates, /// is {@code false} since full context prediction evaluates predicates /// on-the-fly. If this is not null, then is /// . ///

/// We only use these for non- but conflicting states. That /// means we know from the context (it's $ or we don't dip into outer /// context) that it's an ambiguity not a conflict. ///

/// This list is computed by . ///

std::vector predicates; int stateNumber = -1; bool isAcceptState = false; /// /// Indicates that this state was created during SLL prediction that /// discovered a conflict between the configurations in the state. Future /// invocations immediately jumped doing /// full context prediction if this field is true. /// bool requiresFullContext = false; /// Map a predicate to a predicted alternative. DFAState() = default; explicit DFAState(int stateNumber) : stateNumber(stateNumber) {} explicit DFAState(std::unique_ptr configs) : configs(std::move(configs)) {} /// /// Get the set of all alts mentioned by all ATN configurations in this /// DFA state. /// std::set getAltSet() const; size_t hashCode() const; /// Two DFAState instances are equal if their ATN configuration sets /// are the same. This method is used to see if a state already exists. /// /// Because the number of alternatives and number of ATN configurations are /// finite, there is a finite number of DFA states that can be processed. /// This is necessary to show that the algorithm terminates. /// /// Cannot test the DFA state numbers here because in /// ParserATNSimulator#addDFAState we need to know if any other state /// exists that has this exact set of ATN configurations. The /// stateNumber is irrelevant. bool equals(const DFAState &other) const; std::string toString() const; }; inline bool operator==(const DFAState &lhs, const DFAState &rhs) { return lhs.equals(rhs); } inline bool operator!=(const DFAState &lhs, const DFAState &rhs) { return !operator==(lhs, rhs); } } // namespace dfa } // namespace antlr4 namespace std { template <> struct hash<::antlr4::dfa::DFAState> { size_t operator()(const ::antlr4::dfa::DFAState &dfaState) const { return dfaState.hashCode(); } }; } // namespace std