add antlr

This commit is contained in:
2020-09-29 23:16:42 +05:30
parent 34754a7130
commit 2b36e74ff5
181 changed files with 14689 additions and 7 deletions

View File

@@ -0,0 +1,91 @@
/* Copyright (c) 2012-2017 The ANTLR Project. All rights reserved.
* Use of this file is governed by the BSD 3-clause license that
* can be found in the LICENSE.txt file in the project root.
*/
#pragma once
#include "dfa/DFAState.h"
namespace antlrcpp {
class SingleWriteMultipleReadLock;
}
namespace antlr4 {
namespace dfa {
class ANTLR4CPP_PUBLIC DFA {
public:
/// A set of all DFA states. Use a map so we can get old state back.
/// Set only allows you to see if it's there.
/// From which ATN state did we create this DFA?
atn::DecisionState *atnStartState;
std::unordered_set<DFAState *, DFAState::Hasher, DFAState::Comparer> states; // States are owned by this class.
DFAState *s0;
size_t decision;
DFA(atn::DecisionState *atnStartState);
DFA(atn::DecisionState *atnStartState, size_t decision);
DFA(const DFA &other) = delete;
DFA(DFA &&other);
virtual ~DFA();
/**
* Gets whether this DFA is a precedence DFA. Precedence DFAs use a special
* start state {@link #s0} which is not stored in {@link #states}. The
* {@link DFAState#edges} array for this start state contains outgoing edges
* supplying individual start states corresponding to specific precedence
* values.
*
* @return {@code true} if this is a precedence DFA; otherwise,
* {@code false}.
* @see Parser#getPrecedence()
*/
bool isPrecedenceDfa() const;
/**
* Get the start state for a specific precedence value.
*
* @param precedence The current precedence.
* @return The start state corresponding to the specified precedence, or
* {@code null} if no start state exists for the specified precedence.
*
* @throws IllegalStateException if this is not a precedence DFA.
* @see #isPrecedenceDfa()
*/
DFAState* getPrecedenceStartState(int precedence) const;
/**
* Set the start state for a specific precedence value.
*
* @param precedence The current precedence.
* @param startState The start state corresponding to the specified
* precedence.
*
* @throws IllegalStateException if this is not a precedence DFA.
* @see #isPrecedenceDfa()
*/
void setPrecedenceStartState(int precedence, DFAState *startState, antlrcpp::SingleWriteMultipleReadLock &lock);
/// Return a list of all states in this DFA, ordered by state number.
virtual std::vector<DFAState *> getStates() const;
/**
* @deprecated Use {@link #toString(Vocabulary)} instead.
*/
virtual std::string toString(const std::vector<std::string>& tokenNames);
std::string toString(const Vocabulary &vocabulary) const;
virtual std::string toLexerString();
private:
/**
* {@code true} if this DFA is for a precedence decision; otherwise,
* {@code false}. This is the backing field for {@link #isPrecedenceDfa}.
*/
bool _precedenceDfa;
};
} // namespace atn
} // namespace antlr4

View File

@@ -0,0 +1,32 @@
/* Copyright (c) 2012-2017 The ANTLR Project. All rights reserved.
* Use of this file is governed by the BSD 3-clause license that
* can be found in the LICENSE.txt file in the project root.
*/
#pragma once
#include "Vocabulary.h"
namespace antlr4 {
namespace dfa {
/// A DFA walker that knows how to dump them to serialized strings.
class ANTLR4CPP_PUBLIC DFASerializer {
public:
DFASerializer(const DFA *dfa, const std::vector<std::string>& tnames);
DFASerializer(const DFA *dfa, const Vocabulary &vocabulary);
virtual ~DFASerializer();
virtual std::string toString() const;
protected:
virtual std::string getEdgeLabel(size_t i) const;
virtual std::string getStateString(DFAState *s) const;
private:
const DFA *_dfa;
const Vocabulary &_vocabulary;
};
} // namespace atn
} // namespace antlr4

View File

@@ -0,0 +1,144 @@
/* Copyright (c) 2012-2017 The ANTLR Project. All rights reserved.
* Use of this file is governed by the BSD 3-clause license that
* can be found in the LICENSE.txt file in the project root.
*/
#pragma once
#include "antlr4-common.h"
namespace antlr4 {
namespace dfa {
/// <summary>
/// A DFA state represents a set of possible ATN configurations.
/// As Aho, Sethi, Ullman p. 117 says "The DFA uses its state
/// to keep track of all possible states the ATN can be in after
/// reading each input symbol. That is to say, after reading
/// input a1a2..an, the DFA is in a state that represents the
/// subset T of the states of the ATN that are reachable from the
/// ATN's start state along some path labeled a1a2..an."
/// In conventional NFA->DFA conversion, therefore, the subset T
/// would be a bitset representing the set of states the
/// ATN could be in. We need to track the alt predicted by each
/// state as well, however. More importantly, we need to maintain
/// a stack of states, tracking the closure operations as they
/// jump from rule to rule, emulating rule invocations (method calls).
/// I have to add a stack to simulate the proper lookahead sequences for
/// the underlying LL grammar from which the ATN was derived.
/// <p/>
/// I use a set of ATNConfig objects not simple states. An ATNConfig
/// is both a state (ala normal conversion) and a RuleContext describing
/// the chain of rules (if any) followed to arrive at that state.
/// <p/>
/// A DFA state may have multiple references to a particular state,
/// but with different ATN contexts (with same or different alts)
/// meaning that state was reached via a different set of rule invocations.
/// </summary>
class ANTLR4CPP_PUBLIC DFAState {
public:
class PredPrediction {
public:
Ref<atn::SemanticContext> pred; // never null; at least SemanticContext.NONE
int alt;
PredPrediction(const Ref<atn::SemanticContext> &pred, int alt);
virtual ~PredPrediction();
virtual std::string toString();
private:
void InitializeInstanceFields();
};
int stateNumber;
std::unique_ptr<atn::ATNConfigSet> configs;
/// {@code edges[symbol]} points to target of symbol. Shift up by 1 so (-1)
/// <seealso cref="Token#EOF"/> maps to {@code edges[0]}.
// ml: this is a sparse list, so we use a map instead of a vector.
// Watch out: we no longer have the -1 offset, as it isn't needed anymore.
std::unordered_map<size_t, DFAState *> edges;
bool isAcceptState;
/// if accept state, what ttype do we match or alt do we predict?
/// This is set to <seealso cref="ATN#INVALID_ALT_NUMBER"/> when <seealso cref="#predicates"/>{@code !=null} or
/// <seealso cref="#requiresFullContext"/>.
size_t prediction;
Ref<atn::LexerActionExecutor> lexerActionExecutor;
/// <summary>
/// Indicates that this state was created during SLL prediction that
/// discovered a conflict between the configurations in the state. Future
/// <seealso cref="ParserATNSimulator#execATN"/> invocations immediately jumped doing
/// full context prediction if this field is true.
/// </summary>
bool requiresFullContext;
/// <summary>
/// During SLL parsing, this is a list of predicates associated with the
/// ATN configurations of the DFA state. When we have predicates,
/// <seealso cref="#requiresFullContext"/> is {@code false} since full context prediction evaluates predicates
/// on-the-fly. If this is not null, then <seealso cref="#prediction"/> is
/// <seealso cref="ATN#INVALID_ALT_NUMBER"/>.
/// <p/>
/// We only use these for non-<seealso cref="#requiresFullContext"/> but conflicting states. That
/// means we know from the context (it's $ or we don't dip into outer
/// context) that it's an ambiguity not a conflict.
/// <p/>
/// This list is computed by <seealso cref="ParserATNSimulator#predicateDFAState"/>.
/// </summary>
std::vector<PredPrediction *> predicates;
/// Map a predicate to a predicted alternative.
DFAState();
DFAState(int state);
DFAState(std::unique_ptr<atn::ATNConfigSet> configs);
virtual ~DFAState();
/// <summary>
/// Get the set of all alts mentioned by all ATN configurations in this
/// DFA state.
/// </summary>
virtual std::set<size_t> getAltSet();
virtual size_t hashCode() const;
/// Two DFAState instances are equal if their ATN configuration sets
/// are the same. This method is used to see if a state already exists.
///
/// Because the number of alternatives and number of ATN configurations are
/// finite, there is a finite number of DFA states that can be processed.
/// This is necessary to show that the algorithm terminates.
///
/// Cannot test the DFA state numbers here because in
/// ParserATNSimulator#addDFAState we need to know if any other state
/// exists that has this exact set of ATN configurations. The
/// stateNumber is irrelevant.
bool operator == (const DFAState &o) const;
virtual std::string toString();
struct Hasher
{
size_t operator()(DFAState *k) const {
return k->hashCode();
}
};
struct Comparer {
bool operator()(DFAState *lhs, DFAState *rhs) const
{
return *lhs == *rhs;
}
};
private:
void InitializeInstanceFields();
};
} // namespace atn
} // namespace antlr4

View File

@@ -0,0 +1,23 @@
/* Copyright (c) 2012-2017 The ANTLR Project. All rights reserved.
* Use of this file is governed by the BSD 3-clause license that
* can be found in the LICENSE.txt file in the project root.
*/
#pragma once
#include "dfa/DFASerializer.h"
namespace antlr4 {
namespace dfa {
class ANTLR4CPP_PUBLIC LexerDFASerializer : public DFASerializer {
public:
LexerDFASerializer(DFA *dfa);
virtual ~LexerDFASerializer();
protected:
virtual std::string getEdgeLabel(size_t i) const override;
};
} // namespace atn
} // namespace antlr4