Suppose a parse state S has multiple actions for a terminal lookahead symbol A. Then during incremental parsing, while in state S, the parser should not reuse a non-terminal lookahead B where FIRST(B) contains A, because reusing B might prematurely discard one of the possible actions that a batch parser would have attempted in state S, upon seeing A as a lookahead.
40 lines
1.2 KiB
C++
40 lines
1.2 KiB
C++
#include "compiler/syntax_grammar.h"
|
|
#include <vector>
|
|
#include <string>
|
|
#include <utility>
|
|
#include "compiler/rules/symbol.h"
|
|
#include "compiler/rules/built_in_symbols.h"
|
|
|
|
namespace tree_sitter {
|
|
|
|
using std::string;
|
|
using std::to_string;
|
|
using std::pair;
|
|
using std::vector;
|
|
using std::set;
|
|
|
|
static const vector<Production> NO_PRODUCTIONS;
|
|
|
|
SyntaxVariable::SyntaxVariable(const string &name, VariableType type,
|
|
const vector<Production> &productions)
|
|
: name(name), productions(productions), type(type) {}
|
|
|
|
ProductionStep::ProductionStep(const rules::Symbol &symbol, int precedence,
|
|
rules::Associativity associativity)
|
|
: symbol(symbol), precedence(precedence), associativity(associativity) {}
|
|
|
|
bool ProductionStep::operator==(const ProductionStep &other) const {
|
|
return symbol == other.symbol && precedence == other.precedence &&
|
|
associativity == other.associativity;
|
|
}
|
|
|
|
const vector<Production> &SyntaxGrammar::productions(
|
|
const rules::Symbol &symbol) const {
|
|
if (symbol.is_built_in() || symbol.is_token) {
|
|
return NO_PRODUCTIONS;
|
|
} else {
|
|
return variables[symbol.index].productions;
|
|
}
|
|
}
|
|
|
|
} // namespace tree_sitter
|