70 lines
No EOL
2.4 KiB
C++
70 lines
No EOL
2.4 KiB
C++
#include "compiler/build_tables/first_set.h"
|
|
#include "tree_sitter/compiler.h"
|
|
#include "compiler/prepared_grammar.h"
|
|
#include "compiler/build_tables/rule_can_be_blank.h"
|
|
#include "compiler/rules/metadata.h"
|
|
#include "compiler/rules/visitor.h"
|
|
#include "compiler/rules/seq.h"
|
|
#include "compiler/rules/choice.h"
|
|
|
|
namespace tree_sitter {
|
|
using std::set;
|
|
using rules::Symbol;
|
|
|
|
namespace build_tables {
|
|
// Returns a new set holding every symbol that appears in `left`, in `right`,
// or in both. Neither argument is modified.
set<Symbol> set_union(const set<Symbol> &left, const set<Symbol> &right) {
  set<Symbol> merged(left);
  for (const Symbol &symbol : right)
    merged.insert(symbol);
  return merged;
}
|
|
|
|
// Rule visitor that computes the set of symbols with which a rule can begin.
//
// Symbols that have a definition in the grammar are expanded by applying the
// visitor to that definition; symbols without one are reported as themselves.
// `visited_symbols` records every symbol already handled by this instance so
// that a (possibly recursive) definition is expanded at most once.
class FirstSet : public rules::RuleFn<set<Symbol>> {
  // Held by reference so that constructing a FirstSet does not copy the
  // grammar. The referenced grammar must outlive this object.
  const PreparedGrammar &grammar;

  // Symbols that visit(const Symbol *) has already processed.
  set<Symbol> visited_symbols;

 public:
  explicit FirstSet(const PreparedGrammar &grammar) : grammar(grammar) {}

  // Symbol: expand its definition if the grammar has one, otherwise the first
  // set is just the symbol itself.
  void visit(const Symbol *rule) {
    // insert() reports through `.second` whether the symbol was newly added,
    // which gives the "seen before?" answer with a single lookup. For a symbol
    // that was already visited, `value` is deliberately left untouched
    // (NOTE(review): presumably apply() initialises it to an empty set --
    // confirm against RuleFn).
    if (!visited_symbols.insert(*rule).second)
      return;

    if (grammar.has_definition(*rule))
      value = apply(grammar.rule(*rule));
    else
      value = set<Symbol>({ *rule });
  }

  // Metadata: the first set is that of the wrapped rule.
  void visit(const rules::Metadata *rule) {
    value = apply(rule->rule);
  }

  // Choice: either alternative may come first, so combine both first sets.
  void visit(const rules::Choice *rule) {
    value = set_union(apply(rule->left), apply(rule->right));
  }

  // Seq: the left member's first set, plus the right member's first set when
  // the left member can be blank.
  void visit(const rules::Seq *rule) {
    auto result = apply(rule->left);
    if (rule_can_be_blank(rule->left, grammar)) {
      result = set_union(result, apply(rule->right));
    }
    value = result;
  }
};
|
|
|
|
// Computes the first set of a single rule by running a fresh FirstSet visitor
// over it with the given grammar.
set<Symbol> first_set(const rules::rule_ptr &rule, const PreparedGrammar &grammar) {
  FirstSet calculator(grammar);
  return calculator.apply(rule);
}
|
|
|
|
// Computes the combined first set of every item in `item_set`.
//
// For each item, the first set of the item's rule is added to the result.
// When the item's rule can be blank, the item's lookahead symbol is added
// as well.
set<Symbol> first_set(const ParseItemSet &item_set, const PreparedGrammar &grammar) {
  set<Symbol> result;
  for (const auto &item : item_set) {
    // Merge in place rather than rebuilding the accumulated set through
    // set_union() on every iteration.
    const set<Symbol> rule_first_set = first_set(item.rule, grammar);
    result.insert(rule_first_set.begin(), rule_first_set.end());

    if (rule_can_be_blank(item.rule, grammar))
      result.insert(item.lookahead_sym);
  }
  return result;
}
|
|
}
|
|
} |