Refine logic for deciding when tokens need to be re-lexed

* While generating the lex table, note which tokens can match the same string. A token needs to be relexed when it has possible homonyms in the current state. * Also note which tokens can match substrings of each other tokens. A token needs to be relexed when there are viable tokens that could match longer strings in the current state and the next token has been edited. * Remove the logic for marking tokens as fragile on creation. * Store the reusability/non-reusability of symbols off of individual actions and onto the entire entry for the state & symbol.
2016-06-21 07:28:04 -07:00 · 2016-06-21 07:28:04 -07:00 · 38c144b4a3
commit 38c144b4a3
parent 45f7cee0c8
19 changed files with 337 additions and 257 deletions
--- a/src/runtime/language.c
+++ b/src/runtime/language.c
@ -6,38 +6,30 @@ static const TSParseAction ERROR_SHIFT_EXTRA = {
  .type = TSParseActionTypeShift, .extra = true,
 };

-const TSParseAction *ts_language_actions(const TSLanguage *self, TSStateId state,
-                                         TSSymbol symbol, size_t *count) {
+void ts_language_table_entry(const TSLanguage *self, TSStateId state,
+                             TSSymbol symbol, TableEntry *result) {
  if (state == ts_parse_state_error) {
-    *count = 1;
-    if (symbol == ts_builtin_sym_error)
-      return &ERROR_SHIFT_EXTRA;
-    else if (self->recovery_actions[symbol].type == TSParseActionTypeError)
-      return &ERROR_SHIFT_EXTRA;
+    result->action_count = 1;
+    result->is_reusable = false;
+    result->depends_on_lookahead = false;
+    if (symbol == ts_builtin_sym_error ||
+        self->recovery_actions[symbol].type == TSParseActionTypeError)
+      result->actions = &ERROR_SHIFT_EXTRA;
    else
-      return &self->recovery_actions[symbol];
+      result->actions = &self->recovery_actions[symbol];
+    return;
  }

-  size_t action_index = 0;
-  if (symbol != ts_builtin_sym_error)
-    action_index = self->parse_table[state * self->symbol_count + symbol];
+  size_t action_index =
+    (symbol != ts_builtin_sym_error)
+      ? self->parse_table[state * self->symbol_count + symbol]
+      : 0;

-  *count = self->parse_actions[action_index].count;
-  const TSParseActionEntry *entry = self->parse_actions + action_index + 1;
-  return (const TSParseAction *)entry;
-}
-
-TSParseAction ts_language_last_action(const TSLanguage *self, TSStateId state,
-                                      TSSymbol sym) {
-  size_t count;
-  const TSParseAction *actions = ts_language_actions(self, state, sym, &count);
-  return actions[count - 1];
-}
-
-bool ts_language_has_action(const TSLanguage *self, TSStateId state,
-                            TSSymbol symbol) {
-  TSParseAction action = ts_language_last_action(self, state, symbol);
-  return action.type != TSParseActionTypeError;
+  const TSParseActionEntry *entry = &self->parse_actions[action_index];
+  result->action_count = entry->count;
+  result->is_reusable = entry->reusable;
+  result->depends_on_lookahead = entry->depends_on_lookahead;
+  result->actions = (const TSParseAction *)(entry + 1);
 }

 size_t ts_language_symbol_count(const TSLanguage *language) {