tree-sitter/src/runtime/stack.c

588 lines
16 KiB
C
Raw Normal View History

2015-05-25 20:21:13 -07:00
#include "tree_sitter/parser.h"
2016-01-15 15:08:42 -08:00
#include "runtime/alloc.h"
2015-05-25 20:21:13 -07:00
#include "runtime/tree.h"
2016-02-17 20:41:29 -08:00
#include "runtime/array.h"
2015-09-18 18:04:52 -07:00
#include "runtime/stack.h"
#include "runtime/length.h"
2015-05-25 20:21:13 -07:00
#include <assert.h>
2016-01-28 21:18:57 -08:00
#include <stdio.h>
2015-05-25 20:21:13 -07:00
2015-11-20 00:01:53 -08:00
#define MAX_SUCCESSOR_COUNT 8
2015-06-03 09:44:13 -07:00
#define INITIAL_HEAD_CAPACITY 3
#define STARTING_TREE_CAPACITY 10
#define MAX_NODE_POOL_SIZE 50
2015-06-03 09:44:13 -07:00
typedef struct StackNode StackNode;
typedef struct {
StackNode *node;
TSTree *tree;
} StackLink;
struct StackNode {
2015-09-18 18:04:52 -07:00
StackEntry entry;
StackLink successors[MAX_SUCCESSOR_COUNT];
2015-06-03 09:44:13 -07:00
short unsigned int successor_count;
short unsigned int ref_count;
};
2015-05-25 20:21:13 -07:00
2015-11-20 00:01:53 -08:00
typedef struct {
size_t goal_tree_count;
StackNode *node;
2016-02-17 20:41:29 -08:00
TreeArray trees;
2015-11-20 00:01:53 -08:00
bool is_shared;
} PopPath;
2016-02-25 21:46:13 -08:00
typedef Array(StackNode *) StackNodeArray;
2016-02-17 14:45:00 -08:00
struct Stack {
2016-02-17 20:41:29 -08:00
Array(StackNode *) heads;
2016-03-03 10:16:10 -08:00
StackSliceArray slices;
2016-02-17 20:41:29 -08:00
Array(PopPath) pop_paths;
2016-02-25 21:46:13 -08:00
StackNodeArray node_pool;
2016-02-17 14:45:00 -08:00
void *tree_selection_payload;
TreeSelectionFunction tree_selection_function;
};
2015-05-25 20:21:13 -07:00
/*
2015-06-03 09:44:13 -07:00
* Section: Stack lifecycle
2015-05-25 20:21:13 -07:00
*/
static int ts_stack__default_tree_selection(void *p, TSTree *t1, TSTree *t2) {
return 0;
}
Stack *ts_stack_new() {
Stack *self = ts_calloc(1, sizeof(Stack));
if (!self)
goto error;
2016-02-17 20:41:29 -08:00
array_init(&self->heads);
2016-03-03 10:16:10 -08:00
array_init(&self->slices);
2016-02-17 20:41:29 -08:00
array_init(&self->pop_paths);
array_init(&self->node_pool);
self->tree_selection_payload = NULL;
self->tree_selection_function = ts_stack__default_tree_selection;
2016-02-17 20:41:29 -08:00
if (!array_grow(&self->heads, 4))
goto error;
2016-03-03 10:16:10 -08:00
if (!array_grow(&self->slices, 4))
goto error;
2016-02-17 20:41:29 -08:00
if (!array_grow(&self->pop_paths, 4))
goto error;
2016-02-17 20:41:29 -08:00
if (!array_grow(&self->node_pool, 20))
goto error;
2016-02-17 20:41:29 -08:00
array_push(&self->heads, NULL);
2015-10-14 21:52:13 -07:00
return self;
error:
if (self) {
if (self->heads.contents)
2016-02-17 20:41:29 -08:00
array_delete(&self->heads);
2016-03-03 10:16:10 -08:00
if (self->slices.contents)
array_delete(&self->slices);
if (self->pop_paths.contents)
2016-02-17 20:41:29 -08:00
array_delete(&self->pop_paths);
if (self->node_pool.contents)
2016-02-17 20:41:29 -08:00
array_delete(&self->node_pool);
ts_free(self);
}
return NULL;
2015-05-25 20:21:13 -07:00
}
/*
2015-06-03 09:44:13 -07:00
* Section: Reading from the stack
2015-05-25 20:21:13 -07:00
*/
2016-02-25 21:46:13 -08:00
TSStateId ts_stack_top_state(const Stack *self, int head_index) {
StackEntry *entry = ts_stack_head((Stack *)self, head_index);
return entry ? entry->state : 0;
}
2016-02-25 21:46:13 -08:00
TSLength ts_stack_top_position(const Stack *self, int head_index) {
StackEntry *entry = ts_stack_head((Stack *)self, head_index);
return entry ? entry->position : ts_length_zero();
}
2016-02-25 21:46:13 -08:00
StackEntry *ts_stack_head(Stack *self, int head_index) {
StackNode *node = self->heads.contents[head_index];
2015-06-03 09:44:13 -07:00
return node ? &node->entry : NULL;
2015-05-25 20:21:13 -07:00
}
2015-10-14 21:52:13 -07:00
int ts_stack_head_count(const Stack *self) {
return self->heads.size;
2015-05-25 20:21:13 -07:00
}
2015-09-18 18:04:52 -07:00
int ts_stack_entry_next_count(const StackEntry *entry) {
return ((const StackNode *)entry)->successor_count;
2015-06-03 09:44:13 -07:00
}
2016-02-25 21:46:13 -08:00
StackEntry *ts_stack_entry_next(const StackEntry *entry, int successor_index) {
return &((const StackNode *)entry)->successors[successor_index].node->entry;
2015-06-03 09:44:13 -07:00
}
/*
* Section: Manipulating nodes (Private)
*/
2015-10-14 21:52:13 -07:00
static void stack_node_retain(StackNode *self) {
if (!self)
2015-07-27 18:29:48 -07:00
return;
2015-10-14 21:52:13 -07:00
assert(self->ref_count != 0);
self->ref_count++;
2015-06-03 09:44:13 -07:00
}
2016-02-25 21:46:13 -08:00
static void stack_node_release(StackNode *self, StackNodeArray *pool) {
if (!self)
return;
assert(self->ref_count != 0);
self->ref_count--;
if (self->ref_count == 0) {
for (int i = 0; i < self->successor_count; i++) {
stack_node_release(self->successors[i].node, pool);
ts_tree_release(self->successors[i].tree);
}
2016-02-25 21:46:13 -08:00
if (pool->size >= MAX_NODE_POOL_SIZE)
ts_free(self);
else
2016-02-25 21:46:13 -08:00
array_push(pool, self);
2015-06-03 09:44:13 -07:00
}
}
2016-02-25 21:46:13 -08:00
static StackNode *stack_node_new(StackNode *next, TSTree *tree, TSStateId state,
StackNodeArray *pool) {
assert(tree->ref_count > 0);
StackNode *node;
2016-02-25 21:46:13 -08:00
if (pool->size == 0) {
node = ts_malloc(sizeof(StackNode));
if (!node)
return NULL;
} else {
2016-02-25 21:46:13 -08:00
node = array_pop(pool);
}
2015-06-03 09:44:13 -07:00
ts_tree_retain(tree);
stack_node_retain(next);
TSLength position = ts_tree_total_size(tree);
if (next)
position = ts_length_add(next->entry.position, position);
*node = (StackNode){
2015-06-03 09:44:13 -07:00
.ref_count = 1,
.successor_count = 1,
2016-02-25 21:46:13 -08:00
.successors = { { next, tree } },
.entry = {.state = state, .position = position },
2015-06-03 09:44:13 -07:00
};
return node;
2015-06-03 09:44:13 -07:00
}
2016-03-03 10:16:10 -08:00
static void ts_stack_slice__clear(StackSlice *slice) {
ts_tree_array_clear(&slice->trees);
array_delete(&slice->trees);
}
2016-03-03 10:16:10 -08:00
static void ts_stack__merge_slice(Stack *self, StackSlice *slice,
StackSlice *new_slice) {
bool should_update = false;
2016-03-03 10:16:10 -08:00
if (slice->trees.size < new_slice->trees.size) {
should_update = true;
2016-03-03 10:16:10 -08:00
} else if (slice->trees.size == new_slice->trees.size) {
for (size_t i = 0; i < slice->trees.size; i++) {
TSTree *tree = slice->trees.contents[i];
TSTree *new_tree = new_slice->trees.contents[i];
2016-02-17 14:45:00 -08:00
int comparison = self->tree_selection_function(
self->tree_selection_payload, tree, new_tree);
if (comparison < 0) {
break;
} else if (comparison > 0) {
should_update = true;
break;
}
}
}
if (should_update) {
2016-03-03 10:16:10 -08:00
ts_stack_slice__clear(slice);
slice->trees = new_slice->trees;
slice->trees.size = new_slice->trees.size;
} else {
2016-03-03 10:16:10 -08:00
ts_stack_slice__clear(new_slice);
}
}
2016-02-25 21:46:13 -08:00
static void stack_node__add_successor(StackNode *self, TSTree *new_tree,
StackNode *new_node) {
for (int i = 0; i < self->successor_count; i++) {
StackLink successor = self->successors[i];
if (successor.tree == new_tree) {
if (successor.node == new_node)
return;
if (successor.node && new_node &&
successor.node->entry.state == new_node->entry.state) {
for (int j = 0; j < new_node->successor_count; j++) {
2016-02-25 21:46:13 -08:00
stack_node__add_successor(successor.node, new_node->successors[j].tree,
new_node->successors[j].node);
}
return;
}
}
}
stack_node_retain(new_node);
ts_tree_retain(new_tree);
self->successors[self->successor_count++] = (StackLink){
2016-02-25 21:46:13 -08:00
new_node, new_tree,
};
2015-06-03 09:44:13 -07:00
}
2015-05-25 20:21:13 -07:00
/*
2015-06-03 09:44:13 -07:00
* Section: Mutating the stack (Private)
2015-05-25 20:21:13 -07:00
*/
2015-10-14 21:52:13 -07:00
static int ts_stack__add_head(Stack *self, StackNode *node) {
2016-02-17 20:41:29 -08:00
if (array_push(&self->heads, node)) {
stack_node_retain(node);
return self->heads.size - 1;
} else {
return -1;
2015-06-03 09:44:13 -07:00
}
}
2015-11-20 00:01:53 -08:00
static int ts_stack__find_head(Stack *self, StackNode *node) {
for (size_t i = 0; i < self->heads.size; i++) {
2016-02-17 14:45:00 -08:00
if (self->heads.contents[i] == node)
return i;
}
2015-11-20 00:01:53 -08:00
return -1;
}
2015-10-14 21:52:13 -07:00
void ts_stack_remove_head(Stack *self, int head_index) {
2016-02-17 20:41:29 -08:00
StackNode *node = *array_get(&self->heads, head_index);
2016-02-25 21:46:13 -08:00
stack_node_release(node, &self->node_pool);
2016-02-17 20:41:29 -08:00
array_erase(&self->heads, head_index);
2015-06-03 09:44:13 -07:00
}
/*
* Section: Mutating the stack (Public)
*/
2016-02-25 21:46:13 -08:00
StackPushResult ts_stack_push(Stack *self, int head_index, TSTree *tree,
TSStateId state) {
TSLength position = ts_tree_total_size(tree);
2016-02-17 20:41:29 -08:00
StackNode *current_head = *array_get(&self->heads, head_index);
2016-02-17 14:45:00 -08:00
if (current_head)
position = ts_length_add(current_head->entry.position, position);
for (int i = 0; i < head_index; i++) {
2016-02-17 14:45:00 -08:00
StackNode *prior_node = self->heads.contents[i];
StackEntry prior_entry = prior_node->entry;
if (prior_entry.state == state &&
ts_length_eq(prior_entry.position, position)) {
stack_node__add_successor(prior_node, tree, current_head);
ts_stack_remove_head(self, head_index);
return StackPushMerged;
}
}
2016-02-25 21:46:13 -08:00
StackNode *new_head =
stack_node_new(current_head, tree, state, &self->node_pool);
if (!new_head)
return StackPushFailed;
2016-02-25 21:46:13 -08:00
stack_node_release(current_head, &self->node_pool);
2016-02-17 14:45:00 -08:00
self->heads.contents[head_index] = new_head;
return StackPushContinued;
2015-05-25 20:21:13 -07:00
}
2015-10-14 21:52:13 -07:00
int ts_stack_split(Stack *self, int head_index) {
2016-02-17 14:45:00 -08:00
StackNode *head = self->heads.contents[head_index];
return ts_stack__add_head(self, head);
2015-06-03 09:44:13 -07:00
}
2016-03-03 10:16:10 -08:00
StackSliceArray ts_stack_pop(Stack *self, int head_index, int child_count,
2016-02-17 20:41:29 -08:00
bool count_extra) {
2016-03-03 10:16:10 -08:00
array_clear(&self->slices);
2016-02-17 20:41:29 -08:00
array_clear(&self->pop_paths);
2016-02-17 20:41:29 -08:00
StackNode *previous_head = *array_get(&self->heads, head_index);
int capacity = (child_count == -1) ? STARTING_TREE_CAPACITY : child_count;
2015-11-20 00:01:53 -08:00
PopPath initial_path = {
2016-02-17 20:41:29 -08:00
.goal_tree_count = child_count, .node = previous_head, .is_shared = false,
2015-11-20 00:01:53 -08:00
};
2016-02-17 20:41:29 -08:00
array_init(&initial_path.trees);
2015-11-20 00:01:53 -08:00
2016-02-17 20:41:29 -08:00
if (!array_grow(&initial_path.trees, capacity))
goto error;
2016-02-17 20:41:29 -08:00
if (!array_push(&self->pop_paths, initial_path))
goto error;
2015-05-25 20:21:13 -07:00
/*
* Reduce along every possible path in parallel. Stop when the given number
* of child trees have been collected along every path.
2015-05-25 20:21:13 -07:00
*/
bool all_paths_done = false;
while (!all_paths_done) {
all_paths_done = true;
2015-11-20 00:01:53 -08:00
for (size_t i = 0; i < self->pop_paths.size; i++) {
2016-02-17 14:45:00 -08:00
PopPath *path = &self->pop_paths.contents[i];
2015-11-20 00:01:53 -08:00
StackNode *node = path->node;
if (!node || path->trees.size == path->goal_tree_count)
continue;
all_paths_done = false;
/*
* If a node has more than one successor, create new paths for each of
* the additional successors.
*/
for (int j = 0; j < node->successor_count; j++) {
StackLink successor = node->successors[j];
PopPath *next_path;
if (j == 0) {
next_path = path;
} else {
if (!array_push(&self->pop_paths, *path))
goto error;
next_path = array_back(&self->pop_paths);
next_path->is_shared = true;
}
2015-11-20 00:01:53 -08:00
if (next_path->is_shared) {
TreeArray trees = path->trees;
trees.size--;
next_path->trees = ts_tree_array_copy(&trees);
next_path->is_shared = false;
}
2015-11-20 00:01:53 -08:00
if (successor.tree->extra && !count_extra)
next_path->goal_tree_count++;
ts_tree_retain(successor.tree);
if (!array_push(&next_path->trees, successor.tree))
goto error;
next_path->node = successor.node;
if (successor.tree->symbol == ts_builtin_sym_error && !count_extra) {
next_path->goal_tree_count = next_path->trees.size;
}
}
}
2015-05-25 20:21:13 -07:00
}
2015-11-20 00:01:53 -08:00
for (size_t i = 0; i < self->pop_paths.size; i++) {
2016-02-17 14:45:00 -08:00
PopPath *path = &self->pop_paths.contents[i];
2015-11-20 00:01:53 -08:00
if (!path->is_shared)
2016-02-17 20:41:29 -08:00
array_reverse(&path->trees);
2015-11-20 00:01:53 -08:00
2016-03-03 10:16:10 -08:00
StackSlice slice = {
.trees = path->trees, .head_index = -1,
2015-11-20 00:01:53 -08:00
};
if (i == 0) {
stack_node_retain(path->node);
2016-02-17 14:45:00 -08:00
self->heads.contents[head_index] = path->node;
2016-03-03 10:16:10 -08:00
slice.head_index = head_index;
2015-06-03 09:44:13 -07:00
} else {
2016-03-03 10:16:10 -08:00
slice.head_index = ts_stack__find_head(self, path->node);
if (slice.head_index == -1) {
slice.head_index = ts_stack__add_head(self, path->node);
if (slice.head_index == -1)
goto error;
} else {
2016-03-03 10:16:10 -08:00
bool merged = false;
for (size_t j = 0; j < self->slices.size; j++) {
StackSlice *prior_result = &self->slices.contents[j];
if (prior_result->head_index == slice.head_index) {
ts_stack__merge_slice(self, prior_result, &slice);
merged = true;
break;
}
}
2016-03-03 10:16:10 -08:00
if (merged)
continue;
}
}
2015-05-25 20:21:13 -07:00
2016-03-03 10:16:10 -08:00
if (!array_push(&self->slices, slice))
goto error;
}
2016-02-25 21:46:13 -08:00
stack_node_release(previous_head, &self->node_pool);
2016-03-03 10:16:10 -08:00
return self->slices;
error:
2016-02-17 20:41:29 -08:00
array_delete(&initial_path.trees);
2016-03-03 10:16:10 -08:00
StackSliceArray slices;
array_init(&slices);
return slices;
2015-05-25 20:21:13 -07:00
}
2015-10-14 21:52:13 -07:00
void ts_stack_shrink(Stack *self, int head_index, int count) {
2016-02-17 20:41:29 -08:00
StackNode *head = *array_get(&self->heads, head_index);
2016-02-17 14:45:00 -08:00
StackNode *new_head = head;
for (int i = 0; i < count; i++) {
2015-07-27 18:29:48 -07:00
if (new_head->successor_count == 0)
break;
new_head = new_head->successors[0].node;
}
stack_node_retain(new_head);
2016-02-25 21:46:13 -08:00
stack_node_release(head, &self->node_pool);
2016-02-17 14:45:00 -08:00
self->heads.contents[head_index] = new_head;
}
2015-10-14 21:52:13 -07:00
void ts_stack_clear(Stack *self) {
2016-02-17 14:45:00 -08:00
for (size_t i = 0; i < self->heads.size; i++)
2016-02-25 21:46:13 -08:00
stack_node_release(self->heads.contents[i], &self->node_pool);
2016-02-17 20:41:29 -08:00
array_clear(&self->heads);
array_push(&self->heads, NULL);
}
void ts_stack_set_tree_selection_callback(Stack *self, void *payload,
TreeSelectionFunction function) {
self->tree_selection_payload = payload;
self->tree_selection_function = function;
}
2016-01-28 21:18:57 -08:00
void ts_stack_delete(Stack *self) {
if (self->pop_paths.contents)
2016-03-03 10:16:10 -08:00
array_delete(&self->slices);
if (self->pop_paths.contents)
2016-02-17 20:41:29 -08:00
array_delete(&self->pop_paths);
2016-01-28 21:18:57 -08:00
ts_stack_clear(self);
2016-02-17 14:45:00 -08:00
if (self->node_pool.contents) {
for (size_t i = 0; i < self->node_pool.size; i++)
ts_free(self->node_pool.contents[i]);
2016-02-17 20:41:29 -08:00
array_delete(&self->node_pool);
2016-02-17 14:45:00 -08:00
}
2016-02-17 20:41:29 -08:00
array_delete(&self->heads);
2016-01-28 21:18:57 -08:00
ts_free(self);
}
static const char *COLORS[] = {
"red", "blue", "orange", "green", "purple",
};
static size_t COLOR_COUNT = sizeof(COLORS) / sizeof(COLORS[0]);
size_t ts_stack__write_dot_graph(Stack *self, char *string, size_t n,
const char **symbol_names) {
char *cursor = string;
char **s = n > 0 ? &cursor : &string;
cursor += snprintf(*s, n, "digraph stack {\n");
cursor += snprintf(*s, n, "rankdir=\"RL\";\n");
2016-02-25 21:46:13 -08:00
Array(StackNode *)visited_nodes;
array_init(&visited_nodes);
array_clear(&self->pop_paths);
for (size_t i = 0; i < self->heads.size; i++) {
StackNode *node = self->heads.contents[i];
const char *color = COLORS[i % COLOR_COUNT];
cursor += snprintf(*s, n, "node_%p [color=%s];\n", node, color);
2016-02-25 21:46:13 -08:00
array_push(&self->pop_paths, ((PopPath){.node = node }));
}
bool all_paths_done = false;
while (!all_paths_done) {
all_paths_done = true;
for (size_t i = 0; i < self->pop_paths.size; i++) {
PopPath *path = &self->pop_paths.contents[i];
StackNode *node = path->node;
for (size_t j = 0; j < visited_nodes.size; j++) {
if (visited_nodes.contents[j] == node) {
node = NULL;
break;
}
}
if (!node)
continue;
all_paths_done = false;
2016-03-02 09:55:25 -08:00
cursor += snprintf(*s, n, "node_%p [label=", node);
if (node->entry.state == ts_parse_state_error)
cursor += snprintf(*s, n, "\"?\"");
else
cursor += snprintf(*s, n, "%d", node->entry.state);
cursor += snprintf(*s, n, "];\n");
for (int j = 0; j < node->successor_count; j++) {
StackLink successor = node->successors[j];
2016-02-25 21:46:13 -08:00
cursor +=
snprintf(*s, n, "node_%p -> node_%p [label=\"", node, successor.node);
2016-03-02 09:55:25 -08:00
if (successor.tree->symbol == ts_builtin_sym_error) {
cursor += snprintf(*s, n, "ERROR");
} else {
const char *name = symbol_names[successor.tree->symbol];
for (const char *c = name; *c; c++) {
if (*c == '\"' || *c == '\\') {
**s = '\\';
cursor++;
}
**s = *c;
cursor++;
}
}
cursor += snprintf(*s, n, "\"];\n");
if (j == 0) {
path->node = successor.node;
} else {
if (!array_push(&self->pop_paths, *path))
goto error;
PopPath *next_path = array_back(&self->pop_paths);
next_path->node = successor.node;
}
}
if (!array_push(&visited_nodes, node))
goto error;
}
}
cursor += snprintf(*s, n, "node_%p [label=0];\n", NULL);
cursor += snprintf(*s, n, "}\n");
array_delete(&visited_nodes);
return cursor - string;
error:
array_delete(&visited_nodes);
return (size_t)-1;
}
char *ts_stack_dot_graph(Stack *self, const char **symbol_names) {
static char SCRATCH[1];
char *result = NULL;
size_t size = ts_stack__write_dot_graph(self, SCRATCH, 0, symbol_names) + 1;
if (size == (size_t)-1)
goto error;
result = ts_malloc(size * sizeof(char));
if (!result)
goto error;
size = ts_stack__write_dot_graph(self, result, size, symbol_names);
if (size == (size_t)-1)
goto error;
return result;
error:
if (result)
ts_free(result);
return NULL;
}