tree-sitter/src/runtime/stack.c

614 lines
18 KiB
C
Raw Normal View History

2015-05-25 20:21:13 -07:00
#include "tree_sitter/parser.h"
2016-01-15 15:08:42 -08:00
#include "runtime/alloc.h"
2015-05-25 20:21:13 -07:00
#include "runtime/tree.h"
2016-02-17 20:41:29 -08:00
#include "runtime/array.h"
2015-09-18 18:04:52 -07:00
#include "runtime/stack.h"
#include "runtime/length.h"
2015-05-25 20:21:13 -07:00
#include <assert.h>
2016-01-28 21:18:57 -08:00
#include <stdio.h>
2015-05-25 20:21:13 -07:00
2016-04-11 22:41:06 -07:00
/* Capacity of the fixed-size `links` array embedded in every StackNode. */
#define MAX_LINK_COUNT 8
/* Released nodes are kept for reuse until the pool holds this many; beyond
 * that they are freed immediately. */
#define MAX_NODE_POOL_SIZE 50
2015-06-03 09:44:13 -07:00
/* File-local function that the compiler is asked to always inline
 * (uses the GCC/Clang `always_inline` attribute syntax). */
#define INLINE static inline __attribute__((always_inline))
/* Forward declaration: StackLink points at StackNode, and StackNode embeds
 * an array of StackLink. */
typedef struct StackNode StackNode;
/* One edge from a stack node to a node beneath it. */
typedef struct {
/* The node this link leads to. */
StackNode *node;
/* Tree attached to the link; may be NULL (callers check before use). */
TSTree *tree;
/* Pending flag supplied when the link was created. */
bool is_pending;
} StackLink;
struct StackNode {
TSStateId state;
TSLength position;
2016-04-11 22:41:06 -07:00
StackLink links[MAX_LINK_COUNT];
short unsigned int link_count;
2015-06-03 09:44:13 -07:00
short unsigned int ref_count;
unsigned error_cost;
unsigned error_depth;
};
2015-05-25 20:21:13 -07:00
2015-11-20 00:01:53 -08:00
typedef struct {
2016-02-17 20:41:29 -08:00
TreeArray trees;
size_t tree_count;
StackNode *node;
bool is_pending;
2015-11-20 00:01:53 -08:00
} PopPath;
/*
 * Payload shared between ts_stack_pop_count and pop_count_callback.
 *
 * Member order is unchanged; the stray blame-view timestamp line inside the
 * definition was removed.
 */
typedef struct {
  /* Number of (non-extra) trees a path must collect to be popped. */
  size_t goal_tree_count;
  /* Set once a path has been popped at an error-state node. */
  bool found_error;
  /* Set once a path has reached `goal_tree_count`. */
  bool found_valid_path;
} StackPopSession;
2016-02-25 21:46:13 -08:00
/* Growable array of node pointers; used for the pool of recycled nodes. */
typedef Array(StackNode *) StackNodeArray;
/* Top of one stack version. */
typedef struct {
/* Topmost node of this version. */
StackNode *node;
/* Set by ts_stack_halt and reported by ts_stack_is_halted. */
bool is_halted;
} StackHead;
2016-02-17 14:45:00 -08:00
/*
 * The stack itself: a set of version heads over a shared graph of nodes.
 *
 * Member order is unchanged; the stray blame-view timestamp lines inside the
 * definition were removed.
 */
struct Stack {
  /* One entry per stack version; a StackVersion is an index into this array. */
  Array(StackHead) heads;
  /* Scratch result buffer filled by stack__iter and handed back to callers. */
  StackSliceArray slices;
  /* Scratch work list of in-progress paths used during iteration/printing. */
  Array(PopPath) pop_paths;
  /* Released nodes kept for reuse (at most MAX_NODE_POOL_SIZE). */
  StackNodeArray node_pool;
  /* Bottom node with no links; every freshly created/cleared stack starts here. */
  StackNode *base_node;
};
/*
 * Take an additional reference on `self`. A NULL node is ignored.
 * The node must already be alive (non-zero reference count).
 */
static void stack_node_retain(StackNode *self) {
  if (self != NULL) {
    assert(self->ref_count != 0);
    self->ref_count += 1;
  }
}
/*
 * Drop one reference on `self`; a NULL node is ignored.
 *
 * When the count reaches zero the node gives up its links: each linked tree
 * is released and each linked node is released in turn. The node itself is
 * then stored in `pool` for reuse, or freed when the pool already holds
 * MAX_NODE_POOL_SIZE entries or cannot grow.
 *
 * The first link is followed with a loop rather than a recursive call, so a
 * long single-link chain of nodes no longer consumes one C stack frame per
 * node. Only the additional links (at most MAX_LINK_COUNT - 1 per node)
 * still recurse.
 */
static void stack_node_release(StackNode *self, StackNodeArray *pool) {
  while (self) {
    assert(self->ref_count != 0);
    self->ref_count--;
    if (self->ref_count > 0)
      return;

    StackNode *first_linked_node = NULL;
    for (int i = 0; i < self->link_count; i++) {
      if (self->links[i].tree)
        ts_tree_release(self->links[i].tree);
      if (i == 0)
        first_linked_node = self->links[i].node;
      else
        stack_node_release(self->links[i].node, pool);
    }

    /* `self` must not be touched after this point. */
    if (pool->size >= MAX_NODE_POOL_SIZE || !array_push(pool, self))
      ts_free(self);

    self = first_linked_node;
  }
}
/*
 * Create a node with a reference count of 1, reusing a pooled node when one
 * is available and allocating otherwise.
 *
 * next       - node to link beneath the new one, or NULL for a node with no
 *              links. It is retained by the new node.
 * tree       - tree attached to that link; may be NULL. Retained when given.
 * is_pending - pending flag stored on the link.
 * state      - parse state of the new node.
 * position   - position of the new node.
 * pool       - pool of recycled nodes.
 *
 * Returns NULL if a fresh allocation was needed and failed.
 *
 * Error bookkeeping: the cost starts at 1 for the error state (0 otherwise)
 * and adds the linked node's cost plus the tree's `error_size`. The depth is
 * inherited from the linked node and incremented when the link has no tree.
 */
static StackNode *stack_node_new(StackNode *next, TSTree *tree, bool is_pending,
                                 TSStateId state, TSLength position,
                                 StackNodeArray *pool) {
  StackNode *node;
  if (pool->size > 0)
    node = array_pop(pool);
  else if (!(node = ts_malloc(sizeof *node)))
    return NULL;

  /* Members not named here (notably `links`) are zero-initialized, so no
   * empty-brace initializer is needed. */
  *node = (StackNode){
    .ref_count = 1,
    .link_count = 0,
    .state = state,
    .position = position,
    .error_depth = 0,
    .error_cost = (state == ts_parse_state_error) ? 1 : 0,
  };

  if (!next)
    return node;

  stack_node_retain(next);
  node->links[0] = (StackLink){ next, tree, is_pending };
  node->link_count = 1;
  node->error_cost += next->error_cost;
  node->error_depth = next->error_depth;

  if (tree) {
    ts_tree_retain(tree);
    node->error_cost += tree->error_size;
  } else {
    node->error_depth++;
  }

  return node;
}
/*
 * Add `link` to `self`, avoiding duplicates.
 *
 * For an existing link carrying the same tree:
 *   - if it also leads to the same node, nothing is done;
 *   - if it leads to a different node in the same state, the links of the
 *     incoming node are merged into that existing node instead.
 * Otherwise the link is appended, retaining its node and (if any) its tree.
 * When `self` already holds MAX_LINK_COUNT links the new link is dropped.
 */
static void stack_node_add_link(StackNode *self, StackLink link) {
  for (int i = 0; i < self->link_count; i++) {
    StackLink existing_link = self->links[i];
    if (existing_link.tree != link.tree)
      continue;
    if (existing_link.node == link.node)
      return;
    if (existing_link.node->state == link.node->state) {
      for (int j = 0; j < link.node->link_count; j++)
        stack_node_add_link(existing_link.node, link.node->links[j]);
      return;
    }
  }

  if (self->link_count >= MAX_LINK_COUNT)
    return;

  stack_node_retain(link.node);
  if (link.tree)
    ts_tree_retain(link.tree);
  self->links[self->link_count++] = (StackLink){
    link.node, link.tree, link.is_pending,
  };
}
/*
 * Append a new, non-halted head pointing at `node` and retain the node.
 * Returns the index of the new version, or STACK_VERSION_NONE if the heads
 * array could not grow (in which case `node` is not retained).
 */
static StackVersion ts_stack__add_version(Stack *self, StackNode *node) {
  if (array_push(&self->heads, ((StackHead){ node, false }))) {
    stack_node_retain(node);
    return (StackVersion)(self->heads.size - 1);
  }
  return STACK_VERSION_NONE;
}
/*
 * Record `trees` as a slice ending at `node`.
 *
 * The existing slices are scanned from last to first. If one of them refers
 * to a version whose head is `node`, the new slice reuses that version and is
 * inserted directly after it. Otherwise a new version is created for `node`
 * and the slice is appended.
 *
 * Returns false if a required array growth fails.
 */
static bool ts_stack__add_slice(Stack *self, StackNode *node, TreeArray *trees) {
  /* `i` is one past the index being examined, so the countdown needs no
   * unsigned wrap-around trick. */
  for (size_t i = self->slices.size; i > 0; i--) {
    StackVersion version = self->slices.contents[i - 1].version;
    if (self->heads.contents[version].node == node) {
      StackSlice slice = { *trees, version };
      return array_insert(&self->slices, i, slice);
    }
  }

  StackVersion version = ts_stack__add_version(self, node);
  if (version == STACK_VERSION_NONE)
    return false;
  StackSlice slice = { *trees, version };
  return array_push(&self->slices, slice);
}
/*
 * Walk downward from the head of `version`, following every link, and let
 * `callback` decide what to do at each node reached.
 *
 * For each in-progress path the callback receives the node's state, the
 * trees gathered so far, the count of non-extra trees, whether the node is
 * the base node, and whether every traversed link was pending. Its result
 * is interpreted as a bit set:
 *   - StackIteratePop:  the gathered trees (reversed) are recorded as a
 *                       slice via ts_stack__add_slice.
 *   - StackIterateStop: the path is abandoned after this node. A node with
 *                       no links always stops the path.
 * A path that continues is extended along links[0] in place; each further
 * link gets its own copy of the path appended to the work list.
 *
 * Returns { StackPopSucceeded, slices } on success. On allocation failure the
 * trees of the remaining paths are deleted, the slice list is cleared and a
 * result with status StackPopFailed is returned.
 *
 * The logic is unchanged; only the stray blame-view timestamp lines that had
 * been interleaved with the statements were removed.
 */
INLINE StackPopResult stack__iter(Stack *self, StackVersion version,
                                  StackIterateCallback callback, void *payload) {
  array_clear(&self->slices);

  PopPath pop_path = {
    .node = array_get(&self->heads, version)->node,
    .trees = array_new(),
    .tree_count = 0,
    .is_pending = true,
  };

  array_clear(&self->pop_paths);
  if (!array_push(&self->pop_paths, pop_path))
    goto error;

  while (self->pop_paths.size > 0) {
    for (size_t i = 0, size = self->pop_paths.size; i < size; i++) {
      PopPath *path = &self->pop_paths.contents[i];
      StackNode *node = path->node;
      bool is_done = node == self->base_node;

      StackIterateAction action =
        callback(payload, node->state, &path->trees, path->tree_count, is_done,
                 path->is_pending);

      bool should_pop = action & StackIteratePop;
      bool should_stop = action & StackIterateStop || node->link_count == 0;

      if (should_pop) {
        TreeArray trees = path->trees;
        /* A path that keeps going still needs its own array, so the slice
         * gets a copy; a stopping path hands its array over as-is. */
        if (!should_stop)
          if (!ts_tree_array_copy(trees, &trees))
            goto error;
        array_reverse(&trees);
        if (!ts_stack__add_slice(self, node, &trees))
          goto error;
      }

      if (should_stop) {
        if (!should_pop)
          ts_tree_array_delete(&path->trees);
        array_erase(&self->pop_paths, i);
        /* Re-visit index i, which now holds the next path. */
        i--, size--;
        continue;
      }

      /* Links 1..n-1 fork copies of the path; links[0] is handled last
       * (j == link_count) so the original entry is still unmodified while
       * the copies are taken. */
      for (size_t j = 1; j <= node->link_count; j++) {
        PopPath *next_path;
        StackLink link;
        if (j == node->link_count) {
          link = node->links[0];
          next_path = &self->pop_paths.contents[i];
        } else {
          link = node->links[j];
          if (!array_push(&self->pop_paths, self->pop_paths.contents[i]))
            goto error;
          next_path = array_back(&self->pop_paths);
          if (!ts_tree_array_copy(next_path->trees, &next_path->trees))
            goto error;
        }

        next_path->node = link.node;
        if (!link.is_pending)
          next_path->is_pending = false;
        if (link.tree) {
          if (!link.tree->extra)
            next_path->tree_count++;
          if (!array_push(&next_path->trees, link.tree))
            goto error;
          ts_tree_retain(link.tree);
        }
      }
    }
  }

  return (StackPopResult){ StackPopSucceeded, self->slices };

error:
  for (size_t i = 0; i < self->pop_paths.size; i++)
    ts_tree_array_delete(&self->pop_paths.contents[i].trees);
  array_clear(&self->slices);
  return (StackPopResult){.status = StackPopFailed };
}
2016-04-15 21:33:31 -07:00
/*
 * Allocate and initialize a stack containing a single version whose head is
 * the base node.
 *
 * Returns NULL if any allocation fails; everything allocated up to that
 * point is freed first.
 */
Stack *ts_stack_new() {
  Stack *self = ts_calloc(1, sizeof(Stack));
  if (!self)
    goto error;

  array_init(&self->heads);
  array_init(&self->slices);
  array_init(&self->pop_paths);
  array_init(&self->node_pool);

  if (!array_grow(&self->heads, 4))
    goto error;
  if (!array_grow(&self->slices, 4))
    goto error;
  if (!array_grow(&self->pop_paths, 4))
    goto error;
  if (!array_grow(&self->node_pool, MAX_NODE_POOL_SIZE))
    goto error;

  self->base_node =
    stack_node_new(NULL, NULL, false, 0, ts_length_zero(), &self->node_pool);
  /* Check the allocation before using the node. */
  if (!self->base_node)
    goto error;

  /* One reference belongs to `base_node`, the second to heads[0]. */
  stack_node_retain(self->base_node);
  /* `heads` was grown to 4 entries above, so this push needs no allocation. */
  array_push(&self->heads, ((StackHead){ self->base_node, false }));

  return self;

error:
  if (self) {
    if (self->heads.contents)
      array_delete(&self->heads);
    if (self->slices.contents)
      array_delete(&self->slices);
    if (self->pop_paths.contents)
      array_delete(&self->pop_paths);
    if (self->node_pool.contents)
      array_delete(&self->node_pool);
    ts_free(self);
  }
  return NULL;
}
/*
 * Destroy a stack created by ts_stack_new.
 *
 * Releases the base node and every head, frees the nodes that ended up in
 * the pool, then frees the arrays and the stack itself.
 */
void ts_stack_delete(Stack *self) {
  if (self->slices.contents)
    array_delete(&self->slices);
  if (self->pop_paths.contents)
    array_delete(&self->pop_paths);

  /* Releasing may move nodes into the pool, so the pool is emptied last. */
  stack_node_release(self->base_node, &self->node_pool);
  for (size_t i = 0; i < self->heads.size; i++)
    stack_node_release(self->heads.contents[i].node, &self->node_pool);
  array_clear(&self->heads);

  if (self->node_pool.contents) {
    for (size_t i = 0; i < self->node_pool.size; i++)
      ts_free(self->node_pool.contents[i]);
    array_delete(&self->node_pool);
  }

  array_delete(&self->heads);
  ts_free(self);
}
/* Number of versions (heads) currently held by the stack. */
size_t ts_stack_version_count(const Stack *self) {
  const size_t head_count = self->heads.size;
  return head_count;
}
/*
 * Parse state of the head node of `version`.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
TSStateId ts_stack_top_state(const Stack *self, StackVersion version) {
  return array_get(&self->heads, version)->node->state;
}
/*
 * Position recorded on the head node of `version`.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
TSLength ts_stack_top_position(const Stack *self, StackVersion version) {
  return array_get(&self->heads, version)->node->position;
}
/* Accumulated error cost stored on the head node of `version`. */
unsigned ts_stack_error_cost(const Stack *self, StackVersion version) {
  const StackNode *top = array_get(&self->heads, version)->node;
  return top->error_cost;
}
/* Error depth stored on the head node of `version`. */
unsigned ts_stack_error_depth(const Stack *self, StackVersion version) {
  const StackNode *top = array_get(&self->heads, version)->node;
  return top->error_depth;
}
/*
 * Follow the first link of each node downward from the head of `version`
 * and, at the first link whose tree has a non-zero `error_size`, return
 * ts_tree_last_error_size() of that tree. Returns 0 if a node without links
 * is reached first.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
size_t ts_stack_last_repaired_error_size(const Stack *self,
                                         StackVersion version) {
  StackNode *node = array_get(&self->heads, version)->node;
  while (node->link_count != 0) {
    TSTree *tree = node->links[0].tree;
    if (tree && tree->error_size > 0)
      return ts_tree_last_error_size(tree);
    node = node->links[0].node;
  }
  return 0;
}
2016-04-15 21:33:31 -07:00
/*
 * Push a new node onto `version`.
 *
 * tree       - tree to attach to the link from the new node to the current
 *              head; may be NULL.
 * is_pending - pending flag for that link.
 * state      - parse state of the new node.
 *
 * The new node's position is the current head's position advanced by
 * ts_tree_total_size(tree), or the same position when `tree` is NULL.
 *
 * Returns false, leaving the version untouched, if the node cannot be
 * allocated.
 * (The stray blame-view timestamp lines inside the body were removed.)
 */
bool ts_stack_push(Stack *self, StackVersion version, TSTree *tree,
                   bool is_pending, TSStateId state) {
  StackNode *node = array_get(&self->heads, version)->node;
  TSLength position =
    tree ? ts_length_add(node->position, ts_tree_total_size(tree))
         : node->position;

  StackNode *new_node =
    stack_node_new(node, tree, is_pending, state, position, &self->node_pool);
  if (!new_node)
    return false;

  /* The new node holds its own reference to the old head; drop the one that
   * belonged to the heads array. */
  stack_node_release(node, &self->node_pool);
  self->heads.contents[version].node = new_node;
  return true;
}
/*
 * Public entry point for iterating over the paths below the head of
 * `version`; forwards directly to stack__iter.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
StackPopResult ts_stack_iterate(Stack *self, StackVersion version,
                                StackIterateCallback callback, void *payload) {
  return stack__iter(self, version, callback, payload);
}
/*
 * Iteration callback for ts_stack_pop_count; `payload` is a StackPopSession.
 *
 * - A path that has collected exactly `goal_tree_count` trees is popped and
 *   stopped, and `found_valid_path` is set.
 * - Otherwise, at an error-state node: the first such path (when no valid
 *   path has been seen yet) is popped and stopped and `found_error` is set;
 *   any later one is just stopped.
 * - Otherwise the path keeps going.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
INLINE StackIterateAction pop_count_callback(void *payload, TSStateId state,
                                             TreeArray *trees, size_t tree_count,
                                             bool is_done, bool is_pending) {
  StackPopSession *pop_session = (StackPopSession *)payload;

  if (tree_count == pop_session->goal_tree_count) {
    pop_session->found_valid_path = true;
    return StackIteratePop | StackIterateStop;
  }

  if (state == ts_parse_state_error) {
    if (pop_session->found_valid_path || pop_session->found_error) {
      return StackIterateStop;
    } else {
      pop_session->found_error = true;
      return StackIteratePop | StackIterateStop;
    }
  }

  return StackIterateNone;
}
2016-04-04 12:25:57 -07:00
/*
 * Pop `count` trees from `version` along every path.
 *
 * If the iteration hit an error state but no path reached `count` trees,
 * the status becomes StackPopStoppedAtError. If both an error path and a
 * valid path were found, the first slice (taken to be the error one) is
 * discarded; when the following slice belongs to a different version, the
 * error slice's version is removed and the remaining slice versions are
 * shifted down by one.
 */
StackPopResult ts_stack_pop_count(Stack *self, StackVersion version,
                                  size_t count) {
  StackPopSession session = {
    .goal_tree_count = count, .found_error = false, .found_valid_path = false,
  };

  StackPopResult pop = stack__iter(self, version, pop_count_callback, &session);
  if (!(pop.status && session.found_error))
    return pop;

  if (!session.found_valid_path) {
    pop.status = StackPopStoppedAtError;
    return pop;
  }

  StackSlice error_slice = pop.slices.contents[0];
  ts_tree_array_delete(&error_slice.trees);
  array_erase(&pop.slices, 0);

  if (array_front(&pop.slices)->version != error_slice.version) {
    ts_stack_remove_version(self, error_slice.version);
    for (StackVersion i = 0; i < pop.slices.size; i++)
      pop.slices.contents[i].version--;
  }

  return pop;
}
/*
 * Iteration callback for ts_stack_pop_pending.
 *
 * A path continues until it has collected at least one (non-extra) tree. At
 * that point it is stopped, and popped only if every link it traversed was
 * pending.
 * (The stray blame-view timestamp lines inside the body were removed.)
 */
INLINE StackIterateAction pop_pending_callback(void *payload, TSStateId state,
                                               TreeArray *trees,
                                               size_t tree_count, bool is_done,
                                               bool is_pending) {
  if (tree_count >= 1) {
    if (is_pending) {
      return StackIteratePop | StackIterateStop;
    } else {
      return StackIterateStop;
    }
  } else {
    return StackIterateNone;
  }
}
2016-04-04 12:25:57 -07:00
/*
 * Pop the topmost tree of `version` if it was pushed as pending.
 * When a slice is produced, the version created for it is renumbered to
 * take the place of `version`, and the slice is updated to match.
 */
StackPopResult ts_stack_pop_pending(Stack *self, StackVersion version) {
  StackPopResult pop = stack__iter(self, version, pop_pending_callback, NULL);
  if (pop.slices.size == 0)
    return pop;

  StackSlice *first_slice = &pop.slices.contents[0];
  ts_stack_renumber_version(self, first_slice->version, version);
  first_slice->version = version;
  return pop;
}
/*
 * Iteration callback for ts_stack_pop_all: keep walking until the base node
 * is reached, then pop and stop.
 */
INLINE StackIterateAction pop_all_callback(void *payload, TSStateId state,
                                           TreeArray *trees, size_t tree_count,
                                           bool is_done, bool is_pending) {
  if (!is_done)
    return StackIterateNone;
  return StackIteratePop | StackIterateStop;
}
/* Pop everything from `version` down to the base node, along every path. */
StackPopResult ts_stack_pop_all(Stack *self, StackVersion version) {
  StackPopResult result = stack__iter(self, version, pop_all_callback, NULL);
  return result;
}
2016-04-15 21:33:31 -07:00
/*
 * Remove `version`: release its head node and erase its entry, which shifts
 * every later version down by one index.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
void ts_stack_remove_version(Stack *self, StackVersion version) {
  StackNode *node = array_get(&self->heads, version)->node;
  stack_node_release(node, &self->node_pool);
  array_erase(&self->heads, version);
}
/*
 * Move version `v1` into slot `v2`, discarding what `v2` held.
 *
 * Requires v2 < v1 and v1 to be a valid version. The old head of `v2` is
 * released, the whole head entry of `v1` is copied over it, and slot `v1`
 * is erased.
 * (The stray blame-view timestamp line inside the body was removed.)
 */
void ts_stack_renumber_version(Stack *self, StackVersion v1, StackVersion v2) {
  assert(v2 < v1);
  assert((size_t)v1 < self->heads.size);

  stack_node_release(self->heads.contents[v2].node, &self->node_pool);
  self->heads.contents[v2] = self->heads.contents[v1];
  array_erase(&self->heads, v1);
}
/*
 * Append a copy of `version`'s head (node and halted flag) as a new version
 * and retain the shared node. Returns the new version's index, or
 * STACK_VERSION_NONE if the heads array could not grow.
 */
StackVersion ts_stack_duplicate_version(Stack *self, StackVersion version) {
  assert(version < self->heads.size);

  StackHead duplicate = self->heads.contents[version];
  if (!array_push(&self->heads, duplicate))
    return STACK_VERSION_NONE;

  stack_node_retain(duplicate.node);
  return self->heads.size - 1;
}
/*
 * Try to merge `new_version` into `version`.
 *
 * The two heads are mergeable when they agree on state, character position,
 * error depth and error cost. In that case every link of the new head is
 * added to the existing head, `new_version` is removed, and true is
 * returned. Otherwise nothing changes and false is returned.
 */
bool ts_stack_merge(Stack *self, StackVersion version, StackVersion new_version) {
  StackNode *node = self->heads.contents[version].node;
  StackNode *new_node = self->heads.contents[new_version].node;

  bool is_mergeable = new_node->state == node->state &&
                      new_node->position.chars == node->position.chars &&
                      new_node->error_depth == node->error_depth &&
                      new_node->error_cost == node->error_cost;
  if (!is_mergeable)
    return false;

  for (size_t link_index = 0; link_index < new_node->link_count; link_index++)
    stack_node_add_link(node, new_node->links[link_index]);
  ts_stack_remove_version(self, new_version);
  return true;
}
/* Mark `version` as halted. */
void ts_stack_halt(Stack *self, StackVersion version) {
  StackHead *head = array_get(&self->heads, version);
  head->is_halted = true;
}
/* Report whether `version` has been marked as halted. */
bool ts_stack_is_halted(Stack *self, StackVersion version) {
  StackHead *head = array_get(&self->heads, version);
  return head->is_halted;
}
2016-04-04 11:59:10 -07:00
/*
 * Reset the stack to a single, non-halted version whose head is the base
 * node. All existing heads are released.
 * (The stray blame-view timestamp lines inside the body were removed.)
 */
void ts_stack_clear(Stack *self) {
  /* Reference for the new heads[0]; taken first so the base node stays
   * alive while the old heads are released. */
  stack_node_retain(self->base_node);
  for (size_t i = 0; i < self->heads.size; i++)
    stack_node_release(self->heads.contents[i].node, &self->node_pool);
  array_clear(&self->heads);
  array_push(&self->heads, ((StackHead){ self->base_node, false }));
}
/*
 * Write the stack as a Graphviz "digraph" to `f` (stderr when `f` is NULL).
 *
 * self         - stack to print; its `pop_paths` scratch array is overwritten.
 * symbol_names - table indexed by tree symbol, used for link labels.
 * f            - output stream, or NULL for stderr.
 *
 * Every non-halted head is printed with an edge to its node; nodes are then
 * visited once each by following links downward. Allocation recording is
 * switched off for the duration of the call and restored before returning.
 *
 * Returns false if a scratch array cannot grow; in that case the output is
 * left incomplete.
 *
 * Changes from the previous version:
 *   - size_t values are printed with %zu instead of %lu.
 *   - pointers passed to %p are cast to `void *`.
 *   - the path entry is copied to a local before array_push, so no pointer
 *     into `pop_paths` is dereferenced after the array may have been
 *     reallocated.
 *   - the error path frees `visited_nodes` before restoring allocation
 *     recording, matching the success path.
 */
bool ts_stack_print_dot_graph(Stack *self, const char **symbol_names, FILE *f) {
  bool was_recording_allocations = ts_toggle_allocation_recording(false);
  if (!f)
    f = stderr;

  fprintf(f, "digraph stack {\n");
  fprintf(f, "rankdir=\"RL\";\n");
  fprintf(f, "edge [arrowhead=none]\n");

  Array(StackNode *) visited_nodes = array_new();

  array_clear(&self->pop_paths);
  for (size_t i = 0; i < self->heads.size; i++) {
    if (self->heads.contents[i].is_halted)
      continue;
    StackNode *node = self->heads.contents[i].node;
    fprintf(f, "node_head_%zu [shape=none, label=\"\"]\n", i);
    fprintf(
      f, "node_head_%zu -> node_%p [label=%zu, fontcolor=blue, weight=10000]\n",
      i, (void *)node, i);
    if (!array_push(&self->pop_paths, ((PopPath){.node = node })))
      goto error;
  }

  bool all_paths_done = false;
  while (!all_paths_done) {
    all_paths_done = true;

    for (size_t i = 0; i < self->pop_paths.size; i++) {
      StackNode *node = self->pop_paths.contents[i].node;

      /* Skip nodes that were already printed via another path. */
      for (size_t j = 0; j < visited_nodes.size; j++) {
        if (visited_nodes.contents[j] == node) {
          node = NULL;
          break;
        }
      }
      if (!node)
        continue;

      all_paths_done = false;

      fprintf(f, "node_%p [", (void *)node);
      if (node->state == ts_parse_state_error)
        fprintf(f, "label=\"?\"");
      else if (node->link_count == 1 && node->links[0].tree &&
               node->links[0].tree->extra)
        fprintf(f, "shape=point margin=0 label=\"\"");
      else
        fprintf(f, "label=\"%d\"", node->state);
      fprintf(f, " tooltip=\"error-count:%u, error-cost:%u\"];\n",
              node->error_depth, node->error_cost);

      for (int j = 0; j < node->link_count; j++) {
        StackLink link = node->links[j];

        fprintf(f, "node_%p -> node_%p [", (void *)node, (void *)link.node);
        if (link.is_pending)
          fprintf(f, "style=dashed ");
        if (link.tree && link.tree->extra)
          fprintf(f, "fontcolor=gray ");

        if (!link.tree) {
          fprintf(f, "color=red");
        } else if (link.tree->symbol == ts_builtin_sym_error) {
          fprintf(f, "label=\"ERROR\"");
        } else {
          fprintf(f, "label=\"");
          const char *name = symbol_names[link.tree->symbol];
          /* Escape quotes and backslashes so the label stays a valid
           * quoted string. */
          for (const char *c = name; *c; c++) {
            if (*c == '\"' || *c == '\\')
              fprintf(f, "\\");
            fprintf(f, "%c", *c);
          }
          fprintf(f, "\"");
        }
        fprintf(f, "];\n");

        if (j == 0) {
          /* The current path continues along the first link. */
          self->pop_paths.contents[i].node = link.node;
        } else {
          /* Every further link starts a new path. Build it by value first:
           * array_push may move the array's storage. */
          PopPath next_path = self->pop_paths.contents[i];
          next_path.node = link.node;
          if (!array_push(&self->pop_paths, next_path))
            goto error;
        }
      }

      if (!array_push(&visited_nodes, node))
        goto error;
    }
  }

  fprintf(f, "}\n");

  array_delete(&visited_nodes);
  ts_toggle_allocation_recording(was_recording_allocations);
  return true;

error:
  if (visited_nodes.contents)
    array_delete(&visited_nodes);
  ts_toggle_allocation_recording(was_recording_allocations);
  return false;
}