#ifndef TREE_SITTER_PARSER_H_ #define TREE_SITTER_PARSER_H_ #ifdef __cplusplus extern "C" { #endif #include #include #include "tree_sitter/runtime.h" #define ts_lex_state_error 0 #define TS_DEBUG_BUFFER_SIZE 512 typedef struct TSTree TSTree; typedef unsigned short TSStateId; typedef struct { size_t bytes; size_t chars; size_t rows; size_t columns; } TSLength; typedef struct { bool visible : 1; bool named : 1; bool extra : 1; bool structural : 1; } TSSymbolMetadata; typedef struct TSLexer { void (*start_fn)(struct TSLexer *, TSStateId); void (*start_token_fn)(struct TSLexer *); bool (*advance_fn)(struct TSLexer *, TSStateId); TSTree *(*accept_fn)(struct TSLexer *, TSSymbol, TSSymbolMetadata, const char *, bool fragile); const char *chunk; size_t chunk_start; size_t chunk_size; TSLength current_position; TSLength token_end_position; TSLength token_start_position; size_t lookahead_size; int32_t lookahead; TSInput input; TSDebugger debugger; char debug_buffer[TS_DEBUG_BUFFER_SIZE]; } TSLexer; typedef enum { TSParseActionTypeError = 1, TSParseActionTypeShift, TSParseActionTypeReduce, TSParseActionTypeAccept, } TSParseActionType; typedef struct { union { TSStateId to_state; struct { TSSymbol symbol; unsigned short child_count; }; } data; TSParseActionType type : 3; bool extra : 1; bool fragile : 1; bool can_hide_split : 1; } TSParseAction; struct TSLanguage { size_t symbol_count; const char **symbol_names; const TSSymbolMetadata *symbol_metadata; const TSParseAction **parse_table; const TSStateId *lex_states; TSTree *(*lex_fn)(TSLexer *, TSStateId); }; /* * Lexer Macros */ #define START_LEXER() \ const bool error_mode = (lex_state == ts_lex_state_error); \ lexer->start_fn(lexer, lex_state); \ int32_t lookahead; \ next_state: \ lookahead = lexer->lookahead; #define START_TOKEN() lexer->start_token_fn(lexer); #define GO_TO_STATE(state_index) \ { \ lex_state = state_index; \ goto next_state; \ } #define ADVANCE(state_index) \ { \ lexer->advance_fn(lexer, state_index); \ GO_TO_STATE(state_index); \ } #define ACCEPT_FRAGILE_TOKEN(symbol) \ return lexer->accept_fn(lexer, symbol, ts_symbol_metadata[symbol], \ ts_symbol_names[symbol], true); #define ACCEPT_TOKEN(symbol) \ return lexer->accept_fn(lexer, symbol, ts_symbol_metadata[symbol], \ ts_symbol_names[symbol], false); #define LEX_ERROR() \ if (error_mode) { \ if (lex_state == ts_lex_state_error) \ ADVANCE(ts_lex_state_error) \ else \ GO_TO_STATE(ts_lex_state_error) \ } else { \ ACCEPT_TOKEN(ts_builtin_sym_error) \ } /* * Parse Table Macros */ #define ACTIONS(...) \ (TSParseAction[]) { \ __VA_ARGS__, { \ .type = 0 \ } \ } enum { FRAGILE = 1, CAN_HIDE_SPLIT = 2, }; #define SHIFT(to_state_value, flags) \ { \ .type = TSParseActionTypeShift, \ .can_hide_split = (flags & CAN_HIDE_SPLIT) != 0, \ .data = {.to_state = to_state_value } \ } #define SHIFT_EXTRA() \ { .type = TSParseActionTypeShift, .extra = true } #define REDUCE_EXTRA(symbol_val) \ { \ .type = TSParseActionTypeReduce, .extra = true, \ .data = {.symbol = symbol_val, .child_count = 1 } \ } #define REDUCE(symbol_val, child_count_val, flags) \ { \ .type = TSParseActionTypeReduce, .fragile = (flags & FRAGILE) != 0, \ .can_hide_split = (flags & CAN_HIDE_SPLIT) != 0, \ .data = {.symbol = symbol_val, .child_count = child_count_val } \ } #define ACCEPT_INPUT() \ { .type = TSParseActionTypeAccept } #define EXPORT_LANGUAGE(language_name) \ static TSLanguage language = { \ .symbol_count = SYMBOL_COUNT, \ .symbol_metadata = ts_symbol_metadata, \ .parse_table = (const TSParseAction **)ts_parse_actions, \ .lex_states = ts_lex_states, \ .symbol_names = ts_symbol_names, \ .lex_fn = ts_lex, \ }; \ \ const TSLanguage *language_name() { \ return &language; \ } #ifdef __cplusplus } #endif #endif // TREE_SITTER_PARSER_H_