1
0
Fork 0
mirror of https://github.com/pnx/tree-sitter-dotenv synced 2026-06-16 01:54:56 +02:00

Initial Commit

This commit is contained in:
Henrik Hautakoski 2024-12-10 19:51:21 +01:00
commit 948e93ffac
40 changed files with 2760 additions and 0 deletions

172
src/grammar.json generated Normal file
View file

@ -0,0 +1,172 @@
{
"name": "dotenv",
"rules": {
"document": {
"type": "REPEAT",
"content": {
"type": "CHOICE",
"members": [
{
"type": "SYMBOL",
"name": "comment"
},
{
"type": "SYMBOL",
"name": "assignment"
}
]
}
},
"assignment": {
"type": "SEQ",
"members": [
{
"type": "FIELD",
"name": "key",
"content": {
"type": "SYMBOL",
"name": "identifier"
}
},
{
"type": "STRING",
"value": "="
},
{
"type": "FIELD",
"name": "value",
"content": {
"type": "SYMBOL",
"name": "_value"
}
}
]
},
"comment": {
"type": "SEQ",
"members": [
{
"type": "STRING",
"value": "#"
},
{
"type": "PATTERN",
"value": ".*"
}
]
},
"identifier": {
"type": "TOKEN",
"content": {
"type": "PATTERN",
"value": "[A-Za-z_][A-Za-z0-9_]*"
}
},
"_value": {
"type": "CHOICE",
"members": [
{
"type": "SYMBOL",
"name": "string"
},
{
"type": "SYMBOL",
"name": "string_interpolation"
},
{
"type": "SYMBOL",
"name": "value"
},
{
"type": "ALIAS",
"content": {
"type": "SYMBOL",
"name": "_empty_value"
},
"named": true,
"value": "value"
}
]
},
"string": {
"type": "SEQ",
"members": [
{
"type": "STRING",
"value": "'"
},
{
"type": "SYMBOL",
"name": "string_content"
},
{
"type": "STRING",
"value": "'"
}
]
},
"string_interpolation": {
"type": "SEQ",
"members": [
{
"type": "STRING",
"value": "\""
},
{
"type": "ALIAS",
"content": {
"type": "SYMBOL",
"name": "string_interpolation_content"
},
"named": true,
"value": "string_content"
},
{
"type": "STRING",
"value": "\""
}
]
},
"string_content": {
"type": "TOKEN",
"content": {
"type": "PATTERN",
"value": "[^']*"
}
},
"string_interpolation_content": {
"type": "TOKEN",
"content": {
"type": "PATTERN",
"value": "[^\"]*"
}
},
"value": {
"type": "TOKEN",
"content": {
"type": "PREC",
"value": -1,
"content": {
"type": "PATTERN",
"value": "[^\\#\\=\\s]+"
}
}
}
},
"extras": [
{
"type": "PATTERN",
"value": "\\s"
}
],
"conflicts": [],
"precedences": [],
"externals": [
{
"type": "SYMBOL",
"name": "_empty_value"
}
],
"inline": [],
"supertypes": []
}

118
src/node-types.json generated Normal file
View file

@ -0,0 +1,118 @@
[
{
"type": "assignment",
"named": true,
"fields": {
"key": {
"multiple": false,
"required": true,
"types": [
{
"type": "identifier",
"named": true
}
]
},
"value": {
"multiple": false,
"required": true,
"types": [
{
"type": "string",
"named": true
},
{
"type": "string_interpolation",
"named": true
},
{
"type": "value",
"named": true
}
]
}
}
},
{
"type": "comment",
"named": true,
"fields": {}
},
{
"type": "document",
"named": true,
"fields": {},
"children": {
"multiple": true,
"required": false,
"types": [
{
"type": "assignment",
"named": true
},
{
"type": "comment",
"named": true
}
]
}
},
{
"type": "string",
"named": true,
"fields": {},
"children": {
"multiple": false,
"required": true,
"types": [
{
"type": "string_content",
"named": true
}
]
}
},
{
"type": "string_interpolation",
"named": true,
"fields": {},
"children": {
"multiple": false,
"required": true,
"types": [
{
"type": "string_content",
"named": true
}
]
}
},
{
"type": "\"",
"named": false
},
{
"type": "#",
"named": false
},
{
"type": "'",
"named": false
},
{
"type": "=",
"named": false
},
{
"type": "identifier",
"named": true
},
{
"type": "string_content",
"named": true
},
{
"type": "value",
"named": true
}
]

547
src/parser.c generated Normal file
View file

@ -0,0 +1,547 @@
#include "tree_sitter/parser.h"
#if defined(__GNUC__) || defined(__clang__)
#pragma GCC diagnostic ignored "-Wmissing-field-initializers"
#endif
#define LANGUAGE_VERSION 14
#define STATE_COUNT 16
#define LARGE_STATE_COUNT 2
#define SYMBOL_COUNT 18
#define ALIAS_COUNT 0
#define TOKEN_COUNT 11
#define EXTERNAL_TOKEN_COUNT 1
#define FIELD_COUNT 2
#define MAX_ALIAS_SEQUENCE_LENGTH 3
#define PRODUCTION_ID_COUNT 2
// Numeric ids for every grammar symbol. Id 0 is ts_builtin_sym_end (defined in
// tree_sitter/parser.h). With TOKEN_COUNT == 11, ids 1-10 are tokens and
// ids 11-17 are non-terminals.
enum ts_symbol_identifiers {
// Tokens recognized by ts_lex.
anon_sym_EQ = 1,
anon_sym_POUND = 2,
aux_sym_comment_token1 = 3,
sym_identifier = 4,
anon_sym_SQUOTE = 5,
anon_sym_DQUOTE = 6,
sym_string_content = 7,
sym_string_interpolation_content = 8,
sym_value = 9,
// Token produced by the external scanner (see ts_external_scanner_symbol_map).
sym__empty_value = 10,
// Non-terminals.
sym_document = 11,
sym_assignment = 12,
sym_comment = 13,
sym__value = 14,
sym_string = 15,
sym_string_interpolation = 16,
aux_sym_document_repeat1 = 17,
};
static const char * const ts_symbol_names[] = {
[ts_builtin_sym_end] = "end",
[anon_sym_EQ] = "=",
[anon_sym_POUND] = "#",
[aux_sym_comment_token1] = "comment_token1",
[sym_identifier] = "identifier",
[anon_sym_SQUOTE] = "'",
[anon_sym_DQUOTE] = "\"",
[sym_string_content] = "string_content",
[sym_string_interpolation_content] = "string_content",
[sym_value] = "value",
[sym__empty_value] = "value",
[sym_document] = "document",
[sym_assignment] = "assignment",
[sym_comment] = "comment",
[sym__value] = "_value",
[sym_string] = "string",
[sym_string_interpolation] = "string_interpolation",
[aux_sym_document_repeat1] = "document_repeat1",
};
static const TSSymbol ts_symbol_map[] = {
[ts_builtin_sym_end] = ts_builtin_sym_end,
[anon_sym_EQ] = anon_sym_EQ,
[anon_sym_POUND] = anon_sym_POUND,
[aux_sym_comment_token1] = aux_sym_comment_token1,
[sym_identifier] = sym_identifier,
[anon_sym_SQUOTE] = anon_sym_SQUOTE,
[anon_sym_DQUOTE] = anon_sym_DQUOTE,
[sym_string_content] = sym_string_content,
[sym_string_interpolation_content] = sym_string_content,
[sym_value] = sym_value,
[sym__empty_value] = sym_value,
[sym_document] = sym_document,
[sym_assignment] = sym_assignment,
[sym_comment] = sym_comment,
[sym__value] = sym__value,
[sym_string] = sym_string,
[sym_string_interpolation] = sym_string_interpolation,
[aux_sym_document_repeat1] = aux_sym_document_repeat1,
};
static const TSSymbolMetadata ts_symbol_metadata[] = {
[ts_builtin_sym_end] = {
.visible = false,
.named = true,
},
[anon_sym_EQ] = {
.visible = true,
.named = false,
},
[anon_sym_POUND] = {
.visible = true,
.named = false,
},
[aux_sym_comment_token1] = {
.visible = false,
.named = false,
},
[sym_identifier] = {
.visible = true,
.named = true,
},
[anon_sym_SQUOTE] = {
.visible = true,
.named = false,
},
[anon_sym_DQUOTE] = {
.visible = true,
.named = false,
},
[sym_string_content] = {
.visible = true,
.named = true,
},
[sym_string_interpolation_content] = {
.visible = true,
.named = true,
},
[sym_value] = {
.visible = true,
.named = true,
},
[sym__empty_value] = {
.visible = true,
.named = true,
},
[sym_document] = {
.visible = true,
.named = true,
},
[sym_assignment] = {
.visible = true,
.named = true,
},
[sym_comment] = {
.visible = true,
.named = true,
},
[sym__value] = {
.visible = false,
.named = true,
},
[sym_string] = {
.visible = true,
.named = true,
},
[sym_string_interpolation] = {
.visible = true,
.named = true,
},
[aux_sym_document_repeat1] = {
.visible = false,
.named = false,
},
};
enum ts_field_identifiers {
field_key = 1,
field_value = 2,
};
static const char * const ts_field_names[] = {
[0] = NULL,
[field_key] = "key",
[field_value] = "value",
};
static const TSFieldMapSlice ts_field_map_slices[PRODUCTION_ID_COUNT] = {
[1] = {.index = 0, .length = 2},
};
static const TSFieldMapEntry ts_field_map_entries[] = {
[0] =
{field_key, 0},
{field_value, 2},
};
static const TSSymbol ts_alias_sequences[PRODUCTION_ID_COUNT][MAX_ALIAS_SEQUENCE_LENGTH] = {
[0] = {0},
};
static const uint16_t ts_non_terminal_alias_map[] = {
0,
};
static const TSStateId ts_primary_state_ids[STATE_COUNT] = {
[0] = 0,
[1] = 1,
[2] = 2,
[3] = 3,
[4] = 4,
[5] = 5,
[6] = 6,
[7] = 7,
[8] = 8,
[9] = 9,
[10] = 10,
[11] = 11,
[12] = 12,
[13] = 13,
[14] = 14,
[15] = 15,
};
// Generated lexer state machine for the dotenv grammar.
//
// Starting in lexer state `state`, consumes characters from `lexer` and returns
// true when a token was recognized (ACCEPT_TOKEN stores its symbol in
// lexer->result_symbol and marks the token end), or false otherwise.
//
// The START_LEXER / ADVANCE / SKIP / ACCEPT_TOKEN / END_STATE macros come from
// tree_sitter/parser.h. ADVANCE and SKIP jump back to the labels set up by
// START_LEXER, so `lookahead`, `eof` and the switch below are re-evaluated for
// every consumed character.
static bool ts_lex(TSLexer *lexer, TSStateId state) {
START_LEXER();
eof = lexer->eof(lexer);
switch (state) {
// State 0: general entry state. Dispatches on the first character of a quote,
// '#', '=', identifier or unquoted value; whitespace is skipped.
case 0:
if (eof) ADVANCE(3);
if (lookahead == '"') ADVANCE(10);
if (lookahead == '#') ADVANCE(5);
if (lookahead == '\'') ADVANCE(9);
if (lookahead == '=') ADVANCE(4);
if (('\t' <= lookahead && lookahead <= '\r') ||
lookahead == ' ') SKIP(0);
if (('A' <= lookahead && lookahead <= 'Z') ||
lookahead == '_' ||
('a' <= lookahead && lookahead <= 'z')) ADVANCE(8);
if (lookahead != 0) ADVANCE(15);
END_STATE();
// State 1: entry state used by parse state 2 (see ts_lex_modes), which is
// reached by shifting '='. Accepts an opening quote or the first character of
// an unquoted value.
case 1:
if (lookahead == '"') ADVANCE(10);
if (lookahead == '\'') ADVANCE(9);
if (('\t' <= lookahead && lookahead <= '\r') ||
lookahead == ' ') SKIP(1);
if (lookahead != 0 &&
lookahead != '"' &&
lookahead != '#' &&
lookahead != '=') ADVANCE(15);
END_STATE();
// State 2: entry state that only accepts end of input, '#' or the start of an
// identifier; whitespace is skipped.
case 2:
if (eof) ADVANCE(3);
if (lookahead == '#') ADVANCE(5);
if (('\t' <= lookahead && lookahead <= '\r') ||
lookahead == ' ') SKIP(2);
if (('A' <= lookahead && lookahead <= 'Z') ||
lookahead == '_' ||
('a' <= lookahead && lookahead <= 'z')) ADVANCE(8);
END_STATE();
// States 3-5: single-step accepting states for end of input, '=' and '#'.
case 3:
ACCEPT_TOKEN(ts_builtin_sym_end);
END_STATE();
case 4:
ACCEPT_TOKEN(anon_sym_EQ);
END_STATE();
case 5:
ACCEPT_TOKEN(anon_sym_POUND);
END_STATE();
// State 6: start of comment text. Whitespace other than '\n' keeps the lexer in
// this state; any other non-NUL character moves to state 7. A '\n' matches
// neither branch, so the (possibly empty) token ends there.
case 6:
ACCEPT_TOKEN(aux_sym_comment_token1);
if (lookahead == '\t' ||
(0x0b <= lookahead && lookahead <= '\r') ||
lookahead == ' ') ADVANCE(6);
if (lookahead != 0 &&
(lookahead < '\t' || '\r' < lookahead)) ADVANCE(7);
END_STATE();
// State 7: remainder of comment text, consumed up to (not including) '\n'.
case 7:
ACCEPT_TOKEN(aux_sym_comment_token1);
if (lookahead != 0 &&
lookahead != '\n') ADVANCE(7);
END_STATE();
// State 8: identifier continuation ([A-Za-z0-9_]).
case 8:
ACCEPT_TOKEN(sym_identifier);
if (('0' <= lookahead && lookahead <= '9') ||
('A' <= lookahead && lookahead <= 'Z') ||
lookahead == '_' ||
('a' <= lookahead && lookahead <= 'z')) ADVANCE(8);
END_STATE();
// States 9-10: single-step accepting states for the two quote characters.
case 9:
ACCEPT_TOKEN(anon_sym_SQUOTE);
END_STATE();
case 10:
ACCEPT_TOKEN(anon_sym_DQUOTE);
END_STATE();
// States 11-12: content of a single-quoted string; everything up to the next
// '\'' (or NUL) is consumed, including whitespace and newlines.
case 11:
ACCEPT_TOKEN(sym_string_content);
if (('\t' <= lookahead && lookahead <= '\r') ||
lookahead == ' ') ADVANCE(11);
if (lookahead != 0 &&
lookahead != '\'') ADVANCE(12);
END_STATE();
case 12:
ACCEPT_TOKEN(sym_string_content);
if (lookahead != 0 &&
lookahead != '\'') ADVANCE(12);
END_STATE();
// States 13-14: content of a double-quoted string; everything up to the next
// '"' (or NUL) is consumed, including whitespace and newlines.
case 13:
ACCEPT_TOKEN(sym_string_interpolation_content);
if (('\t' <= lookahead && lookahead <= '\r') ||
lookahead == ' ') ADVANCE(13);
if (lookahead != 0 &&
lookahead != '"') ADVANCE(14);
END_STATE();
case 14:
ACCEPT_TOKEN(sym_string_interpolation_content);
if (lookahead != 0 &&
lookahead != '"') ADVANCE(14);
END_STATE();
// State 15: unquoted value; stops at whitespace, '#', '=' or NUL.
case 15:
ACCEPT_TOKEN(sym_value);
if (lookahead != 0 &&
(lookahead < '\t' || '\r' < lookahead) &&
lookahead != ' ' &&
lookahead != '#' &&
lookahead != '=') ADVANCE(15);
END_STATE();
// Unknown lexer state: no token.
default:
return false;
}
}
// Per-parse-state lexing configuration, indexed by parse state id.
// `lex_state` names a `case` label of ts_lex. `external_lex_state` is left at 0
// for most states; the value 1 presumably selects row [1] of
// ts_external_scanner_states, where the external `_empty_value` token is
// enabled (NOTE(review): confirm against the tree-sitter runtime).
static const TSLexMode ts_lex_modes[STATE_COUNT] = {
[0] = {.lex_state = 0, .external_lex_state = 1},
[1] = {.lex_state = 2},
// Parse state 2 is entered by shifting '=', so a value is expected next.
[2] = {.lex_state = 1, .external_lex_state = 1},
[3] = {.lex_state = 2},
[4] = {.lex_state = 2},
[5] = {.lex_state = 2},
[6] = {.lex_state = 2},
[7] = {.lex_state = 2},
[8] = {.lex_state = 2},
// Parse state 9 is entered by shifting '#': lex the comment text.
[9] = {.lex_state = 6},
[10] = {.lex_state = 0},
[11] = {.lex_state = 0},
// Parse states 12 and 13 are entered by shifting a quote: lex string content.
[12] = {.lex_state = 11},
[13] = {.lex_state = 13},
[14] = {.lex_state = 0},
[15] = {.lex_state = 0},
};
static const uint16_t ts_parse_table[LARGE_STATE_COUNT][SYMBOL_COUNT] = {
[0] = {
[ts_builtin_sym_end] = ACTIONS(1),
[anon_sym_EQ] = ACTIONS(1),
[anon_sym_POUND] = ACTIONS(1),
[sym_identifier] = ACTIONS(1),
[anon_sym_SQUOTE] = ACTIONS(1),
[anon_sym_DQUOTE] = ACTIONS(1),
[sym_value] = ACTIONS(1),
[sym__empty_value] = ACTIONS(1),
},
[1] = {
[sym_document] = STATE(11),
[sym_assignment] = STATE(3),
[sym_comment] = STATE(3),
[aux_sym_document_repeat1] = STATE(3),
[ts_builtin_sym_end] = ACTIONS(3),
[anon_sym_POUND] = ACTIONS(5),
[sym_identifier] = ACTIONS(7),
},
};
static const uint16_t ts_small_parse_table[] = {
[0] = 5,
ACTIONS(9), 1,
anon_sym_SQUOTE,
ACTIONS(11), 1,
anon_sym_DQUOTE,
ACTIONS(13), 1,
sym_value,
ACTIONS(15), 1,
sym__empty_value,
STATE(6), 3,
sym__value,
sym_string,
sym_string_interpolation,
[18] = 4,
ACTIONS(5), 1,
anon_sym_POUND,
ACTIONS(7), 1,
sym_identifier,
ACTIONS(17), 1,
ts_builtin_sym_end,
STATE(4), 3,
sym_assignment,
sym_comment,
aux_sym_document_repeat1,
[33] = 4,
ACTIONS(19), 1,
ts_builtin_sym_end,
ACTIONS(21), 1,
anon_sym_POUND,
ACTIONS(24), 1,
sym_identifier,
STATE(4), 3,
sym_assignment,
sym_comment,
aux_sym_document_repeat1,
[48] = 1,
ACTIONS(27), 3,
ts_builtin_sym_end,
anon_sym_POUND,
sym_identifier,
[54] = 1,
ACTIONS(29), 3,
ts_builtin_sym_end,
anon_sym_POUND,
sym_identifier,
[60] = 1,
ACTIONS(31), 3,
ts_builtin_sym_end,
anon_sym_POUND,
sym_identifier,
[66] = 1,
ACTIONS(33), 3,
ts_builtin_sym_end,
anon_sym_POUND,
sym_identifier,
[72] = 1,
ACTIONS(35), 1,
aux_sym_comment_token1,
[76] = 1,
ACTIONS(37), 1,
anon_sym_EQ,
[80] = 1,
ACTIONS(39), 1,
ts_builtin_sym_end,
[84] = 1,
ACTIONS(41), 1,
sym_string_content,
[88] = 1,
ACTIONS(43), 1,
sym_string_interpolation_content,
[92] = 1,
ACTIONS(45), 1,
anon_sym_SQUOTE,
[96] = 1,
ACTIONS(47), 1,
anon_sym_DQUOTE,
};
static const uint32_t ts_small_parse_table_map[] = {
[SMALL_STATE(2)] = 0,
[SMALL_STATE(3)] = 18,
[SMALL_STATE(4)] = 33,
[SMALL_STATE(5)] = 48,
[SMALL_STATE(6)] = 54,
[SMALL_STATE(7)] = 60,
[SMALL_STATE(8)] = 66,
[SMALL_STATE(9)] = 72,
[SMALL_STATE(10)] = 76,
[SMALL_STATE(11)] = 80,
[SMALL_STATE(12)] = 84,
[SMALL_STATE(13)] = 88,
[SMALL_STATE(14)] = 92,
[SMALL_STATE(15)] = 96,
};
static const TSParseActionEntry ts_parse_actions[] = {
[0] = {.entry = {.count = 0, .reusable = false}},
[1] = {.entry = {.count = 1, .reusable = false}}, RECOVER(),
[3] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_document, 0, 0, 0),
[5] = {.entry = {.count = 1, .reusable = true}}, SHIFT(9),
[7] = {.entry = {.count = 1, .reusable = true}}, SHIFT(10),
[9] = {.entry = {.count = 1, .reusable = true}}, SHIFT(12),
[11] = {.entry = {.count = 1, .reusable = true}}, SHIFT(13),
[13] = {.entry = {.count = 1, .reusable = false}}, SHIFT(6),
[15] = {.entry = {.count = 1, .reusable = true}}, SHIFT(6),
[17] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_document, 1, 0, 0),
[19] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_document_repeat1, 2, 0, 0),
[21] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_document_repeat1, 2, 0, 0), SHIFT_REPEAT(9),
[24] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_document_repeat1, 2, 0, 0), SHIFT_REPEAT(10),
[27] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_comment, 2, 0, 0),
[29] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_assignment, 3, 0, 1),
[31] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_string, 3, 0, 0),
[33] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_string_interpolation, 3, 0, 0),
[35] = {.entry = {.count = 1, .reusable = true}}, SHIFT(5),
[37] = {.entry = {.count = 1, .reusable = true}}, SHIFT(2),
[39] = {.entry = {.count = 1, .reusable = true}}, ACCEPT_INPUT(),
[41] = {.entry = {.count = 1, .reusable = true}}, SHIFT(14),
[43] = {.entry = {.count = 1, .reusable = true}}, SHIFT(15),
[45] = {.entry = {.count = 1, .reusable = true}}, SHIFT(7),
[47] = {.entry = {.count = 1, .reusable = true}}, SHIFT(8),
};
enum ts_external_scanner_symbol_identifiers {
ts_external_token__empty_value = 0,
};
static const TSSymbol ts_external_scanner_symbol_map[EXTERNAL_TOKEN_COUNT] = {
[ts_external_token__empty_value] = sym__empty_value,
};
static const bool ts_external_scanner_states[2][EXTERNAL_TOKEN_COUNT] = {
[1] = {
[ts_external_token__empty_value] = true,
},
};
#ifdef __cplusplus
extern "C" {
#endif
void *tree_sitter_dotenv_external_scanner_create(void);
void tree_sitter_dotenv_external_scanner_destroy(void *);
bool tree_sitter_dotenv_external_scanner_scan(void *, TSLexer *, const bool *);
unsigned tree_sitter_dotenv_external_scanner_serialize(void *, char *);
void tree_sitter_dotenv_external_scanner_deserialize(void *, const char *, unsigned);
#ifdef TREE_SITTER_HIDE_SYMBOLS
#define TS_PUBLIC
#elif defined(_WIN32)
#define TS_PUBLIC __declspec(dllexport)
#else
#define TS_PUBLIC __attribute__((visibility("default")))
#endif
// Public entry point of the generated parser.
//
// Returns a pointer to a function-local `static const` TSLanguage that wires
// together the generated tables, the ts_lex function and the external scanner
// callbacks for the dotenv grammar. The same address is returned on every call.
TS_PUBLIC const TSLanguage *tree_sitter_dotenv(void) {
static const TSLanguage language = {
.version = LANGUAGE_VERSION,
.symbol_count = SYMBOL_COUNT,
.alias_count = ALIAS_COUNT,
.token_count = TOKEN_COUNT,
.external_token_count = EXTERNAL_TOKEN_COUNT,
.state_count = STATE_COUNT,
.large_state_count = LARGE_STATE_COUNT,
.production_id_count = PRODUCTION_ID_COUNT,
.field_count = FIELD_COUNT,
.max_alias_sequence_length = MAX_ALIAS_SEQUENCE_LENGTH,
.parse_table = &ts_parse_table[0][0],
.small_parse_table = ts_small_parse_table,
.small_parse_table_map = ts_small_parse_table_map,
.parse_actions = ts_parse_actions,
.symbol_names = ts_symbol_names,
.field_names = ts_field_names,
.field_map_slices = ts_field_map_slices,
.field_map_entries = ts_field_map_entries,
.symbol_metadata = ts_symbol_metadata,
.public_symbol_map = ts_symbol_map,
.alias_map = ts_non_terminal_alias_map,
.alias_sequences = &ts_alias_sequences[0][0],
.lex_modes = ts_lex_modes,
.lex_fn = ts_lex,
// Positional initializers, in the member order of TSLanguage.external_scanner:
// states, symbol_map, create, destroy, scan, serialize, deserialize.
.external_scanner = {
&ts_external_scanner_states[0][0],
ts_external_scanner_symbol_map,
tree_sitter_dotenv_external_scanner_create,
tree_sitter_dotenv_external_scanner_destroy,
tree_sitter_dotenv_external_scanner_scan,
tree_sitter_dotenv_external_scanner_serialize,
tree_sitter_dotenv_external_scanner_deserialize,
},
.primary_state_ids = ts_primary_state_ids,
};
return &language;
}
#ifdef __cplusplus
}
#endif

45
src/scanner.c Normal file
View file

@ -0,0 +1,45 @@
#include "tree_sitter/parser.h"
#include "tree_sitter/alloc.h"
#include "tree_sitter/array.h"
// Tokens this external scanner can produce. The enumerator values index the
// `valid_symbols` array passed to the scan function and are written to
// `lexer->result_symbol`, so their order must match the grammar's `externals`
// list (which contains only `_empty_value`).
enum TokenType {
EMPTY_VALUE,
};
// Creates the scanner payload. This scanner keeps no state, so there is
// nothing to allocate and the payload is always NULL.
void *tree_sitter_dotenv_external_scanner_create(void) {
  void *no_state = NULL;
  return no_state;
}
// Releases the scanner payload. Nothing is done with `payload`: the matching
// create function never allocates.
void tree_sitter_dotenv_external_scanner_destroy(void *payload) {
  (void)payload;
}
// Serializes the scanner state into `buffer` and returns the number of bytes
// written. There is no state, so `buffer` is left untouched and 0 is returned.
unsigned tree_sitter_dotenv_external_scanner_serialize(void *payload, char *buffer) {
  (void)payload;
  (void)buffer;
  const unsigned bytes_written = 0;
  return bytes_written;
}
// Restores scanner state from `buffer`. The scanner is stateless, so all
// arguments are ignored.
void tree_sitter_dotenv_external_scanner_deserialize(void *payload, const char *buffer, unsigned length) {
  (void)payload;
  (void)buffer;
  (void)length;
}
// Consumes consecutive spaces and tabs at the lexer's current position.
// Each character is advanced over with the `skip` flag set, and the loop stops
// at the first character that is neither ' ' nor '\t' (newlines are not
// consumed).
//
// Declared `static` so this helper stays private to the scanner's translation
// unit: with external linkage, a generic name like this can clash with an
// identically named helper when several grammars are linked into one binary.
static void advanceWS(TSLexer *lexer) {
  while (lexer->lookahead == ' ' || lexer->lookahead == '\t') {
    lexer->advance(lexer, true);
  }
}
// External scanner entry point: recognizes the `_empty_value` token.
//
// When EMPTY_VALUE is acceptable, skips spaces/tabs and at most one '\r', then
// reports an EMPTY_VALUE token if the lexer is at end of input, at a '#', or at
// a '\n'. Every character consumed here is advanced over with the skip flag
// set. Returns false in all other cases.
bool tree_sitter_dotenv_external_scanner_scan(void *payload, TSLexer *lexer, const bool *valid_symbols) {
  (void)payload;

  if (!valid_symbols[EMPTY_VALUE]) {
    return false;
  }

  advanceWS(lexer);

  // Tolerate a carriage return in front of the line feed.
  if (lexer->lookahead == '\r') {
    lexer->advance(lexer, true);
  }

  bool value_is_absent = lexer->eof(lexer)
    || lexer->lookahead == '#'
    || lexer->lookahead == '\n';
  if (!value_is_absent) {
    return false;
  }

  lexer->result_symbol = EMPTY_VALUE;
  return true;
}

54
src/tree_sitter/alloc.h generated Normal file
View file

@ -0,0 +1,54 @@
#ifndef TREE_SITTER_ALLOC_H_
#define TREE_SITTER_ALLOC_H_
#ifdef __cplusplus
extern "C" {
#endif
#include <stdbool.h>
#include <stdio.h>
#include <stdlib.h>
// Allow clients to override allocation functions
#ifdef TREE_SITTER_REUSE_ALLOCATOR
extern void *(*ts_current_malloc)(size_t);
extern void *(*ts_current_calloc)(size_t, size_t);
extern void *(*ts_current_realloc)(void *, size_t);
extern void (*ts_current_free)(void *);
#ifndef ts_malloc
#define ts_malloc ts_current_malloc
#endif
#ifndef ts_calloc
#define ts_calloc ts_current_calloc
#endif
#ifndef ts_realloc
#define ts_realloc ts_current_realloc
#endif
#ifndef ts_free
#define ts_free ts_current_free
#endif
#else
#ifndef ts_malloc
#define ts_malloc malloc
#endif
#ifndef ts_calloc
#define ts_calloc calloc
#endif
#ifndef ts_realloc
#define ts_realloc realloc
#endif
#ifndef ts_free
#define ts_free free
#endif
#endif
#ifdef __cplusplus
}
#endif
#endif // TREE_SITTER_ALLOC_H_

290
src/tree_sitter/array.h generated Normal file
View file

@ -0,0 +1,290 @@
#ifndef TREE_SITTER_ARRAY_H_
#define TREE_SITTER_ARRAY_H_
#ifdef __cplusplus
extern "C" {
#endif
#include "./alloc.h"
#include <assert.h>
#include <stdbool.h>
#include <stdint.h>
#include <stdlib.h>
#include <string.h>
#ifdef _MSC_VER
#pragma warning(disable : 4101)
#elif defined(__GNUC__) || defined(__clang__)
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wunused-variable"
#endif
#define Array(T) \
struct { \
T *contents; \
uint32_t size; \
uint32_t capacity; \
}
/// Initialize an array.
#define array_init(self) \
((self)->size = 0, (self)->capacity = 0, (self)->contents = NULL)
/// Create an empty array.
#define array_new() \
{ NULL, 0, 0 }
/// Get a pointer to the element at a given `index` in the array.
#define array_get(self, _index) \
(assert((uint32_t)(_index) < (self)->size), &(self)->contents[_index])
/// Get a pointer to the first element in the array.
#define array_front(self) array_get(self, 0)
/// Get a pointer to the last element in the array.
#define array_back(self) array_get(self, (self)->size - 1)
/// Clear the array, setting its size to zero. Note that this does not free any
/// memory allocated for the array's contents.
#define array_clear(self) ((self)->size = 0)
/// Reserve `new_capacity` elements of space in the array. If `new_capacity` is
/// less than the array's current capacity, this function has no effect.
#define array_reserve(self, new_capacity) \
_array__reserve((Array *)(self), array_elem_size(self), new_capacity)
/// Free any memory allocated for this array. Note that this does not free any
/// memory allocated for the array's contents.
#define array_delete(self) _array__delete((Array *)(self))
/// Push a new `element` onto the end of the array.
#define array_push(self, element) \
(_array__grow((Array *)(self), 1, array_elem_size(self)), \
(self)->contents[(self)->size++] = (element))
/// Increase the array's size by `count` elements.
/// New elements are zero-initialized.
#define array_grow_by(self, count) \
do { \
if ((count) == 0) break; \
_array__grow((Array *)(self), count, array_elem_size(self)); \
memset((self)->contents + (self)->size, 0, (count) * array_elem_size(self)); \
(self)->size += (count); \
} while (0)
/// Append all elements from one array to the end of another.
#define array_push_all(self, other) \
array_extend((self), (other)->size, (other)->contents)
/// Append `count` elements to the end of the array, reading their values from the
/// `contents` pointer.
#define array_extend(self, count, contents) \
_array__splice( \
(Array *)(self), array_elem_size(self), (self)->size, \
0, count, contents \
)
/// Remove `old_count` elements from the array starting at the given `index`. At
/// the same index, insert `new_count` new elements, reading their values from the
/// `new_contents` pointer.
#define array_splice(self, _index, old_count, new_count, new_contents) \
_array__splice( \
(Array *)(self), array_elem_size(self), _index, \
old_count, new_count, new_contents \
)
/// Insert one `element` into the array at the given `index`.
#define array_insert(self, _index, element) \
_array__splice((Array *)(self), array_elem_size(self), _index, 0, 1, &(element))
/// Remove one element from the array at the given `index`.
#define array_erase(self, _index) \
_array__erase((Array *)(self), array_elem_size(self), _index)
/// Pop the last element off the array, returning the element by value.
#define array_pop(self) ((self)->contents[--(self)->size])
/// Assign the contents of one array to another, reallocating if necessary.
#define array_assign(self, other) \
_array__assign((Array *)(self), (const Array *)(other), array_elem_size(self))
/// Swap one array with another
#define array_swap(self, other) \
_array__swap((Array *)(self), (Array *)(other))
/// Get the size of the array contents
#define array_elem_size(self) (sizeof *(self)->contents)
/// Search a sorted array for a given `needle` value, using the given `compare`
/// callback to determine the order.
///
/// If an existing element is found to be equal to `needle`, then the `index`
/// out-parameter is set to the existing value's index, and the `exists`
/// out-parameter is set to true. Otherwise, `index` is set to an index where
/// `needle` should be inserted in order to preserve the sorting, and `exists`
/// is set to false.
#define array_search_sorted_with(self, compare, needle, _index, _exists) \
_array__search_sorted(self, 0, compare, , needle, _index, _exists)
/// Search a sorted array for a given `needle` value, using integer comparisons
/// of a given struct field (specified with a leading dot) to determine the order.
///
/// See also `array_search_sorted_with`.
#define array_search_sorted_by(self, field, needle, _index, _exists) \
_array__search_sorted(self, 0, _compare_int, field, needle, _index, _exists)
/// Insert a given `value` into a sorted array, using the given `compare`
/// callback to determine the order.
#define array_insert_sorted_with(self, compare, value) \
do { \
unsigned _index, _exists; \
array_search_sorted_with(self, compare, &(value), &_index, &_exists); \
if (!_exists) array_insert(self, _index, value); \
} while (0)
/// Insert a given `value` into a sorted array, using integer comparisons of
/// a given struct field (specified with a leading dot) to determine the order.
///
/// See also `array_search_sorted_by`.
#define array_insert_sorted_by(self, field, value) \
do { \
unsigned _index, _exists; \
array_search_sorted_by(self, field, (value) field, &_index, &_exists); \
if (!_exists) array_insert(self, _index, value); \
} while (0)
// Private
typedef Array(void) Array;
/// Implementation detail of `array_delete`; call that macro instead.
/// Frees the backing buffer, if there is one, and resets the array to the
/// empty state. An array without a buffer is left untouched.
static inline void _array__delete(Array *self) {
  if (self->contents == NULL) {
    return;
  }
  ts_free(self->contents);
  self->contents = NULL;
  self->capacity = 0;
  self->size = 0;
}
/// Implementation detail of `array_erase`; call that macro instead.
/// Removes the element at `index` by shifting every later element down one
/// slot, then shrinks the size by one. `index` must be in bounds (asserted).
static inline void _array__erase(Array *self, size_t element_size,
                                 uint32_t index) {
  assert(index < self->size);
  char *base = (char *)self->contents;
  char *hole = base + index * element_size;
  uint32_t tail_count = self->size - index - 1;
  memmove(hole, hole + element_size, tail_count * element_size);
  self->size -= 1;
}
/// Implementation detail of `array_reserve`; call that macro instead.
/// Ensures room for at least `new_capacity` elements of `element_size` bytes.
/// Does nothing when the current capacity is already sufficient; otherwise the
/// buffer is reallocated (or allocated for the first time) and the capacity
/// is updated.
static inline void _array__reserve(Array *self, size_t element_size, uint32_t new_capacity) {
  if (new_capacity <= self->capacity) {
    return;
  }
  size_t byte_count = new_capacity * element_size;
  if (self->contents == NULL) {
    self->contents = ts_malloc(byte_count);
  } else {
    self->contents = ts_realloc(self->contents, byte_count);
  }
  self->capacity = new_capacity;
}
/// This is not what you're looking for, see `array_assign`.
///
/// Makes `self` hold a copy of the elements of `other`: reserves room for
/// `other->size` elements of `element_size` bytes, sets the size, and copies
/// the element bytes across.
static inline void _array__assign(Array *self, const Array *other, size_t element_size) {
  _array__reserve(self, element_size, other->size);
  self->size = other->size;
  // When `other` is empty, both `contents` pointers may still be NULL. Passing
  // a null pointer to memcpy is undefined behaviour even for a zero length, so
  // only copy when there is something to copy.
  if (self->size > 0) {
    memcpy(self->contents, other->contents, self->size * element_size);
  }
}
/// Implementation detail of `array_swap`; call that macro instead.
/// Exchanges the buffer pointer, size and capacity of the two arrays. No
/// element data is copied.
static inline void _array__swap(Array *self, Array *other) {
  Array saved_self = *self;
  *self = *other;
  *other = saved_self;
}
/// Implementation detail of `array_push` / `array_grow_by`; call those instead.
/// Makes sure `count` more elements fit. When the current capacity is too
/// small it is doubled, raised to a minimum of 8, and raised further to the
/// required size if doubling is still not enough. The size is not changed.
static inline void _array__grow(Array *self, uint32_t count, size_t element_size) {
  uint32_t required = self->size + count;
  if (required <= self->capacity) {
    return;
  }
  uint32_t target = self->capacity * 2;
  if (target < 8) {
    target = 8;
  }
  if (target < required) {
    target = required;
  }
  _array__reserve(self, element_size, target);
}
/// Implementation detail of `array_splice` / `array_extend` / `array_insert`;
/// call those macros instead.
///
/// Replaces the `old_count` elements starting at `index` with `new_count`
/// elements. The new elements are copied from `elements`, or zero-filled when
/// `elements` is NULL. Elements after the replaced range are shifted to their
/// new position first. The replaced range must lie within the array (asserted).
static inline void _array__splice(Array *self, size_t element_size,
                                  uint32_t index, uint32_t old_count,
                                  uint32_t new_count, const void *elements) {
  uint32_t resulting_size = self->size + new_count - old_count;
  uint32_t removed_end = index + old_count;
  uint32_t inserted_end = index + new_count;
  assert(removed_end <= self->size);

  _array__reserve(self, element_size, resulting_size);

  char *base = (char *)self->contents;

  // Move the tail that follows the replaced range to where it must end up.
  if (self->size > removed_end) {
    uint32_t tail_count = self->size - removed_end;
    memmove(
      base + inserted_end * element_size,
      base + removed_end * element_size,
      tail_count * element_size
    );
  }

  // Fill the gap with the caller's data, or with zeroes if none was given.
  if (new_count > 0) {
    char *gap = base + index * element_size;
    if (elements == NULL) {
      memset(gap, 0, new_count * element_size);
    } else {
      memcpy(gap, elements, new_count * element_size);
    }
  }

  self->size = resulting_size;
}
/// A binary search routine, based on Rust's `std::slice::binary_search_by`.
/// This is not what you're looking for, see `array_search_sorted_with` or `array_search_sorted_by`.
#define _array__search_sorted(self, start, compare, suffix, needle, _index, _exists) \
do { \
*(_index) = start; \
*(_exists) = false; \
uint32_t size = (self)->size - *(_index); \
if (size == 0) break; \
int comparison; \
while (size > 1) { \
uint32_t half_size = size / 2; \
uint32_t mid_index = *(_index) + half_size; \
comparison = compare(&((self)->contents[mid_index] suffix), (needle)); \
if (comparison <= 0) *(_index) = mid_index; \
size -= half_size; \
} \
comparison = compare(&((self)->contents[*(_index)] suffix), (needle)); \
if (comparison == 0) *(_exists) = true; \
else if (comparison < 0) *(_index) += 1; \
} while (0)
/// Helper macro for the `_sorted_by` routines below. This takes the left (existing)
/// parameter by reference in order to work with the generic sorting function above.
#define _compare_int(a, b) ((int)*(a) - (int)(b))
#ifdef _MSC_VER
#pragma warning(default : 4101)
#elif defined(__GNUC__) || defined(__clang__)
#pragma GCC diagnostic pop
#endif
#ifdef __cplusplus
}
#endif
#endif // TREE_SITTER_ARRAY_H_

266
src/tree_sitter/parser.h generated Normal file
View file

@ -0,0 +1,266 @@
#ifndef TREE_SITTER_PARSER_H_
#define TREE_SITTER_PARSER_H_
#ifdef __cplusplus
extern "C" {
#endif
#include <stdbool.h>
#include <stdint.h>
#include <stdlib.h>
#define ts_builtin_sym_error ((TSSymbol)-1)
#define ts_builtin_sym_end 0
#define TREE_SITTER_SERIALIZATION_BUFFER_SIZE 1024
#ifndef TREE_SITTER_API_H_
typedef uint16_t TSStateId;
typedef uint16_t TSSymbol;
typedef uint16_t TSFieldId;
typedef struct TSLanguage TSLanguage;
#endif
typedef struct {
TSFieldId field_id;
uint8_t child_index;
bool inherited;
} TSFieldMapEntry;
typedef struct {
uint16_t index;
uint16_t length;
} TSFieldMapSlice;
typedef struct {
bool visible;
bool named;
bool supertype;
} TSSymbolMetadata;
typedef struct TSLexer TSLexer;
struct TSLexer {
int32_t lookahead;
TSSymbol result_symbol;
void (*advance)(TSLexer *, bool);
void (*mark_end)(TSLexer *);
uint32_t (*get_column)(TSLexer *);
bool (*is_at_included_range_start)(const TSLexer *);
bool (*eof)(const TSLexer *);
void (*log)(const TSLexer *, const char *, ...);
};
typedef enum {
TSParseActionTypeShift,
TSParseActionTypeReduce,
TSParseActionTypeAccept,
TSParseActionTypeRecover,
} TSParseActionType;
typedef union {
struct {
uint8_t type;
TSStateId state;
bool extra;
bool repetition;
} shift;
struct {
uint8_t type;
uint8_t child_count;
TSSymbol symbol;
int16_t dynamic_precedence;
uint16_t production_id;
} reduce;
uint8_t type;
} TSParseAction;
typedef struct {
uint16_t lex_state;
uint16_t external_lex_state;
} TSLexMode;
typedef union {
TSParseAction action;
struct {
uint8_t count;
bool reusable;
} entry;
} TSParseActionEntry;
typedef struct {
int32_t start;
int32_t end;
} TSCharacterRange;
struct TSLanguage {
uint32_t version;
uint32_t symbol_count;
uint32_t alias_count;
uint32_t token_count;
uint32_t external_token_count;
uint32_t state_count;
uint32_t large_state_count;
uint32_t production_id_count;
uint32_t field_count;
uint16_t max_alias_sequence_length;
const uint16_t *parse_table;
const uint16_t *small_parse_table;
const uint32_t *small_parse_table_map;
const TSParseActionEntry *parse_actions;
const char * const *symbol_names;
const char * const *field_names;
const TSFieldMapSlice *field_map_slices;
const TSFieldMapEntry *field_map_entries;
const TSSymbolMetadata *symbol_metadata;
const TSSymbol *public_symbol_map;
const uint16_t *alias_map;
const TSSymbol *alias_sequences;
const TSLexMode *lex_modes;
bool (*lex_fn)(TSLexer *, TSStateId);
bool (*keyword_lex_fn)(TSLexer *, TSStateId);
TSSymbol keyword_capture_token;
struct {
const bool *states;
const TSSymbol *symbol_map;
void *(*create)(void);
void (*destroy)(void *);
bool (*scan)(void *, TSLexer *, const bool *symbol_whitelist);
unsigned (*serialize)(void *, char *);
void (*deserialize)(void *, const char *, unsigned);
} external_scanner;
const TSStateId *primary_state_ids;
};
// Reports whether `lookahead` falls inside one of the `len` inclusive
// [start, end] ranges in `ranges`, using a binary search. The search assumes
// the ranges are sorted in ascending order and do not overlap.
//
// An empty set (`len == 0`) contains nothing; it is handled up front so that
// `ranges[0]` is never read when there are no entries.
static inline bool set_contains(TSCharacterRange *ranges, uint32_t len, int32_t lookahead) {
  if (len == 0) {
    return false;
  }
  uint32_t index = 0;
  uint32_t size = len - index;
  // Halve the candidate window until a single range remains.
  while (size > 1) {
    uint32_t half_size = size / 2;
    uint32_t mid_index = index + half_size;
    TSCharacterRange *range = &ranges[mid_index];
    if (lookahead >= range->start && lookahead <= range->end) {
      return true;
    } else if (lookahead > range->end) {
      index = mid_index;
    }
    size -= half_size;
  }
  // Final check against the one remaining candidate.
  TSCharacterRange *range = &ranges[index];
  return (lookahead >= range->start && lookahead <= range->end);
}
/*
* Lexer Macros
*/
#ifdef _MSC_VER
#define UNUSED __pragma(warning(suppress : 4101))
#else
#define UNUSED __attribute__((unused))
#endif
#define START_LEXER() \
bool result = false; \
bool skip = false; \
UNUSED \
bool eof = false; \
int32_t lookahead; \
goto start; \
next_state: \
lexer->advance(lexer, skip); \
start: \
skip = false; \
lookahead = lexer->lookahead;
#define ADVANCE(state_value) \
{ \
state = state_value; \
goto next_state; \
}
#define ADVANCE_MAP(...) \
{ \
static const uint16_t map[] = { __VA_ARGS__ }; \
for (uint32_t i = 0; i < sizeof(map) / sizeof(map[0]); i += 2) { \
if (map[i] == lookahead) { \
state = map[i + 1]; \
goto next_state; \
} \
} \
}
#define SKIP(state_value) \
{ \
skip = true; \
state = state_value; \
goto next_state; \
}
#define ACCEPT_TOKEN(symbol_value) \
result = true; \
lexer->result_symbol = symbol_value; \
lexer->mark_end(lexer);
#define END_STATE() return result;
/*
* Parse Table Macros
*/
#define SMALL_STATE(id) ((id) - LARGE_STATE_COUNT)
#define STATE(id) id
#define ACTIONS(id) id
#define SHIFT(state_value) \
{{ \
.shift = { \
.type = TSParseActionTypeShift, \
.state = (state_value) \
} \
}}
#define SHIFT_REPEAT(state_value) \
{{ \
.shift = { \
.type = TSParseActionTypeShift, \
.state = (state_value), \
.repetition = true \
} \
}}
#define SHIFT_EXTRA() \
{{ \
.shift = { \
.type = TSParseActionTypeShift, \
.extra = true \
} \
}}
#define REDUCE(symbol_name, children, precedence, prod_id) \
{{ \
.reduce = { \
.type = TSParseActionTypeReduce, \
.symbol = symbol_name, \
.child_count = children, \
.dynamic_precedence = precedence, \
.production_id = prod_id \
}, \
}}
#define RECOVER() \
{{ \
.type = TSParseActionTypeRecover \
}}
#define ACCEPT_INPUT() \
{{ \
.type = TSParseActionTypeAccept \
}}
#ifdef __cplusplus
}
#endif
#endif // TREE_SITTER_PARSER_H_