update: remove ts

2024-10-04 16:31:20 +02:00 · 2024-10-04 16:31:20 +02:00 · a35eafd84c
commit a35eafd84c
parent 142ac9c9e1
3 changed files with 0 additions and 1613 deletions
--- a/.tree-sitter-sh/grammar.js
+++ b/.tree-sitter-sh/grammar.js
@ -1,606 +0,0 @@
-/**
- * @file Bash grammar for tree-sitter
- * @author Max Brunsfeld <maxbrunsfeld@gmail.com>
- * @author Amaan Qureshi <amaanq12@gmail.com>
- * @license MIT
- */
-
-/// <reference types="tree-sitter-cli/dsl" />
-// @ts-check
-
-const SPECIAL_CHARACTERS = [
-	'|', '&', ';', '<', '>', '(', ')', '$', '`', '\\', '\"', '\'', ' ', '\t', '\n',
-]
-
-const PREC = {
-	UPDATE: 0,
-	ASSIGN: 1,
-	TERNARY: 2,
-	LOGICAL_OR: 3,
-	LOGICAL_AND: 4,
-	BITWISE_OR: 5,
-	BITWISE_XOR: 6,
-	BITWISE_AND: 7,
-	EQUALITY: 8,
-	COMPARE: 9,
-	TEST: 10,
-	UNARY: 11,
-	SHIFT: 12,
-	ADD: 13,
-	MULTIPLY: 14,
-	EXPONENT: 15,
-	NEGATE: 16,
-	PREFIX: 17,
-	POSTFIX: 18,
-};
-
-module.exports = grammar({
-	name: 'sh',
-
-	conflicts: $ => [
-		[$.command, $._variable_assignments],
-		[$.redirected_statement, $.command],
-		[$.redirected_statement, $.command_substitution],
-		[$._expansion_body, $._expansion_regex],
-		[$.pipeline],
-	],
-
-	inline: $ => [
-		$._statement,
-		$._literal,
-		$._terminated_statement,
-		$._primary_expression,
-		$._simple_variable_name,
-		$._multiline_variable_name,
-		$._special_variable_name,
-		$._statement_not_subshell,
-	],
-
-	externals: $ => [
-		$.file_descriptor,
-		$._empty_value,
-		$._concat,
-		$.variable_name,
-		$.regex,
-		$._expansion_word,
-		$.extglob_pattern,
-		$._bare_dollar,
-		$._immediate_double_hash,
-		//'<<',
-		/\n/,
-		'(',
-		$.__error_recovery,
-	],
-
-	extras: $ => [
-		$.comment,
-		/\s/,
-		/\\\r?\n/,
-		/\\( |\t|\v|\f)/,
-	],
-
-	word: $ => $.word,
-
-	rules: {
-		program: $ => optional($._statements),
-
-		_statements: $ => prec(1, seq(
-			repeat(seq(
-				field('stmt', $._statement),
-				field('term', $.terminator),
-			)),
-			field('stmt', $._statement),
-			field('term', optional($.terminator)),
-		)),
-
-		_terminated_statement: $ => repeat1(seq(
-			field('stmt', $._statement),
-			field('term', $.terminator)
-		)),
-
-		// Statements
-
-		_statement: $ => choice(
-			$._statement_not_subshell,
-			$.subshell,
-		),
-
-		_statement_not_subshell: $ => choice(
-			// $.case_statement,
-			$.command,
-			$.compound_statement,
-			// $.for_statement,
-			// $.function_definition,
-			// $.if_statement,
-			$.list,
-			$.negated_command,
-			$.pipeline,
-			$.redirected_statement,
-			$.variable_assignment,
-			$._variable_assignments,
-			// $.while_statement,
-		),
-
-		_statement_not_pipeline: $ => prec(1, choice(
-			// $.case_statement,
-			$.command,
-			$.compound_statement,
-			// $.for_statement,
-			// $.function_definition,
-			// $.if_statement,
-			$.list,
-			$.negated_command,
-			$.redirected_statement,
-			$.subshell,
-			$.variable_assignment,
-			$._variable_assignments,
-			// $.while_statement,
-		)),
-
-		redirected_statement: $ => prec.dynamic(-1, prec.right(-1, choice(
-			seq(
-				field('body', $._statement),
-				field('redr', repeat1(choice($.file_redirect, $.heredoc_redirect))),
-			),
-			field('redr', repeat1($.file_redirect)),
-		))),
-
-		/*
-		for_statement: $ => seq(
-			'for',
-			field('var', $._simple_variable_name),
-			optional(seq(
-				'in',
-				field('value', repeat1($._literal)),
-			)),
-			$.terminator,
-			field('body', $.do_group),
-		),
-
-		while_statement: $ => seq(
-			choice('while', 'until'),
-			field('cond', $._terminated_statement),
-			field('body', $.do_group),
-		),
-
-		do_group: $ => seq(
-			'do',
-			optional($._terminated_statement),
-			'done',
-		),
-
-		if_statement: $ => seq(
-			'if',
-			field('cond', $._terminated_statement),
-			'then',
-			field('body', optional($._terminated_statement)),
-			field('elif', repeat($.elif_clause)),
-			field('else', optional($.else_clause)),
-			'fi',
-		),
-
-		elif_clause: $ => seq(
-			'elif',
-			field('cond', $._terminated_statement),
-			'then',
-			field('body', optional($._terminated_statement)),
-		),
-
-		else_clause: $ => seq(
-			'else',
-			field('body', optional($._terminated_statement)),
-		),
-
-		case_statement: $ => seq(
-			'case',
-			field('value', $._literal),
-			optional($.terminator),
-			'in',
-			optional($.terminator),
-			optional(seq(
-				repeat(field('cases', $.case_item)),
-				field('cases', alias($._case_item_last, $.case_item))
-			)),
-			'esac',
-		),
-
-		_case_item_last: $ => seq(
-			optional('('),
-			field('value', choice($._literal, $._extglob_blob)),
-			repeat(seq('|', field('value', choice($._literal, $._extglob_blob)))),
-			')',
-			repeat('\n'),
-			choice(field('body', $._statements),),
-			optional(';;')
-		),
-
-		case_item: $ => seq(
-			optional('('),
-			field('value', choice($._literal, $._extglob_blob)),
-			repeat(seq('|', field('value', choice($._literal, $._extglob_blob)))),
-			')',
-			repeat('\n'),
-			choice(field('body', $._statements)),
-			';;'
-		),
-
-		function_definition: $ => prec.right(seq(
-			field('name', $.word),
-			'(', ')',
-			field('body', choice($.compound_statement, $.subshell, $.command, $.while_statement, $.if_statement, $.for_statement, $._variable_assignments, repeat1($.file_redirect))),
-		)),
-		*/
-
-		compound_statement: $ => seq('{', $._terminated_statement, '}'),
-		subshell: $ => seq('(', $._statements, ')'),
-
-		pipeline: $ => prec.right(seq(
-			$._statement_not_pipeline,
-			repeat1(seq('|', $._statement_not_pipeline)),
-		)),
-
-		list: $ => prec.left(-1, seq(
-			field('cmd', $._statement),
-			field('op', alias(choice('&&', '||'), $.operator)),
-			field('cmd', $._statement),
-		)),
-
-		// Commands
-
-		negated_command: $ => seq(
-			'!',
-			choice(
-				prec(2, $.command),
-				prec(1, $.variable_assignment),
-				$.subshell,
-			),
-		),
-
-		command: $ => prec.left(seq(
-			repeat(choice(
-				$.variable_assignment,
-				field('redr', $.file_redirect),
-			)),
-			field('name', $.command_name),
-			repeat(choice(
-				field('arg', $._literal),
-				field('arg', alias($._bare_dollar, $.word)),
-			)),
-		)),
-
-		command_name: $ => $._literal,
-
-		variable_assignment: $ => seq(
-			field('name', choice(
-				$.variable_name,
-			)),
-			'=',
-			field('value', choice(
-				$._literal,
-				$._empty_value,
-				alias($._comment_word, $.word),
-			)),
-		),
-
-		_variable_assignments: $ => seq($.variable_assignment, repeat1($.variable_assignment)),
-
-		file_redirect: $ => prec.left(seq(
-			field('op', alias(choice('<', '>', '>>'), $.operator)),
-			field('dest', repeat1($._literal)),
-		)),
-
-		heredoc_redirect: $ => seq(
-			field('op', alias('<<', $.operator)),
-			field('del', alias(/[\w\d\-\._]+/, $.heredoc_delimiter)),
-		),
-
-		// Literals
-
-		_literal: $ => choice($.concatenation, $._primary_expression),
-
-		_primary_expression: $ => choice(
-			$.word,
-			$.string,
-			$.raw_string,
-			$.number,
-			$.expansion,
-			$.simple_expansion,
-			$.command_substitution,
-			$.arithmetic_expansion,
-		),
-
-		arithmetic_expansion: $ => seq('$((', $._arithmetic_expression, '))'),
-
-		_arithmetic_expression: $ => prec(1, choice(
-			$.arithmetic_literal,
-			$.arithmetic_unary_expression,
-			$.arithmetic_ternary_expression,
-			$.arithmetic_binary_expression,
-			$.arithmetic_postfix_expression,
-			$.arithmetic_parenthesized_expression,
-		)),
-
-		arithmetic_literal: $ => prec(1, choice(
-			$.number,
-			$.simple_expansion,
-			$.expansion,
-			$._simple_variable_name,
-			$.variable_name,
-			$.string,
-		)),
-
-		arithmetic_binary_expression: $ => {
-
-			/** @type {[RuleOrLiteral, number][]} */
-			const table = [
-				[choice('+', '-'), PREC.ADD],
-				[choice('*', '/', '%'), PREC.MULTIPLY],
-			];
-
-			return choice(...table.map(([operator, precedence]) =>
-				prec.left(precedence, seq(
-					field('lhs', $._arithmetic_expression),
-					field('op', alias(operator, $.operator)),
-					field('rhs', $._arithmetic_expression),
-				))
-			));
-		},
-
-		arithmetic_ternary_expression: $ => prec.left(PREC.TERNARY, seq(
-			field('cond', $._arithmetic_expression),
-			'?',
-			field('then', $._arithmetic_expression),
-			':',
-			field('else', $._arithmetic_expression),
-		)),
-
-		arithmetic_unary_expression: $ => prec(PREC.UNARY, seq(
-			field('op', alias(tokenLiterals(1, '-', '+'), $.operator)),
-			$._arithmetic_expression,
-		)),
-
-		arithmetic_postfix_expression: $ => prec(PREC.POSTFIX, seq(
-			$._arithmetic_expression,
-			field('op', alias(choice('++', '--'), $.operator)),
-		)),
-
-		arithmetic_parenthesized_expression: $ => seq('(', $._arithmetic_expression, ')'),
-
-		concatenation: $ => prec(-1, seq(
-			$._primary_expression,
-			repeat1(seq(
-				choice($._concat, alias(/`\s*`/, '``')),
-				choice(
-					$._primary_expression,
-					alias($._comment_word, $.word),
-					alias($._bare_dollar, $.word),
-					alias(/`\s*`/, '``')
-				),
-			)),
-			optional(seq($._concat, alias('$', $.word))),
-		)),
-
-		string: $ => seq(
-			'"',
-			repeat(seq(
-				choice(
-					seq(optional('$'), $.string_content),
-					$.expansion,
-					$.simple_expansion,
-					$.command_substitution,
-					$.arithmetic_expansion,
-				),
-				optional($._concat),
-			)),
-			optional(alias('$', $.string_content)),
-			'"',
-		),
-
-		string_content: _ => token(prec(-1, /([^"`$\\\r\n]|\\(.|\r?\n))+/)),
-
-		raw_string: _ => /'[^']*'/,
-
-		number: _ => /[0-9]+/,
-
-		simple_expansion: $ => seq(
-			'$',
-			choice(
-				$._simple_variable_name,
-				$._multiline_variable_name,
-				$._special_variable_name,
-				$.variable_name,
-				alias('!', $.special_variable_name),
-				alias('#', $.special_variable_name),
-			),
-		),
-
-		expansion: $ => seq(
-			'${',
-			optional($._expansion_body),
-			'}',
-		),
-
-		_expansion_body: $ => seq(
-			field('len', optional(alias('#', $.operator))),
-			field('name', choice($.variable_name, $._simple_variable_name, $._special_variable_name)),
-			optional(choice($._expansion_expression, $._expansion_regex)),
-		),
-
-
-		_expansion_expression: $ => prec(1, seq(
-			field('op', alias(immediateLiterals(':-', '-', ':=', '=', ':?', '?', ':+', '+'), $.operator)),
-			field('args', optional(choice(
-				alias($._concatenation_in_expansion, $.concatenation),
-				alias(prec(1, $._word_no_brace), $.word2),
-				$.expansion,
-				$.raw_string,
-				$.string,
-			))),
-		)),
-
-		_expansion_regex: $ => seq(
-			field('op', alias(choice('#', $._immediate_double_hash, '%', '%%'), $.operator)),
-			field('args', repeat(choice(
-				$.raw_string,
-				$.regex,
-				$.string,
-				alias(')', $.regex),
-				alias(/\s+/, $.regex),
-			))),
-		),
-
-
-		_concatenation_in_expansion: $ => prec(-2, seq(
-			choice(
-				alias($._word_no_brace, $.word),
-				alias($._expansion_word, $.word),
-				$.variable_name,
-				$.simple_expansion,
-				$.expansion,
-				$.string,
-				$.raw_string,
-				$.command_substitution,
-			),
-			repeat1(seq(
-				choice($._concat, alias(/`\s*`/, '``')),
-				choice(
-					alias($._word_no_brace, $.word),
-					alias($._expansion_word, $.word),
-					$.variable_name,
-					$.simple_expansion,
-					$.expansion,
-					$.string,
-					$.raw_string,
-					$.command_substitution,
-				),
-			)),
-		)),
-
-		command_substitution: $ => choice(
-			seq('$(', $._statements, ')'),
-			seq('$(', field('redr', $.file_redirect), ')'),
-			prec(1, seq('`', $._statements, '`')),
-		),
-
-		_extglob_blob: $ => choice(
-			$.extglob_pattern,
-			seq(
-				$.extglob_pattern,
-				choice($.string, $.expansion, $.command_substitution),
-				optional($.extglob_pattern),
-			),
-		),
-
-		comment: _ => token(prec(-10, /#.*/)),
-
-		_comment_word: _ => token(prec(-8, seq(
-			choice(
-				noneOf(...SPECIAL_CHARACTERS),
-				seq('\\', noneOf('\\s')),
-			),
-			repeat(choice(
-				noneOf(...SPECIAL_CHARACTERS),
-				seq('\\', noneOf('\\s')),
-				'\\ ',
-			)),
-		))),
-
-		_simple_variable_name: $ => alias(/\w+/, $.variable_name),
-		_multiline_variable_name: $ => alias(
-			token(prec(-1, /(\w|\\\r?\n)+/)),
-			$.variable_name,
-		),
-
-		_special_variable_name: $ => alias(choice('*', '@', '?', '!', '#', '-', '$', '0'), $.special_variable_name),
-
-		word: _ => token(seq(
-			choice(
-				noneOf('#', ...SPECIAL_CHARACTERS),
-				seq('\\', noneOf('\\s')),
-			),
-			repeat(choice(
-				noneOf(...SPECIAL_CHARACTERS),
-				seq('\\', noneOf('\\s')),
-				'\\ ',
-			)),
-		)),
-
-
-		_word_no_brace: _ => prec(2, token(seq(
-			choice(
-				noneOf('#', '{', '}', ...SPECIAL_CHARACTERS),
-				seq('\\', noneOf('\\s')),
-			),
-			repeat(choice(
-				noneOf('{', '}', ...SPECIAL_CHARACTERS),
-				seq('\\', noneOf('\\s')),
-				'\\ ',
-			)),
-		))),
-		terminator: _ => choice(';', ';;', /\n/),
-	},
-});
-
-/**
- * Returns a regular expression that matches any character except the ones
- * provided.
- *
- * @param  {...string} characters
- *
- * @return {RegExp}
- *
- */
-function noneOf(...characters) {
-	const negatedString = characters.map(c => c == '\\' ? '\\\\' : c).join('');
-	return new RegExp('[^' + negatedString + ']');
-}
-
-/**
- * Creates a rule to optionally match one or more of the rules separated by a comma
- *
- * @param {RuleOrLiteral} rule
- *
- * @return {ChoiceRule}
- *
- */
-function commaSep(rule) {
-	return optional(commaSep1(rule));
-}
-
-/**
- * Creates a rule to match one or more of the rules separated by a comma
- *
- * @param {RuleOrLiteral} rule
- *
- * @return {SeqRule}
- *
- */
-function commaSep1(rule) {
-	return seq(rule, repeat(seq(',', rule)));
-}
-
-/**
- *
- * Turns a list of rules into a choice of immediate rule
- *
- * @param {(RegExp|String)[]} literals
- *
- * @return {ChoiceRule}
- */
-function immediateLiterals(...literals) {
-	return choice(...literals.map(l => token.immediate(l)));
-}
-
-/**
- *
- * Turns a list of rules into a choice of aliased token rules
- *
- * @param {number} precedence
- *
- * @param {(RegExp|String)[]} literals
- *
- * @return {ChoiceRule}
- */
-function tokenLiterals(precedence, ...literals) {
-	return choice(...literals.map(l => token(prec(precedence, l))));
-}
--- a/.tree-sitter-sh/package.json
+++ b/.tree-sitter-sh/package.json
@ -1,53 +0,0 @@
-{
-  "name": "tree-sitter-bash",
-  "version": "0.0.1",
-  "description": "Bash grammar for tree-sitter",
-  "repository": "github:tree-sitter/tree-sitter-bash",
-  "license": "MIT",
-  "main": "bindings/node",
-  "types": "bindings/node",
-  "keywords": [
-    "incremental",
-    "parsing",
-    "tree-sitter",
-    "bash"
-  ],
-  "files": [
-    "grammar.js",
-    "binding.gyp",
-    "prebuilds/**",
-    "bindings/node/*",
-    "queries/*",
-    "src/**"
-  ],
-  "dependencies": {
-    "node-addon-api": "^7.1.0",
-    "node-gyp-build": "^4.8.0"
-  },
-  "devDependencies": {
-    "prebuildify": "^6.0.0",
-    "tree-sitter-cli": "^0.22.6"
-  },
-  "peerDependencies": {
-    "tree-sitter": "^0.21.0"
-  },
-  "peerDependenciesMeta": {
-    "tree-sitter": {
-      "optional": true
-    }
-  },
-  "scripts": {
-    "install": "node-gyp-build",
-    "prebuildify": "prebuildify --napi --strip",
-    "build": "tree-sitter generate --no-bindings",
-    "build-wasm": "tree-sitter build --wasm",
-    "test": "tree-sitter test",
-    "parse": "tree-sitter parse"
-  },
-  "tree-sitter": [
-    {
-      "scope": "source.bash",
-      "injection-regex": "^bash$"
-    }
-  ]
-}
--- a/.tree-sitter-sh/src/scanner.c
+++ b/.tree-sitter-sh/src/scanner.c
@ -1,954 +0,0 @@
-#include "tree_sitter/alloc.h"
-#include "tree_sitter/array.h"
-#include "tree_sitter/parser.h"
-
-#include <assert.h>
-#include <ctype.h>
-#include <string.h>
-#include <wctype.h>
-
-enum TokenType
-{
-	FILE_DESCRIPTOR,
-	EMPTY_VALUE,
-	CONCAT,
-	VARIABLE_NAME,
-	REGEX,
-	EXPANSION_WORD,
-	EXTGLOB_PATTERN,
-	BARE_DOLLAR,
-	IMMEDIATE_DOUBLE_HASH,
-	// HEREDOC_ARROW,
-	// HEREDOC_ARROW_DASH,
-	NEWLINE,
-	OPENING_PAREN,
-	ERROR_RECOVERY,
-};
-
-typedef Array(char) String;
-
-typedef struct Heredoc
-{
-	bool   is_raw;
-	bool   started;
-	bool   allows_indent;
-	String delimiter;
-	String current_leading_word;
-} Heredoc;
-
-#define heredoc_new()                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                          \
-	{                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                          \
-		.is_raw = false,                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                       \
-		.started = false,                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                      \
-		.allows_indent = false,                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                \
-		.delimiter = array_new(),                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                              \
-		.current_leading_word = array_new(),                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                   \
-	};
-
-typedef struct Scanner
-{
-	uint8_t last_glob_paren_depth;
-	bool	ext_was_in_double_quote;
-	bool	ext_saw_outside_quote;
-	Array(Heredoc) heredocs;
-} Scanner;
-
-static inline void advance(TSLexer *lexer)
-{
-	lexer->advance(lexer, false);
-}
-
-static inline void skip(TSLexer *lexer)
-{
-	lexer->advance(lexer, true);
-}
-
-static inline bool in_error_recovery(const bool *valid_symbols)
-{
-	return valid_symbols[ERROR_RECOVERY];
-}
-
-static inline void reset_string(String *string)
-{
-	if (string->size > 0)
-	{
-		memset(string->contents, 0, string->size);
-		array_clear(string);
-	}
-}
-
-static inline void reset_heredoc(Heredoc *heredoc)
-{
-	heredoc->is_raw = false;
-	heredoc->started = false;
-	heredoc->allows_indent = false;
-	reset_string(&heredoc->delimiter);
-}
-
-static inline void reset(Scanner *scanner)
-{
-	for (uint32_t i = 0; i < scanner->heredocs.size; i++)
-	{
-		reset_heredoc(array_get(&scanner->heredocs, i));
-	}
-}
-
-static unsigned serialize(Scanner *scanner, char *buffer)
-{
-	uint32_t size = 0;
-
-	buffer[size++] = (char)scanner->last_glob_paren_depth;
-	buffer[size++] = (char)scanner->ext_was_in_double_quote;
-	buffer[size++] = (char)scanner->ext_saw_outside_quote;
-	buffer[size++] = (char)scanner->heredocs.size;
-
-	for (uint32_t i = 0; i < scanner->heredocs.size; i++)
-	{
-		Heredoc *heredoc = array_get(&scanner->heredocs, i);
-		if (heredoc->delimiter.size + 3 + size >= TREE_SITTER_SERIALIZATION_BUFFER_SIZE)
-		{
-			return 0;
-		}
-
-		buffer[size++] = (char)heredoc->is_raw;
-		buffer[size++] = (char)heredoc->started;
-		buffer[size++] = (char)heredoc->allows_indent;
-
-		memcpy(&buffer[size], &heredoc->delimiter.size, sizeof(uint32_t));
-		size += sizeof(uint32_t);
-		if (heredoc->delimiter.size > 0)
-		{
-			memcpy(&buffer[size], heredoc->delimiter.contents, heredoc->delimiter.size);
-			size += heredoc->delimiter.size;
-		}
-	}
-	return size;
-}
-
-static void deserialize(Scanner *scanner, const char *buffer, unsigned length)
-{
-	if (length == 0)
-	{
-		reset(scanner);
-	}
-	else
-	{
-		uint32_t size = 0;
-		scanner->last_glob_paren_depth = buffer[size++];
-		scanner->ext_was_in_double_quote = buffer[size++];
-		scanner->ext_saw_outside_quote = buffer[size++];
-		uint32_t heredoc_count = (unsigned char)buffer[size++];
-		for (uint32_t i = 0; i < heredoc_count; i++)
-		{
-			Heredoc *heredoc = NULL;
-			if (i < scanner->heredocs.size)
-			{
-				heredoc = array_get(&scanner->heredocs, i);
-			}
-			else
-			{
-				Heredoc new_heredoc = heredoc_new();
-				array_push(&scanner->heredocs, new_heredoc);
-				heredoc = array_back(&scanner->heredocs);
-			}
-
-			heredoc->is_raw = buffer[size++];
-			heredoc->started = buffer[size++];
-			heredoc->allows_indent = buffer[size++];
-
-			memcpy(&heredoc->delimiter.size, &buffer[size], sizeof(uint32_t));
-			size += sizeof(uint32_t);
-			array_reserve(&heredoc->delimiter, heredoc->delimiter.size);
-
-			if (heredoc->delimiter.size > 0)
-			{
-				memcpy(heredoc->delimiter.contents, &buffer[size], heredoc->delimiter.size);
-				size += heredoc->delimiter.size;
-			}
-		}
-		assert(size == length);
-	}
-}
-
-/**
- * Consume a "word" in POSIX parlance, and returns it unquoted.
- *
- * This is an approximate implementation that doesn't deal with any
- * POSIX-mandated substitution, and assumes the default value for
- * IFS.
- */
-static bool advance_word(TSLexer *lexer, String *unquoted_word)
-{
-	bool	empty = true;
-	int32_t quote = 0;
-
-	if (lexer->lookahead == '\'' || lexer->lookahead == '"')
-	{
-		quote = lexer->lookahead;
-		advance(lexer);
-	}
-
-	while (lexer->lookahead && !(quote ? lexer->lookahead == quote || lexer->lookahead == '\r' || lexer->lookahead == '\n' : iswspace(lexer->lookahead)))
-	{
-		if (lexer->lookahead == '\\')
-		{
-			advance(lexer);
-			if (!lexer->lookahead)
-				return false;
-		}
-		empty = false;
-		array_push(unquoted_word, lexer->lookahead);
-		advance(lexer);
-	}
-	array_push(unquoted_word, '\0');
-
-	if (quote && lexer->lookahead == quote)
-		advance(lexer);
-
-	return !empty;
-}
-
-static inline bool scan_bare_dollar(TSLexer *lexer)
-{
-	while (iswspace(lexer->lookahead) && lexer->lookahead != '\n' && !lexer->eof(lexer))
-		skip(lexer);
-
-	if (lexer->lookahead == '$')
-	{
-		advance(lexer);
-		lexer->result_symbol = BARE_DOLLAR;
-		lexer->mark_end(lexer);
-		return (iswspace(lexer->lookahead) || lexer->eof(lexer) || lexer->lookahead == '\"');
-	}
-
-	return false;
-}
-
-static bool scan(Scanner *scanner, TSLexer *lexer, const bool *valid_symbols)
-{
-	if (valid_symbols[CONCAT] && !in_error_recovery(valid_symbols))
-	{
-		if (!(lexer->lookahead == 0 || iswspace(lexer->lookahead) || lexer->lookahead == '>' || lexer->lookahead == '<' || lexer->lookahead == ')' || lexer->lookahead == '(' || lexer->lookahead == ';' || lexer->lookahead == '&' || lexer->lookahead == '|' || lexer->lookahead == '{' || lexer->lookahead == '}'))
-		{
-			lexer->result_symbol = CONCAT;
-			// So for a`b`, we want to return a concat. We check if the
-			// 2nd backtick has whitespace after it, and if it does we
-			// return concat.
-			if (lexer->lookahead == '`')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				while (lexer->lookahead != '`' && !lexer->eof(lexer))
-				{
-					advance(lexer);
-				}
-				if (lexer->eof(lexer))
-				{
-					return false;
-				}
-				if (lexer->lookahead == '`')
-				{
-					advance(lexer);
-				}
-				return iswspace(lexer->lookahead) || lexer->eof(lexer);
-			}
-			// strings w/ expansions that contains escaped quotes or
-			// backslashes need this to return a concat
-			if (lexer->lookahead == '\\')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				if (lexer->lookahead == '"' || lexer->lookahead == '\'' || lexer->lookahead == '\\')
-				{
-					return true;
-				}
-				if (lexer->eof(lexer))
-				{
-					return false;
-				}
-			}
-			else
-			{
-				return true;
-			}
-		}
-	}
-
-	if (valid_symbols[IMMEDIATE_DOUBLE_HASH] && !in_error_recovery(valid_symbols))
-	{
-		// advance two # and ensure not } after
-		if (lexer->lookahead == '#')
-		{
-			lexer->mark_end(lexer);
-			advance(lexer);
-			if (lexer->lookahead == '#')
-			{
-				advance(lexer);
-				if (lexer->lookahead != '}')
-				{
-					lexer->result_symbol = IMMEDIATE_DOUBLE_HASH;
-					lexer->mark_end(lexer);
-					return true;
-				}
-			}
-		}
-	}
-
-	if (valid_symbols[EMPTY_VALUE])
-	{
-		if (iswspace(lexer->lookahead) || lexer->eof(lexer) || lexer->lookahead == ';' || lexer->lookahead == '&')
-		{
-			lexer->result_symbol = EMPTY_VALUE;
-			return true;
-		}
-	}
-
-	if ((valid_symbols[VARIABLE_NAME] || valid_symbols[FILE_DESCRIPTOR]) && !in_error_recovery(valid_symbols))
-	{
-		for (;;)
-		{
-			if ((lexer->lookahead == ' ' || lexer->lookahead == '\t' || lexer->lookahead == '\r' || (lexer->lookahead == '\n' && !valid_symbols[NEWLINE])) && !valid_symbols[EXPANSION_WORD])
-			{
-				skip(lexer);
-			}
-			else if (lexer->lookahead == '\\')
-			{
-				skip(lexer);
-
-				if (lexer->eof(lexer))
-				{
-					lexer->mark_end(lexer);
-					lexer->result_symbol = VARIABLE_NAME;
-					return true;
-				}
-
-				if (lexer->lookahead == '\r')
-				{
-					skip(lexer);
-				}
-				if (lexer->lookahead == '\n')
-				{
-					skip(lexer);
-				}
-				else
-				{
-					if (lexer->lookahead == '\\' && valid_symbols[EXPANSION_WORD])
-					{
-						goto expansion_word;
-					}
-					return false;
-				}
-			}
-			else
-			{
-				break;
-			}
-		}
-
-		// no '*', '@', '?', '-', '$', '0', '_'
-		if (!valid_symbols[EXPANSION_WORD] && (lexer->lookahead == '*' || lexer->lookahead == '@' || lexer->lookahead == '?' || lexer->lookahead == '-' || lexer->lookahead == '0' || lexer->lookahead == '_'))
-		{
-			lexer->mark_end(lexer);
-			advance(lexer);
-			if (lexer->lookahead == '=' || lexer->lookahead == '[' || lexer->lookahead == ':' || lexer->lookahead == '-' || lexer->lookahead == '%' || lexer->lookahead == '#' || lexer->lookahead == '/')
-			{
-				return false;
-			}
-			if (valid_symbols[EXTGLOB_PATTERN] && iswspace(lexer->lookahead))
-			{
-				lexer->mark_end(lexer);
-				lexer->result_symbol = EXTGLOB_PATTERN;
-				return true;
-			}
-		}
-
-		bool is_number = true;
-		if (iswdigit(lexer->lookahead))
-		{
-			advance(lexer);
-		}
-		else if (iswalpha(lexer->lookahead) || lexer->lookahead == '_')
-		{
-			is_number = false;
-			advance(lexer);
-		}
-		else
-		{
-			if (lexer->lookahead == '{')
-			{
-				goto brace_start;
-			}
-			if (valid_symbols[EXPANSION_WORD])
-			{
-				goto expansion_word;
-			}
-			if (valid_symbols[EXTGLOB_PATTERN])
-			{
-				goto extglob_pattern;
-			}
-			return false;
-		}
-
-		for (;;)
-		{
-			if (iswdigit(lexer->lookahead))
-			{
-				advance(lexer);
-			}
-			else if (iswalpha(lexer->lookahead) || lexer->lookahead == '_')
-			{
-				is_number = false;
-				advance(lexer);
-			}
-			else
-			{
-				break;
-			}
-		}
-
-		if (is_number && valid_symbols[FILE_DESCRIPTOR] && (lexer->lookahead == '>' || lexer->lookahead == '<'))
-		{
-			lexer->result_symbol = FILE_DESCRIPTOR;
-			return true;
-		}
-
-		if (valid_symbols[VARIABLE_NAME])
-		{
-			if (lexer->lookahead == '+')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				if (lexer->lookahead == '=' || lexer->lookahead == ':')
-				{
-					lexer->result_symbol = VARIABLE_NAME;
-					return true;
-				}
-				return false;
-			}
-			if (lexer->lookahead == '/')
-			{
-				return false;
-			}
-			if (lexer->lookahead == '=' || lexer->lookahead == '[' || (lexer->lookahead == ':' && !valid_symbols[OPENING_PAREN]) || // TODO(amaanq): more cases for regular word chars but not variable
-																																	// names for function words, only handling : for now? #235
-				lexer->lookahead == '%' || (lexer->lookahead == '#' && !is_number) || lexer->lookahead == '@' || (lexer->lookahead == '-'))
-			{
-				lexer->mark_end(lexer);
-				lexer->result_symbol = VARIABLE_NAME;
-				return true;
-			}
-
-			if (lexer->lookahead == '?')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				lexer->result_symbol = VARIABLE_NAME;
-				return iswalpha(lexer->lookahead);
-			}
-		}
-
-		return false;
-	}
-
-	if (valid_symbols[BARE_DOLLAR] && !in_error_recovery(valid_symbols) && scan_bare_dollar(lexer))
-	{
-		return true;
-	}
-
-	if ((valid_symbols[REGEX]) && !in_error_recovery(valid_symbols))
-	{
-		if (valid_symbols[REGEX])
-		{
-			while (iswspace(lexer->lookahead))
-			{
-				skip(lexer);
-			}
-		}
-
-		if ((lexer->lookahead != '"' && lexer->lookahead != '\'') || ((lexer->lookahead == '$' || lexer->lookahead == '\'')) || (lexer->lookahead == '\''))
-		{
-			typedef struct
-			{
-				bool	 done;
-				bool	 advanced_once;
-				bool	 found_non_alnumdollarunderdash;
-				bool	 last_was_escape;
-				bool	 in_single_quote;
-				uint32_t paren_depth;
-				uint32_t bracket_depth;
-				uint32_t brace_depth;
-			} State;
-
-			if (lexer->lookahead == '$')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				if (lexer->lookahead == '(')
-				{
-					return false;
-				}
-			}
-
-			lexer->mark_end(lexer);
-
-			State state = {false, false, false, false, false, 0, 0, 0};
-			while (!state.done)
-			{
-				if (state.in_single_quote)
-				{
-					if (lexer->lookahead == '\'')
-					{
-						state.in_single_quote = false;
-						advance(lexer);
-						lexer->mark_end(lexer);
-					}
-				}
-				switch (lexer->lookahead)
-				{
-				case '\\':
-					state.last_was_escape = true;
-					break;
-				case '\0':
-					return false;
-				case '(':
-					state.paren_depth++;
-					state.last_was_escape = false;
-					break;
-				case '[':
-					state.bracket_depth++;
-					state.last_was_escape = false;
-					break;
-				case '{':
-					if (!state.last_was_escape)
-						state.brace_depth++;
-					state.last_was_escape = false;
-					break;
-				case ')':
-					if (state.paren_depth == 0)
-						state.done = true;
-					state.paren_depth--;
-					state.last_was_escape = false;
-					break;
-				case ']':
-					if (state.bracket_depth == 0)
-						state.done = true;
-					state.bracket_depth--;
-					state.last_was_escape = false;
-					break;
-				case '}':
-					if (state.brace_depth == 0)
-						state.done = true;
-					state.brace_depth--;
-					state.last_was_escape = false;
-					break;
-				case '\'':
-					// Enter or exit a single-quoted string.
-					state.in_single_quote = !state.in_single_quote;
-					advance(lexer);
-					state.advanced_once = true;
-					state.last_was_escape = false;
-					continue;
-				default:
-					state.last_was_escape = false;
-					break;
-				}
-
-				if (!state.done)
-				{
-					if (valid_symbols[REGEX])
-					{
-						bool was_space = !state.in_single_quote && iswspace(lexer->lookahead);
-						advance(lexer);
-						state.advanced_once = true;
-						if (!was_space || state.paren_depth > 0)
-						{
-							lexer->mark_end(lexer);
-						}
-					}
-				}
-			}
-
-			lexer->result_symbol = REGEX;
-			if (valid_symbols[REGEX] && !state.advanced_once)
-			{
-				return false;
-			}
-			return true;
-		}
-	}
-
-extglob_pattern:
-	if (valid_symbols[EXTGLOB_PATTERN] && !in_error_recovery(valid_symbols))
-	{
-		// first skip ws, then check for ? * + @ !
-		while (iswspace(lexer->lookahead))
-		{
-			skip(lexer);
-		}
-
-		if (lexer->lookahead == '?' || lexer->lookahead == '*' || lexer->lookahead == '+' || lexer->lookahead == '@' || lexer->lookahead == '!' || lexer->lookahead == '-' || lexer->lookahead == ')' || lexer->lookahead == '\\' || lexer->lookahead == '.' || lexer->lookahead == '[' || (iswalpha(lexer->lookahead)))
-		{
-			if (lexer->lookahead == '\\')
-			{
-				advance(lexer);
-				if ((iswspace(lexer->lookahead) || lexer->lookahead == '"') && lexer->lookahead != '\r' && lexer->lookahead != '\n')
-				{
-					advance(lexer);
-				}
-				else
-				{
-					return false;
-				}
-			}
-
-			if (lexer->lookahead == ')' && scanner->last_glob_paren_depth == 0)
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-
-				if (iswspace(lexer->lookahead))
-				{
-					return false;
-				}
-			}
-
-			lexer->mark_end(lexer);
-			bool was_non_alpha = !iswalpha(lexer->lookahead);
-			if (lexer->lookahead != '[')
-			{
-				// no esac
-				if (lexer->lookahead == 'e')
-				{
-					lexer->mark_end(lexer);
-					advance(lexer);
-					if (lexer->lookahead == 's')
-					{
-						advance(lexer);
-						if (lexer->lookahead == 'a')
-						{
-							advance(lexer);
-							if (lexer->lookahead == 'c')
-							{
-								advance(lexer);
-								if (iswspace(lexer->lookahead))
-								{
-									return false;
-								}
-							}
-						}
-					}
-				}
-				else
-				{
-					advance(lexer);
-				}
-			}
-
-			// -\w is just a word, find something else special
-			if (lexer->lookahead == '-')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				while (iswalnum(lexer->lookahead))
-				{
-					advance(lexer);
-				}
-
-				if (lexer->lookahead == ')' || lexer->lookahead == '\\' || lexer->lookahead == '.')
-				{
-					return false;
-				}
-				lexer->mark_end(lexer);
-			}
-
-			// case item -) or *)
-			if (lexer->lookahead == ')' && scanner->last_glob_paren_depth == 0)
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				if (iswspace(lexer->lookahead))
-				{
-					lexer->result_symbol = EXTGLOB_PATTERN;
-					return was_non_alpha;
-				}
-			}
-
-			if (iswspace(lexer->lookahead))
-			{
-				lexer->mark_end(lexer);
-				lexer->result_symbol = EXTGLOB_PATTERN;
-				scanner->last_glob_paren_depth = 0;
-				return true;
-			}
-
-			if (lexer->lookahead == '$')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				if (lexer->lookahead == '{' || lexer->lookahead == '(')
-				{
-					lexer->result_symbol = EXTGLOB_PATTERN;
-					return true;
-				}
-			}
-
-			if (lexer->lookahead == '|')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				lexer->result_symbol = EXTGLOB_PATTERN;
-				return true;
-			}
-
-			if (!iswalnum(lexer->lookahead) && lexer->lookahead != '(' && lexer->lookahead != '"' && lexer->lookahead != '[' && lexer->lookahead != '?' && lexer->lookahead != '/' && lexer->lookahead != '\\' && lexer->lookahead != '_' && lexer->lookahead != '*')
-			{
-				return false;
-			}
-
-			typedef struct
-			{
-				bool	 done;
-				bool	 saw_non_alphadot;
-				uint32_t paren_depth;
-				uint32_t bracket_depth;
-				uint32_t brace_depth;
-			} State;
-
-			State state = {false, was_non_alpha, scanner->last_glob_paren_depth, 0, 0};
-			while (!state.done)
-			{
-				switch (lexer->lookahead)
-				{
-				case '\0':
-					return false;
-				case '(':
-					state.paren_depth++;
-					break;
-				case '[':
-					state.bracket_depth++;
-					break;
-				case '{':
-					state.brace_depth++;
-					break;
-				case ')':
-					if (state.paren_depth == 0)
-					{
-						state.done = true;
-					}
-					state.paren_depth--;
-					break;
-				case ']':
-					if (state.bracket_depth == 0)
-					{
-						state.done = true;
-					}
-					state.bracket_depth--;
-					break;
-				case '}':
-					if (state.brace_depth == 0)
-					{
-						state.done = true;
-					}
-					state.brace_depth--;
-					break;
-				}
-
-				if (lexer->lookahead == '|')
-				{
-					lexer->mark_end(lexer);
-					advance(lexer);
-					if (state.paren_depth == 0 && state.bracket_depth == 0 && state.brace_depth == 0)
-					{
-						lexer->result_symbol = EXTGLOB_PATTERN;
-						return true;
-					}
-				}
-
-				if (!state.done)
-				{
-					bool was_space = iswspace(lexer->lookahead);
-					if (lexer->lookahead == '$')
-					{
-						lexer->mark_end(lexer);
-						if (!iswalpha(lexer->lookahead) && lexer->lookahead != '.' && lexer->lookahead != '\\')
-						{
-							state.saw_non_alphadot = true;
-						}
-						advance(lexer);
-						if (lexer->lookahead == '(' || lexer->lookahead == '{')
-						{
-							lexer->result_symbol = EXTGLOB_PATTERN;
-							scanner->last_glob_paren_depth = state.paren_depth;
-							return state.saw_non_alphadot;
-						}
-					}
-					if (was_space)
-					{
-						lexer->mark_end(lexer);
-						lexer->result_symbol = EXTGLOB_PATTERN;
-						scanner->last_glob_paren_depth = 0;
-						return state.saw_non_alphadot;
-					}
-					if (lexer->lookahead == '"')
-					{
-						lexer->mark_end(lexer);
-						lexer->result_symbol = EXTGLOB_PATTERN;
-						scanner->last_glob_paren_depth = 0;
-						return state.saw_non_alphadot;
-					}
-					if (lexer->lookahead == '\\')
-					{
-						if (!iswalpha(lexer->lookahead) && lexer->lookahead != '.' && lexer->lookahead != '\\')
-						{
-							state.saw_non_alphadot = true;
-						}
-						advance(lexer);
-						if (iswspace(lexer->lookahead) || lexer->lookahead == '"')
-						{
-							advance(lexer);
-						}
-					}
-					else
-					{
-						if (!iswalpha(lexer->lookahead) && lexer->lookahead != '.' && lexer->lookahead != '\\')
-						{
-							state.saw_non_alphadot = true;
-						}
-						advance(lexer);
-					}
-					if (!was_space)
-					{
-						lexer->mark_end(lexer);
-					}
-				}
-			}
-
-			lexer->result_symbol = EXTGLOB_PATTERN;
-			scanner->last_glob_paren_depth = 0;
-			return state.saw_non_alphadot;
-		}
-		scanner->last_glob_paren_depth = 0;
-
-		return false;
-	}
-
-expansion_word:
-	if (valid_symbols[EXPANSION_WORD])
-	{
-		bool advanced_once = false;
-		bool advance_once_space = false;
-		for (;;)
-		{
-			if (lexer->lookahead == '\"')
-				return false;
-			if (lexer->lookahead == '$')
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				if (lexer->lookahead == '{' || lexer->lookahead == '(' || lexer->lookahead == '\'' || iswalnum(lexer->lookahead))
-				{
-					lexer->result_symbol = EXPANSION_WORD;
-					return advanced_once;
-				}
-				advanced_once = true;
-			}
-
-			if (lexer->lookahead == '}')
-			{
-				lexer->mark_end(lexer);
-				lexer->result_symbol = EXPANSION_WORD;
-				return advanced_once || advance_once_space;
-			}
-
-			if (lexer->lookahead == '(' && !(advanced_once || advance_once_space))
-			{
-				lexer->mark_end(lexer);
-				advance(lexer);
-				while (lexer->lookahead != ')' && !lexer->eof(lexer))
-				{
-					// if we find a $( or ${ assume this is valid and is
-					// a garbage concatenation of some weird word + an
-					// expansion
-					// I wonder where this can fail
-					if (lexer->lookahead == '$')
-					{
-						lexer->mark_end(lexer);
-						advance(lexer);
-						if (lexer->lookahead == '{' || lexer->lookahead == '(' || lexer->lookahead == '\'' || iswalnum(lexer->lookahead))
-						{
-							lexer->result_symbol = EXPANSION_WORD;
-							return advanced_once;
-						}
-						advanced_once = true;
-					}
-					else
-					{
-						advanced_once = advanced_once || !iswspace(lexer->lookahead);
-						advance_once_space = advance_once_space || iswspace(lexer->lookahead);
-						advance(lexer);
-					}
-				}
-				lexer->mark_end(lexer);
-				if (lexer->lookahead == ')')
-				{
-					advanced_once = true;
-					advance(lexer);
-					lexer->mark_end(lexer);
-					if (lexer->lookahead == '}')
-						return false;
-				}
-				else
-					return false;
-			}
-
-			if (lexer->lookahead == '\'')
-				return false;
-			if (lexer->eof(lexer))
-				return false;
-			advanced_once = advanced_once || !iswspace(lexer->lookahead);
-			advance_once_space = advance_once_space || iswspace(lexer->lookahead);
-			advance(lexer);
-		}
-	}
-
-brace_start:
-	return false;
-}
-
-void *tree_sitter_sh_external_scanner_create()
-{
-	Scanner *scanner = calloc(1, sizeof(Scanner));
-	array_init(&scanner->heredocs);
-	return scanner;
-}
-
-bool tree_sitter_sh_external_scanner_scan(void *payload, TSLexer *lexer, const bool *valid_symbols)
-{
-	Scanner *scanner = (Scanner *)payload;
-	return scan(scanner, lexer, valid_symbols);
-}
-
-unsigned tree_sitter_sh_external_scanner_serialize(void *payload, char *state)
-{
-	Scanner *scanner = (Scanner *)payload;
-	return serialize(scanner, state);
-}
-
-void tree_sitter_sh_external_scanner_deserialize(void *payload, const char *state, unsigned length)
-{
-	Scanner *scanner = (Scanner *)payload;
-	deserialize(scanner, state, length);
-}
-
-void tree_sitter_sh_external_scanner_destroy(void *payload)
-{
-	Scanner *scanner = (Scanner *)payload;
-	for (size_t i = 0; i < scanner->heredocs.size; i++)
-	{
-		Heredoc *heredoc = array_get(&scanner->heredocs, i);
-		array_delete(&heredoc->current_leading_word);
-		array_delete(&heredoc->delimiter);
-	}
-	array_delete(&scanner->heredocs);
-	free(scanner);
-}