From 6e0c49305e003d69cb6418a0cb8a9b1744035afe Mon Sep 17 00:00:00 2001 From: Amin Yahyaabadi Date: Fri, 24 Sep 2021 12:55:17 -0500 Subject: [PATCH 001/347] Use ISO C and C++ conformant name: _fdopen on windows Fixes ``` warning: In file included from src\lib.c:12: warning: src/./parser.c:1781:28: warning: 'fdopen' is deprecated: The POSIX name for this item is deprecated. Instead, use the ISO C and C++ conformant name: _fdopen. See online help for details. [-Wdeprecated-declarations] warning: self->dot_graph_file = fdopen(fd, "a"); warning: ^ warning: C:\Program Files (x86)\Windows Kits\10\Include\10.0.19041.0\ucrt\stdio.h:2431:28: note: 'fdopen' has been explicitly marked deprecated here warning: _Check_return_ _CRT_NONSTDC_DEPRECATE(_fdopen) _ACRTIMP FILE* __cdecl fdopen(_In_ int _FileHandle, _In_z_ char const* _Format); warning: ^ warning: C:\Program Files (x86)\Windows Kits\10\Include\10.0.19041.0\ucrt\corecrt.h:414:50: note: expanded from macro '_CRT_NONSTDC_DEPRECATE' warning: #define _CRT_NONSTDC_DEPRECATE(_NewName) _CRT_DEPRECATE_TEXT( \ warning: ^ warning: C:\Program Files (x86)\Microsoft Visual Studio\2019\Preview\VC\Tools\MSVC\14.29.30133\include\vcruntime.h:310:47: note: expanded from macro '_CRT_DEPRECATE_TEXT' warning: #define _CRT_DEPRECATE_TEXT(_Text) __declspec(deprecated(_Text)) ``` --- lib/src/parser.c | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/lib/src/parser.c b/lib/src/parser.c index 7db1aceb..ebeb4b37 100644 --- a/lib/src/parser.c +++ b/lib/src/parser.c @@ -1776,7 +1776,11 @@ void ts_parser_print_dot_graphs(TSParser *self, int fd) { } if (fd >= 0) { + #ifdef _WIN32 + self->dot_graph_file = _fdopen(fd, "a"); + #else self->dot_graph_file = fdopen(fd, "a"); + #endif } else { self->dot_graph_file = NULL; } From 94ffcdadf3abc3890e4f1e7d4c8ec9cdc8543668 Mon Sep 17 00:00:00 2001 From: Amin Yahyaabadi Date: Fri, 24 Sep 2021 15:20:34 -0500 Subject: [PATCH 002/347] Mark stack__iter as static Fixes ``` warning: In file included from 
src\lib.c:14: warning: src/./stack.c:311:9: warning: static function 'ts_stack__add_slice' is used in an inline function with external linkage [-Wstatic-in-inline] warning: ts_stack__add_slice( warning: ^ warning: src/./stack.c:274:1: note: use 'static' to give inline function 'stack__iter' internal linkage warning: inline StackSliceArray stack__iter(Stack *self, StackVersion version, warning: ^ warning: static warning: src/./stack.c:15:16: note: expanded from macro 'inline' warning: #define inline __forceinline warning: ^ warning: src/./stack.c:258:13: note: 'ts_stack__add_slice' declared here warning: static void ts_stack__add_slice(Stack *self, StackVersion original_version, warning: ^ warning: 1 warning generated. Finished dev [unoptimized + debuginfo] target(s) in 2.01s ``` --- lib/src/stack.c | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/src/stack.c b/lib/src/stack.c index 1dc6895f..e49289cf 100644 --- a/lib/src/stack.c +++ b/lib/src/stack.c @@ -302,7 +302,7 @@ static void ts_stack__add_slice( array_push(&self->slices, slice); } -inline StackSliceArray stack__iter( +static StackSliceArray stack__iter( Stack *self, StackVersion version, StackCallback callback, From a33e9141a8e0e3eeb08aeae228bb8b0214ea7d0b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 9 Nov 2022 04:55:52 +0200 Subject: [PATCH 003/347] fix(cli): Racing on playground webserver port binding --- cli/Cargo.toml | 2 +- cli/src/playground.rs | 39 ++++++++++++++++++++------------------- 2 files changed, 21 insertions(+), 20 deletions(-) diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 3c2bd171..5403075d 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -35,7 +35,7 @@ rustc-hash = "1" semver = "1.0" serde = { version = "1.0.130", features = ["derive"] } smallbitvec = "2.5.1" -tiny_http = "0.8" +tiny_http = "0.12.0" walkdir = "2.3" webbrowser = "0.5.1" which = "4.1.0" diff --git a/cli/src/playground.rs b/cli/src/playground.rs index be804b50..a2dbef96 100644 --- 
a/cli/src/playground.rs +++ b/cli/src/playground.rs @@ -45,20 +45,7 @@ fn get_main_html(tree_sitter_dir: &Option) -> Cow<'static, [u8]> { } pub fn serve(grammar_path: &Path, open_in_browser: bool) { - let port = env::var("TREE_SITTER_PLAYGROUND_PORT") - .map(|v| v.parse::().expect("Invalid port specification")) - .unwrap_or_else( - |_| get_available_port().expect( - "Couldn't find an available port, try providing a port number via the TREE_SITTER_PLAYGROUND_PORT \ - environment variable" - ) - ); - let addr = format!( - "{}:{}", - env::var("TREE_SITTER_PLAYGROUND_ADDR").unwrap_or("127.0.0.1".to_owned()), - port - ); - let server = Server::http(&addr).expect("Failed to start web server"); + let server = get_server(); let grammar_name = wasm::get_grammar_name(&grammar_path.join("src")) .with_context(|| "Failed to get wasm filename") .unwrap(); @@ -71,7 +58,7 @@ pub fn serve(grammar_path: &Path, open_in_browser: bool) { ) }) .unwrap(); - let url = format!("http://{}", addr); + let url = format!("http://{}", server.server_addr()); println!("Started playground on: {}", url); if open_in_browser { if let Err(_) = webbrowser::open(&url) { @@ -135,10 +122,24 @@ fn response<'a>(data: &'a [u8], header: &Header) -> Response<&'a [u8]> { .with_header(header.clone()) } -fn get_available_port() -> Option { - (8000..12000).find(port_is_available) +fn get_server() -> Server { + let addr = env::var("TREE_SITTER_PLAYGROUND_ADDR").unwrap_or("127.0.0.1".to_owned()); + let port = env::var("TREE_SITTER_PLAYGROUND_PORT") + .map(|v| v.parse::().expect("Invalid port specification")) + .ok(); + let listener = match port { + Some(port) => bind_to(&*addr, port).expect("Can't bind to the specified port"), + None => { + get_listener_on_available_port(&*addr).expect("Can't find a free port to bind to it") + } + }; + Server::from_listener(listener, None).expect("Failed to start web server") } -fn port_is_available(port: &u16) -> bool { - TcpListener::bind(("127.0.0.1", *port)).is_ok() +fn 
get_listener_on_available_port(addr: &str) -> Option { + (8000..12000).find_map(|port| bind_to(addr, port)) +} + +fn bind_to(addr: &str, port: u16) -> Option { + TcpListener::bind(format!("{addr}:{port}")).ok() } From c669e5ee159e0c59a3f094327a01dd688bc67c56 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 11 Dec 2022 19:11:58 +0200 Subject: [PATCH 004/347] Fix permanent rebuild triggering in a git worktree due to wrong git branch file path --- Cargo.lock | 508 +++++++++++++++------------------------------------ cli/build.rs | 16 +- 2 files changed, 166 insertions(+), 358 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 49f95269..f5c4e7e4 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -4,22 +4,13 @@ version = 3 [[package]] name = "aho-corasick" -version = "0.7.15" +version = "0.7.20" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7404febffaa47dac81aa44dba71523c9d069b1bdc50a77db41195149e17f68e5" +checksum = "cc936419f96fa211c1b9166887b38e5e40b19958e5b895be7c1f93adec7071ac" dependencies = [ "memchr", ] -[[package]] -name = "ansi_term" -version = "0.11.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ee49baf6cb617b853aa8d93bf420db2383fab46d314482ca2803b40d5fde979b" -dependencies = [ - "winapi", -] - [[package]] name = "ansi_term" version = "0.12.1" @@ -31,27 +22,15 @@ dependencies = [ [[package]] name = "anyhow" -version = "1.0.40" +version = "1.0.66" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "28b2cd92db5cbd74e8e5028f7e27dd7aa3090e89e4f2a197cc7c8dfb69c7063b" - -[[package]] -name = "arrayref" -version = "0.3.6" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a4c527152e37cf757a3f78aae5a06fbeefdb07ccc535c980a3208ee3060dd544" - -[[package]] -name = "arrayvec" -version = "0.5.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "23b62fc65de8e4e7f52534fb52b0f3ed04746ae267519eef2a83941e8085068b" +checksum = 
"216261ddc8289130e551ddcd5ce8a064710c0d064a4d2895c67151c92b5443f6" [[package]] name = "ascii" -version = "1.0.0" +version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "bbf56136a5198c7b01a49e3afcbef6cf84597273d298f54432926024107b0109" +checksum = "d92bec98840b8f03a5ff5413de5293bfcd8bf96467cf5452609f939ec6f5de16" [[package]] name = "atty" @@ -66,44 +45,27 @@ dependencies = [ [[package]] name = "autocfg" -version = "1.0.1" +version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "cdb031dd78e28731d87d56cc8ffef4a8f36ca26c38fe2de700543e627f8a464a" - -[[package]] -name = "base64" -version = "0.13.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "904dfeac50f3cdaba28fc6f57fdcddb75f49ed61346676a78c4ffe55877802fd" +checksum = "d468802bab17cbc0cc575e9b053f41e72aa36bfa6b7f55e3529ffa43161b97fa" [[package]] name = "bitflags" -version = "1.2.1" +version = "1.3.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "cf1de2fe8c75bc145a2f577add951f8134889b4795d47466a54a5c846d691693" - -[[package]] -name = "blake2b_simd" -version = "0.5.11" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "afa748e348ad3be8263be728124b24a24f268266f6f5d58af9d75f6a40b5c587" -dependencies = [ - "arrayref", - "arrayvec", - "constant_time_eq", -] +checksum = "bef38d45163c2f1dde094a7dfd33ccf595c92905c8f8f4fdc18d06fb1037718a" [[package]] name = "bumpalo" -version = "3.6.1" +version = "3.11.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "63396b8a4b9de3f4fdfb320ab6080762242f66a8ef174c49d8e19b674db4cdbe" +checksum = "572f695136211188308f16ad2ca5c851a712c464060ae6974944458eb83880ba" [[package]] name = "cc" -version = "1.0.67" +version = "1.0.77" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e3c69b077ad434294d3ce9f1f6143a2a4b89a8a2d54ef813d85003a4fd1137fd" +checksum = 
"e9f73505338f7d905b19d18738976aae232eb46b8efc15554ffc56deb5d9ebe4" [[package]] name = "cfg-if" @@ -111,19 +73,6 @@ version = "1.0.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd" -[[package]] -name = "chrono" -version = "0.4.19" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "670ad68c9088c2a963aaa298cb369688cf3f9465ce5e2d4ca10e6e0098a1ce73" -dependencies = [ - "libc", - "num-integer", - "num-traits", - "time", - "winapi", -] - [[package]] name = "chunked_transfer" version = "1.4.0" @@ -132,11 +81,11 @@ checksum = "fff857943da45f546682664a79488be82e69e43c1a7a2307679ab9afb3a66d2e" [[package]] name = "clap" -version = "2.33.3" +version = "2.34.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "37e58ac78573c40708d45522f0d80fa2f01cc4f9b4e2bf749807255454312002" +checksum = "a0610544180c38b88101fecf2dd634b174a62eef6946f84dfc6a7127512b381c" dependencies = [ - "ansi_term 0.11.0", + "ansi_term", "atty", "bitflags", "strsim", @@ -145,28 +94,11 @@ dependencies = [ "vec_map", ] -[[package]] -name = "constant_time_eq" -version = "0.1.5" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "245097e9a4535ee1e3e3931fcfcd55a796a44c643e8596ff6566d68f09b87bbc" - -[[package]] -name = "crossbeam-utils" -version = "0.8.3" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e7e9d99fa91428effe99c5c6d4634cdeba32b8cf784fc428a2a687f61a952c49" -dependencies = [ - "autocfg", - "cfg-if", - "lazy_static", -] - [[package]] name = "ctor" -version = "0.1.20" +version = "0.1.26" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5e98e2ad1a782e33928b96fc3948e7c355e5af34ba4de7670fe8bac2a3b2006d" +checksum = "6d2301688392eb071b0bf1a37be05c469d3cc4dbbd95df672fe28ab021e6a096" dependencies = [ "quote", "syn", @@ -174,9 +106,9 @@ dependencies = [ [[package]] name = "diff" 
-version = "0.1.12" +version = "0.1.13" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0e25ea47919b1560c4e3b7fe0aaab9becf5b84a10325ddf7db0f0ba5e1026499" +checksum = "56254986775e3233ffa9c4d7d3faaf6d36a2c09d30b20687e9f88bc8bafc16c8" [[package]] name = "difference" @@ -186,18 +118,18 @@ checksum = "524cbf6897b527295dff137cec09ecf3a05f4fddffd7dfcd1585403449e74198" [[package]] name = "dirs" -version = "3.0.1" +version = "3.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "142995ed02755914747cc6ca76fc7e4583cd18578746716d0508ea6ed558b9ff" +checksum = "30baa043103c9d0c2a57cf537cc2f35623889dc0d405e6c3cccfadbc81c71309" dependencies = [ "dirs-sys", ] [[package]] name = "dirs-sys" -version = "0.3.5" +version = "0.3.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8e93d7f5705de3e49895a2b5e0b8855a1c27f080192ae9c32a6432d50741a57a" +checksum = "1b1d1d91c932ef41c0f2663aa8b0ca0342d444d842c06914aa0a7e352d0bada6" dependencies = [ "libc", "redox_users", @@ -206,40 +138,28 @@ dependencies = [ [[package]] name = "either" -version = "1.6.1" +version = "1.8.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e78d4f1cc4ae33bbfc157ed5d5a5ef3bc29227303d595861deb238fcec4e9457" +checksum = "90e5c1c8368803113bf0c9584fc495a58b86dc8a29edbf8fe877d21d9507e797" [[package]] -name = "form_urlencoded" -version = "1.0.1" +name = "fastrand" +version = "1.8.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5fc25a87fa4fd2094bffb06925852034d90a17f0d1e05197d4956d3555752191" +checksum = "a7a407cfaa3385c4ae6b23e84623d48c2798d06e3e6a1878f7f59f17b3f86499" dependencies = [ - "matches", - "percent-encoding", + "instant", ] [[package]] name = "getrandom" -version = "0.1.16" +version = "0.2.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8fc3cb4d91f53b50155bdcfd23f6a4c39ae1969c2ae85982b135750cccaf5fce" +checksum = 
"c05aeb6a22b8f62540c194aac980f2115af067bfe15a0734d7277a768d396b31" dependencies = [ "cfg-if", "libc", - "wasi 0.9.0+wasi-snapshot-preview1", -] - -[[package]] -name = "getrandom" -version = "0.2.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c9495705279e7140bf035dde1f6e750c162df8b625267cd52cc44e0b156732c8" -dependencies = [ - "cfg-if", - "libc", - "wasi 0.10.2+wasi-snapshot-preview1", + "wasi", ] [[package]] @@ -250,60 +170,64 @@ checksum = "9b919933a397b79c37e33b77bb2aa3dc8eb6e165ad809e58ff75bc7db2e34574" [[package]] name = "hashbrown" -version = "0.9.1" +version = "0.12.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d7afe4a420e3fe79967a00898cc1f4db7c8a49a9333a29f8a4bd76a253d5cd04" +checksum = "8a9ee70c43aaf417c914396645a0fa852624801b24ebb7ae78fe8272889ac888" [[package]] name = "hermit-abi" -version = "0.1.18" +version = "0.1.19" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "322f4de77956e22ed0e5032c359a0f1273f1f7f0d79bfa3b8ffbc730d7fbcc5c" +checksum = "62b467343b94ba476dcb2500d242dadbb39557df889310ac77c5d99100aaac33" dependencies = [ "libc", ] [[package]] name = "html-escape" -version = "0.2.6" +version = "0.2.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d348900ce941b7474395ba922ed3735a517df4546a2939ddb416ce85eeaa988e" +checksum = "15315cfa9503e9aa85a477138eff76a1b203a430703548052c330b69d8d8c205" dependencies = [ "utf8-width", ] [[package]] -name = "idna" -version = "0.2.2" +name = "httpdate" +version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "89829a5d69c23d348314a7ac337fe39173b61149a9864deabd260983aed48c21" -dependencies = [ - "matches", - "unicode-bidi", - "unicode-normalization", -] +checksum = "c4a1e36c821dbe04574f602848a19f742f4fb3c98d40449f11bcad18d6b17421" [[package]] name = "indexmap" -version = "1.6.1" +version = "1.9.2" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "4fb1fa934250de4de8aef298d81c729a7d33d8c239daa3a7575e6b92bfc7313b" +checksum = "1885e79c1fc4b10f0e172c475f458b7f7b93061064d98c3293e98c5ba0c8b399" dependencies = [ "autocfg", "hashbrown", ] [[package]] -name = "itoa" -version = "0.4.7" +name = "instant" +version = "0.1.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dd25036021b0de88a0aff6b850051563c6516d0bf53f8638938edbb9de732736" +checksum = "7a5bbe824c507c5da5956355e86a746d82e0e1464f65d862cc5e71da70e94b2c" +dependencies = [ + "cfg-if", +] + +[[package]] +name = "itoa" +version = "1.0.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "4217ad341ebadf8d8e724e264f13e593e0648f5b3e94b3896a5df283be015ecc" [[package]] name = "js-sys" -version = "0.3.48" +version = "0.3.60" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dc9f84f9b115ce7843d60706df1422a916680bfdfcbdb0447c5614ff9d7e4d78" +checksum = "49409df3e3bf0856b916e2ceaca09ee28e6871cf7d9ce97a692cacfdb2a25a47" dependencies = [ "wasm-bindgen", ] @@ -316,15 +240,15 @@ checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" [[package]] name = "libc" -version = "0.2.86" +version = "0.2.138" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b7282d924be3275cec7f6756ff4121987bc6481325397dde6ba3e7802b1a8b1c" +checksum = "db6d7e329c562c5dfab7a46a2afabc8b987ab9a4834c9d1ca04dc54c1546cef8" [[package]] name = "libloading" -version = "0.7.0" +version = "0.7.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6f84d96438c15fcd6c3f244c8fce01d1e2b9c6b5623e9c711dc9286d8fc92d6a" +checksum = "b67380fd3b2fbe7527a606e18729d21c6f3951633d0500574c4dc22d2d638b9f" dependencies = [ "cfg-if", "winapi", @@ -332,70 +256,39 @@ dependencies = [ [[package]] name = "log" -version = "0.4.14" +version = "0.4.17" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "51b9bbe6c47d51fc3e1a9b945965946b4c44142ab8792c50835a980d362c2710" +checksum = "abb12e687cfb44aa40f41fc3978ef76448f9b6038cad6aef4259d3c095a2382e" dependencies = [ "cfg-if", ] -[[package]] -name = "matches" -version = "0.1.8" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7ffc5c5338469d4d3ea17d269fa8ea3512ad247247c30bd2df69e68309ed0a08" - [[package]] name = "memchr" -version = "2.3.4" +version = "2.5.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0ee1c47aaa256ecabcaea351eae4a9b01ef39ed810004e298d2511ed284b1525" - -[[package]] -name = "num-integer" -version = "0.1.44" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d2cc698a63b549a70bc047073d2949cce27cd1c7b0a4a862d08a8031bc2801db" -dependencies = [ - "autocfg", - "num-traits", -] - -[[package]] -name = "num-traits" -version = "0.2.14" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9a64b1ec5cda2586e284722486d802acf1f7dbdc623e2bfc57e65ca1cd099290" -dependencies = [ - "autocfg", -] +checksum = "2dffe52ecf27772e601905b7522cb4ef790d2cc203488bbd0e2fe85fcb74566d" [[package]] name = "once_cell" -version = "1.7.0" +version = "1.16.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "10acf907b94fc1b1a152d08ef97e7759650268cf986bf127f387e602b02c7e5a" +checksum = "86f0b0d4bf799edbc74508c1e8bf170ff5f41238e5f8225603ca7caaae2b7860" [[package]] name = "output_vt100" -version = "0.1.2" +version = "0.1.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "53cdc5b785b7a58c5aad8216b3dfa114df64b0b06ae6e1501cef91df2fbdf8f9" +checksum = "628223faebab4e3e40667ee0b2336d34a5b960ff60ea743ddfdbcf7770bcfb66" dependencies = [ "winapi", ] -[[package]] -name = "percent-encoding" -version = "2.1.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"d4fd5641d01c8f18a23da7b6fe29298ff4b55afcccdf78973b24cf3175fee32e" - [[package]] name = "ppv-lite86" -version = "0.2.10" +version = "0.2.17" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ac74c624d6b2d21f425f752262f42188365d7b8ff1aff74c82e45136510a4857" +checksum = "5b40af805b3121feab8a3c29f04d8ad262fa8e0561883e7653e024ae4479e6de" [[package]] name = "pretty_assertions" @@ -403,7 +296,7 @@ version = "0.7.2" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "1cab0e7c02cf376875e9335e0ba1da535775beb5450d21e1dffca068818ed98b" dependencies = [ - "ansi_term 0.12.1", + "ansi_term", "ctor", "diff", "output_vt100", @@ -411,39 +304,38 @@ dependencies = [ [[package]] name = "proc-macro2" -version = "1.0.24" +version = "1.0.47" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1e0704ee1a7e00d7bb417d0770ea303c1bccbabf0ef1667dae92b5967f5f8a71" +checksum = "5ea3d908b0e36316caf9e9e2c4625cdde190a7e6f440d794667ed17a1855e725" dependencies = [ - "unicode-xid", + "unicode-ident", ] [[package]] name = "quote" -version = "1.0.9" +version = "1.0.21" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c3d0b9745dc2debf507c8422de05d7226cc1f0644216dfdfead988f9b1ab32a7" +checksum = "bbe448f377a7d6961e30f5955f9b8d106c3f5e449d493ee1b125c1d43c2b5179" dependencies = [ "proc-macro2", ] [[package]] name = "rand" -version = "0.8.3" +version = "0.8.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0ef9e7e66b4468674bfcb0c81af8b7fa0bb154fa9f28eb840da5c447baeb8d7e" +checksum = "34af8d1a0e25924bc5b7c43c079c942339d8f0a8b57c39049bef581b46327404" dependencies = [ "libc", "rand_chacha", "rand_core", - "rand_hc", ] [[package]] name = "rand_chacha" -version = "0.3.0" +version = "0.3.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e12735cf05c9e10bf21534da50a147b924d555dc7a547c42e6bb2d5b6017ae0d" +checksum = 
"e6c10a63a0fa32252be49d21e7709d4d4baf8d231c2dbce1eaa8141b9b127d88" dependencies = [ "ppv-lite86", "rand_core", @@ -451,65 +343,49 @@ dependencies = [ [[package]] name = "rand_core" -version = "0.6.2" +version = "0.6.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "34cf66eb183df1c5876e2dcf6b13d57340741e8dc255b48e40a26de954d06ae7" +checksum = "ec0be4795e2f6a28069bec0b5ff3e2ac9bafc99e6a9a7dc3547996c5c816922c" dependencies = [ - "getrandom 0.2.2", -] - -[[package]] -name = "rand_hc" -version = "0.3.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3190ef7066a446f2e7f42e239d161e905420ccab01eb967c9eb27d21b2322a73" -dependencies = [ - "rand_core", + "getrandom", ] [[package]] name = "redox_syscall" -version = "0.1.57" +version = "0.2.16" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "41cc0f7e4d5d4544e8861606a285bb08d3e70712ccc7d2b84d7c0ccfaf4b05ce" - -[[package]] -name = "redox_syscall" -version = "0.2.5" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "94341e4e44e24f6b591b59e47a8a027df12e008d73fd5672dbea9cc22f4507d9" +checksum = "fb5a58c1855b4b6819d59012155603f0b22ad30cad752600aadfcb695265519a" dependencies = [ "bitflags", ] [[package]] name = "redox_users" -version = "0.3.5" +version = "0.4.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "de0737333e7a9502c789a36d7c7fa6092a49895d4faa31ca5df163857ded2e9d" +checksum = "b033d837a7cf162d7993aded9304e30a83213c648b6e389db233191f891e5c2b" dependencies = [ - "getrandom 0.1.16", - "redox_syscall 0.1.57", - "rust-argon2", + "getrandom", + "redox_syscall", + "thiserror", ] [[package]] name = "regex" -version = "1.4.3" +version = "1.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d9251239e129e16308e70d853559389de218ac275b515068abc96829d05b948a" +checksum = "e076559ef8e241f2ae3479e36f97bd5741c0330689e217ad51ce2c76808b868a" dependencies = [ 
"aho-corasick", "memchr", "regex-syntax", - "thread_local", ] [[package]] name = "regex-syntax" -version = "0.6.22" +version = "0.6.28" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b5eb417147ba9860a96cfe72a0b93bf88fee1744b5636ec99ab20c1aa9376581" +checksum = "456c603be3e8d448b072f410900c09faf164fbce2d480456f50eea6e25f9c848" [[package]] name = "remove_dir_all" @@ -520,18 +396,6 @@ dependencies = [ "winapi", ] -[[package]] -name = "rust-argon2" -version = "0.8.3" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4b18820d944b33caa75a71378964ac46f58517c92b6ae5f762636247c09e78fb" -dependencies = [ - "base64", - "blake2b_simd", - "constant_time_eq", - "crossbeam-utils", -] - [[package]] name = "rustc-hash" version = "1.1.0" @@ -540,9 +404,9 @@ checksum = "08d43f7aa6b08d49f382cde6a7982047c3426db949b1424bc4b7ec9ae12c6ce2" [[package]] name = "ryu" -version = "1.0.5" +version = "1.0.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "71d301d4193d031abdd79ff7e3dd721168a9572ef3fe51a1517aba235bd8f86e" +checksum = "4501abdff3ae82a1c1b477a17252eb69cee9e66eb915c1abaa4f44d873df9f09" [[package]] name = "same-file" @@ -555,24 +419,24 @@ dependencies = [ [[package]] name = "semver" -version = "1.0.5" +version = "1.0.14" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0486718e92ec9a68fbed73bb5ef687d71103b142595b406835649bebd33f72c7" +checksum = "e25dfac463d778e353db5be2449d1cce89bd6fd23c9f1ea21310ce6e5a1b29c4" [[package]] name = "serde" -version = "1.0.130" +version = "1.0.149" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f12d06de37cf59146fbdecab66aa99f9fe4f78722e3607577a5375d66bd0c913" +checksum = "256b9932320c590e707b94576e3cc1f7c9024d0ee6612dfbcf1cb106cbe8e055" dependencies = [ "serde_derive", ] [[package]] name = "serde_derive" -version = "1.0.130" +version = "1.0.149" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "d7bc1a1ab1961464eae040d96713baa5a724a8152c1222492465b54322ec508b" +checksum = "b4eae9b04cbffdfd550eb462ed33bc6a1b68c935127d008b27444d08380f94e4" dependencies = [ "proc-macro2", "quote", @@ -581,9 +445,9 @@ dependencies = [ [[package]] name = "serde_json" -version = "1.0.63" +version = "1.0.89" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "43535db9747a4ba938c0ce0a98cc631a46ebf943c9e1d604e091df6007620bf6" +checksum = "020ff22c755c2ed3f8cf162dbb41a7268d934702f3ed3631656ea597e08fc3db" dependencies = [ "indexmap", "itoa", @@ -605,25 +469,25 @@ checksum = "8ea5119cdb4c55b55d432abb513a0429384878c15dde60cc77b1c99de1a95a6a" [[package]] name = "syn" -version = "1.0.67" +version = "1.0.105" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6498a9efc342871f91cc2d0d694c674368b4ceb40f62b65a7a08c3792935e702" +checksum = "60b9b43d45702de4c839cb9b51d9f529c5dd26a4aff255b42b1ebc03e88ee908" dependencies = [ "proc-macro2", "quote", - "unicode-xid", + "unicode-ident", ] [[package]] name = "tempfile" -version = "3.2.0" +version = "3.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dac1c663cfc93810f88aed9b8941d48cabf856a1b111c29a40439018d870eb22" +checksum = "5cdb1ef4eaeeaddc8fbd371e5017057064af0911902ef36b39801f67cc6d79e4" dependencies = [ "cfg-if", + "fastrand", "libc", - "rand", - "redox_syscall 0.2.5", + "redox_syscall", "remove_dir_all", "winapi", ] @@ -639,76 +503,41 @@ dependencies = [ [[package]] name = "thiserror" -version = "1.0.25" +version = "1.0.37" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fa6f76457f59514c7eeb4e59d891395fab0b2fd1d40723ae737d64153392e9c6" +checksum = "10deb33631e3c9018b9baf9dcbbc4f737320d2b576bac10f6aefa048fa407e3e" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.25" +version = "1.0.37" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "8a36768c0fbf1bb15eca10defa29526bda730a2376c2ab4393ccfa16fb1a318d" +checksum = "982d17546b47146b28f7c22e3d08465f6b8903d0ea13c1660d9d84a6e7adcdbb" dependencies = [ "proc-macro2", "quote", "syn", ] -[[package]] -name = "thread_local" -version = "1.1.3" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8018d24e04c95ac8790716a5987d0fec4f8b27249ffa0f7d33f1369bdfb88cbd" -dependencies = [ - "once_cell", -] - -[[package]] -name = "time" -version = "0.1.43" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ca8a50ef2360fbd1eeb0ecd46795a87a19024eb4b53c5dc916ca1fd95fe62438" -dependencies = [ - "libc", - "winapi", -] - [[package]] name = "tiny_http" -version = "0.8.0" +version = "0.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "eded47106b8e52d8ed8119f0ea6e8c0f5881e69783e0297b5a8462958f334bc1" +checksum = "389915df6413a2e74fb181895f933386023c71110878cd0825588928e64cdc82" dependencies = [ "ascii", - "chrono", "chunked_transfer", + "httpdate", "log", - "url", ] -[[package]] -name = "tinyvec" -version = "1.1.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "317cca572a0e89c3ce0ca1f1bdc9369547fe318a683418e42ac8f59d14701023" -dependencies = [ - "tinyvec_macros", -] - -[[package]] -name = "tinyvec_macros" -version = "0.1.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "cda74da7e1a664f795bb1f8a87ec406fb89a02522cf6e50620d016add6dbbf5c" - [[package]] name = "toml" -version = "0.5.8" +version = "0.5.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a31142970826733df8241ef35dc040ef98c679ab14d7c3e54d827099b3acecaa" +checksum = "8d82e1a7758622a465f8cee077614c73484dac5b836c02ff6a40d5d1010324d7" dependencies = [ "serde", ] @@ -726,7 +555,7 @@ dependencies = [ name = "tree-sitter-cli" version = "0.20.7" dependencies = [ - "ansi_term 0.12.1", 
+ "ansi_term", "anyhow", "atty", "clap", @@ -807,52 +636,22 @@ dependencies = [ ] [[package]] -name = "unicode-bidi" -version = "0.3.4" +name = "unicode-ident" +version = "1.0.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "49f2bd0c6468a8230e1db229cff8029217cf623c767ea5d60bfbd42729ea54d5" -dependencies = [ - "matches", -] - -[[package]] -name = "unicode-normalization" -version = "0.1.17" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "07fbfce1c8a97d547e8b5334978438d9d6ec8c20e38f56d4a4374d181493eaef" -dependencies = [ - "tinyvec", -] +checksum = "6ceab39d59e4c9499d4e5a8ee0e2735b891bb7308ac83dfb4e80cad195c9f6f3" [[package]] name = "unicode-width" -version = "0.1.8" +version = "0.1.10" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9337591893a19b88d8d87f2cec1e73fad5cdfd10e5a6f349f498ad6ea2ffb1e3" - -[[package]] -name = "unicode-xid" -version = "0.2.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f7fe0bb3479651439c9112f72b6c505038574c9fbb575ed1bf3b797fa39dd564" - -[[package]] -name = "url" -version = "2.2.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9ccd964113622c8e9322cfac19eb1004a07e636c545f325da085d5cdde6f1f8b" -dependencies = [ - "form_urlencoded", - "idna", - "matches", - "percent-encoding", -] +checksum = "c0edd1e5b14653f783770bce4a4dabb4a5108a5370a5f5d8cfe8710c361f6c8b" [[package]] name = "utf8-width" -version = "0.1.4" +version = "0.1.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9071ac216321a4470a69fb2b28cfc68dcd1a39acd877c8be8e014df6772d8efa" +checksum = "5190c9442dcdaf0ddd50f37420417d219ae5261bbf5db120d0f9bab996c9cba1" [[package]] name = "vec_map" @@ -862,9 +661,9 @@ checksum = "f1bddf1187be692e79c5ffeab891132dfb0f236ed36a43c7ed39f1165ee20191" [[package]] name = "walkdir" -version = "2.3.1" +version = "2.3.2" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "777182bc735b6424e1a57516d35ed72cb8019d85c8c9bf536dccb3445c1a2f7d" +checksum = "808cf2735cd4b6866113f648b791c6adc5714537bc222d9347bb203386ffda56" dependencies = [ "same-file", "winapi", @@ -873,21 +672,15 @@ dependencies = [ [[package]] name = "wasi" -version = "0.9.0+wasi-snapshot-preview1" +version = "0.11.0+wasi-snapshot-preview1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "cccddf32554fecc6acb585f82a32a72e28b48f8c4c1883ddfeeeaa96f7d8e519" - -[[package]] -name = "wasi" -version = "0.10.2+wasi-snapshot-preview1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fd6fbd9a79829dd1ad0cc20627bf1ed606756a7f77edff7b66b7064f9cb327c6" +checksum = "9c8d87e72b64a3b4db28d11ce29237c246188f4f51057d65a7eab63b7987e423" [[package]] name = "wasm-bindgen" -version = "0.2.71" +version = "0.2.83" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7ee1280240b7c461d6a0071313e08f34a60b0365f14260362e5a2b17d1d31aa7" +checksum = "eaf9f5aceeec8be17c128b2e93e031fb8a4d469bb9c4ae2d7dc1888b26887268" dependencies = [ "cfg-if", "wasm-bindgen-macro", @@ -895,13 +688,13 @@ dependencies = [ [[package]] name = "wasm-bindgen-backend" -version = "0.2.71" +version = "0.2.83" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5b7d8b6942b8bb3a9b0e73fc79b98095a27de6fa247615e59d096754a3bc2aa8" +checksum = "4c8ffb332579b0557b52d268b91feab8df3615f265d5270fec2a8c95b17c1142" dependencies = [ "bumpalo", - "lazy_static", "log", + "once_cell", "proc-macro2", "quote", "syn", @@ -910,9 +703,9 @@ dependencies = [ [[package]] name = "wasm-bindgen-macro" -version = "0.2.71" +version = "0.2.83" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e5ac38da8ef716661f0f36c0d8320b89028efe10c7c0afde65baffb496ce0d3b" +checksum = "052be0f94026e6cbc75cdefc9bae13fd6052cdcaf532fa6c45e7ae33a1e6c810" dependencies = [ "quote", 
"wasm-bindgen-macro-support", @@ -920,9 +713,9 @@ dependencies = [ [[package]] name = "wasm-bindgen-macro-support" -version = "0.2.71" +version = "0.2.83" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "cc053ec74d454df287b9374ee8abb36ffd5acb95ba87da3ba5b7d3fe20eb401e" +checksum = "07bc0c051dc5f23e307b13285f9d75df86bfdf816c5721e573dec1f9b8aa193c" dependencies = [ "proc-macro2", "quote", @@ -933,15 +726,15 @@ dependencies = [ [[package]] name = "wasm-bindgen-shared" -version = "0.2.71" +version = "0.2.83" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7d6f8ec44822dd71f5f221a5847fb34acd9060535c1211b70a05844c0f6383b1" +checksum = "1c38c045535d93ec4f0b4defec448e4291638ee608530863b1e2ba115d4fff7f" [[package]] name = "web-sys" -version = "0.3.48" +version = "0.3.60" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ec600b26223b2948cedfde2a0aa6756dcf1fef616f43d7b3097aaf53a6c4d92b" +checksum = "bcda906d8be16e728fd5adc5b729afad4e444e106ab28cd1c7256e54fa61510f" dependencies = [ "js-sys", "wasm-bindgen", @@ -960,12 +753,13 @@ dependencies = [ [[package]] name = "which" -version = "4.1.0" +version = "4.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b55551e42cbdf2ce2bedd2203d0cc08dba002c27510f86dab6d0ce304cba3dfe" +checksum = "1c831fbbee9e129a8cf93e7747a82da9d95ba8e16621cae60ec2cdc849bacb7b" dependencies = [ "either", "libc", + "once_cell", ] [[package]] diff --git a/cli/build.rs b/cli/build.rs index 1986e023..0ff98a81 100644 --- a/cli/build.rs +++ b/cli/build.rs @@ -66,7 +66,21 @@ fn read_git_sha() -> Option { // If we're on a branch, read the SHA from the ref file. 
if head_content.starts_with("ref: ") { head_content.replace_range(0.."ref: ".len(), ""); - let ref_filename = git_dir_path.join(&head_content); + let ref_filename = { + let file = git_dir_path.join(&head_content); + if file.is_file() { + file + } else { + let file = git_dir_path + .parent() // worktrees subfolder + .unwrap() + .parent() // original gitdir + .unwrap() + .join(&head_content); + assert!(file.is_file()); + file + } + }; if let Some(path) = ref_filename.to_str() { println!("cargo:rerun-if-changed={}", path); } From eb549a89ad33923f4680ddb9281be79186a32db9 Mon Sep 17 00:00:00 2001 From: Phil Freeman Date: Wed, 14 Dec 2022 09:43:58 -0800 Subject: [PATCH 005/347] fix: possible rollover of nanoseconds in clock.h --- lib/src/clock.h | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/lib/src/clock.h b/lib/src/clock.h index 94545f35..e6faa040 100644 --- a/lib/src/clock.h +++ b/lib/src/clock.h @@ -82,6 +82,10 @@ static inline TSClock clock_after(TSClock base, TSDuration duration) { TSClock result = base; result.tv_sec += duration / 1000000; result.tv_nsec += (duration % 1000000) * 1000; + if (result.tv_nsec >= 1000000000) { + result.tv_nsec -= 1000000000; + ++(result.tv_sec); + } return result; } From dddbc2d4f741597e212175c19644a473ec0170d2 Mon Sep 17 00:00:00 2001 From: Andrew Helwer Date: Sat, 20 Jun 2020 17:51:01 -0400 Subject: [PATCH 006/347] Added working commands for Windows users Windows users are likely to be using either Windows Terminal (which uses PowerShell) or PowerShell directly. 
--- docs/section-3-creating-parsers.md | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/docs/section-3-creating-parsers.md b/docs/section-3-creating-parsers.md index 07f9d865..d4c05f25 100644 --- a/docs/section-3-creating-parsers.md +++ b/docs/section-3-creating-parsers.md @@ -80,6 +80,11 @@ You can test this parser by creating a source file with the contents "hello" and echo 'hello' > example-file tree-sitter parse example-file ``` +Alternatively, in Windows PowerShell: +```pwsh +"hello" | Out-File example-file -Encoding utf8 +tree-sitter parse example-file +``` This should print the following: From b1024a14937efc2c3b63cdb5e13bc33141a2c0b6 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 2 Jan 2023 22:56:51 +0200 Subject: [PATCH 007/347] cli: Fix build.rs in case of the current branch ref was packed Support SHA lookup in .git/packed-refs --- cli/build.rs | 35 +++++++++++++++++++++++++++-------- 1 file changed, 27 insertions(+), 8 deletions(-) diff --git a/cli/build.rs b/cli/build.rs index 0ff98a81..74c6d833 100644 --- a/cli/build.rs +++ b/cli/build.rs @@ -1,3 +1,4 @@ +use std::ffi::OsStr; use std::path::{Path, PathBuf}; use std::{env, fs}; @@ -67,18 +68,36 @@ fn read_git_sha() -> Option { if head_content.starts_with("ref: ") { head_content.replace_range(0.."ref: ".len(), ""); let ref_filename = { + // Go to real non-worktree gitdir + let git_dir_path = git_dir_path + .parent() + .map(|p| { + p.file_name() + .map(|n| n == OsStr::new("worktrees")) + .and_then(|x| x.then(|| p.parent())) + }) + .flatten() + .flatten() + .unwrap_or(&git_dir_path); + let file = git_dir_path.join(&head_content); if file.is_file() { file } else { - let file = git_dir_path - .parent() // worktrees subfolder - .unwrap() - .parent() // original gitdir - .unwrap() - .join(&head_content); - assert!(file.is_file()); - file + let packed_refs = git_dir_path.join("packed-refs"); + if let Ok(packed_refs_content) = fs::read_to_string(&packed_refs) { + for line in 
packed_refs_content.lines() { + if let Some((hash, r#ref)) = line.split_once(' ') { + if r#ref == head_content { + if let Some(path) = packed_refs.to_str() { + println!("cargo:rerun-if-changed={}", path); + } + return Some(hash.to_string()); + } + } + } + } + return None; } }; if let Some(path) = ref_filename.to_str() { From 87a0517f3ce1d0eef47333dd50e8b25d932564c1 Mon Sep 17 00:00:00 2001 From: Andrew Helwer Date: Sat, 22 Jan 2022 10:16:32 -0500 Subject: [PATCH 008/347] Various updates to Creating Parsers docs * Documented test separator suffixes * Documented partial precedences field * Added external scanning to conflicting tokens rules * Added earliest starting position to conflicting tokens rules * Added note about lexical precedence vs. parse precedence * Added note about tree-sitter calling external scanner with all tokens marked valid during error recovery --- docs/section-3-creating-parsers.md | 49 ++++++++++++++++++++++++++---- 1 file changed, 43 insertions(+), 6 deletions(-) diff --git a/docs/section-3-creating-parsers.md b/docs/section-3-creating-parsers.md index d4c05f25..747238b4 100644 --- a/docs/section-3-creating-parsers.md +++ b/docs/section-3-creating-parsers.md @@ -157,6 +157,26 @@ func x() int { (return_statement (number))))) ``` +* If your language's syntax conflicts with the `===` and `---` test separators, you can optionally add an arbitrary identical suffix (in the below example, `|||`) to disambiguate them: + +``` +==================||| +Basic module +==================||| + +---- MODULE Test ---- +increment(n) == n + 1 +==== + +---||| + +(source_file + (module (identifier) + (operator (identifier) + (parameter_list (identifier)) + (plus (identifier_ref) (number))))) +``` + These tests are important. They serve as the parser's API documentation, and they can be run every time you change the grammar to verify that everything still parses correctly. 
By default, the `tree-sitter test` command runs all of the tests in your `corpus` or `test/corpus/` folder. To run a particular test, you can use the `-f` flag: @@ -227,6 +247,7 @@ In addition to the `name` and `rules` fields, grammars have a few other optional * **`inline`** - an array of rule names that should be automatically *removed* from the grammar by replacing all of their usages with a copy of their definition. This is useful for rules that are used in multiple places but for which you *don't* want to create syntax tree nodes at runtime. * **`conflicts`** - an array of arrays of rule names. Each inner array represents a set of rules that's involved in an *LR(1) conflict* that is *intended to exist* in the grammar. When these conflicts occur at runtime, Tree-sitter will use the GLR algorithm to explore all of the possible interpretations. If *multiple* parses end up succeeding, Tree-sitter will pick the subtree whose corresponding rule has the highest total *dynamic precedence*. * **`externals`** - an array of token names which can be returned by an [*external scanner*](#external-scanners). External scanners allow you to write custom C code which runs during the lexing process in order to handle lexical rules (e.g. Python's indentation tokens) that cannot be described by regular expressions. +* **`precedences`** - an array of array of strings, where each array of strings defines named precedence levels in descending order. These names can be used in the `prec` functions to define precedence relative only to other names in the array, rather than globally. Can only be used with parse precedence, not lexical precedence. * **`word`** - the name of a token that will match keywords for the purpose of the [keyword extraction](#keyword-extraction) optimization. * **`supertypes`** an array of hidden rule names which should be considered to be 'supertypes' in the generated [*node types* file][static-node-types]. 
@@ -503,17 +524,31 @@ Tree-sitter's parsing process is divided into two phases: parsing (which is desc ### Conflicting Tokens -Grammars often contain multiple tokens that can match the same characters. For example, a grammar might contain the tokens (`"if"` and `/[a-z]+/`). Tree-sitter differentiates between these conflicting tokens in a few ways: +Grammars often contain multiple tokens that can match the same characters. For example, a grammar might contain the tokens (`"if"` and `/[a-z]+/`). Tree-sitter differentiates between these conflicting tokens in a few ways. -1. **Context-aware Lexing** - Tree-sitter performs lexing on-demand, during the parsing process. At any given position in a source document, the lexer only tries to recognize tokens that are *valid* at that position in the document. +1. **External Scanning** - If your grammar has an external scanner and one or more tokens in your `externals` array are valid at the current location, your external scanner will always be called first to determine whether those tokens are present. -2. **Lexical Precedence** - When the precedence functions described [above](#the-grammar-dsl) are used within the `token` function, the given precedence values serve as instructions to the lexer. If there are two valid tokens that match the characters at a given position in the document, Tree-sitter will select the one with the higher precedence. +1. **Context-Aware Lexing** - Tree-sitter performs lexing on-demand, during the parsing process. At any given position in a source document, the lexer only tries to recognize tokens that are *valid* at that position in the document. -3. **Match Length** - If multiple valid tokens with the same precedence match the characters at a given position in a document, Tree-sitter will select the token that matches the [longest sequence of characters][longest-match]. +1. **Earliest Starting Position** - Tree-sitter will prefer tokens with an earlier starting position. 
This is most often seen with very permissive regular expressions similar to `/.*/`, which are greedy and will consume as much text as possible. In this example the regex would consume all text until hitting a newline - even if text on that line could be interpreted as a different token. -4. **Match Specificity** - If there are two valid tokens with the same precedence and which both match the same number of characters, Tree-sitter will prefer a token that is specified in the grammar as a `String` over a token specified as a `RegExp`. +1. **Explicit Lexical Precedence** - When the precedence functions described [above](#the-grammar-dsl) are used within the `token` function, the given precedence values serve as instructions to the lexer. If there are two valid tokens that match the characters at a given position in the document, Tree-sitter will select the one with the higher precedence. -5. **Rule Order** - If none of the above criteria can be used to select one token over another, Tree-sitter will prefer the token that appears earlier in the grammar. +1. **Match Length** - If multiple valid tokens with the same precedence match the characters at a given position in a document, Tree-sitter will select the token that matches the [longest sequence of characters][longest-match]. + +1. **Match Specificity** - If there are two valid tokens with the same precedence and which both match the same number of characters, Tree-sitter will prefer a token that is specified in the grammar as a `String` over a token specified as a `RegExp`. + +1. **Rule Order** - If none of the above criteria can be used to select one token over another, Tree-sitter will prefer the token that appears earlier in the grammar. + +### Lexical Precedence vs. Parse Precedence + +One common mistake involves not distinguishing lexical precedence from parse precedence. +Parse precedence determines which rule is chosen to interpret a given sequence of tokens. 
+Lexical precedence determines which token is chosen to interpret a given section of text. +It is a lower-level operation that is done first. +The above list fully capture tree-sitter's lexical precedence rules, and you will probably refer back to this section of the documentation more often than any other. +Most of the time when you really get stuck, you're dealing with a lexical precedence problem. +Pay particular attention to the difference in meaning between using `prec` inside the `token` function vs. outside of it. ### Keywords @@ -699,6 +734,8 @@ if (valid_symbols[INDENT] || valid_symbol[DEDENT]) { } ``` +Note that if a syntax error is encountered during regular parsing, tree-sitter's first action during error recovery will be to call your external scanner with all tokens marked valid. Your scanner should detect this case and handle it appropriately. + [ambiguous-grammar]: https://en.wikipedia.org/wiki/Ambiguous_grammar [antlr]: http://www.antlr.org/ [bison-dprec]: https://www.gnu.org/software/bison/manual/html_node/Generalized-LR-Parsing.html From 278ff01e71a8d798a19f85a61c10dd29e3e681c1 Mon Sep 17 00:00:00 2001 From: Andrew Helwer Date: Wed, 26 Jan 2022 18:57:32 -0500 Subject: [PATCH 009/347] Added additional documentation details * External scanners and infinite loops * Terminal keywords in externals array * Using error sentinel external token * Good practice to erase state variables in deserialize func * Emphasize external scanner is called first --- docs/section-3-creating-parsers.md | 25 ++++++++++++++++++++----- 1 file changed, 20 insertions(+), 5 deletions(-) diff --git a/docs/section-3-creating-parsers.md b/docs/section-3-creating-parsers.md index 747238b4..5677292f 100644 --- a/docs/section-3-creating-parsers.md +++ b/docs/section-3-creating-parsers.md @@ -548,7 +548,7 @@ Lexical precedence determines which token is chosen to interpret a given section It is a lower-level operation that is done first. 
The above list fully capture tree-sitter's lexical precedence rules, and you will probably refer back to this section of the documentation more often than any other. Most of the time when you really get stuck, you're dealing with a lexical precedence problem. -Pay particular attention to the difference in meaning between using `prec` inside the `token` function vs. outside of it. +Pay particular attention to the difference in meaning between using `prec` inside the `token` function versus outside of it. ### Keywords @@ -632,7 +632,7 @@ grammar({ Then, add another C or C++ source file to your project. Currently, its path must be `src/scanner.c` or `src/scanner.cc` for the CLI to recognize it. Be sure to add this file to the `sources` section of your `binding.gyp` file so that it will be included when your project is compiled by Node.js and uncomment the appropriate block in your `bindings/rust/build.rs` file so that it will be included in your Rust crate. -In this new source file, define an [`enum`][enum] type containing the names of all of your external tokens. The ordering of this enum must match the order in your grammar's `externals` array. +In this new source file, define an [`enum`][enum] type containing the names of all of your external tokens. The ordering of this enum must match the order in your grammar's `externals` array; the actual names do not matter. ```c #include @@ -695,6 +695,7 @@ void tree_sitter_my_language_external_scanner_deserialize( ``` This function should *restore* the state of your scanner based the bytes that were previously written by the `serialize` function. It is called with a pointer to your scanner, a pointer to the buffer of bytes, and the number of bytes that should be read. +It is good practice to explicitly erase your scanner state variables at the start of this function, before restoring their values from the byte buffer. #### Scan @@ -712,10 +713,11 @@ This function is responsible for recognizing external tokens. 
It should return ` * **`int32_t lookahead`** - The current next character in the input stream, represented as a 32-bit unicode code point. * **`TSSymbol result_symbol`** - The symbol that was recognized. Your scan function should *assign* to this field one of the values from the `TokenType` enum, described above. -* **`void (*advance)(TSLexer *, bool skip)`** - A function for advancing to the next character. If you pass `true` for the second argument, the current character will be treated as whitespace. +* **`void (*advance)(TSLexer *, bool skip)`** - A function for advancing to the next character. If you pass `true` for the second argument, the current character will be treated as whitespace; whitespace won't be included in the text range associated with tokens emitted by the external scanner. * **`void (*mark_end)(TSLexer *)`** - A function for marking the end of the recognized token. This allows matching tokens that require multiple characters of lookahead. By default (if you don't call `mark_end`), any character that you moved past using the `advance` function will be included in the size of the token. But once you call `mark_end`, then any later calls to `advance` will *not* increase the size of the returned token. You can call `mark_end` multiple times to increase the size of the token. * **`uint32_t (*get_column)(TSLexer *)`** - A function for querying the current column position of the lexer. It returns the number of codepoints since the start of the current line. The codepoint position is recalculated on every call to this function by reading from the start of the line. -* **`bool (*is_at_included_range_start)(TSLexer *)`** - A function for checking if the parser has just skipped some characters in the document. 
When parsing an embedded document using the `ts_parser_set_included_ranges` function (described in the [multi-language document section][multi-language-section]), your scanner may want to apply some special behavior when moving to a disjoint part of the document. For example, in [EJS documents][ejs], the JavaScript parser uses this function to enable inserting automatic semicolon tokens in between the code directives, delimited by `<%` and `%>`. +* **`bool (*is_at_included_range_start)(const TSLexer *)`** - A function for checking whether the parser has just skipped some characters in the document. When parsing an embedded document using the `ts_parser_set_included_ranges` function (described in the [multi-language document section][multi-language-section]), your scanner may want to apply some special behavior when moving to a disjoint part of the document. For example, in [EJS documents][ejs], the JavaScript parser uses this function to enable inserting automatic semicolon tokens in between the code directives, delimited by `<%` and `%>`. +* **`bool (*eof)(const TSLexer *)`** - A function for determining whether the lexer is at the end of the file. The value of `lookahead` will be `0` at the end of a file, but this function should be used instead of checking for that value because the `0` or "NUL" value is also a valid character that could be present in the file being parsed. The third argument to the `scan` function is an array of booleans that indicates which of your external tokens are currently expected by the parser. You should only look for a given token if it is valid according to this array. At the same time, you cannot backtrack, so you may need to combine certain pieces of logic. @@ -734,7 +736,20 @@ if (valid_symbols[INDENT] || valid_symbol[DEDENT]) { } ``` -Note that if a syntax error is encountered during regular parsing, tree-sitter's first action during error recovery will be to call your external scanner with all tokens marked valid. 
Your scanner should detect this case and handle it appropriately. +#### Other External Scanner Details + +If a token in your `externals` array is valid at the current position in the parse, your external scanner will be called first before anything else is done. +This means your external scanner functions as a powerful override of tree-sitter's lexing behavior, and can be used to solve problems that can't be cracked with ordinary lexical, parse, or dynamic precedence. + +If a syntax error is encountered during regular parsing, tree-sitter's first action during error recovery will be to call your external scanner's `scan` function with all tokens marked valid. +Your scanner should detect this case and handle it appropriately. +One simple method of detection is to add an unused token to the end of your `externals` array, for example `externals: $ => [$.token1, $.token2, $.error_sentinel]`, then check whether that token is marked valid to determine whether tree-sitter is in error correction mode. + +If you put terminal keywords in your `externals` array, for example `externals: $ => ['if', 'then', 'else']`, then any time those terminals are present in your grammar they will be tokenized by your external scanner. +It is equivalent to writing `externals: [$.if_keyword, $.then_keyword, $.else_keyword]` then using `alias($.if_keyword, 'if')` in your grammar. + +External scanners are a common cause of infinite loops. +Be very careful when emitting zero-width tokens from your external scanner, and if you consume characters in a loop be sure use the `eof` function to check whether you are at the end of the file. 
[ambiguous-grammar]: https://en.wikipedia.org/wiki/Ambiguous_grammar [antlr]: http://www.antlr.org/ From 19bd5868eb72ea3e72e29359a0f06056aa609140 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 6 Jan 2023 08:32:26 +0200 Subject: [PATCH 010/347] Fix wasm tests --- lib/binding_web/exports.json | 7 ++++--- lib/binding_web/test/parser-test.js | 2 +- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/lib/binding_web/exports.json b/lib/binding_web/exports.json index 3fe11cdf..d4b6eb5e 100644 --- a/lib/binding_web/exports.json +++ b/lib/binding_web/exports.json @@ -4,13 +4,14 @@ "_malloc", "_realloc", - "__ZNKSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE4copyEPcmm", "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE6__initEPKcm", - "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE7reserveEm", "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE9__grow_byEmmmmmm", "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE9push_backEc", - "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEED2Ev", "__ZNSt3__212basic_stringIwNS_11char_traitsIwEENS_9allocatorIwEEE9push_backEw", + "__ZNKSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE4copyEPcmm", + "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEE7reserveEm", + "__ZNSt3__212basic_stringIwNS_11char_traitsIwEENS_9allocatorIwEEE6resizeEmw", + "__ZNSt3__212basic_stringIcNS_11char_traitsIcEENS_9allocatorIcEEED2Ev", "__ZNSt3__212basic_stringIwNS_11char_traitsIwEENS_9allocatorIwEEED2Ev", "__ZdlPv", "__Znwm", diff --git a/lib/binding_web/test/parser-test.js b/lib/binding_web/test/parser-test.js index c76b49c7..fcd714b2 100644 --- a/lib/binding_web/test/parser-test.js +++ b/lib/binding_web/test/parser-test.js @@ -153,7 +153,7 @@ describe("Parser", () => { 'type: (primitive_type) ' + 'declarator: (init_declarator ' + 'declarator: (pointer_declarator declarator: (identifier)) ' + - 'value: 
(raw_string_literal))))' + 'value: (raw_string_literal delimiter: (raw_string_delimiter) (raw_string_content) (raw_string_delimiter)))))' ); }).timeout(5000); From 88fe1d00c42760beda7cc01f5259da3d7fc5265e Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 6 Jan 2023 08:15:15 +0200 Subject: [PATCH 011/347] Bump Emscripten version to 3.1.29 --- cli/emscripten-version | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/emscripten-version b/cli/emscripten-version index 199eda56..05b41fb6 100644 --- a/cli/emscripten-version +++ b/cli/emscripten-version @@ -1 +1 @@ -3.1.25 +3.1.29 From e733a07a5c0848e813a825a885f0c0dc0f04664b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 6 Jan 2023 08:46:43 +0200 Subject: [PATCH 012/347] Update CI action versions --- .github/workflows/ci.yml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index d494e236..71f4be63 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -26,7 +26,7 @@ jobs: - ubuntu-latest steps: - name: Checkout repo - uses: actions/checkout@v2 + uses: actions/checkout@v3 # Work around https://github.com/actions/cache/issues/403. 
- name: Use GNU tar @@ -40,7 +40,7 @@ jobs: - name: Cache artifacts id: cache - uses: actions/cache@v2 + uses: actions/cache@v3 with: path: | ~/.cargo/registry @@ -59,7 +59,7 @@ jobs: run: cargo fmt -- --check - name: Install emscripten - uses: mymindstorm/setup-emsdk@v10 + uses: mymindstorm/setup-emsdk@v11 with: version: ${{ env.EMSCRIPTEN_VERSION }} @@ -113,11 +113,11 @@ jobs: runs-on: windows-latest steps: - name: Checkout repo - uses: actions/checkout@v2 + uses: actions/checkout@v3 - name: Cache artifacts id: cache - uses: actions/cache@v2 + uses: actions/cache@v3 with: path: | ~/.cargo/registry From ad45f5cd2cabda2de406a480f6d660aa5c96a85b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 6 Jan 2023 06:05:07 +0200 Subject: [PATCH 013/347] Remove unused no-minimize arg for the generate command --- cli/src/main.rs | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/cli/src/main.rs b/cli/src/main.rs index ce6743bf..9e3331c0 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ -111,8 +111,7 @@ fn run() -> Result<()> { .long("report-states-for-rule") .value_name("rule-name") .takes_value(true), - ) - .arg(Arg::with_name("no-minimize").long("no-minimize")), + ), ) .subcommand( SubCommand::with_name("parse") From 5088781ef965c5cd7187c5308e3cb45f8f892860 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 6 Jan 2023 06:13:08 +0200 Subject: [PATCH 014/347] cli: add -b, --build flags for `tree-sitter generate` --- cli/src/main.rs | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/cli/src/main.rs b/cli/src/main.rs index 9e3331c0..a6e75bf5 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ -106,6 +106,11 @@ fn run() -> Result<()> { )), ) .arg(Arg::with_name("no-bindings").long("no-bindings")) + .arg( + Arg::with_name("build").long("build").short("b") + .help("Compile all defined languages in the current dir") + ) + .arg(&debug_build_arg) .arg( Arg::with_name("report-states-for-rule") .long("report-states-for-rule") @@ -269,6 
+274,8 @@ fn run() -> Result<()> { ("generate", Some(matches)) => { let grammar_path = matches.value_of("grammar-path"); + let debug_build = matches.is_present("debug-build"); + let build = matches.is_present("build"); let report_symbol_name = matches.value_of("report-states-for-rule").or_else(|| { if matches.is_present("report-states") { Some("") @@ -297,6 +304,10 @@ fn run() -> Result<()> { generate_bindings, report_symbol_name, )?; + if build { + loader.use_debug_build(debug_build); + loader.languages_at_path(¤t_dir)?; + } } ("test", Some(matches)) => { From 108d0ecede9312e88ac12475ffac62af9fba5dbf Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 6 Jan 2023 06:37:22 +0200 Subject: [PATCH 015/347] loader: add TREE_SITTER_LIBDIR; cli: add --libdir to `tree-sitter generate` Closes #1336 --- cli/loader/src/lib.rs | 11 +++++++---- cli/src/main.rs | 18 +++++++++++++++--- 2 files changed, 22 insertions(+), 7 deletions(-) diff --git a/cli/loader/src/lib.rs b/cli/loader/src/lib.rs index 6f8605f4..0f92b051 100644 --- a/cli/loader/src/lib.rs +++ b/cli/loader/src/lib.rs @@ -10,7 +10,7 @@ use std::path::{Path, PathBuf}; use std::process::Command; use std::sync::Mutex; use std::time::SystemTime; -use std::{fs, mem}; +use std::{env, fs, mem}; use tree_sitter::{Language, QueryError, QueryErrorKind}; use tree_sitter_highlight::HighlightConfiguration; use tree_sitter_tags::{Error as TagsError, TagsConfiguration}; @@ -108,9 +108,12 @@ unsafe impl Sync for Loader {} impl Loader { pub fn new() -> Result { - let parser_lib_path = dirs::cache_dir() - .ok_or(anyhow!("Cannot determine cache directory"))? - .join("tree-sitter/lib"); + let parser_lib_path = match env::var("TREE_SITTER_LIBDIR") { + Ok(path) => PathBuf::from(path), + _ => dirs::cache_dir() + .ok_or(anyhow!("Cannot determine cache directory"))? 
+ .join("tree-sitter/lib"), + }; Ok(Self::with_parser_lib_path(parser_lib_path)) } diff --git a/cli/src/main.rs b/cli/src/main.rs index a6e75bf5..c1dd2501 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ -1,7 +1,7 @@ use anyhow::{anyhow, Context, Result}; use clap::{App, AppSettings, Arg, SubCommand}; use glob::glob; -use std::path::Path; +use std::path::{Path, PathBuf}; use std::{env, fs, u64}; use tree_sitter_cli::{ generate, highlight, logger, parse, playground, query, tags, test, test_highlight, test_tags, @@ -107,10 +107,18 @@ fn run() -> Result<()> { ) .arg(Arg::with_name("no-bindings").long("no-bindings")) .arg( - Arg::with_name("build").long("build").short("b") - .help("Compile all defined languages in the current dir") + Arg::with_name("build") + .long("build") + .short("b") + .help("Compile all defined languages in the current dir"), ) .arg(&debug_build_arg) + .arg( + Arg::with_name("libdir") + .long("libdir") + .takes_value(true) + .value_name("path"), + ) .arg( Arg::with_name("report-states-for-rule") .long("report-states-for-rule") @@ -276,6 +284,7 @@ fn run() -> Result<()> { let grammar_path = matches.value_of("grammar-path"); let debug_build = matches.is_present("debug-build"); let build = matches.is_present("build"); + let libdir = matches.value_of("libdir"); let report_symbol_name = matches.value_of("report-states-for-rule").or_else(|| { if matches.is_present("report-states") { Some("") @@ -305,6 +314,9 @@ fn run() -> Result<()> { report_symbol_name, )?; if build { + if let Some(path) = libdir { + loader = loader::Loader::with_parser_lib_path(PathBuf::from(path)); + } loader.use_debug_build(debug_build); loader.languages_at_path(¤t_dir)?; } From 9ac55f79d191f6fa200b1894ddac449fa3df70c1 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 8 Jan 2023 04:39:46 +0200 Subject: [PATCH 016/347] Update Makefile VERSION to 0.20.9 from lib/Cargo.toml Closes #1158 Closes #1608 --- Makefile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff 
--git a/Makefile b/Makefile index 764f411a..69f6f590 100644 --- a/Makefile +++ b/Makefile @@ -1,4 +1,4 @@ -VERSION := 0.6.3 +VERSION := 0.20.9 # install directory layout PREFIX ?= /usr/local From 61b85b2664488bee81e36b1d145bea2d24b871c5 Mon Sep 17 00:00:00 2001 From: Boris Verkhovskiy Date: Sun, 8 Jan 2023 08:10:14 -0700 Subject: [PATCH 017/347] Make error message more specific --- cli/src/wasm.rs | 5 +++++ script/build-wasm | 6 +++++- 2 files changed, 10 insertions(+), 1 deletion(-) diff --git a/cli/src/wasm.rs b/cli/src/wasm.rs index f31ac2d2..467fef71 100644 --- a/cli/src/wasm.rs +++ b/cli/src/wasm.rs @@ -65,6 +65,11 @@ pub fn compile_language_to_wasm(language_dir: &Path, force_docker: bool) -> Resu // Run `emcc` in a container using the `emscripten-slim` image command.args(&[EMSCRIPTEN_TAG, "emcc"]); } else { + if force_docker { + return Err(anyhow!( + "You must have docker on your PATH to run this command with --docker" + )); + } return Err(anyhow!( "You must have either emcc or docker on your PATH to run this command" )); diff --git a/script/build-wasm b/script/build-wasm index f95c3f15..dc42895a 100755 --- a/script/build-wasm +++ b/script/build-wasm @@ -71,7 +71,11 @@ elif which docker > /dev/null; then emscripten/emsdk:$emscripen_version \ emcc" else - echo 'You must have either `docker` or `emcc` on your PATH to run this script' + if [[ "$force_docker" == "1" ]]; then + echo 'You must have `docker` on your PATH to run this script with --docker' + else + echo 'You must have either `docker` or `emcc` on your PATH to run this script' + fi exit 1 fi From c7d431b53ed6e7b08d73d237cba960da1d437e62 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 10 Jan 2023 10:44:20 +0200 Subject: [PATCH 018/347] Add setting TREE_SITTER_DEBUG in the test subcommand Were asked in #1218 --- cli/src/main.rs | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/cli/src/main.rs b/cli/src/main.rs index c1dd2501..e0625708 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ 
-329,6 +329,11 @@ fn run() -> Result<()> { let update = matches.is_present("update"); let filter = matches.value_of("filter"); + if debug { + // For augmenting debug logging in external scanners + env::set_var("TREE_SITTER_DEBUG", "1"); + } + loader.use_debug_build(debug_build); let languages = loader.languages_at_path(&current_dir)?; From f627a97d24b8908110fe536f13b2c08b7a59efc2 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 11 Jan 2023 04:11:04 +0200 Subject: [PATCH 019/347] loader: use portable way of path joining --- cli/config/src/lib.rs | 6 ++++-- cli/loader/src/lib.rs | 3 ++- 2 files changed, 6 insertions(+), 3 deletions(-) diff --git a/cli/config/src/lib.rs b/cli/config/src/lib.rs index 0a5eba54..678688fe 100644 --- a/cli/config/src/lib.rs +++ b/cli/config/src/lib.rs @@ -37,7 +37,8 @@ impl Config { let legacy_path = dirs::home_dir() .ok_or(anyhow!("Cannot determine home directory"))? - .join(".tree-sitter/config.json"); + .join(".tree-sitter") + .join("config.json"); if legacy_path.is_file() { return Ok(Some(legacy_path)); } @@ -48,7 +49,8 @@ impl Config { fn xdg_config_file() -> Result { let xdg_path = dirs::config_dir() .ok_or(anyhow!("Cannot determine config directory"))? - .join("tree-sitter/config.json"); + .join("tree-sitter") + .join("config.json"); Ok(xdg_path) } diff --git a/cli/loader/src/lib.rs b/cli/loader/src/lib.rs index 0f92b051..029da451 100644 --- a/cli/loader/src/lib.rs +++ b/cli/loader/src/lib.rs @@ -112,7 +112,8 @@ impl Loader { Ok(path) => PathBuf::from(path), _ => dirs::cache_dir() .ok_or(anyhow!("Cannot determine cache directory"))?
- .join("tree-sitter/lib"), + .join("tree-sitter") + .join("lib"), }; Ok(Self::with_parser_lib_path(parser_lib_path)) } From ca38c32d368ffd84e686b0cf41fef754044351a9 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 14 Jan 2023 08:58:25 +0200 Subject: [PATCH 020/347] Exclude huge generated files from `git diff` output --- .gitattributes | 3 +++ 1 file changed, 3 insertions(+) diff --git a/.gitattributes b/.gitattributes index 4fcce330..44bf45c7 100644 --- a/.gitattributes +++ b/.gitattributes @@ -1,2 +1,5 @@ /lib/src/unicode/*.h linguist-vendored /lib/src/unicode/LICENSE linguist-vendored + +/cli/src/generate/prepare_grammar/*.json -diff +Cargo.lock -diff From 5c1ca5adb0d007d6e68885601127fcbce0288c3f Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 15 Jan 2023 03:07:53 +0200 Subject: [PATCH 021/347] cli: produce smaller release binary by stripping debug info --- Cargo.toml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/Cargo.toml b/Cargo.toml index 38830584..d1e57f89 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -2,3 +2,6 @@ default-members = ["cli"] members = ["cli", "lib"] + +[profile.release] +strip = true From 7a56f0815436fadb93ad8f3e277aa4c6c44e7954 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 15 Jan 2023 04:08:03 +0200 Subject: [PATCH 022/347] ci: bump setup-emsdk action version to @v12 --- .github/workflows/ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 71f4be63..1f5edc96 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -59,7 +59,7 @@ jobs: run: cargo fmt -- --check - name: Install emscripten - uses: mymindstorm/setup-emsdk@v11 + uses: mymindstorm/setup-emsdk@v12 with: version: ${{ env.EMSCRIPTEN_VERSION }} From ced103b519ea31eca559f4252798901a03e27fa3 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 15 Jan 2023 04:07:29 +0200 Subject: [PATCH 023/347] ci: rustup install rustfmt and clippy --- 
.github/workflows/ci.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 1f5edc96..e6ef591a 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -54,6 +54,7 @@ jobs: with: toolchain: stable profile: minimal + components: rustfmt, clippy - name: Check Rust code formatting run: cargo fmt -- --check From adeb8d0aa9af9d4472316d74dcc0c809ac3654b6 Mon Sep 17 00:00:00 2001 From: sogaiu <983021772@users.noreply.github.com> Date: Mon, 16 Jan 2023 14:34:19 +0900 Subject: [PATCH 024/347] cli: Make init-config respect TREE_SITTER_DIR --- cli/config/src/lib.rs | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/cli/config/src/lib.rs b/cli/config/src/lib.rs index 678688fe..27b2dfb6 100644 --- a/cli/config/src/lib.rs +++ b/cli/config/src/lib.rs @@ -81,7 +81,13 @@ impl Config { /// /// (Note that this is typically only done by the `tree-sitter init-config` command.) pub fn initial() -> Result { - let location = Self::xdg_config_file()?; + let location = if let Ok(path) = env::var("TREE_SITTER_DIR") { + let mut path = PathBuf::from(path); + path.push("config.json"); + path + } else { + Self::xdg_config_file()? 
+ }; let config = serde_json::json!({}); Ok(Config { location, config }) } From 23ce370fa3607ab1fed4e60aebd6c0d2e6744376 Mon Sep 17 00:00:00 2001 From: sogaiu <983021772@users.noreply.github.com> Date: Mon, 16 Jan 2023 14:24:16 +0900 Subject: [PATCH 025/347] cli: Stop config.json search sooner if TREE_SITTER_DIR set --- cli/config/src/lib.rs | 3 +++ 1 file changed, 3 insertions(+) diff --git a/cli/config/src/lib.rs b/cli/config/src/lib.rs index 27b2dfb6..3cd09b8d 100644 --- a/cli/config/src/lib.rs +++ b/cli/config/src/lib.rs @@ -25,6 +25,9 @@ impl Config { if let Ok(path) = env::var("TREE_SITTER_DIR") { let mut path = PathBuf::from(path); path.push("config.json"); + if !path.exists() { + return Ok(None); + } if path.is_file() { return Ok(Some(path)); } From ae3b60bd29e301a99568f5c20d46e83bbccfda68 Mon Sep 17 00:00:00 2001 From: Matt <85322+mattmassicotte@users.noreply.github.com> Date: Tue, 17 Jan 2023 09:14:57 -0500 Subject: [PATCH 026/347] Include many new parsers in a unified list --- docs/index.md | 75 ++++++++++++++++++++++++++++++++------------------- 1 file changed, 47 insertions(+), 28 deletions(-) diff --git a/docs/index.md b/docs/index.md index 1c4f958a..6602c25e 100644 --- a/docs/index.md +++ b/docs/index.md @@ -27,77 +27,96 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [Kotlin](https://github.com/oxisto/kotlintree) * [Java](https://github.com/serenadeai/java-tree-sitter) -### Available Parsers - -Parsers for these languages are fairly complete: +### Parsers +* [Agda](https://github.com/tree-sitter/tree-sitter-agda) * [Bash](https://github.com/tree-sitter/tree-sitter-bash) -* [C](https://github.com/tree-sitter/tree-sitter-c) * [C#](https://github.com/tree-sitter/tree-sitter-c-sharp) * [C++](https://github.com/tree-sitter/tree-sitter-cpp) +* [Clojure](https://github.com/sogaiu/tree-sitter-clojure) +* [CMake](https://github.com/uyha/tree-sitter-cmake) +* [Comment](https://github.com/stsewd/tree-sitter-comment) * 
[Common Lisp](https://github.com/theHamsta/tree-sitter-commonlisp) * [CSS](https://github.com/tree-sitter/tree-sitter-css) * [CUDA](https://github.com/theHamsta/tree-sitter-cuda) -* [D](https://github.com/gdamore/tree-sitter-d) +* [C](https://github.com/tree-sitter/tree-sitter-c) +* [Dart](https://github.com/UserNobody14/tree-sitter-dart) +* [Dockerfile](https://github.com/camdencheek/tree-sitter-dockerfile) +* [Dockerfile](https://github.com/camdencheek/tree-sitter-dockerfile) * [DOT](https://github.com/rydesun/tree-sitter-dot) +* [D](https://github.com/gdamore/tree-sitter-d) +* [Elixir](https://github.com/elixir-lang/tree-sitter-elixir) * [Elm](https://github.com/elm-tooling/tree-sitter-elm) * [Emacs Lisp](https://github.com/Wilfred/tree-sitter-elisp) * [Eno](https://github.com/eno-lang/tree-sitter-eno) * [ERB / EJS](https://github.com/tree-sitter/tree-sitter-embedded-template) * [Erlang](https://github.com/WhatsApp/tree-sitter-erlang/) * [Fennel](https://github.com/travonted/tree-sitter-fennel) +* [Fish](https://github.com/ram02z/tree-sitter-fish) +* [Fortran](https://github.com/stadelmanma/tree-sitter-fortran) +* [gitattributes](https://github.com/ObserverOfTime/tree-sitter-gitattributes) +* [gitignore](https://github.com/shunsambongi/tree-sitter-gitignore) * [GLSL (OpenGL Shading Language)](https://github.com/theHamsta/tree-sitter-glsl) +* [Go mod](https://github.com/camdencheek/tree-sitter-go-mod) +* [Go work](https://github.com/omertuc/tree-sitter-go-work) * [Go](https://github.com/tree-sitter/tree-sitter-go) +* [Graphql](https://github.com/bkegley/tree-sitter-graphql) +* [Hack](https://github.com/slackhq/tree-sitter-hack) +* [Haskell](https://github.com/tree-sitter/tree-sitter-haskell) * [HCL](https://github.com/MichaHoffmann/tree-sitter-hcl) * [HTML](https://github.com/tree-sitter/tree-sitter-html) -* [Java](https://github.com/tree-sitter/tree-sitter-java) * [JavaScript](https://github.com/tree-sitter/tree-sitter-javascript) +* 
[Java](https://github.com/tree-sitter/tree-sitter-java) +* [JSON5](https://github.com/Joakker/tree-sitter-json5) * [JSON](https://github.com/tree-sitter/tree-sitter-json) +* [Julia](https://github.com/tree-sitter/tree-sitter-julia) +* [Kotlin](https://github.com/fwcd/tree-sitter-kotlin) +* [Latex](https://github.com/latex-lsp/tree-sitter-latex) +* [LLVM](https://github.com/benwilliamgraham/tree-sitter-llvm) * [Lua](https://github.com/Azganoth/tree-sitter-lua) * [Make](https://github.com/alemuller/tree-sitter-make) * [Markdown](https://github.com/ikatyang/tree-sitter-markdown) +* [Markdown](https://github.com/MDeiml/tree-sitter-markdown) +* [Nix](https://github.com/cstrahan/tree-sitter-nix) +* [Objective-C](https://github.com/jiyee/tree-sitter-objc) * [OCaml](https://github.com/tree-sitter/tree-sitter-ocaml) +* [Org](https://github.com/milisims/tree-sitter-org) +* [Pascal](https://github.com/Isopod/tree-sitter-pascal) +* [Perl](https://github.com/ganezdragon/tree-sitter-perl) * [PHP](https://github.com/tree-sitter/tree-sitter-php) +* [PowerShell](https://github.com/PowerShell/tree-sitter-PowerShell) +* [Protocol Buffers](https://github.com/mitchellh/tree-sitter-proto) * [Python](https://github.com/tree-sitter/tree-sitter-python) +* [Racket](https://github.com/6cdh/tree-sitter-racket) +* [Regex](https://github.com/tree-sitter/tree-sitter-regex) +* [reStructuredText](https://github.com/stsewd/tree-sitter-rst) * [Ruby](https://github.com/tree-sitter/tree-sitter-ruby) * [Rust](https://github.com/tree-sitter/tree-sitter-rust) * [R](https://github.com/r-lib/tree-sitter-r) * [S-expressions](https://github.com/AbstractMachinesLab/tree-sitter-sexp) +* [Scala](https://github.com/tree-sitter/tree-sitter-scala) +* [Scheme](https://github.com/6cdh/tree-sitter-scheme) +* [Scss](https://github.com/serenadeai/tree-sitter-scss) +* [Sourcepawn](https://github.com/nilshelmig/tree-sitter-sourcepawn) * [SPARQL](https://github.com/BonaBeavis/tree-sitter-sparql) +* 
[SQL-PostgreSQL](https://github.com/m-novikov/tree-sitter-sql) +* [SQL-Sqlite](https://github.com/dhcmrlchtdj/tree-sitter-sqlite) +* [SSH](https://github.com/metio/tree-sitter-ssh-client-config) * [Svelte](https://github.com/Himujjal/tree-sitter-svelte) * [Swift](https://github.com/alex-pinkus/tree-sitter-swift) * [SystemRDL](https://github.com/SystemRDL/tree-sitter-systemrdl) * [TOML](https://github.com/ikatyang/tree-sitter-toml) +* [Tree-sitter query](https://github.com/nvim-treesitter/tree-sitter-query) * [Turtle](https://github.com/BonaBeavis/tree-sitter-turtle) * [Twig](https://github.com/gbprod/tree-sitter-twig) * [TypeScript](https://github.com/tree-sitter/tree-sitter-typescript) * [Verilog](https://github.com/tree-sitter/tree-sitter-verilog) * [VHDL](https://github.com/alemuller/tree-sitter-vhdl) * [Vue](https://github.com/ikatyang/tree-sitter-vue) -* [YAML](https://github.com/ikatyang/tree-sitter-yaml) * [WASM](https://github.com/wasm-lsp/tree-sitter-wasm) * [WGSL WebGPU Shading Language](https://github.com/mehmetoguzderin/tree-sitter-wgsl) - -Parsers for these languages are in development: - -* [Agda](https://github.com/tree-sitter/tree-sitter-agda) -* [Elixir](https://github.com/elixir-lang/tree-sitter-elixir) -* [Dockerfile](https://github.com/camdencheek/tree-sitter-dockerfile) -* [Go mod](https://github.com/camdencheek/tree-sitter-go-mod) -* [Hack](https://github.com/slackhq/tree-sitter-hack) -* [Haskell](https://github.com/tree-sitter/tree-sitter-haskell) -* [Julia](https://github.com/tree-sitter/tree-sitter-julia) -* [Kotlin](https://github.com/fwcd/tree-sitter-kotlin) -* [Nix](https://github.com/cstrahan/tree-sitter-nix) -* [Objective-C](https://github.com/jiyee/tree-sitter-objc) -* [Org](https://github.com/milisims/tree-sitter-org) -* [Perl](https://github.com/ganezdragon/tree-sitter-perl) -* [Protocol Buffers](https://github.com/mitchellh/tree-sitter-proto) -* [Racket](https://github.com/6cdh/tree-sitter-racket) -* 
[Scala](https://github.com/tree-sitter/tree-sitter-scala) -* [Sourcepawn](https://github.com/nilshelmig/tree-sitter-sourcepawn) -* [SQL](https://github.com/m-novikov/tree-sitter-sql) - +* [YAML](https://github.com/ikatyang/tree-sitter-yaml) +* [Zig](https://github.com/maxxnino/tree-sitter-zig) ### Talks on Tree-sitter From cca626afe786dd1c1c0bf3609f81621165dabac1 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 27 Jan 2023 07:49:07 +0200 Subject: [PATCH 027/347] docs: remove duplicated link --- docs/index.md | 1 - 1 file changed, 1 deletion(-) diff --git a/docs/index.md b/docs/index.md index 6602c25e..097f0241 100644 --- a/docs/index.md +++ b/docs/index.md @@ -42,7 +42,6 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [C](https://github.com/tree-sitter/tree-sitter-c) * [Dart](https://github.com/UserNobody14/tree-sitter-dart) * [Dockerfile](https://github.com/camdencheek/tree-sitter-dockerfile) -* [Dockerfile](https://github.com/camdencheek/tree-sitter-dockerfile) * [DOT](https://github.com/rydesun/tree-sitter-dot) * [D](https://github.com/gdamore/tree-sitter-d) * [Elixir](https://github.com/elixir-lang/tree-sitter-elixir) From 2e732d17ddfa0360668c029fac0f3c0b9bc083a5 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 27 Jan 2023 10:15:23 +0200 Subject: [PATCH 028/347] docs: merge of all binding and grammar link PRs MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Joined commit messages: --- Closes: #2048 docs: add capnp, smali, thrift Closes: #2026 Add Perl binding Closes: #1989 Add Ada to the list of available parsers Closes: #1980 Add clojure to list of available parsers After some discussion in https://github.com/sogaiu/tree-sitter-clojure/issues/28 I decided to submit an issue to the tree-sitter organization to include tree-sitter-clojure in their list of available parsers. 
This repository is used by a couple of editors and tools, and I am using it to build a tree-sitter based programming mode for Clojure in Emacs. Since there are a couple of tools that depend on it, it seems worthy of inclusion in an official list of tree-sitter grammars. Closes: #1943 Add meson grammar to list. Closes: #1926 docs(meson): add parse for meson add meson Closes: #1912 Merge branch 'master' into add-heex-parser Closes: #1908 Add Apex to available parsers Closes: #1876 Add tree-sitter-gleam to list of available parsers Closes: #1862 DOCS: Add entries various SQL flavor parsers Closes: #1857 Add Go to the available language bindings Closes: #1856 docs: add jq grammar Closes: #1828 Add tree sitter lalrpop This is a parser for https://github.com/lalrpop/lalrpop, a parser generator for use in Rust. It is still in development because it should support some kind of highlighting of the pseudo rust code used in rules. Closes: #1733 Add YANG parser to parser list I wrote this parser over summer vacation last year and I've been using it at work every day since. Closes: #1728 Add link to m68k grammar Link to m68k (Motorola 68000 assembly) grammar in docs. Closes: #1697 Added rego language Closes: #1694 docs: add Formula parser Closes: #1672 docs: Add link to QML (Qt UI spec/programming language) parser Closes: #1671 parser: add beancount parser link Closes: #1623 Add link to llvm grammars Add links to LLVM IR, MIR and TableGen parsers. Closes: #1579 Add my Smali parser to the WIP list Closes: #1575 Update index.md Closes: #1563 Add re2c and sort alphabetically Added re2c parser (lexer generator). Sorted the list alphabetically case-insensitively. Closes: #1209 add link to chess Portable Game Notation grammar Closes: #1176 Add tree-sitter-lean. 
Closes: #1123 Add parsers to list --- Co-authored-by: Amaan Qureshi Co-authored-by: Felipe Gasper Co-authored-by: Emmanuel Briot Co-authored-by: Danny Freeman Co-authored-by: Garrett D'Amore Co-authored-by: ShootingStarDragons Co-authored-by: Clay Co-authored-by: Anthony Heber Co-authored-by: Jonathan Arnett Co-authored-by: takegue Co-authored-by: Cédric Fabianski Co-authored-by: flurie Co-authored-by: traxys Co-authored-by: Tomas Sandven <597206+Hubro@users.noreply.github.com> Co-authored-by: Graham Bates Co-authored-by: Lex Co-authored-by: Ben Siraphob Co-authored-by: Yuya Nishihara Co-authored-by: WeiZhang Co-authored-by: Flakebi Co-authored-by: Yotam Co-authored-by: Fymyte <34305318+Fymyte@users.noreply.github.com> Co-authored-by: Alexandre A. Muller Co-authored-by: Roland Walker Co-authored-by: Julian Berman Co-authored-by: Santos Gallegos --- docs/index.md | 51 ++++++++++++++++++++++++++++++++++++++++----------- 1 file changed, 40 insertions(+), 11 deletions(-) diff --git a/docs/index.md b/docs/index.md index 097f0241..2e3b59ed 100644 --- a/docs/index.md +++ b/docs/index.md @@ -9,19 +9,22 @@ Tree-sitter is a parser generator tool and an incremental parsing library. 
It ca * **General** enough to parse any programming language * **Fast** enough to parse on every keystroke in a text editor * **Robust** enough to provide useful results even in the presence of syntax errors -* **Dependency-free** so that the runtime library (which is written in pure C) can be embedded in any application +* **Dependency-free** so that the runtime library (which is written in pure [C](https://github.com/tree-sitter/tree-sitter/tree/master/lib)) can be embedded in any application ### Language Bindings There are currently bindings that allow Tree-sitter to be used from the following languages: +* [Go](https://github.com/smacker/go-tree-sitter) * [Haskell](https://github.com/tree-sitter/haskell-tree-sitter) * [JavaScript (Node.js)](https://github.com/tree-sitter/node-tree-sitter) * [JavaScript (Wasm)](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_web) * [Lua](https://github.com/euclidianAce/ltreesitter) * [OCaml](https://github.com/returntocorp/ocaml-tree-sitter-core) +* [Perl](https://metacpan.org/pod/Text::Treesitter) * [Python](https://github.com/tree-sitter/py-tree-sitter) * [Ruby](https://github.com/tree-sitter/ruby-tree-sitter) +* [Ruby](https://github.com/calicoday/ruby-tree-sitter-ffi) * [Rust](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_rust) * [Swift](https://github.com/ChimeHQ/SwiftTreeSitter) * [Kotlin](https://github.com/oxisto/kotlintree) @@ -29,21 +32,25 @@ There are currently bindings that allow Tree-sitter to be used from the followin ### Parsers +* [Ada](https://github.com/briot/tree-sitter-ada) * [Agda](https://github.com/tree-sitter/tree-sitter-agda) +* [Apex](https://github.com/aheber/tree-sitter-sfapex) * [Bash](https://github.com/tree-sitter/tree-sitter-bash) -* [C#](https://github.com/tree-sitter/tree-sitter-c-sharp) +* [Beancount](https://github.com/zwpaper/tree-sitter-beancount) +* [Cap'n Proto](https://github.com/amaanq/tree-sitter-capnp) +* 
[C](https://github.com/tree-sitter/tree-sitter-c) * [C++](https://github.com/tree-sitter/tree-sitter-cpp) +* [C#](https://github.com/tree-sitter/tree-sitter-c-sharp) * [Clojure](https://github.com/sogaiu/tree-sitter-clojure) * [CMake](https://github.com/uyha/tree-sitter-cmake) * [Comment](https://github.com/stsewd/tree-sitter-comment) * [Common Lisp](https://github.com/theHamsta/tree-sitter-commonlisp) * [CSS](https://github.com/tree-sitter/tree-sitter-css) * [CUDA](https://github.com/theHamsta/tree-sitter-cuda) -* [C](https://github.com/tree-sitter/tree-sitter-c) * [Dart](https://github.com/UserNobody14/tree-sitter-dart) +* [D](https://github.com/gdamore/tree-sitter-d) * [Dockerfile](https://github.com/camdencheek/tree-sitter-dockerfile) * [DOT](https://github.com/rydesun/tree-sitter-dot) -* [D](https://github.com/gdamore/tree-sitter-d) * [Elixir](https://github.com/elixir-lang/tree-sitter-elixir) * [Elm](https://github.com/elm-tooling/tree-sitter-elm) * [Emacs Lisp](https://github.com/Wilfred/tree-sitter-elisp) @@ -52,60 +59,81 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [Erlang](https://github.com/WhatsApp/tree-sitter-erlang/) * [Fennel](https://github.com/travonted/tree-sitter-fennel) * [Fish](https://github.com/ram02z/tree-sitter-fish) +* [Formula](https://github.com/siraben/tree-sitter-formula) * [Fortran](https://github.com/stadelmanma/tree-sitter-fortran) * [gitattributes](https://github.com/ObserverOfTime/tree-sitter-gitattributes) * [gitignore](https://github.com/shunsambongi/tree-sitter-gitignore) +* [Gleam](https://github.com/gleam-lang/tree-sitter-gleam) * [GLSL (OpenGL Shading Language)](https://github.com/theHamsta/tree-sitter-glsl) +* [Go](https://github.com/tree-sitter/tree-sitter-go) * [Go mod](https://github.com/camdencheek/tree-sitter-go-mod) * [Go work](https://github.com/omertuc/tree-sitter-go-work) -* [Go](https://github.com/tree-sitter/tree-sitter-go) * 
[Graphql](https://github.com/bkegley/tree-sitter-graphql) * [Hack](https://github.com/slackhq/tree-sitter-hack) * [Haskell](https://github.com/tree-sitter/tree-sitter-haskell) * [HCL](https://github.com/MichaHoffmann/tree-sitter-hcl) * [HTML](https://github.com/tree-sitter/tree-sitter-html) -* [JavaScript](https://github.com/tree-sitter/tree-sitter-javascript) * [Java](https://github.com/tree-sitter/tree-sitter-java) +* [JavaScript](https://github.com/tree-sitter/tree-sitter-javascript) +* [jq](https://github.com/flurie/tree-sitter-jq) * [JSON5](https://github.com/Joakker/tree-sitter-json5) * [JSON](https://github.com/tree-sitter/tree-sitter-json) * [Julia](https://github.com/tree-sitter/tree-sitter-julia) * [Kotlin](https://github.com/fwcd/tree-sitter-kotlin) +* [LALRPOP](https://github.com/traxys/tree-sitter-lalrpop) * [Latex](https://github.com/latex-lsp/tree-sitter-latex) +* [Lean](https://github.com/Julian/tree-sitter-lean) * [LLVM](https://github.com/benwilliamgraham/tree-sitter-llvm) +* [LLVM MachineIR](https://github.com/Flakebi/tree-sitter-llvm-mir) +* [LLVM TableGen](https://github.com/Flakebi/tree-sitter-tablegen) * [Lua](https://github.com/Azganoth/tree-sitter-lua) * [Make](https://github.com/alemuller/tree-sitter-make) * [Markdown](https://github.com/ikatyang/tree-sitter-markdown) * [Markdown](https://github.com/MDeiml/tree-sitter-markdown) +* [Meson](https://github.com/Decodetalkers/tree-sitter-meson) +* [Meson](https://github.com/staysail/tree-sitter-meson) +* [Motorola 68000 Assembly](https://github.com/grahambates/tree-sitter-m68k) * [Nix](https://github.com/cstrahan/tree-sitter-nix) * [Objective-C](https://github.com/jiyee/tree-sitter-objc) * [OCaml](https://github.com/tree-sitter/tree-sitter-ocaml) * [Org](https://github.com/milisims/tree-sitter-org) * [Pascal](https://github.com/Isopod/tree-sitter-pascal) * [Perl](https://github.com/ganezdragon/tree-sitter-perl) +* [Perl](https://github.com/tree-sitter-perl/tree-sitter-perl) +* [Perl 
POD](https://github.com/tree-sitter-perl/tree-sitter-pod) * [PHP](https://github.com/tree-sitter/tree-sitter-php) +* [Portable Game Notation](https://github.com/rolandwalker/tree-sitter-pgn) * [PowerShell](https://github.com/PowerShell/tree-sitter-PowerShell) * [Protocol Buffers](https://github.com/mitchellh/tree-sitter-proto) * [Python](https://github.com/tree-sitter/tree-sitter-python) +* [QML](https://github.com/yuja/tree-sitter-qmljs) * [Racket](https://github.com/6cdh/tree-sitter-racket) +* [Rasi](https://github.com/Fymyte/tree-sitter-rasi) +* [re2c](https://github.com/alemuller/tree-sitter-re2c) * [Regex](https://github.com/tree-sitter/tree-sitter-regex) +* [Rego](https://github.com/FallenAngel97/tree-sitter-rego) * [reStructuredText](https://github.com/stsewd/tree-sitter-rst) +* [R](https://github.com/r-lib/tree-sitter-r) * [Ruby](https://github.com/tree-sitter/tree-sitter-ruby) * [Rust](https://github.com/tree-sitter/tree-sitter-rust) -* [R](https://github.com/r-lib/tree-sitter-r) -* [S-expressions](https://github.com/AbstractMachinesLab/tree-sitter-sexp) * [Scala](https://github.com/tree-sitter/tree-sitter-scala) * [Scheme](https://github.com/6cdh/tree-sitter-scheme) * [Scss](https://github.com/serenadeai/tree-sitter-scss) +* [S-expressions](https://github.com/AbstractMachinesLab/tree-sitter-sexp) +* [Smali](https://github.com/amaanq/tree-sitter-smali) +* [Smali](https://git.sr.ht/~yotam/tree-sitter-smali) * [Sourcepawn](https://github.com/nilshelmig/tree-sitter-sourcepawn) * [SPARQL](https://github.com/BonaBeavis/tree-sitter-sparql) -* [SQL-PostgreSQL](https://github.com/m-novikov/tree-sitter-sql) -* [SQL-Sqlite](https://github.com/dhcmrlchtdj/tree-sitter-sqlite) +* [SQL - BigQuery](https://github.com/takegue/tree-sitter-sql-bigquery) +* [SQL - PostgreSQL](https://github.com/m-novikov/tree-sitter-sql) +* [SQL - SQLite](https://github.com/dhcmrlchtdj/tree-sitter-sqlite) * [SSH](https://github.com/metio/tree-sitter-ssh-client-config) * 
[Svelte](https://github.com/Himujjal/tree-sitter-svelte) * [Swift](https://github.com/alex-pinkus/tree-sitter-swift) * [SystemRDL](https://github.com/SystemRDL/tree-sitter-systemrdl) +* [Thrift](https://github.com/duskmoon314/tree-sitter-thrift) * [TOML](https://github.com/ikatyang/tree-sitter-toml) -* [Tree-sitter query](https://github.com/nvim-treesitter/tree-sitter-query) +* [Tree-sitter Query](https://github.com/nvim-treesitter/tree-sitter-query) * [Turtle](https://github.com/BonaBeavis/tree-sitter-turtle) * [Twig](https://github.com/gbprod/tree-sitter-twig) * [TypeScript](https://github.com/tree-sitter/tree-sitter-typescript) @@ -115,6 +143,7 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [WASM](https://github.com/wasm-lsp/tree-sitter-wasm) * [WGSL WebGPU Shading Language](https://github.com/mehmetoguzderin/tree-sitter-wgsl) * [YAML](https://github.com/ikatyang/tree-sitter-yaml) +* [YANG](https://github.com/Hubro/tree-sitter-yang) * [Zig](https://github.com/maxxnino/tree-sitter-zig) ### Talks on Tree-sitter From 5766b8a0a785ea34fceb479a94f7fe24c9daae2f Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 6 Feb 2023 21:33:50 +0200 Subject: [PATCH 029/347] docs: apply `scheme` marker for all query syntax snippets --- docs/section-2-using-parsers.md | 40 ++++++++++++++++----------------- 1 file changed, 20 insertions(+), 20 deletions(-) diff --git a/docs/section-2-using-parsers.md b/docs/section-2-using-parsers.md index ac3f968f..ea32f4f5 100644 --- a/docs/section-2-using-parsers.md +++ b/docs/section-2-using-parsers.md @@ -442,13 +442,13 @@ Many code analysis tasks involve searching for patterns in syntax trees. Tree-si A _query_ consists of one or more _patterns_, where each pattern is an [S-expression](https://en.wikipedia.org/wiki/S-expression) that matches a certain set of nodes in a syntax tree. 
The expression to match a given node consists of a pair of parentheses containing two things: the node's type, and optionally, a series of other S-expressions that match the node's children. For example, this pattern would match any `binary_expression` node whose children are both `number_literal` nodes: -``` +``` scheme (binary_expression (number_literal) (number_literal)) ``` Children can also be omitted. For example, this would match any `binary_expression` where at least _one_ of child is a `string_literal` node: -``` +``` scheme (binary_expression (string_literal)) ``` @@ -456,7 +456,7 @@ Children can also be omitted. For example, this would match any `binary_expressi In general, it's a good idea to make patterns more specific by specifying [field names](#node-field-names) associated with child nodes. You do this by prefixing a child pattern with a field name followed by a colon. For example, this pattern would match an `assignment_expression` node where the `left` child is a `member_expression` whose `object` is a `call_expression`. -``` +``` scheme (assignment_expression left: (member_expression object: (call_expression))) @@ -466,7 +466,7 @@ In general, it's a good idea to make patterns more specific by specifying [field You can also constrain a pattern so that it only matches nodes that *lack* a certain field. To do this, add a field name prefixed by a `!` within the parent pattern. For example, this pattern would match a class declaration with no type parameters: -``` +``` scheme (class_declaration name: (identifier) @class_name !type_parameters) @@ -476,7 +476,7 @@ You can also constrain a pattern so that it only matches nodes that *lack* a cer The parenthesized syntax for writing nodes only applies to [named nodes](#named-vs-anonymous-nodes). To match specific anonymous nodes, you write their name between double quotes. 
For example, this pattern would match any `binary_expression` where the operator is `!=` and the right side is `null`: -``` +``` scheme (binary_expression operator: "!=" right: (null)) @@ -488,7 +488,7 @@ When matching patterns, you may want to process specific nodes within the patter For example, this pattern would match any assignment of a `function` to an `identifier`, and it would associate the name `the-function-name` with the identifier: -``` +``` scheme (assignment_expression left: (identifier) @the-function-name right: (function)) @@ -496,7 +496,7 @@ For example, this pattern would match any assignment of a `function` to an `iden And this pattern would match all method definitions, associating the name `the-method-name` with the method name, `the-class-name` with the containing class name: -``` +``` scheme (class_declaration name: (identifier) @the-class-name body: (class_body @@ -510,13 +510,13 @@ You can match a repeating sequence of sibling nodes using the postfix `+` and `* For example, this pattern would match a sequence of one or more comments: -``` +``` scheme (comment)+ ``` This pattern would match a class declaration, capturing all of the decorators if any were present: -``` +``` scheme (class_declaration (decorator)* @the-decorator name: (identifier) @the-name) @@ -524,7 +524,7 @@ This pattern would match a class declaration, capturing all of the decorators if You can also mark a node as optional using the `?` operator. For example, this pattern would match all function calls, capturing a string argument if one was present: -``` +``` scheme (call_expression function: (identifier) @the-function arguments: (arguments (string)? @the-string-arg)) @@ -534,7 +534,7 @@ You can also mark a node as optional using the `?` operator. For example, this p You can also use parentheses for grouping a sequence of _sibling_ nodes. 
For example, this pattern would match a comment followed by a function declaration: -``` +``` scheme ( (comment) (function_declaration) @@ -543,7 +543,7 @@ You can also use parentheses for grouping a sequence of _sibling_ nodes. For exa Any of the quantification operators mentioned above (`+`, `*`, and `?`) can also be applied to groups. For example, this pattern would match a comma-separated series of numbers: -``` +``` scheme ( (number) ("," (number))* @@ -558,7 +558,7 @@ This is similar to _character classes_ from regular expressions (`[abc]` matches For example, this pattern would match a call to either a variable or an object property. In the case of a variable, capture it as `@function`, and in the case of a property, capture it as `@method`: -``` +``` scheme (call_expression function: [ (identifier) @function @@ -569,7 +569,7 @@ In the case of a variable, capture it as `@function`, and in the case of a prope This pattern would match a set of possible keyword tokens, capturing them as `@keyword`: -``` +``` scheme [ "break" "delete" @@ -592,7 +592,7 @@ and `_` will match any named or anonymous node. For example, this pattern would match any node inside a call: -``` +``` scheme (call (_) @call.inner) ``` @@ -602,7 +602,7 @@ The anchor operator, `.`, is used to constrain the ways in which child patterns When `.` is placed before the _first_ child within a parent pattern, the child will only match when it is the first named node in the parent. For example, the below pattern matches a given `array` node at most once, assigning the `@the-element` capture to the first `identifier` node in the parent `array`: -``` +``` scheme (array . (identifier) @the-element) ``` @@ -610,13 +610,13 @@ Without this anchor, the pattern would match once for every identifier in the ar Similarly, an anchor placed after a pattern's _last_ child will cause that child pattern to only match nodes that are the last named child of their parent. 
The below pattern matches only nodes that are the last named child within a `block`. -``` +``` scheme (block (_) @last-expression .) ``` Finally, an anchor _between_ two child patterns will cause the patterns to only match nodes that are immediate siblings. The pattern below, given a long dotted name like `a.b.c.d`, will only match pairs of consecutive identifiers: `a, b`, `b, c`, and `c, d`. -``` +``` scheme (dotted_name (identifier) @prev-id . @@ -633,7 +633,7 @@ You can also specify arbitrary metadata and conditions associated with a pattern For example, this pattern would match identifier whose names is written in `SCREAMING_SNAKE_CASE`: -``` +``` scheme ( (identifier) @constant (#match? @constant "^[A-Z][A-Z_]+") @@ -642,7 +642,7 @@ For example, this pattern would match identifier whose names is written in `SCRE And this pattern would match key-value pairs where the `value` is an identifier with the same name as the key: -``` +``` scheme ( (pair key: (property_identifier) @key-name From 3964651fc69cdf4ac060751464268fad41aca421 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?L=C3=A9o=20Gaspard?= Date: Thu, 9 Feb 2023 03:35:42 +0100 Subject: [PATCH 030/347] Derive Hash for Language Given Language implements Eq, it can probably implement Hash too. This makes it easy to derive a random identifier from a `Language` --- lib/binding_rust/lib.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 870d177b..84471d06 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -38,7 +38,7 @@ pub const PARSER_HEADER: &'static str = include_str!("../include/tree_sitter/par /// An opaque object that defines how to parse a particular language. The code for each /// `Language` is generated by the Tree-sitter CLI. 
#[doc(alias = "TSLanguage")] -#[derive(Clone, Copy, Debug, PartialEq, Eq)] +#[derive(Clone, Copy, Debug, PartialEq, Eq, Hash)] #[repr(transparent)] pub struct Language(*const ffi::TSLanguage); From 97fd990822deeb3c288f4999a8410fba69f230b6 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Feb 2023 12:33:34 -0800 Subject: [PATCH 031/347] Add --dot flag to parse subcommand, for printing tree as DOT graph --- cli/src/main.rs | 20 ++++++--- cli/src/parse.rs | 19 +++++++-- cli/src/util.rs | 80 ++++++++++++++++++++++------------- lib/binding_rust/bindings.rs | 7 +++ lib/binding_rust/lib.rs | 10 +++++ lib/include/tree_sitter/api.h | 2 +- lib/src/clock.h | 1 + lib/src/tree.c | 5 ++- lib/src/tree.h | 2 + script/generate-bindings | 3 -- 10 files changed, 106 insertions(+), 43 deletions(-) diff --git a/cli/src/main.rs b/cli/src/main.rs index e0625708..47e7597b 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ -3,6 +3,7 @@ use clap::{App, AppSettings, Arg, SubCommand}; use glob::glob; use std::path::{Path, PathBuf}; use std::{env, fs, u64}; +use tree_sitter_cli::parse::ParseOutput; use tree_sitter_cli::{ generate, highlight, logger, parse, playground, query, tags, test, test_highlight, test_tags, util, wasm, @@ -136,7 +137,8 @@ fn run() -> Result<()> { .arg(&debug_arg) .arg(&debug_build_arg) .arg(&debug_graph_arg) - .arg(Arg::with_name("debug-xml").long("xml").short("x")) + .arg(Arg::with_name("output-dot").long("dot")) + .arg(Arg::with_name("output-xml").long("xml").short("x")) .arg( Arg::with_name("stat") .help("Show parsing statistic") @@ -377,8 +379,17 @@ fn run() -> Result<()> { let debug = matches.is_present("debug"); let debug_graph = matches.is_present("debug-graph"); let debug_build = matches.is_present("debug-build"); - let debug_xml = matches.is_present("debug-xml"); - let quiet = matches.is_present("quiet"); + + let output = if matches.is_present("output-dot") { + ParseOutput::Dot + } else if matches.is_present("output-xml") { + ParseOutput::Xml + } 
else if matches.is_present("quiet") { + ParseOutput::Quiet + } else { + ParseOutput::Normal + }; + let time = matches.is_present("time"); let edits = matches .values_of("edits") @@ -416,12 +427,11 @@ fn run() -> Result<()> { path, &edits, max_path_length, - quiet, + output, time, timeout, debug, debug_graph, - debug_xml, Some(&cancellation_flag), )?; diff --git a/cli/src/parse.rs b/cli/src/parse.rs index 15a9d4c9..3e28e51a 100644 --- a/cli/src/parse.rs +++ b/cli/src/parse.rs @@ -30,17 +30,24 @@ impl fmt::Display for Stats { } } +#[derive(Copy, Clone)] +pub enum ParseOutput { + Normal, + Quiet, + Xml, + Dot, +} + pub fn parse_file_at_path( language: Language, path: &Path, edits: &Vec<&str>, max_path_length: usize, - quiet: bool, + output: ParseOutput, print_time: bool, timeout: u64, debug: bool, debug_graph: bool, - debug_xml: bool, cancellation_flag: Option<&AtomicUsize>, ) -> Result { let mut _log_session = None; @@ -95,7 +102,7 @@ pub fn parse_file_at_path( let duration_ms = duration.as_secs() * 1000 + duration.subsec_nanos() as u64 / 1000000; let mut cursor = tree.walk(); - if !quiet { + if matches!(output, ParseOutput::Normal) { let mut needs_newline = false; let mut indent_level = 0; let mut did_visit_children = false; @@ -151,7 +158,7 @@ pub fn parse_file_at_path( println!(""); } - if debug_xml { + if matches!(output, ParseOutput::Xml) { let mut needs_newline = false; let mut indent_level = 0; let mut did_visit_children = false; @@ -206,6 +213,10 @@ pub fn parse_file_at_path( println!(""); } + if matches!(output, ParseOutput::Dot) { + util::print_tree_graph(&tree, "log.html").unwrap(); + } + let mut first_error = None; loop { let node = cursor.node(); diff --git a/cli/src/util.rs b/cli/src/util.rs index acd8acbf..2b7405fd 100644 --- a/cli/src/util.rs +++ b/cli/src/util.rs @@ -3,7 +3,7 @@ use std::io; use std::sync::atomic::{AtomicUsize, Ordering}; use std::sync::Arc; use std::thread; -use tree_sitter::Parser; +use tree_sitter::{Parser, Tree}; #[cfg(unix)] use 
anyhow::{anyhow, Context}; @@ -29,39 +29,61 @@ pub fn cancel_on_stdin() -> Arc { } result } + #[cfg(windows)] -pub struct LogSession(); +pub struct LogSession; #[cfg(unix)] -pub struct LogSession(PathBuf, Option, Option); +pub struct LogSession { + path: PathBuf, + dot_process: Option, + dot_process_stdin: Option, +} + +pub fn print_tree_graph(tree: &Tree, path: &str) -> Result<()> { + let session = LogSession::new(path)?; + tree.print_dot_graph(session.dot_process_stdin.as_ref().unwrap()); + Ok(()) +} + +pub fn log_graphs(parser: &mut Parser, path: &str) -> Result { + let session = LogSession::new(path)?; + parser.print_dot_graphs(session.dot_process_stdin.as_ref().unwrap()); + Ok(session) +} #[cfg(windows)] -pub fn log_graphs(_parser: &mut Parser, _path: &str) -> Result { - Ok(LogSession()) +impl LogSession { + fn new(path: &str) -> Result { + Ok(Self) + } } #[cfg(unix)] -pub fn log_graphs(parser: &mut Parser, path: &str) -> Result { - use std::io::Write; +impl LogSession { + fn new(path: &str) -> Result { + use std::io::Write; - let mut dot_file = std::fs::File::create(path)?; - dot_file.write(HTML_HEADER)?; - let mut dot_process = Command::new("dot") - .arg("-Tsvg") - .stdin(Stdio::piped()) - .stdout(dot_file) - .spawn() - .with_context(|| "Failed to run the `dot` command. Check that graphviz is installed.")?; - let dot_stdin = dot_process - .stdin - .take() - .ok_or_else(|| anyhow!("Failed to open stdin for `dot` process."))?; - parser.print_dot_graphs(&dot_stdin); - Ok(LogSession( - PathBuf::from(path), - Some(dot_process), - Some(dot_stdin), - )) + let mut dot_file = std::fs::File::create(path)?; + dot_file.write(HTML_HEADER)?; + let mut dot_process = Command::new("dot") + .arg("-Tsvg") + .stdin(Stdio::piped()) + .stdout(dot_file) + .spawn() + .with_context(|| { + "Failed to run the `dot` command. Check that graphviz is installed." 
+ })?; + let dot_stdin = dot_process + .stdin + .take() + .ok_or_else(|| anyhow!("Failed to open stdin for `dot` process."))?; + Ok(Self { + path: PathBuf::from(path), + dot_process: Some(dot_process), + dot_process_stdin: Some(dot_stdin), + }) + } } #[cfg(unix)] @@ -69,13 +91,13 @@ impl Drop for LogSession { fn drop(&mut self) { use std::fs; - drop(self.2.take().unwrap()); - let output = self.1.take().unwrap().wait_with_output().unwrap(); + drop(self.dot_process_stdin.take().unwrap()); + let output = self.dot_process.take().unwrap().wait_with_output().unwrap(); if output.status.success() { if cfg!(target_os = "macos") - && fs::metadata(&self.0).unwrap().len() > HTML_HEADER.len() as u64 + && fs::metadata(&self.path).unwrap().len() > HTML_HEADER.len() as u64 { - Command::new("open").arg(&self.0).output().unwrap(); + Command::new("open").arg(&self.path).output().unwrap(); } } else { eprintln!( diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index b4ec9bed..4591a380 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -346,6 +346,9 @@ extern "C" { pub fn ts_tree_language(arg1: *const TSTree) -> *const TSLanguage; } extern "C" { + #[doc = " Get the array of included ranges that was used to parse the syntax tree."] + #[doc = ""] + #[doc = " The returned pointer must be freed by the caller."] pub fn ts_tree_included_ranges(arg1: *const TSTree, length: *mut u32) -> *mut TSRange; } extern "C" { @@ -375,6 +378,10 @@ extern "C" { length: *mut u32, ) -> *mut TSRange; } +extern "C" { + #[doc = " Write a DOT graph describing the syntax tree to the given file."] + pub fn ts_tree_print_dot_graph(arg1: *const TSTree, file_descriptor: ::std::os::raw::c_int); +} extern "C" { #[doc = " Get the node's type as a null-terminated string."] pub fn ts_node_type(arg1: TSNode) -> *const ::std::os::raw::c_char; diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 84471d06..6f044cca 100644 --- a/lib/binding_rust/lib.rs +++ 
b/lib/binding_rust/lib.rs @@ -775,6 +775,16 @@ impl Tree { result } } + + /// Print a graph of the tree to the given file descriptor. + /// The graph is formatted in the DOT language. You may want to pipe this graph + /// directly to a `dot(1)` process in order to generate SVG output. + #[cfg(unix)] + #[doc(alias = "ts_tree_print_dot_graph")] + pub fn print_dot_graph(&self, file: &impl AsRawFd) { + let fd = file.as_raw_fd(); + unsafe { ffi::ts_tree_print_dot_graph(self.0.as_ptr(), fd) } + } } impl fmt::Debug for Tree { diff --git a/lib/include/tree_sitter/api.h b/lib/include/tree_sitter/api.h index bc05bc3c..5b48cf60 100644 --- a/lib/include/tree_sitter/api.h +++ b/lib/include/tree_sitter/api.h @@ -420,7 +420,7 @@ TSRange *ts_tree_get_changed_ranges( /** * Write a DOT graph describing the syntax tree to the given file. */ -void ts_tree_print_dot_graph(const TSTree *, FILE *); +void ts_tree_print_dot_graph(const TSTree *, int file_descriptor); /******************/ /* Section - Node */ diff --git a/lib/src/clock.h b/lib/src/clock.h index e6faa040..6e75729e 100644 --- a/lib/src/clock.h +++ b/lib/src/clock.h @@ -1,6 +1,7 @@ #ifndef TREE_SITTER_CLOCK_H_ #define TREE_SITTER_CLOCK_H_ +#include #include typedef uint64_t TSDuration; diff --git a/lib/src/tree.c b/lib/src/tree.c index f6bd2c72..bee2a3de 100644 --- a/lib/src/tree.c +++ b/lib/src/tree.c @@ -1,3 +1,4 @@ +#include #include "tree_sitter/api.h" #include "./array.h" #include "./get_changed_ranges.h" @@ -123,6 +124,8 @@ TSRange *ts_tree_get_changed_ranges(const TSTree *self, const TSTree *other, uin return result; } -void ts_tree_print_dot_graph(const TSTree *self, FILE *file) { +void ts_tree_print_dot_graph(const TSTree *self, int fd) { + FILE *file = fdopen(dup(fd), "a"); ts_subtree_print_dot_graph(self->root, self->language, file); + fclose(file); } diff --git a/lib/src/tree.h b/lib/src/tree.h index 0334b824..f012f888 100644 --- a/lib/src/tree.h +++ b/lib/src/tree.h @@ -1,6 +1,8 @@ #ifndef TREE_SITTER_TREE_H_ 
#define TREE_SITTER_TREE_H_ +#include "./subtree.h" + #ifdef __cplusplus extern "C" { #endif diff --git a/script/generate-bindings b/script/generate-bindings index 4b3fb951..54abac06 100755 --- a/script/generate-bindings +++ b/script/generate-bindings @@ -7,10 +7,7 @@ bindgen \ --no-layout-tests \ --whitelist-type '^TS.*' \ --whitelist-function '^ts_.*' \ - --opaque-type FILE \ - --blocklist-type FILE \ --blocklist-type '^__.*' \ - --blocklist-function ts_tree_print_dot_graph \ --size_t-is-usize \ $header_path > $output_path From 0b817a609f7cd3d7309a81dbfe96287c6945a085 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Feb 2023 13:45:12 -0800 Subject: [PATCH 032/347] Clear the parse stack when terminating parsing early due to error cost This fixes a bug where the parse tree would not be rebalanced if this code path was taken. --- lib/src/parser.c | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/lib/src/parser.c b/lib/src/parser.c index f186ce33..f84b3c8d 100644 --- a/lib/src/parser.c +++ b/lib/src/parser.c @@ -1941,8 +1941,16 @@ TSTree *ts_parser_parse( } } + // After advancing each version of the stack, re-sort the versions by their cost, + // removing any versions that are no longer worth pursuing. unsigned min_error_cost = ts_parser__condense_stack(self); + + // If there's already a finished parse tree that's better than any in-progress version, + // then terminate parsing. Clear the parse stack to remove any extra references to subtrees + // within the finished tree, ensuring that these subtrees can be safely mutated in-place + // for rebalancing. 
if (self->finished_tree.ptr && ts_subtree_error_cost(self->finished_tree) < min_error_cost) { + ts_stack_clear(self->stack); break; } From 450c67484bcf2836807b4c6a9f128df2149d47d6 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Feb 2023 23:18:35 -0800 Subject: [PATCH 033/347] For now, don't implement ts_tree_print_dot_graph on windows --- lib/src/tree.c | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/lib/src/tree.c b/lib/src/tree.c index bee2a3de..79e1d1ae 100644 --- a/lib/src/tree.c +++ b/lib/src/tree.c @@ -1,4 +1,3 @@ -#include #include "tree_sitter/api.h" #include "./array.h" #include "./get_changed_ranges.h" @@ -124,8 +123,21 @@ TSRange *ts_tree_get_changed_ranges(const TSTree *self, const TSTree *other, uin return result; } +#ifdef _WIN32 + +void ts_tree_print_dot_graph(const TSTree *self, int fd) { + (void)self; + (void)fd; +} + +#else + +#include + void ts_tree_print_dot_graph(const TSTree *self, int fd) { FILE *file = fdopen(dup(fd), "a"); ts_subtree_print_dot_graph(self->root, self->language, file); fclose(file); } + +#endif From 125503ff3b613b08233fc1e06292be9ddd9dd448 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Feb 2023 23:23:47 -0800 Subject: [PATCH 034/347] Fix CLI build on windows --- cli/src/util.rs | 28 ++++++++++++++++++++-------- 1 file changed, 20 insertions(+), 8 deletions(-) diff --git a/cli/src/util.rs b/cli/src/util.rs index 2b7405fd..d180cd54 100644 --- a/cli/src/util.rs +++ b/cli/src/util.rs @@ -13,7 +13,14 @@ use std::path::PathBuf; use std::process::{Child, ChildStdin, Command, Stdio}; #[cfg(unix)] -const HTML_HEADER: &[u8] = b"\n\n\n"; +const HTML_HEADER: &[u8] = b" + + + + +"; pub fn cancel_on_stdin() -> Arc { let result = Arc::new(AtomicUsize::new(0)); @@ -40,25 +47,30 @@ pub struct LogSession { dot_process_stdin: Option, } +#[cfg(windows)] +pub fn print_tree_graph(_tree: &Tree, _path: &str) -> Result<()> { + Ok(()) +} + +#[cfg(windows)] +pub fn log_graphs(_parser: &mut Parser, 
_path: &str) -> Result { + Ok(LogSession) +} + +#[cfg(unix)] pub fn print_tree_graph(tree: &Tree, path: &str) -> Result<()> { let session = LogSession::new(path)?; tree.print_dot_graph(session.dot_process_stdin.as_ref().unwrap()); Ok(()) } +#[cfg(unix)] pub fn log_graphs(parser: &mut Parser, path: &str) -> Result { let session = LogSession::new(path)?; parser.print_dot_graphs(session.dot_process_stdin.as_ref().unwrap()); Ok(session) } -#[cfg(windows)] -impl LogSession { - fn new(path: &str) -> Result { - Ok(Self) - } -} - #[cfg(unix)] impl LogSession { fn new(path: &str) -> Result { From ff2436a6f8639b290e4395ca2b44491472647a2b Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Tue, 14 Feb 2023 14:41:25 -0800 Subject: [PATCH 035/347] Add --row-range, --quiet, and --time flags to query subcommand --- cli/src/main.rs | 30 ++++++++++++++++--- cli/src/query.rs | 77 +++++++++++++++++++++++++++++------------------- 2 files changed, 73 insertions(+), 34 deletions(-) diff --git a/cli/src/main.rs b/cli/src/main.rs index 47e7597b..fb2a6327 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ -3,6 +3,7 @@ use clap::{App, AppSettings, Arg, SubCommand}; use glob::glob; use std::path::{Path, PathBuf}; use std::{env, fs, u64}; +use tree_sitter::Point; use tree_sitter_cli::parse::ParseOutput; use tree_sitter_cli::{ generate, highlight, logger, parse, playground, query, tags, test, test_highlight, test_tags, @@ -173,6 +174,8 @@ fn run() -> Result<()> { .index(1) .required(true), ) + .arg(&time_arg) + .arg(&quiet_arg) .arg(&paths_file_arg) .arg(&paths_arg.clone().index(2)) .arg( @@ -181,6 +184,12 @@ fn run() -> Result<()> { .long("byte-range") .takes_value(true), ) + .arg( + Arg::with_name("row-range") + .help("The range of rows in which the query will be executed") + .long("row-range") + .takes_value(true), + ) .arg(&scope_arg) .arg(Arg::with_name("captures").long("captures").short("c")) .arg(Arg::with_name("test").long("test")), @@ -456,6 +465,8 @@ fn run() -> Result<()> { 
("query", Some(matches)) => { let ordered_captures = matches.values_of("captures").is_some(); + let quiet = matches.values_of("quiet").is_some(); + let time = matches.values_of("time").is_some(); let paths = collect_paths(matches.value_of("paths-file"), matches.values_of("paths"))?; let loader_config = config.get()?; loader.find_all_languages(&loader_config)?; @@ -465,9 +476,17 @@ fn run() -> Result<()> { matches.value_of("scope"), )?; let query_path = Path::new(matches.value_of("query-path").unwrap()); - let range = matches.value_of("byte-range").map(|br| { - let r: Vec<&str> = br.split(":").collect(); - r[0].parse().unwrap()..r[1].parse().unwrap() + let byte_range = matches.value_of("byte-range").and_then(|arg| { + let mut parts = arg.split(":"); + let start = parts.next()?.parse().ok()?; + let end = parts.next().unwrap().parse().ok()?; + Some(start..end) + }); + let point_range = matches.value_of("row-range").and_then(|arg| { + let mut parts = arg.split(":"); + let start = parts.next()?.parse().ok()?; + let end = parts.next().unwrap().parse().ok()?; + Some(Point::new(start, 0)..Point::new(end, 0)) }); let should_test = matches.is_present("test"); query::query_files_at_paths( @@ -475,8 +494,11 @@ fn run() -> Result<()> { paths, query_path, ordered_captures, - range, + byte_range, + point_range, should_test, + quiet, + time, )?; } diff --git a/cli/src/query.rs b/cli/src/query.rs index 73d6dd28..fc24cb05 100644 --- a/cli/src/query.rs +++ b/cli/src/query.rs @@ -5,16 +5,20 @@ use std::{ io::{self, Write}, ops::Range, path::Path, + time::Instant, }; -use tree_sitter::{Language, Parser, Query, QueryCursor}; +use tree_sitter::{Language, Parser, Point, Query, QueryCursor}; pub fn query_files_at_paths( language: Language, paths: Vec, query_path: &Path, ordered_captures: bool, - range: Option>, + byte_range: Option>, + point_range: Option>, should_test: bool, + quiet: bool, + print_time: bool, ) -> Result<()> { let stdout = io::stdout(); let mut stdout = stdout.lock(); @@ 
-24,9 +28,12 @@ pub fn query_files_at_paths( let query = Query::new(language, &query_source).with_context(|| "Query compilation failed")?; let mut query_cursor = QueryCursor::new(); - if let Some(range) = range { + if let Some(range) = byte_range { query_cursor.set_byte_range(range); } + if let Some(range) = point_range { + query_cursor.set_point_range(range); + } let mut parser = Parser::new(); parser.set_language(language)?; @@ -40,22 +47,25 @@ pub fn query_files_at_paths( fs::read(&path).with_context(|| format!("Error reading source file {:?}", path))?; let tree = parser.parse(&source_code, None).unwrap(); + let start = Instant::now(); if ordered_captures { for (mat, capture_index) in query_cursor.captures(&query, tree.root_node(), source_code.as_slice()) { let capture = mat.captures[capture_index]; let capture_name = &query.capture_names()[capture.index as usize]; - writeln!( - &mut stdout, - " pattern: {:>2}, capture: {} - {}, start: {}, end: {}, text: `{}`", - mat.pattern_index, - capture.index, - capture_name, - capture.node.start_position(), - capture.node.end_position(), - capture.node.utf8_text(&source_code).unwrap_or("") - )?; + if !quiet { + writeln!( + &mut stdout, + " pattern: {:>2}, capture: {} - {}, start: {}, end: {}, text: `{}`", + mat.pattern_index, + capture.index, + capture_name, + capture.node.start_position(), + capture.node.end_position(), + capture.node.utf8_text(&source_code).unwrap_or("") + )?; + } results.push(query_testing::CaptureInfo { name: capture_name.to_string(), start: capture.node.start_position(), @@ -64,27 +74,31 @@ pub fn query_files_at_paths( } } else { for m in query_cursor.matches(&query, tree.root_node(), source_code.as_slice()) { - writeln!(&mut stdout, " pattern: {}", m.pattern_index)?; + if !quiet { + writeln!(&mut stdout, " pattern: {}", m.pattern_index)?; + } for capture in m.captures { let start = capture.node.start_position(); let end = capture.node.end_position(); let capture_name = 
&query.capture_names()[capture.index as usize]; - if end.row == start.row { - writeln!( - &mut stdout, - " capture: {} - {}, start: {}, end: {}, text: `{}`", - capture.index, - capture_name, - start, - end, - capture.node.utf8_text(&source_code).unwrap_or("") - )?; - } else { - writeln!( - &mut stdout, - " capture: {}, start: {}, end: {}", - capture_name, start, end, - )?; + if !quiet { + if end.row == start.row { + writeln!( + &mut stdout, + " capture: {} - {}, start: {}, end: {}, text: `{}`", + capture.index, + capture_name, + start, + end, + capture.node.utf8_text(&source_code).unwrap_or("") + )?; + } else { + writeln!( + &mut stdout, + " capture: {}, start: {}, end: {}", + capture_name, start, end, + )?; + } } results.push(query_testing::CaptureInfo { name: capture_name.to_string(), @@ -103,6 +117,9 @@ pub fn query_files_at_paths( if should_test { query_testing::assert_expected_captures(results, path, &mut parser, language)? } + if print_time { + writeln!(&mut stdout, "{:?}", start.elapsed())?; + } } Ok(()) From 32ce1fccd05efdf91dd8d99fba0fc91b46b18b81 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Tue, 14 Feb 2023 14:42:26 -0800 Subject: [PATCH 036/347] Precompute the set of repetition symbols that can match rootless patterns --- lib/src/query.c | 733 ++++++++++++++++++++++++++++-------------------- 1 file changed, 427 insertions(+), 306 deletions(-) diff --git a/lib/src/query.c b/lib/src/query.c index 710a9209..a756c089 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -228,12 +228,15 @@ typedef struct { AnalysisStateEntry stack[MAX_ANALYSIS_STATE_DEPTH]; uint16_t depth; uint16_t step_index; + TSSymbol root_symbol; } AnalysisState; typedef Array(AnalysisState *) AnalysisStateSet; typedef Array(AnalysisState *) AnalysisStatePool; +typedef Array(uint16_t) StepIndexArray; + /* * AnalysisSubgraph - A subset of the states in the parse table that are used * in constructing nodes with a certain symbol. 
Each state is accompanied by @@ -253,6 +256,8 @@ typedef struct { Array(AnalysisSubgraphNode) nodes; } AnalysisSubgraph; +typedef Array(AnalysisSubgraph) AnalysisSubgraphArray; + /* * StatePredecessorMap - A map that stores the predecessors of each parse state. * This is used during query analysis to determine which parse states can lead @@ -269,8 +274,8 @@ typedef struct { */ struct TSQuery { SymbolTable captures; - Array(CaptureQuantifiers) capture_quantifiers; SymbolTable predicate_values; + Array(CaptureQuantifiers) capture_quantifiers; Array(QueryStep) steps; Array(PatternEntry) pattern_map; Array(TSQueryPredicateStep) predicate_steps; @@ -278,6 +283,7 @@ struct TSQuery { Array(StepOffset) step_offsets; Array(TSFieldId) negated_fields; Array(char) string_buffer; + Array(TSSymbol) repeat_symbols_with_rootless_patterns; const TSLanguage *language; uint16_t wildcard_root_pattern_count; }; @@ -1113,7 +1119,324 @@ static inline void ts_query__pattern_map_insert( array_insert(&self->pattern_map, index, new_entry); } +static void ts_query__analyze_patterns_from_states( + TSQuery *self, + const AnalysisSubgraphArray *subgraphs, + AnalysisStateSet *states, + AnalysisStateSet *next_states, + AnalysisStateSet *deeper_states, + AnalysisStatePool *state_pool, + StepIndexArray *finished_parent_symbols, + StepIndexArray *final_step_indices, + bool *did_abort_analysis +) { + unsigned recursion_depth_limit = 0; + unsigned prev_final_step_count = 0; + + for (unsigned iteration = 0;; iteration++) { + if (iteration == MAX_ANALYSIS_ITERATION_COUNT) { + *did_abort_analysis = true; + break; + } + + #ifdef DEBUG_ANALYZE_QUERY + printf("Iteration: %u. 
Final step indices:", iteration); + for (unsigned j = 0; j < final_step_indices->size; j++) { + printf(" %4u", final_step_indices->contents[j]); + } + printf("\n"); + for (unsigned j = 0; j < states->size; j++) { + AnalysisState *state = states->contents[j]; + printf(" %3u: step: %u, stack: [", j, state->step_index); + for (unsigned k = 0; k < state->depth; k++) { + printf( + " {%s, child: %u, state: %4u", + self->language->symbol_names[state->stack[k].parent_symbol], + state->stack[k].child_index, + state->stack[k].parse_state + ); + if (state->stack[k].field_id) printf(", field: %s", self->language->field_names[state->stack[k].field_id]); + if (state->stack[k].done) printf(", DONE"); + printf("}"); + } + printf(" ]\n"); + } + #endif + + // If no further progress can be made within the current recursion depth limit, then + // bump the depth limit by one, and continue to process the states the exceeded the + // limit. But only allow this if progress has been made since the last time the depth + // limit was increased. + if (states->size == 0) { + if ( + deeper_states->size > 0 + && final_step_indices->size > prev_final_step_count + ) { + #ifdef DEBUG_ANALYZE_QUERY + printf("Increase recursion depth limit to %u\n", recursion_depth_limit + 1); + #endif + + prev_final_step_count = final_step_indices->size; + recursion_depth_limit++; + AnalysisStateSet _states = *states; + *states = *deeper_states; + *deeper_states = _states; + continue; + } + + break; + } + + analysis_state_set__clear(next_states, state_pool); + for (unsigned j = 0; j < states->size; j++) { + AnalysisState * const state = states->contents[j]; + + // For efficiency, it's important to avoid processing the same analysis state more + // than once. To achieve this, keep the states in order of ascending position within + // their hypothetical syntax trees. In each iteration of this loop, start by advancing + // the states that have made the least progress. 
Avoid advancing states that have already + // made more progress. + if (next_states->size > 0) { + int comparison = analysis_state__compare_position( + &state, + array_back(next_states) + ); + if (comparison == 0) { + analysis_state_set__insert_sorted_by_clone(next_states, state_pool, state); + continue; + } else if (comparison > 0) { + #ifdef DEBUG_ANALYZE_QUERY + printf("Terminate iteration at state %u\n", j); + #endif + while (j < states->size) { + analysis_state_set__push_by_clone( + next_states, + state_pool, + states->contents[j] + ); + j++; + } + break; + } + } + + const TSStateId parse_state = analysis_state__top(state)->parse_state; + const TSSymbol parent_symbol = analysis_state__top(state)->parent_symbol; + const TSFieldId parent_field_id = analysis_state__top(state)->field_id; + const unsigned child_index = analysis_state__top(state)->child_index; + const QueryStep * const step = &self->steps.contents[state->step_index]; + + unsigned subgraph_index, exists; + array_search_sorted_by(subgraphs, .symbol, parent_symbol, &subgraph_index, &exists); + if (!exists) continue; + const AnalysisSubgraph *subgraph = &subgraphs->contents[subgraph_index]; + + // Follow every possible path in the parse table, but only visit states that + // are part of the subgraph for the current symbol. 
+ LookaheadIterator lookahead_iterator = ts_language_lookaheads(self->language, parse_state); + while (ts_lookahead_iterator_next(&lookahead_iterator)) { + TSSymbol sym = lookahead_iterator.symbol; + + AnalysisSubgraphNode successor = { + .state = parse_state, + .child_index = child_index, + }; + if (lookahead_iterator.action_count) { + const TSParseAction *action = &lookahead_iterator.actions[lookahead_iterator.action_count - 1]; + if (action->type == TSParseActionTypeShift) { + if (!action->shift.extra) { + successor.state = action->shift.state; + successor.child_index++; + } + } else { + continue; + } + } else if (lookahead_iterator.next_state != 0) { + successor.state = lookahead_iterator.next_state; + successor.child_index++; + } else { + continue; + } + + unsigned node_index; + array_search_sorted_with( + &subgraph->nodes, + analysis_subgraph_node__compare, &successor, + &node_index, &exists + ); + while (node_index < subgraph->nodes.size) { + AnalysisSubgraphNode *node = &subgraph->nodes.contents[node_index++]; + if (node->state != successor.state || node->child_index != successor.child_index) break; + + // Use the subgraph to determine what alias and field will eventually be applied + // to this child node. + TSSymbol alias = ts_language_alias_at(self->language, node->production_id, child_index); + TSSymbol visible_symbol = alias + ? alias + : self->language->symbol_metadata[sym].visible + ? self->language->public_symbol_map[sym] + : 0; + TSFieldId field_id = parent_field_id; + if (!field_id) { + const TSFieldMapEntry *field_map, *field_map_end; + ts_language_field_map(self->language, node->production_id, &field_map, &field_map_end); + for (; field_map != field_map_end; field_map++) { + if (!field_map->inherited && field_map->child_index == child_index) { + field_id = field_map->field_id; + break; + } + } + } + + // Create a new state that has advanced past this hypothetical subtree. 
+ AnalysisState next_state = *state; + AnalysisStateEntry *next_state_top = analysis_state__top(&next_state); + next_state_top->child_index = successor.child_index; + next_state_top->parse_state = successor.state; + if (node->done) next_state_top->done = true; + + // Determine if this hypothetical child node would match the current step + // of the query pattern. + bool does_match = false; + if (visible_symbol) { + does_match = true; + if (step->symbol == WILDCARD_SYMBOL) { + if ( + step->is_named && + !self->language->symbol_metadata[visible_symbol].named + ) does_match = false; + } else if (step->symbol != visible_symbol) { + does_match = false; + } + if (step->field && step->field != field_id) { + does_match = false; + } + if ( + step->supertype_symbol && + !analysis_state__has_supertype(state, step->supertype_symbol) + ) does_match = false; + } + + // If this child is hidden, then descend into it and walk through its children. + // If the top entry of the stack is at the end of its rule, then that entry can + // be replaced. Otherwise, push a new entry onto the stack. + else if (sym >= self->language->token_count) { + if (!next_state_top->done) { + if (next_state.depth + 1 >= MAX_ANALYSIS_STATE_DEPTH) { + #ifdef DEBUG_ANALYZE_QUERY + printf("Exceeded depth limit for state %u\n", j); + #endif + + *did_abort_analysis = true; + continue; + } + + next_state.depth++; + next_state_top = analysis_state__top(&next_state); + } + + *next_state_top = (AnalysisStateEntry) { + .parse_state = parse_state, + .parent_symbol = sym, + .child_index = 0, + .field_id = field_id, + .done = false, + }; + + if (analysis_state__recursion_depth(&next_state) > recursion_depth_limit) { + analysis_state_set__insert_sorted_by_clone( + deeper_states, + state_pool, + &next_state + ); + continue; + } + } + + // Pop from the stack when this state reached the end of its current syntax node. 
+ while (next_state.depth > 0 && next_state_top->done) { + next_state.depth--; + next_state_top = analysis_state__top(&next_state); + } + + // If this hypothetical child did match the current step of the query pattern, + // then advance to the next step at the current depth. This involves skipping + // over any descendant steps of the current child. + const QueryStep *next_step = step; + if (does_match) { + for (;;) { + next_state.step_index++; + next_step = &self->steps.contents[next_state.step_index]; + if ( + next_step->depth == PATTERN_DONE_MARKER || + next_step->depth <= step->depth + ) break; + } + } else if (successor.state == parse_state) { + continue; + } + + for (;;) { + // Skip pass-through states. Although these states have alternatives, they are only + // used to implement repetitions, and query analysis does not need to process + // repetitions in order to determine whether steps are possible and definite. + if (next_step->is_pass_through) { + next_state.step_index++; + next_step++; + continue; + } + + // If the pattern is finished or hypothetical parent node is complete, then + // record that matching can terminate at this step of the pattern. Otherwise, + // add this state to the list of states to process on the next iteration. + if (!next_step->is_dead_end) { + bool did_finish_pattern = self->steps.contents[next_state.step_index].depth != step->depth; + if (did_finish_pattern) { + array_insert_sorted_by(finished_parent_symbols, , state->root_symbol); + } else if (next_state.depth == 0) { + array_insert_sorted_by(final_step_indices, , next_state.step_index); + } else { + analysis_state_set__insert_sorted_by_clone(next_states, state_pool, &next_state); + } + } + + // If the state has advanced to a step with an alternative step, then add another state + // at that alternative step. 
This process is simpler than the process of actually matching a + // pattern during query execution, because for the purposes of query analysis, there is no + // need to process repetitions. + if ( + does_match && + next_step->alternative_index != NONE && + next_step->alternative_index > next_state.step_index + ) { + next_state.step_index = next_step->alternative_index; + next_step = &self->steps.contents[next_state.step_index]; + } else { + break; + } + } + } + } + } + + AnalysisStateSet _states = *states; + *states = *next_states; + *next_states = _states; + } +} + static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { + Array(uint16_t) non_rooted_pattern_start_steps = array_new(); + for (unsigned i = 0; i < self->pattern_map.size; i++) { + PatternEntry *pattern = &self->pattern_map.contents[i]; + if (!pattern->is_rooted) { + QueryStep *step = &self->steps.contents[pattern->step_index]; + if (step->symbol != WILDCARD_SYMBOL) { + array_push(&non_rooted_pattern_start_steps, pattern->step_index); + } + } + } + // Walk forward through all of the steps in the query, computing some // basic information about each step. Mark all of the steps that contain // captures, and record the indices of all of the steps that have child steps. @@ -1158,7 +1481,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // of the hidden symbols in the grammar, because these might occur within // one of the parent nodes, such that their children appear to belong to the // parent. 
- Array(AnalysisSubgraph) subgraphs = array_new(); + AnalysisSubgraphArray subgraphs = array_new(); for (unsigned i = 0; i < parent_step_indices.size; i++) { uint32_t parent_step_index = parent_step_indices.contents[i]; TSSymbol parent_symbol = self->steps.contents[parent_step_index].symbol; @@ -1324,7 +1647,8 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { AnalysisStateSet next_states = array_new(); AnalysisStateSet deeper_states = array_new(); AnalysisStatePool state_pool = array_new(); - Array(uint16_t) final_step_indices = array_new(); + StepIndexArray final_step_indices = array_new(); + StepIndexArray finished_parent_symbols = array_new(); for (unsigned i = 0; i < parent_step_indices.size; i++) { uint16_t parent_step_index = parent_step_indices.contents[i]; uint16_t parent_depth = self->steps.contents[parent_step_index].depth; @@ -1364,308 +1688,31 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { }, }, .depth = 1, + .root_symbol = parent_symbol, })); } // Walk the subgraph for this non-terminal, tracking all of the possible // sequences of progress within the pattern. - bool can_finish_pattern = false; bool did_abort_analysis = false; - unsigned recursion_depth_limit = 0; - unsigned prev_final_step_count = 0; array_clear(&final_step_indices); - for (unsigned iteration = 0;; iteration++) { - if (iteration == MAX_ANALYSIS_ITERATION_COUNT) { - did_abort_analysis = true; - break; - } + array_clear(&finished_parent_symbols); - #ifdef DEBUG_ANALYZE_QUERY - printf("Iteration: %u. 
Final step indices:", iteration); - for (unsigned j = 0; j < final_step_indices.size; j++) { - printf(" %4u", final_step_indices.contents[j]); - } - printf("\nWalk states for %u %s:\n", i, ts_language_symbol_name(self->language, parent_symbol)); - for (unsigned j = 0; j < states.size; j++) { - AnalysisState *state = states.contents[j]; - printf(" %3u: step: %u, stack: [", j, state->step_index); - for (unsigned k = 0; k < state->depth; k++) { - printf( - " {%s, child: %u, state: %4u", - self->language->symbol_names[state->stack[k].parent_symbol], - state->stack[k].child_index, - state->stack[k].parse_state - ); - if (state->stack[k].field_id) printf(", field: %s", self->language->field_names[state->stack[k].field_id]); - if (state->stack[k].done) printf(", DONE"); - printf("}"); - } - printf(" ]\n"); - } - #endif + #ifdef DEBUG_ANALYZE_QUERY + printf("\nWalk states for %s:\n", ts_language_symbol_name(self->language, states.contents[0]->stack[0].parent_symbol)); + #endif - // If no further progress can be made within the current recursion depth limit, then - // bump the depth limit by one, and continue to process the states the exceeded the - // limit. But only allow this if progress has been made since the last time the depth - // limit was increased. - if (states.size == 0) { - if ( - deeper_states.size > 0 - && final_step_indices.size > prev_final_step_count - ) { - #ifdef DEBUG_ANALYZE_QUERY - printf("Increase recursion depth limit to %u\n", recursion_depth_limit + 1); - #endif - - prev_final_step_count = final_step_indices.size; - recursion_depth_limit++; - AnalysisStateSet _states = states; - states = deeper_states; - deeper_states = _states; - continue; - } - - break; - } - - analysis_state_set__clear(&next_states, &state_pool); - for (unsigned j = 0; j < states.size; j++) { - AnalysisState * const state = states.contents[j]; - - // For efficiency, it's important to avoid processing the same analysis state more - // than once. 
To achieve this, keep the states in order of ascending position within - // their hypothetical syntax trees. In each iteration of this loop, start by advancing - // the states that have made the least progress. Avoid advancing states that have already - // made more progress. - if (next_states.size > 0) { - int comparison = analysis_state__compare_position( - &state, - array_back(&next_states) - ); - if (comparison == 0) { - #ifdef DEBUG_ANALYZE_QUERY - printf("Skip iteration for state %u\n", j); - #endif - analysis_state_set__insert_sorted_by_clone(&next_states, &state_pool, state); - continue; - } else if (comparison > 0) { - #ifdef DEBUG_ANALYZE_QUERY - printf("Terminate iteration at state %u\n", j); - #endif - while (j < states.size) { - analysis_state_set__push_by_clone( - &next_states, - &state_pool, - states.contents[j] - ); - j++; - } - break; - } - } - - const TSStateId parse_state = analysis_state__top(state)->parse_state; - const TSSymbol parent_symbol = analysis_state__top(state)->parent_symbol; - const TSFieldId parent_field_id = analysis_state__top(state)->field_id; - const unsigned child_index = analysis_state__top(state)->child_index; - const QueryStep * const step = &self->steps.contents[state->step_index]; - - unsigned subgraph_index, exists; - array_search_sorted_by(&subgraphs, .symbol, parent_symbol, &subgraph_index, &exists); - if (!exists) continue; - const AnalysisSubgraph *subgraph = &subgraphs.contents[subgraph_index]; - - // Follow every possible path in the parse table, but only visit states that - // are part of the subgraph for the current symbol. 
- LookaheadIterator lookahead_iterator = ts_language_lookaheads(self->language, parse_state); - while (ts_lookahead_iterator_next(&lookahead_iterator)) { - TSSymbol sym = lookahead_iterator.symbol; - - AnalysisSubgraphNode successor = { - .state = parse_state, - .child_index = child_index, - }; - if (lookahead_iterator.action_count) { - const TSParseAction *action = &lookahead_iterator.actions[lookahead_iterator.action_count - 1]; - if (action->type == TSParseActionTypeShift) { - if (!action->shift.extra) { - successor.state = action->shift.state; - successor.child_index++; - } - } else { - continue; - } - } else if (lookahead_iterator.next_state != 0) { - successor.state = lookahead_iterator.next_state; - successor.child_index++; - } else { - continue; - } - - unsigned node_index; - array_search_sorted_with( - &subgraph->nodes, - analysis_subgraph_node__compare, &successor, - &node_index, &exists - ); - while (node_index < subgraph->nodes.size) { - AnalysisSubgraphNode *node = &subgraph->nodes.contents[node_index++]; - if (node->state != successor.state || node->child_index != successor.child_index) break; - - // Use the subgraph to determine what alias and field will eventually be applied - // to this child node. - TSSymbol alias = ts_language_alias_at(self->language, node->production_id, child_index); - TSSymbol visible_symbol = alias - ? alias - : self->language->symbol_metadata[sym].visible - ? self->language->public_symbol_map[sym] - : 0; - TSFieldId field_id = parent_field_id; - if (!field_id) { - const TSFieldMapEntry *field_map, *field_map_end; - ts_language_field_map(self->language, node->production_id, &field_map, &field_map_end); - for (; field_map != field_map_end; field_map++) { - if (!field_map->inherited && field_map->child_index == child_index) { - field_id = field_map->field_id; - break; - } - } - } - - // Create a new state that has advanced past this hypothetical subtree. 
- AnalysisState next_state = *state; - AnalysisStateEntry *next_state_top = analysis_state__top(&next_state); - next_state_top->child_index = successor.child_index; - next_state_top->parse_state = successor.state; - if (node->done) next_state_top->done = true; - - // Determine if this hypothetical child node would match the current step - // of the query pattern. - bool does_match = false; - if (visible_symbol) { - does_match = true; - if (step->symbol == WILDCARD_SYMBOL) { - if ( - step->is_named && - !self->language->symbol_metadata[visible_symbol].named - ) does_match = false; - } else if (step->symbol != visible_symbol) { - does_match = false; - } - if (step->field && step->field != field_id) { - does_match = false; - } - if ( - step->supertype_symbol && - !analysis_state__has_supertype(state, step->supertype_symbol) - ) does_match = false; - } - - // If this child is hidden, then descend into it and walk through its children. - // If the top entry of the stack is at the end of its rule, then that entry can - // be replaced. Otherwise, push a new entry onto the stack. - else if (sym >= self->language->token_count) { - if (!next_state_top->done) { - if (next_state.depth + 1 >= MAX_ANALYSIS_STATE_DEPTH) { - #ifdef DEBUG_ANALYZE_QUERY - printf("Exceeded depth limit for state %u\n", j); - #endif - - did_abort_analysis = true; - continue; - } - - next_state.depth++; - next_state_top = analysis_state__top(&next_state); - } - - *next_state_top = (AnalysisStateEntry) { - .parse_state = parse_state, - .parent_symbol = sym, - .child_index = 0, - .field_id = field_id, - .done = false, - }; - - if (analysis_state__recursion_depth(&next_state) > recursion_depth_limit) { - analysis_state_set__insert_sorted_by_clone( - &deeper_states, - &state_pool, - &next_state - ); - continue; - } - } - - // Pop from the stack when this state reached the end of its current syntax node. 
- while (next_state.depth > 0 && next_state_top->done) { - next_state.depth--; - next_state_top = analysis_state__top(&next_state); - } - - // If this hypothetical child did match the current step of the query pattern, - // then advance to the next step at the current depth. This involves skipping - // over any descendant steps of the current child. - const QueryStep *next_step = step; - if (does_match) { - for (;;) { - next_state.step_index++; - next_step = &self->steps.contents[next_state.step_index]; - if ( - next_step->depth == PATTERN_DONE_MARKER || - next_step->depth <= parent_depth + 1 - ) break; - } - } else if (successor.state == parse_state) { - continue; - } - - for (;;) { - // Skip pass-through states. Although these states have alternatives, they are only - // used to implement repetitions, and query analysis does not need to process - // repetitions in order to determine whether steps are possible and definite. - if (next_step->is_pass_through) { - next_state.step_index++; - next_step++; - continue; - } - - // If the pattern is finished or hypothetical parent node is complete, then - // record that matching can terminate at this step of the pattern. Otherwise, - // add this state to the list of states to process on the next iteration. - if (!next_step->is_dead_end) { - bool did_finish_pattern = self->steps.contents[next_state.step_index].depth != parent_depth + 1; - if (did_finish_pattern) can_finish_pattern = true; - if (did_finish_pattern || next_state.depth == 0) { - array_insert_sorted_by(&final_step_indices, , next_state.step_index); - } else { - analysis_state_set__insert_sorted_by_clone(&next_states, &state_pool, &next_state); - } - } - - // If the state has advanced to a step with an alternative step, then add another state - // at that alternative step. This process is simpler than the process of actually matching a - // pattern during query execution, because for the purposes of query analysis, there is no - // need to process repetitions. 
- if ( - does_match && - next_step->alternative_index != NONE && - next_step->alternative_index > next_state.step_index - ) { - next_state.step_index = next_step->alternative_index; - next_step = &self->steps.contents[next_state.step_index]; - } else { - break; - } - } - } - } - } - - AnalysisStateSet _states = states; - states = next_states; - next_states = _states; - } + ts_query__analyze_patterns_from_states( + self, + &subgraphs, + &states, + &next_states, + &deeper_states, + &state_pool, + &finished_parent_symbols, + &final_step_indices, + &did_abort_analysis + ); // If this pattern could not be fully analyzed, then every step should // be considered fallible. @@ -1686,7 +1733,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // If this pattern cannot match, store the pattern index so that it can be // returned to the caller. - if (!can_finish_pattern) { + if (finished_parent_symbols.size == 0) { assert(final_step_indices.size > 0); uint16_t impossible_step_index = *array_back(&final_step_indices); uint32_t i, exists; @@ -1810,6 +1857,75 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { } #endif + // Determine which repetition symbols in this language have the possibility + // of matching non-rooted patterns in this query. These repetition symbols + // prevent certain optimizations with range restrictions. 
+ bool did_abort_analysis = false; + for (uint32_t i = 0; i < non_rooted_pattern_start_steps.size; i++) { + uint16_t step_index = non_rooted_pattern_start_steps.contents[i]; + + analysis_state_set__clear(&states, &state_pool); + analysis_state_set__clear(&deeper_states, &state_pool); + + for (unsigned j = 0; j < subgraphs.size; j++) { + AnalysisSubgraph *subgraph = &subgraphs.contents[j]; + TSSymbolMetadata metadata = ts_language_symbol_metadata(self->language, subgraph->symbol); + if (metadata.visible || metadata.named) continue; + for (uint32_t k = 0; k < subgraph->start_states.size; k++) { + TSStateId parse_state = subgraph->start_states.contents[k]; + analysis_state_set__push_by_clone(&states, &state_pool, &((AnalysisState) { + .step_index = step_index, + .stack = { + [0] = { + .parse_state = parse_state, + .parent_symbol = subgraph->symbol, + .child_index = 0, + .field_id = 0, + .done = false, + }, + }, + .root_symbol = subgraph->symbol, + .depth = 1, + })); + } + } + + #ifdef DEBUG_ANALYZE_QUERY + printf("\nWalk states for rootless pattern step %u:\n", step_index); + #endif + + array_clear(&final_step_indices); + array_clear(&finished_parent_symbols); + ts_query__analyze_patterns_from_states( + self, + &subgraphs, + &states, + &next_states, + &deeper_states, + &state_pool, + &finished_parent_symbols, + &final_step_indices, + &did_abort_analysis + ); + + for (unsigned k = 0; k < finished_parent_symbols.size; k++) { + TSSymbol symbol = finished_parent_symbols.contents[k]; + array_insert_sorted_by(&self->repeat_symbols_with_rootless_patterns, , symbol); + } + } + + #ifdef DEBUG_ANALYZE_QUERY + if (self->repeat_symbols_with_rootless_patterns.size > 0) { + printf("\nRepetition symbols with rootless patterns:\n"); + printf("aborted analysis: %d\n", did_abort_analysis); + for (unsigned i = 0; i < self->repeat_symbols_with_rootless_patterns.size; i++) { + TSSymbol symbol = self->repeat_symbols_with_rootless_patterns.contents[i]; + printf(" %u, %s\n", symbol, 
ts_language_symbol_name(self->language, symbol)); + } + printf("\n"); + } + #endif + // Cleanup for (unsigned i = 0; i < subgraphs.size; i++) { array_delete(&subgraphs.contents[i].start_states); @@ -1821,9 +1937,11 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { } array_delete(&state_pool); array_delete(&next_nodes); + array_delete(&non_rooted_pattern_start_steps); analysis_state_set__delete(&states); analysis_state_set__delete(&next_states); analysis_state_set__delete(&deeper_states); + array_delete(&finished_parent_symbols); array_delete(&final_step_indices); array_delete(&parent_step_indices); array_delete(&predicate_capture_ids); @@ -2571,6 +2689,7 @@ TSQuery *ts_query_new( .step_offsets = array_new(), .string_buffer = array_new(), .negated_fields = array_new(), + .repeat_symbols_with_rootless_patterns = array_new(), .wildcard_root_pattern_count = 0, .language = language, }; @@ -2685,6 +2804,7 @@ void ts_query_delete(TSQuery *self) { array_delete(&self->step_offsets); array_delete(&self->string_buffer); array_delete(&self->negated_fields); + array_delete(&self->repeat_symbols_with_rootless_patterns); symbol_table_delete(&self->captures); symbol_table_delete(&self->predicate_values); for (uint32_t index = 0; index < self->capture_quantifiers.size; index++) { @@ -3327,18 +3447,18 @@ static inline bool ts_query_cursor__advance( self->finished_states.size ); - bool node_intersects_range = ( - ts_node_end_byte(node) > self->start_byte && - ts_node_start_byte(node) < self->end_byte && - point_gt(ts_node_end_point(node), self->start_point) && - point_lt(ts_node_start_point(node), self->end_point) - ); bool parent_intersects_range = ts_node_is_null(parent_node) || ( ts_node_end_byte(parent_node) > self->start_byte && ts_node_start_byte(parent_node) < self->end_byte && point_gt(ts_node_end_point(parent_node), self->start_point) && point_lt(ts_node_start_point(parent_node), self->end_point) ); + bool node_intersects_range = 
parent_intersects_range && ( + ts_node_end_byte(node) > self->start_byte && + ts_node_start_byte(node) < self->end_byte && + point_gt(ts_node_end_point(node), self->start_point) && + point_lt(ts_node_start_point(node), self->end_point) + ); bool node_is_error = symbol == ts_builtin_sym_error; bool parent_is_error = !ts_node_is_null(parent_node) && @@ -3679,8 +3799,8 @@ static inline bool ts_query_cursor__advance( // When the current node ends prior to the desired start offset, // only descend for the purpose of continuing in-progress matches. - bool should_descend = node_intersects_range; - if (!should_descend) { + bool has_in_progress_matches = false; + if (!node_intersects_range) { for (unsigned i = 0; i < self->states.size; i++) { QueryState *state = &self->states.contents[i];; QueryStep *next_step = &self->query->steps.contents[state->step_index]; @@ -3688,12 +3808,13 @@ static inline bool ts_query_cursor__advance( next_step->depth != PATTERN_DONE_MARKER && state->start_depth + next_step->depth > self->depth ) { - should_descend = true; + has_in_progress_matches = true; break; } } } + bool should_descend = node_intersects_range || has_in_progress_matches; if (!should_descend) { LOG( " not descending. 
node end byte: %u, start byte: %u\n", From 189cf6d59daa7861f504c74d0a775b8f53cf98e2 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Tue, 14 Feb 2023 15:18:00 -0800 Subject: [PATCH 037/347] Group analysis state sets into QueryAnalysis struct --- lib/src/query.c | 218 ++++++++++++++++++++++-------------------------- 1 file changed, 102 insertions(+), 116 deletions(-) diff --git a/lib/src/query.c b/lib/src/query.c index a756c089..cbc9add6 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -233,9 +233,15 @@ typedef struct { typedef Array(AnalysisState *) AnalysisStateSet; -typedef Array(AnalysisState *) AnalysisStatePool; - -typedef Array(uint16_t) StepIndexArray; +typedef struct { + AnalysisStateSet states; + AnalysisStateSet next_states; + AnalysisStateSet deeper_states; + AnalysisStateSet state_pool; + Array(uint16_t) final_step_indices; + Array(TSSymbol) finished_parent_symbols; + bool did_abort; +} QueryAnalysis; /* * AnalysisSubgraph - A subset of the states in the parse table that are used @@ -940,30 +946,23 @@ static inline bool analysis_state__has_supertype(AnalysisState *self, TSSymbol s return false; } -static inline AnalysisState *analysis_state__clone(AnalysisState const *self) { - AnalysisState *new_state = ts_malloc(sizeof(AnalysisState)); - *new_state = *self; - return new_state; -} - -/**************** +/****************** * AnalysisStateSet - ****************/ + ******************/ // Obtains an `AnalysisState` instance, either by consuming one from this set's object pool, or by // cloning one from scratch. 
static inline AnalysisState *analysis_state_pool__clone_or_reuse( - AnalysisStatePool *self, + AnalysisStateSet *self, AnalysisState *borrowed_item ) { AnalysisState *new_item; if (self->size) { new_item = array_pop(self); - *new_item = *borrowed_item; } else { - new_item = analysis_state__clone(borrowed_item); + new_item = ts_malloc(sizeof(AnalysisState)); } - + *new_item = *borrowed_item; return new_item; } @@ -973,9 +972,9 @@ static inline AnalysisState *analysis_state_pool__clone_or_reuse( // // The caller retains ownership of the passed-in memory. However, the clone that is created by this // function will be managed by the state set. -static inline void analysis_state_set__insert_sorted_by_clone( +static inline void analysis_state_set__insert_sorted( AnalysisStateSet *self, - AnalysisStatePool *pool, + AnalysisStateSet *pool, AnalysisState *borrowed_item ) { unsigned index, exists; @@ -994,9 +993,9 @@ static inline void analysis_state_set__insert_sorted_by_clone( // // The caller retains ownership of the passed-in memory. However, the clone that is created by this // function will be managed by the state set. -static inline void analysis_state_set__push_by_clone( +static inline void analysis_state_set__push( AnalysisStateSet *self, - AnalysisStatePool *pool, + AnalysisStateSet *pool, AnalysisState *borrowed_item ) { AnalysisState *new_item = analysis_state_pool__clone_or_reuse(pool, borrowed_item); @@ -1004,7 +1003,7 @@ static inline void analysis_state_set__push_by_clone( } // Removes all items from this set, returning it to an empty state. 
-static inline void analysis_state_set__clear(AnalysisStateSet *self, AnalysisStatePool *pool) { +static inline void analysis_state_set__clear(AnalysisStateSet *self, AnalysisStateSet *pool) { array_push_all(pool, self); array_clear(self); } @@ -1018,6 +1017,31 @@ static inline void analysis_state_set__delete(AnalysisStateSet *self) { array_delete(self); } +/**************** + * QueryAnalyzer + ****************/ + +static inline QueryAnalysis query_analysis__new() { + return (QueryAnalysis) { + .states = array_new(), + .next_states = array_new(), + .deeper_states = array_new(), + .state_pool = array_new(), + .final_step_indices = array_new(), + .finished_parent_symbols = array_new(), + .did_abort = false, + }; +} + +static inline void query_analysis__delete(QueryAnalysis *self) { + analysis_state_set__delete(&self->states); + analysis_state_set__delete(&self->next_states); + analysis_state_set__delete(&self->deeper_states); + analysis_state_set__delete(&self->state_pool); + array_delete(&self->final_step_indices); + array_delete(&self->finished_parent_symbols); +} + /*********************** * AnalysisSubgraphNode ***********************/ @@ -1119,23 +1143,21 @@ static inline void ts_query__pattern_map_insert( array_insert(&self->pattern_map, index, new_entry); } -static void ts_query__analyze_patterns_from_states( +// Walk the subgraph for this non-terminal, tracking all of the possible +// sequences of progress within the pattern. 
+static void ts_query__perform_analysis( TSQuery *self, const AnalysisSubgraphArray *subgraphs, - AnalysisStateSet *states, - AnalysisStateSet *next_states, - AnalysisStateSet *deeper_states, - AnalysisStatePool *state_pool, - StepIndexArray *finished_parent_symbols, - StepIndexArray *final_step_indices, - bool *did_abort_analysis + QueryAnalysis *analysis ) { unsigned recursion_depth_limit = 0; unsigned prev_final_step_count = 0; + array_clear(&analysis->final_step_indices); + array_clear(&analysis->finished_parent_symbols); for (unsigned iteration = 0;; iteration++) { if (iteration == MAX_ANALYSIS_ITERATION_COUNT) { - *did_abort_analysis = true; + analysis->did_abort = true; break; } @@ -1167,52 +1189,52 @@ static void ts_query__analyze_patterns_from_states( // bump the depth limit by one, and continue to process the states the exceeded the // limit. But only allow this if progress has been made since the last time the depth // limit was increased. - if (states->size == 0) { + if (analysis->states.size == 0) { if ( - deeper_states->size > 0 - && final_step_indices->size > prev_final_step_count + analysis->deeper_states.size > 0 && + analysis->final_step_indices.size > prev_final_step_count ) { #ifdef DEBUG_ANALYZE_QUERY printf("Increase recursion depth limit to %u\n", recursion_depth_limit + 1); #endif - prev_final_step_count = final_step_indices->size; + prev_final_step_count = analysis->final_step_indices.size; recursion_depth_limit++; - AnalysisStateSet _states = *states; - *states = *deeper_states; - *deeper_states = _states; + AnalysisStateSet _states = analysis->states; + analysis->states = analysis->deeper_states; + analysis->deeper_states = _states; continue; } break; } - analysis_state_set__clear(next_states, state_pool); - for (unsigned j = 0; j < states->size; j++) { - AnalysisState * const state = states->contents[j]; + analysis_state_set__clear(&analysis->next_states, &analysis->state_pool); + for (unsigned j = 0; j < analysis->states.size; j++) { + 
AnalysisState * const state = analysis->states.contents[j]; // For efficiency, it's important to avoid processing the same analysis state more // than once. To achieve this, keep the states in order of ascending position within // their hypothetical syntax trees. In each iteration of this loop, start by advancing // the states that have made the least progress. Avoid advancing states that have already // made more progress. - if (next_states->size > 0) { + if (analysis->next_states.size > 0) { int comparison = analysis_state__compare_position( &state, - array_back(next_states) + array_back(&analysis->next_states) ); if (comparison == 0) { - analysis_state_set__insert_sorted_by_clone(next_states, state_pool, state); + analysis_state_set__insert_sorted(&analysis->next_states, &analysis->state_pool, state); continue; } else if (comparison > 0) { #ifdef DEBUG_ANALYZE_QUERY printf("Terminate iteration at state %u\n", j); #endif - while (j < states->size) { - analysis_state_set__push_by_clone( - next_states, - state_pool, - states->contents[j] + while (j < analysis->states.size) { + analysis_state_set__push( + &analysis->next_states, + &analysis->state_pool, + analysis->states.contents[j] ); j++; } @@ -1327,7 +1349,7 @@ static void ts_query__analyze_patterns_from_states( printf("Exceeded depth limit for state %u\n", j); #endif - *did_abort_analysis = true; + analysis->did_abort = true; continue; } @@ -1344,9 +1366,9 @@ static void ts_query__analyze_patterns_from_states( }; if (analysis_state__recursion_depth(&next_state) > recursion_depth_limit) { - analysis_state_set__insert_sorted_by_clone( - deeper_states, - state_pool, + analysis_state_set__insert_sorted( + &analysis->deeper_states, + &analysis->state_pool, &next_state ); continue; @@ -1392,11 +1414,11 @@ static void ts_query__analyze_patterns_from_states( if (!next_step->is_dead_end) { bool did_finish_pattern = self->steps.contents[next_state.step_index].depth != step->depth; if (did_finish_pattern) { - 
array_insert_sorted_by(finished_parent_symbols, , state->root_symbol); + array_insert_sorted_by(&analysis->finished_parent_symbols, , state->root_symbol); } else if (next_state.depth == 0) { - array_insert_sorted_by(final_step_indices, , next_state.step_index); + array_insert_sorted_by(&analysis->final_step_indices, , next_state.step_index); } else { - analysis_state_set__insert_sorted_by_clone(next_states, state_pool, &next_state); + analysis_state_set__insert_sorted(&analysis->next_states, &analysis->state_pool, &next_state); } } @@ -1419,9 +1441,9 @@ static void ts_query__analyze_patterns_from_states( } } - AnalysisStateSet _states = *states; - *states = *next_states; - *next_states = _states; + AnalysisStateSet _states = analysis->states; + analysis->states = analysis->next_states; + analysis->next_states = _states; } } @@ -1643,12 +1665,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // For each non-terminal pattern, determine if the pattern can successfully match, // and identify all of the possible children within the pattern where matching could fail. bool all_patterns_are_valid = true; - AnalysisStateSet states = array_new(); - AnalysisStateSet next_states = array_new(); - AnalysisStateSet deeper_states = array_new(); - AnalysisStatePool state_pool = array_new(); - StepIndexArray final_step_indices = array_new(); - StepIndexArray finished_parent_symbols = array_new(); + QueryAnalysis analysis = query_analysis__new(); for (unsigned i = 0; i < parent_step_indices.size; i++) { uint16_t parent_step_index = parent_step_indices.contents[i]; uint16_t parent_depth = self->steps.contents[parent_step_index].depth; @@ -1672,11 +1689,11 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // Initialize an analysis state at every parse state in the table where // this parent symbol can occur. 
AnalysisSubgraph *subgraph = &subgraphs.contents[subgraph_index]; - analysis_state_set__clear(&states, &state_pool); - analysis_state_set__clear(&deeper_states, &state_pool); + analysis_state_set__clear(&analysis.states, &analysis.state_pool); + analysis_state_set__clear(&analysis.deeper_states, &analysis.state_pool); for (unsigned j = 0; j < subgraph->start_states.size; j++) { TSStateId parse_state = subgraph->start_states.contents[j]; - analysis_state_set__push_by_clone(&states, &state_pool, &((AnalysisState) { + analysis_state_set__push(&analysis.states, &analysis.state_pool, &((AnalysisState) { .step_index = parent_step_index + 1, .stack = { [0] = { @@ -1692,31 +1709,16 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { })); } - // Walk the subgraph for this non-terminal, tracking all of the possible - // sequences of progress within the pattern. - bool did_abort_analysis = false; - array_clear(&final_step_indices); - array_clear(&finished_parent_symbols); - #ifdef DEBUG_ANALYZE_QUERY printf("\nWalk states for %s:\n", ts_language_symbol_name(self->language, states.contents[0]->stack[0].parent_symbol)); #endif - ts_query__analyze_patterns_from_states( - self, - &subgraphs, - &states, - &next_states, - &deeper_states, - &state_pool, - &finished_parent_symbols, - &final_step_indices, - &did_abort_analysis - ); + analysis.did_abort = false; + ts_query__perform_analysis(self, &subgraphs, &analysis); // If this pattern could not be fully analyzed, then every step should // be considered fallible. - if (did_abort_analysis) { + if (analysis.did_abort) { for (unsigned j = parent_step_index + 1; j < self->steps.size; j++) { QueryStep *step = &self->steps.contents[j]; if ( @@ -1733,9 +1735,9 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // If this pattern cannot match, store the pattern index so that it can be // returned to the caller. 
- if (finished_parent_symbols.size == 0) { - assert(final_step_indices.size > 0); - uint16_t impossible_step_index = *array_back(&final_step_indices); + if (analysis.finished_parent_symbols.size == 0) { + assert(analysis.final_step_indices.size > 0); + uint16_t impossible_step_index = *array_back(&analysis.final_step_indices); uint32_t i, exists; array_search_sorted_by(&self->step_offsets, .step_index, impossible_step_index, &i, &exists); if (i >= self->step_offsets.size) i = self->step_offsets.size - 1; @@ -1746,8 +1748,8 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // Mark as fallible any step where a match terminated. // Later, this property will be propagated to all of the step's predecessors. - for (unsigned j = 0; j < final_step_indices.size; j++) { - uint32_t final_step_index = final_step_indices.contents[j]; + for (unsigned j = 0; j < analysis.final_step_indices.size; j++) { + uint32_t final_step_index = analysis.final_step_indices.contents[j]; QueryStep *step = &self->steps.contents[final_step_index]; if ( step->depth != PATTERN_DONE_MARKER && @@ -1860,20 +1862,20 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // Determine which repetition symbols in this language have the possibility // of matching non-rooted patterns in this query. These repetition symbols // prevent certain optimizations with range restrictions. 
- bool did_abort_analysis = false; + analysis.did_abort = false; for (uint32_t i = 0; i < non_rooted_pattern_start_steps.size; i++) { uint16_t step_index = non_rooted_pattern_start_steps.contents[i]; - analysis_state_set__clear(&states, &state_pool); - analysis_state_set__clear(&deeper_states, &state_pool); - + analysis_state_set__clear(&analysis.states, &analysis.state_pool); + analysis_state_set__clear(&analysis.deeper_states, &analysis.state_pool); for (unsigned j = 0; j < subgraphs.size; j++) { AnalysisSubgraph *subgraph = &subgraphs.contents[j]; TSSymbolMetadata metadata = ts_language_symbol_metadata(self->language, subgraph->symbol); if (metadata.visible || metadata.named) continue; + for (uint32_t k = 0; k < subgraph->start_states.size; k++) { TSStateId parse_state = subgraph->start_states.contents[k]; - analysis_state_set__push_by_clone(&states, &state_pool, &((AnalysisState) { + analysis_state_set__push(&analysis.states, &analysis.state_pool, &((AnalysisState) { .step_index = step_index, .stack = { [0] = { @@ -1894,22 +1896,14 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { printf("\nWalk states for rootless pattern step %u:\n", step_index); #endif - array_clear(&final_step_indices); - array_clear(&finished_parent_symbols); - ts_query__analyze_patterns_from_states( + ts_query__perform_analysis( self, &subgraphs, - &states, - &next_states, - &deeper_states, - &state_pool, - &finished_parent_symbols, - &final_step_indices, - &did_abort_analysis + &analysis ); - for (unsigned k = 0; k < finished_parent_symbols.size; k++) { - TSSymbol symbol = finished_parent_symbols.contents[k]; + for (unsigned k = 0; k < analysis.finished_parent_symbols.size; k++) { + TSSymbol symbol = analysis.finished_parent_symbols.contents[k]; array_insert_sorted_by(&self->repeat_symbols_with_rootless_patterns, , symbol); } } @@ -1917,7 +1911,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { #ifdef DEBUG_ANALYZE_QUERY 
if (self->repeat_symbols_with_rootless_patterns.size > 0) { printf("\nRepetition symbols with rootless patterns:\n"); - printf("aborted analysis: %d\n", did_abort_analysis); + printf("aborted analysis: %d\n", analyzer.did_abort); for (unsigned i = 0; i < self->repeat_symbols_with_rootless_patterns.size; i++) { TSSymbol symbol = self->repeat_symbols_with_rootless_patterns.contents[i]; printf(" %u, %s\n", symbol, ts_language_symbol_name(self->language, symbol)); @@ -1932,17 +1926,9 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { array_delete(&subgraphs.contents[i].nodes); } array_delete(&subgraphs); - for (unsigned i = 0; i < state_pool.size; i++) { - ts_free(state_pool.contents[i]); - } - array_delete(&state_pool); + query_analysis__delete(&analysis); array_delete(&next_nodes); array_delete(&non_rooted_pattern_start_steps); - analysis_state_set__delete(&states); - analysis_state_set__delete(&next_states); - analysis_state_set__delete(&deeper_states); - array_delete(&finished_parent_symbols); - array_delete(&final_step_indices); array_delete(&parent_step_indices); array_delete(&predicate_capture_ids); state_predecessor_map_delete(&predecessor_map); From 29c9073177d4e5f750daa9619feab75701a9a286 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Wed, 15 Feb 2023 14:01:59 -0800 Subject: [PATCH 038/347] Extract 'internal' versions of tree cursor movement fns that allow visiting hidden nodes --- lib/src/tree_cursor.c | 126 +++++++++++++++++++----------------------- lib/src/tree_cursor.h | 15 +++++ 2 files changed, 72 insertions(+), 69 deletions(-) diff --git a/lib/src/tree_cursor.c b/lib/src/tree_cursor.c index e8dc98a9..98930250 100644 --- a/lib/src/tree_cursor.c +++ b/lib/src/tree_cursor.c @@ -98,34 +98,43 @@ void ts_tree_cursor_delete(TSTreeCursor *_self) { // TSTreeCursor - walking the tree -bool ts_tree_cursor_goto_first_child(TSTreeCursor *_self) { +TreeCursorStep ts_tree_cursor_goto_first_child_internal(TSTreeCursor *_self) { 
TreeCursor *self = (TreeCursor *)_self; - - bool did_descend; - do { - did_descend = false; - - bool visible; - TreeCursorEntry entry; - CursorChildIterator iterator = ts_tree_cursor_iterate_children(self); - while (ts_tree_cursor_child_iterator_next(&iterator, &entry, &visible)) { - if (visible) { - array_push(&self->stack, entry); - return true; - } - - if (ts_subtree_visible_child_count(*entry.subtree) > 0) { - array_push(&self->stack, entry); - did_descend = true; - break; - } + bool visible; + TreeCursorEntry entry; + CursorChildIterator iterator = ts_tree_cursor_iterate_children(self); + while (ts_tree_cursor_child_iterator_next(&iterator, &entry, &visible)) { + if (visible) { + array_push(&self->stack, entry); + return TreeCursorStepVisible; } - } while (did_descend); + if (ts_subtree_visible_child_count(*entry.subtree) > 0) { + array_push(&self->stack, entry); + return TreeCursorStepHidden; + } + } + return TreeCursorStepNone; +} +bool ts_tree_cursor_goto_first_child(TSTreeCursor *self) { + for (;;) { + switch (ts_tree_cursor_goto_first_child_internal(self)) { + case TreeCursorStepHidden: + continue; + case TreeCursorStepVisible: + return true; + default: + return false; + } + } return false; } -int64_t ts_tree_cursor_goto_first_child_for_byte(TSTreeCursor *_self, uint32_t goal_byte) { +static inline int64_t ts_tree_cursor_goto_first_child_for_byte_and_point( + TSTreeCursor *_self, + uint32_t goal_byte, + TSPoint goal_point +) { TreeCursor *self = (TreeCursor *)_self; uint32_t initial_size = self->stack.size; uint32_t visible_child_index = 0; @@ -138,48 +147,8 @@ int64_t ts_tree_cursor_goto_first_child_for_byte(TSTreeCursor *_self, uint32_t g TreeCursorEntry entry; CursorChildIterator iterator = ts_tree_cursor_iterate_children(self); while (ts_tree_cursor_child_iterator_next(&iterator, &entry, &visible)) { - uint32_t end_byte = entry.position.bytes + ts_subtree_size(*entry.subtree).bytes; - bool at_goal = end_byte >= goal_byte; - uint32_t 
visible_child_count = ts_subtree_visible_child_count(*entry.subtree); - - if (at_goal) { - if (visible) { - array_push(&self->stack, entry); - return visible_child_index; - } - - if (visible_child_count > 0) { - array_push(&self->stack, entry); - did_descend = true; - break; - } - } else if (visible) { - visible_child_index++; - } else { - visible_child_index += visible_child_count; - } - } - } while (did_descend); - - self->stack.size = initial_size; - return -1; -} - -int64_t ts_tree_cursor_goto_first_child_for_point(TSTreeCursor *_self, TSPoint goal_point) { - TreeCursor *self = (TreeCursor *)_self; - uint32_t initial_size = self->stack.size; - uint32_t visible_child_index = 0; - - bool did_descend; - do { - did_descend = false; - - bool visible; - TreeCursorEntry entry; - CursorChildIterator iterator = ts_tree_cursor_iterate_children(self); - while (ts_tree_cursor_child_iterator_next(&iterator, &entry, &visible)) { - TSPoint end_point = point_add(entry.position.extent, ts_subtree_size(*entry.subtree).extent); - bool at_goal = point_gte(end_point, goal_point); + Length entry_end = length_add(entry.position, ts_subtree_size(*entry.subtree)); + bool at_goal = entry_end.bytes >= goal_byte && point_gte(entry_end.extent, goal_point); uint32_t visible_child_count = ts_subtree_visible_child_count(*entry.subtree); if (at_goal) { if (visible) { @@ -203,7 +172,15 @@ int64_t ts_tree_cursor_goto_first_child_for_point(TSTreeCursor *_self, TSPoint g return -1; } -bool ts_tree_cursor_goto_next_sibling(TSTreeCursor *_self) { +int64_t ts_tree_cursor_goto_first_child_for_byte(TSTreeCursor *self, uint32_t goal_byte) { + return ts_tree_cursor_goto_first_child_for_byte_and_point(self, goal_byte, POINT_ZERO); +} + +int64_t ts_tree_cursor_goto_first_child_for_point(TSTreeCursor *self, TSPoint goal_point) { + return ts_tree_cursor_goto_first_child_for_byte_and_point(self, 0, goal_point); +} + +TreeCursorStep ts_tree_cursor_goto_next_sibling_internal(TSTreeCursor *_self) { TreeCursor 
*self = (TreeCursor *)_self; uint32_t initial_size = self->stack.size; @@ -221,19 +198,30 @@ bool ts_tree_cursor_goto_next_sibling(TSTreeCursor *_self) { while (ts_tree_cursor_child_iterator_next(&iterator, &entry, &visible)) { if (visible) { array_push(&self->stack, entry); - return true; + return TreeCursorStepVisible; } if (ts_subtree_visible_child_count(*entry.subtree)) { array_push(&self->stack, entry); - ts_tree_cursor_goto_first_child(_self); - return true; + return TreeCursorStepHidden; } } } self->stack.size = initial_size; - return false; + return TreeCursorStepNone; +} + +bool ts_tree_cursor_goto_next_sibling(TSTreeCursor *self) { + switch (ts_tree_cursor_goto_next_sibling_internal(self)) { + case TreeCursorStepHidden: + ts_tree_cursor_goto_first_child(self); + return true; + case TreeCursorStepVisible: + return true; + default: + return false; + } } bool ts_tree_cursor_goto_parent(TSTreeCursor *_self) { diff --git a/lib/src/tree_cursor.h b/lib/src/tree_cursor.h index 69647d1d..7b94db6b 100644 --- a/lib/src/tree_cursor.h +++ b/lib/src/tree_cursor.h @@ -15,6 +15,12 @@ typedef struct { Array(TreeCursorEntry) stack; } TreeCursor; +typedef enum { + TreeCursorStepNone, + TreeCursorStepHidden, + TreeCursorStepVisible, +} TreeCursorStep; + void ts_tree_cursor_init(TreeCursor *, TSNode); void ts_tree_cursor_current_status( const TSTreeCursor *, @@ -26,6 +32,15 @@ void ts_tree_cursor_current_status( unsigned * ); +TreeCursorStep ts_tree_cursor_goto_first_child_internal(TSTreeCursor *); +TreeCursorStep ts_tree_cursor_goto_next_sibling_internal(TSTreeCursor *); + +static inline Subtree ts_tree_cursor_current_subtree(const TSTreeCursor *_self) { + const TreeCursor *self = (const TreeCursor *)_self; + TreeCursorEntry *last_entry = array_back(&self->stack); + return *last_entry->subtree; +} + TSNode ts_tree_cursor_parent_node(const TSTreeCursor *); #endif // TREE_SITTER_TREE_CURSOR_H_ From fa869cf3eddac07d82bfd48f7fda0a0705087a51 Mon Sep 17 00:00:00 2001 From: Max 
Brunsfeld Date: Wed, 15 Feb 2023 14:03:15 -0800 Subject: [PATCH 039/347] Restructure query_cursor_advance to explicitly control which hidden nodes it descends into --- lib/src/query.c | 914 ++++++++++++++++++++++++---------------------- lib/src/subtree.h | 6 + 2 files changed, 492 insertions(+), 428 deletions(-) diff --git a/lib/src/query.c b/lib/src/query.c index cbc9add6..04a59f9a 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -309,6 +309,7 @@ struct TSQueryCursor { TSPoint start_point; TSPoint end_point; uint32_t next_state_id; + bool on_visible_node; bool ascending; bool halted; bool did_exceed_match_limit; @@ -1163,12 +1164,12 @@ static void ts_query__perform_analysis( #ifdef DEBUG_ANALYZE_QUERY printf("Iteration: %u. Final step indices:", iteration); - for (unsigned j = 0; j < final_step_indices->size; j++) { - printf(" %4u", final_step_indices->contents[j]); + for (unsigned j = 0; j < analysis->final_step_indices.size; j++) { + printf(" %4u", analysis->final_step_indices.contents[j]); } printf("\n"); - for (unsigned j = 0; j < states->size; j++) { - AnalysisState *state = states->contents[j]; + for (unsigned j = 0; j < analysis->states.size; j++) { + AnalysisState *state = analysis->states.contents[j]; printf(" %3u: step: %u, stack: [", j, state->step_index); for (unsigned k = 0; k < state->depth; k++) { printf( @@ -1710,7 +1711,10 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { } #ifdef DEBUG_ANALYZE_QUERY - printf("\nWalk states for %s:\n", ts_language_symbol_name(self->language, states.contents[0]->stack[0].parent_symbol)); + printf( + "\nWalk states for %s:\n", + ts_language_symbol_name(self->language, analysis.states.contents[0]->stack[0].parent_symbol) + ); #endif analysis.did_abort = false; @@ -1911,7 +1915,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { #ifdef DEBUG_ANALYZE_QUERY if (self->repeat_symbols_with_rootless_patterns.size > 0) { printf("\nRepetition symbols with 
rootless patterns:\n"); - printf("aborted analysis: %d\n", analyzer.did_abort); + printf("aborted analysis: %d\n", analysis.did_abort); for (unsigned i = 0; i < self->repeat_symbols_with_rootless_patterns.size; i++) { TSSymbol symbol = self->repeat_symbols_with_rootless_patterns.contents[i]; printf(" %u, %s\n", symbol, ts_language_symbol_name(self->language, symbol)); @@ -2986,6 +2990,7 @@ void ts_query_cursor_exec( array_clear(&self->finished_states); ts_tree_cursor_reset(&self->cursor, node); capture_list_pool_reset(&self->capture_list_pool); + self->on_visible_node = true; self->next_state_id = 0; self->depth = 0; self->ascending = false; @@ -3320,6 +3325,50 @@ static QueryState *ts_query_cursor__copy_state( return &self->states.contents[state_index + 1]; } +static inline bool ts_query_cursor__should_descend_outside_of_range( + TSQueryCursor *self +) { + // If there are in-progress matches whose remaining steps occur + // deeper in the tree, then descend. + for (unsigned i = 0; i < self->states.size; i++) { + QueryState *state = &self->states.contents[i];; + QueryStep *next_step = &self->query->steps.contents[state->step_index]; + if ( + next_step->depth != PATTERN_DONE_MARKER && + state->start_depth + next_step->depth > self->depth + ) { + return true; + } + } + + // If the current node is hidden, then a non-rooted pattern might match + // one if its roots inside of this node, and match another of its roots + // as part of a sibling node, so we may need to descend. + if (!self->on_visible_node) { + // Descending into a repetition node outside of the range can be + // expensive, because these nodes can have many visible children. + // Avoid descending into repetition nodes unless we have already + // determined that this query can match rootless patterns inside + // of this type of repetition node. 
+ Subtree subtree = ts_tree_cursor_current_subtree(&self->cursor); + if (ts_subtree_is_repetition(subtree)) { + bool exists; + uint32_t index; + array_search_sorted_by( + &self->query->repeat_symbols_with_rootless_patterns,, + ts_subtree_symbol(subtree), + &index, + &exists + ); + return exists; + } + + return true; + } + + return false; +} + // Walk the tree, processing patterns until at least one pattern finishes, // If one or more patterns finish, return `true` and store their states in the // `finished_states` array. Multiple patterns can finish on the same node. If @@ -3351,219 +3400,49 @@ static inline bool ts_query_cursor__advance( ); // Leave this node by stepping to its next sibling or to its parent. - if (ts_tree_cursor_goto_next_sibling(&self->cursor)) { - self->ascending = false; - } else if (ts_tree_cursor_goto_parent(&self->cursor)) { - self->depth--; - } else { - LOG("halt at root\n"); - self->halted = true; - } - - // After leaving a node, remove any states that cannot make further progress. - uint32_t deleted_count = 0; - for (unsigned i = 0, n = self->states.size; i < n; i++) { - QueryState *state = &self->states.contents[i]; - QueryStep *step = &self->query->steps.contents[state->step_index]; - - // If a state completed its pattern inside of this node, but was deferred from finishing - // in order to search for longer matches, mark it as finished. - if (step->depth == PATTERN_DONE_MARKER) { - if (state->start_depth > self->depth || self->halted) { - LOG(" finish pattern %u\n", state->pattern_index); - array_push(&self->finished_states, *state); - did_match = true; - deleted_count++; - continue; - } - } - - // If a state needed to match something within this node, then remove that state - // as it has failed to match. - else if ((uint32_t)state->start_depth + (uint32_t)step->depth > self->depth) { - LOG( - " failed to match. 
pattern:%u, step:%u\n", - state->pattern_index, - state->step_index - ); - capture_list_pool_release( - &self->capture_list_pool, - state->capture_list_id - ); - deleted_count++; - continue; - } - - if (deleted_count > 0) { - self->states.contents[i - deleted_count] = *state; - } - } - self->states.size -= deleted_count; - } - - // Enter a new node. - else { - // Get the properties of the current node. - TSNode node = ts_tree_cursor_current_node(&self->cursor); - TSNode parent_node = ts_tree_cursor_parent_node(&self->cursor); - TSSymbol symbol = ts_node_symbol(node); - bool is_named = ts_node_is_named(node); - bool has_later_siblings; - bool has_later_named_siblings; - bool can_have_later_siblings_with_this_field; - TSFieldId field_id = 0; - TSSymbol supertypes[8] = {0}; - unsigned supertype_count = 8; - ts_tree_cursor_current_status( - &self->cursor, - &field_id, - &has_later_siblings, - &has_later_named_siblings, - &can_have_later_siblings_with_this_field, - supertypes, - &supertype_count - ); - LOG( - "enter node. 
depth:%u, type:%s, field:%s, row:%u state_count:%u, finished_state_count:%u\n", - self->depth, - ts_node_type(node), - ts_language_field_name_for_id(self->query->language, field_id), - ts_node_start_point(node).row, - self->states.size, - self->finished_states.size - ); - - bool parent_intersects_range = ts_node_is_null(parent_node) || ( - ts_node_end_byte(parent_node) > self->start_byte && - ts_node_start_byte(parent_node) < self->end_byte && - point_gt(ts_node_end_point(parent_node), self->start_point) && - point_lt(ts_node_start_point(parent_node), self->end_point) - ); - bool node_intersects_range = parent_intersects_range && ( - ts_node_end_byte(node) > self->start_byte && - ts_node_start_byte(node) < self->end_byte && - point_gt(ts_node_end_point(node), self->start_point) && - point_lt(ts_node_start_point(node), self->end_point) - ); - bool node_is_error = symbol == ts_builtin_sym_error; - bool parent_is_error = - !ts_node_is_null(parent_node) && - ts_node_symbol(parent_node) == ts_builtin_sym_error; - - // Add new states for any patterns whose root node is a wildcard. - if (!node_is_error) { - for (unsigned i = 0; i < self->query->wildcard_root_pattern_count; i++) { - PatternEntry *pattern = &self->query->pattern_map.contents[i]; - - // If this node matches the first step of the pattern, then add a new - // state at the start of this pattern. - QueryStep *step = &self->query->steps.contents[pattern->step_index]; - if ( - (pattern->is_rooted ? - node_intersects_range : - (parent_intersects_range && !parent_is_error)) && - (!step->field || field_id == step->field) && - (!step->supertype_symbol || supertype_count > 0) - ) { - ts_query_cursor__add_state(self, pattern); - } - } - } - - // Add new states for any patterns whose root node matches this node. 
- unsigned i; - if (ts_query__pattern_map_search(self->query, symbol, &i)) { - PatternEntry *pattern = &self->query->pattern_map.contents[i]; - - QueryStep *step = &self->query->steps.contents[pattern->step_index]; - do { - // If this node matches the first step of the pattern, then add a new - // state at the start of this pattern. - if ( - (pattern->is_rooted ? - node_intersects_range : - (parent_intersects_range && !parent_is_error)) && - (!step->field || field_id == step->field) - ) { - ts_query_cursor__add_state(self, pattern); - } - - // Advance to the next pattern whose root node matches this node. - i++; - if (i == self->query->pattern_map.size) break; - pattern = &self->query->pattern_map.contents[i]; - step = &self->query->steps.contents[pattern->step_index]; - } while (step->symbol == symbol); - } - - // Update all of the in-progress states with current node. - for (unsigned i = 0, copy_count = 0; i < self->states.size; i += 1 + copy_count) { - QueryState *state = &self->states.contents[i]; - QueryStep *step = &self->query->steps.contents[state->step_index]; - state->has_in_progress_alternatives = false; - copy_count = 0; - - // Check that the node matches all of the criteria for the next - // step of the pattern. - if ((uint32_t)state->start_depth + (uint32_t)step->depth != self->depth) continue; - - // Determine if this node matches this step of the pattern, and also - // if this node can have later siblings that match this step of the - // pattern. 
- bool node_does_match = false; - if (step->symbol == WILDCARD_SYMBOL) { - node_does_match = !node_is_error && (is_named || !step->is_named); - } else { - node_does_match = symbol == step->symbol; - } - bool later_sibling_can_match = has_later_siblings; - if ((step->is_immediate && is_named) || state->seeking_immediate_match) { - later_sibling_can_match = false; - } - if (step->is_last_child && has_later_named_siblings) { - node_does_match = false; - } - if (step->supertype_symbol) { - bool has_supertype = false; - for (unsigned j = 0; j < supertype_count; j++) { - if (supertypes[j] == step->supertype_symbol) { - has_supertype = true; - break; - } - } - if (!has_supertype) node_does_match = false; - } - if (step->field) { - if (step->field == field_id) { - if (!can_have_later_siblings_with_this_field) { - later_sibling_can_match = false; - } + switch (ts_tree_cursor_goto_next_sibling_internal(&self->cursor)) { + case TreeCursorStepVisible: + self->on_visible_node = true; + self->ascending = false; + break; + case TreeCursorStepHidden: + self->depth--; + self->on_visible_node = false; + self->ascending = false; + break; + default: + if (ts_tree_cursor_goto_parent(&self->cursor)) { + self->depth--; } else { - node_does_match = false; + LOG("halt at root\n"); + self->halted = true; } - } + } - if (step->negated_field_list_id) { - TSFieldId *negated_field_ids = &self->query->negated_fields.contents[step->negated_field_list_id]; - for (;;) { - TSFieldId negated_field_id = *negated_field_ids; - if (negated_field_id) { - negated_field_ids++; - if (ts_node_child_by_field_id(node, negated_field_id).id) { - node_does_match = false; - break; - } - } else { - break; + if (self->on_visible_node) { + // After leaving a node, remove any states that cannot make further progress. 
+ uint32_t deleted_count = 0; + for (unsigned i = 0, n = self->states.size; i < n; i++) { + QueryState *state = &self->states.contents[i]; + QueryStep *step = &self->query->steps.contents[state->step_index]; + + // If a state completed its pattern inside of this node, but was deferred from finishing + // in order to search for longer matches, mark it as finished. + if (step->depth == PATTERN_DONE_MARKER) { + if (state->start_depth > self->depth || self->halted) { + LOG(" finish pattern %u\n", state->pattern_index); + array_push(&self->finished_states, *state); + did_match = true; + deleted_count++; + continue; } } - } - // Remove states immediately if it is ever clear that they cannot match. - if (!node_does_match) { - if (!later_sibling_can_match) { + // If a state needed to match something within this node, then remove that state + // as it has failed to match. + else if ((uint32_t)state->start_depth + (uint32_t)step->depth > self->depth) { LOG( - " discard state. pattern:%u, step:%u\n", + " failed to match. pattern:%u, step:%u\n", state->pattern_index, state->step_index ); @@ -3571,249 +3450,428 @@ static inline bool ts_query_cursor__advance( &self->capture_list_pool, state->capture_list_id ); - array_erase(&self->states, i); - i--; + deleted_count++; + continue; } - continue; - } - // Some patterns can match their root node in multiple ways, capturing different - // children. If this pattern step could match later children within the same - // parent, then this query state cannot simply be updated in place. It must be - // split into two states: one that matches this node, and one which skips over - // this node, to preserve the possibility of matching later siblings. - if (later_sibling_can_match && ( - step->contains_captures || - ts_query__step_is_fallible(self->query, state->step_index) - )) { - if (ts_query_cursor__copy_state(self, &state)) { - LOG( - " split state for capture. 
pattern:%u, step:%u\n", - state->pattern_index, - state->step_index - ); - copy_count++; + if (deleted_count > 0) { + self->states.contents[i - deleted_count] = *state; } } + self->states.size -= deleted_count; + } + } - // If this pattern started with a wildcard, such that the pattern map - // actually points to the *second* step of the pattern, then check - // that the node has a parent, and capture the parent node if necessary. - if (state->needs_parent) { - TSNode parent = ts_tree_cursor_parent_node(&self->cursor); - if (ts_node_is_null(parent)) { - LOG(" missing parent node\n"); - state->dead = true; - } else { - state->needs_parent = false; - QueryStep *skipped_wildcard_step = step; - do { - skipped_wildcard_step--; - } while ( - skipped_wildcard_step->is_dead_end || - skipped_wildcard_step->is_pass_through || - skipped_wildcard_step->depth > 0 - ); - if (skipped_wildcard_step->capture_ids[0] != NONE) { - LOG(" capture wildcard parent\n"); - ts_query_cursor__capture( - self, - state, - skipped_wildcard_step, - parent - ); - } - } - } + // Enter a new node. + else { + // Get the properties of the current node. + TSNode node = ts_tree_cursor_current_node(&self->cursor); + TSNode parent_node = ts_tree_cursor_parent_node(&self->cursor); - // If the current node is captured in this pattern, add it to the capture list. 
- if (step->capture_ids[0] != NONE) { - ts_query_cursor__capture(self, state, step, node); - } + bool parent_precedes_range = !ts_node_is_null(parent_node) && ( + ts_node_end_byte(parent_node) <= self->start_byte || + point_lte(ts_node_end_point(parent_node), self->start_point) + ); + bool parent_follows_range = !ts_node_is_null(parent_node) && ( + ts_node_start_byte(parent_node) >= self->end_byte || + point_gte(ts_node_start_point(parent_node), self->end_point) + ); + bool node_precedes_range = parent_precedes_range || ( + ts_node_end_byte(node) <= self->start_byte || + point_lte(ts_node_end_point(node), self->start_point) + ); + bool node_follows_range = parent_follows_range || ( + ts_node_start_byte(node) >= self->end_byte || + point_gte(ts_node_start_point(node), self->end_point) + ); + bool parent_intersects_range = !parent_precedes_range && !parent_follows_range; + bool node_intersects_range = !node_precedes_range && !node_follows_range; - if (state->dead) { - array_erase(&self->states, i); - i--; - continue; - } - - // Advance this state to the next step of its pattern. - state->step_index++; - state->seeking_immediate_match = false; + if (self->on_visible_node) { + TSSymbol symbol = ts_node_symbol(node); + bool is_named = ts_node_is_named(node); + bool has_later_siblings; + bool has_later_named_siblings; + bool can_have_later_siblings_with_this_field; + TSFieldId field_id = 0; + TSSymbol supertypes[8] = {0}; + unsigned supertype_count = 8; + ts_tree_cursor_current_status( + &self->cursor, + &field_id, + &has_later_siblings, + &has_later_named_siblings, + &can_have_later_siblings_with_this_field, + supertypes, + &supertype_count + ); LOG( - " advance state. pattern:%u, step:%u\n", - state->pattern_index, - state->step_index + "enter node. 
depth:%u, type:%s, field:%s, row:%u state_count:%u, finished_state_count:%u\n", + self->depth, + ts_node_type(node), + ts_language_field_name_for_id(self->query->language, field_id), + ts_node_start_point(node).row, + self->states.size, + self->finished_states.size ); - QueryStep *next_step = &self->query->steps.contents[state->step_index]; - if (stop_on_definite_step && next_step->root_pattern_guaranteed) did_match = true; + bool node_is_error = symbol == ts_builtin_sym_error; + bool parent_is_error = + !ts_node_is_null(parent_node) && + ts_node_symbol(parent_node) == ts_builtin_sym_error; - // If this state's next step has an alternative step, then copy the state in order - // to pursue both alternatives. The alternative step itself may have an alternative, - // so this is an interactive process. - unsigned end_index = i + 1; - for (unsigned j = i; j < end_index; j++) { - QueryState *state = &self->states.contents[j]; - QueryStep *next_step = &self->query->steps.contents[state->step_index]; - if (next_step->alternative_index != NONE) { - // A "dead-end" step exists only to add a non-sequential jump into the step sequence, - // via its alternative index. When a state reaches a dead-end step, it jumps straight - // to the step's alternative. - if (next_step->is_dead_end) { - state->step_index = next_step->alternative_index; - j--; - continue; + // Add new states for any patterns whose root node is a wildcard. + if (!node_is_error) { + for (unsigned i = 0; i < self->query->wildcard_root_pattern_count; i++) { + PatternEntry *pattern = &self->query->pattern_map.contents[i]; + + // If this node matches the first step of the pattern, then add a new + // state at the start of this pattern. + QueryStep *step = &self->query->steps.contents[pattern->step_index]; + if ( + (pattern->is_rooted ? 
+ node_intersects_range : + (parent_intersects_range && !parent_is_error)) && + (!step->field || field_id == step->field) && + (!step->supertype_symbol || supertype_count > 0) + ) { + ts_query_cursor__add_state(self, pattern); + } + } + } + + // Add new states for any patterns whose root node matches this node. + unsigned i; + if (ts_query__pattern_map_search(self->query, symbol, &i)) { + PatternEntry *pattern = &self->query->pattern_map.contents[i]; + + QueryStep *step = &self->query->steps.contents[pattern->step_index]; + do { + // If this node matches the first step of the pattern, then add a new + // state at the start of this pattern. + if ( + (pattern->is_rooted ? + node_intersects_range : + (parent_intersects_range && !parent_is_error)) && + (!step->field || field_id == step->field) + ) { + ts_query_cursor__add_state(self, pattern); } - // A "pass-through" step exists only to add a branch into the step sequence, - // via its alternative_index. When a state reaches a pass-through step, it splits - // in order to process the alternative step, and then it advances to the next step. - if (next_step->is_pass_through) { - state->step_index++; - j--; - } + // Advance to the next pattern whose root node matches this node. + i++; + if (i == self->query->pattern_map.size) break; + pattern = &self->query->pattern_map.contents[i]; + step = &self->query->steps.contents[pattern->step_index]; + } while (step->symbol == symbol); + } - QueryState *copy = ts_query_cursor__copy_state(self, &state); - if (copy) { + // Update all of the in-progress states with current node. + for (unsigned i = 0, copy_count = 0; i < self->states.size; i += 1 + copy_count) { + QueryState *state = &self->states.contents[i]; + QueryStep *step = &self->query->steps.contents[state->step_index]; + state->has_in_progress_alternatives = false; + copy_count = 0; + + // Check that the node matches all of the criteria for the next + // step of the pattern. 
+ if ((uint32_t)state->start_depth + (uint32_t)step->depth != self->depth) continue; + + // Determine if this node matches this step of the pattern, and also + // if this node can have later siblings that match this step of the + // pattern. + bool node_does_match = false; + if (step->symbol == WILDCARD_SYMBOL) { + node_does_match = !node_is_error && (is_named || !step->is_named); + } else { + node_does_match = symbol == step->symbol; + } + bool later_sibling_can_match = has_later_siblings; + if ((step->is_immediate && is_named) || state->seeking_immediate_match) { + later_sibling_can_match = false; + } + if (step->is_last_child && has_later_named_siblings) { + node_does_match = false; + } + if (step->supertype_symbol) { + bool has_supertype = false; + for (unsigned j = 0; j < supertype_count; j++) { + if (supertypes[j] == step->supertype_symbol) { + has_supertype = true; + break; + } + } + if (!has_supertype) node_does_match = false; + } + if (step->field) { + if (step->field == field_id) { + if (!can_have_later_siblings_with_this_field) { + later_sibling_can_match = false; + } + } else { + node_does_match = false; + } + } + + if (step->negated_field_list_id) { + TSFieldId *negated_field_ids = &self->query->negated_fields.contents[step->negated_field_list_id]; + for (;;) { + TSFieldId negated_field_id = *negated_field_ids; + if (negated_field_id) { + negated_field_ids++; + if (ts_node_child_by_field_id(node, negated_field_id).id) { + node_does_match = false; + break; + } + } else { + break; + } + } + } + + // Remove states immediately if it is ever clear that they cannot match. + if (!node_does_match) { + if (!later_sibling_can_match) { LOG( - " split state for branch. pattern:%u, from_step:%u, to_step:%u, immediate:%d, capture_count: %u\n", - copy->pattern_index, - copy->step_index, - next_step->alternative_index, - next_step->alternative_is_immediate, - capture_list_pool_get(&self->capture_list_pool, copy->capture_list_id)->size + " discard state. 
pattern:%u, step:%u\n", + state->pattern_index, + state->step_index + ); + capture_list_pool_release( + &self->capture_list_pool, + state->capture_list_id + ); + array_erase(&self->states, i); + i--; + } + continue; + } + + // Some patterns can match their root node in multiple ways, capturing different + // children. If this pattern step could match later children within the same + // parent, then this query state cannot simply be updated in place. It must be + // split into two states: one that matches this node, and one which skips over + // this node, to preserve the possibility of matching later siblings. + if (later_sibling_can_match && ( + step->contains_captures || + ts_query__step_is_fallible(self->query, state->step_index) + )) { + if (ts_query_cursor__copy_state(self, &state)) { + LOG( + " split state for capture. pattern:%u, step:%u\n", + state->pattern_index, + state->step_index ); - end_index++; copy_count++; - copy->step_index = next_step->alternative_index; - if (next_step->alternative_is_immediate) { - copy->seeking_immediate_match = true; + } + } + + // If this pattern started with a wildcard, such that the pattern map + // actually points to the *second* step of the pattern, then check + // that the node has a parent, and capture the parent node if necessary. 
+ if (state->needs_parent) { + TSNode parent = ts_tree_cursor_parent_node(&self->cursor); + if (ts_node_is_null(parent)) { + LOG(" missing parent node\n"); + state->dead = true; + } else { + state->needs_parent = false; + QueryStep *skipped_wildcard_step = step; + do { + skipped_wildcard_step--; + } while ( + skipped_wildcard_step->is_dead_end || + skipped_wildcard_step->is_pass_through || + skipped_wildcard_step->depth > 0 + ); + if (skipped_wildcard_step->capture_ids[0] != NONE) { + LOG(" capture wildcard parent\n"); + ts_query_cursor__capture( + self, + state, + skipped_wildcard_step, + parent + ); + } + } + } + + // If the current node is captured in this pattern, add it to the capture list. + if (step->capture_ids[0] != NONE) { + ts_query_cursor__capture(self, state, step, node); + } + + if (state->dead) { + array_erase(&self->states, i); + i--; + continue; + } + + // Advance this state to the next step of its pattern. + state->step_index++; + state->seeking_immediate_match = false; + LOG( + " advance state. pattern:%u, step:%u\n", + state->pattern_index, + state->step_index + ); + + QueryStep *next_step = &self->query->steps.contents[state->step_index]; + if (stop_on_definite_step && next_step->root_pattern_guaranteed) did_match = true; + + // If this state's next step has an alternative step, then copy the state in order + // to pursue both alternatives. The alternative step itself may have an alternative, + // so this is an interactive process. + unsigned end_index = i + 1; + for (unsigned j = i; j < end_index; j++) { + QueryState *state = &self->states.contents[j]; + QueryStep *next_step = &self->query->steps.contents[state->step_index]; + if (next_step->alternative_index != NONE) { + // A "dead-end" step exists only to add a non-sequential jump into the step sequence, + // via its alternative index. When a state reaches a dead-end step, it jumps straight + // to the step's alternative. 
+ if (next_step->is_dead_end) { + state->step_index = next_step->alternative_index; + j--; + continue; + } + + // A "pass-through" step exists only to add a branch into the step sequence, + // via its alternative_index. When a state reaches a pass-through step, it splits + // in order to process the alternative step, and then it advances to the next step. + if (next_step->is_pass_through) { + state->step_index++; + j--; + } + + QueryState *copy = ts_query_cursor__copy_state(self, &state); + if (copy) { + LOG( + " split state for branch. pattern:%u, from_step:%u, to_step:%u, immediate:%d, capture_count: %u\n", + copy->pattern_index, + copy->step_index, + next_step->alternative_index, + next_step->alternative_is_immediate, + capture_list_pool_get(&self->capture_list_pool, copy->capture_list_id)->size + ); + end_index++; + copy_count++; + copy->step_index = next_step->alternative_index; + if (next_step->alternative_is_immediate) { + copy->seeking_immediate_match = true; + } + } + } + } + } + + for (unsigned i = 0; i < self->states.size; i++) { + QueryState *state = &self->states.contents[i]; + if (state->dead) { + array_erase(&self->states, i); + i--; + continue; + } + + // Enfore the longest-match criteria. When a query pattern contains optional or + // repeated nodes, this is necessary to avoid multiple redundant states, where + // one state has a strict subset of another state's captures. + bool did_remove = false; + for (unsigned j = i + 1; j < self->states.size; j++) { + QueryState *other_state = &self->states.contents[j]; + + // Query states are kept in ascending order of start_depth and pattern_index. + // Since the longest-match criteria is only used for deduping matches of the same + // pattern and root node, we only need to perform pairwise comparisons within a + // small slice of the states array. 
+ if ( + other_state->start_depth != state->start_depth || + other_state->pattern_index != state->pattern_index + ) break; + + bool left_contains_right, right_contains_left; + ts_query_cursor__compare_captures( + self, + state, + other_state, + &left_contains_right, + &right_contains_left + ); + if (left_contains_right) { + if (state->step_index == other_state->step_index) { + LOG( + " drop shorter state. pattern: %u, step_index: %u\n", + state->pattern_index, + state->step_index + ); + capture_list_pool_release(&self->capture_list_pool, other_state->capture_list_id); + array_erase(&self->states, j); + j--; + continue; + } + other_state->has_in_progress_alternatives = true; + } + if (right_contains_left) { + if (state->step_index == other_state->step_index) { + LOG( + " drop shorter state. pattern: %u, step_index: %u\n", + state->pattern_index, + state->step_index + ); + capture_list_pool_release(&self->capture_list_pool, state->capture_list_id); + array_erase(&self->states, i); + i--; + did_remove = true; + break; + } + state->has_in_progress_alternatives = true; + } + } + + // If the state is at the end of its pattern, remove it from the list + // of in-progress states and add it to the list of finished states. + if (!did_remove) { + LOG( + " keep state. 
pattern: %u, start_depth: %u, step_index: %u, capture_count: %u\n", + state->pattern_index, + state->start_depth, + state->step_index, + capture_list_pool_get(&self->capture_list_pool, state->capture_list_id)->size + ); + QueryStep *next_step = &self->query->steps.contents[state->step_index]; + if (next_step->depth == PATTERN_DONE_MARKER) { + if (state->has_in_progress_alternatives) { + LOG(" defer finishing pattern %u\n", state->pattern_index); + } else { + LOG(" finish pattern %u\n", state->pattern_index); + array_push(&self->finished_states, *state); + array_erase(&self->states, (uint32_t)(state - self->states.contents)); + did_match = true; + i--; } } } } } - for (unsigned i = 0; i < self->states.size; i++) { - QueryState *state = &self->states.contents[i]; - if (state->dead) { - array_erase(&self->states, i); - i--; - continue; - } - - // Enfore the longest-match criteria. When a query pattern contains optional or - // repeated nodes, this is necessary to avoid multiple redundant states, where - // one state has a strict subset of another state's captures. - bool did_remove = false; - for (unsigned j = i + 1; j < self->states.size; j++) { - QueryState *other_state = &self->states.contents[j]; - - // Query states are kept in ascending order of start_depth and pattern_index. - // Since the longest-match criteria is only used for deduping matches of the same - // pattern and root node, we only need to perform pairwise comparisons within a - // small slice of the states array. - if ( - other_state->start_depth != state->start_depth || - other_state->pattern_index != state->pattern_index - ) break; - - bool left_contains_right, right_contains_left; - ts_query_cursor__compare_captures( - self, - state, - other_state, - &left_contains_right, - &right_contains_left - ); - if (left_contains_right) { - if (state->step_index == other_state->step_index) { - LOG( - " drop shorter state. 
pattern: %u, step_index: %u\n", - state->pattern_index, - state->step_index - ); - capture_list_pool_release(&self->capture_list_pool, other_state->capture_list_id); - array_erase(&self->states, j); - j--; - continue; - } - other_state->has_in_progress_alternatives = true; - } - if (right_contains_left) { - if (state->step_index == other_state->step_index) { - LOG( - " drop shorter state. pattern: %u, step_index: %u\n", - state->pattern_index, - state->step_index - ); - capture_list_pool_release(&self->capture_list_pool, state->capture_list_id); - array_erase(&self->states, i); - i--; - did_remove = true; - break; - } - state->has_in_progress_alternatives = true; - } - } - - // If the state is at the end of its pattern, remove it from the list - // of in-progress states and add it to the list of finished states. - if (!did_remove) { - LOG( - " keep state. pattern: %u, start_depth: %u, step_index: %u, capture_count: %u\n", - state->pattern_index, - state->start_depth, - state->step_index, - capture_list_pool_get(&self->capture_list_pool, state->capture_list_id)->size - ); - QueryStep *next_step = &self->query->steps.contents[state->step_index]; - if (next_step->depth == PATTERN_DONE_MARKER) { - if (state->has_in_progress_alternatives) { - LOG(" defer finishing pattern %u\n", state->pattern_index); - } else { - LOG(" finish pattern %u\n", state->pattern_index); - array_push(&self->finished_states, *state); - array_erase(&self->states, (uint32_t)(state - self->states.contents)); - did_match = true; - i--; - } - } - } - } - - // When the current node ends prior to the desired start offset, - // only descend for the purpose of continuing in-progress matches. 
- bool has_in_progress_matches = false; - if (!node_intersects_range) { - for (unsigned i = 0; i < self->states.size; i++) { - QueryState *state = &self->states.contents[i];; - QueryStep *next_step = &self->query->steps.contents[state->step_index]; - if ( - next_step->depth != PATTERN_DONE_MARKER && - state->start_depth + next_step->depth > self->depth - ) { - has_in_progress_matches = true; + bool should_descend = + node_intersects_range || + ts_query_cursor__should_descend_outside_of_range(self); + if (should_descend) { + switch (ts_tree_cursor_goto_first_child_internal(&self->cursor)) { + case TreeCursorStepVisible: + self->depth++; + self->on_visible_node = true; + continue; + case TreeCursorStepHidden: + self->on_visible_node = false; + continue; + default: break; - } } } - bool should_descend = node_intersects_range || has_in_progress_matches; - if (!should_descend) { - LOG( - " not descending. node end byte: %u, start byte: %u\n", - ts_node_end_byte(node), - self->start_byte - ); - } - - if (should_descend && ts_tree_cursor_goto_first_child(&self->cursor)) { - self->depth++; - } else { - self->ascending = true; - } + self->ascending = true; } } } diff --git a/lib/src/subtree.h b/lib/src/subtree.h index 8456d2f1..a0e838eb 100644 --- a/lib/src/subtree.h +++ b/lib/src/subtree.h @@ -291,6 +291,12 @@ static inline uint32_t ts_subtree_repeat_depth(Subtree self) { return self.data.is_inline ? 0 : self.ptr->repeat_depth; } +static inline uint32_t ts_subtree_is_repetition(Subtree self) { + return self.data.is_inline + ? 0 + : !self.ptr->named && !self.ptr->visible && self.ptr->child_count != 0; +} + static inline uint32_t ts_subtree_node_count(Subtree self) { return (self.data.is_inline || self.ptr->child_count == 0) ? 
1 : self.ptr->node_count; } From bd63fb2a0d837bb5ae254ce7749d63c58ebac945 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Wed, 15 Feb 2023 14:03:36 -0800 Subject: [PATCH 040/347] Tweak query tests --- Cargo.lock | 7 +++++ cli/Cargo.toml | 3 ++- cli/src/tests/query_test.rs | 51 ++++++++++++++++++++++++------------- lib/Cargo.toml | 2 +- 4 files changed, 44 insertions(+), 19 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index f5c4e7e4..ca773788 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -584,6 +584,7 @@ dependencies = [ "tree-sitter-highlight", "tree-sitter-loader", "tree-sitter-tags", + "unindent", "walkdir", "webbrowser", "which", @@ -647,6 +648,12 @@ version = "0.1.10" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "c0edd1e5b14653f783770bce4a4dabb4a5108a5370a5f5d8cfe8710c361f6c8b" +[[package]] +name = "unindent" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5aa30f5ea51ff7edfc797c6d3f9ec8cbd8cfedef5371766b7181d33977f4814f" + [[package]] name = "utf8-width" version = "0.1.6" diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 5403075d..77cf52e4 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -3,7 +3,7 @@ name = "tree-sitter-cli" description = "CLI tool for developing, testing, and using Tree-sitter parsers" version = "0.20.7" authors = ["Max Brunsfeld "] -edition = "2018" +edition = "2021" license = "MIT" readme = "README.md" keywords = ["incremental", "parsing"] @@ -73,6 +73,7 @@ rand = "0.8" tempfile = "3" pretty_assertions = "0.7.2" ctor = "0.1" +unindent = "0.2" [build-dependencies] toml = "0.5" diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index 31cb8035..63dea5a6 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -2,6 +2,7 @@ use super::helpers::{ allocations, fixtures::get_language, query_helpers::{Match, Pattern}, + ITERATION_COUNT, }; use lazy_static::lazy_static; use rand::{prelude::StdRng, SeedableRng}; @@ -10,6 
+11,7 @@ use tree_sitter::{ CaptureQuantifier, Language, Node, Parser, Point, Query, QueryCapture, QueryCursor, QueryError, QueryErrorKind, QueryMatch, QueryPredicate, QueryPredicateArg, QueryProperty, }; +use unindent::Unindent; lazy_static! { static ref EXAMPLE_FILTER: Option = env::var("TREE_SITTER_TEST_EXAMPLE_FILTER").ok(); @@ -1920,20 +1922,28 @@ fn test_query_matches_within_point_range() { let language = get_language("javascript"); let query = Query::new(language, "(identifier) @element").unwrap(); - let source = "[a, b,\n c, d,\n e, f,\n g]"; + let source = " + [ + a, b, + c, d, + e, f, + g, h, + i, j, + k, l, + ] + " + .unindent(); let mut parser = Parser::new(); parser.set_language(language).unwrap(); let tree = parser.parse(&source, None).unwrap(); - let mut cursor = QueryCursor::new(); let matches = cursor - .set_point_range(Point::new(0, 0)..Point::new(1, 3)) + .set_point_range(Point::new(1, 0)..Point::new(2, 3)) .matches(&query, tree.root_node(), source.as_bytes()); - assert_eq!( - collect_matches(matches, &query, source), + collect_matches(matches, &query, &source), &[ (0, vec![("element", "a")]), (0, vec![("element", "b")]), @@ -1942,11 +1952,10 @@ fn test_query_matches_within_point_range() { ); let matches = cursor - .set_point_range(Point::new(1, 0)..Point::new(2, 3)) + .set_point_range(Point::new(2, 0)..Point::new(3, 3)) .matches(&query, tree.root_node(), source.as_bytes()); - assert_eq!( - collect_matches(matches, &query, source), + collect_matches(matches, &query, &source), &[ (0, vec![("element", "c")]), (0, vec![("element", "d")]), @@ -1954,16 +1963,19 @@ fn test_query_matches_within_point_range() { ] ); + // Zero end point is treated like no end point. 
let matches = cursor - .set_point_range(Point::new(2, 1)..Point::new(0, 0)) + .set_point_range(Point::new(4, 1)..Point::new(0, 0)) .matches(&query, tree.root_node(), source.as_bytes()); - assert_eq!( - collect_matches(matches, &query, source), + collect_matches(matches, &query, &source), &[ - (0, vec![("element", "e")]), - (0, vec![("element", "f")]), (0, vec![("element", "g")]), + (0, vec![("element", "h")]), + (0, vec![("element", "i")]), + (0, vec![("element", "j")]), + (0, vec![("element", "k")]), + (0, vec![("element", "l")]), ] ); }); @@ -3634,17 +3646,22 @@ fn test_query_random() { .parse(include_str!("helpers/query_helpers.rs"), None) .unwrap(); - // let start_seed = *SEED; let start_seed = 0; + let end_seed = start_seed + *ITERATION_COUNT; - for i in 0..100 { - let seed = (start_seed + i) as u64; + for seed in start_seed..(start_seed + end_seed) { + let seed = seed as u64; let mut rand = StdRng::seed_from_u64(seed); let (pattern_ast, _) = Pattern::random_pattern_in_tree(&pattern_tree, &mut rand); let pattern = pattern_ast.to_string(); let expected_matches = pattern_ast.matches_in_tree(&test_tree); - let query = Query::new(language, &pattern).unwrap(); + let query = match Query::new(language, &pattern) { + Ok(query) => query, + Err(e) => { + panic!("failed to build query for pattern {pattern} - {e}. 
seed: {seed}"); + } + }; let mut actual_matches = cursor .matches( &query, diff --git a/lib/Cargo.toml b/lib/Cargo.toml index d096efdc..c2d35685 100644 --- a/lib/Cargo.toml +++ b/lib/Cargo.toml @@ -3,7 +3,7 @@ name = "tree-sitter" description = "Rust bindings to the Tree-sitter parsing library" version = "0.20.9" authors = ["Max Brunsfeld "] -edition = "2018" +edition = "2021" license = "MIT" readme = "binding_rust/README.md" keywords = ["incremental", "parsing"] From 40703f110c7f16650b686fc4c56ab128cf61e449 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Wed, 15 Feb 2023 14:40:36 -0800 Subject: [PATCH 041/347] Fix bug in maintenance of query cursor's tree depth --- cli/src/tests/query_test.rs | 3 --- lib/src/query.c | 24 +++++++++++++++--------- 2 files changed, 15 insertions(+), 12 deletions(-) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index 63dea5a6..c691df30 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -1876,7 +1876,6 @@ fn test_query_matches_within_byte_range() { cursor .set_byte_range(0..8) .matches(&query, tree.root_node(), source.as_bytes()); - assert_eq!( collect_matches(matches, &query, source), &[ @@ -1890,7 +1889,6 @@ fn test_query_matches_within_byte_range() { cursor .set_byte_range(5..15) .matches(&query, tree.root_node(), source.as_bytes()); - assert_eq!( collect_matches(matches, &query, source), &[ @@ -1904,7 +1902,6 @@ fn test_query_matches_within_byte_range() { cursor .set_byte_range(12..0) .matches(&query, tree.root_node(), source.as_bytes()); - assert_eq!( collect_matches(matches, &query, source), &[ diff --git a/lib/src/query.c b/lib/src/query.c index 04a59f9a..b2450ce2 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -3393,21 +3393,28 @@ static inline bool ts_query_cursor__advance( // Exit the current node. if (self->ascending) { - LOG( - "leave node. 
depth:%u, type:%s\n", - self->depth, - ts_node_type(ts_tree_cursor_current_node(&self->cursor)) - ); + if (self->on_visible_node) { + LOG( + "leave node. depth:%u, type:%s\n", + self->depth, + ts_node_type(ts_tree_cursor_current_node(&self->cursor)) + ); + } // Leave this node by stepping to its next sibling or to its parent. switch (ts_tree_cursor_goto_next_sibling_internal(&self->cursor)) { case TreeCursorStepVisible: - self->on_visible_node = true; + if (!self->on_visible_node) { + self->depth++; + self->on_visible_node = true; + } self->ascending = false; break; case TreeCursorStepHidden: - self->depth--; - self->on_visible_node = false; + if (self->on_visible_node) { + self->depth--; + self->on_visible_node = false; + } self->ascending = false; break; default: @@ -3467,7 +3474,6 @@ static inline bool ts_query_cursor__advance( // Get the properties of the current node. TSNode node = ts_tree_cursor_current_node(&self->cursor); TSNode parent_node = ts_tree_cursor_parent_node(&self->cursor); - bool parent_precedes_range = !ts_node_is_null(parent_node) && ( ts_node_end_byte(parent_node) <= self->start_byte || point_lte(ts_node_end_point(parent_node), self->start_point) From 837899e456202c6d112679c03e7e989451973a6d Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Wed, 15 Feb 2023 18:24:07 -0800 Subject: [PATCH 042/347] Add API for checking if a pattern in a query is non-local --- cli/src/tests/query_test.rs | 62 +++++++++++++++++++++++++++++++++++ lib/binding_rust/bindings.rs | 3 ++ lib/binding_rust/lib.rs | 8 ++++- lib/include/tree_sitter/api.h | 27 ++++++++++----- lib/src/query.c | 24 ++++++++++++-- 5 files changed, 112 insertions(+), 12 deletions(-) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index c691df30..e99fe06e 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -4084,6 +4084,68 @@ fn test_query_is_pattern_rooted() { }); } +#[test] +fn test_query_is_pattern_non_local() { + struct Row { + description: 
&'static str, + pattern: &'static str, + is_non_local: bool, + } + + let rows = [ + Row { + description: "simple token", + pattern: r#"(identifier)"#, + is_non_local: false, + }, + Row { + description: "siblings that can occur in an argument list", + pattern: r#"((identifier) (identifier))"#, + is_non_local: true, + }, + Row { + description: "siblings that can occur in a statement block", + pattern: r#"((return_statement) (return_statement))"#, + is_non_local: true, + }, + Row { + description: "siblings that can occur in a source file", + pattern: r#"((function_definition) (class_definition))"#, + is_non_local: true, + }, + Row { + description: "siblings that can't occur in any repetition", + pattern: r#"("{" "}")"#, + is_non_local: false, + }, + ]; + + allocations::record(|| { + eprintln!(""); + + let language = get_language("python"); + for row in &rows { + if let Some(filter) = EXAMPLE_FILTER.as_ref() { + if !row.description.contains(filter.as_str()) { + continue; + } + } + eprintln!(" query example: {:?}", row.description); + let query = Query::new(language, row.pattern).unwrap(); + assert_eq!( + query.is_pattern_non_local(0), + row.is_non_local, + "Description: {}, Pattern: {:?}", + row.description, + row.pattern + .split_ascii_whitespace() + .collect::>() + .join(" "), + ) + } + }); +} + #[test] fn test_capture_quantifiers() { struct Row { diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index 4591a380..be117f83 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -677,6 +677,9 @@ extern "C" { length: *mut u32, ) -> *const TSQueryPredicateStep; } +extern "C" { + pub fn ts_query_is_pattern_non_local(self_: *const TSQuery, pattern_index: u32) -> bool; +} extern "C" { pub fn ts_query_is_pattern_rooted(self_: *const TSQuery, pattern_index: u32) -> bool; } diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 6f044cca..579bf8e2 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ 
-1736,11 +1736,17 @@ impl Query { } /// Check if a given pattern within a query has a single root node. - #[doc(alias = "ts_query_is_pattern_guaranteed_at_step")] + #[doc(alias = "ts_query_is_pattern_rooted")] pub fn is_pattern_rooted(&self, index: usize) -> bool { unsafe { ffi::ts_query_is_pattern_rooted(self.ptr.as_ptr(), index as u32) } } + /// Check if a given pattern within a query has a single root node. + #[doc(alias = "ts_query_is_pattern_non_local")] + pub fn is_pattern_non_local(&self, index: usize) -> bool { + unsafe { ffi::ts_query_is_pattern_non_local(self.ptr.as_ptr(), index as u32) } + } + /// Check if a given step in a query is 'definite'. /// /// A query step is 'definite' if its parent pattern will be guaranteed to match diff --git a/lib/include/tree_sitter/api.h b/lib/include/tree_sitter/api.h index 5b48cf60..edc1c36a 100644 --- a/lib/include/tree_sitter/api.h +++ b/lib/include/tree_sitter/api.h @@ -750,15 +750,26 @@ const TSQueryPredicateStep *ts_query_predicates_for_pattern( uint32_t *length ); -bool ts_query_is_pattern_rooted( - const TSQuery *self, - uint32_t pattern_index -); +/* + * Check if the given pattern in the query has a single root node. + */ +bool ts_query_is_pattern_rooted(const TSQuery *self, uint32_t pattern_index); -bool ts_query_is_pattern_guaranteed_at_step( - const TSQuery *self, - uint32_t byte_offset -); +/* + * Check if the given pattern in the query is 'non local'. + * + * A non-local pattern has multiple root nodes and can match within a + * repeating sequence of nodes, as specified by the grammar. Non-local + * patterns disable certain optimizations that would otherwise be possible + * when executing a query on a specific range of a syntax tree. + */ +bool ts_query_is_pattern_non_local(const TSQuery *self, uint32_t pattern_index); + +/* + * Check if a given pattern is guaranteed to match once a given step is reached. + * The step is specified by its byte offset in the query's source code. 
+ */ +bool ts_query_is_pattern_guaranteed_at_step(const TSQuery *self, uint32_t byte_offset); /** * Get the name and length of one of the query's captures, or one of the diff --git a/lib/src/query.c b/lib/src/query.c index b2450ce2..cfe11438 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -146,6 +146,7 @@ typedef struct { Slice steps; Slice predicate_steps; uint32_t start_byte; + bool is_non_local; } QueryPattern; typedef struct { @@ -1455,7 +1456,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { if (!pattern->is_rooted) { QueryStep *step = &self->steps.contents[pattern->step_index]; if (step->symbol != WILDCARD_SYMBOL) { - array_push(&non_rooted_pattern_start_steps, pattern->step_index); + array_push(&non_rooted_pattern_start_steps, i); } } } @@ -1868,7 +1869,8 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // prevent certain optimizations with range restrictions. analysis.did_abort = false; for (uint32_t i = 0; i < non_rooted_pattern_start_steps.size; i++) { - uint16_t step_index = non_rooted_pattern_start_steps.contents[i]; + uint16_t pattern_entry_index = non_rooted_pattern_start_steps.contents[i]; + PatternEntry *pattern_entry = &self->pattern_map.contents[pattern_entry_index]; analysis_state_set__clear(&analysis.states, &analysis.state_pool); analysis_state_set__clear(&analysis.deeper_states, &analysis.state_pool); @@ -1880,7 +1882,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { for (uint32_t k = 0; k < subgraph->start_states.size; k++) { TSStateId parse_state = subgraph->start_states.contents[k]; analysis_state_set__push(&analysis.states, &analysis.state_pool, &((AnalysisState) { - .step_index = step_index, + .step_index = pattern_entry->step_index, .stack = { [0] = { .parse_state = parse_state, @@ -1906,6 +1908,10 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { &analysis ); + if 
(analysis.finished_parent_symbols.size > 0) { + self->patterns.contents[pattern_entry->pattern_index].is_non_local = true; + } + for (unsigned k = 0; k < analysis.finished_parent_symbols.size; k++) { TSSymbol symbol = analysis.finished_parent_symbols.contents[k]; array_insert_sorted_by(&self->repeat_symbols_with_rootless_patterns, , symbol); @@ -2697,6 +2703,7 @@ TSQuery *ts_query_new( .steps = (Slice) {.offset = start_step_index}, .predicate_steps = (Slice) {.offset = start_predicate_step_index}, .start_byte = stream_offset(&stream), + .is_non_local = false, })); CaptureQuantifiers capture_quantifiers = capture_quantifiers_new(); *error_type = ts_query__parse_pattern(self, &stream, 0, false, &capture_quantifiers); @@ -2876,6 +2883,17 @@ bool ts_query_is_pattern_rooted( return true; } +bool ts_query_is_pattern_non_local( + const TSQuery *self, + uint32_t pattern_index +) { + if (pattern_index < self->patterns.size) { + return self->patterns.contents[pattern_index].is_non_local; + } else { + return false; + } +} + bool ts_query_is_pattern_guaranteed_at_step( const TSQuery *self, uint32_t byte_offset From 8dcf8517399d83ad7cfd2f046c8ea441827ebde2 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Thu, 16 Feb 2023 12:03:51 -0800 Subject: [PATCH 043/347] Add unit test for querying within a range of a long top-level repetition --- cli/src/tests/query_test.rs | 90 ++++++++++++++++++++++++++++++++++++- 1 file changed, 88 insertions(+), 2 deletions(-) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index e99fe06e..7d01c26e 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -2219,6 +2219,57 @@ fn test_query_captures_within_byte_range_assigned_after_iterating() { }); } +#[test] +fn test_query_matches_within_range_of_long_repetition() { + allocations::record(|| { + let language = get_language("rust"); + let query = Query::new( + language, + " + (function_item name: (identifier) @fn-name) + ", + ) + .unwrap(); + + let source = " 
+ fn zero() {} + fn one() {} + fn two() {} + fn three() {} + fn four() {} + fn five() {} + fn six() {} + fn seven() {} + fn eight() {} + fn nine() {} + fn ten() {} + fn eleven() {} + fn twelve() {} + " + .unindent(); + + let mut parser = Parser::new(); + let mut cursor = QueryCursor::new(); + + parser.set_language(language).unwrap(); + let tree = parser.parse(&source, None).unwrap(); + + let matches = cursor + .set_point_range(Point::new(8, 0)..Point::new(20, 0)) + .matches(&query, tree.root_node(), source.as_bytes()); + assert_eq!( + collect_matches(matches, &query, &source), + &[ + (0, vec![("fn-name", "eight")]), + (0, vec![("fn-name", "nine")]), + (0, vec![("fn-name", "ten")]), + (0, vec![("fn-name", "eleven")]), + (0, vec![("fn-name", "twelve")]), + ] + ); + }); +} + #[test] fn test_query_matches_different_queries_same_cursor() { allocations::record(|| { @@ -4089,6 +4140,7 @@ fn test_query_is_pattern_non_local() { struct Row { description: &'static str, pattern: &'static str, + language: Language, is_non_local: bool, } @@ -4096,26 +4148,61 @@ fn test_query_is_pattern_non_local() { Row { description: "simple token", pattern: r#"(identifier)"#, + language: get_language("python"), is_non_local: false, }, Row { description: "siblings that can occur in an argument list", pattern: r#"((identifier) (identifier))"#, + language: get_language("python"), is_non_local: true, }, Row { description: "siblings that can occur in a statement block", pattern: r#"((return_statement) (return_statement))"#, + language: get_language("python"), is_non_local: true, }, Row { description: "siblings that can occur in a source file", pattern: r#"((function_definition) (class_definition))"#, + language: get_language("python"), is_non_local: true, }, Row { description: "siblings that can't occur in any repetition", pattern: r#"("{" "}")"#, + language: get_language("python"), + is_non_local: false, + }, + Row { + description: "siblings that can't occur in any repetition, wildcard root", + 
pattern: r#"(_ "{" "}") @foo"#, + language: get_language("javascript"), + is_non_local: false, + }, + Row { + description: "siblings that can occur in a class body, wildcard root", + pattern: r#"(_ (method_definition) (method_definition)) @foo"#, + language: get_language("javascript"), + is_non_local: true, + }, + Row { + description: "top-level repetitions that can occur in a class body", + pattern: r#"(method_definition)+ @foo"#, + language: get_language("javascript"), + is_non_local: true, + }, + Row { + description: "top-level repetitions that can occur in a statement block", + pattern: r#"(return_statement)+ @foo"#, + language: get_language("javascript"), + is_non_local: true, + }, + Row { + description: "rooted pattern that can occur in a statement block", + pattern: r#"(return_statement) @foo"#, + language: get_language("javascript"), is_non_local: false, }, ]; @@ -4123,7 +4210,6 @@ fn test_query_is_pattern_non_local() { allocations::record(|| { eprintln!(""); - let language = get_language("python"); for row in &rows { if let Some(filter) = EXAMPLE_FILTER.as_ref() { if !row.description.contains(filter.as_str()) { @@ -4131,7 +4217,7 @@ fn test_query_is_pattern_non_local() { } } eprintln!(" query example: {:?}", row.description); - let query = Query::new(language, row.pattern).unwrap(); + let query = Query::new(row.language, row.pattern).unwrap(); assert_eq!( query.is_pattern_non_local(0), row.is_non_local, From 811bc8256def2ddff65a1e46003263d7f49cd08e Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Mar 2023 12:21:19 -0700 Subject: [PATCH 044/347] lib: 0.20.10 --- Cargo.lock | 2 +- lib/Cargo.toml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index ca773788..40b4afab 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -544,7 +544,7 @@ dependencies = [ [[package]] name = "tree-sitter" -version = "0.20.9" +version = "0.20.10" dependencies = [ "cc", "lazy_static", diff --git a/lib/Cargo.toml b/lib/Cargo.toml index 
c2d35685..16fd0254 100644 --- a/lib/Cargo.toml +++ b/lib/Cargo.toml @@ -1,7 +1,7 @@ [package] name = "tree-sitter" description = "Rust bindings to the Tree-sitter parsing library" -version = "0.20.9" +version = "0.20.10" authors = ["Max Brunsfeld "] edition = "2021" license = "MIT" From b1ad55909d1539bfbf6ae66407e33250770f0a88 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Mar 2023 12:22:10 -0700 Subject: [PATCH 045/347] 0.20.8 --- Cargo.lock | 2 +- cli/Cargo.toml | 2 +- cli/npm/package.json | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 40b4afab..4a844dc8 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -553,7 +553,7 @@ dependencies = [ [[package]] name = "tree-sitter-cli" -version = "0.20.7" +version = "0.20.8" dependencies = [ "ansi_term", "anyhow", diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 77cf52e4..ad21f0e7 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -1,7 +1,7 @@ [package] name = "tree-sitter-cli" description = "CLI tool for developing, testing, and using Tree-sitter parsers" -version = "0.20.7" +version = "0.20.8" authors = ["Max Brunsfeld "] edition = "2021" license = "MIT" diff --git a/cli/npm/package.json b/cli/npm/package.json index dfa53ab4..02309193 100644 --- a/cli/npm/package.json +++ b/cli/npm/package.json @@ -1,6 +1,6 @@ { "name": "tree-sitter-cli", - "version": "0.20.7", + "version": "0.20.8", "author": "Max Brunsfeld", "license": "MIT", "repository": { From 25d9c989ebdc53dbad3852317c5b45228ff012e4 Mon Sep 17 00:00:00 2001 From: Max Brunsfeld Date: Mon, 13 Mar 2023 14:25:24 -0700 Subject: [PATCH 046/347] Update python error corpus to reflect grammar changes --- test/fixtures/error_corpus/python_errors.txt | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/test/fixtures/error_corpus/python_errors.txt b/test/fixtures/error_corpus/python_errors.txt index edabb510..bd3101a9 100644 --- a/test/fixtures/error_corpus/python_errors.txt +++ 
b/test/fixtures/error_corpus/python_errors.txt @@ -89,7 +89,8 @@ def a(): parameters: (parameters) (ERROR (identifier)) body: (block - (expression_statement (string))))) + (expression_statement (string + string_content: (string_content)))))) =========================================== incomplete definition in class definition @@ -108,4 +109,4 @@ b (ERROR) body: (block)) (expression_statement - (identifier))) \ No newline at end of file + (identifier))) From ca152a93dd7f7dbea2e6eb84072b53dc74816443 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 14 Mar 2023 20:06:31 +0200 Subject: [PATCH 047/347] ci: fix tests --- cli/src/tests/parser_test.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/src/tests/parser_test.rs b/cli/src/tests/parser_test.rs index cf3b6437..30b12336 100644 --- a/cli/src/tests/parser_test.rs +++ b/cli/src/tests/parser_test.rs @@ -505,7 +505,7 @@ fn test_parsing_after_detecting_error_in_the_middle_of_a_string_token() { let tree = parser.parse(&source, None).unwrap(); assert_eq!( tree.root_node().to_sexp(), - "(module (expression_statement (assignment left: (identifier) right: (expression_list (identifier) (string)))))" + "(module (expression_statement (assignment left: (identifier) right: (expression_list (identifier) (string string_content: (string_content))))))" ); // Delete a suffix of the source code, starting in the middle of the string From 47c1e858efb3fc29f9a539378ff40c00caabac40 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 14 Mar 2023 20:37:12 +0200 Subject: [PATCH 048/347] Update deps: lib/binding_web/package.json --- lib/binding_web/package.json | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/lib/binding_web/package.json b/lib/binding_web/package.json index 2cfcf72e..52f72d5b 100644 --- a/lib/binding_web/package.json +++ b/lib/binding_web/package.json @@ -27,8 +27,8 @@ }, "homepage": "https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_web", 
"devDependencies": { - "chai": "^4.2.0", - "mocha": "^6.1.4", - "terser": "^3.17.0" + "chai": "^4.3.7", + "mocha": "^10.2.0", + "terser": "^5.16.6" } } From 1b2a3e3c73674e12144fb619083df48deb958716 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 15 Mar 2023 12:31:54 +0200 Subject: [PATCH 049/347] docs: add `webrick` to Gemfile to fix a compat issue --- docs/Gemfile | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/docs/Gemfile b/docs/Gemfile index 91ceacd3..ee114290 100644 --- a/docs/Gemfile +++ b/docs/Gemfile @@ -1,2 +1,3 @@ source 'https://rubygems.org' -gem 'github-pages', group: :jekyll_plugins \ No newline at end of file +gem 'github-pages', group: :jekyll_plugins +gem "webrick" From 2ce06b623ede810682fb58ffa126854efe14dd60 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 15 Mar 2023 12:37:58 +0200 Subject: [PATCH 050/347] docs: update Gemfile.lock to fix GH dependabot complains Updated with commands like: > gem install bundler > bundle config set --local path 'vendor/bundle' > bundle update --bundler > #bundle add webrick > bundle update > #bundle exec jekyll serve --- docs/Gemfile.lock | 368 +++++++++++++++++++++++----------------------- 1 file changed, 185 insertions(+), 183 deletions(-) diff --git a/docs/Gemfile.lock b/docs/Gemfile.lock index 44aff756..3b2801be 100644 --- a/docs/Gemfile.lock +++ b/docs/Gemfile.lock @@ -1,258 +1,260 @@ GEM remote: https://rubygems.org/ specs: - activesupport (4.2.9) - i18n (~> 0.7) - minitest (~> 5.1) - thread_safe (~> 0.3, >= 0.3.4) - tzinfo (~> 1.1) - addressable (2.8.0) - public_suffix (>= 2.0.2, < 5.0) + activesupport (7.0.4.3) + concurrent-ruby (~> 1.0, >= 1.0.2) + i18n (>= 1.6, < 2) + minitest (>= 5.1) + tzinfo (~> 2.0) + addressable (2.8.1) + public_suffix (>= 2.0.2, < 6.0) coffee-script (2.4.1) coffee-script-source execjs coffee-script-source (1.11.1) colorator (1.1.0) - commonmarker (0.17.8) - ruby-enum (~> 0.5) - concurrent-ruby (1.0.5) - ethon (0.14.0) + commonmarker (0.23.8) 
+ concurrent-ruby (1.2.2) + dnsruby (1.61.9) + simpleidn (~> 0.1) + em-websocket (0.5.3) + eventmachine (>= 0.12.9) + http_parser.rb (~> 0) + ethon (0.16.0) ffi (>= 1.15.0) - execjs (2.7.0) - faraday (1.5.1) - faraday-em_http (~> 1.0) - faraday-em_synchrony (~> 1.0) - faraday-excon (~> 1.1) - faraday-httpclient (~> 1.0.1) - faraday-net_http (~> 1.0) - faraday-net_http_persistent (~> 1.1) - faraday-patron (~> 1.0) - multipart-post (>= 1.2, < 3) + eventmachine (1.2.7) + execjs (2.8.1) + faraday (2.7.4) + faraday-net_http (>= 2.0, < 3.1) ruby2_keywords (>= 0.0.4) - faraday-em_http (1.0.0) - faraday-em_synchrony (1.0.0) - faraday-excon (1.1.0) - faraday-httpclient (1.0.1) - faraday-net_http (1.0.1) - faraday-net_http_persistent (1.2.0) - faraday-patron (1.0.0) - ffi (1.15.3) + faraday-net_http (3.0.2) + ffi (1.15.5) forwardable-extended (2.6.0) - gemoji (3.0.0) - github-pages (177) - activesupport (= 4.2.9) - github-pages-health-check (= 1.3.5) - jekyll (= 3.6.2) - jekyll-avatar (= 0.5.0) - jekyll-coffeescript (= 1.0.2) - jekyll-commonmark-ghpages (= 0.1.5) + gemoji (3.0.1) + github-pages (228) + github-pages-health-check (= 1.17.9) + jekyll (= 3.9.3) + jekyll-avatar (= 0.7.0) + jekyll-coffeescript (= 1.1.1) + jekyll-commonmark-ghpages (= 0.4.0) jekyll-default-layout (= 0.1.4) - jekyll-feed (= 0.9.2) - jekyll-gist (= 1.4.1) - jekyll-github-metadata (= 2.9.3) - jekyll-mentions (= 1.2.0) - jekyll-optional-front-matter (= 0.3.0) + jekyll-feed (= 0.15.1) + jekyll-gist (= 1.5.0) + jekyll-github-metadata (= 2.13.0) + jekyll-include-cache (= 0.2.1) + jekyll-mentions (= 1.6.0) + jekyll-optional-front-matter (= 0.3.2) jekyll-paginate (= 1.1.0) - jekyll-readme-index (= 0.2.0) - jekyll-redirect-from (= 0.12.1) - jekyll-relative-links (= 0.5.2) - jekyll-remote-theme (= 0.2.3) - jekyll-sass-converter (= 1.5.0) - jekyll-seo-tag (= 2.3.0) - jekyll-sitemap (= 1.1.1) - jekyll-swiss (= 0.4.0) - jekyll-theme-architect (= 0.1.0) - jekyll-theme-cayman (= 0.1.0) - jekyll-theme-dinky (= 
0.1.0) - jekyll-theme-hacker (= 0.1.0) - jekyll-theme-leap-day (= 0.1.0) - jekyll-theme-merlot (= 0.1.0) - jekyll-theme-midnight (= 0.1.0) - jekyll-theme-minimal (= 0.1.0) - jekyll-theme-modernist (= 0.1.0) - jekyll-theme-primer (= 0.5.2) - jekyll-theme-slate (= 0.1.0) - jekyll-theme-tactile (= 0.1.0) - jekyll-theme-time-machine (= 0.1.0) - jekyll-titles-from-headings (= 0.5.0) - jemoji (= 0.8.1) - kramdown (= 1.16.2) - liquid (= 4.0.0) - listen (= 3.0.6) + jekyll-readme-index (= 0.3.0) + jekyll-redirect-from (= 0.16.0) + jekyll-relative-links (= 0.6.1) + jekyll-remote-theme (= 0.4.3) + jekyll-sass-converter (= 1.5.2) + jekyll-seo-tag (= 2.8.0) + jekyll-sitemap (= 1.4.0) + jekyll-swiss (= 1.0.0) + jekyll-theme-architect (= 0.2.0) + jekyll-theme-cayman (= 0.2.0) + jekyll-theme-dinky (= 0.2.0) + jekyll-theme-hacker (= 0.2.0) + jekyll-theme-leap-day (= 0.2.0) + jekyll-theme-merlot (= 0.2.0) + jekyll-theme-midnight (= 0.2.0) + jekyll-theme-minimal (= 0.2.0) + jekyll-theme-modernist (= 0.2.0) + jekyll-theme-primer (= 0.6.0) + jekyll-theme-slate (= 0.2.0) + jekyll-theme-tactile (= 0.2.0) + jekyll-theme-time-machine (= 0.2.0) + jekyll-titles-from-headings (= 0.5.3) + jemoji (= 0.12.0) + kramdown (= 2.3.2) + kramdown-parser-gfm (= 1.1.0) + liquid (= 4.0.4) mercenary (~> 0.3) - minima (= 2.1.1) - nokogiri (>= 1.8.1, < 2.0) - rouge (= 2.2.1) + minima (= 2.5.1) + nokogiri (>= 1.13.6, < 2.0) + rouge (= 3.26.0) terminal-table (~> 1.4) - github-pages-health-check (1.3.5) + github-pages-health-check (1.17.9) addressable (~> 2.3) - net-dns (~> 0.8) + dnsruby (~> 1.60) octokit (~> 4.0) - public_suffix (~> 2.0) - typhoeus (~> 0.7) - html-pipeline (2.7.1) + public_suffix (>= 3.0, < 5.0) + typhoeus (~> 1.3) + html-pipeline (2.14.3) activesupport (>= 2) nokogiri (>= 1.4) - i18n (0.9.5) + http_parser.rb (0.8.0) + i18n (1.12.0) concurrent-ruby (~> 1.0) - jekyll (3.6.2) + jekyll (3.9.3) addressable (~> 2.4) colorator (~> 1.0) + em-websocket (~> 0.5) + i18n (>= 0.7, < 2) 
jekyll-sass-converter (~> 1.0) - jekyll-watch (~> 1.1) - kramdown (~> 1.14) + jekyll-watch (~> 2.0) + kramdown (>= 1.17, < 3) liquid (~> 4.0) mercenary (~> 0.3.3) pathutil (~> 0.9) - rouge (>= 1.7, < 3) + rouge (>= 1.7, < 4) safe_yaml (~> 1.0) - jekyll-avatar (0.5.0) - jekyll (~> 3.0) - jekyll-coffeescript (1.0.2) + jekyll-avatar (0.7.0) + jekyll (>= 3.0, < 5.0) + jekyll-coffeescript (1.1.1) coffee-script (~> 2.2) coffee-script-source (~> 1.11.1) - jekyll-commonmark (1.1.0) - commonmarker (~> 0.14) - jekyll (>= 3.0, < 4.0) - jekyll-commonmark-ghpages (0.1.5) - commonmarker (~> 0.17.6) - jekyll-commonmark (~> 1) - rouge (~> 2) + jekyll-commonmark (1.4.0) + commonmarker (~> 0.22) + jekyll-commonmark-ghpages (0.4.0) + commonmarker (~> 0.23.7) + jekyll (~> 3.9.0) + jekyll-commonmark (~> 1.4.0) + rouge (>= 2.0, < 5.0) jekyll-default-layout (0.1.4) jekyll (~> 3.0) - jekyll-feed (0.9.2) - jekyll (~> 3.3) - jekyll-gist (1.4.1) + jekyll-feed (0.15.1) + jekyll (>= 3.7, < 5.0) + jekyll-gist (1.5.0) octokit (~> 4.2) - jekyll-github-metadata (2.9.3) - jekyll (~> 3.1) + jekyll-github-metadata (2.13.0) + jekyll (>= 3.4, < 5.0) octokit (~> 4.0, != 4.4.0) - jekyll-mentions (1.2.0) - activesupport (~> 4.0) + jekyll-include-cache (0.2.1) + jekyll (>= 3.7, < 5.0) + jekyll-mentions (1.6.0) html-pipeline (~> 2.3) - jekyll (~> 3.0) - jekyll-optional-front-matter (0.3.0) - jekyll (~> 3.0) + jekyll (>= 3.7, < 5.0) + jekyll-optional-front-matter (0.3.2) + jekyll (>= 3.0, < 5.0) jekyll-paginate (1.1.0) - jekyll-readme-index (0.2.0) - jekyll (~> 3.0) - jekyll-redirect-from (0.12.1) - jekyll (~> 3.3) - jekyll-relative-links (0.5.2) - jekyll (~> 3.3) - jekyll-remote-theme (0.2.3) - jekyll (~> 3.5) - rubyzip (>= 1.2.1, < 3.0) - typhoeus (>= 0.7, < 2.0) - jekyll-sass-converter (1.5.0) + jekyll-readme-index (0.3.0) + jekyll (>= 3.0, < 5.0) + jekyll-redirect-from (0.16.0) + jekyll (>= 3.3, < 5.0) + jekyll-relative-links (0.6.1) + jekyll (>= 3.3, < 5.0) + jekyll-remote-theme (0.4.3) + addressable 
(~> 2.0) + jekyll (>= 3.5, < 5.0) + jekyll-sass-converter (>= 1.0, <= 3.0.0, != 2.0.0) + rubyzip (>= 1.3.0, < 3.0) + jekyll-sass-converter (1.5.2) sass (~> 3.4) - jekyll-seo-tag (2.3.0) - jekyll (~> 3.3) - jekyll-sitemap (1.1.1) - jekyll (~> 3.3) - jekyll-swiss (0.4.0) - jekyll-theme-architect (0.1.0) - jekyll (~> 3.5) + jekyll-seo-tag (2.8.0) + jekyll (>= 3.8, < 5.0) + jekyll-sitemap (1.4.0) + jekyll (>= 3.7, < 5.0) + jekyll-swiss (1.0.0) + jekyll-theme-architect (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-cayman (0.1.0) - jekyll (~> 3.5) + jekyll-theme-cayman (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-dinky (0.1.0) - jekyll (~> 3.5) + jekyll-theme-dinky (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-hacker (0.1.0) - jekyll (~> 3.5) + jekyll-theme-hacker (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-leap-day (0.1.0) - jekyll (~> 3.5) + jekyll-theme-leap-day (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-merlot (0.1.0) - jekyll (~> 3.5) + jekyll-theme-merlot (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-midnight (0.1.0) - jekyll (~> 3.5) + jekyll-theme-midnight (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-minimal (0.1.0) - jekyll (~> 3.5) + jekyll-theme-minimal (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-modernist (0.1.0) - jekyll (~> 3.5) + jekyll-theme-modernist (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-primer (0.5.2) - jekyll (~> 3.5) + jekyll-theme-primer (0.6.0) + jekyll (> 3.5, < 5.0) jekyll-github-metadata (~> 2.9) - jekyll-seo-tag (~> 2.2) - jekyll-theme-slate (0.1.0) - jekyll (~> 3.5) jekyll-seo-tag (~> 2.0) - jekyll-theme-tactile (0.1.0) - jekyll (~> 3.5) + jekyll-theme-slate (0.2.0) + jekyll (> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-theme-time-machine (0.1.0) - jekyll (~> 3.5) + jekyll-theme-tactile (0.2.0) + jekyll 
(> 3.5, < 5.0) jekyll-seo-tag (~> 2.0) - jekyll-titles-from-headings (0.5.0) - jekyll (~> 3.3) - jekyll-watch (1.5.1) + jekyll-theme-time-machine (0.2.0) + jekyll (> 3.5, < 5.0) + jekyll-seo-tag (~> 2.0) + jekyll-titles-from-headings (0.5.3) + jekyll (>= 3.3, < 5.0) + jekyll-watch (2.2.1) listen (~> 3.0) - jemoji (0.8.1) - activesupport (~> 4.0, >= 4.2.9) + jemoji (0.12.0) gemoji (~> 3.0) html-pipeline (~> 2.2) - jekyll (>= 3.0) - kramdown (1.16.2) - liquid (4.0.0) - listen (3.0.6) - rb-fsevent (>= 0.9.3) - rb-inotify (>= 0.9.7) + jekyll (>= 3.0, < 5.0) + kramdown (2.3.2) + rexml + kramdown-parser-gfm (1.1.0) + kramdown (~> 2.0) + liquid (4.0.4) + listen (3.8.0) + rb-fsevent (~> 0.10, >= 0.10.3) + rb-inotify (~> 0.9, >= 0.9.10) mercenary (0.3.6) - mini_portile2 (2.8.0) - minima (2.1.1) - jekyll (~> 3.3) - minitest (5.11.3) - multipart-post (2.1.1) - net-dns (0.9.0) - nokogiri (1.13.3) - mini_portile2 (~> 2.8.0) + minima (2.5.1) + jekyll (>= 3.5, < 5.0) + jekyll-feed (~> 0.9) + jekyll-seo-tag (~> 2.1) + minitest (5.18.0) + nokogiri (1.14.2-x86_64-linux) racc (~> 1.4) - octokit (4.21.0) - faraday (>= 0.9) - sawyer (~> 0.8.0, >= 0.5.3) + octokit (4.25.1) + faraday (>= 1, < 3) + sawyer (~> 0.9) pathutil (0.16.2) forwardable-extended (~> 2.6) - public_suffix (2.0.5) - racc (1.6.0) - rb-fsevent (0.11.0) + public_suffix (4.0.7) + racc (1.6.2) + rb-fsevent (0.11.2) rb-inotify (0.10.1) ffi (~> 1.0) - rouge (2.2.1) - ruby-enum (0.7.2) - i18n - ruby2_keywords (0.0.4) - rubyzip (2.0.0) + rexml (3.2.5) + rouge (3.26.0) + ruby2_keywords (0.0.5) + rubyzip (2.3.2) safe_yaml (1.0.5) sass (3.7.4) sass-listen (~> 4.0.0) sass-listen (4.0.0) rb-fsevent (~> 0.9, >= 0.9.4) rb-inotify (~> 0.9, >= 0.9.7) - sawyer (0.8.2) + sawyer (0.9.2) addressable (>= 2.3.5) - faraday (> 0.8, < 2.0) + faraday (>= 0.17.3, < 3) + simpleidn (0.2.1) + unf (~> 0.1.4) terminal-table (1.8.0) unicode-display_width (~> 1.1, >= 1.1.1) - thread_safe (0.3.6) - typhoeus (0.8.0) - ethon (>= 0.8.0) - tzinfo (1.2.5) - 
thread_safe (~> 0.1) - unicode-display_width (1.3.0) + typhoeus (1.4.0) + ethon (>= 0.9.0) + tzinfo (2.0.6) + concurrent-ruby (~> 1.0) + unf (0.1.4) + unf_ext + unf_ext (0.0.8.2) + unicode-display_width (1.8.0) + webrick (1.8.1) PLATFORMS ruby DEPENDENCIES github-pages + webrick BUNDLED WITH - 1.16.1 + 2.4.8 From 23faf59f162b881eee634ba8df2b65d6b67a4113 Mon Sep 17 00:00:00 2001 From: James McCoy Date: Wed, 15 Mar 2023 09:57:25 -0400 Subject: [PATCH 051/347] cli: Bump tree-sitter dependency to 0.20.10 tree-sitter/tree-sitter#2085 added the ts_query_is_pattern_non_local API and its usage in tree-sitter-cli, so bump version accordingly. --- cli/Cargo.toml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/Cargo.toml b/cli/Cargo.toml index ad21f0e7..f228951d 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -41,7 +41,7 @@ webbrowser = "0.5.1" which = "4.1.0" [dependencies.tree-sitter] -version = "0.20.3" +version = "0.20.10" path = "../lib" [dependencies.tree-sitter-config] From a1388d9be152996492c425515187b6bc743fe9ca Mon Sep 17 00:00:00 2001 From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com> Date: Wed, 15 Mar 2023 16:10:11 +0000 Subject: [PATCH 052/347] Bump webbrowser from 0.5.5 to 0.8.3 Bumps [webbrowser](https://github.com/amodm/webbrowser-rs) from 0.5.5 to 0.8.3. - [Release notes](https://github.com/amodm/webbrowser-rs/releases) - [Changelog](https://github.com/amodm/webbrowser-rs/blob/main/CHANGELOG.md) - [Commits](https://github.com/amodm/webbrowser-rs/compare/v0.5.5...v0.8.3) --- updated-dependencies: - dependency-name: webbrowser dependency-type: direct:production ... 
Signed-off-by: dependabot[bot] --- Cargo.lock | 185 +++++++++++++++++++++++++++++++++++++++++++++++-- cli/Cargo.toml | 2 +- 2 files changed, 179 insertions(+), 8 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 4a844dc8..a863b14f 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -61,12 +61,24 @@ version = "3.11.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "572f695136211188308f16ad2ca5c851a712c464060ae6974944458eb83880ba" +[[package]] +name = "bytes" +version = "1.4.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "89b2fd2a0dcf38d7971e2194b6b6eebab45ae01067456a7fd93d5547a61b70be" + [[package]] name = "cc" version = "1.0.77" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "e9f73505338f7d905b19d18738976aae232eb46b8efc15554ffc56deb5d9ebe4" +[[package]] +name = "cesu8" +version = "1.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6d43a04d8753f35258c91f8ec639f792891f748a1edbd759cf1dcea3382ad83c" + [[package]] name = "cfg-if" version = "1.0.0" @@ -94,6 +106,32 @@ dependencies = [ "vec_map", ] +[[package]] +name = "combine" +version = "4.6.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "35ed6e9d84f0b51a7f52daf1c7d71dd136fd7a3f41a8462b8cdb8c78d920fad4" +dependencies = [ + "bytes", + "memchr", +] + +[[package]] +name = "core-foundation" +version = "0.9.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "194a7a9e6de53fa55116934067c844d9d749312f75c6f6d0980e8c252f8c2146" +dependencies = [ + "core-foundation-sys", + "libc", +] + +[[package]] +name = "core-foundation-sys" +version = "0.8.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5827cebf4670468b8772dd191856768aedcb1b0278a04f989f7766351917b9dc" + [[package]] name = "ctor" version = "0.1.26" @@ -125,6 +163,15 @@ dependencies = [ "dirs-sys", ] +[[package]] +name = "dirs" +version = "4.0.0" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "ca3aa72a6f96ea37bbc5aa912f6788242832f75369bdfdadcb0e38423f100059" +dependencies = [ + "dirs-sys", +] + [[package]] name = "dirs-sys" version = "0.3.7" @@ -151,6 +198,15 @@ dependencies = [ "instant", ] +[[package]] +name = "form_urlencoded" +version = "1.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a9c384f161156f5260c24a097c56119f9be8c798586aecc13afbcbe7b7e26bf8" +dependencies = [ + "percent-encoding", +] + [[package]] name = "getrandom" version = "0.2.8" @@ -198,6 +254,16 @@ version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "c4a1e36c821dbe04574f602848a19f742f4fb3c98d40449f11bcad18d6b17421" +[[package]] +name = "idna" +version = "0.3.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e14ddfc70884202db2244c223200c204c2bda1bc6e0998d11b5e024d657209e6" +dependencies = [ + "unicode-bidi", + "unicode-normalization", +] + [[package]] name = "indexmap" version = "1.9.2" @@ -223,6 +289,26 @@ version = "1.0.4" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "4217ad341ebadf8d8e724e264f13e593e0648f5b3e94b3896a5df283be015ecc" +[[package]] +name = "jni" +version = "0.20.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "039022cdf4d7b1cf548d31f60ae783138e5fd42013f6271049d7df7afadef96c" +dependencies = [ + "cesu8", + "combine", + "jni-sys", + "log", + "thiserror", + "walkdir", +] + +[[package]] +name = "jni-sys" +version = "0.3.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8eaf4bc02d17cbdd7ff4c7438cafcdf7fb9a4613313ad11b4f8fefe7d3fa0130" + [[package]] name = "js-sys" version = "0.3.60" @@ -263,12 +349,36 @@ dependencies = [ "cfg-if", ] +[[package]] +name = "malloc_buf" +version = "0.0.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"62bb907fe88d54d8d9ce32a3cceab4218ed2f6b7d35617cafe9adf84e43919cb" +dependencies = [ + "libc", +] + [[package]] name = "memchr" version = "2.5.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "2dffe52ecf27772e601905b7522cb4ef790d2cc203488bbd0e2fe85fcb74566d" +[[package]] +name = "ndk-context" +version = "0.1.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "27b02d87554356db9e9a873add8782d4ea6e3e58ea071a9adb9a2e8ddb884a8b" + +[[package]] +name = "objc" +version = "0.2.7" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "915b1b472bc21c53464d6c8461c9d3af805ba1ef837e1cac254428f4a77177b1" +dependencies = [ + "malloc_buf", +] + [[package]] name = "once_cell" version = "1.16.0" @@ -284,6 +394,12 @@ dependencies = [ "winapi", ] +[[package]] +name = "percent-encoding" +version = "2.2.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "478c572c3d73181ff3c2539045f6eb99e5491218eae919370993b890cdbdd98e" + [[package]] name = "ppv-lite86" version = "0.2.17" @@ -350,6 +466,12 @@ dependencies = [ "getrandom", ] +[[package]] +name = "raw-window-handle" +version = "0.5.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "4f851a03551ceefd30132e447f07f96cb7011d6b658374f3aed847333adb5559" + [[package]] name = "redox_syscall" version = "0.2.16" @@ -533,6 +655,21 @@ dependencies = [ "log", ] +[[package]] +name = "tinyvec" +version = "1.6.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "87cc5ceb3875bb20c2890005a4e226a4651264a5c75edb2421b52861a0a0cb50" +dependencies = [ + "tinyvec_macros", +] + +[[package]] +name = "tinyvec_macros" +version = "0.1.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1f3ccbac311fea05f86f61904b462b55fb3df8837a366dfc601a0161d0532f20" + [[package]] name = "toml" version = "0.5.9" @@ -561,7 +698,7 @@ dependencies = [ "clap", "ctor", "difference", - 
"dirs", + "dirs 3.0.2", "glob", "html-escape", "indexmap", @@ -595,7 +732,7 @@ name = "tree-sitter-config" version = "0.19.0" dependencies = [ "anyhow", - "dirs", + "dirs 3.0.2", "serde", "serde_json", ] @@ -615,7 +752,7 @@ version = "0.20.0" dependencies = [ "anyhow", "cc", - "dirs", + "dirs 3.0.2", "libloading", "once_cell", "regex", @@ -636,12 +773,27 @@ dependencies = [ "tree-sitter", ] +[[package]] +name = "unicode-bidi" +version = "0.3.11" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "524b68aca1d05e03fdf03fcdce2c6c94b6daf6d16861ddaa7e4f2b6638a9052c" + [[package]] name = "unicode-ident" version = "1.0.5" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "6ceab39d59e4c9499d4e5a8ee0e2735b891bb7308ac83dfb4e80cad195c9f6f3" +[[package]] +name = "unicode-normalization" +version = "0.1.22" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5c5713f0fc4b5db668a2ac63cdb7bb4469d8c9fed047b1d0292cc7b0ce2ba921" +dependencies = [ + "tinyvec", +] + [[package]] name = "unicode-width" version = "0.1.10" @@ -654,6 +806,17 @@ version = "0.2.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "5aa30f5ea51ff7edfc797c6d3f9ec8cbd8cfedef5371766b7181d33977f4814f" +[[package]] +name = "url" +version = "2.3.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "0d68c799ae75762b8c3fe375feb6600ef5602c883c5d21eb51c09f22b83c4643" +dependencies = [ + "form_urlencoded", + "idna", + "percent-encoding", +] + [[package]] name = "utf8-width" version = "0.1.6" @@ -749,10 +912,18 @@ dependencies = [ [[package]] name = "webbrowser" -version = "0.5.5" +version = "0.8.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ecad156490d6b620308ed411cfee90d280b3cbd13e189ea0d3fada8acc89158a" +checksum = "aa61ff77f695a94d9c8558e0bb5c362a8fd1f27c74663770fbc633acbafedbb6" dependencies = [ + "core-foundation", + "dirs 4.0.0", + "jni", + "log", + 
"ndk-context", + "objc", + "raw-window-handle", + "url", "web-sys", "widestring", "winapi", @@ -771,9 +942,9 @@ dependencies = [ [[package]] name = "widestring" -version = "0.4.3" +version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c168940144dd21fd8046987c16a46a33d5fc84eec29ef9dcddc2ac9e31526b7c" +checksum = "653f141f39ec16bba3c5abe400a0c60da7468261cc2cbf36805022876bc721a8" [[package]] name = "winapi" diff --git a/cli/Cargo.toml b/cli/Cargo.toml index f228951d..6d48e8b9 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -37,7 +37,7 @@ serde = { version = "1.0.130", features = ["derive"] } smallbitvec = "2.5.1" tiny_http = "0.12.0" walkdir = "2.3" -webbrowser = "0.5.1" +webbrowser = "0.8.3" which = "4.1.0" [dependencies.tree-sitter] From 457eb2fe761f1e4d0b6346154345007e040fa487 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 15 Mar 2023 14:48:47 +0200 Subject: [PATCH 053/347] Update Cargo.lock --- Cargo.lock | 294 +++++++++++++++++++++++++++++++++++++---------------- 1 file changed, 204 insertions(+), 90 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index a863b14f..7a675454 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -22,9 +22,9 @@ dependencies = [ [[package]] name = "anyhow" -version = "1.0.66" +version = "1.0.69" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "216261ddc8289130e551ddcd5ce8a064710c0d064a4d2895c67151c92b5443f6" +checksum = "224afbd727c3d6e4b90103ece64b8d1b67fbb1973b1046c2281eed3f3803f800" [[package]] name = "ascii" @@ -57,9 +57,9 @@ checksum = "bef38d45163c2f1dde094a7dfd33ccf595c92905c8f8f4fdc18d06fb1037718a" [[package]] name = "bumpalo" -version = "3.11.1" +version = "3.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "572f695136211188308f16ad2ca5c851a712c464060ae6974944458eb83880ba" +checksum = "0d261e256854913907f67ed06efbc3338dfe6179796deefc1ff763fc1aee5535" [[package]] name = "bytes" @@ -69,9 +69,9 @@ checksum = 
"89b2fd2a0dcf38d7971e2194b6b6eebab45ae01067456a7fd93d5547a61b70be" [[package]] name = "cc" -version = "1.0.77" +version = "1.0.79" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e9f73505338f7d905b19d18738976aae232eb46b8efc15554ffc56deb5d9ebe4" +checksum = "50d30906286121d95be3d479533b458f87493b30a4b5f79a607db8f5d11aa91f" [[package]] name = "cesu8" @@ -87,9 +87,9 @@ checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd" [[package]] name = "chunked_transfer" -version = "1.4.0" +version = "1.4.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fff857943da45f546682664a79488be82e69e43c1a7a2307679ab9afb3a66d2e" +checksum = "cca491388666e04d7248af3f60f0c40cfb0991c72205595d7c396e3510207d1a" [[package]] name = "clap" @@ -185,15 +185,36 @@ dependencies = [ [[package]] name = "either" -version = "1.8.0" +version = "1.8.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "90e5c1c8368803113bf0c9584fc495a58b86dc8a29edbf8fe877d21d9507e797" +checksum = "7fcaabb2fef8c910e7f4c7ce9f67a1283a1715879a7c230ca9d6d1ae31f16d91" + +[[package]] +name = "errno" +version = "0.2.8" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f639046355ee4f37944e44f60642c6f3a7efa3cf6b78c78a0d989a8ce6c396a1" +dependencies = [ + "errno-dragonfly", + "libc", + "winapi", +] + +[[package]] +name = "errno-dragonfly" +version = "0.1.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "aa68f1b12764fab894d2755d2518754e71b4fd80ecfb822714a1206c2aab39bf" +dependencies = [ + "cc", + "libc", +] [[package]] name = "fastrand" -version = "1.8.0" +version = "1.9.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a7a407cfaa3385c4ae6b23e84623d48c2798d06e3e6a1878f7f59f17b3f86499" +checksum = "e51093e27b0797c359783294ca4f0a911c270184cb10f85783b118614a1501be" dependencies = [ "instant", ] @@ -220,9 +241,9 @@ dependencies = [ 
[[package]] name = "glob" -version = "0.3.0" +version = "0.3.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9b919933a397b79c37e33b77bb2aa3dc8eb6e165ad809e58ff75bc7db2e34574" +checksum = "d2fabcfbdc87f4758337ca535fb41a6d701b65693ce38287d856d1674551ec9b" [[package]] name = "hashbrown" @@ -241,9 +262,9 @@ dependencies = [ [[package]] name = "html-escape" -version = "0.2.12" +version = "0.2.13" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "15315cfa9503e9aa85a477138eff76a1b203a430703548052c330b69d8d8c205" +checksum = "6d1ad449764d627e22bfd7cd5e8868264fc9236e07c752972b4080cd351cb476" dependencies = [ "utf8-width", ] @@ -284,10 +305,20 @@ dependencies = [ ] [[package]] -name = "itoa" -version = "1.0.4" +name = "io-lifetimes" +version = "1.0.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4217ad341ebadf8d8e724e264f13e593e0648f5b3e94b3896a5df283be015ecc" +checksum = "cfa919a82ea574332e2de6e74b4c36e74d41982b335080fa59d4ef31be20fdf3" +dependencies = [ + "libc", + "windows-sys 0.45.0", +] + +[[package]] +name = "itoa" +version = "1.0.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "453ad9f582a441959e5f0d088b02ce04cfe8d51a8eaf077f12ac6d3e94164ca6" [[package]] name = "jni" @@ -311,9 +342,9 @@ checksum = "8eaf4bc02d17cbdd7ff4c7438cafcdf7fb9a4613313ad11b4f8fefe7d3fa0130" [[package]] name = "js-sys" -version = "0.3.60" +version = "0.3.61" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "49409df3e3bf0856b916e2ceaca09ee28e6871cf7d9ce97a692cacfdb2a25a47" +checksum = "445dde2150c55e483f3d8416706b97ec8e8237c307e5b7b4b8dd15e6af2a0730" dependencies = [ "wasm-bindgen", ] @@ -326,9 +357,9 @@ checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" [[package]] name = "libc" -version = "0.2.138" +version = "0.2.140" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"db6d7e329c562c5dfab7a46a2afabc8b987ab9a4834c9d1ca04dc54c1546cef8" +checksum = "99227334921fae1a979cf0bfdfcc6b3e5ce376ef57e16fb6fb3ea2ed6095f80c" [[package]] name = "libloading" @@ -340,6 +371,12 @@ dependencies = [ "winapi", ] +[[package]] +name = "linux-raw-sys" +version = "0.1.4" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f051f77a7c8e6957c0696eac88f26b0117e54f52d3fc682ab19397a8812846a4" + [[package]] name = "log" version = "0.4.17" @@ -381,9 +418,9 @@ dependencies = [ [[package]] name = "once_cell" -version = "1.16.0" +version = "1.17.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "86f0b0d4bf799edbc74508c1e8bf170ff5f41238e5f8225603ca7caaae2b7860" +checksum = "b7e5500299e16ebb147ae15a00a942af264cf3688f47923b8fc2cd5858f23ad3" [[package]] name = "output_vt100" @@ -420,18 +457,18 @@ dependencies = [ [[package]] name = "proc-macro2" -version = "1.0.47" +version = "1.0.52" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5ea3d908b0e36316caf9e9e2c4625cdde190a7e6f440d794667ed17a1855e725" +checksum = "1d0e1ae9e836cc3beddd63db0df682593d7e2d3d891ae8c9083d2113e1744224" dependencies = [ "unicode-ident", ] [[package]] name = "quote" -version = "1.0.21" +version = "1.0.26" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "bbe448f377a7d6961e30f5955f9b8d106c3f5e449d493ee1b125c1d43c2b5179" +checksum = "4424af4bf778aae2051a77b60283332f386554255d722233d09fbfc7e30da2fc" dependencies = [ "proc-macro2", ] @@ -494,9 +531,9 @@ dependencies = [ [[package]] name = "regex" -version = "1.7.0" +version = "1.7.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e076559ef8e241f2ae3479e36f97bd5741c0330689e217ad51ce2c76808b868a" +checksum = "48aaa5748ba571fb95cd2c85c09f629215d3a6ece942baa100950af03a34f733" dependencies = [ "aho-corasick", "memchr", @@ -509,15 +546,6 @@ version = "0.6.28" source = 
"registry+https://github.com/rust-lang/crates.io-index" checksum = "456c603be3e8d448b072f410900c09faf164fbce2d480456f50eea6e25f9c848" -[[package]] -name = "remove_dir_all" -version = "0.5.3" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3acd125665422973a33ac9d3dd2df85edad0f4ae9b00dafb1a05e43a9f5ef8e7" -dependencies = [ - "winapi", -] - [[package]] name = "rustc-hash" version = "1.1.0" @@ -525,10 +553,24 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "08d43f7aa6b08d49f382cde6a7982047c3426db949b1424bc4b7ec9ae12c6ce2" [[package]] -name = "ryu" -version = "1.0.11" +name = "rustix" +version = "0.36.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4501abdff3ae82a1c1b477a17252eb69cee9e66eb915c1abaa4f44d873df9f09" +checksum = "fd5c6ff11fecd55b40746d1995a02f2eb375bf8c00d192d521ee09f42bef37bc" +dependencies = [ + "bitflags", + "errno", + "io-lifetimes", + "libc", + "linux-raw-sys", + "windows-sys 0.45.0", +] + +[[package]] +name = "ryu" +version = "1.0.13" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f91339c0467de62360649f8d3e185ca8de4224ff281f66000de5eb2a77a79041" [[package]] name = "same-file" @@ -541,24 +583,24 @@ dependencies = [ [[package]] name = "semver" -version = "1.0.14" +version = "1.0.17" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e25dfac463d778e353db5be2449d1cce89bd6fd23c9f1ea21310ce6e5a1b29c4" +checksum = "bebd363326d05ec3e2f532ab7660680f3b02130d780c299bca73469d521bc0ed" [[package]] name = "serde" -version = "1.0.149" +version = "1.0.156" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "256b9932320c590e707b94576e3cc1f7c9024d0ee6612dfbcf1cb106cbe8e055" +checksum = "314b5b092c0ade17c00142951e50ced110ec27cea304b1037c6969246c2469a4" dependencies = [ "serde_derive", ] [[package]] name = "serde_derive" -version = "1.0.149" +version = "1.0.156" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "b4eae9b04cbffdfd550eb462ed33bc6a1b68c935127d008b27444d08380f94e4" +checksum = "d7e29c4601e36bcec74a223228dce795f4cd3616341a4af93520ca1a837c087d" dependencies = [ "proc-macro2", "quote", @@ -567,9 +609,9 @@ dependencies = [ [[package]] name = "serde_json" -version = "1.0.89" +version = "1.0.94" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "020ff22c755c2ed3f8cf162dbb41a7268d934702f3ed3631656ea597e08fc3db" +checksum = "1c533a59c9d8a93a09c6ab31f0fd5e5f4dd1b8fc9434804029839884765d04ea" dependencies = [ "indexmap", "itoa", @@ -591,9 +633,9 @@ checksum = "8ea5119cdb4c55b55d432abb513a0429384878c15dde60cc77b1c99de1a95a6a" [[package]] name = "syn" -version = "1.0.105" +version = "1.0.109" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "60b9b43d45702de4c839cb9b51d9f529c5dd26a4aff255b42b1ebc03e88ee908" +checksum = "72b64191b275b66ffe2469e8af2c1cfe3bafa67b529ead792a6d0160888b4237" dependencies = [ "proc-macro2", "quote", @@ -602,16 +644,15 @@ dependencies = [ [[package]] name = "tempfile" -version = "3.3.0" +version = "3.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5cdb1ef4eaeeaddc8fbd371e5017057064af0911902ef36b39801f67cc6d79e4" +checksum = "af18f7ae1acd354b992402e9ec5864359d693cd8a79dcbef59f76891701c1e95" dependencies = [ "cfg-if", "fastrand", - "libc", "redox_syscall", - "remove_dir_all", - "winapi", + "rustix", + "windows-sys 0.42.0", ] [[package]] @@ -625,18 +666,18 @@ dependencies = [ [[package]] name = "thiserror" -version = "1.0.37" +version = "1.0.39" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "10deb33631e3c9018b9baf9dcbbc4f737320d2b576bac10f6aefa048fa407e3e" +checksum = "a5ab016db510546d856297882807df8da66a16fb8c4101cb8b30054b0d5b2d9c" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.37" +version = "1.0.39" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "982d17546b47146b28f7c22e3d08465f6b8903d0ea13c1660d9d84a6e7adcdbb" +checksum = "5420d42e90af0c38c3290abcca25b9b3bdf379fc9f55c528f53a269d9c9a267e" dependencies = [ "proc-macro2", "quote", @@ -672,9 +713,9 @@ checksum = "1f3ccbac311fea05f86f61904b462b55fb3df8837a366dfc601a0161d0532f20" [[package]] name = "toml" -version = "0.5.9" +version = "0.5.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8d82e1a7758622a465f8cee077614c73484dac5b836c02ff6a40d5d1010324d7" +checksum = "f4f7f0dd8d50a853a531c426359045b1998f04219d88799810762cd4ad314234" dependencies = [ "serde", ] @@ -781,9 +822,9 @@ checksum = "524b68aca1d05e03fdf03fcdce2c6c94b6daf6d16861ddaa7e4f2b6638a9052c" [[package]] name = "unicode-ident" -version = "1.0.5" +version = "1.0.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6ceab39d59e4c9499d4e5a8ee0e2735b891bb7308ac83dfb4e80cad195c9f6f3" +checksum = "e5464a87b239f13a63a501f2701565754bae92d243d4bb7eb12f6d57d2269bf4" [[package]] name = "unicode-normalization" @@ -848,9 +889,9 @@ checksum = "9c8d87e72b64a3b4db28d11ce29237c246188f4f51057d65a7eab63b7987e423" [[package]] name = "wasm-bindgen" -version = "0.2.83" +version = "0.2.84" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "eaf9f5aceeec8be17c128b2e93e031fb8a4d469bb9c4ae2d7dc1888b26887268" +checksum = "31f8dcbc21f30d9b8f2ea926ecb58f6b91192c17e9d33594b3df58b2007ca53b" dependencies = [ "cfg-if", "wasm-bindgen-macro", @@ -858,9 +899,9 @@ dependencies = [ [[package]] name = "wasm-bindgen-backend" -version = "0.2.83" +version = "0.2.84" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4c8ffb332579b0557b52d268b91feab8df3615f265d5270fec2a8c95b17c1142" +checksum = "95ce90fd5bcc06af55a641a86428ee4229e44e07033963a2290a8e241607ccb9" dependencies = [ "bumpalo", "log", @@ -873,9 +914,9 @@ dependencies = [ [[package]] name = 
"wasm-bindgen-macro" -version = "0.2.83" +version = "0.2.84" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "052be0f94026e6cbc75cdefc9bae13fd6052cdcaf532fa6c45e7ae33a1e6c810" +checksum = "4c21f77c0bedc37fd5dc21f897894a5ca01e7bb159884559461862ae90c0b4c5" dependencies = [ "quote", "wasm-bindgen-macro-support", @@ -883,9 +924,9 @@ dependencies = [ [[package]] name = "wasm-bindgen-macro-support" -version = "0.2.83" +version = "0.2.84" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "07bc0c051dc5f23e307b13285f9d75df86bfdf816c5721e573dec1f9b8aa193c" +checksum = "2aff81306fcac3c7515ad4e177f521b5c9a15f2b08f4e32d823066102f35a5f6" dependencies = [ "proc-macro2", "quote", @@ -896,15 +937,15 @@ dependencies = [ [[package]] name = "wasm-bindgen-shared" -version = "0.2.83" +version = "0.2.84" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1c38c045535d93ec4f0b4defec448e4291638ee608530863b1e2ba115d4fff7f" +checksum = "0046fef7e28c3804e5e38bfa31ea2a0f73905319b677e57ebe37e49358989b5d" [[package]] name = "web-sys" -version = "0.3.60" +version = "0.3.61" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "bcda906d8be16e728fd5adc5b729afad4e444e106ab28cd1c7256e54fa61510f" +checksum = "e33b99f4b23ba3eec1a53ac264e35a755f00e966e0065077d6027c0f575b0b97" dependencies = [ "js-sys", "wasm-bindgen", @@ -912,9 +953,9 @@ dependencies = [ [[package]] name = "webbrowser" -version = "0.8.3" +version = "0.8.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "aa61ff77f695a94d9c8558e0bb5c362a8fd1f27c74663770fbc633acbafedbb6" +checksum = "97d1fa1e5c829b2bf9eb1e28fb950248b797cd6a04866fbdfa8bc31e5eef4c78" dependencies = [ "core-foundation", "dirs 4.0.0", @@ -925,27 +966,19 @@ dependencies = [ "raw-window-handle", "url", "web-sys", - "widestring", - "winapi", ] [[package]] name = "which" -version = "4.3.0" +version = "4.4.0" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "1c831fbbee9e129a8cf93e7747a82da9d95ba8e16621cae60ec2cdc849bacb7b" +checksum = "2441c784c52b289a054b7201fc93253e288f094e2f4be9058343127c4226a269" dependencies = [ "either", "libc", "once_cell", ] -[[package]] -name = "widestring" -version = "1.0.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "653f141f39ec16bba3c5abe400a0c60da7468261cc2cbf36805022876bc721a8" - [[package]] name = "winapi" version = "0.3.9" @@ -976,3 +1009,84 @@ name = "winapi-x86_64-pc-windows-gnu" version = "0.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "712e227841d057c1ee1cd2fb22fa7e5a5461ae8e48fa2ca79ec42cfc1931183f" + +[[package]] +name = "windows-sys" +version = "0.42.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "5a3e1820f08b8513f676f7ab6c1f99ff312fb97b553d30ff4dd86f9f15728aa7" +dependencies = [ + "windows_aarch64_gnullvm", + "windows_aarch64_msvc", + "windows_i686_gnu", + "windows_i686_msvc", + "windows_x86_64_gnu", + "windows_x86_64_gnullvm", + "windows_x86_64_msvc", +] + +[[package]] +name = "windows-sys" +version = "0.45.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "75283be5efb2831d37ea142365f009c02ec203cd29a3ebecbc093d52315b66d0" +dependencies = [ + "windows-targets", +] + +[[package]] +name = "windows-targets" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8e5180c00cd44c9b1c88adb3693291f1cd93605ded80c250a75d472756b4d071" +dependencies = [ + "windows_aarch64_gnullvm", + "windows_aarch64_msvc", + "windows_i686_gnu", + "windows_i686_msvc", + "windows_x86_64_gnu", + "windows_x86_64_gnullvm", + "windows_x86_64_msvc", +] + +[[package]] +name = "windows_aarch64_gnullvm" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "597a5118570b68bc08d8d59125332c54f1ba9d9adeedeef5b99b02ba2b0698f8" + 
+[[package]] +name = "windows_aarch64_msvc" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "e08e8864a60f06ef0d0ff4ba04124db8b0fb3be5776a5cd47641e942e58c4d43" + +[[package]] +name = "windows_i686_gnu" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "c61d927d8da41da96a81f029489353e68739737d3beca43145c8afec9a31a84f" + +[[package]] +name = "windows_i686_msvc" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "44d840b6ec649f480a41c8d80f9c65108b92d89345dd94027bfe06ac444d1060" + +[[package]] +name = "windows_x86_64_gnu" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8de912b8b8feb55c064867cf047dda097f92d51efad5b491dfb98f6bbb70cb36" + +[[package]] +name = "windows_x86_64_gnullvm" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "26d41b46a36d453748aedef1486d5c7a85db22e56aff34643984ea85514e94a3" + +[[package]] +name = "windows_x86_64_msvc" +version = "0.42.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "9aec5da331524158c6d1a4ac0ab1541149c0b9505fde06423b02f5ef0106b9f0" From 62f8c431aeee91894c79a5cf507399a6f764a4ba Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 16 Mar 2023 15:02:04 +0200 Subject: [PATCH 054/347] test: add `retry` and `test_with_seed` proc macros --- Cargo.lock | 11 +++ cli/Cargo.toml | 2 + cli/src/tests/proc_macro/Cargo.toml | 14 +++ cli/src/tests/proc_macro/src/lib.rs | 137 ++++++++++++++++++++++++++++ 4 files changed, 164 insertions(+) create mode 100644 cli/src/tests/proc_macro/Cargo.toml create mode 100644 cli/src/tests/proc_macro/src/lib.rs diff --git a/Cargo.lock b/Cargo.lock index 7a675454..404c269f 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -464,6 +464,16 @@ dependencies = [ "unicode-ident", ] +[[package]] +name = "proc_macro" +version = "0.1.0" +dependencies = [ 
+ "proc-macro2", + "quote", + "rand", + "syn", +] + [[package]] name = "quote" version = "1.0.26" @@ -746,6 +756,7 @@ dependencies = [ "lazy_static", "log", "pretty_assertions", + "proc_macro", "rand", "regex", "regex-syntax", diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 6d48e8b9..47e03284 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -69,6 +69,8 @@ version = "0.4.6" features = ["std"] [dev-dependencies] +proc_macro = { path = "src/tests/proc_macro" } + rand = "0.8" tempfile = "3" pretty_assertions = "0.7.2" diff --git a/cli/src/tests/proc_macro/Cargo.toml b/cli/src/tests/proc_macro/Cargo.toml new file mode 100644 index 00000000..a9a2b146 --- /dev/null +++ b/cli/src/tests/proc_macro/Cargo.toml @@ -0,0 +1,14 @@ +[package] +name = "proc_macro" +version = "0.1.0" +edition = "2021" +publish = false + +[lib] +proc-macro = true + +[dependencies] +proc-macro2 = "1" +quote = "1" +rand = "0.8.5" +syn = { version = "1", features = ["full"] } diff --git a/cli/src/tests/proc_macro/src/lib.rs b/cli/src/tests/proc_macro/src/lib.rs new file mode 100644 index 00000000..d831a75b --- /dev/null +++ b/cli/src/tests/proc_macro/src/lib.rs @@ -0,0 +1,137 @@ +use proc_macro::TokenStream; +use proc_macro2::Span; +use quote::quote; +use syn::{ + parse::{Parse, ParseStream}, + parse_macro_input, Error, Expr, Ident, ItemFn, LitInt, Token, +}; + +#[proc_macro_attribute] +pub fn retry(args: TokenStream, input: TokenStream) -> TokenStream { + let count = parse_macro_input!(args as LitInt); + let input = parse_macro_input!(input as ItemFn); + let attrs = input.attrs.clone(); + let name = input.sig.ident.clone(); + + TokenStream::from(quote! 
{ + #(#attrs),* + fn #name() { + #input + + for i in 0..=#count { + let result = std::panic::catch_unwind(|| { + #name(); + }); + + if result.is_ok() { + return; + } + + if i == #count { + std::panic::resume_unwind(result.unwrap_err()); + } + } + } + }) +} + +#[proc_macro_attribute] +pub fn test_with_seed(args: TokenStream, input: TokenStream) -> TokenStream { + struct Args { + retry: LitInt, + seed: Expr, + seed_fn: Option, + } + + impl Parse for Args { + fn parse(input: ParseStream) -> syn::Result { + let mut retry = None; + let mut seed = None; + let mut seed_fn = None; + + while !input.is_empty() { + let name = input.parse::()?; + match name.to_string().as_str() { + "retry" => { + input.parse::()?; + retry.replace(input.parse()?); + } + "seed" => { + input.parse::()?; + seed.replace(input.parse()?); + } + "seed_fn" => { + input.parse::()?; + seed_fn.replace(input.parse()?); + } + x => { + return Err(Error::new( + name.span(), + format!("Unsupported parameter `{x}`"), + )) + } + } + + if !input.is_empty() { + input.parse::()?; + } + } + + if retry.is_none() { + retry.replace(LitInt::new("0", Span::mixed_site())); + } + + Ok(Args { + retry: retry.expect("`retry` parameter is requred"), + seed: seed.expect("`initial_seed` parameter is required"), + seed_fn, + }) + } + } + + let Args { + retry, + seed, + seed_fn, + } = parse_macro_input!(args as Args); + + let seed_fn = seed_fn.iter(); + + let func = parse_macro_input!(input as ItemFn); + let attrs = func.attrs.clone(); + let name = func.sig.ident.clone(); + + // dbg!(quote::ToTokens::into_token_stream(&func)); + + TokenStream::from(quote! 
{ + #[test] + #(#attrs),* + fn #name() { + #func + + let mut seed = #seed; + + for i in 0..=#retry { + let result = std::panic::catch_unwind(|| { + #name(seed); + }); + + if result.is_ok() { + return; + } + + if i == #retry { + std::panic::resume_unwind(result.unwrap_err()); + } + + #( + seed = #seed_fn(); + )* + + if i < #retry { + println!("\nRetry {}/{} with a new seed {}", i + 1, #retry, seed); + } + } + } + }) +} From 588549c09388dd6586cfbb06c06f8eeba436f38f Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 16 Mar 2023 15:02:59 +0200 Subject: [PATCH 055/347] test: run `test_parsing_with_a_timeout` with 10 retries --- cli/src/tests/parser_test.rs | 2 ++ 1 file changed, 2 insertions(+) diff --git a/cli/src/tests/parser_test.rs b/cli/src/tests/parser_test.rs index 30b12336..78c6cda4 100644 --- a/cli/src/tests/parser_test.rs +++ b/cli/src/tests/parser_test.rs @@ -8,6 +8,7 @@ use crate::{ generate::generate_parser_for_grammar, parse::{perform_edit, Edit}, }; +use proc_macro::retry; use std::{ sync::atomic::{AtomicUsize, Ordering}, thread, time, @@ -638,6 +639,7 @@ fn test_parsing_cancelled_by_another_thread() { // Timeouts #[test] +#[retry(10)] fn test_parsing_with_a_timeout() { let mut parser = Parser::new(); parser.set_language(get_language("json")).unwrap(); From 3aeef44eb651b77b7392d5ee89fa4d92273b8e0c Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 16 Mar 2023 15:08:23 +0200 Subject: [PATCH 056/347] test: run all corpus tests with 10 retries --- cli/src/tests/corpus_test.rs | 95 +++++++++++++++++++----------------- 1 file changed, 50 insertions(+), 45 deletions(-) diff --git a/cli/src/tests/corpus_test.rs b/cli/src/tests/corpus_test.rs index 401a99a5..b818b2c1 100644 --- a/cli/src/tests/corpus_test.rs +++ b/cli/src/tests/corpus_test.rs @@ -2,6 +2,7 @@ use super::helpers::{ allocations, edits::{get_random_edit, invert_edit}, fixtures::{fixtures_dir, get_language, get_test_language}, + new_seed, random::Rand, scope_sequence::ScopeSequence, 
EDIT_COUNT, EXAMPLE_FILTER, ITERATION_COUNT, LANGUAGE_FILTER, LOG_ENABLED, LOG_GRAPH_ENABLED, @@ -13,70 +14,71 @@ use crate::{ test::{parse_tests, print_diff, print_diff_key, strip_sexp_fields, TestEntry}, util, }; -use std::fs; +use proc_macro::test_with_seed; +use std::{env, fs}; use tree_sitter::{LogType, Node, Parser, Point, Range, Tree}; -#[test] -fn test_bash_corpus() { - test_language_corpus("bash"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_bash(seed: usize) { + test_language_corpus(seed, "bash"); } -#[test] -fn test_c_corpus() { - test_language_corpus("c"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_c(seed: usize) { + test_language_corpus(seed, "c"); } -#[test] -fn test_cpp_corpus() { - test_language_corpus("cpp"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_cpp(seed: usize) { + test_language_corpus(seed, "cpp"); } -#[test] -fn test_embedded_template_corpus() { - test_language_corpus("embedded-template"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_embedded_template(seed: usize) { + test_language_corpus(seed, "embedded-template"); } -#[test] -fn test_go_corpus() { - test_language_corpus("go"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_go(seed: usize) { + test_language_corpus(seed, "go"); } -#[test] -fn test_html_corpus() { - test_language_corpus("html"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_html(seed: usize) { + test_language_corpus(seed, "html"); } -#[test] -fn test_javascript_corpus() { - test_language_corpus("javascript"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_javascript(seed: usize) { + test_language_corpus(seed, "javascript"); } -#[test] -fn test_json_corpus() { - test_language_corpus("json"); +#[test_with_seed(retry=10, seed=*START_SEED, 
seed_fn=new_seed)] +fn test_corpus_for_json(seed: usize) { + test_language_corpus(seed, "json"); } -#[test] -fn test_php_corpus() { - test_language_corpus("php"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_php(seed: usize) { + test_language_corpus(seed, "php"); } -#[test] -fn test_python_corpus() { - test_language_corpus("python"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_python(seed: usize) { + test_language_corpus(seed, "python"); } -#[test] -fn test_ruby_corpus() { - test_language_corpus("ruby"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_ruby(seed: usize) { + test_language_corpus(seed, "ruby"); } -#[test] -fn test_rust_corpus() { - test_language_corpus("rust"); +#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] +fn test_corpus_for_rust(seed: usize) { + test_language_corpus(seed, "rust"); } -fn test_language_corpus(language_name: &str) { +fn test_language_corpus(start_seed: usize, language_name: &str) { let grammars_dir = fixtures_dir().join("grammars"); let error_corpus_dir = fixtures_dir().join("error_corpus"); let template_corpus_dir = fixtures_dir().join("template_corpus"); @@ -100,6 +102,10 @@ fn test_language_corpus(language_name: &str) { let language = get_language(language_name); let mut failure_count = 0; + + let log_seed = env::var("TREE_SITTER_LOG_SEED").is_ok(); + + println!(); for test in tests { println!(" {} example - {}", language_name, test.name); @@ -140,7 +146,7 @@ fn test_language_corpus(language_name: &str) { drop(parser); for trial in 0..*ITERATION_COUNT { - let seed = *START_SEED + trial; + let seed = start_seed + trial; let passed = allocations::record(|| { let mut rand = Rand::new(seed); let mut log_session = None; @@ -161,7 +167,9 @@ fn test_language_corpus(language_name: &str) { perform_edit(&mut tree, &mut input, &edit); } - // println!(" seed: {}", seed); + if log_seed { + println!(" seed: {}", 
seed); + } if *LOG_GRAPH_ENABLED { eprintln!("{}\n", String::from_utf8_lossy(&input)); @@ -173,10 +181,7 @@ fn test_language_corpus(language_name: &str) { // Check that the new tree is consistent. check_consistent_sizes(&tree2, &input); if let Err(message) = check_changed_ranges(&tree, &tree2, &input) { - println!( - "\nUnexpected scope change in seed {}\n{}\n\n", - seed, message - ); + println!("\nUnexpected scope change in seed {seed} with start seed {start_seed}\n{message}\n\n",); return false; } @@ -211,7 +216,7 @@ fn test_language_corpus(language_name: &str) { // Check that the edited tree is consistent. check_consistent_sizes(&tree3, &input); if let Err(message) = check_changed_ranges(&tree2, &tree3, &input) { - eprintln!("Unexpected scope change in seed {}\n{}\n\n", seed, message); + println!("Unexpected scope change in seed {seed} with start seed {start_seed}\n{message}\n\n"); return false; } From ddb0af95098cf04a307d5ea6e93d77a00643c5d7 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 16 Mar 2023 15:08:56 +0200 Subject: [PATCH 057/347] test: use random SEED numbers This is needed to omit occurrences of the same seed in a sequence of following seeds due to the reason of that two initial seed are very close if based on unix epoch seconds. --- cli/src/tests/helpers/mod.rs | 16 ++++++++++------ 1 file changed, 10 insertions(+), 6 deletions(-) diff --git a/cli/src/tests/helpers/mod.rs b/cli/src/tests/helpers/mod.rs index def0ea3e..54df8809 100644 --- a/cli/src/tests/helpers/mod.rs +++ b/cli/src/tests/helpers/mod.rs @@ -6,7 +6,8 @@ pub(super) mod random; pub(super) mod scope_sequence; use lazy_static::lazy_static; -use std::{env, time, usize}; +use rand::Rng; +use std::env; lazy_static! { pub static ref LOG_ENABLED: bool = env::var("TREE_SITTER_LOG").is_ok(); @@ -16,11 +17,7 @@ lazy_static! { } lazy_static! 
{ - pub static ref START_SEED: usize = - int_env_var("TREE_SITTER_SEED").unwrap_or_else(|| time::SystemTime::now() - .duration_since(time::UNIX_EPOCH) - .unwrap() - .as_secs() as usize,); + pub static ref START_SEED: usize = new_seed(); pub static ref EDIT_COUNT: usize = int_env_var("TREE_SITTER_EDITS").unwrap_or(3); pub static ref ITERATION_COUNT: usize = int_env_var("TREE_SITTER_ITERATIONS").unwrap_or(10); } @@ -28,3 +25,10 @@ lazy_static! { fn int_env_var(name: &'static str) -> Option { env::var(name).ok().and_then(|e| e.parse().ok()) } + +pub(crate) fn new_seed() -> usize { + int_env_var("TREE_SITTER_SEED").unwrap_or_else(|| { + let mut rng = rand::thread_rng(); + rng.gen::() + }) +} From 78fd9196f7cda76d105ddbd34641e010272efc8b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 16 Mar 2023 17:29:27 +0200 Subject: [PATCH 058/347] ci: drop AppVeyor and its badge --- .appveyor.yml | 50 -------------------------------------------------- README.md | 1 - 2 files changed, 51 deletions(-) delete mode 100644 .appveyor.yml diff --git a/.appveyor.yml b/.appveyor.yml deleted file mode 100644 index d463b7a2..00000000 --- a/.appveyor.yml +++ /dev/null @@ -1,50 +0,0 @@ -build: false -install: - # Terminate early unless building either a tag or a PR. 
- - if "%APPVEYOR_REPO_TAG%" == "false" if not "%APPVEYOR_REPO_BRANCH%" == "master" appveyor exit - - # Install rust - - appveyor DownloadFile https://win.rustup.rs/ -FileName rustup-init.exe - - IF "%PLATFORM%" == "x86" rustup-init -y --default-toolchain stable --default-host i686-pc-windows-msvc - - IF "%PLATFORM%" == "x64" rustup-init -y --default-toolchain stable --default-host x86_64-pc-windows-msvc - - set PATH=%PATH%;C:\Users\appveyor\.cargo\bin - - rustc -vV - - cargo -vV - - # Install dependencies - - git submodule update --init - -platform: - - x64 - - x86 - -test_script: - # Fetch and regenerate the fixture parsers - - script\fetch-fixtures.cmd - - cargo build --release - - script\generate-fixtures.cmd - - # Run tests - - script\test.cmd - - script\benchmark.cmd - -before_deploy: - - move target\release\tree-sitter.exe tree-sitter.exe - - 7z a -tgzip tree-sitter-windows-%PLATFORM%.gz tree-sitter.exe - - appveyor PushArtifact tree-sitter-windows-%PLATFORM%.gz - -deploy: - description: '' - provider: GitHub - auth_token: - secure: VC9ntV5+inKoNteZyLQksKzWMKXF46P+Jx3JHKVSfF+o1rWtZn2iIHAVsQv5LaUi - artifact: /tree-sitter-windows-.*/ - draft: true - force_update: true - on: - APPVEYOR_REPO_TAG: true - -cache: - - target - - test\fixtures\grammars - - C:\Users\appveyor\.cargo diff --git a/README.md b/README.md index 2d1e911d..f3c4abc2 100644 --- a/README.md +++ b/README.md @@ -1,7 +1,6 @@ # tree-sitter [![Build Status](https://github.com/tree-sitter/tree-sitter/workflows/CI/badge.svg)](https://github.com/tree-sitter/tree-sitter/actions) -[![Build status](https://ci.appveyor.com/api/projects/status/vtmbd6i92e97l55w/branch/master?svg=true)](https://ci.appveyor.com/project/maxbrunsfeld/tree-sitter/branch/master) [![DOI](https://zenodo.org/badge/14164618.svg)](https://zenodo.org/badge/latestdoi/14164618) Tree-sitter is a parser generator tool and an incremental parsing library. 
It can build a concrete syntax tree for a source file and efficiently update the syntax tree as the source file is edited. Tree-sitter aims to be: From ec2af46f6fa8fc73204270397051f9e06fb5e32c Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 16 Mar 2023 18:00:02 +0200 Subject: [PATCH 059/347] chore: remove all dead badges --- cli/README.md | 2 -- highlight/README.md | 2 -- lib/binding_rust/README.md | 2 -- lib/binding_web/README.md | 2 -- 4 files changed, 8 deletions(-) diff --git a/cli/README.md b/cli/README.md index fe45b17b..8cdda9c0 100644 --- a/cli/README.md +++ b/cli/README.md @@ -1,8 +1,6 @@ Tree-sitter CLI =============== -[![Build Status](https://travis-ci.org/tree-sitter/tree-sitter.svg?branch=master)](https://travis-ci.org/tree-sitter/tree-sitter) -[![Build status](https://ci.appveyor.com/api/projects/status/vtmbd6i92e97l55w/branch/master?svg=true)](https://ci.appveyor.com/project/maxbrunsfeld/tree-sitter/branch/master) [![Crates.io](https://img.shields.io/crates/v/tree-sitter-cli.svg)](https://crates.io/crates/tree-sitter-cli) The Tree-sitter CLI allows you to develop, test, and use Tree-sitter grammars from the command line. It works on MacOS, Linux, and Windows. 
diff --git a/highlight/README.md b/highlight/README.md index c04c7c08..e8a5d063 100644 --- a/highlight/README.md +++ b/highlight/README.md @@ -1,7 +1,5 @@ # `tree-sitter-highlight` -[![Build Status](https://travis-ci.org/tree-sitter/tree-sitter.svg?branch=master)](https://travis-ci.org/tree-sitter/tree-sitter) -[![Build status](https://ci.appveyor.com/api/projects/status/vtmbd6i92e97l55w/branch/master?svg=true)](https://ci.appveyor.com/project/maxbrunsfeld/tree-sitter/branch/master) [![Crates.io](https://img.shields.io/crates/v/tree-sitter-highlight.svg)](https://crates.io/crates/tree-sitter-highlight) ### Usage diff --git a/lib/binding_rust/README.md b/lib/binding_rust/README.md index 6b48630a..dffe7661 100644 --- a/lib/binding_rust/README.md +++ b/lib/binding_rust/README.md @@ -1,7 +1,5 @@ # Rust Tree-sitter -[![Build Status](https://travis-ci.org/tree-sitter/tree-sitter.svg?branch=master)](https://travis-ci.org/tree-sitter/tree-sitter) -[![Build status](https://ci.appveyor.com/api/projects/status/vtmbd6i92e97l55w/branch/master?svg=true)](https://ci.appveyor.com/project/maxbrunsfeld/tree-sitter/branch/master) [![Crates.io](https://img.shields.io/crates/v/tree-sitter.svg)](https://crates.io/crates/tree-sitter) Rust bindings to the [Tree-sitter][] parsing library. diff --git a/lib/binding_web/README.md b/lib/binding_web/README.md index 0c0f5246..a75cd9f0 100644 --- a/lib/binding_web/README.md +++ b/lib/binding_web/README.md @@ -1,8 +1,6 @@ Web Tree-sitter =============== -[![Build Status](https://travis-ci.org/tree-sitter/tree-sitter.svg?branch=master)](https://travis-ci.org/tree-sitter/tree-sitter) - WebAssembly bindings to the [Tree-sitter](https://github.com/tree-sitter/tree-sitter) parsing library. 
### Setup From cc4f932d175b65e6fc9a55df5c55fc0b3a7d9ada Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 02:38:29 +0300 Subject: [PATCH 060/347] cicd: new workflow --- .github/scripts/cross.sh | 10 ++ .github/scripts/make.sh | 19 +++ .github/scripts/tree-sitter.sh | 12 ++ .github/workflows/CICD.yml | 69 ++++++++++ .github/workflows/build.yml | 171 +++++++++++++++++++++++++ .github/workflows/ci.yml | 150 ---------------------- .github/workflows/fast_checks.yml | 31 +++++ .github/workflows/full_rust_checks.yml | 32 +++++ .github/workflows/msrv.yml | 42 ++++++ .github/workflows/publish.yml | 21 +++ .github/workflows/release.yml | 101 +++++++++++++++ Cargo.lock | 157 ++++++++++++----------- script/generate-fixtures | 12 +- script/generate-fixtures-wasm | 12 +- 14 files changed, 611 insertions(+), 228 deletions(-) create mode 100755 .github/scripts/cross.sh create mode 100755 .github/scripts/make.sh create mode 100755 .github/scripts/tree-sitter.sh create mode 100644 .github/workflows/CICD.yml create mode 100644 .github/workflows/build.yml delete mode 100644 .github/workflows/ci.yml create mode 100644 .github/workflows/fast_checks.yml create mode 100644 .github/workflows/full_rust_checks.yml create mode 100644 .github/workflows/msrv.yml create mode 100644 .github/workflows/publish.yml create mode 100644 .github/workflows/release.yml diff --git a/.github/scripts/cross.sh b/.github/scripts/cross.sh new file mode 100755 index 00000000..07017192 --- /dev/null +++ b/.github/scripts/cross.sh @@ -0,0 +1,10 @@ +#!/bin/bash + +set -x +set -e + +if [ "$CROSS" != 1 ]; then + exit 111 +fi + +docker run --rm -v /home/runner:/home/runner -w "$PWD" "$CROSS_IMAGE" "$@" diff --git a/.github/scripts/make.sh b/.github/scripts/make.sh new file mode 100755 index 00000000..62aa0c06 --- /dev/null +++ b/.github/scripts/make.sh @@ -0,0 +1,19 @@ +#!/bin/bash + +set -x +set -e + +if [ "$CROSS" = 1 ]; then + if [ -z "$CC" ]; then + echo "make.sh: CC is not set" >&2 + exit 111 + 
fi + if [ -z "$AR" ]; then + echo "make.sh: AR is not set" >&2 + exit 111 + fi + + cross.sh make CC=$CC AR=$AR "$@" +else + make "$@" +fi diff --git a/.github/scripts/tree-sitter.sh b/.github/scripts/tree-sitter.sh new file mode 100755 index 00000000..2e6e31c2 --- /dev/null +++ b/.github/scripts/tree-sitter.sh @@ -0,0 +1,12 @@ +#!/bin/bash + +set -x +set -e + +tree_sitter="$ROOT"/target/"$TARGET"/release/tree-sitter + +if [ "$CROSS" = 1 ]; then + cross.sh $CROSS_RUNNER "$tree_sitter" "$@" +else + "$tree_sitter" "$@" +fi diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml new file mode 100644 index 00000000..7c2351a8 --- /dev/null +++ b/.github/workflows/CICD.yml @@ -0,0 +1,69 @@ +name: CICD + +on: + workflow_dispatch: + pull_request: + push: + branches: + - master + - check/* + +concurrency: + group: '${{ github.workflow }} @ ${{ github.event.pull_request.head.label || github.head_ref || github.ref }}' + cancel-in-progress: true + +jobs: + init: + name: Init + runs-on: ubuntu-latest + steps: + - name: Get PR head ref + if: ${{ github.event_name == 'pull_request' }} + id: ref + run: | + echo "ref=refs/pull/${{ github.event.pull_request.number }}/head" >> $GITHUB_OUTPUT + outputs: + ref: >- + ${{ + (github.event_name == 'pull_request' && startsWith(github.head_ref, 'release/v')) + && steps.ref.outputs.ref + || github.ref + }} + + fast_checks: + name: Fast checks + uses: ./.github/workflows/fast_checks.yml + + full_checks: + name: Full Rust checks + needs: fast_checks + uses: ./.github/workflows/full_rust_checks.yml + + min_version: + name: Minimum supported rust version + needs: fast_checks + uses: ./.github/workflows/msrv.yml + with: + package: tree-sitter-cli + + build: + name: Build & Test + needs: [init, fast_checks] + uses: ./.github/workflows/build.yml + with: + ref: ${{ needs.init.outputs.ref }} + + release: + name: Release + needs: [init, fast_checks, full_checks, min_version, build] + if: > + github.event.pull_request.head.repo.full_name == 
github.repository && + startsWith(github.head_ref, 'release/v') + uses: ./.github/workflows/release.yml + with: + ref: ${{ needs.init.outputs.ref }} + + publish: + name: Publish + needs: release + uses: ./.github/workflows/publish.yml diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml new file mode 100644 index 00000000..27b31085 --- /dev/null +++ b/.github/workflows/build.yml @@ -0,0 +1,171 @@ +name: Build & Test + +env: + CARGO_TERM_COLOR: always + RUSTFLAGS: "-D warnings" + CROSS_DEBUG: 1 + +on: + workflow_call: + inputs: + ref: + default: ${{ github.ref }} + type: string + +jobs: + build: + name: ${{ matrix.job.name }} (${{ matrix.job.target }}) (${{ matrix.job.os }}) + runs-on: ${{ matrix.job.os }} + strategy: + fail-fast: false + matrix: + job: + - { name: linux-aarch64 , target: aarch64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { name: linux-arm , target: arm-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } + - { name: linux-x64 , target: x86_64-unknown-linux-gnu , os: ubuntu-latest } + - { name: linux-x86 , target: i686-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { name: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } + - { name: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } + - { name: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } + + env: + BUILD_CMD: cargo + + defaults: + run: + shell: bash + + steps: + - name: Checkout source code + uses: actions/checkout@v3 + with: + ref: ${{ inputs.ref }} + + - name: Read Emscripten version + run: | + echo "EMSCRIPTEN_VERSION=$(cat cli/emscripten-version)" >> $GITHUB_ENV + + - name: Install Emscripten + uses: mymindstorm/setup-emsdk@v12 + with: + version: ${{ env.EMSCRIPTEN_VERSION }} + + - name: Install Rust toolchain + uses: dtolnay/rust-toolchain@stable + with: + targets: ${{ matrix.job.target }} + + - name: Install cross + if: matrix.job.use-cross + uses: taiki-e/install-action@v2 + with: 
+ tool: cross + + - name: Build custom cross image + if: ${{ matrix.job.use-cross && matrix.job.os == 'ubuntu-latest' }} + run: | + cd .. + + target="${{ matrix.job.target }}" + image=ghcr.io/cross-rs/$target:custom + echo "CROSS_IMAGE=$image" >> $GITHUB_ENV + + echo "[target.$target]" >> Cross.toml + echo "image = \"$image\"" >> Cross.toml + echo "CROSS_CONFIG=$PWD/Cross.toml" >> $GITHUB_ENV + + echo "FROM ghcr.io/cross-rs/$target:edge" >> Dockerfile + echo "ENV DEBIAN_FRONTEND=noninteractive" >> Dockerfile + echo "RUN apt-get update && apt-get install -y nodejs" >> Dockerfile + docker build -t $image . + docker images + docker run --rm $image env + + cd - + + - name: Setup extra env + run: | + PATH="$PWD/.github/scripts:$PATH" + echo "PATH=$PATH" >> $GITHUB_ENV + echo "ROOT=$PWD" >> $GITHUB_ENV + echo "TREE_SITTER=tree-sitter.sh" >> $GITHUB_ENV + + export TARGET=${{ matrix.job.target }} + echo "TARGET=$TARGET" >> $GITHUB_ENV + + USE_CROSS="${{ matrix.job.use-cross }}" + + if [ "$USE_CROSS" == "true" ]; then + echo "BUILD_CMD=cross" >> $GITHUB_ENV + + export CROSS=1; echo "CROSS=$CROSS" >> $GITHUB_ENV + + runner=$(cross.sh bash -c "env | sed -nr '/^CARGO_TARGET_.*_RUNNER=/s///p'") + [ -n "$runner" ] && echo "CROSS_RUNNER=$runner" >> $GITHUB_ENV + echo "runner: $runner" + + case "$TARGET" in + i686-unknown-linux-gnu) CC=i686-linux-gnu-gcc AR=i686-linux-gnu-ar ;; + aarch64-unknown-linux-gnu) CC=aarch64-linux-gnu-gcc AR=aarch64-linux-gnu-ar ;; + arm-unknown-linux-gnueabihf) CC=arm-unknown-linux-gnueabihf-gcc AR=arm-unknown-linux-gnueabihf-gcc-ar ;; + esac + + [ -n "$CC" ] && echo "CC=$CC" >> $GITHUB_ENV + [ -n "$AR" ] && echo "AR=$AR" >> $GITHUB_ENV + fi + + case "$TARGET" in + *-windows-*) + echo "RUST_TEST_THREADS=1" >> $GITHUB_ENV # See #2041 tree-sitter issue + ;; + esac + + - name: Build C library + if: "!contains(matrix.job.os, 'windows')" # Requires an additional adapted Makefile for `cl.exe` compiler + run: make.sh CFLAGS="-Werror" -j + + - name: Build wasm 
library + run: script/build-wasm + + - name: Build CLI + run: $BUILD_CMD build --release --target=${{ matrix.job.target }} + + - name: Fetch fixtures + run: script/fetch-fixtures + + - name: Generate fixtures + run: script/generate-fixtures + + - name: Generate WASM fixtures + if: "!matrix.job.use-cross" + run: script/generate-fixtures-wasm + + - name: Run main tests + run: $BUILD_CMD test --target=${{ matrix.job.target }} + + - name: Run wasm tests + if: "!matrix.job.use-cross" # TODO: Install Emscripten into custom cross images + run: script/test-wasm + + - name: Run benchmarks + if: "!matrix.job.use-cross" # It doesn't make sense to benchmark something in an emulator + run: $BUILD_CMD bench benchmark -p tree-sitter-cli --target=${{ matrix.job.target }} + + - name: Upload CLI artifact + uses: actions/upload-artifact@v3 + with: + name: tree-sitter.${{ matrix.job.name }} + path: target/${{ matrix.job.target }}/release/tree-sitter${{ contains(matrix.job.target, 'windows') && '.exe' || '' }} + if-no-files-found: error + retention-days: 7 + + - name: Upload WASM artifacts + if: ${{ matrix.job.name == 'linux-x64' }} + uses: actions/upload-artifact@v3 + with: + name: tree-sitter.wasm + path: | + lib/binding_web/tree-sitter.js + lib/binding_web/tree-sitter.wasm + if-no-files-found: error + retention-days: 7 diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml deleted file mode 100644 index e6ef591a..00000000 --- a/.github/workflows/ci.yml +++ /dev/null @@ -1,150 +0,0 @@ -name: CI - -on: - push: - branches: - - master - tags: - - v* - pull_request: - branches: - - "**" - -env: - CARGO_TERM_COLOR: always - CARGO_INCREMENTAL: 0 - -jobs: - unix-tests: - name: Unix tests - runs-on: ${{ matrix.os }} - strategy: - fail-fast: true - matrix: - os: - - macos-latest - - ubuntu-latest - steps: - - name: Checkout repo - uses: actions/checkout@v3 - - # Work around https://github.com/actions/cache/issues/403. 
- - name: Use GNU tar - if: matrix.os == 'macos-latest' - run: | - echo PATH="/usr/local/opt/gnu-tar/libexec/gnubin:$PATH" >> $GITHUB_ENV - - - name: Read Emscripten version - run: | - printf 'EMSCRIPTEN_VERSION=%s\n' "$(cat cli/emscripten-version)" >> $GITHUB_ENV - - - name: Cache artifacts - id: cache - uses: actions/cache@v3 - with: - path: | - ~/.cargo/registry - ~/.cargo/git - target - key: ${{ runner.os }}-cargo-${{ hashFiles('Cargo.lock') }}-emscripten-${{ env.EMSCRIPTEN_VERSION }} - - - name: Install rust - if: steps.cache.outputs.cache-hit != 'true' - uses: actions-rs/toolchain@v1 - with: - toolchain: stable - profile: minimal - components: rustfmt, clippy - - - name: Check Rust code formatting - run: cargo fmt -- --check - - - name: Install emscripten - uses: mymindstorm/setup-emsdk@v12 - with: - version: ${{ env.EMSCRIPTEN_VERSION }} - - - name: Build C library - run: make - - - name: Build wasm library - run: script/build-wasm - - - name: Build CLI - run: | - RUSTFLAGS="-D warnings" - cargo build --release - - - name: Set up fixture parsers - run: | - script/fetch-fixtures - script/generate-fixtures - script/generate-fixtures-wasm - - - name: Run main tests - run: cargo test - - - name: Run wasm tests - run: script/test-wasm - - - name: Run benchmarks - run: script/benchmark - - - name: Compress CLI binary - if: startsWith(github.ref, 'refs/tags/v') - run: | - cp target/release/tree-sitter . 
- export platform=$(echo ${{ runner.os }} | awk '{print tolower($0)}') - gzip --suffix "-${platform}-x64.gz" tree-sitter - - - name: Release - uses: softprops/action-gh-release@v1 - if: startsWith(github.ref, 'refs/tags/v') - with: - draft: true - files: | - tree-sitter-*.gz - lib/binding_web/tree-sitter.js - lib/binding_web/tree-sitter.wasm - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - - windows-tests: - name: Windows tests - runs-on: windows-latest - steps: - - name: Checkout repo - uses: actions/checkout@v3 - - - name: Cache artifacts - id: cache - uses: actions/cache@v3 - with: - path: | - ~/.cargo/registry - ~/.cargo/git - target - key: ${{ runner.os }}-cargo-${{ hashFiles('Cargo.lock') }} - - - name: Install rust - if: steps.cache.outputs.cache-hit != 'true' - uses: actions-rs/toolchain@v1 - with: - toolchain: stable - profile: minimal - - - name: Check Rust code formatting - run: cargo fmt -- --check - - - name: Build CLI - run: | - $env:RUSTFLAGS="-D warnings" - cargo build --release - - - name: Set up fixture parsers - run: | - script/fetch-fixtures.cmd - script/generate-fixtures.cmd - - - name: Run main tests - run: script/test diff --git a/.github/workflows/fast_checks.yml b/.github/workflows/fast_checks.yml new file mode 100644 index 00000000..ea474799 --- /dev/null +++ b/.github/workflows/fast_checks.yml @@ -0,0 +1,31 @@ +name: Fast checks to fail fast on any simple code issues + +env: + CARGO_TERM_COLOR: always + RUSTFLAGS: "-D warnings" + +on: + workflow_call: + +jobs: + check_rust_formatting: + name: Check Rust formating + runs-on: ubuntu-latest + steps: + + - name: Checkout source code + uses: actions/checkout@v3 + + - name: Run cargo fmt + run: cargo fmt -- --check + + check_c_warnings: + name: Check C warnings + runs-on: ubuntu-latest + steps: + + - name: Checkout source code + uses: actions/checkout@v3 + + - name: Make C library to check that it's able to compile without warnings + run: make -j CFLAGS="-Werror" diff --git 
a/.github/workflows/full_rust_checks.yml b/.github/workflows/full_rust_checks.yml new file mode 100644 index 00000000..2cc5f77d --- /dev/null +++ b/.github/workflows/full_rust_checks.yml @@ -0,0 +1,32 @@ +name: Full Rust codebase checks + +env: + CARGO_TERM_COLOR: always + RUSTFLAGS: "-D warnings" + +on: + workflow_call: + +jobs: + run: + name: Run checks + runs-on: ubuntu-latest + steps: + + - name: Checkout source code + uses: actions/checkout@v3 + + - name: Install rust toolchain + uses: dtolnay/rust-toolchain@master + with: + toolchain: stable + components: clippy, rustfmt + + - name: Run cargo fmt + run: cargo fmt -- --check + + # - name: Run clippy + # run: cargo clippy --all-targets + + - name: Run cargo check + run: cargo check --workspace --examples --tests --benches --bins diff --git a/.github/workflows/msrv.yml b/.github/workflows/msrv.yml new file mode 100644 index 00000000..3697930e --- /dev/null +++ b/.github/workflows/msrv.yml @@ -0,0 +1,42 @@ +name: Minimum supported rust version + +env: + CARGO_TERM_COLOR: always + RUSTFLAGS: "-D warnings" + +on: + workflow_call: + inputs: + package: + description: Target cargo package name + required: true + type: string + + +jobs: + run: + name: Run checks + runs-on: ubuntu-latest + steps: + + - name: Checkout source code + uses: actions/checkout@v3 + + - name: Get the MSRV from the package metadata + id: msrv + run: cargo metadata --no-deps --format-version 1 | jq -r '"version=" + (.packages[] | select(.name == "${{ inputs.package }}").rust_version)' >> $GITHUB_OUTPUT + + - name: Install rust toolchain (v${{ steps.msrv.outputs.version }}) + uses: dtolnay/rust-toolchain@master + with: + toolchain: ${{ steps.msrv.outputs.version }} + components: clippy, rustfmt + + - name: Run cargo fmt + run: cargo fmt -- --check + + # - name: Run clippy (on minimum supported rust version to prevent warnings we can't fix) + # run: cargo clippy --all-targets + + # - name: Run main tests + # run: cargo test diff --git 
a/.github/workflows/publish.yml b/.github/workflows/publish.yml new file mode 100644 index 00000000..e1ad3e05 --- /dev/null +++ b/.github/workflows/publish.yml @@ -0,0 +1,21 @@ +name: Publish to registries + +on: + workflow_call: + +jobs: + crates_io: + name: Publish to Crates.io + runs-on: ubuntu-latest + steps: + - name: Publish packages + run: | + echo "::warning::TODO: add a Crates.io publish logic" + + npm: + name: Publish to npmjs.com + runs-on: ubuntu-latest + steps: + - name: Publish packages + run: | + echo "::warning::TODO: add a npmjs.com publish logic" diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml new file mode 100644 index 00000000..27e969e7 --- /dev/null +++ b/.github/workflows/release.yml @@ -0,0 +1,101 @@ +name: Release + +on: + workflow_call: + inputs: + ref: + default: ${{ github.ref }} + type: string + +jobs: + permissions: + name: Check permissions + runs-on: ubuntu-latest + outputs: + release_allowed: ${{ steps.maintainer.outputs.is_maintainer == 'true' }} + steps: + + - name: Is maintainer + id: maintainer + env: + GH_TOKEN: ${{ github.token }} + repo: ${{ github.repository }} + actor: ${{ github.actor }} + run: | + maintainer=$( + gh api "/repos/${repo}/collaborators" | + jq ".[] | {login, maintainer: .permissions | .maintain} | select(.login == \"${actor}\") | .maintainer" + ); + if [ "$maintainer" == "true" ]; then + echo "@${actor} has maintainer level permissions :rocket:" >> $GITHUB_STEP_SUMMARY; + echo "is_maintainer=true" >> $GITHUB_OUTPUT + fi + + release: + name: Release + needs: permissions + if: needs.permissions.outputs.release_allowed + runs-on: ubuntu-latest + permissions: + contents: write + steps: + + - name: Checkout source code + uses: actions/checkout@v3 + with: + ref: ${{ inputs.ref }} + + - name: Download build artifacts + uses: actions/download-artifact@v3 + with: + path: artifacts + + - name: Display structure of downloaded files + run: ls -lR + working-directory: artifacts + + - name: 
Prepare release artifacts + run: | + mkdir -p target + mv artifacts/tree-sitter.wasm/* target/ + rm -r artifacts/tree-sitter.wasm + for platform in $(cd artifacts; ls); do + exe=$(ls artifacts/$platform/tree-sitter*) + gzip --stdout --name $exe > target/tree-sitter-$platform.gz + done + rm -rf artifacts + ls -l target/ + + - name: Get tag name from a release/v* branch name + id: tag_name + env: + tag: ${{ github.head_ref }} + run: echo "tag=${tag#release/}" >> $GITHUB_OUTPUT + + - name: Add a release tag + env: + ref: ${{ inputs.ref }} + tag: ${{ steps.tag_name.outputs.tag }} + message: "Release ${{ steps.tag_name.outputs.tag }}" + run: | + git config user.name "${GITHUB_ACTOR}" + git config user.email "${GITHUB_ACTOR}@users.noreply.github.com" + git tag -a "$tag" HEAD -m "$message" + git push origin "$tag" + + - name: Create release + uses: softprops/action-gh-release@v1 + with: + name: ${{ steps.tag_name.outputs.tag }} + tag_name: ${{ steps.tag_name.outputs.tag }} + fail_on_unmatched_files: true + files: | + tree-sitter-*.gz + tree-sitter.wasm + tree-sitter.js + + - name: Merge release PR + env: + GH_TOKEN: ${{ github.token }} + run: | + gh pr merge ${{ github.event.pull_request.html_url }} --match-head-commit $(git rev-parse HEAD) --merge --delete-branch diff --git a/Cargo.lock b/Cargo.lock index 404c269f..4b4437e6 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -22,9 +22,9 @@ dependencies = [ [[package]] name = "anyhow" -version = "1.0.69" +version = "1.0.70" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "224afbd727c3d6e4b90103ece64b8d1b67fbb1973b1046c2281eed3f3803f800" +checksum = "7de8ce5e0f9f8d88245311066a578d72b7af3e7088f32783804676302df237e4" [[package]] name = "ascii" @@ -38,7 +38,7 @@ version = "0.2.14" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "d9b39be18770d11421cdb1b9947a45dd3f37e93092cbf377614828a319d5fee8" dependencies = [ - "hermit-abi", + "hermit-abi 0.1.19", "libc", "winapi", ] @@ -128,9 
+128,9 @@ dependencies = [ [[package]] name = "core-foundation-sys" -version = "0.8.3" +version = "0.8.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5827cebf4670468b8772dd191856768aedcb1b0278a04f989f7766351917b9dc" +checksum = "e496a50fda8aacccc86d7529e2c1e0892dbd0f898a6b5645b5561b89c3210efa" [[package]] name = "ctor" @@ -139,7 +139,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "6d2301688392eb071b0bf1a37be05c469d3cc4dbbd95df672fe28ab021e6a096" dependencies = [ "quote", - "syn", + "syn 1.0.109", ] [[package]] @@ -191,13 +191,13 @@ checksum = "7fcaabb2fef8c910e7f4c7ce9f67a1283a1715879a7c230ca9d6d1ae31f16d91" [[package]] name = "errno" -version = "0.2.8" +version = "0.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f639046355ee4f37944e44f60642c6f3a7efa3cf6b78c78a0d989a8ce6c396a1" +checksum = "50d6a0976c999d473fe89ad888d5a284e55366d9dc9038b1ba2aa15128c4afa0" dependencies = [ "errno-dragonfly", "libc", - "winapi", + "windows-sys", ] [[package]] @@ -260,6 +260,12 @@ dependencies = [ "libc", ] +[[package]] +name = "hermit-abi" +version = "0.3.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "fed44880c466736ef9a5c5b5facefb5ed0785676d0c02d612db14e54f0d84286" + [[package]] name = "html-escape" version = "0.2.13" @@ -287,9 +293,9 @@ dependencies = [ [[package]] name = "indexmap" -version = "1.9.2" +version = "1.9.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1885e79c1fc4b10f0e172c475f458b7f7b93061064d98c3293e98c5ba0c8b399" +checksum = "bd070e393353796e801d209ad339e89596eb4c8d430d18ede6a1cced8fafbd99" dependencies = [ "autocfg", "hashbrown", @@ -306,12 +312,13 @@ dependencies = [ [[package]] name = "io-lifetimes" -version = "1.0.6" +version = "1.0.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "cfa919a82ea574332e2de6e74b4c36e74d41982b335080fa59d4ef31be20fdf3" +checksum = 
"09270fd4fa1111bc614ed2246c7ef56239a3063d5be0d1ec3b589c505d400aeb" dependencies = [ + "hermit-abi 0.3.1", "libc", - "windows-sys 0.45.0", + "windows-sys", ] [[package]] @@ -322,16 +329,18 @@ checksum = "453ad9f582a441959e5f0d088b02ce04cfe8d51a8eaf077f12ac6d3e94164ca6" [[package]] name = "jni" -version = "0.20.0" +version = "0.21.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "039022cdf4d7b1cf548d31f60ae783138e5fd42013f6271049d7df7afadef96c" +checksum = "1a87aa2bb7d2af34197c04845522473242e1aa17c12f4935d5856491a7fb8c97" dependencies = [ "cesu8", + "cfg-if", "combine", "jni-sys", "log", "thiserror", "walkdir", + "windows-sys", ] [[package]] @@ -373,9 +382,9 @@ dependencies = [ [[package]] name = "linux-raw-sys" -version = "0.1.4" +version = "0.3.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f051f77a7c8e6957c0696eac88f26b0117e54f52d3fc682ab19397a8812846a4" +checksum = "d59d8c75012853d2e872fb56bc8a2e53718e2cafe1a4c823143141c6d90c322f" [[package]] name = "log" @@ -457,9 +466,9 @@ dependencies = [ [[package]] name = "proc-macro2" -version = "1.0.52" +version = "1.0.56" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1d0e1ae9e836cc3beddd63db0df682593d7e2d3d891ae8c9083d2113e1744224" +checksum = "2b63bdb0cd06f1f4dedf69b254734f9b45af66e4a031e42a7480257d9898b435" dependencies = [ "unicode-ident", ] @@ -471,7 +480,7 @@ dependencies = [ "proc-macro2", "quote", "rand", - "syn", + "syn 1.0.109", ] [[package]] @@ -515,9 +524,9 @@ dependencies = [ [[package]] name = "raw-window-handle" -version = "0.5.1" +version = "0.5.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4f851a03551ceefd30132e447f07f96cb7011d6b658374f3aed847333adb5559" +checksum = "f2ff9a1f06a88b01621b7ae906ef0211290d1c8a168a15542486a8f61c0833b9" [[package]] name = "redox_syscall" @@ -528,6 +537,15 @@ dependencies = [ "bitflags", ] +[[package]] +name = "redox_syscall" +version = "0.3.5" 
+source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "567664f262709473930a4bf9e51bf2ebf3348f2e748ccc50dea20646858f8f29" +dependencies = [ + "bitflags", +] + [[package]] name = "redox_users" version = "0.4.3" @@ -535,15 +553,15 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "b033d837a7cf162d7993aded9304e30a83213c648b6e389db233191f891e5c2b" dependencies = [ "getrandom", - "redox_syscall", + "redox_syscall 0.2.16", "thiserror", ] [[package]] name = "regex" -version = "1.7.1" +version = "1.7.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "48aaa5748ba571fb95cd2c85c09f629215d3a6ece942baa100950af03a34f733" +checksum = "8b1f693b24f6ac912f4893ef08244d70b6067480d2f1a46e950c9691e6749d1d" dependencies = [ "aho-corasick", "memchr", @@ -552,9 +570,9 @@ dependencies = [ [[package]] name = "regex-syntax" -version = "0.6.28" +version = "0.6.29" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "456c603be3e8d448b072f410900c09faf164fbce2d480456f50eea6e25f9c848" +checksum = "f162c6dd7b008981e4d40210aca20b4bd0f9b60ca9271061b07f78537722f2e1" [[package]] name = "rustc-hash" @@ -564,16 +582,16 @@ checksum = "08d43f7aa6b08d49f382cde6a7982047c3426db949b1424bc4b7ec9ae12c6ce2" [[package]] name = "rustix" -version = "0.36.9" +version = "0.37.7" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fd5c6ff11fecd55b40746d1995a02f2eb375bf8c00d192d521ee09f42bef37bc" +checksum = "2aae838e49b3d63e9274e1c01833cc8139d3fec468c3b84688c628f44b1ae11d" dependencies = [ "bitflags", "errno", "io-lifetimes", "libc", "linux-raw-sys", - "windows-sys 0.45.0", + "windows-sys", ] [[package]] @@ -599,29 +617,29 @@ checksum = "bebd363326d05ec3e2f532ab7660680f3b02130d780c299bca73469d521bc0ed" [[package]] name = "serde" -version = "1.0.156" +version = "1.0.159" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"314b5b092c0ade17c00142951e50ced110ec27cea304b1037c6969246c2469a4" +checksum = "3c04e8343c3daeec41f58990b9d77068df31209f2af111e059e9fe9646693065" dependencies = [ "serde_derive", ] [[package]] name = "serde_derive" -version = "1.0.156" +version = "1.0.159" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d7e29c4601e36bcec74a223228dce795f4cd3616341a4af93520ca1a837c087d" +checksum = "4c614d17805b093df4b147b51339e7e44bf05ef59fba1e45d83500bcfb4d8585" dependencies = [ "proc-macro2", "quote", - "syn", + "syn 2.0.13", ] [[package]] name = "serde_json" -version = "1.0.94" +version = "1.0.95" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1c533a59c9d8a93a09c6ab31f0fd5e5f4dd1b8fc9434804029839884765d04ea" +checksum = "d721eca97ac802aa7777b701877c8004d950fc142651367300d21c1cc0194744" dependencies = [ "indexmap", "itoa", @@ -653,16 +671,27 @@ dependencies = [ ] [[package]] -name = "tempfile" -version = "3.4.0" +name = "syn" +version = "2.0.13" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "af18f7ae1acd354b992402e9ec5864359d693cd8a79dcbef59f76891701c1e95" +checksum = "4c9da457c5285ac1f936ebd076af6dac17a61cfe7826f2076b4d015cf47bc8ec" +dependencies = [ + "proc-macro2", + "quote", + "unicode-ident", +] + +[[package]] +name = "tempfile" +version = "3.5.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b9fbec84f381d5795b08656e4912bec604d162bff9291d6189a78f4c8ab87998" dependencies = [ "cfg-if", "fastrand", - "redox_syscall", + "redox_syscall 0.3.5", "rustix", - "windows-sys 0.42.0", + "windows-sys", ] [[package]] @@ -676,22 +705,22 @@ dependencies = [ [[package]] name = "thiserror" -version = "1.0.39" +version = "1.0.40" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a5ab016db510546d856297882807df8da66a16fb8c4101cb8b30054b0d5b2d9c" +checksum = "978c9a314bd8dc99be594bc3c175faaa9794be04a5a5e153caba6915336cebac" dependencies = [ 
"thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.39" +version = "1.0.40" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5420d42e90af0c38c3290abcca25b9b3bdf379fc9f55c528f53a269d9c9a267e" +checksum = "f9456a42c5b0d803c8cd86e73dd7cc9edd429499f37a3550d286d5e86720569f" dependencies = [ "proc-macro2", "quote", - "syn", + "syn 2.0.13", ] [[package]] @@ -827,9 +856,9 @@ dependencies = [ [[package]] name = "unicode-bidi" -version = "0.3.11" +version = "0.3.13" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "524b68aca1d05e03fdf03fcdce2c6c94b6daf6d16861ddaa7e4f2b6638a9052c" +checksum = "92888ba5573ff080736b3648696b70cafad7d250551175acbaa4e0385b3e1460" [[package]] name = "unicode-ident" @@ -883,12 +912,11 @@ checksum = "f1bddf1187be692e79c5ffeab891132dfb0f236ed36a43c7ed39f1165ee20191" [[package]] name = "walkdir" -version = "2.3.2" +version = "2.3.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "808cf2735cd4b6866113f648b791c6adc5714537bc222d9347bb203386ffda56" +checksum = "36df944cda56c7d8d8b7496af378e6b16de9284591917d307c9b4d313c44e698" dependencies = [ "same-file", - "winapi", "winapi-util", ] @@ -919,7 +947,7 @@ dependencies = [ "once_cell", "proc-macro2", "quote", - "syn", + "syn 1.0.109", "wasm-bindgen-shared", ] @@ -941,7 +969,7 @@ checksum = "2aff81306fcac3c7515ad4e177f521b5c9a15f2b08f4e32d823066102f35a5f6" dependencies = [ "proc-macro2", "quote", - "syn", + "syn 1.0.109", "wasm-bindgen-backend", "wasm-bindgen-shared", ] @@ -964,9 +992,9 @@ dependencies = [ [[package]] name = "webbrowser" -version = "0.8.7" +version = "0.8.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "97d1fa1e5c829b2bf9eb1e28fb950248b797cd6a04866fbdfa8bc31e5eef4c78" +checksum = "579cc485bd5ce5bfa0d738e4921dd0b956eca9800be1fd2e5257ebe95bc4617e" dependencies = [ "core-foundation", "dirs 4.0.0", @@ -1021,21 +1049,6 @@ version = "0.4.0" source = 
"registry+https://github.com/rust-lang/crates.io-index" checksum = "712e227841d057c1ee1cd2fb22fa7e5a5461ae8e48fa2ca79ec42cfc1931183f" -[[package]] -name = "windows-sys" -version = "0.42.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5a3e1820f08b8513f676f7ab6c1f99ff312fb97b553d30ff4dd86f9f15728aa7" -dependencies = [ - "windows_aarch64_gnullvm", - "windows_aarch64_msvc", - "windows_i686_gnu", - "windows_i686_msvc", - "windows_x86_64_gnu", - "windows_x86_64_gnullvm", - "windows_x86_64_msvc", -] - [[package]] name = "windows-sys" version = "0.45.0" diff --git a/script/generate-fixtures b/script/generate-fixtures index 85298c46..2c3b178a 100755 --- a/script/generate-fixtures +++ b/script/generate-fixtures @@ -2,12 +2,18 @@ set -e -cargo build --release +root_dir=$PWD + +if [ "$CI" == true ]; then + set -x + tree_sitter="$TREE_SITTER" +else + cargo build --release + tree_sitter=${root_dir}/target/release/tree-sitter +fi filter_grammar_name=$1 -root_dir=$PWD -tree_sitter=${root_dir}/target/release/tree-sitter grammars_dir=${root_dir}/test/fixtures/grammars grammar_files=$(find $grammars_dir -name grammar.js | grep -v node_modules) diff --git a/script/generate-fixtures-wasm b/script/generate-fixtures-wasm index 9d44b58c..4bba56ae 100755 --- a/script/generate-fixtures-wasm +++ b/script/generate-fixtures-wasm @@ -2,7 +2,15 @@ set -e -cargo build --release +root_dir=$PWD + +if [ "$CI" == true ]; then + set -x + tree_sitter="$TREE_SITTER" +else + cargo build --release + tree_sitter=${root_dir}/target/release/tree-sitter +fi build_wasm_args= if [[ $1 == "--docker" ]]; then @@ -12,8 +20,6 @@ fi filter_grammar_name=$1 -root_dir=$PWD -tree_sitter=${root_dir}/target/release/tree-sitter grammars_dir=${root_dir}/test/fixtures/grammars grammar_files=$(find $grammars_dir -name grammar.js | grep -v node_modules) From da894afef59e1aefa23470c7db7445096f8f0e65 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 02:41:42 +0300 Subject: 
[PATCH 061/347] cargo: specify minimum supported Rust version --- Cargo.toml | 5 ++++- cli/Cargo.toml | 1 + cli/config/Cargo.toml | 1 + cli/loader/Cargo.toml | 1 + cli/src/tests/proc_macro/Cargo.toml | 1 + highlight/Cargo.toml | 1 + lib/Cargo.toml | 1 + tags/Cargo.toml | 1 + 8 files changed, 11 insertions(+), 1 deletion(-) diff --git a/Cargo.toml b/Cargo.toml index d1e57f89..f69dbc4f 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -1,7 +1,10 @@ [workspace] default-members = ["cli"] - members = ["cli", "lib"] +resolver = "2" + +[workspace.package] +rust-version = "1.65" [profile.release] strip = true diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 47e03284..f9f8ca4b 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -9,6 +9,7 @@ readme = "README.md" keywords = ["incremental", "parsing"] categories = ["command-line-utilities", "parsing"] repository = "https://github.com/tree-sitter/tree-sitter" +rust-version.workspace = true [[bin]] name = "tree-sitter" diff --git a/cli/config/Cargo.toml b/cli/config/Cargo.toml index ab3808ad..114d6ce8 100644 --- a/cli/config/Cargo.toml +++ b/cli/config/Cargo.toml @@ -9,6 +9,7 @@ readme = "README.md" keywords = ["incremental", "parsing"] categories = ["command-line-utilities", "parsing"] repository = "https://github.com/tree-sitter/tree-sitter" +rust-version.workspace = true [dependencies] anyhow = "1.0" diff --git a/cli/loader/Cargo.toml b/cli/loader/Cargo.toml index 3a665ea9..6af28f30 100644 --- a/cli/loader/Cargo.toml +++ b/cli/loader/Cargo.toml @@ -9,6 +9,7 @@ readme = "README.md" keywords = ["incremental", "parsing"] categories = ["command-line-utilities", "parsing"] repository = "https://github.com/tree-sitter/tree-sitter" +rust-version.workspace = true [dependencies] anyhow = "1.0" diff --git a/cli/src/tests/proc_macro/Cargo.toml b/cli/src/tests/proc_macro/Cargo.toml index a9a2b146..e6900d10 100644 --- a/cli/src/tests/proc_macro/Cargo.toml +++ b/cli/src/tests/proc_macro/Cargo.toml @@ -3,6 +3,7 @@ name = "proc_macro" version = 
"0.1.0" edition = "2021" publish = false +rust-version.workspace = true [lib] proc-macro = true diff --git a/highlight/Cargo.toml b/highlight/Cargo.toml index 0b0de18e..e85ced8e 100644 --- a/highlight/Cargo.toml +++ b/highlight/Cargo.toml @@ -12,6 +12,7 @@ edition = "2018" keywords = ["incremental", "parsing", "syntax", "highlighting"] categories = ["parsing", "text-editors"] repository = "https://github.com/tree-sitter/tree-sitter" +rust-version.workspace = true [lib] crate-type = ["lib", "staticlib"] diff --git a/lib/Cargo.toml b/lib/Cargo.toml index 16fd0254..39e07916 100644 --- a/lib/Cargo.toml +++ b/lib/Cargo.toml @@ -9,6 +9,7 @@ readme = "binding_rust/README.md" keywords = ["incremental", "parsing"] categories = ["api-bindings", "parsing", "text-editors"] repository = "https://github.com/tree-sitter/tree-sitter" +rust-version.workspace = true build = "binding_rust/build.rs" diff --git a/tags/Cargo.toml b/tags/Cargo.toml index d954a573..99d053e8 100644 --- a/tags/Cargo.toml +++ b/tags/Cargo.toml @@ -12,6 +12,7 @@ edition = "2018" keywords = ["incremental", "parsing", "syntax", "tagging"] categories = ["parsing", "text-editors"] repository = "https://github.com/tree-sitter/tree-sitter" +rust-version.workspace = true [lib] crate-type = ["lib", "staticlib"] From 34a83dfe695ff80a9d610df2fcbc1925b037d092 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 03:08:08 +0300 Subject: [PATCH 062/347] cicd: update status badge --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index f3c4abc2..34390187 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # tree-sitter -[![Build Status](https://github.com/tree-sitter/tree-sitter/workflows/CI/badge.svg)](https://github.com/tree-sitter/tree-sitter/actions) +[![CICD](https://github.com/tree-sitter/tree-sitter/actions/workflows/CICD.yml/badge.svg)](https://github.com/tree-sitter/tree-sitter/actions/workflows/CICD.yml) 
[![DOI](https://zenodo.org/badge/14164618.svg)](https://zenodo.org/badge/latestdoi/14164618) Tree-sitter is a parser generator tool and an incremental parsing library. It can build a concrete syntax tree for a source file and efficiently update the syntax tree as the source file is edited. Tree-sitter aims to be: From 404ae5f49adb52fc1d3f2369e0b744c2e4ade2a7 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 05:03:52 +0300 Subject: [PATCH 063/347] cicd: fix bug in release workflow --- .github/workflows/release.yml | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 27e969e7..87a06761 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -59,8 +59,8 @@ jobs: mkdir -p target mv artifacts/tree-sitter.wasm/* target/ rm -r artifacts/tree-sitter.wasm - for platform in $(cd artifacts; ls); do - exe=$(ls artifacts/$platform/tree-sitter*) + for platform in $(cd artifacts; ls | sed 's/^tree-sitter\.//'); do + exe=$(ls artifacts/tree-sitter.$platform/tree-sitter*) gzip --stdout --name $exe > target/tree-sitter-$platform.gz done rm -rf artifacts @@ -90,9 +90,9 @@ jobs: tag_name: ${{ steps.tag_name.outputs.tag }} fail_on_unmatched_files: true files: | - tree-sitter-*.gz - tree-sitter.wasm - tree-sitter.js + target/tree-sitter-*.gz + target/tree-sitter.wasm + target/tree-sitter.js - name: Merge release PR env: From 0c49d6745b3fc4822ab02e0018770cd6383a779c Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 12:10:31 +0300 Subject: [PATCH 064/347] 0.20.8 - recovered --- Cargo.lock | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 4b4437e6..956a3f41 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -366,9 +366,9 @@ checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" [[package]] name = "libc" -version = "0.2.140" +version = "0.2.141" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "99227334921fae1a979cf0bfdfcc6b3e5ce376ef57e16fb6fb3ea2ed6095f80c" +checksum = "3304a64d199bb964be99741b7a14d26972741915b3649639149b2479bb46f4b5" [[package]] name = "libloading" From c1f784498f35f2d69e8b53824e1fd5a5d97eed65 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 03:34:03 +0300 Subject: [PATCH 065/347] chore: nit picking in internal proc_macro crate --- Cargo.lock | 22 +++++++++++----------- cli/Cargo.toml | 2 +- cli/src/tests/proc_macro/Cargo.toml | 4 ++-- cli/src/tests/proc_macro/src/lib.rs | 4 ++-- 4 files changed, 16 insertions(+), 16 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 956a3f41..52013e49 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -473,16 +473,6 @@ dependencies = [ "unicode-ident", ] -[[package]] -name = "proc_macro" -version = "0.1.0" -dependencies = [ - "proc-macro2", - "quote", - "rand", - "syn 1.0.109", -] - [[package]] name = "quote" version = "1.0.26" @@ -785,7 +775,6 @@ dependencies = [ "lazy_static", "log", "pretty_assertions", - "proc_macro", "rand", "regex", "regex-syntax", @@ -802,6 +791,7 @@ dependencies = [ "tree-sitter-highlight", "tree-sitter-loader", "tree-sitter-tags", + "tree-sitter-tests-proc-macro", "unindent", "walkdir", "webbrowser", @@ -854,6 +844,16 @@ dependencies = [ "tree-sitter", ] +[[package]] +name = "tree-sitter-tests-proc-macro" +version = "0.0.0" +dependencies = [ + "proc-macro2", + "quote", + "rand", + "syn 1.0.109", +] + [[package]] name = "unicode-bidi" version = "0.3.13" diff --git a/cli/Cargo.toml b/cli/Cargo.toml index f9f8ca4b..48473095 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -70,7 +70,7 @@ version = "0.4.6" features = ["std"] [dev-dependencies] -proc_macro = { path = "src/tests/proc_macro" } +proc_macro = { path = "src/tests/proc_macro", package = "tree-sitter-tests-proc-macro" } rand = "0.8" tempfile = "3" diff --git a/cli/src/tests/proc_macro/Cargo.toml b/cli/src/tests/proc_macro/Cargo.toml 
index e6900d10..9db4025b 100644 --- a/cli/src/tests/proc_macro/Cargo.toml +++ b/cli/src/tests/proc_macro/Cargo.toml @@ -1,6 +1,6 @@ [package] -name = "proc_macro" -version = "0.1.0" +name = "tree-sitter-tests-proc-macro" +version = "0.0.0" edition = "2021" publish = false rust-version.workspace = true diff --git a/cli/src/tests/proc_macro/src/lib.rs b/cli/src/tests/proc_macro/src/lib.rs index d831a75b..4d92479f 100644 --- a/cli/src/tests/proc_macro/src/lib.rs +++ b/cli/src/tests/proc_macro/src/lib.rs @@ -82,8 +82,8 @@ pub fn test_with_seed(args: TokenStream, input: TokenStream) -> TokenStream { } Ok(Args { - retry: retry.expect("`retry` parameter is requred"), - seed: seed.expect("`initial_seed` parameter is required"), + retry: retry.expect("`retry` parameter is required"), + seed: seed.expect("`seed` parameter is required"), seed_fn, }) } From 3d396e120b6cd574cdfbaf72a6cd0d14ae79bf38 Mon Sep 17 00:00:00 2001 From: Vhyrro Date: Mon, 13 Mar 2023 18:52:39 +0100 Subject: [PATCH 066/347] feat(rust_bindings): provide `into_raw()` functions for treesitter structs --- lib/binding_rust/lib.rs | 42 +++++++++++++++++++++++++++++++++++++++-- 1 file changed, 40 insertions(+), 2 deletions(-) diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 579bf8e2..568bad25 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -1,4 +1,4 @@ -mod ffi; +pub mod ffi; mod util; #[cfg(unix)] @@ -9,7 +9,7 @@ use std::{ ffi::CStr, fmt, hash, iter, marker::PhantomData, - mem::MaybeUninit, + mem::{ManuallyDrop, MaybeUninit}, ops, os::raw::{c_char, c_void}, ptr::{self, NonNull}, @@ -334,6 +334,11 @@ impl Language { Some(id) } } + + /// Consumes the [Language], returning a raw pointer to the underlying C structure. 
+ pub fn into_raw(self) -> *const ffi::TSLanguage { + self.0 + } } impl Parser { @@ -691,6 +696,14 @@ impl Parser { ffi::ts_parser_set_cancellation_flag(self.0.as_ptr(), ptr::null()); } } + + /// Consumes the [Parser], returning a raw pointer to the underlying C structure. + pub fn into_raw(mut self) -> *mut ffi::TSParser { + self.stop_printing_dot_graphs(); + self.set_logger(None); + + ManuallyDrop::new(self).0.as_ptr() + } } impl Drop for Parser { @@ -785,6 +798,11 @@ impl Tree { let fd = file.as_raw_fd(); unsafe { ffi::ts_tree_print_dot_graph(self.0.as_ptr(), fd) } } + + /// Consumes the [Tree], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut ffi::TSTree { + ManuallyDrop::new(self).0.as_ptr() + } } impl fmt::Debug for Tree { @@ -1190,6 +1208,11 @@ impl<'tree> Node<'tree> { let edit = edit.into(); unsafe { ffi::ts_node_edit(&mut self.0 as *mut ffi::TSNode, &edit) } } + + /// Consumes the [Node], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut ffi::TSNode { + &mut ManuallyDrop::new(self).0 + } } impl<'a> PartialEq for Node<'a> { @@ -1324,6 +1347,11 @@ impl<'a> TreeCursor<'a> { pub fn reset(&mut self, node: Node<'a>) { unsafe { ffi::ts_tree_cursor_reset(&mut self.0, node.0) }; } + + /// Consumes the [TreeCursor], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut ffi::TSTreeCursor { + &mut ManuallyDrop::new(self).0 + } } impl<'a> Clone for TreeCursor<'a> { @@ -1819,6 +1847,11 @@ impl Query { )); } } + + /// Consumes the [Query], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut ffi::TSQuery { + ManuallyDrop::new(self).ptr.as_ptr() + } } impl QueryCursor { @@ -1926,6 +1959,11 @@ impl QueryCursor { } self } + + /// Consumes the [QueryCursor], returning a raw pointer to the underlying C structure. 
+ pub fn into_raw(self) -> *mut ffi::TSQueryCursor { + ManuallyDrop::new(self).ptr.as_ptr() + } } impl<'a, 'tree> QueryMatch<'a, 'tree> { From 576e4c7d0682103870acee87075716f424f71d90 Mon Sep 17 00:00:00 2001 From: Vhyrro Date: Mon, 13 Mar 2023 19:06:12 +0100 Subject: [PATCH 067/347] fix(rust_bindings): use-after-free for `Language::into_raw()` --- lib/binding_rust/lib.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 568bad25..16e3cd4b 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -337,7 +337,7 @@ impl Language { /// Consumes the [Language], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *const ffi::TSLanguage { - self.0 + ManuallyDrop::new(self).0 } } From 6c2957c8d3c5311f30b3468f55fbb2573ce1c9ff Mon Sep 17 00:00:00 2001 From: Vhyrro Date: Tue, 14 Mar 2023 19:34:18 +0100 Subject: [PATCH 068/347] ref(rust_bindings): move `into_raw()` functions into the `ffi` module --- lib/binding_rust/ffi.rs | 55 +++++++++++++++++++++++++++++++++++++++++ lib/binding_rust/lib.rs | 40 +----------------------------- 2 files changed, 56 insertions(+), 39 deletions(-) diff --git a/lib/binding_rust/ffi.rs b/lib/binding_rust/ffi.rs index 685ed765..9f900c35 100644 --- a/lib/binding_rust/ffi.rs +++ b/lib/binding_rust/ffi.rs @@ -7,3 +7,58 @@ include!("./bindings.rs"); extern "C" { pub(crate) fn dup(fd: std::os::raw::c_int) -> std::os::raw::c_int; } + +use crate::{Language, Node, Parser, Query, QueryCursor, Tree, TreeCursor}; +use std::mem::ManuallyDrop; + +impl Language { + /// Consumes the [Language], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *const TSLanguage { + ManuallyDrop::new(self).0 + } +} + +impl Parser { + /// Consumes the [Parser], returning a raw pointer to the underlying C structure. 
+ pub fn into_raw(mut self) -> *mut TSParser { + self.stop_printing_dot_graphs(); + self.set_logger(None); + + ManuallyDrop::new(self).0.as_ptr() + } +} + +impl Tree { + /// Consumes the [Tree], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut TSTree { + ManuallyDrop::new(self).0.as_ptr() + } +} + +impl<'tree> Node<'tree> { + /// Consumes the [Node], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut TSNode { + &mut ManuallyDrop::new(self).0 + } +} + +impl<'a> TreeCursor<'a> { + /// Consumes the [TreeCursor], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut TSTreeCursor { + &mut ManuallyDrop::new(self).0 + } +} + +impl Query { + /// Consumes the [Query], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut TSQuery { + ManuallyDrop::new(self).ptr.as_ptr() + } +} + +impl QueryCursor { + /// Consumes the [QueryCursor], returning a raw pointer to the underlying C structure. + pub fn into_raw(self) -> *mut TSQueryCursor { + ManuallyDrop::new(self).ptr.as_ptr() + } +} diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 16e3cd4b..3746bcdd 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -9,7 +9,7 @@ use std::{ ffi::CStr, fmt, hash, iter, marker::PhantomData, - mem::{ManuallyDrop, MaybeUninit}, + mem::MaybeUninit, ops, os::raw::{c_char, c_void}, ptr::{self, NonNull}, @@ -334,11 +334,6 @@ impl Language { Some(id) } } - - /// Consumes the [Language], returning a raw pointer to the underlying C structure. - pub fn into_raw(self) -> *const ffi::TSLanguage { - ManuallyDrop::new(self).0 - } } impl Parser { @@ -696,14 +691,6 @@ impl Parser { ffi::ts_parser_set_cancellation_flag(self.0.as_ptr(), ptr::null()); } } - - /// Consumes the [Parser], returning a raw pointer to the underlying C structure. 
- pub fn into_raw(mut self) -> *mut ffi::TSParser { - self.stop_printing_dot_graphs(); - self.set_logger(None); - - ManuallyDrop::new(self).0.as_ptr() - } } impl Drop for Parser { @@ -798,11 +785,6 @@ impl Tree { let fd = file.as_raw_fd(); unsafe { ffi::ts_tree_print_dot_graph(self.0.as_ptr(), fd) } } - - /// Consumes the [Tree], returning a raw pointer to the underlying C structure. - pub fn into_raw(self) -> *mut ffi::TSTree { - ManuallyDrop::new(self).0.as_ptr() - } } impl fmt::Debug for Tree { @@ -1208,11 +1190,6 @@ impl<'tree> Node<'tree> { let edit = edit.into(); unsafe { ffi::ts_node_edit(&mut self.0 as *mut ffi::TSNode, &edit) } } - - /// Consumes the [Node], returning a raw pointer to the underlying C structure. - pub fn into_raw(self) -> *mut ffi::TSNode { - &mut ManuallyDrop::new(self).0 - } } impl<'a> PartialEq for Node<'a> { @@ -1347,11 +1324,6 @@ impl<'a> TreeCursor<'a> { pub fn reset(&mut self, node: Node<'a>) { unsafe { ffi::ts_tree_cursor_reset(&mut self.0, node.0) }; } - - /// Consumes the [TreeCursor], returning a raw pointer to the underlying C structure. - pub fn into_raw(self) -> *mut ffi::TSTreeCursor { - &mut ManuallyDrop::new(self).0 - } } impl<'a> Clone for TreeCursor<'a> { @@ -1847,11 +1819,6 @@ impl Query { )); } } - - /// Consumes the [Query], returning a raw pointer to the underlying C structure. - pub fn into_raw(self) -> *mut ffi::TSQuery { - ManuallyDrop::new(self).ptr.as_ptr() - } } impl QueryCursor { @@ -1959,11 +1926,6 @@ impl QueryCursor { } self } - - /// Consumes the [QueryCursor], returning a raw pointer to the underlying C structure. 
- pub fn into_raw(self) -> *mut ffi::TSQueryCursor { - ManuallyDrop::new(self).ptr.as_ptr() - } } impl<'a, 'tree> QueryMatch<'a, 'tree> { From e5357dc5adfecb94923e6a2a0a2d7170eb647cc2 Mon Sep 17 00:00:00 2001 From: Vhyrro Date: Tue, 14 Mar 2023 21:32:48 +0100 Subject: [PATCH 069/347] ref(rust_bindings): add `from_raw()` functions --- lib/binding_rust/ffi.rs | 282 +++++++++++++++++++++++++++++++++++++++- lib/binding_rust/lib.rs | 214 +----------------------------- 2 files changed, 282 insertions(+), 214 deletions(-) diff --git a/lib/binding_rust/ffi.rs b/lib/binding_rust/ffi.rs index 9f900c35..804c1cfc 100644 --- a/lib/binding_rust/ffi.rs +++ b/lib/binding_rust/ffi.rs @@ -8,10 +8,22 @@ extern "C" { pub(crate) fn dup(fd: std::os::raw::c_int) -> std::os::raw::c_int; } -use crate::{Language, Node, Parser, Query, QueryCursor, Tree, TreeCursor}; -use std::mem::ManuallyDrop; +use crate::{ + predicate_error, Language, Node, Parser, Query, QueryCursor, QueryError, QueryPredicate, + QueryPredicateArg, TextPredicate, Tree, TreeCursor, +}; +use std::{marker::PhantomData, mem::ManuallyDrop, ptr::NonNull, slice, str}; impl Language { + /// Reconstructs a [Language] from a raw pointer. + /// + /// # Safety + /// + /// `ptr` must be non-null. + pub unsafe fn from_raw(ptr: *mut TSLanguage) -> Language { + Language(ptr) + } + /// Consumes the [Language], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *const TSLanguage { ManuallyDrop::new(self).0 @@ -19,6 +31,15 @@ impl Language { } impl Parser { + /// Reconstructs a [Parser] from a raw pointer. + /// + /// # Safety + /// + /// `ptr` must be non-null. + pub unsafe fn from_raw(ptr: *mut TSParser) -> Parser { + Parser(NonNull::new_unchecked(ptr)) + } + /// Consumes the [Parser], returning a raw pointer to the underlying C structure. pub fn into_raw(mut self) -> *mut TSParser { self.stop_printing_dot_graphs(); @@ -29,6 +50,15 @@ impl Parser { } impl Tree { + /// Reconstructs a [Tree] from a raw pointer. 
+ /// + /// # Safety + /// + /// `ptr` must be non-null. + pub unsafe fn from_raw(ptr: *mut TSTree) -> Tree { + Tree(NonNull::new_unchecked(ptr)) + } + /// Consumes the [Tree], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSTree { ManuallyDrop::new(self).0.as_ptr() @@ -36,6 +66,15 @@ impl Tree { } impl<'tree> Node<'tree> { + /// Reconstructs a [Node] from a raw pointer. + /// + /// # Safety + /// + /// `ptr` must be non-null. + pub unsafe fn from_raw(ptr: *mut TSNode) -> Node<'tree> { + Node(*ptr, PhantomData) + } + /// Consumes the [Node], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSNode { &mut ManuallyDrop::new(self).0 @@ -43,6 +82,15 @@ impl<'tree> Node<'tree> { } impl<'a> TreeCursor<'a> { + /// Reconstructs a [TreeCursor] from a raw pointer. + /// + /// # Safety + /// + /// `ptr` must be non-null. + pub unsafe fn from_raw(ptr: *mut TSTreeCursor) -> TreeCursor<'a> { + TreeCursor(*ptr, PhantomData) + } + /// Consumes the [TreeCursor], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSTreeCursor { &mut ManuallyDrop::new(self).0 @@ -50,6 +98,225 @@ impl<'a> TreeCursor<'a> { } impl Query { + /// Reconstructs a [Query] from a raw pointer. + /// + /// # Safety + /// + /// `ptr` must be non-null. 
+ pub unsafe fn from_raw(ptr: *mut TSQuery, source: &str) -> Result { + let string_count = unsafe { ts_query_string_count(ptr) }; + let capture_count = unsafe { ts_query_capture_count(ptr) }; + let pattern_count = unsafe { ts_query_pattern_count(ptr) as usize }; + let mut result = Query { + ptr: unsafe { NonNull::new_unchecked(ptr) }, + capture_names: Vec::with_capacity(capture_count as usize), + capture_quantifiers: Vec::with_capacity(pattern_count as usize), + text_predicates: Vec::with_capacity(pattern_count), + property_predicates: Vec::with_capacity(pattern_count), + property_settings: Vec::with_capacity(pattern_count), + general_predicates: Vec::with_capacity(pattern_count), + }; + + // Build a vector of strings to store the capture names. + for i in 0..capture_count { + unsafe { + let mut length = 0u32; + let name = + ts_query_capture_name_for_id(ptr, i, &mut length as *mut u32) as *const u8; + let name = slice::from_raw_parts(name, length as usize); + let name = str::from_utf8_unchecked(name); + result.capture_names.push(name.to_string()); + } + } + + // Build a vector to store capture qunatifiers. + for i in 0..pattern_count { + let mut capture_quantifiers = Vec::with_capacity(capture_count as usize); + for j in 0..capture_count { + unsafe { + let quantifier = ts_query_capture_quantifier_for_id(ptr, i as u32, j); + capture_quantifiers.push(quantifier.into()); + } + } + result.capture_quantifiers.push(capture_quantifiers); + } + + // Build a vector of strings to represent literal values used in predicates. + let string_values = (0..string_count) + .map(|i| unsafe { + let mut length = 0u32; + let value = ts_query_string_value_for_id(ptr, i as u32, &mut length as *mut u32) + as *const u8; + let value = slice::from_raw_parts(value, length as usize); + let value = str::from_utf8_unchecked(value); + value.to_string() + }) + .collect::>(); + + // Build a vector of predicates for each pattern. 
+ for i in 0..pattern_count { + let predicate_steps = unsafe { + let mut length = 0u32; + let raw_predicates = + ts_query_predicates_for_pattern(ptr, i as u32, &mut length as *mut u32); + if length > 0 { + slice::from_raw_parts(raw_predicates, length as usize) + } else { + &[] + } + }; + + let byte_offset = unsafe { ts_query_start_byte_for_pattern(ptr, i as u32) }; + let row = source + .char_indices() + .take_while(|(i, _)| *i < byte_offset as usize) + .filter(|(_, c)| *c == '\n') + .count(); + + let type_done = TSQueryPredicateStepType_TSQueryPredicateStepTypeDone; + let type_capture = TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture; + let type_string = TSQueryPredicateStepType_TSQueryPredicateStepTypeString; + + let mut text_predicates = Vec::new(); + let mut property_predicates = Vec::new(); + let mut property_settings = Vec::new(); + let mut general_predicates = Vec::new(); + for p in predicate_steps.split(|s| s.type_ == type_done) { + if p.is_empty() { + continue; + } + + if p[0].type_ != type_string { + return Err(predicate_error( + row, + format!( + "Expected predicate to start with a function name. Got @{}.", + result.capture_names[p[0].value_id as usize], + ), + )); + } + + // Build a predicate for each of the known predicate function names. + let operator_name = &string_values[p[0].value_id as usize]; + match operator_name.as_str() { + "eq?" | "not-eq?" => { + if p.len() != 3 { + return Err(predicate_error( + row, + format!( + "Wrong number of arguments to #eq? predicate. Expected 2, got {}.", + p.len() - 1 + ), + )); + } + if p[1].type_ != type_capture { + return Err(predicate_error(row, format!( + "First argument to #eq? predicate must be a capture name. 
Got literal \"{}\".", + string_values[p[1].value_id as usize], + ))); + } + + let is_positive = operator_name == "eq?"; + text_predicates.push(if p[2].type_ == type_capture { + TextPredicate::CaptureEqCapture( + p[1].value_id, + p[2].value_id, + is_positive, + ) + } else { + TextPredicate::CaptureEqString( + p[1].value_id, + string_values[p[2].value_id as usize].clone(), + is_positive, + ) + }); + } + + "match?" | "not-match?" => { + if p.len() != 3 { + return Err(predicate_error(row, format!( + "Wrong number of arguments to #match? predicate. Expected 2, got {}.", + p.len() - 1 + ))); + } + if p[1].type_ != type_capture { + return Err(predicate_error(row, format!( + "First argument to #match? predicate must be a capture name. Got literal \"{}\".", + string_values[p[1].value_id as usize], + ))); + } + if p[2].type_ == type_capture { + return Err(predicate_error(row, format!( + "Second argument to #match? predicate must be a literal. Got capture @{}.", + result.capture_names[p[2].value_id as usize], + ))); + } + + let is_positive = operator_name == "match?"; + let regex = &string_values[p[2].value_id as usize]; + text_predicates.push(TextPredicate::CaptureMatchString( + p[1].value_id, + regex::bytes::Regex::new(regex).map_err(|_| { + predicate_error(row, format!("Invalid regex '{}'", regex)) + })?, + is_positive, + )); + } + + "set!" => property_settings.push(Self::parse_property( + row, + &operator_name, + &result.capture_names, + &string_values, + &p[1..], + )?), + + "is?" | "is-not?" => property_predicates.push(( + Self::parse_property( + row, + &operator_name, + &result.capture_names, + &string_values, + &p[1..], + )?, + operator_name == "is?", + )), + + _ => general_predicates.push(QueryPredicate { + operator: operator_name.clone().into_boxed_str(), + args: p[1..] 
+ .iter() + .map(|a| { + if a.type_ == type_capture { + QueryPredicateArg::Capture(a.value_id) + } else { + QueryPredicateArg::String( + string_values[a.value_id as usize].clone().into_boxed_str(), + ) + } + }) + .collect(), + }), + } + } + + result + .text_predicates + .push(text_predicates.into_boxed_slice()); + result + .property_predicates + .push(property_predicates.into_boxed_slice()); + result + .property_settings + .push(property_settings.into_boxed_slice()); + result + .general_predicates + .push(general_predicates.into_boxed_slice()); + } + + Ok(result) + } + /// Consumes the [Query], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSQuery { ManuallyDrop::new(self).ptr.as_ptr() @@ -57,6 +324,17 @@ impl Query { } impl QueryCursor { + /// Reconstructs a [QueryCursor] from a raw pointer. + /// + /// # Safety + /// + /// `ptr` must be non-null. + pub unsafe fn from_raw(ptr: *mut TSQueryCursor) -> QueryCursor { + QueryCursor { + ptr: NonNull::new_unchecked(ptr), + } + } + /// Consumes the [QueryCursor], returning a raw pointer to the underlying C structure. 
pub fn into_raw(self) -> *mut TSQueryCursor { ManuallyDrop::new(self).ptr.as_ptr() diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 3746bcdd..c2a0ead0 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -1434,217 +1434,7 @@ impl Query { }); } - let string_count = unsafe { ffi::ts_query_string_count(ptr) }; - let capture_count = unsafe { ffi::ts_query_capture_count(ptr) }; - let pattern_count = unsafe { ffi::ts_query_pattern_count(ptr) as usize }; - let mut result = Query { - ptr: unsafe { NonNull::new_unchecked(ptr) }, - capture_names: Vec::with_capacity(capture_count as usize), - capture_quantifiers: Vec::with_capacity(pattern_count as usize), - text_predicates: Vec::with_capacity(pattern_count), - property_predicates: Vec::with_capacity(pattern_count), - property_settings: Vec::with_capacity(pattern_count), - general_predicates: Vec::with_capacity(pattern_count), - }; - - // Build a vector of strings to store the capture names. - for i in 0..capture_count { - unsafe { - let mut length = 0u32; - let name = - ffi::ts_query_capture_name_for_id(ptr, i, &mut length as *mut u32) as *const u8; - let name = slice::from_raw_parts(name, length as usize); - let name = str::from_utf8_unchecked(name); - result.capture_names.push(name.to_string()); - } - } - - // Build a vector to store capture qunatifiers. - for i in 0..pattern_count { - let mut capture_quantifiers = Vec::with_capacity(capture_count as usize); - for j in 0..capture_count { - unsafe { - let quantifier = ffi::ts_query_capture_quantifier_for_id(ptr, i as u32, j); - capture_quantifiers.push(quantifier.into()); - } - } - result.capture_quantifiers.push(capture_quantifiers); - } - - // Build a vector of strings to represent literal values used in predicates. 
- let string_values = (0..string_count) - .map(|i| unsafe { - let mut length = 0u32; - let value = - ffi::ts_query_string_value_for_id(ptr, i as u32, &mut length as *mut u32) - as *const u8; - let value = slice::from_raw_parts(value, length as usize); - let value = str::from_utf8_unchecked(value); - value.to_string() - }) - .collect::>(); - - // Build a vector of predicates for each pattern. - for i in 0..pattern_count { - let predicate_steps = unsafe { - let mut length = 0u32; - let raw_predicates = - ffi::ts_query_predicates_for_pattern(ptr, i as u32, &mut length as *mut u32); - if length > 0 { - slice::from_raw_parts(raw_predicates, length as usize) - } else { - &[] - } - }; - - let byte_offset = unsafe { ffi::ts_query_start_byte_for_pattern(ptr, i as u32) }; - let row = source - .char_indices() - .take_while(|(i, _)| *i < byte_offset as usize) - .filter(|(_, c)| *c == '\n') - .count(); - - let type_done = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeDone; - let type_capture = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture; - let type_string = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeString; - - let mut text_predicates = Vec::new(); - let mut property_predicates = Vec::new(); - let mut property_settings = Vec::new(); - let mut general_predicates = Vec::new(); - for p in predicate_steps.split(|s| s.type_ == type_done) { - if p.is_empty() { - continue; - } - - if p[0].type_ != type_string { - return Err(predicate_error( - row, - format!( - "Expected predicate to start with a function name. Got @{}.", - result.capture_names[p[0].value_id as usize], - ), - )); - } - - // Build a predicate for each of the known predicate function names. - let operator_name = &string_values[p[0].value_id as usize]; - match operator_name.as_str() { - "eq?" | "not-eq?" => { - if p.len() != 3 { - return Err(predicate_error( - row, - format!( - "Wrong number of arguments to #eq? predicate. 
Expected 2, got {}.", - p.len() - 1 - ), - )); - } - if p[1].type_ != type_capture { - return Err(predicate_error(row, format!( - "First argument to #eq? predicate must be a capture name. Got literal \"{}\".", - string_values[p[1].value_id as usize], - ))); - } - - let is_positive = operator_name == "eq?"; - text_predicates.push(if p[2].type_ == type_capture { - TextPredicate::CaptureEqCapture( - p[1].value_id, - p[2].value_id, - is_positive, - ) - } else { - TextPredicate::CaptureEqString( - p[1].value_id, - string_values[p[2].value_id as usize].clone(), - is_positive, - ) - }); - } - - "match?" | "not-match?" => { - if p.len() != 3 { - return Err(predicate_error(row, format!( - "Wrong number of arguments to #match? predicate. Expected 2, got {}.", - p.len() - 1 - ))); - } - if p[1].type_ != type_capture { - return Err(predicate_error(row, format!( - "First argument to #match? predicate must be a capture name. Got literal \"{}\".", - string_values[p[1].value_id as usize], - ))); - } - if p[2].type_ == type_capture { - return Err(predicate_error(row, format!( - "Second argument to #match? predicate must be a literal. Got capture @{}.", - result.capture_names[p[2].value_id as usize], - ))); - } - - let is_positive = operator_name == "match?"; - let regex = &string_values[p[2].value_id as usize]; - text_predicates.push(TextPredicate::CaptureMatchString( - p[1].value_id, - regex::bytes::Regex::new(regex).map_err(|_| { - predicate_error(row, format!("Invalid regex '{}'", regex)) - })?, - is_positive, - )); - } - - "set!" => property_settings.push(Self::parse_property( - row, - &operator_name, - &result.capture_names, - &string_values, - &p[1..], - )?), - - "is?" | "is-not?" => property_predicates.push(( - Self::parse_property( - row, - &operator_name, - &result.capture_names, - &string_values, - &p[1..], - )?, - operator_name == "is?", - )), - - _ => general_predicates.push(QueryPredicate { - operator: operator_name.clone().into_boxed_str(), - args: p[1..] 
- .iter() - .map(|a| { - if a.type_ == type_capture { - QueryPredicateArg::Capture(a.value_id) - } else { - QueryPredicateArg::String( - string_values[a.value_id as usize].clone().into_boxed_str(), - ) - } - }) - .collect(), - }), - } - } - - result - .text_predicates - .push(text_predicates.into_boxed_slice()); - result - .property_predicates - .push(property_predicates.into_boxed_slice()); - result - .property_settings - .push(property_settings.into_boxed_slice()); - result - .general_predicates - .push(general_predicates.into_boxed_slice()); - } - Ok(result) + unsafe { Query::from_raw(ptr, source) } } /// Get the byte offset where the given pattern starts in the query's source. @@ -2291,7 +2081,7 @@ impl<'a> Iterator for LossyUtf8<'a> { } } -fn predicate_error(row: usize, message: String) -> QueryError { +pub(crate) fn predicate_error(row: usize, message: String) -> QueryError { QueryError { kind: QueryErrorKind::Predicate, row, From d56506b72714d0f57814866e670ccf0440e48d86 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 15 Mar 2023 11:24:53 +0200 Subject: [PATCH 070/347] ref(rust_bindings): keep Query construction logic in a one place --- lib/binding_rust/ffi.rs | 219 +-------------------------------------- lib/binding_rust/lib.rs | 220 +++++++++++++++++++++++++++++++++++++++- 2 files changed, 221 insertions(+), 218 deletions(-) diff --git a/lib/binding_rust/ffi.rs b/lib/binding_rust/ffi.rs index 804c1cfc..53032db3 100644 --- a/lib/binding_rust/ffi.rs +++ b/lib/binding_rust/ffi.rs @@ -8,11 +8,8 @@ extern "C" { pub(crate) fn dup(fd: std::os::raw::c_int) -> std::os::raw::c_int; } -use crate::{ - predicate_error, Language, Node, Parser, Query, QueryCursor, QueryError, QueryPredicate, - QueryPredicateArg, TextPredicate, Tree, TreeCursor, -}; -use std::{marker::PhantomData, mem::ManuallyDrop, ptr::NonNull, slice, str}; +use crate::{Language, Node, Parser, Query, QueryCursor, QueryError, Tree, TreeCursor}; +use std::{marker::PhantomData, mem::ManuallyDrop, 
ptr::NonNull, str}; impl Language { /// Reconstructs a [Language] from a raw pointer. @@ -104,217 +101,7 @@ impl Query { /// /// `ptr` must be non-null. pub unsafe fn from_raw(ptr: *mut TSQuery, source: &str) -> Result { - let string_count = unsafe { ts_query_string_count(ptr) }; - let capture_count = unsafe { ts_query_capture_count(ptr) }; - let pattern_count = unsafe { ts_query_pattern_count(ptr) as usize }; - let mut result = Query { - ptr: unsafe { NonNull::new_unchecked(ptr) }, - capture_names: Vec::with_capacity(capture_count as usize), - capture_quantifiers: Vec::with_capacity(pattern_count as usize), - text_predicates: Vec::with_capacity(pattern_count), - property_predicates: Vec::with_capacity(pattern_count), - property_settings: Vec::with_capacity(pattern_count), - general_predicates: Vec::with_capacity(pattern_count), - }; - - // Build a vector of strings to store the capture names. - for i in 0..capture_count { - unsafe { - let mut length = 0u32; - let name = - ts_query_capture_name_for_id(ptr, i, &mut length as *mut u32) as *const u8; - let name = slice::from_raw_parts(name, length as usize); - let name = str::from_utf8_unchecked(name); - result.capture_names.push(name.to_string()); - } - } - - // Build a vector to store capture qunatifiers. - for i in 0..pattern_count { - let mut capture_quantifiers = Vec::with_capacity(capture_count as usize); - for j in 0..capture_count { - unsafe { - let quantifier = ts_query_capture_quantifier_for_id(ptr, i as u32, j); - capture_quantifiers.push(quantifier.into()); - } - } - result.capture_quantifiers.push(capture_quantifiers); - } - - // Build a vector of strings to represent literal values used in predicates. 
- let string_values = (0..string_count) - .map(|i| unsafe { - let mut length = 0u32; - let value = ts_query_string_value_for_id(ptr, i as u32, &mut length as *mut u32) - as *const u8; - let value = slice::from_raw_parts(value, length as usize); - let value = str::from_utf8_unchecked(value); - value.to_string() - }) - .collect::>(); - - // Build a vector of predicates for each pattern. - for i in 0..pattern_count { - let predicate_steps = unsafe { - let mut length = 0u32; - let raw_predicates = - ts_query_predicates_for_pattern(ptr, i as u32, &mut length as *mut u32); - if length > 0 { - slice::from_raw_parts(raw_predicates, length as usize) - } else { - &[] - } - }; - - let byte_offset = unsafe { ts_query_start_byte_for_pattern(ptr, i as u32) }; - let row = source - .char_indices() - .take_while(|(i, _)| *i < byte_offset as usize) - .filter(|(_, c)| *c == '\n') - .count(); - - let type_done = TSQueryPredicateStepType_TSQueryPredicateStepTypeDone; - let type_capture = TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture; - let type_string = TSQueryPredicateStepType_TSQueryPredicateStepTypeString; - - let mut text_predicates = Vec::new(); - let mut property_predicates = Vec::new(); - let mut property_settings = Vec::new(); - let mut general_predicates = Vec::new(); - for p in predicate_steps.split(|s| s.type_ == type_done) { - if p.is_empty() { - continue; - } - - if p[0].type_ != type_string { - return Err(predicate_error( - row, - format!( - "Expected predicate to start with a function name. Got @{}.", - result.capture_names[p[0].value_id as usize], - ), - )); - } - - // Build a predicate for each of the known predicate function names. - let operator_name = &string_values[p[0].value_id as usize]; - match operator_name.as_str() { - "eq?" | "not-eq?" => { - if p.len() != 3 { - return Err(predicate_error( - row, - format!( - "Wrong number of arguments to #eq? predicate. 
Expected 2, got {}.", - p.len() - 1 - ), - )); - } - if p[1].type_ != type_capture { - return Err(predicate_error(row, format!( - "First argument to #eq? predicate must be a capture name. Got literal \"{}\".", - string_values[p[1].value_id as usize], - ))); - } - - let is_positive = operator_name == "eq?"; - text_predicates.push(if p[2].type_ == type_capture { - TextPredicate::CaptureEqCapture( - p[1].value_id, - p[2].value_id, - is_positive, - ) - } else { - TextPredicate::CaptureEqString( - p[1].value_id, - string_values[p[2].value_id as usize].clone(), - is_positive, - ) - }); - } - - "match?" | "not-match?" => { - if p.len() != 3 { - return Err(predicate_error(row, format!( - "Wrong number of arguments to #match? predicate. Expected 2, got {}.", - p.len() - 1 - ))); - } - if p[1].type_ != type_capture { - return Err(predicate_error(row, format!( - "First argument to #match? predicate must be a capture name. Got literal \"{}\".", - string_values[p[1].value_id as usize], - ))); - } - if p[2].type_ == type_capture { - return Err(predicate_error(row, format!( - "Second argument to #match? predicate must be a literal. Got capture @{}.", - result.capture_names[p[2].value_id as usize], - ))); - } - - let is_positive = operator_name == "match?"; - let regex = &string_values[p[2].value_id as usize]; - text_predicates.push(TextPredicate::CaptureMatchString( - p[1].value_id, - regex::bytes::Regex::new(regex).map_err(|_| { - predicate_error(row, format!("Invalid regex '{}'", regex)) - })?, - is_positive, - )); - } - - "set!" => property_settings.push(Self::parse_property( - row, - &operator_name, - &result.capture_names, - &string_values, - &p[1..], - )?), - - "is?" | "is-not?" => property_predicates.push(( - Self::parse_property( - row, - &operator_name, - &result.capture_names, - &string_values, - &p[1..], - )?, - operator_name == "is?", - )), - - _ => general_predicates.push(QueryPredicate { - operator: operator_name.clone().into_boxed_str(), - args: p[1..] 
- .iter() - .map(|a| { - if a.type_ == type_capture { - QueryPredicateArg::Capture(a.value_id) - } else { - QueryPredicateArg::String( - string_values[a.value_id as usize].clone().into_boxed_str(), - ) - } - }) - .collect(), - }), - } - } - - result - .text_predicates - .push(text_predicates.into_boxed_slice()); - result - .property_predicates - .push(property_predicates.into_boxed_slice()); - result - .property_settings - .push(property_settings.into_boxed_slice()); - result - .general_predicates - .push(general_predicates.into_boxed_slice()); - } - - Ok(result) + Query::from_raw_parts(ptr, source) } /// Consumes the [Query], returning a raw pointer to the underlying C structure. diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index c2a0ead0..9d470457 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -1434,7 +1434,223 @@ impl Query { }); } - unsafe { Query::from_raw(ptr, source) } + unsafe { Query::from_raw_parts(ptr, source) } + } + + #[doc(hidden)] + unsafe fn from_raw_parts(ptr: *mut ffi::TSQuery, source: &str) -> Result { + let string_count = unsafe { ffi::ts_query_string_count(ptr) }; + let capture_count = unsafe { ffi::ts_query_capture_count(ptr) }; + let pattern_count = unsafe { ffi::ts_query_pattern_count(ptr) as usize }; + let mut result = Query { + ptr: unsafe { NonNull::new_unchecked(ptr) }, + capture_names: Vec::with_capacity(capture_count as usize), + capture_quantifiers: Vec::with_capacity(pattern_count as usize), + text_predicates: Vec::with_capacity(pattern_count), + property_predicates: Vec::with_capacity(pattern_count), + property_settings: Vec::with_capacity(pattern_count), + general_predicates: Vec::with_capacity(pattern_count), + }; + + // Build a vector of strings to store the capture names. 
+ for i in 0..capture_count { + unsafe { + let mut length = 0u32; + let name = + ffi::ts_query_capture_name_for_id(ptr, i, &mut length as *mut u32) as *const u8; + let name = slice::from_raw_parts(name, length as usize); + let name = str::from_utf8_unchecked(name); + result.capture_names.push(name.to_string()); + } + } + + // Build a vector to store capture qunatifiers. + for i in 0..pattern_count { + let mut capture_quantifiers = Vec::with_capacity(capture_count as usize); + for j in 0..capture_count { + unsafe { + let quantifier = ffi::ts_query_capture_quantifier_for_id(ptr, i as u32, j); + capture_quantifiers.push(quantifier.into()); + } + } + result.capture_quantifiers.push(capture_quantifiers); + } + + // Build a vector of strings to represent literal values used in predicates. + let string_values = (0..string_count) + .map(|i| unsafe { + let mut length = 0u32; + let value = + ffi::ts_query_string_value_for_id(ptr, i as u32, &mut length as *mut u32) + as *const u8; + let value = slice::from_raw_parts(value, length as usize); + let value = str::from_utf8_unchecked(value); + value.to_string() + }) + .collect::>(); + + // Build a vector of predicates for each pattern. 
+ for i in 0..pattern_count { + let predicate_steps = unsafe { + let mut length = 0u32; + let raw_predicates = + ffi::ts_query_predicates_for_pattern(ptr, i as u32, &mut length as *mut u32); + if length > 0 { + slice::from_raw_parts(raw_predicates, length as usize) + } else { + &[] + } + }; + + let byte_offset = unsafe { ffi::ts_query_start_byte_for_pattern(ptr, i as u32) }; + let row = source + .char_indices() + .take_while(|(i, _)| *i < byte_offset as usize) + .filter(|(_, c)| *c == '\n') + .count(); + + let type_done = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeDone; + let type_capture = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture; + let type_string = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeString; + + let mut text_predicates = Vec::new(); + let mut property_predicates = Vec::new(); + let mut property_settings = Vec::new(); + let mut general_predicates = Vec::new(); + for p in predicate_steps.split(|s| s.type_ == type_done) { + if p.is_empty() { + continue; + } + + if p[0].type_ != type_string { + return Err(predicate_error( + row, + format!( + "Expected predicate to start with a function name. Got @{}.", + result.capture_names[p[0].value_id as usize], + ), + )); + } + + // Build a predicate for each of the known predicate function names. + let operator_name = &string_values[p[0].value_id as usize]; + match operator_name.as_str() { + "eq?" | "not-eq?" => { + if p.len() != 3 { + return Err(predicate_error( + row, + format!( + "Wrong number of arguments to #eq? predicate. Expected 2, got {}.", + p.len() - 1 + ), + )); + } + if p[1].type_ != type_capture { + return Err(predicate_error(row, format!( + "First argument to #eq? predicate must be a capture name. 
Got literal \"{}\".", + string_values[p[1].value_id as usize], + ))); + } + + let is_positive = operator_name == "eq?"; + text_predicates.push(if p[2].type_ == type_capture { + TextPredicate::CaptureEqCapture( + p[1].value_id, + p[2].value_id, + is_positive, + ) + } else { + TextPredicate::CaptureEqString( + p[1].value_id, + string_values[p[2].value_id as usize].clone(), + is_positive, + ) + }); + } + + "match?" | "not-match?" => { + if p.len() != 3 { + return Err(predicate_error(row, format!( + "Wrong number of arguments to #match? predicate. Expected 2, got {}.", + p.len() - 1 + ))); + } + if p[1].type_ != type_capture { + return Err(predicate_error(row, format!( + "First argument to #match? predicate must be a capture name. Got literal \"{}\".", + string_values[p[1].value_id as usize], + ))); + } + if p[2].type_ == type_capture { + return Err(predicate_error(row, format!( + "Second argument to #match? predicate must be a literal. Got capture @{}.", + result.capture_names[p[2].value_id as usize], + ))); + } + + let is_positive = operator_name == "match?"; + let regex = &string_values[p[2].value_id as usize]; + text_predicates.push(TextPredicate::CaptureMatchString( + p[1].value_id, + regex::bytes::Regex::new(regex).map_err(|_| { + predicate_error(row, format!("Invalid regex '{}'", regex)) + })?, + is_positive, + )); + } + + "set!" => property_settings.push(Self::parse_property( + row, + &operator_name, + &result.capture_names, + &string_values, + &p[1..], + )?), + + "is?" | "is-not?" => property_predicates.push(( + Self::parse_property( + row, + &operator_name, + &result.capture_names, + &string_values, + &p[1..], + )?, + operator_name == "is?", + )), + + _ => general_predicates.push(QueryPredicate { + operator: operator_name.clone().into_boxed_str(), + args: p[1..] 
+ .iter() + .map(|a| { + if a.type_ == type_capture { + QueryPredicateArg::Capture(a.value_id) + } else { + QueryPredicateArg::String( + string_values[a.value_id as usize].clone().into_boxed_str(), + ) + } + }) + .collect(), + }), + } + } + + result + .text_predicates + .push(text_predicates.into_boxed_slice()); + result + .property_predicates + .push(property_predicates.into_boxed_slice()); + result + .property_settings + .push(property_settings.into_boxed_slice()); + result + .general_predicates + .push(general_predicates.into_boxed_slice()); + } + + Ok(result) } /// Get the byte offset where the given pattern starts in the query's source. @@ -2081,7 +2297,7 @@ impl<'a> Iterator for LossyUtf8<'a> { } } -pub(crate) fn predicate_error(row: usize, message: String) -> QueryError { +fn predicate_error(row: usize, message: String) -> QueryError { QueryError { kind: QueryErrorKind::Predicate, row, From 0261a13984cad1740a6a1ddf53bce978156bd001 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 25 Feb 2023 19:54:23 +0200 Subject: [PATCH 071/347] lib: fix `ts_node_field_name_for_child` implementation With hidden subtrees correct incorporation and field inheritance support. 
--- lib/src/node.c | 60 +++++++++++++++++++++++++++++++++++++++----------- 1 file changed, 47 insertions(+), 13 deletions(-) diff --git a/lib/src/node.c b/lib/src/node.c index de59504e..36bfb24c 100644 --- a/lib/src/node.c +++ b/lib/src/node.c @@ -569,24 +569,58 @@ recur: return ts_node__null(); } -const char *ts_node_field_name_for_child(TSNode self, uint32_t child_index) { - const TSFieldMapEntry *field_map_start = NULL, *field_map_end = NULL; - if (!ts_node_child_count(self)) { +static inline const char *ts_node__field_name_from_language(TSNode self, uint32_t structural_child_index) { + const TSFieldMapEntry *field_map, *field_map_end; + ts_language_field_map( + self.tree->language, + ts_node__subtree(self).ptr->production_id, + &field_map, + &field_map_end + ); + for (; field_map != field_map_end; field_map++) { + if (!field_map->inherited && field_map->child_index == structural_child_index) { + return self.tree->language->field_names[field_map->field_id]; + } + } return NULL; - } +} - ts_language_field_map( - self.tree->language, - ts_node__subtree(self).ptr->production_id, - &field_map_start, - &field_map_end - ); +const char *ts_node_field_name_for_child(TSNode self, uint32_t child_index) { + TSNode result = self; + bool did_descend = true; + const char *inherited_field_name = NULL; - for (const TSFieldMapEntry *i = field_map_start; i < field_map_end; i++) { - if (i->child_index == child_index) { - return self.tree->language->field_names[i->field_id]; + while (did_descend) { + did_descend = false; + + TSNode child; + uint32_t index = 0; + NodeChildIterator iterator = ts_node_iterate_children(&result); + while (ts_node_child_iterator_next(&iterator, &child)) { + if (ts_node__is_relevant(child, true)) { + if (index == child_index) { + const char *field_name = ts_node__field_name_from_language(result, iterator.structural_child_index - 1); + if (field_name) return field_name; + return inherited_field_name; + } + index++; + } else { + uint32_t grandchild_index = 
child_index - index; + uint32_t grandchild_count = ts_node__relevant_child_count(child, true); + if (grandchild_index < grandchild_count) { + const char *field_name = ts_node__field_name_from_language(result, iterator.structural_child_index - 1); + if (field_name) inherited_field_name = field_name; + + did_descend = true; + result = child; + child_index = grandchild_index; + break; + } + index += grandchild_count; + } } } + return NULL; } From cde45268b6b5de8ab5894ec4313c16b46e5de443 Mon Sep 17 00:00:00 2001 From: Matt <85322+mattmassicotte@users.noreply.github.com> Date: Thu, 22 Sep 2022 06:39:52 -0400 Subject: [PATCH 072/347] subtree casts --- lib/src/subtree.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/lib/src/subtree.c b/lib/src/subtree.c index f8f82951..fd76402f 100644 --- a/lib/src/subtree.c +++ b/lib/src/subtree.c @@ -348,7 +348,7 @@ void ts_subtree_balance(Subtree self, SubtreePool *pool, const TSLanguage *langu Subtree child2 = ts_subtree_children(tree)[tree.ptr->child_count - 1]; long repeat_delta = (long)ts_subtree_repeat_depth(child1) - (long)ts_subtree_repeat_depth(child2); if (repeat_delta > 0) { - unsigned n = repeat_delta; + unsigned n = (unsigned)repeat_delta; for (unsigned i = n / 2; i > 0; i /= 2) { ts_subtree__compress(tree, i, language, &pool->tree_stack); n -= i; @@ -513,7 +513,7 @@ MutableSubtree ts_subtree_new_node( size_t new_byte_size = ts_subtree_alloc_size(children->size); if (children->capacity * sizeof(Subtree) < new_byte_size) { children->contents = ts_realloc(children->contents, new_byte_size); - children->capacity = new_byte_size / sizeof(Subtree); + children->capacity = (uint32_t)(new_byte_size / sizeof(Subtree)); } SubtreeHeapData *data = (SubtreeHeapData *)&children->contents[children->size]; From 65c16bfb17021b09a516c460f7a973b3325a5221 Mon Sep 17 00:00:00 2001 From: Matt <85322+mattmassicotte@users.noreply.github.com> Date: Thu, 22 Sep 2022 06:47:53 -0400 Subject: [PATCH 073/347] query casts --- 
lib/src/query.c | 22 +++++++++++----------- 1 file changed, 11 insertions(+), 11 deletions(-) diff --git a/lib/src/query.c b/lib/src/query.c index cfe11438..18bd7fd3 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -331,7 +331,7 @@ static bool stream_advance(Stream *self) { if (self->input < self->end) { uint32_t size = ts_decode_utf8( (const uint8_t *)self->input, - self->end - self->input, + (uint32_t)(self->end - self->input), &self->next ); if (size > 0) { @@ -398,7 +398,7 @@ static void stream_scan_identifier(Stream *stream) { } static uint32_t stream_offset(Stream *self) { - return self->input - self->start; + return (uint32_t)(self->input - self->start); } /****************** @@ -2064,7 +2064,7 @@ static TSQueryError ts_query__parse_predicate( if (!stream_is_ident_start(stream)) return TSQueryErrorSyntax; const char *predicate_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - predicate_name; + uint32_t length = (uint32_t)(stream->input - predicate_name); uint16_t id = symbol_table_insert_name( &self->predicate_values, predicate_name, @@ -2095,7 +2095,7 @@ static TSQueryError ts_query__parse_predicate( if (!stream_is_ident_start(stream)) return TSQueryErrorSyntax; const char *capture_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - capture_name; + uint32_t length = (uint32_t)(stream->input - capture_name); // Add the capture id to the first step of the pattern int capture_id = symbol_table_id_for_name( @@ -2133,7 +2133,7 @@ static TSQueryError ts_query__parse_predicate( else if (stream_is_ident_start(stream)) { const char *symbol_start = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - symbol_start; + uint32_t length = (uint32_t)(stream->input - symbol_start); uint16_t id = symbol_table_insert_name( &self->predicate_values, symbol_start, @@ -2302,7 +2302,7 @@ static TSQueryError ts_query__parse_pattern( if (stream_is_ident_start(stream)) { 
const char *node_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - node_name; + uint32_t length = (uint32_t)(stream->input - node_name); // TODO - remove. // For temporary backward compatibility, handle predicates without the leading '#' sign. @@ -2353,7 +2353,7 @@ static TSQueryError ts_query__parse_pattern( const char *node_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - node_name; + uint32_t length = (uint32_t)(stream->input - node_name); step->symbol = ts_language_symbol_for_name( self->language, @@ -2386,7 +2386,7 @@ static TSQueryError ts_query__parse_pattern( } const char *field_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - field_name; + uint32_t length = (uint32_t)(stream->input - field_name); stream_skip_whitespace(stream); TSFieldId field_id = ts_language_field_id_for_name( @@ -2497,7 +2497,7 @@ static TSQueryError ts_query__parse_pattern( // Parse the field name const char *field_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - field_name; + uint32_t length = (uint32_t)(stream->input - field_name); stream_skip_whitespace(stream); if (stream->next != ':') { @@ -2616,7 +2616,7 @@ static TSQueryError ts_query__parse_pattern( if (!stream_is_ident_start(stream)) return TSQueryErrorSyntax; const char *capture_name = stream->input; stream_scan_identifier(stream); - uint32_t length = stream->input - capture_name; + uint32_t length = (uint32_t)(stream->input - capture_name); stream_skip_whitespace(stream); // Add the capture id to the first step of the pattern @@ -3323,7 +3323,7 @@ static QueryState *ts_query_cursor__copy_state( QueryState **state_ref ) { const QueryState *state = *state_ref; - uint32_t state_index = state - self->states.contents; + uint32_t state_index = (uint32_t)(state - self->states.contents); QueryState copy = *state; copy.capture_list_id = NONE; From 
0751736d1709d738b462ecd878b75c0fab536e3a Mon Sep 17 00:00:00 2001 From: Andreas Deininger Date: Fri, 31 Mar 2023 21:02:32 +0200 Subject: [PATCH 074/347] docs: convert various links to https protocol --- cli/README.md | 4 ++-- cli/npm/dsl.d.ts | 2 +- cli/npm/package.json | 2 +- cli/src/generate/grammar-schema.json | 2 +- cli/src/playground.html | 4 ++-- docs/index.md | 6 +++--- docs/section-2-using-parsers.md | 2 +- docs/section-3-creating-parsers.md | 2 +- docs/section-5-implementation.md | 2 +- 9 files changed, 13 insertions(+), 13 deletions(-) diff --git a/cli/README.md b/cli/README.md index 8cdda9c0..eff3608c 100644 --- a/cli/README.md +++ b/cli/README.md @@ -30,8 +30,8 @@ The `tree-sitter` binary itself has no dependencies, but specific commands have ### Commands -* `generate` - The `tree-sitter generate` command will generate a Tree-sitter parser based on the grammar in the current working directory. See [the documentation](http://tree-sitter.github.io/tree-sitter/creating-parsers) for more information. +* `generate` - The `tree-sitter generate` command will generate a Tree-sitter parser based on the grammar in the current working directory. See [the documentation](https://tree-sitter.github.io/tree-sitter/creating-parsers) for more information. -* `test` - The `tree-sitter test` command will run the unit tests for the Tree-sitter parser in the current working directory. See [the documentation](http://tree-sitter.github.io/tree-sitter/creating-parsers) for more information. +* `test` - The `tree-sitter test` command will run the unit tests for the Tree-sitter parser in the current working directory. See [the documentation](https://tree-sitter.github.io/tree-sitter/creating-parsers) for more information. * `parse` - The `tree-sitter parse` command will parse a file (or list of files) using Tree-sitter parsers. 
diff --git a/cli/npm/dsl.d.ts b/cli/npm/dsl.d.ts index f2ee57f1..fdf43b55 100644 --- a/cli/npm/dsl.d.ts +++ b/cli/npm/dsl.d.ts @@ -134,7 +134,7 @@ interface Grammar< * * @param $ grammar rules * - * @see http://tree-sitter.github.io/tree-sitter/using-parsers#static-node-types + * @see https://tree-sitter.github.io/tree-sitter/using-parsers#static-node-types */ supertypes?: ( $: GrammarSymbols, diff --git a/cli/npm/package.json b/cli/npm/package.json index 02309193..44d1327f 100644 --- a/cli/npm/package.json +++ b/cli/npm/package.json @@ -5,7 +5,7 @@ "license": "MIT", "repository": { "type": "git", - "url": "http://github.com/tree-sitter/tree-sitter.git" + "url": "https://github.com/tree-sitter/tree-sitter.git" }, "description": "CLI for generating fast incremental parsers", "keywords": [ diff --git a/cli/src/generate/grammar-schema.json b/cli/src/generate/grammar-schema.json index 5ca35370..952aac80 100644 --- a/cli/src/generate/grammar-schema.json +++ b/cli/src/generate/grammar-schema.json @@ -63,7 +63,7 @@ }, "supertypes": { - "description": "A list of hidden rule names that should be considered supertypes in the generated node types file. See http://tree-sitter.github.io/tree-sitter/using-parsers#static-node-types.", + "description": "A list of hidden rule names that should be considered supertypes in the generated node types file. 
See https://tree-sitter.github.io/tree-sitter/using-parsers#static-node-types.", "type": "array", "items": { "description": "the name of a rule in `rules` or `extras`", diff --git a/cli/src/playground.html b/cli/src/playground.html index 22c874df..b69f9351 100644 --- a/cli/src/playground.html +++ b/cli/src/playground.html @@ -3,8 +3,8 @@ tree-sitter THE_LANGUAGE_NAME - - + + diff --git a/docs/index.md b/docs/index.md index 2e3b59ed..9a15db06 100644 --- a/docs/index.md +++ b/docs/index.md @@ -158,7 +158,7 @@ The design of Tree-sitter was greatly influenced by the following research paper - [Practical Algorithms for Incremental Software Development Environments](https://www2.eecs.berkeley.edu/Pubs/TechRpts/1997/CSD-97-946.pdf) - [Context Aware Scanning for Parsing Extensible Languages](https://www-users.cse.umn.edu/~evw/pubs/vanwyk07gpce/vanwyk07gpce.pdf) -- [Efficient and Flexible Incremental Parsing](http://harmonia.cs.berkeley.edu/papers/twagner-parsing.pdf) -- [Incremental Analysis of Real Programming Languages](http://harmonia.cs.berkeley.edu/papers/twagner-glr.pdf) -- [Error Detection and Recovery in LR Parsers](http://what-when-how.com/compiler-writing/bottom-up-parsing-compiler-writing-part-13) +- [Efficient and Flexible Incremental Parsing](https://harmonia.cs.berkeley.edu/papers/twagner-parsing.pdf) +- [Incremental Analysis of Real Programming Languages](https://harmonia.cs.berkeley.edu/papers/twagner-glr.pdf) +- [Error Detection and Recovery in LR Parsers](https://what-when-how.com/compiler-writing/bottom-up-parsing-compiler-writing-part-13) - [Error Recovery for LR Parsers](https://apps.dtic.mil/sti/pdfs/ADA043470.pdf) diff --git a/docs/section-2-using-parsers.md b/docs/section-2-using-parsers.md index ea32f4f5..0d683dc1 100644 --- a/docs/section-2-using-parsers.md +++ b/docs/section-2-using-parsers.md @@ -290,7 +290,7 @@ This `ts_node_edit` function is _only_ needed in the case where you have retriev ### Multi-language Documents -Sometimes, different 
parts of a file may be written in different languages. For example, templating languages like [EJS](http://ejs.co) and [ERB](https://ruby-doc.org/stdlib-2.5.1/libdoc/erb/rdoc/ERB.html) allow you to generate HTML by writing a mixture of HTML and another language like JavaScript or Ruby. +Sometimes, different parts of a file may be written in different languages. For example, templating languages like [EJS](https://ejs.co) and [ERB](https://ruby-doc.org/stdlib-2.5.1/libdoc/erb/rdoc/ERB.html) allow you to generate HTML by writing a mixture of HTML and another language like JavaScript or Ruby. Tree-sitter handles these types of documents by allowing you to create a syntax tree based on the text in certain _ranges_ of a file. diff --git a/docs/section-3-creating-parsers.md b/docs/section-3-creating-parsers.md index 5677292f..0842edbb 100644 --- a/docs/section-3-creating-parsers.md +++ b/docs/section-3-creating-parsers.md @@ -752,7 +752,7 @@ External scanners are a common cause of infinite loops. Be very careful when emitting zero-width tokens from your external scanner, and if you consume characters in a loop be sure use the `eof` function to check whether you are at the end of the file. [ambiguous-grammar]: https://en.wikipedia.org/wiki/Ambiguous_grammar -[antlr]: http://www.antlr.org/ +[antlr]: https://www.antlr.org [bison-dprec]: https://www.gnu.org/software/bison/manual/html_node/Generalized-LR-Parsing.html [bison]: https://en.wikipedia.org/wiki/GNU_bison [c-linkage]: https://en.cppreference.com/w/cpp/language/language_linkage diff --git a/docs/section-5-implementation.md b/docs/section-5-implementation.md index 532f1046..e0fa9661 100644 --- a/docs/section-5-implementation.md +++ b/docs/section-5-implementation.md @@ -13,7 +13,7 @@ syntax trees up-to-date as the source code changes. 
`libtree-sitter` is designed The CLI is used to generate a parser for a language by supplying a [context-free grammar](https://en.wikipedia.org/wiki/Context-free_grammar) describing the -language. The CLI is a build tool; it is no longer needed once a parser has been generated. It is written in Rust, and is available on [crates.io](https://crates.io), [npm](http://npmjs.com), and as a pre-built binary [on GitHub](https://github.com/tree-sitter/tree-sitter/releases/latest). +language. The CLI is a build tool; it is no longer needed once a parser has been generated. It is written in Rust, and is available on [crates.io](https://crates.io), [npm](https://npmjs.com), and as a pre-built binary [on GitHub](https://github.com/tree-sitter/tree-sitter/releases/latest). ## The CLI From 5ce60ef9e5183c7cbc91d2fd2c3f50a1c63ced3e Mon Sep 17 00:00:00 2001 From: M Hickford Date: Sat, 5 Nov 2022 19:46:27 +0000 Subject: [PATCH 075/347] docs: clarify naming convention for bindings and parsers --- docs/index.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/docs/index.md b/docs/index.md index 2e3b59ed..cc4f5850 100644 --- a/docs/index.md +++ b/docs/index.md @@ -30,6 +30,8 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [Kotlin](https://github.com/oxisto/kotlintree) * [Java](https://github.com/serenadeai/java-tree-sitter) +By convention, bindings are named with the language first, eg. ruby-tree-sitter. + ### Parsers * [Ada](https://github.com/briot/tree-sitter-ada) @@ -146,6 +148,8 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [YANG](https://github.com/Hubro/tree-sitter-yang) * [Zig](https://github.com/maxxnino/tree-sitter-zig) +By convention, parsers are named with the language last, eg. tree-sitter-ruby. 
+ ### Talks on Tree-sitter * [Strange Loop 2018](https://www.thestrangeloop.com/2018/tree-sitter---a-new-parsing-system-for-programming-tools.html) From c38f78345e6bcd511fd0b1e7dfa1645ca69173b1 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 4 Apr 2023 22:16:27 +0300 Subject: [PATCH 076/347] binding(rust): update script/generate-bindings to use latest rust-bindgen 0.64.0 version --- lib/binding_rust/bindings.rs | 357 ++++++----------------------------- script/generate-bindings | 4 +- 2 files changed, 56 insertions(+), 305 deletions(-) diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index be117f83..863b1df5 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -1,4 +1,4 @@ -/* automatically generated by rust-bindgen 0.59.2 */ +/* automatically generated by rust-bindgen 0.64.0 */ pub type TSSymbol = u16; pub type TSFieldId = u16; @@ -148,14 +148,7 @@ extern "C" { pub fn ts_parser_delete(parser: *mut TSParser); } extern "C" { - #[doc = " Set the language that the parser should use for parsing."] - #[doc = ""] - #[doc = " Returns a boolean indicating whether or not the language was successfully"] - #[doc = " assigned. True means assignment succeeded. False means there was a version"] - #[doc = " mismatch: the language was generated with an incompatible version of the"] - #[doc = " Tree-sitter CLI. Check the language's version using `ts_language_version`"] - #[doc = " and compare it to this library's `TREE_SITTER_LANGUAGE_VERSION` and"] - #[doc = " `TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION` constants."] + #[doc = " Set the language that the parser should use for parsing.\n\n Returns a boolean indicating whether or not the language was successfully\n assigned. True means assignment succeeded. False means there was a version\n mismatch: the language was generated with an incompatible version of the\n Tree-sitter CLI. 
Check the language's version using `ts_language_version`\n and compare it to this library's `TREE_SITTER_LANGUAGE_VERSION` and\n `TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION` constants."] pub fn ts_parser_set_language(self_: *mut TSParser, language: *const TSLanguage) -> bool; } extern "C" { @@ -163,25 +156,7 @@ extern "C" { pub fn ts_parser_language(self_: *const TSParser) -> *const TSLanguage; } extern "C" { - #[doc = " Set the ranges of text that the parser should include when parsing."] - #[doc = ""] - #[doc = " By default, the parser will always include entire documents. This function"] - #[doc = " allows you to parse only a *portion* of a document but still return a syntax"] - #[doc = " tree whose ranges match up with the document as a whole. You can also pass"] - #[doc = " multiple disjoint ranges."] - #[doc = ""] - #[doc = " The second and third parameters specify the location and length of an array"] - #[doc = " of ranges. The parser does *not* take ownership of these ranges; it copies"] - #[doc = " the data, so it doesn't matter how these ranges are allocated."] - #[doc = ""] - #[doc = " If `length` is zero, then the entire document will be parsed. Otherwise,"] - #[doc = " the given ranges must be ordered from earliest to latest in the document,"] - #[doc = " and they must not overlap. That is, the following must hold for all"] - #[doc = " `i` < `length - 1`: ranges[i].end_byte <= ranges[i + 1].start_byte"] - #[doc = ""] - #[doc = " If this requirement is not satisfied, the operation will fail, the ranges"] - #[doc = " will not be assigned, and this function will return `false`. On success,"] - #[doc = " this function returns `true`"] + #[doc = " Set the ranges of text that the parser should include when parsing.\n\n By default, the parser will always include entire documents. This function\n allows you to parse only a *portion* of a document but still return a syntax\n tree whose ranges match up with the document as a whole. 
You can also pass\n multiple disjoint ranges.\n\n The second and third parameters specify the location and length of an array\n of ranges. The parser does *not* take ownership of these ranges; it copies\n the data, so it doesn't matter how these ranges are allocated.\n\n If `length` is zero, then the entire document will be parsed. Otherwise,\n the given ranges must be ordered from earliest to latest in the document,\n and they must not overlap. That is, the following must hold for all\n `i` < `length - 1`: ranges[i].end_byte <= ranges[i + 1].start_byte\n\n If this requirement is not satisfied, the operation will fail, the ranges\n will not be assigned, and this function will return `false`. On success,\n this function returns `true`"] pub fn ts_parser_set_included_ranges( self_: *mut TSParser, ranges: *const TSRange, @@ -189,50 +164,11 @@ extern "C" { ) -> bool; } extern "C" { - #[doc = " Get the ranges of text that the parser will include when parsing."] - #[doc = ""] - #[doc = " The returned pointer is owned by the parser. The caller should not free it"] - #[doc = " or write to it. The length of the array will be written to the given"] - #[doc = " `length` pointer."] + #[doc = " Get the ranges of text that the parser will include when parsing.\n\n The returned pointer is owned by the parser. The caller should not free it\n or write to it. The length of the array will be written to the given\n `length` pointer."] pub fn ts_parser_included_ranges(self_: *const TSParser, length: *mut u32) -> *const TSRange; } extern "C" { - #[doc = " Use the parser to parse some source code and create a syntax tree."] - #[doc = ""] - #[doc = " If you are parsing this document for the first time, pass `NULL` for the"] - #[doc = " `old_tree` parameter. 
Otherwise, if you have already parsed an earlier"] - #[doc = " version of this document and the document has since been edited, pass the"] - #[doc = " previous syntax tree so that the unchanged parts of it can be reused."] - #[doc = " This will save time and memory. For this to work correctly, you must have"] - #[doc = " already edited the old syntax tree using the `ts_tree_edit` function in a"] - #[doc = " way that exactly matches the source code changes."] - #[doc = ""] - #[doc = " The `TSInput` parameter lets you specify how to read the text. It has the"] - #[doc = " following three fields:"] - #[doc = " 1. `read`: A function to retrieve a chunk of text at a given byte offset"] - #[doc = " and (row, column) position. The function should return a pointer to the"] - #[doc = " text and write its length to the `bytes_read` pointer. The parser does"] - #[doc = " not take ownership of this buffer; it just borrows it until it has"] - #[doc = " finished reading it. The function should write a zero value to the"] - #[doc = " `bytes_read` pointer to indicate the end of the document."] - #[doc = " 2. `payload`: An arbitrary pointer that will be passed to each invocation"] - #[doc = " of the `read` function."] - #[doc = " 3. `encoding`: An indication of how the text is encoded. Either"] - #[doc = " `TSInputEncodingUTF8` or `TSInputEncodingUTF16`."] - #[doc = ""] - #[doc = " This function returns a syntax tree on success, and `NULL` on failure. There"] - #[doc = " are three possible reasons for failure:"] - #[doc = " 1. The parser does not have a language assigned. Check for this using the"] - #[doc = "`ts_parser_language` function."] - #[doc = " 2. Parsing was cancelled due to a timeout that was set by an earlier call to"] - #[doc = " the `ts_parser_set_timeout_micros` function. You can resume parsing from"] - #[doc = " where the parser left out by calling `ts_parser_parse` again with the"] - #[doc = " same arguments. 
Or you can start parsing from scratch by first calling"] - #[doc = " `ts_parser_reset`."] - #[doc = " 3. Parsing was cancelled using a cancellation flag that was set by an"] - #[doc = " earlier call to `ts_parser_set_cancellation_flag`. You can resume parsing"] - #[doc = " from where the parser left out by calling `ts_parser_parse` again with"] - #[doc = " the same arguments."] + #[doc = " Use the parser to parse some source code and create a syntax tree.\n\n If you are parsing this document for the first time, pass `NULL` for the\n `old_tree` parameter. Otherwise, if you have already parsed an earlier\n version of this document and the document has since been edited, pass the\n previous syntax tree so that the unchanged parts of it can be reused.\n This will save time and memory. For this to work correctly, you must have\n already edited the old syntax tree using the `ts_tree_edit` function in a\n way that exactly matches the source code changes.\n\n The `TSInput` parameter lets you specify how to read the text. It has the\n following three fields:\n 1. `read`: A function to retrieve a chunk of text at a given byte offset\n and (row, column) position. The function should return a pointer to the\n text and write its length to the `bytes_read` pointer. The parser does\n not take ownership of this buffer; it just borrows it until it has\n finished reading it. The function should write a zero value to the\n `bytes_read` pointer to indicate the end of the document.\n 2. `payload`: An arbitrary pointer that will be passed to each invocation\n of the `read` function.\n 3. `encoding`: An indication of how the text is encoded. Either\n `TSInputEncodingUTF8` or `TSInputEncodingUTF16`.\n\n This function returns a syntax tree on success, and `NULL` on failure. There\n are three possible reasons for failure:\n 1. The parser does not have a language assigned. Check for this using the\n`ts_parser_language` function.\n 2. 
Parsing was cancelled due to a timeout that was set by an earlier call to\n the `ts_parser_set_timeout_micros` function. You can resume parsing from\n where the parser left out by calling `ts_parser_parse` again with the\n same arguments. Or you can start parsing from scratch by first calling\n `ts_parser_reset`.\n 3. Parsing was cancelled using a cancellation flag that was set by an\n earlier call to `ts_parser_set_cancellation_flag`. You can resume parsing\n from where the parser left out by calling `ts_parser_parse` again with\n the same arguments."] pub fn ts_parser_parse( self_: *mut TSParser, old_tree: *const TSTree, @@ -240,10 +176,7 @@ extern "C" { ) -> *mut TSTree; } extern "C" { - #[doc = " Use the parser to parse some source code stored in one contiguous buffer."] - #[doc = " The first two parameters are the same as in the `ts_parser_parse` function"] - #[doc = " above. The second two parameters indicate the location of the buffer and its"] - #[doc = " length in bytes."] + #[doc = " Use the parser to parse some source code stored in one contiguous buffer.\n The first two parameters are the same as in the `ts_parser_parse` function\n above. The second two parameters indicate the location of the buffer and its\n length in bytes."] pub fn ts_parser_parse_string( self_: *mut TSParser, old_tree: *const TSTree, @@ -252,10 +185,7 @@ extern "C" { ) -> *mut TSTree; } extern "C" { - #[doc = " Use the parser to parse some source code stored in one contiguous buffer with"] - #[doc = " a given encoding. The first four parameters work the same as in the"] - #[doc = " `ts_parser_parse_string` method above. The final parameter indicates whether"] - #[doc = " the text is encoded as UTF8 or UTF16."] + #[doc = " Use the parser to parse some source code stored in one contiguous buffer with\n a given encoding. The first four parameters work the same as in the\n `ts_parser_parse_string` method above. 
The final parameter indicates whether\n the text is encoded as UTF8 or UTF16."] pub fn ts_parser_parse_string_encoding( self_: *mut TSParser, old_tree: *const TSTree, @@ -265,21 +195,11 @@ extern "C" { ) -> *mut TSTree; } extern "C" { - #[doc = " Instruct the parser to start the next parse from the beginning."] - #[doc = ""] - #[doc = " If the parser previously failed because of a timeout or a cancellation, then"] - #[doc = " by default, it will resume where it left off on the next call to"] - #[doc = " `ts_parser_parse` or other parsing functions. If you don't want to resume,"] - #[doc = " and instead intend to use this parser to parse some other document, you must"] - #[doc = " call `ts_parser_reset` first."] + #[doc = " Instruct the parser to start the next parse from the beginning.\n\n If the parser previously failed because of a timeout or a cancellation, then\n by default, it will resume where it left off on the next call to\n `ts_parser_parse` or other parsing functions. If you don't want to resume,\n and instead intend to use this parser to parse some other document, you must\n call `ts_parser_reset` first."] pub fn ts_parser_reset(self_: *mut TSParser); } extern "C" { - #[doc = " Set the maximum duration in microseconds that parsing should be allowed to"] - #[doc = " take before halting."] - #[doc = ""] - #[doc = " If parsing takes longer than this, it will halt early, returning NULL."] - #[doc = " See `ts_parser_parse` for more information."] + #[doc = " Set the maximum duration in microseconds that parsing should be allowed to\n take before halting.\n\n If parsing takes longer than this, it will halt early, returning NULL.\n See `ts_parser_parse` for more information."] pub fn ts_parser_set_timeout_micros(self_: *mut TSParser, timeout: u64); } extern "C" { @@ -287,11 +207,7 @@ extern "C" { pub fn ts_parser_timeout_micros(self_: *const TSParser) -> u64; } extern "C" { - #[doc = " Set the parser's current cancellation flag pointer."] - #[doc = ""] - #[doc 
= " If a non-null pointer is assigned, then the parser will periodically read"] - #[doc = " from this pointer during parsing. If it reads a non-zero value, it will"] - #[doc = " halt early, returning NULL. See `ts_parser_parse` for more information."] + #[doc = " Set the parser's current cancellation flag pointer.\n\n If a non-null pointer is assigned, then the parser will periodically read\n from this pointer during parsing. If it reads a non-zero value, it will\n halt early, returning NULL. See `ts_parser_parse` for more information."] pub fn ts_parser_set_cancellation_flag(self_: *mut TSParser, flag: *const usize); } extern "C" { @@ -299,11 +215,7 @@ extern "C" { pub fn ts_parser_cancellation_flag(self_: *const TSParser) -> *const usize; } extern "C" { - #[doc = " Set the logger that a parser should use during parsing."] - #[doc = ""] - #[doc = " The parser does not take ownership over the logger payload. If a logger was"] - #[doc = " previously assigned, the caller is responsible for releasing any memory"] - #[doc = " owned by the previous logger."] + #[doc = " Set the logger that a parser should use during parsing.\n\n The parser does not take ownership over the logger payload. If a logger was\n previously assigned, the caller is responsible for releasing any memory\n owned by the previous logger."] pub fn ts_parser_set_logger(self_: *mut TSParser, logger: TSLogger); } extern "C" { @@ -311,17 +223,11 @@ extern "C" { pub fn ts_parser_logger(self_: *const TSParser) -> TSLogger; } extern "C" { - #[doc = " Set the file descriptor to which the parser should write debugging graphs"] - #[doc = " during parsing. The graphs are formatted in the DOT language. You may want"] - #[doc = " to pipe these graphs directly to a `dot(1)` process in order to generate"] - #[doc = " SVG output. You can turn off this logging by passing a negative number."] + #[doc = " Set the file descriptor to which the parser should write debugging graphs\n during parsing. 
The graphs are formatted in the DOT language. You may want\n to pipe these graphs directly to a `dot(1)` process in order to generate\n SVG output. You can turn off this logging by passing a negative number."] pub fn ts_parser_print_dot_graphs(self_: *mut TSParser, file: ::std::os::raw::c_int); } extern "C" { - #[doc = " Create a shallow copy of the syntax tree. This is very fast."] - #[doc = ""] - #[doc = " You need to copy a syntax tree in order to use it on more than one thread at"] - #[doc = " a time, as syntax trees are not thread safe."] + #[doc = " Create a shallow copy of the syntax tree. This is very fast.\n\n You need to copy a syntax tree in order to use it on more than one thread at\n a time, as syntax trees are not thread safe."] pub fn ts_tree_copy(self_: *const TSTree) -> *mut TSTree; } extern "C" { @@ -333,8 +239,7 @@ extern "C" { pub fn ts_tree_root_node(self_: *const TSTree) -> TSNode; } extern "C" { - #[doc = " Get the root node of the syntax tree, but with its position"] - #[doc = " shifted forward by the given offset."] + #[doc = " Get the root node of the syntax tree, but with its position\n shifted forward by the given offset."] pub fn ts_tree_root_node_with_offset( self_: *const TSTree, offset_bytes: u32, @@ -346,32 +251,15 @@ extern "C" { pub fn ts_tree_language(arg1: *const TSTree) -> *const TSLanguage; } extern "C" { - #[doc = " Get the array of included ranges that was used to parse the syntax tree."] - #[doc = ""] - #[doc = " The returned pointer must be freed by the caller."] + #[doc = " Get the array of included ranges that was used to parse the syntax tree.\n\n The returned pointer must be freed by the caller."] pub fn ts_tree_included_ranges(arg1: *const TSTree, length: *mut u32) -> *mut TSRange; } extern "C" { - #[doc = " Edit the syntax tree to keep it in sync with source code that has been"] - #[doc = " edited."] - #[doc = ""] - #[doc = " You must describe the edit both in terms of byte offsets and in terms of"] - #[doc = " (row, 
column) coordinates."] + #[doc = " Edit the syntax tree to keep it in sync with source code that has been\n edited.\n\n You must describe the edit both in terms of byte offsets and in terms of\n (row, column) coordinates."] pub fn ts_tree_edit(self_: *mut TSTree, edit: *const TSInputEdit); } extern "C" { - #[doc = " Compare an old edited syntax tree to a new syntax tree representing the same"] - #[doc = " document, returning an array of ranges whose syntactic structure has changed."] - #[doc = ""] - #[doc = " For this to work correctly, the old syntax tree must have been edited such"] - #[doc = " that its ranges match up to the new tree. Generally, you'll want to call"] - #[doc = " this function right after calling one of the `ts_parser_parse` functions."] - #[doc = " You need to pass the old tree that was passed to parse, as well as the new"] - #[doc = " tree that was returned from that function."] - #[doc = ""] - #[doc = " The returned array is allocated using `malloc` and the caller is responsible"] - #[doc = " for freeing it using `free`. The length of the array will be written to the"] - #[doc = " given `length` pointer."] + #[doc = " Compare an old edited syntax tree to a new syntax tree representing the same\n document, returning an array of ranges whose syntactic structure has changed.\n\n For this to work correctly, the old syntax tree must have been edited such\n that its ranges match up to the new tree. Generally, you'll want to call\n this function right after calling one of the `ts_parser_parse` functions.\n You need to pass the old tree that was passed to parse, as well as the new\n tree that was returned from that function.\n\n The returned array is allocated using `malloc` and the caller is responsible\n for freeing it using `free`. 
The length of the array will be written to the\n given `length` pointer."] pub fn ts_tree_get_changed_ranges( old_tree: *const TSTree, new_tree: *const TSTree, @@ -407,32 +295,23 @@ extern "C" { pub fn ts_node_end_point(arg1: TSNode) -> TSPoint; } extern "C" { - #[doc = " Get an S-expression representing the node as a string."] - #[doc = ""] - #[doc = " This string is allocated with `malloc` and the caller is responsible for"] - #[doc = " freeing it using `free`."] + #[doc = " Get an S-expression representing the node as a string.\n\n This string is allocated with `malloc` and the caller is responsible for\n freeing it using `free`."] pub fn ts_node_string(arg1: TSNode) -> *mut ::std::os::raw::c_char; } extern "C" { - #[doc = " Check if the node is null. Functions like `ts_node_child` and"] - #[doc = " `ts_node_next_sibling` will return a null node to indicate that no such node"] - #[doc = " was found."] + #[doc = " Check if the node is null. Functions like `ts_node_child` and\n `ts_node_next_sibling` will return a null node to indicate that no such node\n was found."] pub fn ts_node_is_null(arg1: TSNode) -> bool; } extern "C" { - #[doc = " Check if the node is *named*. Named nodes correspond to named rules in the"] - #[doc = " grammar, whereas *anonymous* nodes correspond to string literals in the"] - #[doc = " grammar."] + #[doc = " Check if the node is *named*. Named nodes correspond to named rules in the\n grammar, whereas *anonymous* nodes correspond to string literals in the\n grammar."] pub fn ts_node_is_named(arg1: TSNode) -> bool; } extern "C" { - #[doc = " Check if the node is *missing*. Missing nodes are inserted by the parser in"] - #[doc = " order to recover from certain kinds of syntax errors."] + #[doc = " Check if the node is *missing*. Missing nodes are inserted by the parser in\n order to recover from certain kinds of syntax errors."] pub fn ts_node_is_missing(arg1: TSNode) -> bool; } extern "C" { - #[doc = " Check if the node is *extra*. 
Extra nodes represent things like comments,"] - #[doc = " which are not required the grammar, but can appear anywhere."] + #[doc = " Check if the node is *extra*. Extra nodes represent things like comments,\n which are not required the grammar, but can appear anywhere."] pub fn ts_node_is_extra(arg1: TSNode) -> bool; } extern "C" { @@ -448,13 +327,11 @@ extern "C" { pub fn ts_node_parent(arg1: TSNode) -> TSNode; } extern "C" { - #[doc = " Get the node's child at the given index, where zero represents the first"] - #[doc = " child."] + #[doc = " Get the node's child at the given index, where zero represents the first\n child."] pub fn ts_node_child(arg1: TSNode, arg2: u32) -> TSNode; } extern "C" { - #[doc = " Get the field name for node's child at the given index, where zero represents"] - #[doc = " the first child. Returns NULL, if no field is found."] + #[doc = " Get the field name for node's child at the given index, where zero represents\n the first child. Returns NULL, if no field is found."] pub fn ts_node_field_name_for_child(arg1: TSNode, arg2: u32) -> *const ::std::os::raw::c_char; } extern "C" { @@ -462,15 +339,11 @@ extern "C" { pub fn ts_node_child_count(arg1: TSNode) -> u32; } extern "C" { - #[doc = " Get the node's *named* child at the given index."] - #[doc = ""] - #[doc = " See also `ts_node_is_named`."] + #[doc = " Get the node's *named* child at the given index.\n\n See also `ts_node_is_named`."] pub fn ts_node_named_child(arg1: TSNode, arg2: u32) -> TSNode; } extern "C" { - #[doc = " Get the node's number of *named* children."] - #[doc = ""] - #[doc = " See also `ts_node_is_named`."] + #[doc = " Get the node's number of *named* children.\n\n See also `ts_node_is_named`."] pub fn ts_node_named_child_count(arg1: TSNode) -> u32; } extern "C" { @@ -482,10 +355,7 @@ extern "C" { ) -> TSNode; } extern "C" { - #[doc = " Get the node's child with the given numerical field id."] - #[doc = ""] - #[doc = " You can convert a field name to an id using the"] - 
#[doc = " `ts_language_field_id_for_name` function."] + #[doc = " Get the node's child with the given numerical field id.\n\n You can convert a field name to an id using the\n `ts_language_field_id_for_name` function."] pub fn ts_node_child_by_field_id(arg1: TSNode, arg2: TSFieldId) -> TSNode; } extern "C" { @@ -511,8 +381,7 @@ extern "C" { pub fn ts_node_first_named_child_for_byte(arg1: TSNode, arg2: u32) -> TSNode; } extern "C" { - #[doc = " Get the smallest node within this node that spans the given range of bytes"] - #[doc = " or (row, column) positions."] + #[doc = " Get the smallest node within this node that spans the given range of bytes\n or (row, column) positions."] pub fn ts_node_descendant_for_byte_range(arg1: TSNode, arg2: u32, arg3: u32) -> TSNode; } extern "C" { @@ -520,8 +389,7 @@ extern "C" { -> TSNode; } extern "C" { - #[doc = " Get the smallest named node within this node that spans the given range of"] - #[doc = " bytes or (row, column) positions."] + #[doc = " Get the smallest named node within this node that spans the given range of\n bytes or (row, column) positions."] pub fn ts_node_named_descendant_for_byte_range(arg1: TSNode, arg2: u32, arg3: u32) -> TSNode; } extern "C" { @@ -532,13 +400,7 @@ extern "C" { ) -> TSNode; } extern "C" { - #[doc = " Edit the node to keep it in-sync with source code that has been edited."] - #[doc = ""] - #[doc = " This function is only rarely needed. When you edit a syntax tree with the"] - #[doc = " `ts_tree_edit` function, all of the nodes that you retrieve from the tree"] - #[doc = " afterward will already reflect the edit. You only need to use `ts_node_edit`"] - #[doc = " when you have a `TSNode` instance that you want to keep and continue to use"] - #[doc = " after an edit."] + #[doc = " Edit the node to keep it in-sync with source code that has been edited.\n\n This function is only rarely needed. 
When you edit a syntax tree with the\n `ts_tree_edit` function, all of the nodes that you retrieve from the tree\n afterward will already reflect the edit. You only need to use `ts_node_edit`\n when you have a `TSNode` instance that you want to keep and continue to use\n after an edit."] pub fn ts_node_edit(arg1: *mut TSNode, arg2: *const TSInputEdit); } extern "C" { @@ -546,11 +408,7 @@ extern "C" { pub fn ts_node_eq(arg1: TSNode, arg2: TSNode) -> bool; } extern "C" { - #[doc = " Create a new tree cursor starting from the given node."] - #[doc = ""] - #[doc = " A tree cursor allows you to walk a syntax tree more efficiently than is"] - #[doc = " possible using the `TSNode` functions. It is a mutable object that is always"] - #[doc = " on a certain syntax node, and can be moved imperatively to different nodes."] + #[doc = " Create a new tree cursor starting from the given node.\n\n A tree cursor allows you to walk a syntax tree more efficiently than is\n possible using the `TSNode` functions. 
It is a mutable object that is always\n on a certain syntax node, and can be moved imperatively to different nodes."] pub fn ts_tree_cursor_new(arg1: TSNode) -> TSTreeCursor; } extern "C" { @@ -566,48 +424,29 @@ extern "C" { pub fn ts_tree_cursor_current_node(arg1: *const TSTreeCursor) -> TSNode; } extern "C" { - #[doc = " Get the field name of the tree cursor's current node."] - #[doc = ""] - #[doc = " This returns `NULL` if the current node doesn't have a field."] - #[doc = " See also `ts_node_child_by_field_name`."] + #[doc = " Get the field name of the tree cursor's current node.\n\n This returns `NULL` if the current node doesn't have a field.\n See also `ts_node_child_by_field_name`."] pub fn ts_tree_cursor_current_field_name( arg1: *const TSTreeCursor, ) -> *const ::std::os::raw::c_char; } extern "C" { - #[doc = " Get the field id of the tree cursor's current node."] - #[doc = ""] - #[doc = " This returns zero if the current node doesn't have a field."] - #[doc = " See also `ts_node_child_by_field_id`, `ts_language_field_id_for_name`."] + #[doc = " Get the field id of the tree cursor's current node.\n\n This returns zero if the current node doesn't have a field.\n See also `ts_node_child_by_field_id`, `ts_language_field_id_for_name`."] pub fn ts_tree_cursor_current_field_id(arg1: *const TSTreeCursor) -> TSFieldId; } extern "C" { - #[doc = " Move the cursor to the parent of its current node."] - #[doc = ""] - #[doc = " This returns `true` if the cursor successfully moved, and returns `false`"] - #[doc = " if there was no parent node (the cursor was already on the root node)."] + #[doc = " Move the cursor to the parent of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false`\n if there was no parent node (the cursor was already on the root node)."] pub fn ts_tree_cursor_goto_parent(arg1: *mut TSTreeCursor) -> bool; } extern "C" { - #[doc = " Move the cursor to the next sibling of its current node."] - #[doc = ""] - 
#[doc = " This returns `true` if the cursor successfully moved, and returns `false`"] - #[doc = " if there was no next sibling node."] + #[doc = " Move the cursor to the next sibling of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false`\n if there was no next sibling node."] pub fn ts_tree_cursor_goto_next_sibling(arg1: *mut TSTreeCursor) -> bool; } extern "C" { - #[doc = " Move the cursor to the first child of its current node."] - #[doc = ""] - #[doc = " This returns `true` if the cursor successfully moved, and returns `false`"] - #[doc = " if there were no children."] + #[doc = " Move the cursor to the first child of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false`\n if there were no children."] pub fn ts_tree_cursor_goto_first_child(arg1: *mut TSTreeCursor) -> bool; } extern "C" { - #[doc = " Move the cursor to the first child of its current node that extends beyond"] - #[doc = " the given byte offset or point."] - #[doc = ""] - #[doc = " This returns the index of the child node if one was found, and returns -1"] - #[doc = " if no such child was found."] + #[doc = " Move the cursor to the first child of its current node that extends beyond\n the given byte offset or point.\n\n This returns the index of the child node if one was found, and returns -1\n if no such child was found."] pub fn ts_tree_cursor_goto_first_child_for_byte(arg1: *mut TSTreeCursor, arg2: u32) -> i64; } extern "C" { @@ -618,15 +457,7 @@ extern "C" { pub fn ts_tree_cursor_copy(arg1: *const TSTreeCursor) -> TSTreeCursor; } extern "C" { - #[doc = " Create a new query from a string containing one or more S-expression"] - #[doc = " patterns. 
The query is associated with a particular language, and can"] - #[doc = " only be run on syntax nodes parsed with that language."] - #[doc = ""] - #[doc = " If all of the given patterns are valid, this returns a `TSQuery`."] - #[doc = " If a pattern is invalid, this returns `NULL`, and provides two pieces"] - #[doc = " of information about the problem:"] - #[doc = " 1. The byte offset of the error is written to the `error_offset` parameter."] - #[doc = " 2. The type of error is written to the `error_type` parameter."] + #[doc = " Create a new query from a string containing one or more S-expression\n patterns. The query is associated with a particular language, and can\n only be run on syntax nodes parsed with that language.\n\n If all of the given patterns are valid, this returns a `TSQuery`.\n If a pattern is invalid, this returns `NULL`, and provides two pieces\n of information about the problem:\n 1. The byte offset of the error is written to the `error_offset` parameter.\n 2. The type of error is written to the `error_type` parameter."] pub fn ts_query_new( language: *const TSLanguage, source: *const ::std::os::raw::c_char, @@ -650,27 +481,11 @@ extern "C" { pub fn ts_query_string_count(arg1: *const TSQuery) -> u32; } extern "C" { - #[doc = " Get the byte offset where the given pattern starts in the query's source."] - #[doc = ""] - #[doc = " This can be useful when combining queries by concatenating their source"] - #[doc = " code strings."] + #[doc = " Get the byte offset where the given pattern starts in the query's source.\n\n This can be useful when combining queries by concatenating their source\n code strings."] pub fn ts_query_start_byte_for_pattern(arg1: *const TSQuery, arg2: u32) -> u32; } extern "C" { - #[doc = " Get all of the predicates for the given pattern in the query."] - #[doc = ""] - #[doc = " The predicates are represented as a single array of steps. 
There are three"] - #[doc = " types of steps in this array, which correspond to the three legal values for"] - #[doc = " the `type` field:"] - #[doc = " - `TSQueryPredicateStepTypeCapture` - Steps with this type represent names"] - #[doc = " of captures. Their `value_id` can be used with the"] - #[doc = " `ts_query_capture_name_for_id` function to obtain the name of the capture."] - #[doc = " - `TSQueryPredicateStepTypeString` - Steps with this type represent literal"] - #[doc = " strings. Their `value_id` can be used with the"] - #[doc = " `ts_query_string_value_for_id` function to obtain their string value."] - #[doc = " - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels*"] - #[doc = " that represent the end of an individual predicate. If a pattern has two"] - #[doc = " predicates, then there will be two steps with this `type` in the array."] + #[doc = " Get all of the predicates for the given pattern in the query.\n\n The predicates are represented as a single array of steps. There are three\n types of steps in this array, which correspond to the three legal values for\n the `type` field:\n - `TSQueryPredicateStepTypeCapture` - Steps with this type represent names\n of captures. Their `value_id` can be used with the\n `ts_query_capture_name_for_id` function to obtain the name of the capture.\n - `TSQueryPredicateStepTypeString` - Steps with this type represent literal\n strings. Their `value_id` can be used with the\n `ts_query_string_value_for_id` function to obtain their string value.\n - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels*\n that represent the end of an individual predicate. 
If a pattern has two\n predicates, then there will be two steps with this `type` in the array."] pub fn ts_query_predicates_for_pattern( self_: *const TSQuery, pattern_index: u32, @@ -678,18 +493,16 @@ extern "C" { ) -> *const TSQueryPredicateStep; } extern "C" { - pub fn ts_query_is_pattern_non_local(self_: *const TSQuery, pattern_index: u32) -> bool; + pub fn ts_query_is_pattern_rooted(self_: *const TSQuery, pattern_index: u32) -> bool; } extern "C" { - pub fn ts_query_is_pattern_rooted(self_: *const TSQuery, pattern_index: u32) -> bool; + pub fn ts_query_is_pattern_non_local(self_: *const TSQuery, pattern_index: u32) -> bool; } extern "C" { pub fn ts_query_is_pattern_guaranteed_at_step(self_: *const TSQuery, byte_offset: u32) -> bool; } extern "C" { - #[doc = " Get the name and length of one of the query's captures, or one of the"] - #[doc = " query's string literals. Each capture and string is associated with a"] - #[doc = " numeric id based on the order that it appeared in the query's source."] + #[doc = " Get the name and length of one of the query's captures, or one of the\n query's string literals. Each capture and string is associated with a\n numeric id based on the order that it appeared in the query's source."] pub fn ts_query_capture_name_for_id( arg1: *const TSQuery, id: u32, @@ -697,8 +510,7 @@ extern "C" { ) -> *const ::std::os::raw::c_char; } extern "C" { - #[doc = " Get the quantifier of the query's captures. Each capture is * associated"] - #[doc = " with a numeric id based on the order that it appeared in the query's source."] + #[doc = " Get the quantifier of the query's captures. 
Each capture is * associated\n with a numeric id based on the order that it appeared in the query's source."] pub fn ts_query_capture_quantifier_for_id( arg1: *const TSQuery, pattern_id: u32, @@ -713,11 +525,7 @@ extern "C" { ) -> *const ::std::os::raw::c_char; } extern "C" { - #[doc = " Disable a certain capture within a query."] - #[doc = ""] - #[doc = " This prevents the capture from being returned in matches, and also avoids"] - #[doc = " any resource usage associated with recording the capture. Currently, there"] - #[doc = " is no way to undo this."] + #[doc = " Disable a certain capture within a query.\n\n This prevents the capture from being returned in matches, and also avoids\n any resource usage associated with recording the capture. Currently, there\n is no way to undo this."] pub fn ts_query_disable_capture( arg1: *mut TSQuery, arg2: *const ::std::os::raw::c_char, @@ -725,33 +533,11 @@ extern "C" { ); } extern "C" { - #[doc = " Disable a certain pattern within a query."] - #[doc = ""] - #[doc = " This prevents the pattern from matching and removes most of the overhead"] - #[doc = " associated with the pattern. Currently, there is no way to undo this."] + #[doc = " Disable a certain pattern within a query.\n\n This prevents the pattern from matching and removes most of the overhead\n associated with the pattern. Currently, there is no way to undo this."] pub fn ts_query_disable_pattern(arg1: *mut TSQuery, arg2: u32); } extern "C" { - #[doc = " Create a new cursor for executing a given query."] - #[doc = ""] - #[doc = " The cursor stores the state that is needed to iteratively search"] - #[doc = " for matches. To use the query cursor, first call `ts_query_cursor_exec`"] - #[doc = " to start running a given query on a given syntax node. Then, there are"] - #[doc = " two options for consuming the results of the query:"] - #[doc = " 1. 
Repeatedly call `ts_query_cursor_next_match` to iterate over all of the"] - #[doc = " *matches* in the order that they were found. Each match contains the"] - #[doc = " index of the pattern that matched, and an array of captures. Because"] - #[doc = " multiple patterns can match the same set of nodes, one match may contain"] - #[doc = " captures that appear *before* some of the captures from a previous match."] - #[doc = " 2. Repeatedly call `ts_query_cursor_next_capture` to iterate over all of the"] - #[doc = " individual *captures* in the order that they appear. This is useful if"] - #[doc = " don't care about which pattern matched, and just want a single ordered"] - #[doc = " sequence of captures."] - #[doc = ""] - #[doc = " If you don't care about consuming all of the results, you can stop calling"] - #[doc = " `ts_query_cursor_next_match` or `ts_query_cursor_next_capture` at any point."] - #[doc = " You can then start executing another query on another node by calling"] - #[doc = " `ts_query_cursor_exec` again."] + #[doc = " Create a new cursor for executing a given query.\n\n The cursor stores the state that is needed to iteratively search\n for matches. To use the query cursor, first call `ts_query_cursor_exec`\n to start running a given query on a given syntax node. Then, there are\n two options for consuming the results of the query:\n 1. Repeatedly call `ts_query_cursor_next_match` to iterate over all of the\n *matches* in the order that they were found. Each match contains the\n index of the pattern that matched, and an array of captures. Because\n multiple patterns can match the same set of nodes, one match may contain\n captures that appear *before* some of the captures from a previous match.\n 2. Repeatedly call `ts_query_cursor_next_capture` to iterate over all of the\n individual *captures* in the order that they appear. 
This is useful if\n don't care about which pattern matched, and just want a single ordered\n sequence of captures.\n\n If you don't care about consuming all of the results, you can stop calling\n `ts_query_cursor_next_match` or `ts_query_cursor_next_capture` at any point.\n You can then start executing another query on another node by calling\n `ts_query_cursor_exec` again."] pub fn ts_query_cursor_new() -> *mut TSQueryCursor; } extern "C" { @@ -763,15 +549,7 @@ extern "C" { pub fn ts_query_cursor_exec(arg1: *mut TSQueryCursor, arg2: *const TSQuery, arg3: TSNode); } extern "C" { - #[doc = " Manage the maximum number of in-progress matches allowed by this query"] - #[doc = " cursor."] - #[doc = ""] - #[doc = " Query cursors have an optional maximum capacity for storing lists of"] - #[doc = " in-progress captures. If this capacity is exceeded, then the"] - #[doc = " earliest-starting match will silently be dropped to make room for further"] - #[doc = " matches. This maximum capacity is optional — by default, query cursors allow"] - #[doc = " any number of pending matches, dynamically allocating new space for them as"] - #[doc = " needed as the query is executed."] + #[doc = " Manage the maximum number of in-progress matches allowed by this query\n cursor.\n\n Query cursors have an optional maximum capacity for storing lists of\n in-progress captures. If this capacity is exceeded, then the\n earliest-starting match will silently be dropped to make room for further\n matches. 
This maximum capacity is optional — by default, query cursors allow\n any number of pending matches, dynamically allocating new space for them as\n needed as the query is executed."] pub fn ts_query_cursor_did_exceed_match_limit(arg1: *const TSQueryCursor) -> bool; } extern "C" { @@ -781,28 +559,21 @@ extern "C" { pub fn ts_query_cursor_set_match_limit(arg1: *mut TSQueryCursor, arg2: u32); } extern "C" { - #[doc = " Set the range of bytes or (row, column) positions in which the query"] - #[doc = " will be executed."] + #[doc = " Set the range of bytes or (row, column) positions in which the query\n will be executed."] pub fn ts_query_cursor_set_byte_range(arg1: *mut TSQueryCursor, arg2: u32, arg3: u32); } extern "C" { pub fn ts_query_cursor_set_point_range(arg1: *mut TSQueryCursor, arg2: TSPoint, arg3: TSPoint); } extern "C" { - #[doc = " Advance to the next match of the currently running query."] - #[doc = ""] - #[doc = " If there is a match, write it to `*match` and return `true`."] - #[doc = " Otherwise, return `false`."] + #[doc = " Advance to the next match of the currently running query.\n\n If there is a match, write it to `*match` and return `true`.\n Otherwise, return `false`."] pub fn ts_query_cursor_next_match(arg1: *mut TSQueryCursor, match_: *mut TSQueryMatch) -> bool; } extern "C" { pub fn ts_query_cursor_remove_match(arg1: *mut TSQueryCursor, id: u32); } extern "C" { - #[doc = " Advance to the next capture of the currently running query."] - #[doc = ""] - #[doc = " If there is a capture, write its match to `*match` and its index within"] - #[doc = " the matche's capture list to `*capture_index`. Otherwise, return `false`."] + #[doc = " Advance to the next capture of the currently running query.\n\n If there is a capture, write its match to `*match` and its index within\n the matche's capture list to `*capture_index`. 
Otherwise, return `false`."] pub fn ts_query_cursor_next_capture( arg1: *mut TSQueryCursor, match_: *mut TSQueryMatch, @@ -849,35 +620,15 @@ extern "C" { ) -> TSFieldId; } extern "C" { - #[doc = " Check whether the given node type id belongs to named nodes, anonymous nodes,"] - #[doc = " or a hidden nodes."] - #[doc = ""] - #[doc = " See also `ts_node_is_named`. Hidden nodes are never returned from the API."] + #[doc = " Check whether the given node type id belongs to named nodes, anonymous nodes,\n or a hidden nodes.\n\n See also `ts_node_is_named`. Hidden nodes are never returned from the API."] pub fn ts_language_symbol_type(arg1: *const TSLanguage, arg2: TSSymbol) -> TSSymbolType; } extern "C" { - #[doc = " Get the ABI version number for this language. This version number is used"] - #[doc = " to ensure that languages were generated by a compatible version of"] - #[doc = " Tree-sitter."] - #[doc = ""] - #[doc = " See also `ts_parser_set_language`."] + #[doc = " Get the ABI version number for this language. This version number is used\n to ensure that languages were generated by a compatible version of\n Tree-sitter.\n\n See also `ts_parser_set_language`."] pub fn ts_language_version(arg1: *const TSLanguage) -> u32; } extern "C" { - #[doc = " Set the allocation functions used by the library."] - #[doc = ""] - #[doc = " By default, Tree-sitter uses the standard libc allocation functions,"] - #[doc = " but aborts the process when an allocation fails. This function lets"] - #[doc = " you supply alternative allocation functions at runtime."] - #[doc = ""] - #[doc = " If you pass `NULL` for any parameter, Tree-sitter will switch back to"] - #[doc = " its default implementation of that function."] - #[doc = ""] - #[doc = " If you call this function after the library has already been used, then"] - #[doc = " you must ensure that either:"] - #[doc = " 1. All the existing objects have been freed."] - #[doc = " 2. 
The new allocator shares its state with the old one, so it is capable"] - #[doc = " of freeing memory that was allocated by the old allocator."] + #[doc = " Set the allocation functions used by the library.\n\n By default, Tree-sitter uses the standard libc allocation functions,\n but aborts the process when an allocation fails. This function lets\n you supply alternative allocation functions at runtime.\n\n If you pass `NULL` for any parameter, Tree-sitter will switch back to\n its default implementation of that function.\n\n If you call this function after the library has already been used, then\n you must ensure that either:\n 1. All the existing objects have been freed.\n 2. The new allocator shares its state with the old one, so it is capable\n of freeing memory that was allocated by the old allocator."] pub fn ts_set_allocator( new_malloc: ::std::option::Option< unsafe extern "C" fn(arg1: usize) -> *mut ::std::os::raw::c_void, diff --git a/script/generate-bindings b/script/generate-bindings index 54abac06..19975d37 100755 --- a/script/generate-bindings +++ b/script/generate-bindings @@ -5,8 +5,8 @@ header_path='lib/include/tree_sitter/api.h' bindgen \ --no-layout-tests \ - --whitelist-type '^TS.*' \ - --whitelist-function '^ts_.*' \ + --allowlist-type '^TS.*' \ + --allowlist-function '^ts_.*' \ --blocklist-type '^__.*' \ --size_t-is-usize \ $header_path > $output_path From 0376533c04e07784b69590daab5684ac51730c11 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 5 Apr 2023 20:41:47 +0300 Subject: [PATCH 077/347] cicd: add a test job with enabled UBSAN --- .github/workflows/build.yml | 31 +++++++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 27b31085..cf3628a1 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -169,3 +169,34 @@ jobs: lib/binding_web/tree-sitter.wasm if-no-files-found: error retention-days: 7 + + check_undefined_behaviour: 
+ name: Undefined behaviour checks + runs-on: ubuntu-latest + env: + TREE_SITTER: ${{ github.workspace }}/target/release/tree-sitter + steps: + - name: Checkout source code + uses: actions/checkout@v3 + + - name: Install UBSAN library + run: sudo apt-get install -y libubsan1 + + - name: Install Rust toolchain + uses: dtolnay/rust-toolchain@stable + + - name: Build CLI + run: cargo build --release + + - name: Fetch fixtures + run: script/fetch-fixtures + + - name: Generate fixtures + run: script/generate-fixtures + + - name: Run main tests with undefined behaviour sanitizer (UBSAN) + env: + UBSAN_OPTIONS: halt_on_error=1 + CFLAGS: -fsanitize=undefined + RUSTFLAGS: -lubsan + run: cargo test -- --test-threads 1 From 4c2a36302bec7495626250e3dd018252ec4309da Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 6 Apr 2023 03:59:55 +0300 Subject: [PATCH 078/347] lib: fix OOB in query engine reported in #2162 --- lib/src/query.c | 3 +++ 1 file changed, 3 insertions(+) diff --git a/lib/src/query.c b/lib/src/query.c index 18bd7fd3..da7a4166 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -938,6 +938,9 @@ static inline int analysis_state__compare( } static inline AnalysisStateEntry *analysis_state__top(AnalysisState *self) { + if (self->depth == 0) { + return &self->stack[0]; + } return &self->stack[self->depth - 1]; } From 0d326824d25912ab0fb558e54980554111f71e64 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 6 Apr 2023 01:49:50 +0300 Subject: [PATCH 079/347] test: add a reproducing test for #2162 --- cli/src/tests/github_issue_test.rs | 16 ++++++++++++++++ cli/src/tests/mod.rs | 1 + 2 files changed, 17 insertions(+) create mode 100644 cli/src/tests/github_issue_test.rs diff --git a/cli/src/tests/github_issue_test.rs b/cli/src/tests/github_issue_test.rs new file mode 100644 index 00000000..42fe3e9a --- /dev/null +++ b/cli/src/tests/github_issue_test.rs @@ -0,0 +1,16 @@ +// Tests in this mod need be executed with enabled UBSAN library: +// ``` +// 
UBSAN_OPTIONS="halt_on_error=1" \ +// CFLAGS="-fsanitize=undefined" \ +// RUSTFLAGS="-lubsan" \ +// cargo test --target $(rustc -vV | sed -nr 's/^host: //p') -- --test-threads 1 +// ``` + +use crate::tests::helpers::fixtures::get_language; +use tree_sitter::Query; + +#[test] +fn issue_2162_out_of_bound() { + let language = get_language("java"); + assert!(Query::new(language, "(package_declaration _ (_) @name _)").is_ok()); +} diff --git a/cli/src/tests/mod.rs b/cli/src/tests/mod.rs index 1b804450..03a588b9 100644 --- a/cli/src/tests/mod.rs +++ b/cli/src/tests/mod.rs @@ -1,4 +1,5 @@ mod corpus_test; +mod github_issue_test; mod helpers; mod highlight_test; mod node_test; From 52f22a65eb7153aca6563372425c4c79a84242b9 Mon Sep 17 00:00:00 2001 From: Christian Clason Date: Thu, 6 Apr 2023 14:24:19 +0200 Subject: [PATCH 080/347] cicd: build CLI for macos-arm64 --- .github/workflows/build.yml | 12 +++++++++--- cli/npm/install.js | 8 ++------ 2 files changed, 11 insertions(+), 9 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index cf3628a1..d4a68a06 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -6,6 +6,7 @@ env: CROSS_DEBUG: 1 on: + workflow_dispatch: workflow_call: inputs: ref: @@ -27,6 +28,7 @@ jobs: - { name: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } - { name: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } - { name: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } + - { name: macos-arm64 , target: aarch64-apple-darwin , os: macos-latest } env: BUILD_CMD: cargo @@ -125,30 +127,34 @@ jobs: run: make.sh CFLAGS="-Werror" -j - name: Build wasm library + if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Not used run: script/build-wasm - name: Build CLI run: $BUILD_CMD build --release --target=${{ matrix.job.target }} - name: Fetch fixtures + if: ${{ matrix.job.name != 'macos-arm64' }} # Not used run: script/fetch-fixtures - name: 
Generate fixtures + if: ${{ matrix.job.name != 'macos-arm64' }} # Can't run CLI on host run: script/generate-fixtures - name: Generate WASM fixtures - if: "!matrix.job.use-cross" + if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Not used run: script/generate-fixtures-wasm - name: Run main tests + if: ${{ matrix.job.name != 'macos-arm64' }} # Can't run CLI on host run: $BUILD_CMD test --target=${{ matrix.job.target }} - name: Run wasm tests - if: "!matrix.job.use-cross" # TODO: Install Emscripten into custom cross images + if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Not used run: script/test-wasm - name: Run benchmarks - if: "!matrix.job.use-cross" # It doesn't make sense to benchmark something in an emulator + if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Cross-compiled benchmarks make no sense run: $BUILD_CMD bench benchmark -p tree-sitter-cli --target=${{ matrix.job.target }} - name: Upload CLI artifact diff --git a/cli/npm/install.js b/cli/npm/install.js index 2790b47d..9e572c3a 100755 --- a/cli/npm/install.js +++ b/cli/npm/install.js @@ -16,14 +16,10 @@ const platformName = { let archName = { 'x64': 'x64', 'x86': 'x86', - 'ia32': 'x86' + 'ia32': 'x86', + 'arm64': 'arm64' }[process.arch]; -// ARM macs can run x64 binaries via Rosetta. Rely on that for now. 
-if (platformName === 'macos' && process.arch === 'arm64') { - archName = 'x64'; -} - if (!platformName || !archName) { console.error( `Cannot install tree-sitter-cli for platform ${process.platform}, architecture ${process.arch}` From 71f32a21664502ea08eb2e406c08680650dddba9 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 7 Apr 2023 10:22:51 +0300 Subject: [PATCH 081/347] cicd: additional tweaks --- .github/workflows/build.yml | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index d4a68a06..61543552 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -6,7 +6,6 @@ env: CROSS_DEBUG: 1 on: - workflow_dispatch: workflow_call: inputs: ref: @@ -27,8 +26,8 @@ jobs: - { name: linux-x86 , target: i686-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - { name: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } - { name: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } - - { name: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } - { name: macos-arm64 , target: aarch64-apple-darwin , os: macos-latest } + - { name: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } env: BUILD_CMD: cargo @@ -123,7 +122,7 @@ jobs: esac - name: Build C library - if: "!contains(matrix.job.os, 'windows')" # Requires an additional adapted Makefile for `cl.exe` compiler + if: ${{ !contains(matrix.job.os, 'windows') }} # Requires an additional adapted Makefile for `cl.exe` compiler run: make.sh CFLAGS="-Werror" -j - name: Build wasm library @@ -138,7 +137,7 @@ jobs: run: script/fetch-fixtures - name: Generate fixtures - if: ${{ matrix.job.name != 'macos-arm64' }} # Can't run CLI on host + if: ${{ matrix.job.name != 'macos-arm64' }} # Can't natively run CLI on runner's host run: script/generate-fixtures - name: Generate WASM fixtures @@ -146,7 +145,7 @@ jobs: run: script/generate-fixtures-wasm - name: Run main tests - 
if: ${{ matrix.job.name != 'macos-arm64' }} # Can't run CLI on host + if: ${{ matrix.job.name != 'macos-arm64' }} # Can't natively run CLI on runner's host run: $BUILD_CMD test --target=${{ matrix.job.target }} - name: Run wasm tests From 10178ade356f33f7603a217fe39680ae6c1c08ad Mon Sep 17 00:00:00 2001 From: Joel Spadin Date: Fri, 7 Apr 2023 12:57:50 -0500 Subject: [PATCH 082/347] fix: Use / paths when building WASM Changed the build-wasm command to always use forward slashes in paths, since using Windows style paths breaks if the build is run with Docker. Fixes #532 --- Cargo.lock | 7 +++++++ cli/Cargo.toml | 1 + cli/src/wasm.rs | 15 ++++++++++----- 3 files changed, 18 insertions(+), 5 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 52013e49..7c3fa7eb 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -440,6 +440,12 @@ dependencies = [ "winapi", ] +[[package]] +name = "path-slash" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1e91099d4268b0e11973f036e885d652fb0b21fedcf69738c627f94db6a44f42" + [[package]] name = "percent-encoding" version = "2.2.0" @@ -774,6 +780,7 @@ dependencies = [ "indexmap", "lazy_static", "log", + "path-slash", "pretty_assertions", "rand", "regex", diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 48473095..ee6d52af 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -30,6 +30,7 @@ glob = "0.3.0" html-escape = "0.2.6" indexmap = "1" lazy_static = "1.2.0" +path-slash = "0.2.1" regex = "1" regex-syntax = "0.6.4" rustc-hash = "1" diff --git a/cli/src/wasm.rs b/cli/src/wasm.rs index 467fef71..35f09b55 100644 --- a/cli/src/wasm.rs +++ b/cli/src/wasm.rs @@ -1,5 +1,6 @@ use super::generate::parse_grammar::GrammarJSON; use anyhow::{anyhow, Context, Result}; +use path_slash::PathExt as _; use std::ffi::{OsStr, OsString}; use std::fs; use std::path::Path; @@ -41,7 +42,7 @@ pub fn compile_language_to_wasm(language_dir: &Path, force_docker: bool) -> Resu volume_string = OsString::from(parent); 
volume_string.push(":/src:Z"); command.arg("--workdir"); - command.arg(&Path::new("/src").join(filename)); + command.arg(Path::new("/src").join(filename).to_slash_lossy().as_ref()); } else { volume_string = OsString::from(language_dir); volume_string.push(":/src:Z"); @@ -103,14 +104,18 @@ pub fn compile_language_to_wasm(language_dir: &Path, force_docker: bool) -> Resu let scanner_cpp_path = src.join("scanner.cpp"); if language_dir.join(&scanner_cc_path).exists() { - command.arg("-xc++").arg(&scanner_cc_path); + command + .arg("-xc++") + .arg(scanner_cc_path.to_slash_lossy().as_ref()); } else if language_dir.join(&scanner_cpp_path).exists() { - command.arg("-xc++").arg(&scanner_cpp_path); + command + .arg("-xc++") + .arg(scanner_cpp_path.to_slash_lossy().as_ref()); } else if language_dir.join(&scanner_c_path).exists() { - command.arg(&scanner_c_path); + command.arg(scanner_c_path.to_slash_lossy().as_ref()); } - command.arg(&parser_c_path); + command.arg(parser_c_path.to_slash_lossy().as_ref()); let output = command .output() From bb122d6d4788205f72ad3acaa95157dc63d15f4b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 8 Apr 2023 01:47:57 +0300 Subject: [PATCH 083/347] cicd: separate sanitize workflow + manual trigger for build workflow --- .github/workflows/CICD.yml | 7 +++++- .github/workflows/build.yml | 32 +-------------------------- .github/workflows/sanitize.yml | 40 ++++++++++++++++++++++++++++++++++ 3 files changed, 47 insertions(+), 32 deletions(-) create mode 100644 .github/workflows/sanitize.yml diff --git a/.github/workflows/CICD.yml b/.github/workflows/CICD.yml index 7c2351a8..e675781f 100644 --- a/.github/workflows/CICD.yml +++ b/.github/workflows/CICD.yml @@ -46,6 +46,11 @@ jobs: with: package: tree-sitter-cli + sanitize: + name: Sanitize + needs: [init, fast_checks] + uses: ./.github/workflows/sanitize.yml + build: name: Build & Test needs: [init, fast_checks] @@ -55,7 +60,7 @@ jobs: release: name: Release - needs: [init, fast_checks, 
full_checks, min_version, build] + needs: [init, fast_checks, full_checks, min_version, build, sanitize] if: > github.event.pull_request.head.repo.full_name == github.repository && startsWith(github.head_ref, 'release/v') diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 61543552..6cfa0d48 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -6,6 +6,7 @@ env: CROSS_DEBUG: 1 on: + workflow_dispatch: workflow_call: inputs: ref: @@ -174,34 +175,3 @@ jobs: lib/binding_web/tree-sitter.wasm if-no-files-found: error retention-days: 7 - - check_undefined_behaviour: - name: Undefined behaviour checks - runs-on: ubuntu-latest - env: - TREE_SITTER: ${{ github.workspace }}/target/release/tree-sitter - steps: - - name: Checkout source code - uses: actions/checkout@v3 - - - name: Install UBSAN library - run: sudo apt-get install -y libubsan1 - - - name: Install Rust toolchain - uses: dtolnay/rust-toolchain@stable - - - name: Build CLI - run: cargo build --release - - - name: Fetch fixtures - run: script/fetch-fixtures - - - name: Generate fixtures - run: script/generate-fixtures - - - name: Run main tests with undefined behaviour sanitizer (UBSAN) - env: - UBSAN_OPTIONS: halt_on_error=1 - CFLAGS: -fsanitize=undefined - RUSTFLAGS: -lubsan - run: cargo test -- --test-threads 1 diff --git a/.github/workflows/sanitize.yml b/.github/workflows/sanitize.yml new file mode 100644 index 00000000..ebfb477c --- /dev/null +++ b/.github/workflows/sanitize.yml @@ -0,0 +1,40 @@ +name: Sunitize + +env: + CARGO_TERM_COLOR: always + RUSTFLAGS: "-D warnings" + +on: + workflow_call: + +jobs: + check_undefined_behaviour: + name: Undefined behaviour checks + runs-on: ubuntu-latest + env: + TREE_SITTER: ${{ github.workspace }}/target/release/tree-sitter + steps: + - name: Checkout source code + uses: actions/checkout@v3 + + - name: Install UBSAN library + run: sudo apt-get install -y libubsan1 + + - name: Install Rust toolchain + uses: 
dtolnay/rust-toolchain@stable + + - name: Build CLI + run: cargo build --release + + - name: Fetch fixtures + run: script/fetch-fixtures + + - name: Generate fixtures + run: script/generate-fixtures + + - name: Run main tests with undefined behaviour sanitizer (UBSAN) + env: + UBSAN_OPTIONS: halt_on_error=1 + CFLAGS: -fsanitize=undefined + RUSTFLAGS: -lubsan + run: cargo test -- --test-threads 1 From 96086806d56404e65e82fc17a144506e98d30e43 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 8 Apr 2023 05:14:12 +0300 Subject: [PATCH 084/347] cicd: change author configuring for a tag --- .github/workflows/release.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 87a06761..979d95a3 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -78,8 +78,8 @@ jobs: tag: ${{ steps.tag_name.outputs.tag }} message: "Release ${{ steps.tag_name.outputs.tag }}" run: | - git config user.name "${GITHUB_ACTOR}" - git config user.email "${GITHUB_ACTOR}@users.noreply.github.com" + git config user.name "$(git log -1 --pretty='%cn')" + git config user.email "$(git log -1 --pretty='%ce')" git tag -a "$tag" HEAD -m "$message" git push origin "$tag" From f03f024ec45c092f4a314565d65f641b5f13741c Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 8 Apr 2023 07:35:34 +0300 Subject: [PATCH 085/347] cicd: change approach for matrix shaping with an anchor name plus extras --- .github/workflows/build.yml | 112 ++++++++++++++++++++---------------- 1 file changed, 61 insertions(+), 51 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 6cfa0d48..2df9bc27 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -15,20 +15,39 @@ on: jobs: build: - name: ${{ matrix.job.name }} (${{ matrix.job.target }}) (${{ matrix.job.os }}) - runs-on: ${{ matrix.job.os }} + name: ${{ matrix.name }} (${{ matrix.target }}) (${{ 
matrix.os }}) + runs-on: ${{ matrix.os }} strategy: fail-fast: false matrix: - job: - - { name: linux-aarch64 , target: aarch64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { name: linux-arm , target: arm-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } - - { name: linux-x64 , target: x86_64-unknown-linux-gnu , os: ubuntu-latest } - - { name: linux-x86 , target: i686-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { name: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } - - { name: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } - - { name: macos-arm64 , target: aarch64-apple-darwin , os: macos-latest } - - { name: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } + name: + - linux-aarch64 # + - linux-arm # + - linux-x64 # + - linux-x86 # + - windows-x64 # <-- No C library build - requires an additional adapted Makefile for `cl.exe` compiler + - windows-x86 # -- // -- + - macos-arm64 # <-- MacOS M1/M2 - no tests, only CLI build to be published on release artifacts + - macos-x64 # + + include: + - { name: linux-aarch64 , target: aarch64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { name: linux-arm , target: arm-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } + - { name: linux-x64 , target: x86_64-unknown-linux-gnu , os: ubuntu-latest } + - { name: linux-x86 , target: i686-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { name: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } + - { name: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } + - { name: macos-arm64 , target: aarch64-apple-darwin , os: macos-latest } + - { name: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } + + # Cross compilers for C library + - { name: linux-aarch64 , cc: aarch64-linux-gnu-gcc , ar: aarch64-linux-gnu-ar } + - { name: linux-arm , cc: arm-unknown-linux-gnueabihf-gcc , ar: 
arm-unknown-linux-gnueabihf-gcc-ar } + - { name: linux-x86 , cc: i686-linux-gnu-gcc , ar: i686-linux-gnu-ar } + + # See #2041 tree-sitter issue + - { name: windows-x64 , rust_test_threads: 1 } + - { name: windows-x86 , rust_test_threads: 1 } env: BUILD_CMD: cargo @@ -55,20 +74,20 @@ jobs: - name: Install Rust toolchain uses: dtolnay/rust-toolchain@stable with: - targets: ${{ matrix.job.target }} + targets: ${{ matrix.target }} - name: Install cross - if: matrix.job.use-cross + if: matrix.use-cross uses: taiki-e/install-action@v2 with: tool: cross - name: Build custom cross image - if: ${{ matrix.job.use-cross && matrix.job.os == 'ubuntu-latest' }} + if: ${{ matrix.use-cross && matrix.os == 'ubuntu-latest' }} run: | cd .. - target="${{ matrix.job.target }}" + target="${{ matrix.target }}" image=ghcr.io/cross-rs/$target:custom echo "CROSS_IMAGE=$image" >> $GITHUB_ENV @@ -85,88 +104,79 @@ jobs: cd - - - name: Setup extra env + - name: Setup env extras + env: + RUST_TEST_THREADS: ${{ matrix.rust_test_threads }} + USE_CROSS: ${{ matrix.use-cross }} + CC: ${{ matrix.cc }} + AR: ${{ matrix.ar }} run: | PATH="$PWD/.github/scripts:$PATH" echo "PATH=$PATH" >> $GITHUB_ENV echo "ROOT=$PWD" >> $GITHUB_ENV echo "TREE_SITTER=tree-sitter.sh" >> $GITHUB_ENV - export TARGET=${{ matrix.job.target }} + export TARGET=${{ matrix.target }} echo "TARGET=$TARGET" >> $GITHUB_ENV - USE_CROSS="${{ matrix.job.use-cross }}" + [ -n "$RUST_TEST_THREADS" ] && \ + echo "RUST_TEST_THREADS=$RUST_TEST_THREADS" >> $GITHUB_ENV + + [ -n "$CC" ] && echo "CC=$CC" >> $GITHUB_ENV + [ -n "$AR" ] && echo "AR=$AR" >> $GITHUB_ENV if [ "$USE_CROSS" == "true" ]; then echo "BUILD_CMD=cross" >> $GITHUB_ENV - - export CROSS=1; echo "CROSS=$CROSS" >> $GITHUB_ENV - + export CROSS=1; echo "CROSS=1" >> $GITHUB_ENV runner=$(cross.sh bash -c "env | sed -nr '/^CARGO_TARGET_.*_RUNNER=/s///p'") [ -n "$runner" ] && echo "CROSS_RUNNER=$runner" >> $GITHUB_ENV - echo "runner: $runner" - - case "$TARGET" in - 
i686-unknown-linux-gnu) CC=i686-linux-gnu-gcc AR=i686-linux-gnu-ar ;; - aarch64-unknown-linux-gnu) CC=aarch64-linux-gnu-gcc AR=aarch64-linux-gnu-ar ;; - arm-unknown-linux-gnueabihf) CC=arm-unknown-linux-gnueabihf-gcc AR=arm-unknown-linux-gnueabihf-gcc-ar ;; - esac - - [ -n "$CC" ] && echo "CC=$CC" >> $GITHUB_ENV - [ -n "$AR" ] && echo "AR=$AR" >> $GITHUB_ENV fi - case "$TARGET" in - *-windows-*) - echo "RUST_TEST_THREADS=1" >> $GITHUB_ENV # See #2041 tree-sitter issue - ;; - esac - - name: Build C library - if: ${{ !contains(matrix.job.os, 'windows') }} # Requires an additional adapted Makefile for `cl.exe` compiler + if: ${{ !contains(matrix.os, 'windows') }} # Requires an additional adapted Makefile for `cl.exe` compiler run: make.sh CFLAGS="-Werror" -j - name: Build wasm library - if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Not used + if: ${{ !matrix.use-cross && matrix.name != 'macos-arm64' }} # Not used run: script/build-wasm - name: Build CLI - run: $BUILD_CMD build --release --target=${{ matrix.job.target }} + run: $BUILD_CMD build --release --target=${{ matrix.target }} - name: Fetch fixtures - if: ${{ matrix.job.name != 'macos-arm64' }} # Not used + if: ${{ matrix.name != 'macos-arm64' }} # Not used run: script/fetch-fixtures - name: Generate fixtures - if: ${{ matrix.job.name != 'macos-arm64' }} # Can't natively run CLI on runner's host + if: ${{ matrix.name != 'macos-arm64' }} # Can't natively run CLI on runner's host run: script/generate-fixtures - name: Generate WASM fixtures - if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Not used + if: ${{ !matrix.use-cross && matrix.name != 'macos-arm64' }} # Not used run: script/generate-fixtures-wasm - name: Run main tests - if: ${{ matrix.job.name != 'macos-arm64' }} # Can't natively run CLI on runner's host - run: $BUILD_CMD test --target=${{ matrix.job.target }} + if: ${{ matrix.name != 'macos-arm64' }} # Can't natively run CLI on runner's host + run: 
$BUILD_CMD test --target=${{ matrix.target }} - name: Run wasm tests - if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Not used + if: ${{ !matrix.use-cross && matrix.name != 'macos-arm64' }} # Not used run: script/test-wasm - name: Run benchmarks - if: ${{ !matrix.job.use-cross && matrix.job.name != 'macos-arm64' }} # Cross-compiled benchmarks make no sense - run: $BUILD_CMD bench benchmark -p tree-sitter-cli --target=${{ matrix.job.target }} + if: ${{ !matrix.use-cross && matrix.name != 'macos-arm64' }} # Cross-compiled benchmarks make no sense + run: $BUILD_CMD bench benchmark -p tree-sitter-cli --target=${{ matrix.target }} - name: Upload CLI artifact uses: actions/upload-artifact@v3 with: - name: tree-sitter.${{ matrix.job.name }} - path: target/${{ matrix.job.target }}/release/tree-sitter${{ contains(matrix.job.target, 'windows') && '.exe' || '' }} + name: tree-sitter.${{ matrix.name }} + path: target/${{ matrix.target }}/release/tree-sitter${{ contains(matrix.target, 'windows') && '.exe' || '' }} if-no-files-found: error retention-days: 7 - name: Upload WASM artifacts - if: ${{ matrix.job.name == 'linux-x64' }} + if: ${{ matrix.name == 'linux-x64' }} uses: actions/upload-artifact@v3 with: name: tree-sitter.wasm From d8caf6f8c530bef60f5ee419e0f4e96cb8452c63 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 8 Apr 2023 08:42:17 +0300 Subject: [PATCH 086/347] chore(cicd): change formatting --- .github/workflows/build.yml | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 2df9bc27..b5c7ab60 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -89,15 +89,15 @@ jobs: target="${{ matrix.target }}" image=ghcr.io/cross-rs/$target:custom - echo "CROSS_IMAGE=$image" >> $GITHUB_ENV + echo "CROSS_IMAGE=$image" >> $GITHUB_ENV - echo "[target.$target]" >> Cross.toml - echo "image = \"$image\"" >> Cross.toml - echo 
"CROSS_CONFIG=$PWD/Cross.toml" >> $GITHUB_ENV + echo "[target.$target]" >> Cross.toml + echo "image = \"$image\"" >> Cross.toml + echo "CROSS_CONFIG=$PWD/Cross.toml" >> $GITHUB_ENV - echo "FROM ghcr.io/cross-rs/$target:edge" >> Dockerfile - echo "ENV DEBIAN_FRONTEND=noninteractive" >> Dockerfile - echo "RUN apt-get update && apt-get install -y nodejs" >> Dockerfile + echo "FROM ghcr.io/cross-rs/$target:edge" >> Dockerfile + echo "ENV DEBIAN_FRONTEND=noninteractive" >> Dockerfile + echo "RUN apt-get update && apt-get install -y nodejs" >> Dockerfile docker build -t $image . docker images docker run --rm $image env From 34e0ab696ce156843a76ab7f52b83ad2007dfe75 Mon Sep 17 00:00:00 2001 From: Carlo Teubner <435950+c4rlo@users.noreply.github.com> Date: Sat, 8 Apr 2023 18:10:44 +0100 Subject: [PATCH 087/347] docs: remove mention of Atom Atom is dead, so this mention seems unnecessary now. --- docs/section-4-syntax-highlighting.md | 2 -- 1 file changed, 2 deletions(-) diff --git a/docs/section-4-syntax-highlighting.md b/docs/section-4-syntax-highlighting.md index a6e5d74c..0cf7890f 100644 --- a/docs/section-4-syntax-highlighting.md +++ b/docs/section-4-syntax-highlighting.md @@ -9,8 +9,6 @@ Syntax highlighting is a very common feature in applications that deal with code This document explains how the Tree-sitter syntax highlighting system works, using the command line interface. If you are using `tree-sitter-highlight` library (either from C or from Rust), all of these concepts are still applicable, but the configuration data is provided using in-memory objects, rather than files. -**Note - If you are working on syntax highlighting in the [Atom](https://atom.io/) text editor, you should consult [the grammar-creation page](https://flight-manual.atom.io/hacking-atom/sections/creating-a-grammar/) of the Atom Flight Manual, *not* this document. 
Atom currently uses a different syntax highlighting system that is also based on Tree-sitter, but is older than the one described here.** - ## Overview All of the files needed to highlight a given language are normally included in the same git repository as the Tree-sitter grammar for that language (for example, [`tree-sitter-javascript`](https://github.com/tree-sitter/tree-sitter-javascript), [`tree-sitter-ruby`](https://github.com/tree-sitter/tree-sitter-ruby)). In order to run syntax highlighting from the command-line, three types of files are needed: From e3ea048db1cfd184594c92e5cd9869462e164ea2 Mon Sep 17 00:00:00 2001 From: Kait Lam Date: Tue, 21 Mar 2023 15:36:09 +1000 Subject: [PATCH 088/347] docs: alphabetise language bindings on front page This helps with readability when scanning for a particular language. It is, strangely, almost sorted with the exception of Java and Kotlin. --- docs/index.md | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/docs/index.md b/docs/index.md index 8c3f9e52..9fb1fd2a 100644 --- a/docs/index.md +++ b/docs/index.md @@ -17,8 +17,10 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [Go](https://github.com/smacker/go-tree-sitter) * [Haskell](https://github.com/tree-sitter/haskell-tree-sitter) +* [Java](https://github.com/serenadeai/java-tree-sitter) * [JavaScript (Node.js)](https://github.com/tree-sitter/node-tree-sitter) * [JavaScript (Wasm)](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_web) +* [Kotlin](https://github.com/oxisto/kotlintree) * [Lua](https://github.com/euclidianAce/ltreesitter) * [OCaml](https://github.com/returntocorp/ocaml-tree-sitter-core) * [Perl](https://metacpan.org/pod/Text::Treesitter) @@ -27,8 +29,6 @@ There are currently bindings that allow Tree-sitter to be used from the followin * [Ruby](https://github.com/calicoday/ruby-tree-sitter-ffi) * [Rust](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_rust) * 
[Swift](https://github.com/ChimeHQ/SwiftTreeSitter) -* [Kotlin](https://github.com/oxisto/kotlintree) -* [Java](https://github.com/serenadeai/java-tree-sitter) By convention, bindings are named with the language first, eg. ruby-tree-sitter. From ae738c3c0f02557960c9c45b3bbac6f8ccb292f3 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 24 Jan 2023 14:25:29 +0200 Subject: [PATCH 089/347] fix(dsl): add support for rule refs to externals --- cli/npm/dsl.d.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/npm/dsl.d.ts b/cli/npm/dsl.d.ts index fdf43b55..316400f8 100644 --- a/cli/npm/dsl.d.ts +++ b/cli/npm/dsl.d.ts @@ -102,7 +102,7 @@ interface Grammar< externals?: ( $: Record>, previous: Rule[], - ) => SymbolRule[]; + ) => (SymbolRule | RegExp | string)[]; /** * An array of tokens that may appear anywhere in the language. This From 8c6d157ca571460bef2220512e9721e65261a12f Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 11 Mar 2023 11:08:38 +0200 Subject: [PATCH 090/347] fix(dsl): fix formatting --- cli/npm/dsl.d.ts | 40 ++++++++++++++++++++-------------------- 1 file changed, 20 insertions(+), 20 deletions(-) diff --git a/cli/npm/dsl.d.ts b/cli/npm/dsl.d.ts index 316400f8..78b654f3 100644 --- a/cli/npm/dsl.d.ts +++ b/cli/npm/dsl.d.ts @@ -1,19 +1,19 @@ -type AliasRule = {type: 'ALIAS'; named: boolean; content: Rule; value: string}; -type BlankRule = {type: 'BLANK'}; -type ChoiceRule = {type: 'CHOICE'; members: Rule[]}; -type FieldRule = {type: 'FIELD'; name: string; content: Rule}; -type ImmediateTokenRule = {type: 'IMMEDIATE_TOKEN'; content: Rule}; -type PatternRule = {type: 'PATTERN'; value: string}; -type PrecDynamicRule = {type: 'PREC_DYNAMIC'; content: Rule; value: number}; -type PrecLeftRule = {type: 'PREC_LEFT'; content: Rule; value: number}; -type PrecRightRule = {type: 'PREC_RIGHT'; content: Rule; value: number}; -type PrecRule = {type: 'PREC'; content: Rule; value: number}; -type Repeat1Rule = {type: 'REPEAT1'; content: 
Rule}; -type RepeatRule = {type: 'REPEAT'; content: Rule}; -type SeqRule = {type: 'SEQ'; members: Rule[]}; -type StringRule = {type: 'STRING'; value: string}; -type SymbolRule = {type: 'SYMBOL'; name: Name}; -type TokenRule = {type: 'TOKEN'; content: Rule}; +type AliasRule = { type: 'ALIAS'; named: boolean; content: Rule; value: string }; +type BlankRule = { type: 'BLANK' }; +type ChoiceRule = { type: 'CHOICE'; members: Rule[] }; +type FieldRule = { type: 'FIELD'; name: string; content: Rule }; +type ImmediateTokenRule = { type: 'IMMEDIATE_TOKEN'; content: Rule }; +type PatternRule = { type: 'PATTERN'; value: string }; +type PrecDynamicRule = { type: 'PREC_DYNAMIC'; content: Rule; value: number }; +type PrecLeftRule = { type: 'PREC_LEFT'; content: Rule; value: number }; +type PrecRightRule = { type: 'PREC_RIGHT'; content: Rule; value: number }; +type PrecRule = { type: 'PREC'; content: Rule; value: number }; +type Repeat1Rule = { type: 'REPEAT1'; content: Rule }; +type RepeatRule = { type: 'REPEAT'; content: Rule }; +type SeqRule = { type: 'SEQ'; members: Rule[] }; +type StringRule = { type: 'STRING'; value: string }; +type SymbolRule = { type: 'SYMBOL'; name: Name }; +type TokenRule = { type: 'TOKEN'; content: Rule }; type Rule = | AliasRule @@ -48,8 +48,8 @@ type RuleBuilders< RuleName extends string, BaseGrammarRuleName extends string > = { - [name in RuleName]: RuleBuilder; -}; + [name in RuleName]: RuleBuilder; + }; interface Grammar< RuleName extends string, @@ -153,8 +153,8 @@ interface Grammar< type GrammarSchema = { [K in keyof Grammar]: K extends 'rules' - ? Record - : Grammar[K]; + ? 
Record + : Grammar[K]; }; /** From 1f051d339c2639aa6c062bfc504034d427b71a90 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 9 Apr 2023 20:40:18 +0300 Subject: [PATCH 091/347] chore(docs): fix misprint repetitions and remove dangling spaces --- docs/section-3-creating-parsers.md | 2 +- docs/section-5-implementation.md | 2 +- lib/binding_web/README.md | 16 ++++++++-------- 3 files changed, 10 insertions(+), 10 deletions(-) diff --git a/docs/section-3-creating-parsers.md b/docs/section-3-creating-parsers.md index 0842edbb..842b87eb 100644 --- a/docs/section-3-creating-parsers.md +++ b/docs/section-3-creating-parsers.md @@ -46,7 +46,7 @@ npm install --save nan npm install --save-dev tree-sitter-cli ``` -The last command will install the CLI into the `node_modules` folder in your working directory. An executable program called `tree-sitter` will be created inside of `node_modules/.bin/`. You may want to follow the Node.js convention of adding that folder to your your `PATH` so that you can easily run this program when working in this directory. +The last command will install the CLI into the `node_modules` folder in your working directory. An executable program called `tree-sitter` will be created inside of `node_modules/.bin/`. You may want to follow the Node.js convention of adding that folder to your `PATH` so that you can easily run this program when working in this directory. ```sh # In your shell profile script diff --git a/docs/section-5-implementation.md b/docs/section-5-implementation.md index e0fa9661..4f97d760 100644 --- a/docs/section-5-implementation.md +++ b/docs/section-5-implementation.md @@ -21,7 +21,7 @@ The `tree-sitter` CLI's most important feature is the `generate` subcommand. Thi ### Parsing a Grammar -First, Tree-sitter must must evaluate the JavaScript code in `grammar.js` and convert the grammar to a JSON format. It does this by shelling out to `node`. 
The format of the grammars is formally specified by the JSON schema in [grammar-schema.json](https://github.com/tree-sitter/tree-sitter/blob/master/cli/src/generate/grammar-schema.json). The parsing is implemented in [parse_grammar.rs](https://github.com/tree-sitter/tree-sitter/blob/master/cli/src/generate/parse_grammar.rs). +First, Tree-sitter must evaluate the JavaScript code in `grammar.js` and convert the grammar to a JSON format. It does this by shelling out to `node`. The format of the grammars is formally specified by the JSON schema in [grammar-schema.json](https://github.com/tree-sitter/tree-sitter/blob/master/cli/src/generate/grammar-schema.json). The parsing is implemented in [parse_grammar.rs](https://github.com/tree-sitter/tree-sitter/blob/master/cli/src/generate/parse_grammar.rs). ### Grammar Rules diff --git a/lib/binding_web/README.md b/lib/binding_web/README.md index a75cd9f0..1d645a33 100644 --- a/lib/binding_web/README.md +++ b/lib/binding_web/README.md @@ -5,7 +5,7 @@ WebAssembly bindings to the [Tree-sitter](https://github.com/tree-sitter/tree-si ### Setup -You can download the the `tree-sitter.js` and `tree-sitter.wasm` files from [the latest GitHub release](https://github.com/tree-sitter/tree-sitter/releases/latest) and load them using a standalone script: +You can download the `tree-sitter.js` and `tree-sitter.wasm` files from [the latest GitHub release](https://github.com/tree-sitter/tree-sitter/releases/latest) and load them using a standalone script: ```html "); @@ -512,20 +514,22 @@ fn test_highlighting_via_c_api() { let highlights_query = fs::read_to_string(queries.join("highlights.scm")).unwrap(); let injections_query = fs::read_to_string(queries.join("injections.scm")).unwrap(); let locals_query = fs::read_to_string(queries.join("locals.scm")).unwrap(); - c::ts_highlighter_add_language( - highlighter, - lang_name.as_ptr(), - js_scope.as_ptr(), - js_injection_regex.as_ptr(), - language, - highlights_query.as_ptr() as *const c_char, - 
injections_query.as_ptr() as *const c_char, - locals_query.as_ptr() as *const c_char, - highlights_query.len() as u32, - injections_query.len() as u32, - locals_query.len() as u32, - false, - ); + unsafe { + c::ts_highlighter_add_language( + highlighter, + lang_name.as_ptr(), + js_scope.as_ptr(), + js_injection_regex.as_ptr(), + language, + highlights_query.as_ptr() as *const c_char, + injections_query.as_ptr() as *const c_char, + locals_query.as_ptr() as *const c_char, + highlights_query.len() as u32, + injections_query.len() as u32, + locals_query.len() as u32, + false, + ); + } let html_scope = c_string("text.html.basic"); let html_injection_regex = c_string("^html"); @@ -534,31 +538,35 @@ fn test_highlighting_via_c_api() { let queries = get_language_queries_path("html"); let highlights_query = fs::read_to_string(queries.join("highlights.scm")).unwrap(); let injections_query = fs::read_to_string(queries.join("injections.scm")).unwrap(); - c::ts_highlighter_add_language( - highlighter, - lang_name.as_ptr(), - html_scope.as_ptr(), - html_injection_regex.as_ptr(), - language, - highlights_query.as_ptr() as *const c_char, - injections_query.as_ptr() as *const c_char, - ptr::null(), - highlights_query.len() as u32, - injections_query.len() as u32, - 0, - false, - ); + unsafe { + c::ts_highlighter_add_language( + highlighter, + lang_name.as_ptr(), + html_scope.as_ptr(), + html_injection_regex.as_ptr(), + language, + highlights_query.as_ptr() as *const c_char, + injections_query.as_ptr() as *const c_char, + ptr::null(), + highlights_query.len() as u32, + injections_query.len() as u32, + 0, + false, + ); + } let buffer = c::ts_highlight_buffer_new(); - c::ts_highlighter_highlight( - highlighter, - html_scope.as_ptr(), - source_code.as_ptr(), - source_code.as_bytes().len() as u32, - buffer, - ptr::null_mut(), - ); + unsafe { + c::ts_highlighter_highlight( + highlighter, + html_scope.as_ptr(), + source_code.as_ptr(), + source_code.as_bytes().len() as u32, + buffer, + 
ptr::null_mut(), + ); + } let output_bytes = c::ts_highlight_buffer_content(buffer); let output_line_offsets = c::ts_highlight_buffer_line_offsets(buffer); @@ -589,8 +597,10 @@ fn test_highlighting_via_c_api() { ] ); - c::ts_highlighter_delete(highlighter); - c::ts_highlight_buffer_delete(buffer); + unsafe { + c::ts_highlighter_delete(highlighter); + c::ts_highlight_buffer_delete(buffer); + } } #[test] diff --git a/cli/src/tests/tags_test.rs b/cli/src/tests/tags_test.rs index 07e5d1de..20392749 100644 --- a/cli/src/tests/tags_test.rs +++ b/cli/src/tests/tags_test.rs @@ -9,7 +9,7 @@ use std::{ use tree_sitter::Point; use tree_sitter_tags::{c_lib as c, Error, TagsConfiguration, TagsContext}; -const PYTHON_TAG_QUERY: &'static str = r#" +const PYTHON_TAG_QUERY: &str = r#" ( (function_definition name: (identifier) @name @@ -39,7 +39,7 @@ const PYTHON_TAG_QUERY: &'static str = r#" attribute: (identifier) @name)) @reference.call "#; -const JS_TAG_QUERY: &'static str = r#" +const JS_TAG_QUERY: &str = r#" ( (comment)* @doc . 
(class_declaration @@ -68,7 +68,7 @@ const JS_TAG_QUERY: &'static str = r#" function: (identifier) @name) @reference.call "#; -const RUBY_TAG_QUERY: &'static str = r#" +const RUBY_TAG_QUERY: &str = r#" (method name: (_) @name) @definition.method @@ -359,25 +359,29 @@ fn test_tags_via_c_api() { ); let c_scope_name = CString::new(scope_name).unwrap(); - let result = c::ts_tagger_add_language( - tagger, - c_scope_name.as_ptr(), - language, - JS_TAG_QUERY.as_ptr(), - ptr::null(), - JS_TAG_QUERY.len() as u32, - 0, - ); + let result = unsafe { + c::ts_tagger_add_language( + tagger, + c_scope_name.as_ptr(), + language, + JS_TAG_QUERY.as_ptr(), + ptr::null(), + JS_TAG_QUERY.len() as u32, + 0, + ) + }; assert_eq!(result, c::TSTagsError::Ok); - let result = c::ts_tagger_tag( - tagger, - c_scope_name.as_ptr(), - source_code.as_ptr(), - source_code.len() as u32, - buffer, - ptr::null(), - ); + let result = unsafe { + c::ts_tagger_tag( + tagger, + c_scope_name.as_ptr(), + source_code.as_ptr(), + source_code.len() as u32, + buffer, + ptr::null(), + ) + }; assert_eq!(result, c::TSTagsError::Ok); let tags = unsafe { slice::from_raw_parts( @@ -419,8 +423,10 @@ fn test_tags_via_c_api() { ] ); - c::ts_tags_buffer_delete(buffer); - c::ts_tagger_delete(tagger); + unsafe { + c::ts_tags_buffer_delete(buffer); + c::ts_tagger_delete(tagger); + } }); } diff --git a/highlight/src/c_lib.rs b/highlight/src/c_lib.rs index 33197088..78cdd8c2 100644 --- a/highlight/src/c_lib.rs +++ b/highlight/src/c_lib.rs @@ -32,8 +32,14 @@ pub enum ErrorCode { InvalidLanguageName, } +/// Create a new [`TSHighlighter`] instance. +/// +/// # Safety +/// +/// The caller must ensure that the `highlight_names` and `attribute_strings` arrays are valid for +/// the lifetime of the returned [`TSHighlighter`] instance, and are non-null. 
#[no_mangle] -pub extern "C" fn ts_highlighter_new( +pub unsafe extern "C" fn ts_highlighter_new( highlight_names: *const *const c_char, attribute_strings: *const *const c_char, highlight_count: u32, @@ -43,11 +49,11 @@ pub extern "C" fn ts_highlighter_new( let attribute_strings = unsafe { slice::from_raw_parts(attribute_strings, highlight_count as usize) }; let highlight_names = highlight_names - .into_iter() + .iter() .map(|s| unsafe { CStr::from_ptr(*s).to_string_lossy().to_string() }) .collect::>(); let attribute_strings = attribute_strings - .into_iter() + .iter() .map(|s| unsafe { CStr::from_ptr(*s).to_bytes() }) .collect(); let carriage_return_index = highlight_names.iter().position(|s| s == "carriage-return"); @@ -59,8 +65,14 @@ pub extern "C" fn ts_highlighter_new( })) } +/// Add a language to a [`TSHighlighter`] instance. +/// +/// # Safety +/// +/// The caller must ensure that any `*const c_char` parameters are valid for the lifetime of +/// the [`TSHighlighter`] instance, and are non-null. #[no_mangle] -pub extern "C" fn ts_highlighter_add_language( +pub unsafe extern "C" fn ts_highlighter_add_language( this: *mut TSHighlighter, language_name: *const c_char, scope_name: *const c_char, @@ -125,7 +137,7 @@ pub extern "C" fn ts_highlighter_add_language( apply_all_captures, ) .or(Err(ErrorCode::InvalidQuery))?; - config.configure(&this.highlight_names.as_slice()); + config.configure(this.highlight_names.as_slice()); this.languages.insert(scope_name, (injection_regex, config)); Ok(()) @@ -145,13 +157,23 @@ pub extern "C" fn ts_highlight_buffer_new() -> *mut TSHighlightBuffer { })) } +/// Deleteis a [`TSHighlighter`] instance. +/// +/// # Safety +/// +/// `this` must be non-null. #[no_mangle] -pub extern "C" fn ts_highlighter_delete(this: *mut TSHighlighter) { +pub unsafe extern "C" fn ts_highlighter_delete(this: *mut TSHighlighter) { drop(unsafe { Box::from_raw(this) }) } +/// Deleteis a [`TSHighlightBuffer`] instance. 
+/// +/// # Safety +/// +/// `this` must be non-null. #[no_mangle] -pub extern "C" fn ts_highlight_buffer_delete(this: *mut TSHighlightBuffer) { +pub unsafe extern "C" fn ts_highlight_buffer_delete(this: *mut TSHighlightBuffer) { drop(unsafe { Box::from_raw(this) }) } @@ -179,8 +201,14 @@ pub extern "C" fn ts_highlight_buffer_line_count(this: *const TSHighlightBuffer) this.renderer.line_offsets.len() as u32 } +/// Highlight a string of source code. +/// +/// # Safety +/// +/// The caller must ensure that `scope_name`, `source_code`, and `cancellation_flag` are valid for +/// the lifetime of the [`TSHighlighter`] instance, and are non-null. #[no_mangle] -pub extern "C" fn ts_highlighter_highlight( +pub unsafe extern "C" fn ts_highlighter_highlight( this: *const TSHighlighter, scope_name: *const c_char, source_code: *const c_char, @@ -238,15 +266,8 @@ impl TSHighlighter { .renderer .render(highlights, source_code, &|s| self.attribute_strings[s.0]); match result { - Err(Error::Cancelled) => { - return ErrorCode::Timeout; - } - Err(Error::InvalidLanguage) => { - return ErrorCode::InvalidLanguage; - } - Err(Error::Unknown) => { - return ErrorCode::Timeout; - } + Err(Error::Cancelled) | Err(Error::Unknown) => ErrorCode::Timeout, + Err(Error::InvalidLanguage) => ErrorCode::InvalidLanguage, Ok(()) => ErrorCode::Ok, } } else { diff --git a/tags/src/c_lib.rs b/tags/src/c_lib.rs index c8f39d2c..0952d851 100644 --- a/tags/src/c_lib.rs +++ b/tags/src/c_lib.rs @@ -66,13 +66,23 @@ pub extern "C" fn ts_tagger_new() -> *mut TSTagger { })) } +/// Delete a TSTagger. +/// +/// # Safety +/// +/// `this` must be non-null #[no_mangle] -pub extern "C" fn ts_tagger_delete(this: *mut TSTagger) { +pub unsafe extern "C" fn ts_tagger_delete(this: *mut TSTagger) { drop(unsafe { Box::from_raw(this) }) } +/// Add a language to a TSTagger. 
+/// +/// # Safety +/// +/// `this` must be non-null #[no_mangle] -pub extern "C" fn ts_tagger_add_language( +pub unsafe extern "C" fn ts_tagger_add_language( this: *mut TSTagger, scope_name: *const c_char, language: Language, @@ -84,7 +94,7 @@ pub extern "C" fn ts_tagger_add_language( let tagger = unwrap_mut_ptr(this); let scope_name = unsafe { unwrap(CStr::from_ptr(scope_name).to_str()) }; let tags_query = unsafe { slice::from_raw_parts(tags_query, tags_query_len as usize) }; - let locals_query = if locals_query != std::ptr::null() { + let locals_query = if !locals_query.is_null() { unsafe { slice::from_raw_parts(locals_query, locals_query_len as usize) } } else { &[] @@ -111,8 +121,13 @@ pub extern "C" fn ts_tagger_add_language( } } +/// Tag some source code. +/// +/// # Safety +/// +/// `this` must be non-null #[no_mangle] -pub extern "C" fn ts_tagger_tag( +pub unsafe extern "C" fn ts_tagger_tag( this: *mut TSTagger, scope_name: *const c_char, source_code: *const u8, @@ -201,8 +216,13 @@ pub extern "C" fn ts_tags_buffer_new() -> *mut TSTagsBuffer { })) } +/// Delete a TSTagsBuffer. +/// +/// # Safety +/// +/// `this` must be non-null #[no_mangle] -pub extern "C" fn ts_tags_buffer_delete(this: *mut TSTagsBuffer) { +pub unsafe extern "C" fn ts_tags_buffer_delete(this: *mut TSTagsBuffer) { drop(unsafe { Box::from_raw(this) }) } @@ -236,8 +256,13 @@ pub extern "C" fn ts_tags_buffer_found_parse_error(this: *const TSTagsBuffer) -> buffer.errors_present } +/// Get the syntax kinds for a given scope name. 
+/// +/// # Safety +/// +/// `this` must be non-null #[no_mangle] -pub extern "C" fn ts_tagger_syntax_kinds_for_scope_name( +pub unsafe extern "C" fn ts_tagger_syntax_kinds_for_scope_name( this: *mut TSTagger, scope_name: *const c_char, len: *mut u32, From ffae7d611563f0a7e6fcfafbcb34e14f0c722a9d Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 20 Aug 2023 01:48:17 +0300 Subject: [PATCH 287/347] fix: mark helper Rust funcs that receive raw pointers as unsafe --- cli/src/tests/highlight_test.rs | 8 ++--- highlight/src/c_lib.rs | 62 +++++++++++++++------------------ tags/src/c_lib.rs | 34 +++++++++--------- 3 files changed, 50 insertions(+), 54 deletions(-) diff --git a/cli/src/tests/highlight_test.rs b/cli/src/tests/highlight_test.rs index c788c177..c4ca0b49 100644 --- a/cli/src/tests/highlight_test.rs +++ b/cli/src/tests/highlight_test.rs @@ -568,10 +568,10 @@ fn test_highlighting_via_c_api() { ); } - let output_bytes = c::ts_highlight_buffer_content(buffer); - let output_line_offsets = c::ts_highlight_buffer_line_offsets(buffer); - let output_len = c::ts_highlight_buffer_len(buffer); - let output_line_count = c::ts_highlight_buffer_line_count(buffer); + let output_bytes = unsafe { c::ts_highlight_buffer_content(buffer) }; + let output_line_offsets = unsafe { c::ts_highlight_buffer_line_offsets(buffer) }; + let output_len = unsafe { c::ts_highlight_buffer_len(buffer) }; + let output_line_count = unsafe { c::ts_highlight_buffer_line_count(buffer) }; let output_bytes = unsafe { slice::from_raw_parts(output_bytes, output_len as usize) }; let output_line_offsets = diff --git a/highlight/src/c_lib.rs b/highlight/src/c_lib.rs index 78cdd8c2..2fc6934e 100644 --- a/highlight/src/c_lib.rs +++ b/highlight/src/c_lib.rs @@ -44,17 +44,15 @@ pub unsafe extern "C" fn ts_highlighter_new( attribute_strings: *const *const c_char, highlight_count: u32, ) -> *mut TSHighlighter { - let highlight_names = - unsafe { slice::from_raw_parts(highlight_names, highlight_count as 
usize) }; - let attribute_strings = - unsafe { slice::from_raw_parts(attribute_strings, highlight_count as usize) }; + let highlight_names = slice::from_raw_parts(highlight_names, highlight_count as usize); + let attribute_strings = slice::from_raw_parts(attribute_strings, highlight_count as usize); let highlight_names = highlight_names - .iter() - .map(|s| unsafe { CStr::from_ptr(*s).to_string_lossy().to_string() }) + .into_iter() + .map(|s| CStr::from_ptr(*s).to_string_lossy().to_string()) .collect::>(); let attribute_strings = attribute_strings - .iter() - .map(|s| unsafe { CStr::from_ptr(*s).to_bytes() }) + .into_iter() + .map(|s| CStr::from_ptr(*s).to_bytes()) .collect(); let carriage_return_index = highlight_names.iter().position(|s| s == "carriage-return"); Box::into_raw(Box::new(TSHighlighter { @@ -88,7 +86,7 @@ pub unsafe extern "C" fn ts_highlighter_add_language( ) -> ErrorCode { let f = move || { let this = unwrap_mut_ptr(this); - let scope_name = unsafe { CStr::from_ptr(scope_name) }; + let scope_name = CStr::from_ptr(scope_name); let scope_name = scope_name .to_str() .or(Err(ErrorCode::InvalidUtf8))? @@ -96,29 +94,26 @@ pub unsafe extern "C" fn ts_highlighter_add_language( let injection_regex = if injection_regex.is_null() { None } else { - let pattern = unsafe { CStr::from_ptr(injection_regex) }; + let pattern = CStr::from_ptr(injection_regex); let pattern = pattern.to_str().or(Err(ErrorCode::InvalidUtf8))?; Some(Regex::new(pattern).or(Err(ErrorCode::InvalidRegex))?) 
}; - let highlight_query = unsafe { - slice::from_raw_parts(highlight_query as *const u8, highlight_query_len as usize) - }; + let highlight_query = + slice::from_raw_parts(highlight_query as *const u8, highlight_query_len as usize); + let highlight_query = str::from_utf8(highlight_query).or(Err(ErrorCode::InvalidUtf8))?; let injection_query = if injection_query_len > 0 { - let query = unsafe { - slice::from_raw_parts(injection_query as *const u8, injection_query_len as usize) - }; + let query = + slice::from_raw_parts(injection_query as *const u8, injection_query_len as usize); str::from_utf8(query).or(Err(ErrorCode::InvalidUtf8))? } else { "" }; let locals_query = if locals_query_len > 0 { - let query = unsafe { - slice::from_raw_parts(locals_query as *const u8, locals_query_len as usize) - }; + let query = slice::from_raw_parts(locals_query as *const u8, locals_query_len as usize); str::from_utf8(query).or(Err(ErrorCode::InvalidUtf8))? } else { "" @@ -164,7 +159,7 @@ pub extern "C" fn ts_highlight_buffer_new() -> *mut TSHighlightBuffer { /// `this` must be non-null. #[no_mangle] pub unsafe extern "C" fn ts_highlighter_delete(this: *mut TSHighlighter) { - drop(unsafe { Box::from_raw(this) }) + drop(Box::from_raw(this)) } /// Deleteis a [`TSHighlightBuffer`] instance. @@ -174,29 +169,31 @@ pub unsafe extern "C" fn ts_highlighter_delete(this: *mut TSHighlighter) { /// `this` must be non-null. 
#[no_mangle] pub unsafe extern "C" fn ts_highlight_buffer_delete(this: *mut TSHighlightBuffer) { - drop(unsafe { Box::from_raw(this) }) + drop(Box::from_raw(this)) } #[no_mangle] -pub extern "C" fn ts_highlight_buffer_content(this: *const TSHighlightBuffer) -> *const u8 { +pub unsafe extern "C" fn ts_highlight_buffer_content(this: *const TSHighlightBuffer) -> *const u8 { let this = unwrap_ptr(this); this.renderer.html.as_slice().as_ptr() } #[no_mangle] -pub extern "C" fn ts_highlight_buffer_line_offsets(this: *const TSHighlightBuffer) -> *const u32 { +pub unsafe extern "C" fn ts_highlight_buffer_line_offsets( + this: *const TSHighlightBuffer, +) -> *const u32 { let this = unwrap_ptr(this); this.renderer.line_offsets.as_slice().as_ptr() } #[no_mangle] -pub extern "C" fn ts_highlight_buffer_len(this: *const TSHighlightBuffer) -> u32 { +pub unsafe extern "C" fn ts_highlight_buffer_len(this: *const TSHighlightBuffer) -> u32 { let this = unwrap_ptr(this); this.renderer.html.len() as u32 } #[no_mangle] -pub extern "C" fn ts_highlight_buffer_line_count(this: *const TSHighlightBuffer) -> u32 { +pub unsafe extern "C" fn ts_highlight_buffer_line_count(this: *const TSHighlightBuffer) -> u32 { let this = unwrap_ptr(this); this.renderer.line_offsets.len() as u32 } @@ -218,10 +215,9 @@ pub unsafe extern "C" fn ts_highlighter_highlight( ) -> ErrorCode { let this = unwrap_ptr(this); let output = unwrap_mut_ptr(output); - let scope_name = unwrap(unsafe { CStr::from_ptr(scope_name).to_str() }); - let source_code = - unsafe { slice::from_raw_parts(source_code as *const u8, source_code_len as usize) }; - let cancellation_flag = unsafe { cancellation_flag.as_ref() }; + let scope_name = unwrap(CStr::from_ptr(scope_name).to_str()); + let source_code = slice::from_raw_parts(source_code as *const u8, source_code_len as usize); + let cancellation_flag = cancellation_flag.as_ref(); this.highlight(source_code, scope_name, output, cancellation_flag) } @@ -276,15 +272,15 @@ impl TSHighlighter { 
} } -fn unwrap_ptr<'a, T>(result: *const T) -> &'a T { - unsafe { result.as_ref() }.unwrap_or_else(|| { +unsafe fn unwrap_ptr<'a, T>(result: *const T) -> &'a T { + result.as_ref().unwrap_or_else(|| { eprintln!("{}:{} - pointer must not be null", file!(), line!()); abort(); }) } -fn unwrap_mut_ptr<'a, T>(result: *mut T) -> &'a mut T { - unsafe { result.as_mut() }.unwrap_or_else(|| { +unsafe fn unwrap_mut_ptr<'a, T>(result: *mut T) -> &'a mut T { + result.as_mut().unwrap_or_else(|| { eprintln!("{}:{} - pointer must not be null", file!(), line!()); abort(); }) diff --git a/tags/src/c_lib.rs b/tags/src/c_lib.rs index 0952d851..df21f181 100644 --- a/tags/src/c_lib.rs +++ b/tags/src/c_lib.rs @@ -73,7 +73,7 @@ pub extern "C" fn ts_tagger_new() -> *mut TSTagger { /// `this` must be non-null #[no_mangle] pub unsafe extern "C" fn ts_tagger_delete(this: *mut TSTagger) { - drop(unsafe { Box::from_raw(this) }) + drop(Box::from_raw(this)) } /// Add a language to a TSTagger. @@ -92,10 +92,10 @@ pub unsafe extern "C" fn ts_tagger_add_language( locals_query_len: u32, ) -> TSTagsError { let tagger = unwrap_mut_ptr(this); - let scope_name = unsafe { unwrap(CStr::from_ptr(scope_name).to_str()) }; - let tags_query = unsafe { slice::from_raw_parts(tags_query, tags_query_len as usize) }; - let locals_query = if !locals_query.is_null() { - unsafe { slice::from_raw_parts(locals_query, locals_query_len as usize) } + let scope_name = unwrap(CStr::from_ptr(scope_name).to_str()); + let tags_query = slice::from_raw_parts(tags_query, tags_query_len as usize); + let locals_query = if locals_query != std::ptr::null() { + slice::from_raw_parts(locals_query, locals_query_len as usize) } else { &[] }; @@ -137,14 +137,14 @@ pub unsafe extern "C" fn ts_tagger_tag( ) -> TSTagsError { let tagger = unwrap_mut_ptr(this); let buffer = unwrap_mut_ptr(output); - let scope_name = unsafe { unwrap(CStr::from_ptr(scope_name).to_str()) }; + let scope_name = unwrap(CStr::from_ptr(scope_name).to_str()); if let 
Some(config) = tagger.languages.get(scope_name) { shrink_and_clear(&mut buffer.tags, BUFFER_TAGS_RESERVE_CAPACITY); shrink_and_clear(&mut buffer.docs, BUFFER_DOCS_RESERVE_CAPACITY); - let source_code = unsafe { slice::from_raw_parts(source_code, source_code_len as usize) }; - let cancellation_flag = unsafe { cancellation_flag.as_ref() }; + let source_code = slice::from_raw_parts(source_code, source_code_len as usize); + let cancellation_flag = cancellation_flag.as_ref(); let tags = match buffer .context @@ -223,35 +223,35 @@ pub extern "C" fn ts_tags_buffer_new() -> *mut TSTagsBuffer { /// `this` must be non-null #[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_delete(this: *mut TSTagsBuffer) { - drop(unsafe { Box::from_raw(this) }) + drop(Box::from_raw(this)) } #[no_mangle] -pub extern "C" fn ts_tags_buffer_tags(this: *const TSTagsBuffer) -> *const TSTag { +pub unsafe extern "C" fn ts_tags_buffer_tags(this: *const TSTagsBuffer) -> *const TSTag { let buffer = unwrap_ptr(this); buffer.tags.as_ptr() } #[no_mangle] -pub extern "C" fn ts_tags_buffer_tags_len(this: *const TSTagsBuffer) -> u32 { +pub unsafe extern "C" fn ts_tags_buffer_tags_len(this: *const TSTagsBuffer) -> u32 { let buffer = unwrap_ptr(this); buffer.tags.len() as u32 } #[no_mangle] -pub extern "C" fn ts_tags_buffer_docs(this: *const TSTagsBuffer) -> *const c_char { +pub unsafe extern "C" fn ts_tags_buffer_docs(this: *const TSTagsBuffer) -> *const c_char { let buffer = unwrap_ptr(this); buffer.docs.as_ptr() as *const c_char } #[no_mangle] -pub extern "C" fn ts_tags_buffer_docs_len(this: *const TSTagsBuffer) -> u32 { +pub unsafe extern "C" fn ts_tags_buffer_docs_len(this: *const TSTagsBuffer) -> u32 { let buffer = unwrap_ptr(this); buffer.docs.len() as u32 } #[no_mangle] -pub extern "C" fn ts_tags_buffer_found_parse_error(this: *const TSTagsBuffer) -> bool { +pub unsafe extern "C" fn ts_tags_buffer_found_parse_error(this: *const TSTagsBuffer) -> bool { let buffer = unwrap_ptr(this); 
buffer.errors_present } @@ -268,7 +268,7 @@ pub unsafe extern "C" fn ts_tagger_syntax_kinds_for_scope_name( len: *mut u32, ) -> *const *const c_char { let tagger = unwrap_mut_ptr(this); - let scope_name = unsafe { unwrap(CStr::from_ptr(scope_name).to_str()) }; + let scope_name = unwrap(CStr::from_ptr(scope_name).to_str()); let len = unwrap_mut_ptr(len); *len = 0; @@ -279,14 +279,14 @@ pub unsafe extern "C" fn ts_tagger_syntax_kinds_for_scope_name( std::ptr::null() } -fn unwrap_ptr<'a, T>(result: *const T) -> &'a T { +unsafe fn unwrap_ptr<'a, T>(result: *const T) -> &'a T { unsafe { result.as_ref() }.unwrap_or_else(|| { eprintln!("{}:{} - pointer must not be null", file!(), line!()); abort(); }) } -fn unwrap_mut_ptr<'a, T>(result: *mut T) -> &'a mut T { +unsafe fn unwrap_mut_ptr<'a, T>(result: *mut T) -> &'a mut T { unsafe { result.as_mut() }.unwrap_or_else(|| { eprintln!("{}:{} - pointer must not be null", file!(), line!()); abort(); From c332066666b1bced7575aacd8f469d13b1e63437 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Sat, 19 Aug 2023 19:42:18 -0400 Subject: [PATCH 288/347] fix(safety): improve docs for unsafe C functions --- highlight/src/c_lib.rs | 65 +++++++++++++++++++++++++++++----- tags/src/c_lib.rs | 79 +++++++++++++++++++++++++++++++++++++----- 2 files changed, 126 insertions(+), 18 deletions(-) diff --git a/highlight/src/c_lib.rs b/highlight/src/c_lib.rs index 2fc6934e..1ab4903a 100644 --- a/highlight/src/c_lib.rs +++ b/highlight/src/c_lib.rs @@ -47,11 +47,11 @@ pub unsafe extern "C" fn ts_highlighter_new( let highlight_names = slice::from_raw_parts(highlight_names, highlight_count as usize); let attribute_strings = slice::from_raw_parts(attribute_strings, highlight_count as usize); let highlight_names = highlight_names - .into_iter() + .iter() .map(|s| CStr::from_ptr(*s).to_string_lossy().to_string()) .collect::>(); let attribute_strings = attribute_strings - .into_iter() + .iter() .map(|s| CStr::from_ptr(*s).to_bytes()) .collect(); let 
carriage_return_index = highlight_names.iter().position(|s| s == "carriage-return"); @@ -65,9 +65,14 @@ pub unsafe extern "C" fn ts_highlighter_new( /// Add a language to a [`TSHighlighter`] instance. /// +/// Returns an [`ErrorCode`] indicating whether the language was added successfully or not. +/// /// # Safety /// -/// The caller must ensure that any `*const c_char` parameters are valid for the lifetime of +/// `this` must be non-null and must be a valid pointer to a [`TSHighlighter`] instance +/// created by [`ts_highlighter_new`]. +/// +/// The caller must ensure that any `*const c_char` (C-style string) parameters are valid for the lifetime of /// the [`TSHighlighter`] instance, and are non-null. #[no_mangle] pub unsafe extern "C" fn ts_highlighter_add_language( @@ -119,7 +124,7 @@ pub unsafe extern "C" fn ts_highlighter_add_language( "" }; - let lang = unsafe { CStr::from_ptr(language_name) } + let lang = CStr::from_ptr(language_name) .to_str() .or(Err(ErrorCode::InvalidLanguageName))?; @@ -152,32 +157,60 @@ pub extern "C" fn ts_highlight_buffer_new() -> *mut TSHighlightBuffer { })) } -/// Deleteis a [`TSHighlighter`] instance. +/// Deletes a [`TSHighlighter`] instance. /// /// # Safety /// -/// `this` must be non-null. +/// `this` must be non-null and must be a valid pointer to a [`TSHighlighter`] instance +/// created by [`ts_highlighter_new`]. +/// +/// It cannot be used after this function is called. #[no_mangle] pub unsafe extern "C" fn ts_highlighter_delete(this: *mut TSHighlighter) { drop(Box::from_raw(this)) } -/// Deleteis a [`TSHighlightBuffer`] instance. +/// Deletes a [`TSHighlightBuffer`] instance. /// /// # Safety /// -/// `this` must be non-null. +/// `this` must be non-null and must be a valid pointer to a [`TSHighlightBuffer`] instance +/// created by [`ts_highlight_buffer_new`] +/// +/// It cannot be used after this function is called. 
#[no_mangle] pub unsafe extern "C" fn ts_highlight_buffer_delete(this: *mut TSHighlightBuffer) { drop(Box::from_raw(this)) } +/// Get the HTML content of a [`TSHighlightBuffer`] instance as a raw pointer. +/// +/// # Safety +/// +/// `this` must be non-null and must be a valid pointer to a [`TSHighlightBuffer`] instance +/// created by [`ts_highlight_buffer_new`]. +/// +/// The returned pointer, a C-style string, must not outlive the [`TSHighlightBuffer`] instance, else the +/// data will point to garbage. +/// +/// To get the length of the HTML content, use [`ts_highlight_buffer_len`]. #[no_mangle] pub unsafe extern "C" fn ts_highlight_buffer_content(this: *const TSHighlightBuffer) -> *const u8 { let this = unwrap_ptr(this); this.renderer.html.as_slice().as_ptr() } +/// Get the line offsets of a [`TSHighlightBuffer`] instance as a C-style array. +/// +/// # Safety +/// +/// `this` must be non-null and must be a valid pointer to a [`TSHighlightBuffer`] instance +/// created by [`ts_highlight_buffer_new`]. +/// +/// The returned pointer, a C-style array of [`u32`]s, must not outlive the [`TSHighlightBuffer`] instance, else the +/// data will point to garbage. +/// +/// To get the length of the array, use [`ts_highlight_buffer_line_count`]. #[no_mangle] pub unsafe extern "C" fn ts_highlight_buffer_line_offsets( this: *const TSHighlightBuffer, @@ -186,12 +219,24 @@ pub unsafe extern "C" fn ts_highlight_buffer_line_offsets( this.renderer.line_offsets.as_slice().as_ptr() } +/// Get the length of the HTML content of a [`TSHighlightBuffer`] instance. +/// +/// # Safety +/// +/// `this` must be non-null and must be a valid pointer to a [`TSHighlightBuffer`] instance +/// created by [`ts_highlight_buffer_new`]. #[no_mangle] pub unsafe extern "C" fn ts_highlight_buffer_len(this: *const TSHighlightBuffer) -> u32 { let this = unwrap_ptr(this); this.renderer.html.len() as u32 } +/// Get the number of lines in a [`TSHighlightBuffer`] instance. 
+/// +/// # Safety +/// +/// `this` must be non-null and must be a valid pointer to a [`TSHighlightBuffer`] instance +/// created by [`ts_highlight_buffer_new`]. #[no_mangle] pub unsafe extern "C" fn ts_highlight_buffer_line_count(this: *const TSHighlightBuffer) -> u32 { let this = unwrap_ptr(this); @@ -202,8 +247,10 @@ pub unsafe extern "C" fn ts_highlight_buffer_line_count(this: *const TSHighlight /// /// # Safety /// -/// The caller must ensure that `scope_name`, `source_code`, and `cancellation_flag` are valid for +/// The caller must ensure that `scope_name`, `source_code`, `output`, and `cancellation_flag` are valid for /// the lifetime of the [`TSHighlighter`] instance, and are non-null. +/// +/// `this` must be a non-null pointer to a [`TSHighlighter`] instance created by [`ts_highlighter_new`] #[no_mangle] pub unsafe extern "C" fn ts_highlighter_highlight( this: *const TSHighlighter, diff --git a/tags/src/c_lib.rs b/tags/src/c_lib.rs index df21f181..915b0220 100644 --- a/tags/src/c_lib.rs +++ b/tags/src/c_lib.rs @@ -70,7 +70,7 @@ pub extern "C" fn ts_tagger_new() -> *mut TSTagger { /// /// # Safety /// -/// `this` must be non-null +/// `this` must be non-null and a valid pointer to a [`TSTagger`] instance. #[no_mangle] pub unsafe extern "C" fn ts_tagger_delete(this: *mut TSTagger) { drop(Box::from_raw(this)) @@ -78,9 +78,15 @@ pub unsafe extern "C" fn ts_tagger_delete(this: *mut TSTagger) { /// Add a language to a TSTagger. /// +/// Returns a [`TSTagsError`] indicating whether the operation was successful or not. +/// /// # Safety /// -/// `this` must be non-null +/// `this` must be non-null and a valid pointer to a [`TSTagger`] instance. +/// `scope_name` must be non-null and a valid pointer to a null-terminated string. +/// `tags_query` and `locals_query` must be non-null and valid pointers to strings. +/// +/// The caller must ensure that the lengths of `tags_query` and `locals_query` are correct. 
#[no_mangle] pub unsafe extern "C" fn ts_tagger_add_language( this: *mut TSTagger, @@ -94,7 +100,7 @@ pub unsafe extern "C" fn ts_tagger_add_language( let tagger = unwrap_mut_ptr(this); let scope_name = unwrap(CStr::from_ptr(scope_name).to_str()); let tags_query = slice::from_raw_parts(tags_query, tags_query_len as usize); - let locals_query = if locals_query != std::ptr::null() { + let locals_query = if !locals_query.is_null() { slice::from_raw_parts(locals_query, locals_query_len as usize) } else { &[] @@ -121,11 +127,17 @@ pub unsafe extern "C" fn ts_tagger_add_language( } } -/// Tag some source code. +/// Tags some source code. +/// +/// Returns a [`TSTagsError`] indicating whether the operation was successful or not. /// /// # Safety /// -/// `this` must be non-null +/// `this` must be a non-null valid pointer to a [`TSTagger`] instance. +/// `scope_name` must be a non-null valid pointer to a null-terminated string. +/// `source_code` must be a non-null valid pointer to a slice of bytes. +/// `output` must be a non-null valid pointer to a [`TSTagsBuffer`] instance. +/// `cancellation_flag` must be a non-null valid pointer to an [`AtomicUsize`] instance. #[no_mangle] pub unsafe extern "C" fn ts_tagger_tag( this: *mut TSTagger, @@ -220,36 +232,75 @@ pub extern "C" fn ts_tags_buffer_new() -> *mut TSTagsBuffer { /// /// # Safety /// -/// `this` must be non-null +/// `this` must be non-null and a valid pointer to a [`TSTagsBuffer`] instance created by +/// [`ts_tags_buffer_new`]. #[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_delete(this: *mut TSTagsBuffer) { drop(Box::from_raw(this)) } +/// Get the tags from a TSTagsBuffer. +/// +/// # Safety +/// +/// `this` must be non-null and a valid pointer to a [`TSTagsBuffer`] instance created by +/// [`ts_tags_buffer_new`]. +/// +/// The caller must ensure that the returned pointer is not used after the [`TSTagsBuffer`] +/// is deleted with [`ts_tags_buffer_delete`], else the data will point to garbage. 
#[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_tags(this: *const TSTagsBuffer) -> *const TSTag { let buffer = unwrap_ptr(this); buffer.tags.as_ptr() } +/// Get the number of tags in a TSTagsBuffer. +/// +/// # Safety +/// +/// `this` must be non-null and a valid pointer to a [`TSTagsBuffer`] instance. #[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_tags_len(this: *const TSTagsBuffer) -> u32 { let buffer = unwrap_ptr(this); buffer.tags.len() as u32 } +/// Get the documentation strings from a TSTagsBuffer. +/// +/// # Safety +/// +/// `this` must be non-null and a valid pointer to a [`TSTagsBuffer`] instance created by +/// [`ts_tags_buffer_new`]. +/// +/// The caller must ensure that the returned pointer is not used after the [`TSTagsBuffer`] +/// is deleted with [`ts_tags_buffer_delete`], else the data will point to garbage. +/// +/// The returned pointer points to a C-style string. +/// To get the length of the string, use [`ts_tags_buffer_docs_len`]. #[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_docs(this: *const TSTagsBuffer) -> *const c_char { let buffer = unwrap_ptr(this); buffer.docs.as_ptr() as *const c_char } +/// Get the length of the documentation strings in a TSTagsBuffer. +/// +/// # Safety +/// +/// `this` must be non-null and a valid pointer to a [`TSTagsBuffer`] instance created by +/// [`ts_tags_buffer_new`]. #[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_docs_len(this: *const TSTagsBuffer) -> u32 { let buffer = unwrap_ptr(this); buffer.docs.len() as u32 } +/// Get whether or not a TSTagsBuffer contains any parse errors. +/// +/// # Safety +/// +/// `this` must be non-null and a valid pointer to a [`TSTagsBuffer`] instance created by +/// [`ts_tags_buffer_new`]. 
#[no_mangle] pub unsafe extern "C" fn ts_tags_buffer_found_parse_error(this: *const TSTagsBuffer) -> bool { let buffer = unwrap_ptr(this); @@ -258,9 +309,19 @@ pub unsafe extern "C" fn ts_tags_buffer_found_parse_error(this: *const TSTagsBuf /// Get the syntax kinds for a given scope name. /// +/// Returns a pointer to a null-terminated array of null-terminated strings. +/// /// # Safety /// -/// `this` must be non-null +/// `this` must be non-null and a valid pointer to a [`TSTagger`] instance created by +/// [`ts_tagger_new`]. +/// `scope_name` must be non-null and a valid pointer to a null-terminated string. +/// `len` must be non-null and a valid pointer to a `u32`. +/// +/// The caller must ensure that the returned pointer is not used after the [`TSTagger`] +/// is deleted with [`ts_tagger_delete`], else the data will point to garbage. +/// +/// The returned pointer points to a C-style string array. #[no_mangle] pub unsafe extern "C" fn ts_tagger_syntax_kinds_for_scope_name( this: *mut TSTagger, @@ -280,14 +341,14 @@ pub unsafe extern "C" fn ts_tagger_syntax_kinds_for_scope_name( } unsafe fn unwrap_ptr<'a, T>(result: *const T) -> &'a T { - unsafe { result.as_ref() }.unwrap_or_else(|| { + result.as_ref().unwrap_or_else(|| { eprintln!("{}:{} - pointer must not be null", file!(), line!()); abort(); }) } unsafe fn unwrap_mut_ptr<'a, T>(result: *mut T) -> &'a mut T { - unsafe { result.as_mut() }.unwrap_or_else(|| { + result.as_mut().unwrap_or_else(|| { eprintln!("{}:{} - pointer must not be null", file!(), line!()); abort(); }) From 4278e03b1138d0171a40145cd89bd0486fc733c1 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 20 Aug 2023 16:00:33 +0300 Subject: [PATCH 289/347] feat: generate Rust bindings during build process It can be used as: > cargo build -p tree-sitter -F bindgen --- Cargo.lock | 88 +++++++++++++++++++++++++++++++++++++++ lib/Cargo.toml | 1 + lib/binding_rust/build.rs | 41 ++++++++++++++++++ lib/binding_rust/ffi.rs | 4 ++ 
lib/binding_rust/lib.rs | 5 ++- 5 files changed, 137 insertions(+), 2 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 3c444391..80a4e28d 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -43,6 +43,29 @@ dependencies = [ "winapi", ] +[[package]] +name = "bindgen" +version = "0.66.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "f2b84e06fc203107bfbad243f4aba2af864eb7db3b1cf46ea0a023b0b433d2a7" +dependencies = [ + "bitflags 2.4.0", + "cexpr", + "clang-sys", + "lazy_static", + "lazycell", + "log", + "peeking_take_while", + "prettyplease", + "proc-macro2", + "quote", + "regex", + "rustc-hash", + "shlex", + "syn 2.0.29", + "which", +] + [[package]] name = "bitflags" version = "1.3.2" @@ -82,6 +105,15 @@ version = "1.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "6d43a04d8753f35258c91f8ec639f792891f748a1edbd759cf1dcea3382ad83c" +[[package]] +name = "cexpr" +version = "0.6.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6fac387a98bb7c37292057cffc56d62ecb629900026402633ae9160df93a8766" +dependencies = [ + "nom", +] + [[package]] name = "cfg-if" version = "1.0.0" @@ -94,6 +126,17 @@ version = "1.4.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "cca491388666e04d7248af3f60f0c40cfb0991c72205595d7c396e3510207d1a" +[[package]] +name = "clang-sys" +version = "1.6.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "c688fc74432808e3eb684cae8830a86be1d66a2bd58e1f248ed0960a590baf6f" +dependencies = [ + "glob", + "libc", + "libloading", +] + [[package]] name = "clap" version = "2.34.0" @@ -381,6 +424,12 @@ version = "1.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" +[[package]] +name = "lazycell" +version = "1.3.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = 
"830d08ce1d1d941e6b30645f1a0eb5643013d835ce3779a5fc208261dbe10f55" + [[package]] name = "libc" version = "0.2.147" @@ -424,6 +473,12 @@ version = "2.5.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "2dffe52ecf27772e601905b7522cb4ef790d2cc203488bbd0e2fe85fcb74566d" +[[package]] +name = "minimal-lexical" +version = "0.2.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "68354c5c6bd36d73ff3feceb05efa59b6acb7626617f4962be322a825e61f79a" + [[package]] name = "ndk-context" version = "0.1.1" @@ -442,6 +497,16 @@ dependencies = [ "static_assertions", ] +[[package]] +name = "nom" +version = "7.1.3" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "d273983c5a657a70a3e8f2a01329822f3b8c8172b73826411a55751e404a0a4a" +dependencies = [ + "memchr", + "minimal-lexical", +] + [[package]] name = "objc" version = "0.2.7" @@ -469,6 +534,12 @@ version = "0.2.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "1e91099d4268b0e11973f036e885d652fb0b21fedcf69738c627f94db6a44f42" +[[package]] +name = "peeking_take_while" +version = "0.1.2" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "19b17cddbe7ec3f8bc800887bab5e717348c95ea2ca0b1bf0837fb964dc67099" + [[package]] name = "percent-encoding" version = "2.3.0" @@ -491,6 +562,16 @@ dependencies = [ "yansi", ] +[[package]] +name = "prettyplease" +version = "0.2.12" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "6c64d9ba0963cdcea2e1b2230fbae2bab30eb25a174be395c41e764bfb65dd62" +dependencies = [ + "proc-macro2", + "syn 2.0.29", +] + [[package]] name = "proc-macro2" version = "1.0.66" @@ -684,6 +765,12 @@ dependencies = [ "serde", ] +[[package]] +name = "shlex" +version = "1.1.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "43b2853a4d09f215c24cc5489c992ce46052d359b5109343cbafbf26bc62f8a3" + [[package]] name = "smallbitvec" version = 
"2.5.1" @@ -831,6 +918,7 @@ dependencies = [ name = "tree-sitter" version = "0.20.10" dependencies = [ + "bindgen", "cc", "regex", ] diff --git a/lib/Cargo.toml b/lib/Cargo.toml index 5e1f3559..592521fd 100644 --- a/lib/Cargo.toml +++ b/lib/Cargo.toml @@ -26,6 +26,7 @@ include = [ regex = "1.9.1" [build-dependencies] +bindgen = { version = "^0.66.1", optional = true } cc = "^1.0.79" [lib] diff --git a/lib/binding_rust/build.rs b/lib/binding_rust/build.rs index ec367980..a74bdb27 100644 --- a/lib/binding_rust/build.rs +++ b/lib/binding_rust/build.rs @@ -17,6 +17,9 @@ fn main() { } } + #[cfg(feature = "bindgen")] + generate_bindings(); + let src_path = Path::new("src"); for entry in fs::read_dir(&src_path).unwrap() { let entry = entry.unwrap(); @@ -34,6 +37,44 @@ fn main() { .compile("tree-sitter"); } +#[cfg(feature = "bindgen")] +fn generate_bindings() { + const HEADER_PATH: &str = "include/tree_sitter/api.h"; + + println!("cargo:rerun-if-changed={}", HEADER_PATH); + + let no_copy = [ + "TSInput", + "TSLanguage", + "TSLogger", + "TSLookaheadIterator", + "TSParser", + "TSTree", + "TSQuery", + "TSQueryCursor", + "TSQueryCapture", + "TSQueryMatch", + "TSQueryPredicateStep", + ]; + + let bindings = bindgen::Builder::default() + .header(HEADER_PATH) + .layout_tests(false) + .allowlist_type("^TS.*") + .allowlist_function("^ts_.*") + .allowlist_var("^TREE_SITTER.*") + .no_copy(no_copy.join("|")) + .generate() + .expect("Failed to generate bindings"); + + let out_dir = PathBuf::from(env::var("OUT_DIR").unwrap()); + let bindings_rs = out_dir.join("bindings.rs"); + + bindings.write_to_file(&bindings_rs).expect(&*format!( + "Failed to write bindings into path: {bindings_rs:?}" + )); +} + fn which(exe_name: impl AsRef) -> Option { env::var_os("PATH").and_then(|paths| { env::split_paths(&paths).find_map(|dir| { diff --git a/lib/binding_rust/ffi.rs b/lib/binding_rust/ffi.rs index ac4da98b..a99d2afe 100644 --- a/lib/binding_rust/ffi.rs +++ b/lib/binding_rust/ffi.rs @@ -2,6 +2,10 
@@ #![allow(non_upper_case_globals)] #![allow(non_camel_case_types)] +#[cfg(feature = "bindgen")] +include!(concat!(env!("OUT_DIR"), "/bindings.rs")); + +#[cfg(not(feature = "bindgen"))] include!("./bindings.rs"); extern "C" { diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 932fc452..de3065d2 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -27,12 +27,13 @@ use std::{ /// The Tree-sitter library is generally backwards-compatible with languages /// generated using older CLI versions, but is not forwards-compatible. #[doc(alias = "TREE_SITTER_LANGUAGE_VERSION")] -pub const LANGUAGE_VERSION: usize = ffi::TREE_SITTER_LANGUAGE_VERSION; +pub const LANGUAGE_VERSION: usize = ffi::TREE_SITTER_LANGUAGE_VERSION as usize; /// The earliest ABI version that is supported by the current version of the /// library. #[doc(alias = "TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION")] -pub const MIN_COMPATIBLE_LANGUAGE_VERSION: usize = ffi::TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION; +pub const MIN_COMPATIBLE_LANGUAGE_VERSION: usize = + ffi::TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION as usize; pub const PARSER_HEADER: &'static str = include_str!("../include/tree_sitter/parser.h"); From abd57bc69b4ec9af9d4e5f76c2f4f63273a35444 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 20 Aug 2023 16:10:13 +0300 Subject: [PATCH 290/347] chore: simplify script/generate-bindings --- lib/binding_rust/bindings.rs | 5 ++--- script/generate-bindings | 13 +------------ 2 files changed, 3 insertions(+), 15 deletions(-) diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index e7168fb5..225fbc11 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -1,5 +1,7 @@ /* automatically generated by rust-bindgen 0.66.1 */ +pub const TREE_SITTER_LANGUAGE_VERSION: u32 = 14; +pub const TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION: u32 = 13; pub type TSStateId = u16; pub type TSSymbol = u16; pub type TSFieldId = u16; @@ -783,6 
+785,3 @@ extern "C" { new_free: ::std::option::Option, ); } - -pub const TREE_SITTER_LANGUAGE_VERSION: usize = 14; -pub const TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION: usize = 13; diff --git a/script/generate-bindings b/script/generate-bindings index fb47e247..52fc43f3 100755 --- a/script/generate-bindings +++ b/script/generate-bindings @@ -33,18 +33,7 @@ bindgen \ --no-layout-tests \ --allowlist-type '^TS.*' \ --allowlist-function '^ts_.*' \ + --allowlist-var "^TREE_SITTER.*" \ --blocklist-type '^__.*' \ --no-copy "$no_copy" \ $header_path > $output_path - -echo "" >> $output_path - -defines=( - TREE_SITTER_LANGUAGE_VERSION - TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION -) - -for define in "${defines[@]}"; do - define_value=$(grep -E "#define $define (.*)" $header_path | cut -d' ' -f3) - echo "pub const $define: usize = $define_value;" >> $output_path -done From 897c187786a00b353dc0333e00b6b570d245f0ef Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 21 Aug 2023 05:19:20 +0300 Subject: [PATCH 291/347] fix: `make install` should install files with default perms --- .gitignore | 1 + Makefile | 22 +++++++++++++--------- 2 files changed, 14 insertions(+), 9 deletions(-) diff --git a/.gitignore b/.gitignore index 5a17dd9b..53550dd7 100644 --- a/.gitignore +++ b/.gitignore @@ -7,6 +7,7 @@ log*.html fuzz-results +/tree-sitter.pc test/fixtures/grammars/* !test/fixtures/grammars/.gitkeep package-lock.json diff --git a/Makefile b/Makefile index be915fa3..a11214d5 100644 --- a/Makefile +++ b/Makefile @@ -55,18 +55,22 @@ ifneq ($(STRIP),) endif install: all - install -d '$(DESTDIR)$(LIBDIR)' - install -m755 libtree-sitter.a '$(DESTDIR)$(LIBDIR)'/libtree-sitter.a - install -m755 libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXTVER) - ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXTVER_MAJOR) - ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXT) - install -d 
'$(DESTDIR)$(INCLUDEDIR)'/tree_sitter - install -m644 lib/include/tree_sitter/*.h '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter/ - install -d '$(DESTDIR)$(PCLIBDIR)' sed -e 's|@LIBDIR@|$(LIBDIR)|;s|@INCLUDEDIR@|$(INCLUDEDIR)|;s|@VERSION@|$(VERSION)|' \ -e 's|=$(PREFIX)|=$${prefix}|' \ -e 's|@PREFIX@|$(PREFIX)|' \ - tree-sitter.pc.in > '$(DESTDIR)$(PCLIBDIR)'/tree-sitter.pc + tree-sitter.pc.in > tree-sitter.pc + + install -d '$(DESTDIR)$(LIBDIR)' + install -m644 -t '$(DESTDIR)$(LIBDIR)' libtree-sitter.a + install -m755 -t '$(DESTDIR)$(LIBDIR)' libtree-sitter.$(SOEXTVER) + ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXTVER_MAJOR) + ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXT) + + install -d '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter + install -m644 -t '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter lib/include/tree_sitter/*.h + + install -d '$(DESTDIR)$(PCLIBDIR)' + install -m644 -t '$(DESTDIR)$(PCLIBDIR)' tree-sitter.pc clean: rm -f lib/src/*.o libtree-sitter.a libtree-sitter.$(SOEXT) libtree-sitter.$(SOEXTVER_MAJOR) libtree-sitter.$(SOEXTVER) From da6affaf940509e09f2a38262ae617fd244fbe95 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Mon, 21 Aug 2023 00:53:04 -0400 Subject: [PATCH 292/347] feat: allow `@injection.self` to inject the node w/ itself --- highlight/src/lib.rs | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/highlight/src/lib.rs b/highlight/src/lib.rs index 20ac5edf..9f4e5b8e 100644 --- a/highlight/src/lib.rs +++ b/highlight/src/lib.rs @@ -112,6 +112,7 @@ pub struct HighlightConfiguration { non_local_variable_patterns: Vec, injection_content_capture_index: Option, injection_language_capture_index: Option, + injection_self_capture_index: Option, local_scope_capture_index: Option, local_def_capture_index: Option, local_def_value_capture_index: Option, @@ -309,6 +310,7 @@ impl HighlightConfiguration { // Store the numeric ids for all of the special captures. 
let mut injection_content_capture_index = None; let mut injection_language_capture_index = None; + let mut injection_self_capture_index = None; let mut local_def_capture_index = None; let mut local_def_value_capture_index = None; let mut local_ref_capture_index = None; @@ -318,6 +320,7 @@ impl HighlightConfiguration { match name.as_str() { "injection.content" => injection_content_capture_index = i, "injection.language" => injection_language_capture_index = i, + "injection.self" => injection_self_capture_index = i, "local.definition" => local_def_capture_index = i, "local.definition-value" => local_def_value_capture_index = i, "local.reference" => local_ref_capture_index = i, @@ -339,6 +342,7 @@ impl HighlightConfiguration { non_local_variable_patterns, injection_content_capture_index, injection_language_capture_index, + injection_self_capture_index, local_def_capture_index, local_def_value_capture_index, local_ref_capture_index, @@ -1120,6 +1124,7 @@ fn injection_for_match<'a>( ) -> (Option<&'a str>, Option>, bool) { let content_capture_index = config.injection_content_capture_index; let language_capture_index = config.injection_language_capture_index; + let self_capture_index = config.injection_self_capture_index; let mut language_name = None; let mut content_node = None; @@ -1129,6 +1134,11 @@ fn injection_for_match<'a>( language_name = capture.node.utf8_text(source).ok(); } else if index == content_capture_index { content_node = Some(capture.node); + } else if index == self_capture_index { + if let Ok(name) = capture.node.utf8_text(source) { + language_name = Some(name); + content_node = Some(capture.node); + } } } @@ -1144,6 +1154,9 @@ fn injection_for_match<'a>( } } + // Setting the `injection.self` key can be used to specify that the + // language name should be the same as the language of the current + // layer. 
"injection.self" => { if language_name.is_none() { language_name = Some(config.language_name.as_str()); From e3a5863287e1da35f41bd764a96de1b06222129e Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Mon, 21 Aug 2023 00:53:46 -0400 Subject: [PATCH 293/347] feat: add `@injection.parent` to inject an injection's node with the parent language --- cli/src/tests/highlight_test.rs | 1 + highlight/src/lib.rs | 37 ++++++++++++++++++++++++++++----- 2 files changed, 33 insertions(+), 5 deletions(-) diff --git a/cli/src/tests/highlight_test.rs b/cli/src/tests/highlight_test.rs index c4ca0b49..e400b047 100644 --- a/cli/src/tests/highlight_test.rs +++ b/cli/src/tests/highlight_test.rs @@ -24,6 +24,7 @@ lazy_static! { get_highlight_config("rust", Some("injections.scm"), &HIGHLIGHT_NAMES); static ref HIGHLIGHT_NAMES: Vec = [ "attribute", + "boolean", "carriage-return", "comment", "constant", diff --git a/highlight/src/lib.rs b/highlight/src/lib.rs index 9f4e5b8e..e118530f 100644 --- a/highlight/src/lib.rs +++ b/highlight/src/lib.rs @@ -19,6 +19,7 @@ const BUFFER_LINES_RESERVE_CAPACITY: usize = 1000; lazy_static! 
{ static ref STANDARD_CAPTURE_NAMES: HashSet<&'static str> = vec![ "attribute", + "boolean", "carriage-return", "comment", "comment.documentation", @@ -112,6 +113,7 @@ pub struct HighlightConfiguration { non_local_variable_patterns: Vec, injection_content_capture_index: Option, injection_language_capture_index: Option, + injection_parent_capture_index: Option, injection_self_capture_index: Option, local_scope_capture_index: Option, local_def_capture_index: Option, @@ -155,6 +157,7 @@ where F: FnMut(&str) -> Option<&'a HighlightConfiguration> + 'a, { source: &'a [u8], + language_name: &'a str, byte_offset: usize, highlighter: &'a mut Highlighter, injection_callback: F, @@ -199,6 +202,7 @@ impl Highlighter { ) -> Result> + 'a, Error> { let layers = HighlightIterLayer::new( source, + None, self, cancellation_flag, &mut injection_callback, @@ -214,6 +218,7 @@ impl Highlighter { assert_ne!(layers.len(), 0); let mut result = HighlightIter { source, + language_name: &config.language_name, byte_offset: 0, injection_callback, cancellation_flag, @@ -310,6 +315,7 @@ impl HighlightConfiguration { // Store the numeric ids for all of the special captures. 
let mut injection_content_capture_index = None; let mut injection_language_capture_index = None; + let mut injection_parent_capture_index = None; let mut injection_self_capture_index = None; let mut local_def_capture_index = None; let mut local_def_value_capture_index = None; @@ -320,6 +326,7 @@ impl HighlightConfiguration { match name.as_str() { "injection.content" => injection_content_capture_index = i, "injection.language" => injection_language_capture_index = i, + "injection.parent" => injection_parent_capture_index = i, "injection.self" => injection_self_capture_index = i, "local.definition" => local_def_capture_index = i, "local.definition-value" => local_def_value_capture_index = i, @@ -342,6 +349,7 @@ impl HighlightConfiguration { non_local_variable_patterns, injection_content_capture_index, injection_language_capture_index, + injection_parent_capture_index, injection_self_capture_index, local_def_capture_index, local_def_value_capture_index, @@ -418,6 +426,7 @@ impl<'a> HighlightIterLayer<'a> { /// added to the returned vector. fn new Option<&'a HighlightConfiguration> + 'a>( source: &'a [u8], + parent_name: Option<&str>, highlighter: &mut Highlighter, cancellation_flag: Option<&'a AtomicUsize>, injection_callback: &mut F, @@ -450,8 +459,13 @@ impl<'a> HighlightIterLayer<'a> { cursor.matches(combined_injections_query, tree.root_node(), source); for mat in matches { let entry = &mut injections_by_pattern_index[mat.pattern_index]; - let (language_name, content_node, include_children) = - injection_for_match(config, combined_injections_query, &mat, source); + let (language_name, content_node, include_children) = injection_for_match( + config, + parent_name, + combined_injections_query, + &mat, + source, + ); if language_name.is_some() { entry.0 = language_name; } @@ -772,8 +786,13 @@ where // If this capture represents an injection, then process the injection. 
if match_.pattern_index < layer.config.locals_pattern_index { - let (language_name, content_node, include_children) = - injection_for_match(&layer.config, &layer.config.query, &match_, &self.source); + let (language_name, content_node, include_children) = injection_for_match( + layer.config, + Some(self.language_name), + &layer.config.query, + &match_, + self.source, + ); // Explicitly remove this match so that none of its other captures will remain // in the stream of captures. @@ -791,6 +810,7 @@ where if !ranges.is_empty() { match HighlightIterLayer::new( self.source, + Some(self.language_name), self.highlighter, self.cancellation_flag, &mut self.injection_callback, @@ -1118,22 +1138,29 @@ impl HtmlRenderer { fn injection_for_match<'a>( config: &'a HighlightConfiguration, + parent_name: Option<&'a str>, query: &'a Query, query_match: &QueryMatch<'a, 'a>, source: &'a [u8], ) -> (Option<&'a str>, Option>, bool) { let content_capture_index = config.injection_content_capture_index; let language_capture_index = config.injection_language_capture_index; + let parent_capture_index = config.injection_parent_capture_index; let self_capture_index = config.injection_self_capture_index; let mut language_name = None; let mut content_node = None; + let parent_name = parent_name.unwrap_or_default(); + for capture in query_match.captures { let index = Some(capture.index); if index == language_capture_index { language_name = capture.node.utf8_text(source).ok(); } else if index == content_capture_index { content_node = Some(capture.node); + } else if index == parent_capture_index && !parent_name.is_empty() { + language_name = Some(parent_name); + content_node = Some(capture.node); } else if index == self_capture_index { if let Ok(name) = capture.node.utf8_text(source) { language_name = Some(name); @@ -1150,7 +1177,7 @@ fn injection_for_match<'a>( // that sets the injection.language key. 
"injection.language" => { if language_name.is_none() { - language_name = prop.value.as_ref().map(|s| s.as_ref()) + language_name = prop.value.as_ref().map(|s| s.as_ref()); } } From f4a6134461e844796af13fa0e86d89d0f9d27e73 Mon Sep 17 00:00:00 2001 From: DennySun2100 <138833544+DennySun2100@users.noreply.github.com> Date: Mon, 21 Aug 2023 11:54:09 -0700 Subject: [PATCH 294/347] GCC pragma causes warning on non-GNU compilers --- lib/include/tree_sitter/api.h | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/lib/include/tree_sitter/api.h b/lib/include/tree_sitter/api.h index 1cc6b3e9..5003cff7 100644 --- a/lib/include/tree_sitter/api.h +++ b/lib/include/tree_sitter/api.h @@ -1,7 +1,9 @@ #ifndef TREE_SITTER_API_H_ #define TREE_SITTER_API_H_ +#ifdef __GNUC__ #pragma GCC visibility push(default) +#endif #ifdef __cplusplus extern "C" { @@ -1165,6 +1167,8 @@ void ts_set_allocator( } #endif +#ifdef __GNUC__ #pragma GCC visibility pop +#endif #endif // TREE_SITTER_API_H_ From cd0bdf586fd910f8224f0a35969145531f66a649 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Tue, 22 Aug 2023 01:27:00 -0400 Subject: [PATCH 295/347] fix(injections): only allow setting self/parent via `#set!` --- highlight/src/lib.rs | 28 +++++++++------------------- 1 file changed, 9 insertions(+), 19 deletions(-) diff --git a/highlight/src/lib.rs b/highlight/src/lib.rs index e118530f..fad91ad9 100644 --- a/highlight/src/lib.rs +++ b/highlight/src/lib.rs @@ -113,8 +113,6 @@ pub struct HighlightConfiguration { non_local_variable_patterns: Vec, injection_content_capture_index: Option, injection_language_capture_index: Option, - injection_parent_capture_index: Option, - injection_self_capture_index: Option, local_scope_capture_index: Option, local_def_capture_index: Option, local_def_value_capture_index: Option, @@ -315,8 +313,6 @@ impl HighlightConfiguration { // Store the numeric ids for all of the special captures. 
let mut injection_content_capture_index = None; let mut injection_language_capture_index = None; - let mut injection_parent_capture_index = None; - let mut injection_self_capture_index = None; let mut local_def_capture_index = None; let mut local_def_value_capture_index = None; let mut local_ref_capture_index = None; @@ -326,8 +322,6 @@ impl HighlightConfiguration { match name.as_str() { "injection.content" => injection_content_capture_index = i, "injection.language" => injection_language_capture_index = i, - "injection.parent" => injection_parent_capture_index = i, - "injection.self" => injection_self_capture_index = i, "local.definition" => local_def_capture_index = i, "local.definition-value" => local_def_value_capture_index = i, "local.reference" => local_ref_capture_index = i, @@ -349,8 +343,6 @@ impl HighlightConfiguration { non_local_variable_patterns, injection_content_capture_index, injection_language_capture_index, - injection_parent_capture_index, - injection_self_capture_index, local_def_capture_index, local_def_value_capture_index, local_ref_capture_index, @@ -1145,12 +1137,9 @@ fn injection_for_match<'a>( ) -> (Option<&'a str>, Option>, bool) { let content_capture_index = config.injection_content_capture_index; let language_capture_index = config.injection_language_capture_index; - let parent_capture_index = config.injection_parent_capture_index; - let self_capture_index = config.injection_self_capture_index; let mut language_name = None; let mut content_node = None; - let parent_name = parent_name.unwrap_or_default(); for capture in query_match.captures { let index = Some(capture.index); @@ -1158,14 +1147,6 @@ fn injection_for_match<'a>( language_name = capture.node.utf8_text(source).ok(); } else if index == content_capture_index { content_node = Some(capture.node); - } else if index == parent_capture_index && !parent_name.is_empty() { - language_name = Some(parent_name); - content_node = Some(capture.node); - } else if index == self_capture_index { 
- if let Ok(name) = capture.node.utf8_text(source) { - language_name = Some(name); - content_node = Some(capture.node); - } } } @@ -1190,6 +1171,15 @@ fn injection_for_match<'a>( } } + // Setting the `injection.parent` key can be used to specify that + // the language name should be the same as the language of the + // parent layer + "injection.parent" => { + if language_name.is_none() { + language_name = parent_name; + } + } + // By default, injections do not include the *children* of an // `injection.content` node - only the ranges that belong to the // node itself. This can be changed using a `#set!` predicate that From 95ab103f48c9cf22837a31174ff10b38bc00f793 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Tue, 22 Aug 2023 01:36:25 -0400 Subject: [PATCH 296/347] docs: update injection properties --- docs/section-4-syntax-highlighting.md | 15 ++++++++++++--- 1 file changed, 12 insertions(+), 3 deletions(-) diff --git a/docs/section-4-syntax-highlighting.md b/docs/section-4-syntax-highlighting.md index fc2c9c17..8fd73cf6 100644 --- a/docs/section-4-syntax-highlighting.md +++ b/docs/section-4-syntax-highlighting.md @@ -362,9 +362,18 @@ All of these examples can be modeled in terms of a *parent* syntax tree and one The language injection behavior can also be configured by some properties associated with patterns: * `injection.language` - can be used to hard-code the name of a specific language. -* `injection.combined` - indicates that *all* of the matching nodes in the tree should have their content parsed as *one* nested document. -* `injection.include-children` - indicates that the `@injection.content` node's *entire* text should be re-parsed, including the text of its child nodes. By default, child nodes' text will be *excluded* from the injected document. -* `injection.self` - indicates that the `@injection.content` node should be parsed using the same language as the parent node. 
This is useful for cases where the parent node's language is not known until runtime (e.g. via inheriting another language) +* `injection.combined` - indicates that *all* of the matching nodes in the tree + should have their content parsed as *one* nested document. +* `injection.include-children` - indicates that the `@injection.content` node's + *entire* text should be re-parsed, including the text of its child nodes. By default, +child nodes' text will be *excluded* from the injected document. +* `injection.self` - indicates that the `@injection.content` node should be parsed + using the same language as the node itself. This is useful for cases where the + node's language is not known until runtime (e.g. via inheriting another language) +* `injection.parent` indicates that the `@injection.content` node should be parsed + using the same language as the node's parent language. This is only meant for injections + that need to refer back to the parent language to parse the node's text inside + the injected language. 
#### Examples From bba9809390f355e993f0a8436f83bdb125ab0e5a Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Tue, 22 Aug 2023 16:33:03 +0300 Subject: [PATCH 297/347] fix: `make install` BSDs don't have `-t` option --- Makefile | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/Makefile b/Makefile index a11214d5..b73e6363 100644 --- a/Makefile +++ b/Makefile @@ -61,16 +61,16 @@ install: all tree-sitter.pc.in > tree-sitter.pc install -d '$(DESTDIR)$(LIBDIR)' - install -m644 -t '$(DESTDIR)$(LIBDIR)' libtree-sitter.a - install -m755 -t '$(DESTDIR)$(LIBDIR)' libtree-sitter.$(SOEXTVER) + install -m644 libtree-sitter.a '$(DESTDIR)$(LIBDIR)'/ + install -m755 libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/ ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXTVER_MAJOR) ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXT) install -d '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter - install -m644 -t '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter lib/include/tree_sitter/*.h + install -m644 lib/include/tree_sitter/*.h '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter/ install -d '$(DESTDIR)$(PCLIBDIR)' - install -m644 -t '$(DESTDIR)$(PCLIBDIR)' tree-sitter.pc + install -m644 tree-sitter.pc '$(DESTDIR)$(PCLIBDIR)'/ clean: rm -f lib/src/*.o libtree-sitter.a libtree-sitter.$(SOEXT) libtree-sitter.$(SOEXTVER_MAJOR) libtree-sitter.$(SOEXTVER) From 5c7098dd5684e4f5a931053f852d40a5205557d1 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Tue, 22 Aug 2023 19:22:31 -0400 Subject: [PATCH 298/347] fix(query): debug print uses wrong variable --- lib/src/query.c | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/src/query.c b/lib/src/query.c index f7c98375..e3fd27a0 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -1907,7 +1907,7 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { } #ifdef DEBUG_ANALYZE_QUERY - printf("\nWalk states for rootless pattern step %u:\n", step_index); + 
printf("\nWalk states for rootless pattern step %u:\n", pattern_entry->step_index); #endif ts_query__perform_analysis( From 683fe442e49bb2c8b9e37c6a9b49ec5f7a50c2ac Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 23 Aug 2023 15:14:32 +0300 Subject: [PATCH 299/347] fix(gen): cycle between aliases and anonymous symbols An example of an error cycle in a `parser.c`: ``` static const TSSymbol ts_symbol_map[] = { ... [anon_sym_RBRACE] = anon_sym_RBRACE2, [anon_sym_RBRACE2] = anon_sym_RBRACE, ... }; ``` --- cli/src/generate/render.rs | 76 +++++++++++++++++++------------------- 1 file changed, 39 insertions(+), 37 deletions(-) diff --git a/cli/src/generate/render.rs b/cli/src/generate/render.rs index 197ce364..f92bf312 100644 --- a/cli/src/generate/render.rs +++ b/cli/src/generate/render.rs @@ -152,49 +152,51 @@ impl Generator { self.symbol_ids[&Symbol::end()].clone(), ); - self.symbol_map = self - .parse_table - .symbols - .iter() - .map(|symbol| { - let mut mapping = symbol; + self.symbol_map = HashMap::new(); - // There can be multiple symbols in the grammar that have the same name and kind, - // due to simple aliases. When that happens, ensure that they map to the same - // public-facing symbol. If one of the symbols is not aliased, choose that one - // to be the public-facing symbol. Otherwise, pick the symbol with the lowest - // numeric value. - if let Some(alias) = self.default_aliases.get(symbol) { - let kind = alias.kind(); - for other_symbol in &self.parse_table.symbols { - if let Some(other_alias) = self.default_aliases.get(other_symbol) { - if other_symbol < mapping && other_alias == alias { - mapping = other_symbol; + for symbol in self.parse_table.symbols.iter() { + let mut mapping = symbol; + + // There can be multiple symbols in the grammar that have the same name and kind, + // due to simple aliases. When that happens, ensure that they map to the same + // public-facing symbol. 
If one of the symbols is not aliased, choose that one + // to be the public-facing symbol. Otherwise, pick the symbol with the lowest + // numeric value. + if let Some(alias) = self.default_aliases.get(symbol) { + let kind = alias.kind(); + for other_symbol in &self.parse_table.symbols { + if let Some(other_alias) = self.default_aliases.get(other_symbol) { + if other_symbol < mapping && other_alias == alias { + mapping = other_symbol; + } + } else if self.metadata_for_symbol(*other_symbol) == (&alias.value, kind) { + mapping = other_symbol; + break; + } + } + } + // Two anonymous tokens with different flags but the same string value + // should be represented with the same symbol in the public API. Examples: + // * "<" and token(prec(1, "<")) + // * "(" and token.immediate("(") + else if symbol.is_terminal() { + let metadata = self.metadata_for_symbol(*symbol); + for other_symbol in &self.parse_table.symbols { + let other_metadata = self.metadata_for_symbol(*other_symbol); + if other_metadata == metadata { + if let Some(mapped) = self.symbol_map.get(other_symbol) { + if mapped == symbol { + break; } - } else if self.metadata_for_symbol(*other_symbol) == (&alias.value, kind) { - mapping = other_symbol; - break; - } - } - } - // Two anonymous tokens with different flags but the same string value - // should be represented with the same symbol in the public API. 
Examples: - // * "<" and token(prec(1, "<")) - // * "(" and token.immediate("(") - else if symbol.is_terminal() { - let metadata = self.metadata_for_symbol(*symbol); - for other_symbol in &self.parse_table.symbols { - let other_metadata = self.metadata_for_symbol(*other_symbol); - if other_metadata == metadata { - mapping = other_symbol; - break; } + mapping = other_symbol; + break; } } + } - (*symbol, *mapping) - }) - .collect(); + self.symbol_map.insert(*symbol, *mapping); + } for production_info in &self.parse_table.production_infos { // Build a list of all field names From 1dbb986515b32308a6f0b0e42cf4c1eef56367f6 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Wed, 23 Aug 2023 08:56:14 -0400 Subject: [PATCH 300/347] chore: add a test for an aliased anonymous symbol with flags --- cli/src/tests/query_test.rs | 90 ++++++++++++++++++++++++++++++++++++- 1 file changed, 88 insertions(+), 2 deletions(-) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index c0994d31..94d5ca97 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -1,10 +1,13 @@ use super::helpers::{ allocations, - fixtures::get_language, + fixtures::{get_language, get_test_language}, query_helpers::{assert_query_matches, Match, Pattern}, ITERATION_COUNT, }; -use crate::tests::helpers::query_helpers::{collect_captures, collect_matches}; +use crate::{ + generate::generate_parser_for_grammar, + tests::helpers::query_helpers::{collect_captures, collect_matches}, +}; use indoc::indoc; use lazy_static::lazy_static; use rand::{prelude::StdRng, SeedableRng}; @@ -4812,3 +4815,86 @@ fn test_query_max_start_depth_more() { } }); } + +#[test] +fn test_grammar_with_aliased_literal_query() { + // module.exports = grammar({ + // name: 'test', + // + // rules: { + // source: $ => repeat(choice($.compound_statement, $.expansion)), + // + // compound_statement: $ => seq(alias(token(prec(-1, '}')), '}')), + // + // expansion: $ => seq('}'), + // }, + // }); + let 
(parser_name, parser_code) = generate_parser_for_grammar( + r#" + { + "name": "test", + "rules": { + "source": { + "type": "REPEAT", + "content": { + "type": "CHOICE", + "members": [ + { + "type": "SYMBOL", + "name": "compound_statement" + }, + { + "type": "SYMBOL", + "name": "expansion" + } + ] + } + }, + "compound_statement": { + "type": "SEQ", + "members": [ + { + "type": "ALIAS", + "content": { + "type": "TOKEN", + "content": { + "type": "PREC", + "value": -1, + "content": { + "type": "STRING", + "value": "}" + } + } + }, + "named": false, + "value": "}" + } + ] + }, + "expansion": { + "type": "SEQ", + "members": [ + { + "type": "STRING", + "value": "}" + } + ] + } + } + } + "#, + ) + .unwrap(); + + let language = get_test_language(&parser_name, &parser_code, None); + + let query = Query::new( + language, + r#" + (compound_statement "}" @bracket1) + (expansion "}" @bracket2) + "#, + ); + + assert!(query.is_ok()); +} From b22e4fe3c9d9501c6c61b93ac0c06c83435ffa50 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 25 Aug 2023 16:55:08 +0300 Subject: [PATCH 301/347] chore: fix a wasm bash test --- lib/binding_web/test/parser-test.js | 22 +++++++++++----------- 1 file changed, 11 insertions(+), 11 deletions(-) diff --git a/lib/binding_web/test/parser-test.js b/lib/binding_web/test/parser-test.js index fcd714b2..74c45d96 100644 --- a/lib/binding_web/test/parser-test.js +++ b/lib/binding_web/test/parser-test.js @@ -127,19 +127,19 @@ describe("Parser", () => { it("can use the bash parser", async () => { parser.setLanguage(await Parser.Language.load(languageURL('bash'))); - tree = parser.parse("FOO=bar echo < err.txt > hello.txt \nhello\nEOF"); + tree = parser.parse("FOO=bar echo < err.txt > hello.txt \nhello${FOO}\nEOF"); assert.equal( tree.rootNode.toString(), - '(program (redirected_statement ' + - 'body: (command ' + - '(variable_assignment ' + - 'name: (variable_name) ' + - 'value: (word)) ' + - 'name: (command_name (word))) ' + - 'redirect: 
(heredoc_redirect (heredoc_start)) ' + - 'redirect: (file_redirect descriptor: (file_descriptor) destination: (word)) ' + - 'redirect: (file_redirect destination: (word))) ' + - '(heredoc_body))' + '(program ' + + '(redirected_statement ' + + 'body: (command ' + + '(variable_assignment name: (variable_name) value: (word)) ' + + 'name: (command_name (word))) ' + + 'redirect: (heredoc_redirect (heredoc_start) ' + + 'redirect: (file_redirect descriptor: (file_descriptor) destination: (word)) ' + + 'redirect: (file_redirect destination: (word)) ' + + '(heredoc_body ' + + '(expansion (variable_name))) (heredoc_end))))' ); }).timeout(5000); From e985d0e74342c78f99ff6c12dc7b7efaf597dfd3 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 25 Aug 2023 17:12:04 +0300 Subject: [PATCH 302/347] cicd: pin rust toolchain to 1.71.1 for all mips targets --- .github/workflows/build.yml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 775db7de..91cc7f5f 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -107,6 +107,11 @@ jobs: - { runtime: linux-sparc64 , cc: sparc64-linux-gnu-gcc , ar: sparc64-linux-gnu-ar } - { runtime: linux-thumbv7neon , cc: arm-linux-gnueabihf-gcc , ar: arm-linux-gnueabihf-ar } + # Rust toolchains + - { runtime: linux-mips , rust-toolchain: 1.71.1 } + - { runtime: linux-mips64 , rust-toolchain: 1.71.1 } + - { runtime: linux-mipsel , rust-toolchain: 1.71.1 } + - { runtime: linux-mips64el , rust-toolchain: 1.71.1 } # See #2041 tree-sitter issue - { runtime: windows-x64 , rust-test-threads: 1 } @@ -145,6 +150,7 @@ jobs: uses: dtolnay/rust-toolchain@stable with: targets: ${{ matrix.target }} + toolchain: ${{ matrix.rust-toolchain || 'stable' }} - name: Install cross if: ${{ matrix.use-cross }} From 5c5de9ca610a0f7037406cb82f3c715ba4e3d50c Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 25 Aug 2023 17:14:55 +0300 Subject: [PATCH 303/347] cicd: rename 
`runtime` to `platform` for better clarity --- .github/workflows/build.yml | 112 ++++++++++++++++++------------------ 1 file changed, 56 insertions(+), 56 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 91cc7f5f..05c08d2c 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -27,12 +27,12 @@ on: jobs: build: - name: ${{ matrix.runtime }} (${{ matrix.target }}) (${{ matrix.os }}) + name: ${{ matrix.platform }} (${{ matrix.target }}) (${{ matrix.os }}) runs-on: ${{ matrix.os }} strategy: fail-fast: false matrix: - runtime: + platform: - linux-arm64 # - linux-arm # - linux-armhf # @@ -60,66 +60,66 @@ jobs: include: # When adding a new `target`: - # 1. Define a new runtime alias above + # 1. Define a new platform alias above # 2. Add a new record to a matrix map in `cli/npm/install.js` - - { runtime: linux-arm64 , target: aarch64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-arm , target: arm-unknown-linux-gnueabi , os: ubuntu-latest , use-cross: true } - - { runtime: linux-armhf , target: arm-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } - - { runtime: linux-armv5te , target: armv5te-unknown-linux-gnueabi , os: ubuntu-latest , use-cross: true } - - { runtime: linux-armv7l , target: armv7-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } - - { runtime: linux-x64 , target: x86_64-unknown-linux-gnu , os: ubuntu-20.04 } #2272 - - { runtime: linux-x86 , target: i686-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-i586 , target: i586-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-mips , target: mips-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-mips64 , target: mips64-unknown-linux-gnuabi64 , os: ubuntu-latest , use-cross: true } - - { runtime: linux-mipsel , target: mipsel-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: 
linux-mips64el , target: mips64el-unknown-linux-gnuabi64 , os: ubuntu-latest , use-cross: true } - - { runtime: linux-powerpc , target: powerpc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-powerpc64 , target: powerpc64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-powerpc64el , target: powerpc64le-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-riscv64gc , target: riscv64gc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-s390x , target: s390x-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-sparc64 , target: sparc64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { runtime: linux-thumbv7neon , target: thumbv7neon-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } - - { runtime: windows-arm64 , target: aarch64-pc-windows-msvc , os: windows-latest } - - { runtime: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } - - { runtime: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } - - { runtime: macos-arm64 , target: aarch64-apple-darwin , os: macos-latest } - - { runtime: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } + - { platform: linux-arm64 , target: aarch64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-arm , target: arm-unknown-linux-gnueabi , os: ubuntu-latest , use-cross: true } + - { platform: linux-armhf , target: arm-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } + - { platform: linux-armv5te , target: armv5te-unknown-linux-gnueabi , os: ubuntu-latest , use-cross: true } + - { platform: linux-armv7l , target: armv7-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } + - { platform: linux-x64 , target: x86_64-unknown-linux-gnu , os: ubuntu-20.04 } #2272 + - { platform: linux-x86 , target: i686-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: 
linux-i586 , target: i586-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-mips , target: mips-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-mips64 , target: mips64-unknown-linux-gnuabi64 , os: ubuntu-latest , use-cross: true } + - { platform: linux-mipsel , target: mipsel-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-mips64el , target: mips64el-unknown-linux-gnuabi64 , os: ubuntu-latest , use-cross: true } + - { platform: linux-powerpc , target: powerpc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-powerpc64 , target: powerpc64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-powerpc64el , target: powerpc64le-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-riscv64gc , target: riscv64gc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-s390x , target: s390x-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-sparc64 , target: sparc64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + - { platform: linux-thumbv7neon , target: thumbv7neon-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } + - { platform: windows-arm64 , target: aarch64-pc-windows-msvc , os: windows-latest } + - { platform: windows-x64 , target: x86_64-pc-windows-msvc , os: windows-latest } + - { platform: windows-x86 , target: i686-pc-windows-msvc , os: windows-latest } + - { platform: macos-arm64 , target: aarch64-apple-darwin , os: macos-latest } + - { platform: macos-x64 , target: x86_64-apple-darwin , os: macos-latest } # Cross compilers for C library - - { runtime: linux-arm64 , cc: aarch64-linux-gnu-gcc , ar: aarch64-linux-gnu-ar } - - { runtime: linux-arm , cc: arm-linux-gnueabi-gcc , ar: arm-linux-gnueabi-ar } - - { runtime: linux-armhf , cc: arm-unknown-linux-gnueabihf-gcc , ar: arm-unknown-linux-gnueabihf-ar } - - { 
runtime: linux-armv5te , cc: arm-linux-gnueabi-gcc , ar: arm-linux-gnueabi-ar } - - { runtime: linux-armv7l , cc: arm-linux-gnueabihf-gcc , ar: arm-linux-gnueabihf-ar } - - { runtime: linux-x86 , cc: i686-linux-gnu-gcc , ar: i686-linux-gnu-ar } - - { runtime: linux-i586 , cc: i686-linux-gnu-gcc , ar: i686-linux-gnu-ar } - - { runtime: linux-mips , cc: mips-linux-gnu-gcc , ar: mips-linux-gnu-ar } - - { runtime: linux-mips64 , cc: mips64-linux-gnuabi64-gcc , ar: mips64-linux-gnuabi64-ar } - - { runtime: linux-mipsel , cc: mipsel-linux-gnu-gcc , ar: mipsel-linux-gnu-ar } - - { runtime: linux-mips64el , cc: mips64el-linux-gnuabi64-gcc , ar: mips64el-linux-gnuabi64-ar } - - { runtime: linux-powerpc , cc: powerpc-linux-gnu-gcc , ar: powerpc-linux-gnu-ar } - - { runtime: linux-powerpc64 , cc: powerpc64-linux-gnu-gcc , ar: powerpc64-linux-gnu-ar } - - { runtime: linux-powerpc64el , cc: powerpc64le-linux-gnu-gcc , ar: powerpc64le-linux-gnu-ar } - - { runtime: linux-riscv64gc , cc: riscv64-linux-gnu-gcc , ar: riscv64-linux-gnu-ar } - - { runtime: linux-s390x , cc: s390x-linux-gnu-gcc , ar: s390x-linux-gnu-ar } - - { runtime: linux-sparc64 , cc: sparc64-linux-gnu-gcc , ar: sparc64-linux-gnu-ar } - - { runtime: linux-thumbv7neon , cc: arm-linux-gnueabihf-gcc , ar: arm-linux-gnueabihf-ar } + - { platform: linux-arm64 , cc: aarch64-linux-gnu-gcc , ar: aarch64-linux-gnu-ar } + - { platform: linux-arm , cc: arm-linux-gnueabi-gcc , ar: arm-linux-gnueabi-ar } + - { platform: linux-armhf , cc: arm-unknown-linux-gnueabihf-gcc , ar: arm-unknown-linux-gnueabihf-ar } + - { platform: linux-armv5te , cc: arm-linux-gnueabi-gcc , ar: arm-linux-gnueabi-ar } + - { platform: linux-armv7l , cc: arm-linux-gnueabihf-gcc , ar: arm-linux-gnueabihf-ar } + - { platform: linux-x86 , cc: i686-linux-gnu-gcc , ar: i686-linux-gnu-ar } + - { platform: linux-i586 , cc: i686-linux-gnu-gcc , ar: i686-linux-gnu-ar } + - { platform: linux-mips , cc: mips-linux-gnu-gcc , ar: mips-linux-gnu-ar } + - { platform: 
linux-mips64 , cc: mips64-linux-gnuabi64-gcc , ar: mips64-linux-gnuabi64-ar } + - { platform: linux-mipsel , cc: mipsel-linux-gnu-gcc , ar: mipsel-linux-gnu-ar } + - { platform: linux-mips64el , cc: mips64el-linux-gnuabi64-gcc , ar: mips64el-linux-gnuabi64-ar } + - { platform: linux-powerpc , cc: powerpc-linux-gnu-gcc , ar: powerpc-linux-gnu-ar } + - { platform: linux-powerpc64 , cc: powerpc64-linux-gnu-gcc , ar: powerpc64-linux-gnu-ar } + - { platform: linux-powerpc64el , cc: powerpc64le-linux-gnu-gcc , ar: powerpc64le-linux-gnu-ar } + - { platform: linux-riscv64gc , cc: riscv64-linux-gnu-gcc , ar: riscv64-linux-gnu-ar } + - { platform: linux-s390x , cc: s390x-linux-gnu-gcc , ar: s390x-linux-gnu-ar } + - { platform: linux-sparc64 , cc: sparc64-linux-gnu-gcc , ar: sparc64-linux-gnu-ar } + - { platform: linux-thumbv7neon , cc: arm-linux-gnueabihf-gcc , ar: arm-linux-gnueabihf-ar } # Rust toolchains - - { runtime: linux-mips , rust-toolchain: 1.71.1 } - - { runtime: linux-mips64 , rust-toolchain: 1.71.1 } - - { runtime: linux-mipsel , rust-toolchain: 1.71.1 } - - { runtime: linux-mips64el , rust-toolchain: 1.71.1 } + - { platform: linux-mips , rust-toolchain: 1.71.1 } + - { platform: linux-mips64 , rust-toolchain: 1.71.1 } + - { platform: linux-mipsel , rust-toolchain: 1.71.1 } + - { platform: linux-mips64el , rust-toolchain: 1.71.1 } # See #2041 tree-sitter issue - - { runtime: windows-x64 , rust-test-threads: 1 } - - { runtime: windows-x86 , rust-test-threads: 1 } + - { platform: windows-x64 , rust-test-threads: 1 } + - { platform: windows-x86 , rust-test-threads: 1 } # CLI only build - - { runtime: windows-arm64 , cli-only: true } - - { runtime: macos-arm64 , cli-only: true } + - { platform: windows-arm64 , cli-only: true } + - { platform: macos-arm64 , cli-only: true } env: BUILD_CMD: cargo @@ -218,7 +218,7 @@ jobs: run: $BUILD_CMD build --release --target=${{ matrix.target }} - name: Info about CLI - if: ${{ startsWith(matrix.runtime, 'linux') }} + if: ${{ 
startsWith(matrix.platform, 'linux') }} run: | min_glibc=$(objdump -p target/$TARGET/release/tree-sitter${{ env.EXE }} | sed -nr 's/.*(GLIBC_.+).*/\1/p' | sort -uV | tail -n1) echo "🔗 Minimal **glibc** version required for CLI: ${min_glibc}">> $GITHUB_STEP_SUMMARY @@ -250,13 +250,13 @@ jobs: - name: Upload CLI artifact uses: actions/upload-artifact@v3 with: - name: tree-sitter.${{ matrix.runtime }} + name: tree-sitter.${{ matrix.platform }} path: target/${{ matrix.target }}/release/tree-sitter${{ env.EXE }} if-no-files-found: error retention-days: 7 - name: Upload WASM artifacts - if: ${{ matrix.runtime == 'linux-x64' }} + if: ${{ matrix.platform == 'linux-x64' }} uses: actions/upload-artifact@v3 with: name: tree-sitter.wasm From fae3c5b5cf84fdb918e89604f00445046be13b50 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 24 Aug 2023 15:55:48 +0300 Subject: [PATCH 304/347] fix(lib): improve visibility control for clang --- lib/include/tree_sitter/api.h | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/lib/include/tree_sitter/api.h b/lib/include/tree_sitter/api.h index 5003cff7..b2d8a6f5 100644 --- a/lib/include/tree_sitter/api.h +++ b/lib/include/tree_sitter/api.h @@ -1,7 +1,7 @@ #ifndef TREE_SITTER_API_H_ #define TREE_SITTER_API_H_ -#ifdef __GNUC__ +#if defined(__GNUC__) || defined(__clang__) #pragma GCC visibility push(default) #endif @@ -1167,7 +1167,7 @@ void ts_set_allocator( } #endif -#ifdef __GNUC__ +#if defined(__GNUC__) || defined(__clang__) #pragma GCC visibility pop #endif From fbfa58edc8663e9c0a825a72bef42dcfff8a1aef Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 24 Aug 2023 15:23:44 +0300 Subject: [PATCH 305/347] chore(gen): move external scanner stuff closer to the end of `parser.c` --- cli/src/generate/render.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/src/generate/render.rs b/cli/src/generate/render.rs index f92bf312..b4cf9150 100644 --- a/cli/src/generate/render.rs +++ 
b/cli/src/generate/render.rs @@ -129,6 +129,7 @@ impl Generator { } self.add_lex_modes_list(); + self.add_parse_table(); if !self.syntax_grammar.external_tokens.is_empty() { self.add_external_token_enum(); @@ -136,7 +137,6 @@ impl Generator { self.add_external_scanner_states_list(); } - self.add_parse_table(); self.add_parser_export(); self.buffer From b3fef28a1063a56c75a3ae114a6731ffb871961f Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 24 Aug 2023 19:09:10 +0300 Subject: [PATCH 306/347] chore(gen): add `parser.c` enum names to be better discoverable --- cli/src/generate/render.rs | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/cli/src/generate/render.rs b/cli/src/generate/render.rs index b4cf9150..f0d8ddec 100644 --- a/cli/src/generate/render.rs +++ b/cli/src/generate/render.rs @@ -338,7 +338,7 @@ impl Generator { } fn add_symbol_enum(&mut self) { - add_line!(self, "enum {{"); + add_line!(self, "enum ts_symbol_identifiers {{"); indent!(self); self.symbol_order.insert(Symbol::end(), 0); let mut i = 1; @@ -410,7 +410,7 @@ impl Generator { } fn add_field_name_enum(&mut self) { - add_line!(self, "enum {{"); + add_line!(self, "enum ts_field_identifiers {{"); indent!(self); for (i, field_name) in self.field_names.iter().enumerate() { add_line!(self, "{} = {},", self.field_id(field_name), i + 1); @@ -1026,7 +1026,7 @@ impl Generator { } fn add_external_token_enum(&mut self) { - add_line!(self, "enum {{"); + add_line!(self, "enum ts_external_scanner_symbol_identifiers {{"); indent!(self); for i in 0..self.syntax_grammar.external_tokens.len() { add_line!( From 13c79db3aac71281bb17ea470e9fe4664138b2fa Mon Sep 17 00:00:00 2001 From: Shem Sedrick Date: Thu, 24 Aug 2023 12:43:53 -0500 Subject: [PATCH 307/347] Updated build.zig to work with 0.11.0 --- build.zig | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/build.zig b/build.zig index 05e4f2c2..8b6a7c33 100644 --- a/build.zig +++ b/build.zig @@ -8,9 +8,9 @@ pub fn 
build(b: *std.Build) void { }); lib.linkLibC(); - lib.addCSourceFile("lib/src/lib.c", &.{}); - lib.addIncludePath("lib/include"); - lib.addIncludePath("lib/src"); + lib.addCSourceFile(.{ .file = .{ .path = "lib/src/lib.c" }, .flags = &.{} }); + lib.addIncludePath(.{ .path = "lib/include" }); + lib.addIncludePath(.{ .path = "lib/src" }); b.installArtifact(lib); } From 69697666641d60fd816adb2e7329c857d68ebe25 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Thu, 24 Aug 2023 02:54:59 -0400 Subject: [PATCH 308/347] fix: ignore regex u flag It's needed for certain regex patterns in JS, and we can just silently ignore it. --- cli/src/generate/parse_grammar.rs | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/cli/src/generate/parse_grammar.rs b/cli/src/generate/parse_grammar.rs index 88bd57c1..e8eca095 100644 --- a/cli/src/generate/parse_grammar.rs +++ b/cli/src/generate/parse_grammar.rs @@ -150,10 +150,10 @@ fn parse_rule(json: RuleJSON) -> Rule { f.chars() .filter(|c| { if *c != 'i' { - eprintln!("Warning: unsupported flag {}", c); + eprintln!("Warning: unsupported flag {c}"); false } else { - true + *c != 'u' // silently ignore unicode flag } }) .collect() From b412d86f198573f4303c671534d7358fdb04f0f1 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 26 Aug 2023 20:50:23 +0300 Subject: [PATCH 309/347] fix: makefile should install only `api.h` header --- Makefile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Makefile b/Makefile index b73e6363..eb4075f0 100644 --- a/Makefile +++ b/Makefile @@ -67,7 +67,7 @@ install: all ln -sf libtree-sitter.$(SOEXTVER) '$(DESTDIR)$(LIBDIR)'/libtree-sitter.$(SOEXT) install -d '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter - install -m644 lib/include/tree_sitter/*.h '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter/ + install -m644 lib/include/tree_sitter/api.h '$(DESTDIR)$(INCLUDEDIR)'/tree_sitter/ install -d '$(DESTDIR)$(PCLIBDIR)' install -m644 tree-sitter.pc '$(DESTDIR)$(PCLIBDIR)'/ From 
60779cc1acb9929a10a773c4dbad304c5f524f1e Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sat, 26 Aug 2023 20:57:08 +0300 Subject: [PATCH 310/347] fix(gen): `parser.c` should include `parser.h` relatively --- cli/src/generate/render.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cli/src/generate/render.rs b/cli/src/generate/render.rs index f0d8ddec..69fa3c48 100644 --- a/cli/src/generate/render.rs +++ b/cli/src/generate/render.rs @@ -256,7 +256,7 @@ impl Generator { } fn add_includes(&mut self) { - add_line!(self, "#include "); + add_line!(self, "#include \"tree_sitter/parser.h\""); add_line!(self, ""); } From a4ea4737ac13ec0e0a34a26624330010f51b27be Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Fri, 25 Aug 2023 18:28:27 -0400 Subject: [PATCH 311/347] fix: do not increment `current_included_range_index` past `included_range_count` in `__do_advance` --- cli/src/tests/mod.rs | 1 + cli/src/tests/parser_hang_test.rs | 61 +++++++++++++++++++ lib/src/lexer.c | 4 +- .../get_col_should_hang_not_crash/corpus.txt | 0 .../get_col_should_hang_not_crash/grammar.js | 13 ++++ .../get_col_should_hang_not_crash/scanner.c | 17 ++++++ 6 files changed, 95 insertions(+), 1 deletion(-) create mode 100644 cli/src/tests/parser_hang_test.rs create mode 100644 test/fixtures/test_grammars/get_col_should_hang_not_crash/corpus.txt create mode 100644 test/fixtures/test_grammars/get_col_should_hang_not_crash/grammar.js create mode 100644 test/fixtures/test_grammars/get_col_should_hang_not_crash/scanner.c diff --git a/cli/src/tests/mod.rs b/cli/src/tests/mod.rs index e579209f..308fc2c5 100644 --- a/cli/src/tests/mod.rs +++ b/cli/src/tests/mod.rs @@ -5,6 +5,7 @@ mod helpers; mod highlight_test; mod language_test; mod node_test; +mod parser_hang_test; mod parser_test; mod pathological_test; mod query_test; diff --git a/cli/src/tests/parser_hang_test.rs b/cli/src/tests/parser_hang_test.rs new file mode 100644 index 00000000..cfa34957 --- /dev/null +++ 
b/cli/src/tests/parser_hang_test.rs @@ -0,0 +1,61 @@ +use pretty_assertions::assert_eq; +use tree_sitter::Parser; + +use crate::{ + generate::generate_parser_for_grammar, + tests::helpers::fixtures::{fixtures_dir, get_test_language}, +}; + +#[test] +fn test_grammar_that_should_hang_and_not_segfault() { + use std::sync::mpsc; + + let (tx, rx) = mpsc::channel(); + + std::thread::spawn(move || { + let (parser_name, parser_code) = generate_parser_for_grammar( + r#" + { + "name": "get_col_should_hang_not_crash", + "rules": { + "source_file": { + "type": "SEQ", + "members": [ { "type": "SYMBOL", "name": "test" } ] + } + }, + "extras": [ { "type": "PATTERN", "value": "\\s" } ], + "externals": [ { "type": "SYMBOL", "name": "test" } ] + } + "#, + ) + .unwrap(); + + let mut parser = Parser::new(); + parser + .set_language(get_test_language( + &parser_name, + &parser_code, + Some( + fixtures_dir() + .join("test_grammars") + .join("get_col_should_hang_not_crash") + .as_path(), + ), + )) + .unwrap(); + + let code_that_should_hang = "\nHello"; + + parser.parse(code_that_should_hang, None).unwrap(); + + // Won't be reached + let _ = tx.send(()); + }); + + // Ok signifies that it did not hang + // RecvTimeoutError::Disconnected signifies that the parser thread exited unexpectedly (crashed) + assert_eq!( + rx.recv_timeout(std::time::Duration::from_secs(5)), + Err(mpsc::RecvTimeoutError::Timeout) + ); +} diff --git a/lib/src/lexer.c b/lib/src/lexer.c index e32158b2..d108c04e 100644 --- a/lib/src/lexer.c +++ b/lib/src/lexer.c @@ -172,7 +172,9 @@ static void ts_lexer__do_advance(Lexer *self, bool skip) { self->current_position.bytes >= current_range->end_byte || current_range->end_byte == current_range->start_byte ) { - self->current_included_range_index++; + if (self->current_included_range_index < self->included_range_count) { + self->current_included_range_index++; + } if (self->current_included_range_index < self->included_range_count) { current_range++; self->current_position = 
(Length) { diff --git a/test/fixtures/test_grammars/get_col_should_hang_not_crash/corpus.txt b/test/fixtures/test_grammars/get_col_should_hang_not_crash/corpus.txt new file mode 100644 index 00000000..e69de29b diff --git a/test/fixtures/test_grammars/get_col_should_hang_not_crash/grammar.js b/test/fixtures/test_grammars/get_col_should_hang_not_crash/grammar.js new file mode 100644 index 00000000..83d57d2c --- /dev/null +++ b/test/fixtures/test_grammars/get_col_should_hang_not_crash/grammar.js @@ -0,0 +1,13 @@ +module.exports = grammar({ + name: 'get_col_should_hang_not_crash', + + externals: $ => [ + $.test, + ], + + rules: { + source_file: $ => seq( + $.test + ), + }, +}); diff --git a/test/fixtures/test_grammars/get_col_should_hang_not_crash/scanner.c b/test/fixtures/test_grammars/get_col_should_hang_not_crash/scanner.c new file mode 100644 index 00000000..d21ec6d4 --- /dev/null +++ b/test/fixtures/test_grammars/get_col_should_hang_not_crash/scanner.c @@ -0,0 +1,17 @@ +#include + +unsigned tree_sitter_get_col_should_hang_not_crash_external_scanner_serialize() { return 0; } + +void tree_sitter_get_col_should_hang_not_crash_external_scanner_deserialize() {} + +void *tree_sitter_get_col_should_hang_not_crash_external_scanner_create() { return NULL; } + +void tree_sitter_get_col_should_hang_not_crash_external_scanner_destroy() {} + +bool tree_sitter_get_col_should_hang_not_crash_external_scanner_scan(void *payload, TSLexer *lexer, + const bool *valid_symbols) { + while (true) { + lexer->advance(lexer, false); + lexer->get_column(lexer); + } +} From b205a1f5a2c8980853ee537dd34b52c8bd4de3bd Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 27 Aug 2023 18:37:15 +0300 Subject: [PATCH 312/347] Run parser hang test in a killable subprocess --- cli/src/tests/parser_hang_test.rs | 114 ++++++++++++++++++------------ 1 file changed, 70 insertions(+), 44 deletions(-) diff --git a/cli/src/tests/parser_hang_test.rs b/cli/src/tests/parser_hang_test.rs index 
cfa34957..ab4273e3 100644 --- a/cli/src/tests/parser_hang_test.rs +++ b/cli/src/tests/parser_hang_test.rs @@ -1,61 +1,87 @@ -use pretty_assertions::assert_eq; -use tree_sitter::Parser; - use crate::{ - generate::generate_parser_for_grammar, + generate::{generate_parser_for_grammar, load_grammar_file}, tests::helpers::fixtures::{fixtures_dir, get_test_language}, }; +use std::{ + env::VarError, + process::{Command, Stdio}, +}; +use tree_sitter::Parser; #[test] fn test_grammar_that_should_hang_and_not_segfault() { - use std::sync::mpsc; + let parent_sleep_millis = 1000; + let test_name = "test_grammar_that_should_hang_and_not_segfault"; + let test_var = "CARGO_HANG_TEST"; - let (tx, rx) = mpsc::channel(); + eprintln!(" {test_name}"); - std::thread::spawn(move || { - let (parser_name, parser_code) = generate_parser_for_grammar( - r#" - { - "name": "get_col_should_hang_not_crash", - "rules": { - "source_file": { - "type": "SEQ", - "members": [ { "type": "SYMBOL", "name": "test" } ] + let tests_exec_path = std::env::args() + .nth(0) + .expect("Failed get get tests executable path"); + + match std::env::var(test_var) { + Ok(v) if v == test_name => { + eprintln!(" child process id {}", std::process::id()); + hang_test(); + } + + Err(VarError::NotPresent) => { + eprintln!(" parent process id {}", std::process::id()); + if true { + let mut command = Command::new(tests_exec_path); + command.arg(test_name).env(test_var, test_name); + if std::env::args().any(|x| x == "--nocapture") { + command.arg("--nocapture"); + } else { + command.stdout(Stdio::null()).stderr(Stdio::null()); + } + match command.spawn() { + Ok(mut child) => { + std::thread::sleep(std::time::Duration::from_millis(parent_sleep_millis)); + match child.try_wait() { + Ok(Some(status)) if status.success() => { + panic!("Child wasn't hang and exited successfully") + } + Ok(Some(status)) => panic!( + "Child wasn't hang and exited with status code: {:?}", + status.code() + ), + _ => (), + } + if let Err(e) = 
child.kill() { + eprintln!( + "Failed to kill hang test sub process id: {}, error: {e}", + child.id() + ); + } } - }, - "extras": [ { "type": "PATTERN", "value": "\\s" } ], - "externals": [ { "type": "SYMBOL", "name": "test" } ] + Err(e) => panic!("{e}"), + } } - "#, - ) - .unwrap(); + } + + Err(e) => panic!("Env var error: {e}"), + _ => unreachable!(), + } + + fn hang_test() { + let test_grammar_dir = fixtures_dir() + .join("test_grammars") + .join("get_col_should_hang_not_crash"); + + let grammar_json = load_grammar_file(&test_grammar_dir.join("grammar.js"), None).unwrap(); + let (parser_name, parser_code) = + generate_parser_for_grammar(grammar_json.as_str()).unwrap(); + + let language = + get_test_language(&parser_name, &parser_code, Some(test_grammar_dir.as_path())); let mut parser = Parser::new(); - parser - .set_language(get_test_language( - &parser_name, - &parser_code, - Some( - fixtures_dir() - .join("test_grammars") - .join("get_col_should_hang_not_crash") - .as_path(), - ), - )) - .unwrap(); + parser.set_language(language).unwrap(); let code_that_should_hang = "\nHello"; parser.parse(code_that_should_hang, None).unwrap(); - - // Won't be reached - let _ = tx.send(()); - }); - - // Ok signifies that it did not hang - // RecvTimeoutError::Disconnected signifies that the parser thread exited unexpectedly (crashed) - assert_eq!( - rx.recv_timeout(std::time::Duration::from_secs(5)), - Err(mpsc::RecvTimeoutError::Timeout) - ); + } } From a9c4965dd620c086e5419f71117ec46de8fb5b99 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 28 Aug 2023 04:46:07 +0300 Subject: [PATCH 313/347] cicd: exclude hang tests for exotic arches and ASAN --- .github/workflows/sanitize.yml | 4 ++-- cli/src/tests/parser_hang_test.rs | 12 ++++++++++++ 2 files changed, 14 insertions(+), 2 deletions(-) diff --git a/.github/workflows/sanitize.yml b/.github/workflows/sanitize.yml index 834c5ab4..2ece182b 100644 --- a/.github/workflows/sanitize.yml +++ b/.github/workflows/sanitize.yml 
@@ -36,14 +36,14 @@ jobs: env: UBSAN_OPTIONS: halt_on_error=1 CFLAGS: -fsanitize=undefined - RUSTFLAGS: -lubsan + RUSTFLAGS: ${{ env.RUSTFLAGS }} -lubsan run: cargo test -- --test-threads 1 - name: Run main tests with address sanitizer (ASAN) env: ASAN_OPTIONS: halt_on_error=1 CFLAGS: -fsanitize=address - RUSTFLAGS: -Zsanitizer=address + RUSTFLAGS: ${{ env.RUSTFLAGS }} -Zsanitizer=address --cfg=sanitizing run: | rustup install nightly rustup component add rust-src --toolchain nightly-x86_64-unknown-linux-gnu diff --git a/cli/src/tests/parser_hang_test.rs b/cli/src/tests/parser_hang_test.rs index ab4273e3..b8274804 100644 --- a/cli/src/tests/parser_hang_test.rs +++ b/cli/src/tests/parser_hang_test.rs @@ -1,3 +1,6 @@ +// For some reasons `Command::spawn` doesn't work in CI env for many exotic arches. +#![cfg(all(any(target_arch = "x86_64", target_arch = "x86"), not(sanitizing)))] + use crate::{ generate::{generate_parser_for_grammar, load_grammar_file}, tests::helpers::fixtures::{fixtures_dir, get_test_language}, @@ -8,6 +11,15 @@ use std::{ }; use tree_sitter::Parser; +// The `sanitizing` cfg is required to don't run tests under specific sunitizer +// because they don't work well with subprocesses _(it's an assumption)_. +// +// Bellow are two alternative examples of how to disable tests for some arches +// if a way with excluding the whole mod from compilation would work well. 
+// +// #[cfg(all(any(target_arch = "x86_64", target_arch = "x86"), not(sanitizing)))] +// #[cfg_attr(not(all(any(target_arch = "x86_64", target_arch = "x86"), not(sanitizing))), ignore)] +// #[test] fn test_grammar_that_should_hang_and_not_segfault() { let parent_sleep_millis = 1000; From cbce87dab11adf8a91c60c307470b18cb2d44b41 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 28 Aug 2023 14:16:36 +0300 Subject: [PATCH 314/347] chore: add an extra notes for hang tests --- cli/src/tests/parser_hang_test.rs | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/cli/src/tests/parser_hang_test.rs b/cli/src/tests/parser_hang_test.rs index b8274804..02a2689c 100644 --- a/cli/src/tests/parser_hang_test.rs +++ b/cli/src/tests/parser_hang_test.rs @@ -15,7 +15,12 @@ use tree_sitter::Parser; // because they don't work well with subprocesses _(it's an assumption)_. // // Bellow are two alternative examples of how to disable tests for some arches -// if a way with excluding the whole mod from compilation would work well. +// if a way with excluding the whole mod from compilation wouldn't work well. 
+// +// XXX: Also may be it makes sense to keep such tests as ignored by default +// to omit surprises and enable them on CI by passing an extra option explicitly: +// +// > cargo test -- --include-ignored // // #[cfg(all(any(target_arch = "x86_64", target_arch = "x86"), not(sanitizing)))] // #[cfg_attr(not(all(any(target_arch = "x86_64", target_arch = "x86"), not(sanitizing))), ignore)] From 4fabc49066300f51e538c545f05f9196089018f7 Mon Sep 17 00:00:00 2001 From: mgunyho <20118130+mgunyho@users.noreply.github.com> Date: Mon, 28 Aug 2023 19:26:33 +0300 Subject: [PATCH 315/347] doc: Fix broken link --- lib/binding_rust/lib.rs | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index de3065d2..de9dd0dc 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -342,7 +342,8 @@ impl Language { FieldId::new(id) } - /// Get the next parse state. Combine this with [lookahead_iterator] to + /// Get the next parse state. Combine this with + /// [lookahead_iterator](Language::lookahead_iterator) to /// generate completion suggestions or valid symbols in error nodes. /// /// Example: From dcfd91fc25e6e3d9cec8db213046af3329062e41 Mon Sep 17 00:00:00 2001 From: mgunyho <20118130+mgunyho@users.noreply.github.com> Date: Mon, 28 Aug 2023 19:26:37 +0300 Subject: [PATCH 316/347] doc: Add internal links to backticked text where applicable --- lib/binding_rust/lib.rs | 42 ++++++++++++++++++++--------------------- 1 file changed, 21 insertions(+), 21 deletions(-) diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index de9dd0dc..c44dd7f5 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -78,13 +78,13 @@ pub struct InputEdit { pub new_end_position: Point, } -/// A single node within a syntax `Tree`. +/// A single node within a syntax [`Tree`]. 
#[doc(alias = "TSNode")] #[derive(Clone, Copy)] #[repr(transparent)] pub struct Node<'tree>(ffi::TSNode, PhantomData<&'tree ()>); -/// A stateful object that this is used to produce a `Tree` based on some source code. +/// A stateful object that this is used to produce a [`Tree`] based on some source code. #[doc(alias = "TSParser")] pub struct Parser(NonNull); @@ -105,7 +105,7 @@ type FieldId = NonZeroU16; /// A callback that receives log messages during parser. type Logger<'a> = Box; -/// A stateful object for walking a syntax `Tree` efficiently. +/// A stateful object for walking a syntax [Tree] efficiently. #[doc(alias = "TSTreeCursor")] pub struct TreeCursor<'cursor>(ffi::TSTreeCursor, PhantomData<&'cursor ()>); @@ -145,13 +145,13 @@ impl From for CaptureQuantifier { } } -/// A stateful object for executing a `Query` on a syntax `Tree`. +/// A stateful object for executing a [`Query`] on a syntax [`Tree`]. #[doc(alias = "TSQueryCursor")] pub struct QueryCursor { ptr: NonNull, } -/// A key-value pair associated with a particular pattern in a `Query`. +/// A key-value pair associated with a particular pattern in a [`Query`]. #[derive(Debug, PartialEq, Eq)] pub struct QueryProperty { pub key: Box, @@ -165,14 +165,14 @@ pub enum QueryPredicateArg { String(Box), } -/// A key-value pair associated with a particular pattern in a `Query`. +/// A key-value pair associated with a particular pattern in a [`Query`]. #[derive(Debug, PartialEq, Eq)] pub struct QueryPredicate { pub operator: Box, pub args: Vec, } -/// A match of a `Query` to a particular set of `Node`s. +/// A match of a [`Query`] to a particular set of [`Node`]s. pub struct QueryMatch<'cursor, 'tree> { pub pattern_index: usize, pub captures: &'cursor [QueryCapture<'tree>], @@ -180,7 +180,7 @@ pub struct QueryMatch<'cursor, 'tree> { cursor: *mut ffi::TSQueryCursor, } -/// A sequence of `QueryMatch`es associated with a given `QueryCursor`. 
+/// A sequence of [`QueryMatch`]es associated with a given [`QueryCursor`]. pub struct QueryMatches<'query, 'cursor, T: TextProvider, I: AsRef<[u8]>> { ptr: *mut ffi::TSQueryCursor, query: &'query Query, @@ -190,7 +190,7 @@ pub struct QueryMatches<'query, 'cursor, T: TextProvider, I: AsRef<[u8]>> { _phantom: PhantomData<(&'cursor (), I)>, } -/// A sequence of `QueryCapture`s associated with a given `QueryCursor`. +/// A sequence of [`QueryCapture`]s associated with a given [`QueryCursor`]. pub struct QueryCaptures<'query, 'cursor, T: TextProvider, I: AsRef<[u8]>> { ptr: *mut ffi::TSQueryCursor, query: &'query Query, @@ -208,7 +208,7 @@ where fn text(&mut self, node: Node) -> Self::I; } -/// A particular `Node` that has been captured with a particular name within a `Query`. +/// A particular [`Node`] that has been captured with a particular name within a [`Query`]. #[derive(Clone, Copy, Debug)] #[repr(C)] pub struct QueryCapture<'tree> { @@ -216,17 +216,17 @@ pub struct QueryCapture<'tree> { pub index: u32, } -/// An error that occurred when trying to assign an incompatible `Language` to a `Parser`. +/// An error that occurred when trying to assign an incompatible [`Language`] to a [`Parser`]. #[derive(Debug, PartialEq, Eq)] pub struct LanguageError { version: usize, } -/// An error that occurred in `Parser::set_included_ranges`. +/// An error that occurred in [`Parser::set_included_ranges`]. #[derive(Debug, PartialEq, Eq)] pub struct IncludedRangesError(pub usize); -/// An error that occurred when trying to create a `Query`. +/// An error that occurred when trying to create a [`Query`]. #[derive(Debug, PartialEq, Eq)] pub struct QueryError { pub row: usize, @@ -264,7 +264,7 @@ pub struct LossyUtf8<'a> { impl Language { /// Get the ABI version number that indicates which version of the Tree-sitter CLI - /// that was used to generate this `Language`. + /// that was used to generate this [`Language`]. 
#[doc(alias = "ts_language_version")] pub fn version(&self) -> usize { unsafe { ffi::ts_language_version(self.0) as usize } @@ -632,10 +632,10 @@ impl Parser { /// Instruct the parser to start the next parse from the beginning. /// - /// If the parser previously failed because of a timeout or a cancellation, then - /// by default, it will resume where it left off on the next call to `parse` or - /// other parsing functions. If you don't want to resume, and instead intend to - /// use this parser to parse some other document, you must call `reset` first. + /// If the parser previously failed because of a timeout or a cancellation, then by default, it + /// will resume where it left off on the next call to [`parse`](Parser::parse) or other parsing + /// functions. If you don't want to resume, and instead intend to use this parser to parse some + /// other document, you must call `reset` first. #[doc(alias = "ts_parser_reset")] pub fn reset(&mut self) { unsafe { ffi::ts_parser_reset(self.0.as_ptr()) } @@ -653,7 +653,7 @@ impl Parser { /// take before halting. /// /// If parsing takes longer than this, it will halt early, returning `None`. - /// See `parse` for more information. + /// See [`parse`](Parser::parse) for more information. #[doc(alias = "ts_parser_set_timeout_micros")] pub fn set_timeout_micros(&mut self, timeout_micros: u64) { unsafe { ffi::ts_parser_set_timeout_micros(self.0.as_ptr(), timeout_micros) } @@ -1068,7 +1068,7 @@ impl<'tree> Node<'tree> { /// allocations, you should reuse the same cursor for subsequent calls to /// this method. /// - /// If you're walking the tree recursively, you may want to use the `TreeCursor` + /// If you're walking the tree recursively, you may want to use the [`TreeCursor`] /// APIs directly instead. pub fn children<'cursor>( &self, @@ -1440,7 +1440,7 @@ impl<'cursor> TreeCursor<'cursor> { /// Re-initialize a tree cursor to the same position as another cursor. 
/// - /// Unlike `reset`, this will not lose parent information and + /// Unlike [`reset`](TreeCursor::reset), this will not lose parent information and /// allows reusing already created cursors. #[doc(alias = "ts_tree_cursor_reset_to")] pub fn reset_to(&mut self, cursor: TreeCursor<'cursor>) { From 8d894bb0500a3481735141983dee203084bca18a Mon Sep 17 00:00:00 2001 From: mgunyho <20118130+mgunyho@users.noreply.github.com> Date: Mon, 28 Aug 2023 19:26:38 +0300 Subject: [PATCH 317/347] doc: Add backticks to all internal links --- lib/binding_rust/ffi.rs | 32 ++++++++--------- lib/binding_rust/lib.rs | 78 ++++++++++++++++++++--------------------- 2 files changed, 55 insertions(+), 55 deletions(-) diff --git a/lib/binding_rust/ffi.rs b/lib/binding_rust/ffi.rs index a99d2afe..a962e6c1 100644 --- a/lib/binding_rust/ffi.rs +++ b/lib/binding_rust/ffi.rs @@ -18,7 +18,7 @@ use crate::{ use std::{marker::PhantomData, mem::ManuallyDrop, ptr::NonNull, str}; impl Language { - /// Reconstructs a [Language] from a raw pointer. + /// Reconstructs a [`Language`] from a raw pointer. /// /// # Safety /// @@ -27,14 +27,14 @@ impl Language { Language(ptr) } - /// Consumes the [Language], returning a raw pointer to the underlying C structure. + /// Consumes the [`Language`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *const TSLanguage { ManuallyDrop::new(self).0 } } impl Parser { - /// Reconstructs a [Parser] from a raw pointer. + /// Reconstructs a [`Parser`] from a raw pointer. /// /// # Safety /// @@ -43,7 +43,7 @@ impl Parser { Parser(NonNull::new_unchecked(ptr)) } - /// Consumes the [Parser], returning a raw pointer to the underlying C structure. + /// Consumes the [`Parser`], returning a raw pointer to the underlying C structure. /// /// # Safety /// @@ -56,7 +56,7 @@ impl Parser { } impl Tree { - /// Reconstructs a [Tree] from a raw pointer. + /// Reconstructs a [`Tree`] from a raw pointer. 
/// /// # Safety /// @@ -65,14 +65,14 @@ impl Tree { Tree(NonNull::new_unchecked(ptr)) } - /// Consumes the [Tree], returning a raw pointer to the underlying C structure. + /// Consumes the [`Tree`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSTree { ManuallyDrop::new(self).0.as_ptr() } } impl<'tree> Node<'tree> { - /// Reconstructs a [Node] from a raw pointer. + /// Reconstructs a [`Node`] from a raw pointer. /// /// # Safety /// @@ -81,14 +81,14 @@ impl<'tree> Node<'tree> { Node(raw, PhantomData) } - /// Consumes the [Node], returning a raw pointer to the underlying C structure. + /// Consumes the [`Node`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> TSNode { ManuallyDrop::new(self).0 } } impl<'a> TreeCursor<'a> { - /// Reconstructs a [TreeCursor] from a raw pointer. + /// Reconstructs a [`TreeCursor`] from a raw pointer. /// /// # Safety /// @@ -97,14 +97,14 @@ impl<'a> TreeCursor<'a> { TreeCursor(raw, PhantomData) } - /// Consumes the [TreeCursor], returning a raw pointer to the underlying C structure. + /// Consumes the [`TreeCursor`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> TSTreeCursor { ManuallyDrop::new(self).0 } } impl Query { - /// Reconstructs a [Query] from a raw pointer. + /// Reconstructs a [`Query`] from a raw pointer. /// /// # Safety /// @@ -113,14 +113,14 @@ impl Query { Query::from_raw_parts(ptr, source) } - /// Consumes the [Query], returning a raw pointer to the underlying C structure. + /// Consumes the [`Query`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSQuery { ManuallyDrop::new(self).ptr.as_ptr() } } impl QueryCursor { - /// Reconstructs a [QueryCursor] from a raw pointer. + /// Reconstructs a [`QueryCursor`] from a raw pointer. 
/// /// # Safety /// @@ -131,14 +131,14 @@ impl QueryCursor { } } - /// Consumes the [QueryCursor], returning a raw pointer to the underlying C structure. + /// Consumes the [`QueryCursor`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSQueryCursor { ManuallyDrop::new(self).ptr.as_ptr() } } impl LookaheadIterator { - /// Reconstructs a [LookaheadIterator] from a raw pointer. + /// Reconstructs a [`LookaheadIterator`] from a raw pointer. /// /// # Safety /// @@ -147,7 +147,7 @@ impl LookaheadIterator { LookaheadIterator(NonNull::new_unchecked(ptr)) } - /// Consumes the [LookaheadIterator], returning a raw pointer to the underlying C structure. + /// Consumes the [`LookaheadIterator`], returning a raw pointer to the underlying C structure. pub fn into_raw(self) -> *mut TSLookaheadIterator { ManuallyDrop::new(self).0.as_ptr() } diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index c44dd7f5..3c8d7504 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -105,7 +105,7 @@ type FieldId = NonZeroU16; /// A callback that receives log messages during parser. type Logger<'a> = Box; -/// A stateful object for walking a syntax [Tree] efficiently. +/// A stateful object for walking a syntax [`Tree`] efficiently. #[doc(alias = "TSTreeCursor")] pub struct TreeCursor<'cursor>(ffi::TSTreeCursor, PhantomData<&'cursor ()>); @@ -343,7 +343,7 @@ impl Language { } /// Get the next parse state. Combine this with - /// [lookahead_iterator](Language::lookahead_iterator) to + /// [`lookahead_iterator`](Language::lookahead_iterator) to /// generate completion suggestions or valid symbols in error nodes. /// /// Example: @@ -359,9 +359,9 @@ impl Language { /// /// This returns `None` if state is invalid for this language. /// - /// Iterating [LookaheadIterator] will yield valid symbols in the given + /// Iterating [`LookaheadIterator`] will yield valid symbols in the given /// parse state. 
Newly created lookahead iterators will return the `ERROR` - /// symbol from [LookaheadIterator::current_symbol]. + /// symbol from [`LookaheadIterator::current_symbol`]. /// /// Lookahead iterators can be useful to generate suggestions and improve /// syntax error diagnostics. To get symbols valid in an ERROR node, use the @@ -389,9 +389,9 @@ impl Parser { /// Returns a Result indicating whether or not the language was successfully /// assigned. True means assignment succeeded. False means there was a version /// mismatch: the language was generated with an incompatible version of the - /// Tree-sitter CLI. Check the language's version using [Language::version] - /// and compare it to this library's [LANGUAGE_VERSION](LANGUAGE_VERSION) and - /// [MIN_COMPATIBLE_LANGUAGE_VERSION](MIN_COMPATIBLE_LANGUAGE_VERSION) constants. + /// Tree-sitter CLI. Check the language's version using [`Language::version`] + /// and compare it to this library's [`LANGUAGE_VERSION`](LANGUAGE_VERSION) and + /// [`MIN_COMPATIBLE_LANGUAGE_VERSION`](MIN_COMPATIBLE_LANGUAGE_VERSION) constants. #[doc(alias = "ts_parser_set_language")] pub fn set_language(&mut self, language: Language) -> Result<(), LanguageError> { let version = language.version(); @@ -487,12 +487,12 @@ impl Parser { /// * `old_tree` A previous syntax tree parsed from the same document. /// If the text of the document has changed since `old_tree` was /// created, then you must edit `old_tree` to match the new text using - /// [Tree::edit]. + /// [`Tree::edit`]. 
/// - /// Returns a [Tree] if parsing succeeded, or `None` if: - /// * The parser has not yet had a language assigned with [Parser::set_language] - /// * The timeout set with [Parser::set_timeout_micros] expired - /// * The cancellation flag set with [Parser::set_cancellation_flag] was flipped + /// Returns a [`Tree`] if parsing succeeded, or `None` if: + /// * The parser has not yet had a language assigned with [`Parser::set_language`] + /// * The timeout set with [`Parser::set_timeout_micros`] expired + /// * The cancellation flag set with [`Parser::set_cancellation_flag`] was flipped #[doc(alias = "ts_parser_parse")] pub fn parse(&mut self, text: impl AsRef<[u8]>, old_tree: Option<&Tree>) -> Option { let bytes = text.as_ref(); @@ -510,7 +510,7 @@ impl Parser { /// * `old_tree` A previous syntax tree parsed from the same document. /// If the text of the document has changed since `old_tree` was /// created, then you must edit `old_tree` to match the new text using - /// [Tree::edit]. + /// [`Tree::edit`]. pub fn parse_utf16( &mut self, input: impl AsRef<[u16]>, @@ -534,7 +534,7 @@ impl Parser { /// * `old_tree` A previous syntax tree parsed from the same document. /// If the text of the document has changed since `old_tree` was /// created, then you must edit `old_tree` to match the new text using - /// [Tree::edit]. + /// [`Tree::edit`]. pub fn parse_with, F: FnMut(usize, Point) -> T>( &mut self, callback: &mut F, @@ -584,7 +584,7 @@ impl Parser { /// * `old_tree` A previous syntax tree parsed from the same document. /// If the text of the document has changed since `old_tree` was /// created, then you must edit `old_tree` to match the new text using - /// [Tree::edit]. + /// [`Tree::edit`]. pub fn parse_utf16_with, F: FnMut(usize, Point) -> T>( &mut self, callback: &mut F, @@ -643,7 +643,7 @@ impl Parser { /// Get the duration in microseconds that parsing is allowed to take. /// - /// This is set via [set_timeout_micros](Parser::set_timeout_micros). 
+ /// This is set via [`set_timeout_micros`](Parser::set_timeout_micros). #[doc(alias = "ts_parser_timeout_micros")] pub fn timeout_micros(&self) -> u64 { unsafe { ffi::ts_parser_timeout_micros(self.0.as_ptr()) } @@ -711,7 +711,7 @@ impl Parser { /// /// If a pointer is assigned, then the parser will periodically read from /// this pointer during parsing. If it reads a non-zero value, it will halt early, - /// returning `None`. See [parse](Parser::parse) for more information. + /// returning `None`. See [`parse`](Parser::parse) for more information. #[doc(alias = "ts_parser_set_cancellation_flag")] pub unsafe fn set_cancellation_flag(&mut self, flag: Option<&AtomicUsize>) { if let Some(flag) = flag { @@ -771,7 +771,7 @@ impl Tree { unsafe { ffi::ts_tree_edit(self.0.as_ptr(), &edit) }; } - /// Create a new [TreeCursor] starting from the root of the tree. + /// Create a new [`TreeCursor`] starting from the root of the tree. pub fn walk(&self) -> TreeCursor { self.root_node().walk() } @@ -781,7 +781,7 @@ impl Tree { /// /// For this to work correctly, this syntax tree must have been edited such that its /// ranges match up to the new tree. Generally, you'll want to call this method right - /// after calling one of the [Parser::parse] functions. Call it on the old tree that + /// after calling one of the [`Parser::parse`] functions. Call it on the old tree that /// was passed to parse, and pass the new tree that was returned from `parse`. #[doc(alias = "ts_tree_get_changed_ranges")] pub fn changed_ranges(&self, other: &Tree) -> impl ExactSizeIterator { @@ -882,7 +882,7 @@ impl<'tree> Node<'tree> { .unwrap() } - /// Get the [Language] that was used to parse this node's syntax tree. + /// Get the [`Language`] that was used to parse this node's syntax tree. 
#[doc(alias = "ts_node_language")] pub fn language(&self) -> Language { Language(unsafe { ffi::ts_node_language(self.0) }) @@ -996,7 +996,7 @@ impl<'tree> Node<'tree> { /// /// This method is fairly fast, but its cost is technically log(i), so you /// if you might be iterating over a long list of children, you should use - /// [Node::children] instead. + /// [`Node::children`] instead. #[doc(alias = "ts_node_child")] pub fn child(&self, i: usize) -> Option { Self::new(unsafe { ffi::ts_node_child(self.0, i as u32) }) @@ -1010,10 +1010,10 @@ impl<'tree> Node<'tree> { /// Get this node's *named* child at the given index. /// - /// See also [Node::is_named]. + /// See also [`Node::is_named`]. /// This method is fairly fast, but its cost is technically log(i), so you /// if you might be iterating over a long list of children, you should use - /// [Node::named_children] instead. + /// [`Node::named_children`] instead. #[doc(alias = "ts_node_named_child")] pub fn named_child(&self, i: usize) -> Option { Self::new(unsafe { ffi::ts_node_named_child(self.0, i as u32) }) @@ -1021,7 +1021,7 @@ impl<'tree> Node<'tree> { /// Get this node's number of *named* children. /// - /// See also [Node::is_named]. + /// See also [`Node::is_named`]. #[doc(alias = "ts_node_named_child_count")] pub fn named_child_count(&self) -> usize { unsafe { ffi::ts_node_named_child_count(self.0) as usize } @@ -1030,7 +1030,7 @@ impl<'tree> Node<'tree> { /// Get the first child with the given field name. /// /// If multiple children may have the same field name, access them using - /// [children_by_field_name](Node::children_by_field_name) + /// [`children_by_field_name`](Node::children_by_field_name) #[doc(alias = "ts_node_child_by_field_name")] pub fn child_by_field_name(&self, field_name: impl AsRef<[u8]>) -> Option { let field_name = field_name.as_ref(); @@ -1045,8 +1045,8 @@ impl<'tree> Node<'tree> { /// Get this node's child with the given numerical field id. 
/// - /// See also [child_by_field_name](Node::child_by_field_name). You can convert a field name to - /// an id using [Language::field_id_for_name]. + /// See also [`child_by_field_name`](Node::child_by_field_name). You can convert a field name to + /// an id using [`Language::field_id_for_name`]. #[doc(alias = "ts_node_child_by_field_id")] pub fn child_by_field_id(&self, field_id: u16) -> Option { Self::new(unsafe { ffi::ts_node_child_by_field_id(self.0, field_id) }) @@ -1063,8 +1063,8 @@ impl<'tree> Node<'tree> { /// Iterate over this node's children. /// - /// A [TreeCursor] is used to retrieve the children efficiently. Obtain - /// a [TreeCursor] by calling [Tree::walk] or [Node::walk]. To avoid unnecessary + /// A [`TreeCursor`] is used to retrieve the children efficiently. Obtain + /// a [`TreeCursor`] by calling [`Tree::walk`] or [`Node::walk`]. To avoid unnecessary /// allocations, you should reuse the same cursor for subsequent calls to /// this method. /// @@ -1085,7 +1085,7 @@ impl<'tree> Node<'tree> { /// Iterate over this node's named children. /// - /// See also [Node::children]. + /// See also [`Node::children`]. pub fn named_children<'cursor>( &self, cursor: &'cursor mut TreeCursor<'tree>, @@ -1106,7 +1106,7 @@ impl<'tree> Node<'tree> { /// Iterate over this node's children with a given field name. /// - /// See also [Node::children]. + /// See also [`Node::children`]. pub fn children_by_field_name<'cursor>( &self, field_name: &str, @@ -1137,7 +1137,7 @@ impl<'tree> Node<'tree> { /// Iterate over this node's children with a given field id. /// - /// See also [Node::children_by_field_name]. + /// See also [`Node::children_by_field_name`]. pub fn children_by_field_id<'cursor>( &self, field_id: FieldId, @@ -1250,7 +1250,7 @@ impl<'tree> Node<'tree> { &source.as_ref()[self.start_byte()..self.end_byte()] } - /// Create a new [TreeCursor] starting from this node. + /// Create a new [`TreeCursor`] starting from this node. 
#[doc(alias = "ts_tree_cursor_new")] pub fn walk(&self) -> TreeCursor<'tree> { TreeCursor(unsafe { ffi::ts_tree_cursor_new(self.0) }, PhantomData) @@ -1259,9 +1259,9 @@ impl<'tree> Node<'tree> { /// Edit this node to keep it in-sync with source code that has been edited. /// /// This function is only rarely needed. When you edit a syntax tree with the - /// [Tree::edit] method, all of the nodes that you retrieve from the tree - /// afterward will already reflect the edit. You only need to use [Node::edit] - /// when you have a specific [Node] instance that you want to keep and continue + /// [`Tree::edit`] method, all of the nodes that you retrieve from the tree + /// afterward will already reflect the edit. You only need to use [`Node::edit`] + /// when you have a specific [`Node`] instance that you want to keep and continue /// to use after an edit. #[doc(alias = "ts_node_edit")] pub fn edit(&mut self, edit: &InputEdit) { @@ -1301,7 +1301,7 @@ impl fmt::Debug for Node<'_> { } impl<'cursor> TreeCursor<'cursor> { - /// Get the tree cursor's current [Node]. + /// Get the tree cursor's current [`Node`]. #[doc(alias = "ts_tree_cursor_current_node")] pub fn node(&self) -> Node<'cursor> { Node( @@ -1312,7 +1312,7 @@ impl<'cursor> TreeCursor<'cursor> { /// Get the numerical field id of this tree cursor's current node. /// - /// See also [field_name](TreeCursor::field_name). + /// See also [`field_name`](TreeCursor::field_name). #[doc(alias = "ts_tree_cursor_current_field_id")] pub fn field_id(&self) -> Option { let id = unsafe { ffi::ts_tree_cursor_current_field_id(&self.0) }; @@ -1330,7 +1330,7 @@ impl<'cursor> TreeCursor<'cursor> { /// Get the numerical field id of this tree cursor's current node. /// - /// See also [field_name](TreeCursor::field_name). + /// See also [`field_name`](TreeCursor::field_name). 
#[doc(alias = "ts_tree_cursor_current_depth")] pub fn depth(&self) -> u32 { unsafe { ffi::ts_tree_cursor_current_depth(&self.0) } From bdc0e44d45234af7581ff362d1193cbded588cfd Mon Sep 17 00:00:00 2001 From: mgunyho <20118130+mgunyho@users.noreply.github.com> Date: Mon, 28 Aug 2023 19:52:29 +0300 Subject: [PATCH 318/347] doc: Include README in top-level module documentation --- lib/binding_rust/lib.rs | 2 ++ 1 file changed, 2 insertions(+) diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 3c8d7504..9cd04563 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -1,3 +1,5 @@ +#![doc = include_str!("./README.md")] + pub mod ffi; mod util; From 08629215371fa434db92e0b1f6fadd34544bba9a Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 28 Aug 2023 21:16:02 +0300 Subject: [PATCH 319/347] doc: Include README as top-level module documentation for all crates --- cli/config/README.md | 6 ++++-- cli/config/src/lib.rs | 2 +- cli/loader/README.md | 4 ++-- cli/loader/src/lib.rs | 2 ++ cli/src/lib.rs | 2 ++ highlight/README.md | 2 +- highlight/src/lib.rs | 2 ++ tags/README.md | 2 +- tags/src/lib.rs | 2 ++ 9 files changed, 17 insertions(+), 7 deletions(-) diff --git a/cli/config/README.md b/cli/config/README.md index 8cbfbcf4..e7d7b39b 100644 --- a/cli/config/README.md +++ b/cli/config/README.md @@ -1,5 +1,7 @@ -# `tree-sitter-config` +# Tree-sitter Config + +Manages Tree-sitter's configuration file. You can use a configuration file to control the behavior of the `tree-sitter` -command-line program. This crate implements the logic for finding and the +command-line program. This crate implements the logic for finding and the parsing the contents of the configuration file. diff --git a/cli/config/src/lib.rs b/cli/config/src/lib.rs index 3cd09b8d..83b85358 100644 --- a/cli/config/src/lib.rs +++ b/cli/config/src/lib.rs @@ -1,4 +1,4 @@ -//! Manages tree-sitter's configuration file. 
+#![doc = include_str!("../README.md")] use anyhow::{anyhow, Context, Result}; use serde::{Deserialize, Serialize}; diff --git a/cli/loader/README.md b/cli/loader/README.md index 9889ec71..a3c18674 100644 --- a/cli/loader/README.md +++ b/cli/loader/README.md @@ -1,6 +1,6 @@ -# `tree-sitter-loader` +# Tree-sitter Loader The `tree-sitter` command-line program will dynamically find and build grammars at runtime, if you have cloned the grammars' repositories to your local -filesystem. This helper crate implements that logic, so that you can use it in +filesystem. This helper crate implements that logic, so that you can use it in your own program analysis tools, as well. diff --git a/cli/loader/src/lib.rs b/cli/loader/src/lib.rs index 2b3896ef..3022b6b9 100644 --- a/cli/loader/src/lib.rs +++ b/cli/loader/src/lib.rs @@ -1,3 +1,5 @@ +#![doc = include_str!("../README.md")] + use anyhow::{anyhow, Context, Error, Result}; use libloading::{Library, Symbol}; use once_cell::unsync::OnceCell; diff --git a/cli/src/lib.rs b/cli/src/lib.rs index d52b516a..549db773 100644 --- a/cli/src/lib.rs +++ b/cli/src/lib.rs @@ -1,3 +1,5 @@ +#![doc = include_str!("../README.md")] + pub mod generate; pub mod highlight; pub mod logger; diff --git a/highlight/README.md b/highlight/README.md index 95b229eb..459790ef 100644 --- a/highlight/README.md +++ b/highlight/README.md @@ -1,4 +1,4 @@ -# `tree-sitter-highlight` +# Tree-sitter Highlight [![crates.io badge]][crates.io] diff --git a/highlight/src/lib.rs b/highlight/src/lib.rs index fad91ad9..2903c7c5 100644 --- a/highlight/src/lib.rs +++ b/highlight/src/lib.rs @@ -1,3 +1,5 @@ +#![doc = include_str!("../README.md")] + pub mod c_lib; pub mod util; pub use c_lib as c; diff --git a/tags/README.md b/tags/README.md index f5b85cb2..d7daac79 100644 --- a/tags/README.md +++ b/tags/README.md @@ -1,4 +1,4 @@ -# `tree-sitter-tags` +# Tree-sitter Tags [![crates.io badge]][crates.io] diff --git a/tags/src/lib.rs b/tags/src/lib.rs index 13499d86..0cf1bf96 
100644 --- a/tags/src/lib.rs +++ b/tags/src/lib.rs @@ -1,3 +1,5 @@ +#![doc = include_str!("../README.md")] + pub mod c_lib; use memchr::memchr; From 756e51867d7b47616e86d4205f3cca81f06f462e Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 28 Aug 2023 22:48:46 +0300 Subject: [PATCH 320/347] doc: fix `cargo doc` warnings --- cli/Cargo.toml | 1 + lib/binding_rust/bindings.rs | 2 +- lib/include/tree_sitter/api.h | 5 +++-- 3 files changed, 5 insertions(+), 3 deletions(-) diff --git a/cli/Cargo.toml b/cli/Cargo.toml index de703c85..0edd3c3d 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -14,6 +14,7 @@ rust-version.workspace = true [[bin]] name = "tree-sitter" path = "src/main.rs" +doc = false [[bench]] name = "benchmark" diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index 225fbc11..3cf38097 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -164,7 +164,7 @@ extern "C" { pub fn ts_parser_set_language(self_: *mut TSParser, language: *const TSLanguage) -> bool; } extern "C" { - #[doc = " Set the ranges of text that the parser should include when parsing.\n\n By default, the parser will always include entire documents. This function\n allows you to parse only a *portion* of a document but still return a syntax\n tree whose ranges match up with the document as a whole. You can also pass\n multiple disjoint ranges.\n\n The second and third parameters specify the location and length of an array\n of ranges. The parser does *not* take ownership of these ranges; it copies\n the data, so it doesn't matter how these ranges are allocated.\n\n If `count` is zero, then the entire document will be parsed. Otherwise,\n the given ranges must be ordered from earliest to latest in the document,\n and they must not overlap. 
That is, the following must hold for all\n `i` < `count - 1`: ranges[i].end_byte <= ranges[i + 1].start_byte\n\n If this requirement is not satisfied, the operation will fail, the ranges\n will not be assigned, and this function will return `false`. On success,\n this function returns `true`"] + #[doc = " Set the ranges of text that the parser should include when parsing.\n\n By default, the parser will always include entire documents. This function\n allows you to parse only a *portion* of a document but still return a syntax\n tree whose ranges match up with the document as a whole. You can also pass\n multiple disjoint ranges.\n\n The second and third parameters specify the location and length of an array\n of ranges. The parser does *not* take ownership of these ranges; it copies\n the data, so it doesn't matter how these ranges are allocated.\n\n If `count` is zero, then the entire document will be parsed. Otherwise,\n the given ranges must be ordered from earliest to latest in the document,\n and they must not overlap. That is, the following must hold for all:\n\n `i < count - 1`: `ranges[i].end_byte <= ranges[i + 1].start_byte`\n\n If this requirement is not satisfied, the operation will fail, the ranges\n will not be assigned, and this function will return `false`. On success,\n this function returns `true`"] pub fn ts_parser_set_included_ranges( self_: *mut TSParser, ranges: *const TSRange, diff --git a/lib/include/tree_sitter/api.h b/lib/include/tree_sitter/api.h index b2d8a6f5..9072bb60 100644 --- a/lib/include/tree_sitter/api.h +++ b/lib/include/tree_sitter/api.h @@ -192,8 +192,9 @@ bool ts_parser_set_language(TSParser *self, const TSLanguage *language); * * If `count` is zero, then the entire document will be parsed. Otherwise, * the given ranges must be ordered from earliest to latest in the document, - * and they must not overlap. 
That is, the following must hold for all - * `i` < `count - 1`: ranges[i].end_byte <= ranges[i + 1].start_byte + * and they must not overlap. That is, the following must hold for all: + * + * `i < count - 1`: `ranges[i].end_byte <= ranges[i + 1].start_byte` * * If this requirement is not satisfied, the operation will fail, the ranges * will not be assigned, and this function will return `false`. On success, From f9117a022145695b1bf083c943a384fac4b9144a Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 28 Aug 2023 23:05:36 +0300 Subject: [PATCH 321/347] doc: Add internal links for `api.h` funcs --- lib/binding_rust/bindings.rs | 54 ++++++++--------- lib/include/tree_sitter/api.h | 111 ++++++++++++++++++---------------- 2 files changed, 85 insertions(+), 80 deletions(-) diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index 3cf38097..a0e52f6c 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -160,7 +160,7 @@ extern "C" { pub fn ts_parser_language(self_: *const TSParser) -> *const TSLanguage; } extern "C" { - #[doc = " Set the language that the parser should use for parsing.\n\n Returns a boolean indicating whether or not the language was successfully\n assigned. True means assignment succeeded. False means there was a version\n mismatch: the language was generated with an incompatible version of the\n Tree-sitter CLI. Check the language's version using `ts_language_version`\n and compare it to this library's `TREE_SITTER_LANGUAGE_VERSION` and\n `TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION` constants."] + #[doc = " Set the language that the parser should use for parsing.\n\n Returns a boolean indicating whether or not the language was successfully\n assigned. True means assignment succeeded. False means there was a version\n mismatch: the language was generated with an incompatible version of the\n Tree-sitter CLI. 
Check the language's version using [`ts_language_version`]\n and compare it to this library's [`TREE_SITTER_LANGUAGE_VERSION`] and\n [`TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION`] constants."] pub fn ts_parser_set_language(self_: *mut TSParser, language: *const TSLanguage) -> bool; } extern "C" { @@ -176,7 +176,7 @@ extern "C" { pub fn ts_parser_included_ranges(self_: *const TSParser, count: *mut u32) -> *const TSRange; } extern "C" { - #[doc = " Use the parser to parse some source code and create a syntax tree.\n\n If you are parsing this document for the first time, pass `NULL` for the\n `old_tree` parameter. Otherwise, if you have already parsed an earlier\n version of this document and the document has since been edited, pass the\n previous syntax tree so that the unchanged parts of it can be reused.\n This will save time and memory. For this to work correctly, you must have\n already edited the old syntax tree using the `ts_tree_edit` function in a\n way that exactly matches the source code changes.\n\n The `TSInput` parameter lets you specify how to read the text. It has the\n following three fields:\n 1. `read`: A function to retrieve a chunk of text at a given byte offset\n and (row, column) position. The function should return a pointer to the\n text and write its length to the `bytes_read` pointer. The parser does\n not take ownership of this buffer; it just borrows it until it has\n finished reading it. The function should write a zero value to the\n `bytes_read` pointer to indicate the end of the document.\n 2. `payload`: An arbitrary pointer that will be passed to each invocation\n of the `read` function.\n 3. `encoding`: An indication of how the text is encoded. Either\n `TSInputEncodingUTF8` or `TSInputEncodingUTF16`.\n\n This function returns a syntax tree on success, and `NULL` on failure. There\n are three possible reasons for failure:\n 1. The parser does not have a language assigned. Check for this using the\n`ts_parser_language` function.\n 2. 
Parsing was cancelled due to a timeout that was set by an earlier call to\n the `ts_parser_set_timeout_micros` function. You can resume parsing from\n where the parser left out by calling `ts_parser_parse` again with the\n same arguments. Or you can start parsing from scratch by first calling\n `ts_parser_reset`.\n 3. Parsing was cancelled using a cancellation flag that was set by an\n earlier call to `ts_parser_set_cancellation_flag`. You can resume parsing\n from where the parser left out by calling `ts_parser_parse` again with\n the same arguments."] + #[doc = " Use the parser to parse some source code and create a syntax tree.\n\n If you are parsing this document for the first time, pass `NULL` for the\n `old_tree` parameter. Otherwise, if you have already parsed an earlier\n version of this document and the document has since been edited, pass the\n previous syntax tree so that the unchanged parts of it can be reused.\n This will save time and memory. For this to work correctly, you must have\n already edited the old syntax tree using the [`ts_tree_edit`] function in a\n way that exactly matches the source code changes.\n\n The [`TSInput`] parameter lets you specify how to read the text. It has the\n following three fields:\n 1. [`read`]: A function to retrieve a chunk of text at a given byte offset\n and (row, column) position. The function should return a pointer to the\n text and write its length to the [`bytes_read`] pointer. The parser does\n not take ownership of this buffer; it just borrows it until it has\n finished reading it. The function should write a zero value to the\n [`bytes_read`] pointer to indicate the end of the document.\n 2. [`payload`]: An arbitrary pointer that will be passed to each invocation\n of the [`read`] function.\n 3. [`encoding`]: An indication of how the text is encoded. Either\n `TSInputEncodingUTF8` or `TSInputEncodingUTF16`.\n\n This function returns a syntax tree on success, and `NULL` on failure. 
There\n are three possible reasons for failure:\n 1. The parser does not have a language assigned. Check for this using the\n[`ts_parser_language`] function.\n 2. Parsing was cancelled due to a timeout that was set by an earlier call to\n the [`ts_parser_set_timeout_micros`] function. You can resume parsing from\n where the parser left out by calling [`ts_parser_parse`] again with the\n same arguments. Or you can start parsing from scratch by first calling\n [`ts_parser_reset`].\n 3. Parsing was cancelled using a cancellation flag that was set by an\n earlier call to [`ts_parser_set_cancellation_flag`]. You can resume parsing\n from where the parser left out by calling [`ts_parser_parse`] again with\n the same arguments.\n\n [`read`]: TSInput::read\n [`payload`]: TSInput::payload\n [`encoding`]: TSInput::encoding\n [`bytes_read`]: TSInput::read"] pub fn ts_parser_parse( self_: *mut TSParser, old_tree: *const TSTree, @@ -184,7 +184,7 @@ extern "C" { ) -> *mut TSTree; } extern "C" { - #[doc = " Use the parser to parse some source code stored in one contiguous buffer.\n The first two parameters are the same as in the `ts_parser_parse` function\n above. The second two parameters indicate the location of the buffer and its\n length in bytes."] + #[doc = " Use the parser to parse some source code stored in one contiguous buffer.\n The first two parameters are the same as in the [`ts_parser_parse`] function\n above. The second two parameters indicate the location of the buffer and its\n length in bytes."] pub fn ts_parser_parse_string( self_: *mut TSParser, old_tree: *const TSTree, @@ -193,7 +193,7 @@ extern "C" { ) -> *mut TSTree; } extern "C" { - #[doc = " Use the parser to parse some source code stored in one contiguous buffer with\n a given encoding. The first four parameters work the same as in the\n `ts_parser_parse_string` method above. 
The final parameter indicates whether\n the text is encoded as UTF8 or UTF16."] + #[doc = " Use the parser to parse some source code stored in one contiguous buffer with\n a given encoding. The first four parameters work the same as in the\n [`ts_parser_parse_string`] method above. The final parameter indicates whether\n the text is encoded as UTF8 or UTF16."] pub fn ts_parser_parse_string_encoding( self_: *mut TSParser, old_tree: *const TSTree, @@ -203,11 +203,11 @@ extern "C" { ) -> *mut TSTree; } extern "C" { - #[doc = " Instruct the parser to start the next parse from the beginning.\n\n If the parser previously failed because of a timeout or a cancellation, then\n by default, it will resume where it left off on the next call to\n `ts_parser_parse` or other parsing functions. If you don't want to resume,\n and instead intend to use this parser to parse some other document, you must\n call `ts_parser_reset` first."] + #[doc = " Instruct the parser to start the next parse from the beginning.\n\n If the parser previously failed because of a timeout or a cancellation, then\n by default, it will resume where it left off on the next call to\n [`ts_parser_parse`] or other parsing functions. 
If you don't want to resume,\n and instead intend to use this parser to parse some other document, you must\n call [`ts_parser_reset`] first."] pub fn ts_parser_reset(self_: *mut TSParser); } extern "C" { - #[doc = " Set the maximum duration in microseconds that parsing should be allowed to\n take before halting.\n\n If parsing takes longer than this, it will halt early, returning NULL.\n See `ts_parser_parse` for more information."] + #[doc = " Set the maximum duration in microseconds that parsing should be allowed to\n take before halting.\n\n If parsing takes longer than this, it will halt early, returning NULL.\n See [`ts_parser_parse`] for more information."] pub fn ts_parser_set_timeout_micros(self_: *mut TSParser, timeout_micros: u64); } extern "C" { @@ -215,7 +215,7 @@ extern "C" { pub fn ts_parser_timeout_micros(self_: *const TSParser) -> u64; } extern "C" { - #[doc = " Set the parser's current cancellation flag pointer.\n\n If a non-null pointer is assigned, then the parser will periodically read\n from this pointer during parsing. If it reads a non-zero value, it will\n halt early, returning NULL. See `ts_parser_parse` for more information."] + #[doc = " Set the parser's current cancellation flag pointer.\n\n If a non-null pointer is assigned, then the parser will periodically read\n from this pointer during parsing. If it reads a non-zero value, it will\n halt early, returning NULL. See [`ts_parser_parse`] for more information."] pub fn ts_parser_set_cancellation_flag(self_: *mut TSParser, flag: *const usize); } extern "C" { @@ -267,7 +267,7 @@ extern "C" { pub fn ts_tree_edit(self_: *mut TSTree, edit: *const TSInputEdit); } extern "C" { - #[doc = " Compare an old edited syntax tree to a new syntax tree representing the same\n document, returning an array of ranges whose syntactic structure has changed.\n\n For this to work correctly, the old syntax tree must have been edited such\n that its ranges match up to the new tree. 
Generally, you'll want to call\n this function right after calling one of the `ts_parser_parse` functions.\n You need to pass the old tree that was passed to parse, as well as the new\n tree that was returned from that function.\n\n The returned array is allocated using `malloc` and the caller is responsible\n for freeing it using `free`. The length of the array will be written to the\n given `length` pointer."] + #[doc = " Compare an old edited syntax tree to a new syntax tree representing the same\n document, returning an array of ranges whose syntactic structure has changed.\n\n For this to work correctly, the old syntax tree must have been edited such\n that its ranges match up to the new tree. Generally, you'll want to call\n this function right after calling one of the [`ts_parser_parse`] functions.\n You need to pass the old tree that was passed to parse, as well as the new\n tree that was returned from that function.\n\n The returned array is allocated using `malloc` and the caller is responsible\n for freeing it using `free`. The length of the array will be written to the\n given `length` pointer."] pub fn ts_tree_get_changed_ranges( old_tree: *const TSTree, new_tree: *const TSTree, @@ -295,7 +295,7 @@ extern "C" { pub fn ts_node_grammar_type(self_: TSNode) -> *const ::std::os::raw::c_char; } extern "C" { - #[doc = " Get the node's type as a numerical id as it appears in the grammar ignoring\n aliases. This should be used in `ts_language_next_state` instead of\n `ts_node_symbol`."] + #[doc = " Get the node's type as a numerical id as it appears in the grammar ignoring\n aliases. This should be used in [`ts_language_next_state`] instead of\n [`ts_node_symbol`]."] pub fn ts_node_grammar_symbol(self_: TSNode) -> TSSymbol; } extern "C" { @@ -319,7 +319,7 @@ extern "C" { pub fn ts_node_string(self_: TSNode) -> *mut ::std::os::raw::c_char; } extern "C" { - #[doc = " Check if the node is null. 
Functions like `ts_node_child` and\n `ts_node_next_sibling` will return a null node to indicate that no such node\n was found."] + #[doc = " Check if the node is null. Functions like [`ts_node_child`] and\n [`ts_node_next_sibling`] will return a null node to indicate that no such node\n was found."] pub fn ts_node_is_null(self_: TSNode) -> bool; } extern "C" { @@ -374,11 +374,11 @@ extern "C" { pub fn ts_node_child_count(self_: TSNode) -> u32; } extern "C" { - #[doc = " Get the node's *named* child at the given index.\n\n See also `ts_node_is_named`."] + #[doc = " Get the node's *named* child at the given index.\n\n See also [`ts_node_is_named`]."] pub fn ts_node_named_child(self_: TSNode, child_index: u32) -> TSNode; } extern "C" { - #[doc = " Get the node's number of *named* children.\n\n See also `ts_node_is_named`."] + #[doc = " Get the node's number of *named* children.\n\n See also [`ts_node_is_named`]."] pub fn ts_node_named_child_count(self_: TSNode) -> u32; } extern "C" { @@ -390,7 +390,7 @@ extern "C" { ) -> TSNode; } extern "C" { - #[doc = " Get the node's child with the given numerical field id.\n\n You can convert a field name to an id using the\n `ts_language_field_id_for_name` function."] + #[doc = " Get the node's child with the given numerical field id.\n\n You can convert a field name to an id using the\n [`ts_language_field_id_for_name`] function."] pub fn ts_node_child_by_field_id(self_: TSNode, field_id: TSFieldId) -> TSNode; } extern "C" { @@ -442,7 +442,7 @@ extern "C" { ) -> TSNode; } extern "C" { - #[doc = " Edit the node to keep it in-sync with source code that has been edited.\n\n This function is only rarely needed. When you edit a syntax tree with the\n `ts_tree_edit` function, all of the nodes that you retrieve from the tree\n afterward will already reflect the edit. 
You only need to use `ts_node_edit`\n when you have a `TSNode` instance that you want to keep and continue to use\n after an edit."] + #[doc = " Edit the node to keep it in-sync with source code that has been edited.\n\n This function is only rarely needed. When you edit a syntax tree with the\n [`ts_tree_edit`] function, all of the nodes that you retrieve from the tree\n afterward will already reflect the edit. You only need to use [`ts_node_edit`]\n when you have a [`TSNode`] instance that you want to keep and continue to use\n after an edit."] pub fn ts_node_edit(self_: *mut TSNode, edit: *const TSInputEdit); } extern "C" { @@ -450,7 +450,7 @@ extern "C" { pub fn ts_node_eq(self_: TSNode, other: TSNode) -> bool; } extern "C" { - #[doc = " Create a new tree cursor starting from the given node.\n\n A tree cursor allows you to walk a syntax tree more efficiently than is\n possible using the `TSNode` functions. It is a mutable object that is always\n on a certain syntax node, and can be moved imperatively to different nodes."] + #[doc = " Create a new tree cursor starting from the given node.\n\n A tree cursor allows you to walk a syntax tree more efficiently than is\n possible using the [`TSNode`] functions. 
It is a mutable object that is always\n on a certain syntax node, and can be moved imperatively to different nodes."] pub fn ts_tree_cursor_new(node: TSNode) -> TSTreeCursor; } extern "C" { @@ -462,7 +462,7 @@ extern "C" { pub fn ts_tree_cursor_reset(self_: *mut TSTreeCursor, node: TSNode); } extern "C" { - #[doc = " Re-initialize a tree cursor to the same position as another cursor.\n\n Unlike `ts_tree_cursor_reset`, this will not lose parent information and\n allows reusing already created cursors."] + #[doc = " Re-initialize a tree cursor to the same position as another cursor.\n\n Unlike [`ts_tree_cursor_reset`], this will not lose parent information and\n allows reusing already created cursors."] pub fn ts_tree_cursor_reset_to(dst: *mut TSTreeCursor, src: *const TSTreeCursor); } extern "C" { @@ -470,13 +470,13 @@ extern "C" { pub fn ts_tree_cursor_current_node(self_: *const TSTreeCursor) -> TSNode; } extern "C" { - #[doc = " Get the field name of the tree cursor's current node.\n\n This returns `NULL` if the current node doesn't have a field.\n See also `ts_node_child_by_field_name`."] + #[doc = " Get the field name of the tree cursor's current node.\n\n This returns `NULL` if the current node doesn't have a field.\n See also [`ts_node_child_by_field_name`]."] pub fn ts_tree_cursor_current_field_name( self_: *const TSTreeCursor, ) -> *const ::std::os::raw::c_char; } extern "C" { - #[doc = " Get the field id of the tree cursor's current node.\n\n This returns zero if the current node doesn't have a field.\n See also `ts_node_child_by_field_id`, `ts_language_field_id_for_name`."] + #[doc = " Get the field id of the tree cursor's current node.\n\n This returns zero if the current node doesn't have a field.\n See also [`ts_node_child_by_field_id`], [`ts_language_field_id_for_name`]."] pub fn ts_tree_cursor_current_field_id(self_: *const TSTreeCursor) -> TSFieldId; } extern "C" { @@ -488,7 +488,7 @@ extern "C" { pub fn ts_tree_cursor_goto_next_sibling(self_: *mut 
TSTreeCursor) -> bool; } extern "C" { - #[doc = " Move the cursor to the previous sibling of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false` if\n there was no previous sibling node.\n\n Note, that this function may be slower than\n `ts_tree_cursor_goto_next_sibling` due to how node positions are stored. In\n the worst case, this will need to iterate through all the children upto the\n previous sibling node to recalculate its position."] + #[doc = " Move the cursor to the previous sibling of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false` if\n there was no previous sibling node.\n\n Note, that this function may be slower than\n [`ts_tree_cursor_goto_next_sibling`] due to how node positions are stored. In\n the worst case, this will need to iterate through all the children upto the\n previous sibling node to recalculate its position."] pub fn ts_tree_cursor_goto_previous_sibling(self_: *mut TSTreeCursor) -> bool; } extern "C" { @@ -496,7 +496,7 @@ extern "C" { pub fn ts_tree_cursor_goto_first_child(self_: *mut TSTreeCursor) -> bool; } extern "C" { - #[doc = " Move the cursor to the last child of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false` if\n there were no children.\n\n Note that this function may be slower than `ts_tree_cursor_goto_first_child`\n because it needs to iterate through all the children to compute the child's\n position."] + #[doc = " Move the cursor to the last child of its current node.\n\n This returns `true` if the cursor successfully moved, and returns `false` if\n there were no children.\n\n Note that this function may be slower than [`ts_tree_cursor_goto_first_child`]\n because it needs to iterate through all the children to compute the child's\n position."] pub fn ts_tree_cursor_goto_last_child(self_: *mut TSTreeCursor) -> bool; } extern "C" { @@ -528,7 +528,7 @@ extern "C" { pub fn 
ts_tree_cursor_copy(cursor: *const TSTreeCursor) -> TSTreeCursor; } extern "C" { - #[doc = " Create a new query from a string containing one or more S-expression\n patterns. The query is associated with a particular language, and can\n only be run on syntax nodes parsed with that language.\n\n If all of the given patterns are valid, this returns a `TSQuery`.\n If a pattern is invalid, this returns `NULL`, and provides two pieces\n of information about the problem:\n 1. The byte offset of the error is written to the `error_offset` parameter.\n 2. The type of error is written to the `error_type` parameter."] + #[doc = " Create a new query from a string containing one or more S-expression\n patterns. The query is associated with a particular language, and can\n only be run on syntax nodes parsed with that language.\n\n If all of the given patterns are valid, this returns a [`TSQuery`].\n If a pattern is invalid, this returns `NULL`, and provides two pieces\n of information about the problem:\n 1. The byte offset of the error is written to the `error_offset` parameter.\n 2. The type of error is written to the `error_type` parameter."] pub fn ts_query_new( language: *const TSLanguage, source: *const ::std::os::raw::c_char, @@ -556,7 +556,7 @@ extern "C" { pub fn ts_query_start_byte_for_pattern(self_: *const TSQuery, pattern_index: u32) -> u32; } extern "C" { - #[doc = " Get all of the predicates for the given pattern in the query.\n\n The predicates are represented as a single array of steps. There are three\n types of steps in this array, which correspond to the three legal values for\n the `type` field:\n - `TSQueryPredicateStepTypeCapture` - Steps with this type represent names\n of captures. Their `value_id` can be used with the\n `ts_query_capture_name_for_id` function to obtain the name of the capture.\n - `TSQueryPredicateStepTypeString` - Steps with this type represent literal\n strings. 
Their `value_id` can be used with the\n `ts_query_string_value_for_id` function to obtain their string value.\n - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels*\n that represent the end of an individual predicate. If a pattern has two\n predicates, then there will be two steps with this `type` in the array."] + #[doc = " Get all of the predicates for the given pattern in the query.\n\n The predicates are represented as a single array of steps. There are three\n types of steps in this array, which correspond to the three legal values for\n the `type` field:\n - `TSQueryPredicateStepTypeCapture` - Steps with this type represent names\n of captures. Their `value_id` can be used with the\n [`ts_query_capture_name_for_id`] function to obtain the name of the capture.\n - `TSQueryPredicateStepTypeString` - Steps with this type represent literal\n strings. Their `value_id` can be used with the\n [`ts_query_string_value_for_id`] function to obtain their string value.\n - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels*\n that represent the end of an individual predicate. If a pattern has two\n predicates, then there will be two steps with this `type` in the array."] pub fn ts_query_predicates_for_pattern( self_: *const TSQuery, pattern_index: u32, @@ -608,7 +608,7 @@ extern "C" { pub fn ts_query_disable_pattern(self_: *mut TSQuery, pattern_index: u32); } extern "C" { - #[doc = " Create a new cursor for executing a given query.\n\n The cursor stores the state that is needed to iteratively search\n for matches. To use the query cursor, first call `ts_query_cursor_exec`\n to start running a given query on a given syntax node. Then, there are\n two options for consuming the results of the query:\n 1. Repeatedly call `ts_query_cursor_next_match` to iterate over all of the\n *matches* in the order that they were found. Each match contains the\n index of the pattern that matched, and an array of captures. 
Because\n multiple patterns can match the same set of nodes, one match may contain\n captures that appear *before* some of the captures from a previous match.\n 2. Repeatedly call `ts_query_cursor_next_capture` to iterate over all of the\n individual *captures* in the order that they appear. This is useful if\n don't care about which pattern matched, and just want a single ordered\n sequence of captures.\n\n If you don't care about consuming all of the results, you can stop calling\n `ts_query_cursor_next_match` or `ts_query_cursor_next_capture` at any point.\n You can then start executing another query on another node by calling\n `ts_query_cursor_exec` again."] + #[doc = " Create a new cursor for executing a given query.\n\n The cursor stores the state that is needed to iteratively search\n for matches. To use the query cursor, first call [`ts_query_cursor_exec`]\n to start running a given query on a given syntax node. Then, there are\n two options for consuming the results of the query:\n 1. Repeatedly call [`ts_query_cursor_next_match`] to iterate over all of the\n *matches* in the order that they were found. Each match contains the\n index of the pattern that matched, and an array of captures. Because\n multiple patterns can match the same set of nodes, one match may contain\n captures that appear *before* some of the captures from a previous match.\n 2. Repeatedly call [`ts_query_cursor_next_capture`] to iterate over all of the\n individual *captures* in the order that they appear. 
This is useful if\n don't care about which pattern matched, and just want a single ordered\n sequence of captures.\n\n If you don't care about consuming all of the results, you can stop calling\n [`ts_query_cursor_next_match`] or [`ts_query_cursor_next_capture`] at any point.\n You can then start executing another query on another node by calling\n [`ts_query_cursor_exec`] again."] pub fn ts_query_cursor_new() -> *mut TSQueryCursor; } extern "C" { @@ -708,15 +708,15 @@ extern "C" { ) -> TSFieldId; } extern "C" { - #[doc = " Check whether the given node type id belongs to named nodes, anonymous nodes,\n or a hidden nodes.\n\n See also `ts_node_is_named`. Hidden nodes are never returned from the API."] + #[doc = " Check whether the given node type id belongs to named nodes, anonymous nodes,\n or a hidden nodes.\n\n See also [`ts_node_is_named`]. Hidden nodes are never returned from the API."] pub fn ts_language_symbol_type(self_: *const TSLanguage, symbol: TSSymbol) -> TSSymbolType; } extern "C" { - #[doc = " Get the ABI version number for this language. This version number is used\n to ensure that languages were generated by a compatible version of\n Tree-sitter.\n\n See also `ts_parser_set_language`."] + #[doc = " Get the ABI version number for this language. This version number is used\n to ensure that languages were generated by a compatible version of\n Tree-sitter.\n\n See also [`ts_parser_set_language`]."] pub fn ts_language_version(self_: *const TSLanguage) -> u32; } extern "C" { - #[doc = " Get the next parse state. Combine this with lookahead iterators to generate\n completion suggestions or valid symbols in error nodes. Use\n `ts_node_grammar_symbol` for valid symbols."] + #[doc = " Get the next parse state. Combine this with lookahead iterators to generate\n completion suggestions or valid symbols in error nodes. 
Use\n [`ts_node_grammar_symbol`] for valid symbols."] pub fn ts_language_next_state( self_: *const TSLanguage, state: TSStateId, @@ -724,7 +724,7 @@ extern "C" { ) -> TSStateId; } extern "C" { - #[doc = " Create a new lookahead iterator for the given language and parse state.\n\n This returns `NULL` if state is invalid for the language.\n\n Repeatedly using `ts_lookahead_iterator_next` and\n `ts_lookahead_iterator_current_symbol` will generate valid symbols in the\n given parse state. Newly created lookahead iterators will contain the `ERROR`\n symbol.\n\n Lookahead iterators can be useful to generate suggestions and improve syntax\n error diagnostics. To get symbols valid in an ERROR node, use the lookahead\n iterator on its first leaf node state. For `MISSING` nodes, a lookahead\n iterator created on the previous non-extra leaf node may be appropriate."] + #[doc = " Create a new lookahead iterator for the given language and parse state.\n\n This returns `NULL` if state is invalid for the language.\n\n Repeatedly using [`ts_lookahead_iterator_next`] and\n [`ts_lookahead_iterator_current_symbol`] will generate valid symbols in the\n given parse state. Newly created lookahead iterators will contain the `ERROR`\n symbol.\n\n Lookahead iterators can be useful to generate suggestions and improve syntax\n error diagnostics. To get symbols valid in an ERROR node, use the lookahead\n iterator on its first leaf node state. For `MISSING` nodes, a lookahead\n iterator created on the previous non-extra leaf node may be appropriate."] pub fn ts_lookahead_iterator_new( self_: *const TSLanguage, state: TSStateId, diff --git a/lib/include/tree_sitter/api.h b/lib/include/tree_sitter/api.h index 9072bb60..56093d91 100644 --- a/lib/include/tree_sitter/api.h +++ b/lib/include/tree_sitter/api.h @@ -172,9 +172,9 @@ const TSLanguage *ts_parser_language(const TSParser *self); * Returns a boolean indicating whether or not the language was successfully * assigned. 
True means assignment succeeded. False means there was a version * mismatch: the language was generated with an incompatible version of the - * Tree-sitter CLI. Check the language's version using `ts_language_version` - * and compare it to this library's `TREE_SITTER_LANGUAGE_VERSION` and - * `TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION` constants. + * Tree-sitter CLI. Check the language's version using [`ts_language_version`] + * and compare it to this library's [`TREE_SITTER_LANGUAGE_VERSION`] and + * [`TREE_SITTER_MIN_COMPATIBLE_LANGUAGE_VERSION`] constants. */ bool ts_parser_set_language(TSParser *self, const TSLanguage *language); @@ -226,35 +226,40 @@ const TSRange *ts_parser_included_ranges( * version of this document and the document has since been edited, pass the * previous syntax tree so that the unchanged parts of it can be reused. * This will save time and memory. For this to work correctly, you must have - * already edited the old syntax tree using the `ts_tree_edit` function in a + * already edited the old syntax tree using the [`ts_tree_edit`] function in a * way that exactly matches the source code changes. * - * The `TSInput` parameter lets you specify how to read the text. It has the + * The [`TSInput`] parameter lets you specify how to read the text. It has the * following three fields: - * 1. `read`: A function to retrieve a chunk of text at a given byte offset + * 1. [`read`]: A function to retrieve a chunk of text at a given byte offset * and (row, column) position. The function should return a pointer to the - * text and write its length to the `bytes_read` pointer. The parser does + * text and write its length to the [`bytes_read`] pointer. The parser does * not take ownership of this buffer; it just borrows it until it has * finished reading it. The function should write a zero value to the - * `bytes_read` pointer to indicate the end of the document. - * 2. 
`payload`: An arbitrary pointer that will be passed to each invocation - * of the `read` function. - * 3. `encoding`: An indication of how the text is encoded. Either + * [`bytes_read`] pointer to indicate the end of the document. + * 2. [`payload`]: An arbitrary pointer that will be passed to each invocation + * of the [`read`] function. + * 3. [`encoding`]: An indication of how the text is encoded. Either * `TSInputEncodingUTF8` or `TSInputEncodingUTF16`. * * This function returns a syntax tree on success, and `NULL` on failure. There * are three possible reasons for failure: * 1. The parser does not have a language assigned. Check for this using the - `ts_parser_language` function. + [`ts_parser_language`] function. * 2. Parsing was cancelled due to a timeout that was set by an earlier call to - * the `ts_parser_set_timeout_micros` function. You can resume parsing from - * where the parser left out by calling `ts_parser_parse` again with the + * the [`ts_parser_set_timeout_micros`] function. You can resume parsing from + * where the parser left out by calling [`ts_parser_parse`] again with the * same arguments. Or you can start parsing from scratch by first calling - * `ts_parser_reset`. + * [`ts_parser_reset`]. * 3. Parsing was cancelled using a cancellation flag that was set by an - * earlier call to `ts_parser_set_cancellation_flag`. You can resume parsing - * from where the parser left out by calling `ts_parser_parse` again with + * earlier call to [`ts_parser_set_cancellation_flag`]. You can resume parsing + * from where the parser left out by calling [`ts_parser_parse`] again with * the same arguments. + * + * [`read`]: TSInput::read + * [`payload`]: TSInput::payload + * [`encoding`]: TSInput::encoding + * [`bytes_read`]: TSInput::read */ TSTree *ts_parser_parse( TSParser *self, @@ -264,7 +269,7 @@ TSTree *ts_parser_parse( /** * Use the parser to parse some source code stored in one contiguous buffer. 
- * The first two parameters are the same as in the `ts_parser_parse` function + * The first two parameters are the same as in the [`ts_parser_parse`] function * above. The second two parameters indicate the location of the buffer and its * length in bytes. */ @@ -278,7 +283,7 @@ TSTree *ts_parser_parse_string( /** * Use the parser to parse some source code stored in one contiguous buffer with * a given encoding. The first four parameters work the same as in the - * `ts_parser_parse_string` method above. The final parameter indicates whether + * [`ts_parser_parse_string`] method above. The final parameter indicates whether * the text is encoded as UTF8 or UTF16. */ TSTree *ts_parser_parse_string_encoding( @@ -294,9 +299,9 @@ TSTree *ts_parser_parse_string_encoding( * * If the parser previously failed because of a timeout or a cancellation, then * by default, it will resume where it left off on the next call to - * `ts_parser_parse` or other parsing functions. If you don't want to resume, + * [`ts_parser_parse`] or other parsing functions. If you don't want to resume, * and instead intend to use this parser to parse some other document, you must - * call `ts_parser_reset` first. + * call [`ts_parser_reset`] first. */ void ts_parser_reset(TSParser *self); @@ -305,7 +310,7 @@ void ts_parser_reset(TSParser *self); * take before halting. * * If parsing takes longer than this, it will halt early, returning NULL. - * See `ts_parser_parse` for more information. + * See [`ts_parser_parse`] for more information. */ void ts_parser_set_timeout_micros(TSParser *self, uint64_t timeout_micros); @@ -319,7 +324,7 @@ uint64_t ts_parser_timeout_micros(const TSParser *self); * * If a non-null pointer is assigned, then the parser will periodically read * from this pointer during parsing. If it reads a non-zero value, it will - * halt early, returning NULL. See `ts_parser_parse` for more information. + * halt early, returning NULL. See [`ts_parser_parse`] for more information. 
*/ void ts_parser_set_cancellation_flag(TSParser *self, const size_t *flag); @@ -409,7 +414,7 @@ void ts_tree_edit(TSTree *self, const TSInputEdit *edit); * * For this to work correctly, the old syntax tree must have been edited such * that its ranges match up to the new tree. Generally, you'll want to call - * this function right after calling one of the `ts_parser_parse` functions. + * this function right after calling one of the [`ts_parser_parse`] functions. * You need to pass the old tree that was passed to parse, as well as the new * tree that was returned from that function. * @@ -455,8 +460,8 @@ const char *ts_node_grammar_type(TSNode self); /** * Get the node's type as a numerical id as it appears in the grammar ignoring - * aliases. This should be used in `ts_language_next_state` instead of - * `ts_node_symbol`. + * aliases. This should be used in [`ts_language_next_state`] instead of + * [`ts_node_symbol`]. */ TSSymbol ts_node_grammar_symbol(TSNode self); @@ -489,8 +494,8 @@ TSPoint ts_node_end_point(TSNode self); char *ts_node_string(TSNode self); /** - * Check if the node is null. Functions like `ts_node_child` and - * `ts_node_next_sibling` will return a null node to indicate that no such node + * Check if the node is null. Functions like [`ts_node_child`] and + * [`ts_node_next_sibling`] will return a null node to indicate that no such node * was found. */ bool ts_node_is_null(TSNode self); @@ -564,14 +569,14 @@ uint32_t ts_node_child_count(TSNode self); /** * Get the node's *named* child at the given index. * - * See also `ts_node_is_named`. + * See also [`ts_node_is_named`]. */ TSNode ts_node_named_child(TSNode self, uint32_t child_index); /** * Get the node's number of *named* children. * - * See also `ts_node_is_named`. + * See also [`ts_node_is_named`]. */ uint32_t ts_node_named_child_count(TSNode self); @@ -588,7 +593,7 @@ TSNode ts_node_child_by_field_name( * Get the node's child with the given numerical field id. 
* * You can convert a field name to an id using the - * `ts_language_field_id_for_name` function. + * [`ts_language_field_id_for_name`] function. */ TSNode ts_node_child_by_field_id(TSNode self, TSFieldId field_id); @@ -637,9 +642,9 @@ TSNode ts_node_named_descendant_for_point_range(TSNode self, TSPoint start, TSPo * Edit the node to keep it in-sync with source code that has been edited. * * This function is only rarely needed. When you edit a syntax tree with the - * `ts_tree_edit` function, all of the nodes that you retrieve from the tree - * afterward will already reflect the edit. You only need to use `ts_node_edit` - * when you have a `TSNode` instance that you want to keep and continue to use + * [`ts_tree_edit`] function, all of the nodes that you retrieve from the tree + * afterward will already reflect the edit. You only need to use [`ts_node_edit`] + * when you have a [`TSNode`] instance that you want to keep and continue to use * after an edit. */ void ts_node_edit(TSNode *self, const TSInputEdit *edit); @@ -657,7 +662,7 @@ bool ts_node_eq(TSNode self, TSNode other); * Create a new tree cursor starting from the given node. * * A tree cursor allows you to walk a syntax tree more efficiently than is - * possible using the `TSNode` functions. It is a mutable object that is always + * possible using the [`TSNode`] functions. It is a mutable object that is always * on a certain syntax node, and can be moved imperatively to different nodes. */ TSTreeCursor ts_tree_cursor_new(TSNode node); @@ -675,7 +680,7 @@ void ts_tree_cursor_reset(TSTreeCursor *self, TSNode node); /** * Re-initialize a tree cursor to the same position as another cursor. * - * Unlike `ts_tree_cursor_reset`, this will not lose parent information and + * Unlike [`ts_tree_cursor_reset`], this will not lose parent information and * allows reusing already created cursors. 
*/ void ts_tree_cursor_reset_to(TSTreeCursor *dst, const TSTreeCursor *src); @@ -689,7 +694,7 @@ TSNode ts_tree_cursor_current_node(const TSTreeCursor *self); * Get the field name of the tree cursor's current node. * * This returns `NULL` if the current node doesn't have a field. - * See also `ts_node_child_by_field_name`. + * See also [`ts_node_child_by_field_name`]. */ const char *ts_tree_cursor_current_field_name(const TSTreeCursor *self); @@ -697,7 +702,7 @@ const char *ts_tree_cursor_current_field_name(const TSTreeCursor *self); * Get the field id of the tree cursor's current node. * * This returns zero if the current node doesn't have a field. - * See also `ts_node_child_by_field_id`, `ts_language_field_id_for_name`. + * See also [`ts_node_child_by_field_id`], [`ts_language_field_id_for_name`]. */ TSFieldId ts_tree_cursor_current_field_id(const TSTreeCursor *self); @@ -724,7 +729,7 @@ bool ts_tree_cursor_goto_next_sibling(TSTreeCursor *self); * there was no previous sibling node. * * Note, that this function may be slower than - * `ts_tree_cursor_goto_next_sibling` due to how node positions are stored. In + * [`ts_tree_cursor_goto_next_sibling`] due to how node positions are stored. In * the worst case, this will need to iterate through all the children upto the * previous sibling node to recalculate its position. */ @@ -744,7 +749,7 @@ bool ts_tree_cursor_goto_first_child(TSTreeCursor *self); * This returns `true` if the cursor successfully moved, and returns `false` if * there were no children. * - * Note that this function may be slower than `ts_tree_cursor_goto_first_child` + * Note that this function may be slower than [`ts_tree_cursor_goto_first_child`] * because it needs to iterate through all the children to compute the child's * position. */ @@ -790,7 +795,7 @@ TSTreeCursor ts_tree_cursor_copy(const TSTreeCursor *cursor); * patterns. The query is associated with a particular language, and can * only be run on syntax nodes parsed with that language. 
* - * If all of the given patterns are valid, this returns a `TSQuery`. + * If all of the given patterns are valid, this returns a [`TSQuery`]. * If a pattern is invalid, this returns `NULL`, and provides two pieces * of information about the problem: * 1. The byte offset of the error is written to the `error_offset` parameter. @@ -832,10 +837,10 @@ uint32_t ts_query_start_byte_for_pattern(const TSQuery *self, uint32_t pattern_i * the `type` field: * - `TSQueryPredicateStepTypeCapture` - Steps with this type represent names * of captures. Their `value_id` can be used with the - * `ts_query_capture_name_for_id` function to obtain the name of the capture. + * [`ts_query_capture_name_for_id`] function to obtain the name of the capture. * - `TSQueryPredicateStepTypeString` - Steps with this type represent literal * strings. Their `value_id` can be used with the - * `ts_query_string_value_for_id` function to obtain their string value. + * [`ts_query_string_value_for_id`] function to obtain their string value. * - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels* * that represent the end of an individual predicate. If a pattern has two * predicates, then there will be two steps with this `type` in the array. @@ -915,23 +920,23 @@ void ts_query_disable_pattern(TSQuery *self, uint32_t pattern_index); * Create a new cursor for executing a given query. * * The cursor stores the state that is needed to iteratively search - * for matches. To use the query cursor, first call `ts_query_cursor_exec` + * for matches. To use the query cursor, first call [`ts_query_cursor_exec`] * to start running a given query on a given syntax node. Then, there are * two options for consuming the results of the query: - * 1. Repeatedly call `ts_query_cursor_next_match` to iterate over all of the + * 1. Repeatedly call [`ts_query_cursor_next_match`] to iterate over all of the * *matches* in the order that they were found. 
Each match contains the * index of the pattern that matched, and an array of captures. Because * multiple patterns can match the same set of nodes, one match may contain * captures that appear *before* some of the captures from a previous match. - * 2. Repeatedly call `ts_query_cursor_next_capture` to iterate over all of the + * 2. Repeatedly call [`ts_query_cursor_next_capture`] to iterate over all of the * individual *captures* in the order that they appear. This is useful if * don't care about which pattern matched, and just want a single ordered * sequence of captures. * * If you don't care about consuming all of the results, you can stop calling - * `ts_query_cursor_next_match` or `ts_query_cursor_next_capture` at any point. + * [`ts_query_cursor_next_match`] or [`ts_query_cursor_next_capture`] at any point. * You can then start executing another query on another node by calling - * `ts_query_cursor_exec` again. + * [`ts_query_cursor_exec`] again. */ TSQueryCursor *ts_query_cursor_new(void); @@ -1052,7 +1057,7 @@ TSFieldId ts_language_field_id_for_name(const TSLanguage *self, const char *name * Check whether the given node type id belongs to named nodes, anonymous nodes, * or a hidden nodes. * - * See also `ts_node_is_named`. Hidden nodes are never returned from the API. + * See also [`ts_node_is_named`]. Hidden nodes are never returned from the API. */ TSSymbolType ts_language_symbol_type(const TSLanguage *self, TSSymbol symbol); @@ -1061,14 +1066,14 @@ TSSymbolType ts_language_symbol_type(const TSLanguage *self, TSSymbol symbol); * to ensure that languages were generated by a compatible version of * Tree-sitter. * - * See also `ts_parser_set_language`. + * See also [`ts_parser_set_language`]. */ uint32_t ts_language_version(const TSLanguage *self); /** * Get the next parse state. Combine this with lookahead iterators to generate * completion suggestions or valid symbols in error nodes. Use - * `ts_node_grammar_symbol` for valid symbols. 
+ * [`ts_node_grammar_symbol`] for valid symbols. */ TSStateId ts_language_next_state(const TSLanguage *self, TSStateId state, TSSymbol symbol); @@ -1081,8 +1086,8 @@ TSStateId ts_language_next_state(const TSLanguage *self, TSStateId state, TSSymb * * This returns `NULL` if state is invalid for the language. * - * Repeatedly using `ts_lookahead_iterator_next` and - * `ts_lookahead_iterator_current_symbol` will generate valid symbols in the + * Repeatedly using [`ts_lookahead_iterator_next`] and + * [`ts_lookahead_iterator_current_symbol`] will generate valid symbols in the * given parse state. Newly created lookahead iterators will contain the `ERROR` * symbol. * From 09ac28c77d216964636ea054ba76bcf96a670933 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Fri, 18 Aug 2023 19:45:00 -0400 Subject: [PATCH 322/347] feat!: properly handle predicates used on quantified captures --- cli/src/tests/query_test.rs | 83 +++++++++++++++++++++++ lib/binding_rust/lib.rs | 132 ++++++++++++++++++++++-------------- lib/binding_web/binding.js | 66 +++++++++++++++--- 3 files changed, 218 insertions(+), 63 deletions(-) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index 94d5ca97..34cf40a9 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -4574,6 +4574,89 @@ fn test_capture_quantifiers() { }); } +#[test] +fn test_query_quantified_captures() { + struct Row { + description: &'static str, + language: Language, + code: &'static str, + pattern: &'static str, + captures: &'static [(&'static str, &'static str)], + } + + // #[rustfmt::skip] + let rows = &[ + Row { + description: "doc comments where all must match the prefiix", + language: get_language("c"), + code: indoc! {" + /// foo + /// bar + /// baz + + void main() {} + + /// qux + /// quux + // quuz + "}, + pattern: r#" + ((comment)+ @comment.documentation + (#match? 
@comment.documentation "^///")) + "#, + captures: &[ + ("comment.documentation", "/// foo"), + ("comment.documentation", "/// bar"), + ("comment.documentation", "/// baz"), + ], + }, + Row { + description: "doc comments where one must match the prefix", + language: get_language("c"), + code: indoc! {" + /// foo + /// bar + /// baz + + void main() {} + + /// qux + /// quux + // quuz + "}, + pattern: r#" + ((comment)+ @comment.documentation + (#any-match? @comment.documentation "^///")) + "#, + captures: &[ + ("comment.documentation", "/// foo"), + ("comment.documentation", "/// bar"), + ("comment.documentation", "/// baz"), + ("comment.documentation", "/// qux"), + ("comment.documentation", "/// quux"), + ("comment.documentation", "// quuz"), + ], + }, + ]; + + allocations::record(|| { + for row in rows { + eprintln!(" quantified query example: {:?}", row.description); + + let mut parser = Parser::new(); + parser.set_language(row.language).unwrap(); + let tree = parser.parse(row.code, None).unwrap(); + + let query = Query::new(row.language, row.pattern).unwrap(); + + let mut cursor = QueryCursor::new(); + let matches = cursor.captures(&query, tree.root_node(), row.code.as_bytes()); + + assert_eq!(collect_captures(matches, &query, row.code), row.captures); + } + }); +} + #[test] fn test_query_max_start_depth() { struct Row { diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 9cd04563..8762c7f6 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -118,7 +118,7 @@ pub struct Query { ptr: NonNull, capture_names: Vec, capture_quantifiers: Vec>, - text_predicates: Vec>, + text_predicates: Vec>, property_settings: Vec>, property_predicates: Vec>, general_predicates: Vec>, @@ -250,11 +250,16 @@ pub enum QueryErrorKind { } #[derive(Debug)] -enum TextPredicate { - CaptureEqString(u32, String, bool), - CaptureEqCapture(u32, u32, bool), - CaptureMatchString(u32, regex::bytes::Regex, bool), - CaptureAnyString(u32, Vec, bool), +/// The first 
item is the capture index +/// The next is capture specific, depending on what item is expected +/// The first bool is if the capture is positive +/// The last item is a bool signifying whether or not it's meant to match +/// any or all captures +enum TextPredicateCapture { + EqString(u32, String, bool, bool), + EqCapture(u32, u32, bool, bool), + MatchString(u32, regex::bytes::Regex, bool, bool), + AnyString(u32, Vec, bool), } // TODO: Remove this struct at at some point. If `core::str::lossy::Utf8Lossy` @@ -1733,7 +1738,7 @@ impl Query { // Build a predicate for each of the known predicate function names. let operator_name = &string_values[p[0].value_id as usize]; match operator_name.as_str() { - "eq?" | "not-eq?" => { + "eq?" | "not-eq?" | "any-eq?" | "any-not-eq?" => { if p.len() != 3 { return Err(predicate_error( row, @@ -1750,23 +1755,30 @@ impl Query { ))); } - let is_positive = operator_name == "eq?"; + let is_positive = operator_name == "eq?" || operator_name == "any-eq?"; + let match_all = match operator_name.as_str() { + "eq?" | "not-eq?" => true, + "any-eq?" | "any-not-eq?" => false, + _ => unreachable!(), + }; text_predicates.push(if p[2].type_ == type_capture { - TextPredicate::CaptureEqCapture( + TextPredicateCapture::EqCapture( p[1].value_id, p[2].value_id, is_positive, + match_all, ) } else { - TextPredicate::CaptureEqString( + TextPredicateCapture::EqString( p[1].value_id, string_values[p[2].value_id as usize].clone(), is_positive, + match_all, ) }); } - "match?" | "not-match?" => { + "match?" | "not-match?" | "any-match?" | "any-not-match?" => { if p.len() != 3 { return Err(predicate_error(row, format!( "Wrong number of arguments to #match? predicate. Expected 2, got {}.", @@ -1786,20 +1798,27 @@ impl Query { ))); } - let is_positive = operator_name == "match?"; + let is_positive = + operator_name == "match?" || operator_name == "any-match?"; + let match_all = match operator_name.as_str() { + "match?" | "not-match?" => true, + "any-match?" 
| "any-not-match?" => false, + _ => unreachable!(), + }; let regex = &string_values[p[2].value_id as usize]; - text_predicates.push(TextPredicate::CaptureMatchString( + text_predicates.push(TextPredicateCapture::MatchString( p[1].value_id, regex::bytes::Regex::new(regex).map_err(|_| { predicate_error(row, format!("Invalid regex '{}'", regex)) })?, is_positive, + match_all, )); } "set!" => property_settings.push(Self::parse_property( row, - &operator_name, + operator_name, &result.capture_names, &string_values, &p[1..], @@ -1808,7 +1827,7 @@ impl Query { "is?" | "is-not?" => property_predicates.push(( Self::parse_property( row, - &operator_name, + operator_name, &result.capture_names, &string_values, &p[1..], @@ -1841,7 +1860,7 @@ impl Query { } values.push(string_values[arg.value_id as usize].clone()); } - text_predicates.push(TextPredicate::CaptureAnyString( + text_predicates.push(TextPredicateCapture::AnyString( p[1].value_id, values, is_positive, @@ -2203,7 +2222,7 @@ impl<'tree> QueryMatch<'_, 'tree> { ) -> impl Iterator> + '_ { self.captures .iter() - .filter_map(move |capture| (capture.index == capture_ix).then(|| capture.node)) + .filter_map(move |capture| (capture.index == capture_ix).then_some(capture.node)) } fn new(m: ffi::TSQueryMatch, cursor: *mut ffi::TSQueryCursor) -> Self { @@ -2266,52 +2285,61 @@ impl<'tree> QueryMatch<'_, 'tree> { query.text_predicates[self.pattern_index] .iter() .all(|predicate| match predicate { - TextPredicate::CaptureEqCapture(i, j, is_positive) => { - let node1 = self.nodes_for_capture_index(*i).next(); - let node2 = self.nodes_for_capture_index(*j).next(); - match (node1, node2) { - (Some(node1), Some(node2)) => { - let mut text1 = text_provider.text(node1); - let mut text2 = text_provider.text(node2); - let text1 = node_text1.get_text(&mut text1); - let text2 = node_text2.get_text(&mut text2); - (text1 == text2) == *is_positive + TextPredicateCapture::EqCapture(i, j, is_positive, match_all_nodes) => { + let mut nodes_1 = 
self.nodes_for_capture_index(*i); + let mut nodes_2 = self.nodes_for_capture_index(*j); + while let (Some(node1), Some(node2)) = (nodes_1.next(), nodes_2.next()) { + let mut text1 = text_provider.text(node1); + let mut text2 = text_provider.text(node2); + let text1 = node_text1.get_text(&mut text1); + let text2 = node_text2.get_text(&mut text2); + if (text1 == text2) != *is_positive && *match_all_nodes { + return false; + } + if (text1 == text2) == *is_positive && !*match_all_nodes { + return true; } - _ => true, } + nodes_1.next().is_none() && nodes_2.next().is_none() } - TextPredicate::CaptureEqString(i, s, is_positive) => { - let node = self.nodes_for_capture_index(*i).next(); - match node { - Some(node) => { - let mut text = text_provider.text(node); - let text = node_text1.get_text(&mut text); - (text == s.as_bytes()) == *is_positive + TextPredicateCapture::EqString(i, s, is_positive, match_all_nodes) => { + let nodes = self.nodes_for_capture_index(*i); + for node in nodes { + let mut text = text_provider.text(node); + let text = node_text1.get_text(&mut text); + if (text == s.as_bytes()) != *is_positive && *match_all_nodes { + return false; + } + if (text == s.as_bytes()) == *is_positive && !*match_all_nodes { + return true; } - None => true, } + true } - TextPredicate::CaptureMatchString(i, r, is_positive) => { - let node = self.nodes_for_capture_index(*i).next(); - match node { - Some(node) => { - let mut text = text_provider.text(node); - let text = node_text1.get_text(&mut text); - r.is_match(text) == *is_positive + TextPredicateCapture::MatchString(i, r, is_positive, match_all_nodes) => { + let nodes = self.nodes_for_capture_index(*i); + for node in nodes { + let mut text = text_provider.text(node); + let text = node_text1.get_text(&mut text); + if (r.is_match(text)) != *is_positive && *match_all_nodes { + return false; + } + if (r.is_match(text)) == *is_positive && !*match_all_nodes { + return true; } - None => true, } + true } - 
TextPredicate::CaptureAnyString(i, v, is_positive) => { - let node = self.nodes_for_capture_index(*i).next(); - match node { - Some(node) => { - let mut text = text_provider.text(node); - let text = node_text1.get_text(&mut text); - v.iter().any(|s| text == s.as_bytes()) == *is_positive + TextPredicateCapture::AnyString(i, v, is_positive) => { + let nodes = self.nodes_for_capture_index(*i); + for node in nodes { + let mut text = text_provider.text(node); + let text = node_text1.get_text(&mut text); + if (v.iter().any(|s| text == s.as_bytes())) != *is_positive { + return false; } - None => true, } + true } }) } diff --git a/lib/binding_web/binding.js b/lib/binding_web/binding.js index 8443bf25..0ba30106 100644 --- a/lib/binding_web/binding.js +++ b/lib/binding_web/binding.js @@ -841,7 +841,13 @@ class Language { } const operator = steps[0].value; let isPositive = true; + let matchAll = true; switch (operator) { + case 'any-not-eq?': + isPositive = false; + matchAll = false; + case 'any-eq?': + matchAll = false; case 'not-eq?': isPositive = false; case 'eq?': @@ -855,28 +861,36 @@ class Language { const captureName1 = steps[1].name; const captureName2 = steps[2].name; textPredicates[i].push(function(captures) { - let node1, node2 + let nodes_1 = []; + let nodes_2 = []; for (const c of captures) { - if (c.name === captureName1) node1 = c.node; - if (c.name === captureName2) node2 = c.node; + if (c.name === captureName1) nodes_1.push(c.node); + if (c.name === captureName2) nodes_2.push(c.node); } - if(node1 === undefined || node2 === undefined) return true; - return (node1.text === node2.text) === isPositive; + return matchAll + ? 
nodes_1.every(n1 => nodes_2.some(n2 => n1.text === n2.text)) === isPositive + : nodes_1.some(n1 => nodes_2.some(n2 => n1.text === n2.text)) === isPositive; }); } else { const captureName = steps[1].name; const stringValue = steps[2].value; textPredicates[i].push(function(captures) { + let nodes = []; for (const c of captures) { - if (c.name === captureName) { - return (c.node.text === stringValue) === isPositive; - }; + if (c.name === captureName) nodes.push(c.node); } - return true; + return matchAll + ? nodes.every(n => n.text === stringValue) === isPositive + : nodes.some(n => n.text === stringValue) === isPositive; }); } break; + case 'not-any-match?': + isPositive = false; + matchAll = false; + case 'any-match?': + matchAll = false; case 'not-match?': isPositive = false; case 'match?': @@ -892,10 +906,14 @@ class Language { const captureName = steps[1].name; const regex = new RegExp(steps[2].value); textPredicates[i].push(function(captures) { + const nodes = []; for (const c of captures) { - if (c.name === captureName) return regex.test(c.node.text) === isPositive; + if (c.name === captureName) nodes.push(c.node.text); } - return true; + if (nodes.length === 0) return !isPositive; + return matchAll + ? nodes.every(text => regex.test(text)) === isPositive + : nodes.some(text => regex.test(text)) === isPositive; }); break; @@ -923,6 +941,32 @@ class Language { properties[i][steps[1].value] = steps[2] ? steps[2].value : null; break; + case 'not-any-of?': + isPositive = false; + case 'any-of?': + if (steps.length < 2) throw new Error( + `Wrong number of arguments to \`#${operator}\` predicate. Expected at least 1. Got ${steps.length - 1}.` + ); + if (steps[1].type !== 'capture') throw new Error( + `First argument of \`#${operator}\` predicate must be a capture. 
Got "${steps[1].value}".` + ); + for (let i = 2; i < steps.length; i++) { + if (steps[i].type !== 'string') throw new Error( + `Arguments to \`#${operator}\` predicate must be a strings.".` + ); + } + captureName = steps[1].name; + const values = steps.slice(2).map(s => s.value); + textPredicates[i].push(function(captures) { + const nodes = []; + for (const c of captures) { + if (c.name === captureName) nodes.push(c.node.text); + } + if (nodes.length === 0) return !isPositive; + return nodes.every(text => values.includes(text)) === isPositive; + }); + break; + default: predicates[i].push({operator, operands: steps.slice(1)}); } From c5cb27e52256ac61db6324472cf2ad93c059e3b3 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Sat, 19 Aug 2023 00:15:27 -0400 Subject: [PATCH 323/347] docs: improve predicate docs --- cli/src/tests/query_test.rs | 2 +- docs/section-2-using-parsers.md | 144 +++++++++++++++++++++++++++----- 2 files changed, 122 insertions(+), 24 deletions(-) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index 34cf40a9..ed1f9e25 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -4587,7 +4587,7 @@ fn test_query_quantified_captures() { // #[rustfmt::skip] let rows = &[ Row { - description: "doc comments where all must match the prefiix", + description: "doc comments where all must match the prefix", language: get_language("c"), code: indoc! 
{" /// foo diff --git a/docs/section-2-using-parsers.md b/docs/section-2-using-parsers.md index 87c049e7..5106a49c 100644 --- a/docs/section-2-using-parsers.md +++ b/docs/section-2-using-parsers.md @@ -21,21 +21,21 @@ Alternatively, you can incorporate the library in a larger project's build syste **source file:** -* `tree-sitter/lib/src/lib.c` +- `tree-sitter/lib/src/lib.c` **include directories:** -* `tree-sitter/lib/src` -* `tree-sitter/lib/include` +- `tree-sitter/lib/src` +- `tree-sitter/lib/include` ### The Basic Objects There are four main types of objects involved when using Tree-sitter: languages, parsers, syntax trees, and syntax nodes. In C, these are called `TSLanguage`, `TSParser`, `TSTree`, and `TSNode`. -* A `TSLanguage` is an opaque object that defines how to parse a particular programming language. The code for each `TSLanguage` is generated by Tree-sitter. Many languages are already available in separate git repositories within the [Tree-sitter GitHub organization](https://github.com/tree-sitter). See [the next page](./creating-parsers) for how to create new languages. -* A `TSParser` is a stateful object that can be assigned a `TSLanguage` and used to produce a `TSTree` based on some source code. -* A `TSTree` represents the syntax tree of an entire source code file. It contains `TSNode` instances that indicate the structure of the source code. It can also be edited and used to produce a new `TSTree` in the event that the source code changes. -* A `TSNode` represents a single node in the syntax tree. It tracks its start and end positions in the source code, as well as its relation to other nodes like its parent, siblings and children. +- A `TSLanguage` is an opaque object that defines how to parse a particular programming language. The code for each `TSLanguage` is generated by Tree-sitter. Many languages are already available in separate git repositories within the [Tree-sitter GitHub organization](https://github.com/tree-sitter). 
See [the next page](./creating-parsers) for how to create new languages. +- A `TSParser` is a stateful object that can be assigned a `TSLanguage` and used to produce a `TSTree` based on some source code. +- A `TSTree` represents the syntax tree of an entire source code file. It contains `TSNode` instances that indicate the structure of the source code. It can also be edited and used to produce a new `TSTree` in the event that the source code changes. +- A `TSNode` represents a single node in the syntax tree. It tracks its start and end positions in the source code, as well as its relation to other nodes like its parent, siblings and children. ### An Example Program @@ -629,18 +629,36 @@ The restrictions placed on a pattern by an anchor operator ignore anonymous node #### Predicates -You can also specify arbitrary metadata and conditions associated with a pattern by adding _predicate_ S-expressions anywhere within your pattern. Predicate S-expressions start with a _predicate name_ beginning with a `#` character. After that, they can contain an arbitrary number of `@`-prefixed capture names or strings. +You can also specify arbitrary metadata and conditions associated with a pattern +by adding _predicate_ S-expressions anywhere within your pattern. Predicate S-expressions +start with a _predicate name_ beginning with a `#` character. After that, they can +contain an arbitrary number of `@`-prefixed capture names or strings. -For example, this pattern would match identifier whose names is written in `SCREAMING_SNAKE_CASE`: +Tree-Sitter's CLI supports the following predicates by default: + +##### eq?, not-eq?, any-eq?, any-not-eq? + +This family of predicates allows you to match against a single capture or string +value. + +The first argument must be a capture, but the second can be either a capture to +compare the two captures' text, or a string to compare first capture's text +against. + +The base predicate is "#eq?", but its complement "#not-eq?" 
can be used to _not_ +match a value. + +Consider the following example targeting C: ```scheme -( - (identifier) @constant - (#match? @constant "^[A-Z][A-Z_]+") -) +((identifier) @variable.builtin + (#eq? @variable.builtin "self")) ``` -And this pattern would match key-value pairs where the `value` is an identifier with the same name as the key: +This pattern would match any identifier that is `self` or `this`. + +And this pattern would match key-value pairs where the `value` is an identifier +with the same name as the key: ```scheme ( @@ -651,7 +669,87 @@ And this pattern would match key-value pairs where the `value` is an identifier ) ``` -_Note_ - Predicates are not handled directly by the Tree-sitter C library. They are just exposed in a structured form so that higher-level code can perform the filtering. However, higher-level bindings to Tree-sitter like [the Rust crate](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_rust) or the [WebAssembly binding](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_web) implement a few common predicates like `#eq?` and `#match?`. +The prefix "any-" is meant for use with quantified captures. Here's +an example finding a segment of empty comments + +```scheme +((comment)+ @comment.empty + (#any-eq? @comment.empty "//")) +``` + +Note that "#any-eq?" will match a quantified capture if +_any_ of the nodes match the predicate, while by default a quantified capture +will only match if _all_ the nodes match the predicate. + +##### match?, not-match?, any-match?, any-not-match? + +These predicates are similar to the eq? predicates, but they use regular expressions +to match against the capture's text. + +The first argument must be a capture, and the second must be a string containing +a regular expression. + +For example, this pattern would match identifier whose name is written in `SCREAMING_SNAKE_CASE`: + +```scheme +((identifier) @constant + (#match? 
@constant "^[A-Z][A-Z_]+")) +``` + +Here's an example finding potential documentation comments in C + +```scheme +((comment)+ @comment.documentation + (#match? @comment.documentation "^///\s+.*")) +``` + +Here's another example finding Cgo comments to potentially inject with C + +```scheme +((comment)+ @injection.content + . + (import_declaration + (import_spec path: (interpreted_string_literal) @_import_c)) + (#eq? @_import_c "\"C\"") + (#match? @injection.content "^//")) +``` + +##### any-of?, not-any-of? + +The "any-of?" predicate allows you to match a capture against multiple strings, +and will match if the capture's text is equal to any of the strings. + +Consider this example that targets JavaScript: + +```scheme +((identifier) @variable.builtin + (#any-of? @variable.builtin + "arguments" + "module" + "console" + "window" + "document")) +``` + +This will match any of the builtin variables in JavaScript. + +_Note_ — Predicates are not handled directly by the Tree-sitter C library. +They are just exposed in a structured form so that higher-level code can perform +the filtering. However, higher-level bindings to Tree-sitter like +[the Rust Crate](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_rust) +or the [WebAssembly binding](https://github.com/tree-sitter/tree-sitter/tree/master/lib/binding_web) +do implement a few common predicates like the `#eq?`, `#match?`, and `#any-of?` +predicates explained above. 
+ +To recap about the predicates Tree-Sitter's bindings support: + +- `#eq?` checks for a direct match against a capture or string +- `#match?` checks for a match against a regular expression +- `#any-of?` checks for a match against a list of strings +- Adding `not-` to the beginning of any of these predicates will negate the match +- By default, a quantified capture will only match if _all_ of the nodes match the predicate +- Adding `any-` before the `eq` or `match` predicates will instead match if any of the nodes match the predicate + ### The Query API @@ -723,8 +821,8 @@ The node types file contains an array of objects, each of which describes a part Every object in this array has these two entries: -* `"type"` - A string that indicates which grammar rule the node represents. This corresponds to the `ts_node_type` function described [above](#syntax-nodes). -* `"named"` - A boolean that indicates whether this kind of node corresponds to a rule name in the grammar or just a string literal. See [above](#named-vs-anonymous-nodes) for more info. +- `"type"` - A string that indicates which grammar rule the node represents. This corresponds to the `ts_node_type` function described [above](#syntax-nodes). +- `"named"` - A boolean that indicates whether this kind of node corresponds to a rule name in the grammar or just a string literal. See [above](#named-vs-anonymous-nodes) for more info. Examples: @@ -745,14 +843,14 @@ Together, these two fields constitute a unique identifier for a node type; no tw Many syntax nodes can have _children_. The node type object describes the possible children that a node can have using the following entries: -* `"fields"` - An object that describes the possible [fields](#node-field-names) that the node can have. The keys of this object are field names, and the values are _child type_ objects, described below. -* `"children"` - Another _child type_ object that describes all of the node's possible _named_ children _without_ fields. 
+- `"fields"` - An object that describes the possible [fields](#node-field-names) that the node can have. The keys of this object are field names, and the values are _child type_ objects, described below. +- `"children"` - Another _child type_ object that describes all of the node's possible _named_ children _without_ fields. A _child type_ object describes a set of child nodes using the following entries: -* `"required"` - A boolean indicating whether there is always _at least one_ node in this set. -* `"multiple"` - A boolean indicating whether there can be _multiple_ nodes in this set. -* `"types"`- An array of objects that represent the possible types of nodes in this set. Each object has two keys: `"type"` and `"named"`, whose meanings are described above. +- `"required"` - A boolean indicating whether there is always _at least one_ node in this set. +- `"multiple"` - A boolean indicating whether there can be _multiple_ nodes in this set. +- `"types"`- An array of objects that represent the possible types of nodes in this set. Each object has two keys: `"type"` and `"named"`, whose meanings are described above. Example with fields: @@ -812,7 +910,7 @@ In Tree-sitter grammars, there are usually certain rules that represent abstract Normally, hidden rules are not mentioned in the node types file, since they don't appear in the syntax tree. But if you add a hidden rule to the grammar's [`supertypes` list](./creating-parsers#the-grammar-dsl), then it _will_ show up in the node types file, with the following special entry: -* `"subtypes"` - An array of objects that specify the _types_ of nodes that this 'supertype' node can wrap. +- `"subtypes"` - An array of objects that specify the _types_ of nodes that this 'supertype' node can wrap. 
Example: From 09030401d1fb0c93b34352437767b587e6697cfb Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Thu, 31 Aug 2023 17:15:38 -0400 Subject: [PATCH 324/347] fix(node): add `_isalpha` --- lib/binding_web/exports.json | 1 + 1 file changed, 1 insertion(+) diff --git a/lib/binding_web/exports.json b/lib/binding_web/exports.json index 71151b71..ad7a6987 100644 --- a/lib/binding_web/exports.json +++ b/lib/binding_web/exports.json @@ -17,6 +17,7 @@ "__Znwm", "___cxa_atexit", "_abort", + "_isalpha", "_iswalnum", "_iswalpha", "_iswdigit", From ec88699f1c537420c3d75355c95c6c0a9022064c Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Thu, 31 Aug 2023 18:26:22 -0400 Subject: [PATCH 325/347] test(node): update bash test --- lib/binding_web/test/parser-test.js | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/lib/binding_web/test/parser-test.js b/lib/binding_web/test/parser-test.js index 74c45d96..a25e5dc5 100644 --- a/lib/binding_web/test/parser-test.js +++ b/lib/binding_web/test/parser-test.js @@ -139,7 +139,7 @@ describe("Parser", () => { 'redirect: (file_redirect descriptor: (file_descriptor) destination: (word)) ' + 'redirect: (file_redirect destination: (word)) ' + '(heredoc_body ' + - '(expansion (variable_name))) (heredoc_end))))' + '(expansion (variable_name)) (heredoc_content)) (heredoc_end))))' ); }).timeout(5000); From dc5ec1cf5380910fa6eb71af7c452ddc62582f82 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Fri, 1 Sep 2023 17:01:39 -0400 Subject: [PATCH 326/347] refactor: remove `&Option` where used --- cli/loader/src/lib.rs | 34 +++++++++++++++---------------- cli/src/playground.rs | 14 ++++++------- cli/src/tests/helpers/fixtures.rs | 2 +- 3 files changed, 25 insertions(+), 25 deletions(-) diff --git a/cli/loader/src/lib.rs b/cli/loader/src/lib.rs index 3022b6b9..1fbb1473 100644 --- a/cli/loader/src/lib.rs +++ b/cli/loader/src/lib.rs @@ -344,7 +344,7 @@ impl Loader { &grammar_json.name, &header_path, &parser_path, - &scanner_path, + 
scanner_path.as_deref(), ) } @@ -353,7 +353,7 @@ impl Loader { name: &str, header_path: &Path, parser_path: &Path, - scanner_path: &Option, + scanner_path: Option<&Path>, ) -> Result { let mut lib_name = name.to_string(); if self.debug_build { @@ -362,7 +362,7 @@ impl Loader { let mut library_path = self.parser_lib_path.join(lib_name); library_path.set_extension(DYLIB_EXTENSION); - let recompile = needs_recompile(&library_path, &parser_path, &scanner_path) + let recompile = needs_recompile(&library_path, &parser_path, scanner_path) .with_context(|| "Failed to compare source and binary timestamps")?; if recompile { @@ -740,21 +740,21 @@ impl<'a> LanguageConfiguration<'a> { .iter() .filter(|p| p.ends_with("highlights.scm")) .cloned() - .collect(), + .collect::>(), ), Some( paths .iter() .filter(|p| p.ends_with("tags.scm")) .cloned() - .collect(), + .collect::>(), ), Some( paths .iter() .filter(|p| p.ends_with("locals.scm")) .cloned() - .collect(), + .collect::>(), ), ), None => (None, None, None), @@ -764,25 +764,25 @@ impl<'a> LanguageConfiguration<'a> { .get_or_try_init(|| { let (highlights_query, highlight_ranges) = self.read_queries( if highlights_filenames.is_some() { - &highlights_filenames + highlights_filenames.as_deref() } else { - &self.highlights_filenames + self.highlights_filenames.as_deref() }, "highlights.scm", )?; let (injections_query, injection_ranges) = self.read_queries( if injections_filenames.is_some() { - &injections_filenames + injections_filenames.as_deref() } else { - &self.injections_filenames + self.injections_filenames.as_deref() }, "injections.scm", )?; let (locals_query, locals_ranges) = self.read_queries( if locals_filenames.is_some() { - &locals_filenames + locals_filenames.as_deref() } else { - &self.locals_filenames + self.locals_filenames.as_deref() }, "locals.scm", )?; @@ -844,9 +844,9 @@ impl<'a> LanguageConfiguration<'a> { self.tags_config .get_or_try_init(|| { let (tags_query, tags_ranges) = - 
self.read_queries(&self.tags_filenames, "tags.scm")?; + self.read_queries(self.tags_filenames.as_deref(), "tags.scm")?; let (locals_query, locals_ranges) = - self.read_queries(&self.locals_filenames, "locals.scm")?; + self.read_queries(self.locals_filenames.as_deref(), "locals.scm")?; if tags_query.is_empty() { Ok(None) } else { @@ -900,12 +900,12 @@ impl<'a> LanguageConfiguration<'a> { fn read_queries( &self, - paths: &Option>, + paths: Option<&[String]>, default_path: &str, ) -> Result<(String, Vec<(String, Range)>)> { let mut query = String::new(); let mut path_ranges = Vec::new(); - if let Some(paths) = paths.as_ref() { + if let Some(paths) = paths { for path in paths { let abs_path = self.root_path.join(path); let prev_query_len = query.len(); @@ -930,7 +930,7 @@ impl<'a> LanguageConfiguration<'a> { fn needs_recompile( lib_path: &Path, parser_c_path: &Path, - scanner_path: &Option, + scanner_path: Option<&Path>, ) -> Result { if !lib_path.exists() { return Ok(true); diff --git a/cli/src/playground.rs b/cli/src/playground.rs index 662eb8aa..35314c77 100644 --- a/cli/src/playground.rs +++ b/cli/src/playground.rs @@ -12,7 +12,7 @@ use tiny_http::{Header, Response, Server}; macro_rules! optional_resource { ($name: tt, $path: tt) => { #[cfg(TREE_SITTER_EMBED_WASM_BINDING)] - fn $name(tree_sitter_dir: &Option) -> Cow<'static, [u8]> { + fn $name(tree_sitter_dir: Option<&PathBuf>) -> Cow<'static, [u8]> { if let Some(tree_sitter_dir) = tree_sitter_dir { Cow::Owned(fs::read(tree_sitter_dir.join($path)).unwrap()) } else { @@ -21,7 +21,7 @@ macro_rules! 
optional_resource { } #[cfg(not(TREE_SITTER_EMBED_WASM_BINDING))] - fn $name(tree_sitter_dir: &Option) -> Cow<'static, [u8]> { + fn $name(tree_sitter_dir: Option<&PathBuf>) -> Cow<'static, [u8]> { if let Some(tree_sitter_dir) = tree_sitter_dir { Cow::Owned(fs::read(tree_sitter_dir.join($path)).unwrap()) } else { @@ -35,7 +35,7 @@ optional_resource!(get_playground_js, "docs/assets/js/playground.js"); optional_resource!(get_lib_js, "lib/binding_web/tree-sitter.js"); optional_resource!(get_lib_wasm, "lib/binding_web/tree-sitter.wasm"); -fn get_main_html(tree_sitter_dir: &Option) -> Cow<'static, [u8]> { +fn get_main_html(tree_sitter_dir: Option<&PathBuf>) -> Cow<'static, [u8]> { if let Some(tree_sitter_dir) = tree_sitter_dir { Cow::Owned(fs::read(tree_sitter_dir.join("cli/src/playground.html")).unwrap()) } else { @@ -63,13 +63,13 @@ pub fn serve(grammar_path: &Path, open_in_browser: bool) -> Result<()> { } let tree_sitter_dir = env::var("TREE_SITTER_BASE_DIR").map(PathBuf::from).ok(); - let main_html = str::from_utf8(&get_main_html(&tree_sitter_dir)) + let main_html = str::from_utf8(&get_main_html(tree_sitter_dir.as_ref())) .unwrap() .replace("THE_LANGUAGE_NAME", &grammar_name) .into_bytes(); - let playground_js = get_playground_js(&tree_sitter_dir); - let lib_js = get_lib_js(&tree_sitter_dir); - let lib_wasm = get_lib_wasm(&tree_sitter_dir); + let playground_js = get_playground_js(tree_sitter_dir.as_ref()); + let lib_js = get_lib_js(tree_sitter_dir.as_ref()); + let lib_wasm = get_lib_wasm(tree_sitter_dir.as_ref()); let html_header = Header::from_str("Content-Type: text/html").unwrap(); let js_header = Header::from_str("Content-Type: application/javascript").unwrap(); diff --git a/cli/src/tests/helpers/fixtures.rs b/cli/src/tests/helpers/fixtures.rs index 5d27329b..0f45ef54 100644 --- a/cli/src/tests/helpers/fixtures.rs +++ b/cli/src/tests/helpers/fixtures.rs @@ -88,7 +88,7 @@ pub fn get_test_language(name: &str, parser_code: &str, path: Option<&Path>) -> } }); 
TEST_LOADER - .load_language_from_sources(name, &HEADER_DIR, &parser_c_path, &scanner_path) + .load_language_from_sources(name, &HEADER_DIR, &parser_c_path, scanner_path.as_deref()) .unwrap() } From 055c329a693b1f3b6efd98408e2952d5bc32958b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 1 Sep 2023 20:41:42 +0300 Subject: [PATCH 327/347] chore(lib): fix fields naming in QueryPattern to singular --- lib/src/query.c | 22 +++++++++++----------- 1 file changed, 11 insertions(+), 11 deletions(-) diff --git a/lib/src/query.c b/lib/src/query.c index e3fd27a0..4e623ae7 100644 --- a/lib/src/query.c +++ b/lib/src/query.c @@ -143,8 +143,8 @@ typedef struct { } PatternEntry; typedef struct { - Slice steps; - Slice predicate_steps; + Slice step; + Slice predicate_step; uint32_t start_byte; bool is_non_local; } QueryPattern; @@ -1782,8 +1782,8 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // Gather all of the captures that are used in predicates for this pattern. array_clear(&predicate_capture_ids); for ( - unsigned start = pattern->predicate_steps.offset, - end = start + pattern->predicate_steps.length, + unsigned start = pattern->predicate_step.offset, + end = start + pattern->predicate_step.length, j = start; j < end; j++ ) { TSQueryPredicateStep *step = &self->predicate_steps.contents[j]; @@ -1795,8 +1795,8 @@ static bool ts_query__analyze_patterns(TSQuery *self, unsigned *error_offset) { // Find all of the steps that have these captures. 
for ( - unsigned start = pattern->steps.offset, - end = start + pattern->steps.length, + unsigned start = pattern->step.offset, + end = start + pattern->step.length, j = start; j < end; j++ ) { QueryStep *step = &self->steps.contents[j]; @@ -2711,8 +2711,8 @@ TSQuery *ts_query_new( uint32_t start_step_index = self->steps.size; uint32_t start_predicate_step_index = self->predicate_steps.size; array_push(&self->patterns, ((QueryPattern) { - .steps = (Slice) {.offset = start_step_index}, - .predicate_steps = (Slice) {.offset = start_predicate_step_index}, + .step = (Slice) {.offset = start_step_index}, + .predicate_step = (Slice) {.offset = start_predicate_step_index}, .start_byte = stream_offset(&stream), .is_non_local = false, })); @@ -2721,8 +2721,8 @@ TSQuery *ts_query_new( array_push(&self->steps, query_step__new(0, PATTERN_DONE_MARKER, false)); QueryPattern *pattern = array_back(&self->patterns); - pattern->steps.length = self->steps.size - start_step_index; - pattern->predicate_steps.length = self->predicate_steps.size - start_predicate_step_index; + pattern->step.length = self->steps.size - start_step_index; + pattern->predicate_step.length = self->predicate_steps.size - start_predicate_step_index; // If any pattern could not be parsed, then report the error information // and terminate. 
@@ -2865,7 +2865,7 @@ const TSQueryPredicateStep *ts_query_predicates_for_pattern( uint32_t pattern_index, uint32_t *step_count ) { - Slice slice = self->patterns.contents[pattern_index].predicate_steps; + Slice slice = self->patterns.contents[pattern_index].predicate_step; *step_count = slice.length; if (self->predicate_steps.contents == NULL) { return NULL; From 52f7eaff3182a726eb064a91d4e49dfbaecd4ee3 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 1 Sep 2023 05:33:52 +0300 Subject: [PATCH 328/347] chore(rust): make `Query` extra predicates state fully immutable --- cli/loader/src/lib.rs | 4 +- cli/src/tests/helpers/query_helpers.rs | 2 +- cli/src/tests/query_test.rs | 11 +- highlight/src/lib.rs | 9 +- lib/binding_rust/lib.rs | 146 ++++++++++++++----------- tags/src/lib.rs | 2 +- 6 files changed, 96 insertions(+), 78 deletions(-) diff --git a/cli/loader/src/lib.rs b/cli/loader/src/lib.rs index 1fbb1473..d260a96c 100644 --- a/cli/loader/src/lib.rs +++ b/cli/loader/src/lib.rs @@ -828,8 +828,8 @@ impl<'a> LanguageConfiguration<'a> { let mut all_highlight_names = self.highlight_names.lock().unwrap(); if self.use_all_highlight_names { for capture_name in result.query.capture_names() { - if !all_highlight_names.contains(capture_name) { - all_highlight_names.push(capture_name.clone()); + if !all_highlight_names.iter().any(|x| x == capture_name) { + all_highlight_names.push(capture_name.to_string()); } } } diff --git a/cli/src/tests/helpers/query_helpers.rs b/cli/src/tests/helpers/query_helpers.rs index a21320b1..4d71dfd0 100644 --- a/cli/src/tests/helpers/query_helpers.rs +++ b/cli/src/tests/helpers/query_helpers.rs @@ -353,7 +353,7 @@ fn format_captures<'a>( captures .map(|capture| { ( - query.capture_names()[capture.index as usize].as_str(), + query.capture_names()[capture.index as usize], capture.node.utf8_text(source.as_bytes()).unwrap(), ) }) diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index ed1f9e25..51c783e7 100644 --- 
a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -2269,7 +2269,7 @@ fn test_query_captures_within_byte_range_assigned_after_iterating() { for (mat, capture_ix) in captures.by_ref().take(5) { let capture = mat.captures[capture_ix as usize]; results.push(( - query.capture_names()[capture.index as usize].as_str(), + query.capture_names()[capture.index as usize], &source[capture.node.byte_range()], )); } @@ -2292,7 +2292,7 @@ fn test_query_captures_within_byte_range_assigned_after_iterating() { for (mat, capture_ix) in captures { let capture = mat.captures[capture_ix as usize]; results.push(( - query.capture_names()[capture.index as usize].as_str(), + query.capture_names()[capture.index as usize], &source[capture.node.byte_range()], )); } @@ -2533,7 +2533,7 @@ fn test_query_matches_with_captured_wildcard_at_root() { .iter() .map(|c| { ( - query.capture_names()[c.index as usize].as_str(), + query.capture_names()[c.index as usize], c.node.kind(), c.node.start_position().row, ) @@ -2934,7 +2934,8 @@ fn test_query_captures_with_predicates() { args: vec![ QueryPredicateArg::Capture(0), QueryPredicateArg::String("omg".to_string().into_boxed_str()), - ], + ] + .into_boxed_slice(), },] ); assert_eq!(query.property_settings(1), &[]); @@ -3826,7 +3827,7 @@ fn test_query_random() { captures: mat .captures .iter() - .map(|c| (query.capture_names()[c.index as usize].as_str(), c.node)) + .map(|c| (query.capture_names()[c.index as usize], c.node)) .collect::>(), }) .collect::>(); diff --git a/highlight/src/lib.rs b/highlight/src/lib.rs index 2903c7c5..2170b07f 100644 --- a/highlight/src/lib.rs +++ b/highlight/src/lib.rs @@ -321,7 +321,7 @@ impl HighlightConfiguration { let mut local_scope_capture_index = None; for (i, name) in query.capture_names().iter().enumerate() { let i = Some(i as u32); - match name.as_str() { + match *name { "injection.content" => injection_content_capture_index = i, "injection.language" => injection_language_capture_index = i, 
"local.definition" => local_def_capture_index = i, @@ -353,7 +353,7 @@ impl HighlightConfiguration { } /// Get a slice containing all of the highlight names used in the configuration. - pub fn names(&self) -> &[String] { + pub fn names(&self) -> &[&str] { self.query.capture_names() } @@ -399,7 +399,7 @@ impl HighlightConfiguration { // Return the list of this configuration's capture names that are neither present in the // list of predefined 'canonical' names nor start with an underscore (denoting 'private' captures // used as part of capture internals). - pub fn nonconformant_capture_names(&self, capture_names: &HashSet<&str>) -> Vec<&String> { + pub fn nonconformant_capture_names(&self, capture_names: &HashSet<&str>) -> Vec<&str> { let capture_names = if capture_names.is_empty() { &*STANDARD_CAPTURE_NAMES } else { @@ -407,7 +407,8 @@ impl HighlightConfiguration { }; self.names() .iter() - .filter(|&n| !(n.starts_with('_') || capture_names.contains(n.as_str()))) + .filter(|&n| !(n.starts_with('_') || capture_names.contains(n))) + .map(|n| *n) .collect() } } diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 8762c7f6..81204625 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -116,12 +116,12 @@ pub struct TreeCursor<'cursor>(ffi::TSTreeCursor, PhantomData<&'cursor ()>); #[derive(Debug)] pub struct Query { ptr: NonNull, - capture_names: Vec, - capture_quantifiers: Vec>, - text_predicates: Vec>, - property_settings: Vec>, - property_predicates: Vec>, - general_predicates: Vec>, + capture_names: Box<[&'static str]>, + capture_quantifiers: Box<[Box<[CaptureQuantifier]>]>, + text_predicates: Box<[Box<[TextPredicateCapture]>]>, + property_settings: Box<[Box<[QueryProperty]>]>, + property_predicates: Box<[Box<[(QueryProperty, bool)]>]>, + general_predicates: Box<[Box<[QueryPredicate]>]>, } /// A quantifier for captures @@ -171,7 +171,7 @@ pub enum QueryPredicateArg { #[derive(Debug, PartialEq, Eq)] pub struct QueryPredicate { pub 
operator: Box, - pub args: Vec, + pub args: Box<[QueryPredicateArg]>, } /// A match of a [`Query`] to a particular set of [`Node`]s. @@ -256,10 +256,10 @@ pub enum QueryErrorKind { /// The last item is a bool signifying whether or not it's meant to match /// any or all captures enum TextPredicateCapture { - EqString(u32, String, bool, bool), + EqString(u32, Box, bool, bool), EqCapture(u32, u32, bool, bool), MatchString(u32, regex::bytes::Regex, bool, bool), - AnyString(u32, Vec, bool), + AnyString(u32, Box<[Box]>, bool), } // TODO: Remove this struct at at some point. If `core::str::lossy::Utf8Lossy` @@ -1643,29 +1643,37 @@ impl Query { } #[doc(hidden)] - unsafe fn from_raw_parts(ptr: *mut ffi::TSQuery, source: &str) -> Result { - let string_count = unsafe { ffi::ts_query_string_count(ptr) }; - let capture_count = unsafe { ffi::ts_query_capture_count(ptr) }; - let pattern_count = unsafe { ffi::ts_query_pattern_count(ptr) as usize }; - let mut result = Query { - ptr: unsafe { NonNull::new_unchecked(ptr) }, - capture_names: Vec::with_capacity(capture_count as usize), - capture_quantifiers: Vec::with_capacity(pattern_count as usize), - text_predicates: Vec::with_capacity(pattern_count), - property_predicates: Vec::with_capacity(pattern_count), - property_settings: Vec::with_capacity(pattern_count), - general_predicates: Vec::with_capacity(pattern_count), + unsafe fn from_raw_parts(ptr: *mut ffi::TSQuery, source: &str) -> Result { + let ptr = { + struct TSQueryDrop(*mut ffi::TSQuery); + impl Drop for TSQueryDrop { + fn drop(&mut self) { + unsafe { ffi::ts_query_delete(self.0) } + } + } + TSQueryDrop(ptr) }; + let string_count = unsafe { ffi::ts_query_string_count(ptr.0) }; + let capture_count = unsafe { ffi::ts_query_capture_count(ptr.0) }; + let pattern_count = unsafe { ffi::ts_query_pattern_count(ptr.0) as usize }; + + let mut capture_names = Vec::with_capacity(capture_count as usize); + let mut capture_quantifiers_vec = Vec::with_capacity(pattern_count as usize); + 
let mut text_predicates_vec = Vec::with_capacity(pattern_count); + let mut property_predicates_vec = Vec::with_capacity(pattern_count); + let mut property_settings_vec = Vec::with_capacity(pattern_count); + let mut general_predicates_vec = Vec::with_capacity(pattern_count); + // Build a vector of strings to store the capture names. for i in 0..capture_count { unsafe { let mut length = 0u32; - let name = - ffi::ts_query_capture_name_for_id(ptr, i, &mut length as *mut u32) as *const u8; + let name = ffi::ts_query_capture_name_for_id(ptr.0, i, &mut length as *mut u32) + as *const u8; let name = slice::from_raw_parts(name, length as usize); let name = str::from_utf8_unchecked(name); - result.capture_names.push(name.to_string()); + capture_names.push(name); } } @@ -1674,11 +1682,11 @@ impl Query { let mut capture_quantifiers = Vec::with_capacity(capture_count as usize); for j in 0..capture_count { unsafe { - let quantifier = ffi::ts_query_capture_quantifier_for_id(ptr, i as u32, j); + let quantifier = ffi::ts_query_capture_quantifier_for_id(ptr.0, i as u32, j); capture_quantifiers.push(quantifier.into()); } } - result.capture_quantifiers.push(capture_quantifiers); + capture_quantifiers_vec.push(capture_quantifiers.into()); } // Build a vector of strings to represent literal values used in predicates. 
@@ -1686,11 +1694,11 @@ impl Query { .map(|i| unsafe { let mut length = 0u32; let value = - ffi::ts_query_string_value_for_id(ptr, i as u32, &mut length as *mut u32) + ffi::ts_query_string_value_for_id(ptr.0, i as u32, &mut length as *mut u32) as *const u8; let value = slice::from_raw_parts(value, length as usize); let value = str::from_utf8_unchecked(value); - value.to_string() + value }) .collect::>(); @@ -1699,13 +1707,13 @@ impl Query { let predicate_steps = unsafe { let mut length = 0u32; let raw_predicates = - ffi::ts_query_predicates_for_pattern(ptr, i as u32, &mut length as *mut u32); + ffi::ts_query_predicates_for_pattern(ptr.0, i as u32, &mut length as *mut u32); (length > 0) .then(|| slice::from_raw_parts(raw_predicates, length as usize)) .unwrap_or_default() }; - let byte_offset = unsafe { ffi::ts_query_start_byte_for_pattern(ptr, i as u32) }; + let byte_offset = unsafe { ffi::ts_query_start_byte_for_pattern(ptr.0, i as u32) }; let row = source .char_indices() .take_while(|(i, _)| *i < byte_offset as usize) @@ -1730,14 +1738,14 @@ impl Query { row, format!( "Expected predicate to start with a function name. Got @{}.", - result.capture_names[p[0].value_id as usize], + capture_names[p[0].value_id as usize], ), )); } // Build a predicate for each of the known predicate function names. - let operator_name = &string_values[p[0].value_id as usize]; - match operator_name.as_str() { + let operator_name = string_values[p[0].value_id as usize]; + match operator_name { "eq?" | "not-eq?" | "any-eq?" | "any-not-eq?" => { if p.len() != 3 { return Err(predicate_error( @@ -1756,7 +1764,7 @@ impl Query { } let is_positive = operator_name == "eq?" || operator_name == "any-eq?"; - let match_all = match operator_name.as_str() { + let match_all = match operator_name { "eq?" | "not-eq?" => true, "any-eq?" | "any-not-eq?" 
=> false, _ => unreachable!(), @@ -1771,7 +1779,7 @@ impl Query { } else { TextPredicateCapture::EqString( p[1].value_id, - string_values[p[2].value_id as usize].clone(), + string_values[p[2].value_id as usize].to_string().into(), is_positive, match_all, ) @@ -1794,13 +1802,13 @@ impl Query { if p[2].type_ == type_capture { return Err(predicate_error(row, format!( "Second argument to #match? predicate must be a literal. Got capture @{}.", - result.capture_names[p[2].value_id as usize], + capture_names[p[2].value_id as usize], ))); } let is_positive = operator_name == "match?" || operator_name == "any-match?"; - let match_all = match operator_name.as_str() { + let match_all = match operator_name { "match?" | "not-match?" => true, "any-match?" | "any-not-match?" => false, _ => unreachable!(), @@ -1818,8 +1826,8 @@ impl Query { "set!" => property_settings.push(Self::parse_property( row, - operator_name, - &result.capture_names, + &operator_name, + &capture_names, &string_values, &p[1..], )?), @@ -1827,8 +1835,8 @@ impl Query { "is?" | "is-not?" => property_predicates.push(( Self::parse_property( row, - operator_name, - &result.capture_names, + &operator_name, + &capture_names, &string_values, &p[1..], )?, @@ -1855,20 +1863,24 @@ impl Query { if arg.type_ == type_capture { return Err(predicate_error(row, format!( "Arguments to #any-of? predicate must be literals. Got capture @{}.", - result.capture_names[arg.value_id as usize], + capture_names[arg.value_id as usize], ))); } - values.push(string_values[arg.value_id as usize].clone()); + values.push(string_values[arg.value_id as usize]); } text_predicates.push(TextPredicateCapture::AnyString( p[1].value_id, - values, + values + .iter() + .map(|x| x.to_string().into()) + .collect::>() + .into(), is_positive, )); } _ => general_predicates.push(QueryPredicate { - operator: operator_name.clone().into_boxed_str(), + operator: operator_name.to_string().into(), args: p[1..] 
.iter() .map(|a| { @@ -1876,7 +1888,7 @@ impl Query { QueryPredicateArg::Capture(a.value_id) } else { QueryPredicateArg::String( - string_values[a.value_id as usize].clone().into_boxed_str(), + string_values[a.value_id as usize].to_string().into(), ) } }) @@ -1885,20 +1897,24 @@ impl Query { } } - result - .text_predicates - .push(text_predicates.into_boxed_slice()); - result - .property_predicates - .push(property_predicates.into_boxed_slice()); - result - .property_settings - .push(property_settings.into_boxed_slice()); - result - .general_predicates - .push(general_predicates.into_boxed_slice()); + text_predicates_vec.push(text_predicates.into()); + property_predicates_vec.push(property_predicates.into()); + property_settings_vec.push(property_settings.into()); + general_predicates_vec.push(general_predicates.into()); } + let result = Query { + ptr: unsafe { NonNull::new_unchecked(ptr.0) }, + capture_names: capture_names.into(), + capture_quantifiers: capture_quantifiers_vec.into(), + text_predicates: text_predicates_vec.into(), + property_predicates: property_predicates_vec.into(), + property_settings: property_settings_vec.into(), + general_predicates: general_predicates_vec.into(), + }; + + std::mem::forget(ptr); + Ok(result) } @@ -1924,7 +1940,7 @@ impl Query { } /// Get the names of the captures used in the query. 
- pub fn capture_names(&self) -> &[String] { + pub fn capture_names(&self) -> &[&str] { &self.capture_names } @@ -1937,7 +1953,7 @@ impl Query { pub fn capture_index_for_name(&self, name: &str) -> Option { self.capture_names .iter() - .position(|n| n == name) + .position(|n| *n == name) .map(|ix| ix as u32) } @@ -2016,8 +2032,8 @@ impl Query { fn parse_property( row: usize, function_name: &str, - capture_names: &[String], - string_values: &[String], + capture_names: &[&str], + string_values: &[&str], args: &[ffi::TSQueryPredicateStep], ) -> Result { if args.len() == 0 || args.len() > 3 { @@ -2050,7 +2066,7 @@ impl Query { } else if key.is_none() { key = Some(&string_values[arg.value_id as usize]); } else if value.is_none() { - value = Some(string_values[arg.value_id as usize].as_str()); + value = Some(string_values[arg.value_id as usize]); } else { return Err(predicate_error( row, @@ -2349,8 +2365,8 @@ impl QueryProperty { pub fn new(key: &str, value: Option<&str>, capture_id: Option) -> Self { QueryProperty { capture_id, - key: key.to_string().into_boxed_str(), - value: value.map(|s| s.to_string().into_boxed_str()), + key: key.to_string().into(), + value: value.map(|s| s.to_string().into()), } } } diff --git a/tags/src/lib.rs b/tags/src/lib.rs index 0cf1bf96..e151e3ee 100644 --- a/tags/src/lib.rs +++ b/tags/src/lib.rs @@ -136,7 +136,7 @@ impl TagsConfiguration { let mut local_scope_capture_index = None; let mut local_definition_capture_index = None; for (i, name) in query.capture_names().iter().enumerate() { - match name.as_str() { + match *name { "" => continue, "name" => name_capture_index = Some(i as u32), "ignore" => ignore_capture_index = Some(i as u32), From 08ac19086babd0ea7c4744e0e4b80f1c145b7e6d Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Fri, 1 Sep 2023 20:28:31 +0300 Subject: [PATCH 329/347] chore: simplify test case after query state improvements --- cli/src/tests/query_test.rs | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff 
--git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index 51c783e7..5fb33e01 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -3605,12 +3605,7 @@ fn test_query_capture_names() { assert_eq!( query.capture_names(), - &[ - "left-operand".to_string(), - "right-operand".to_string(), - "body".to_string(), - "loop-condition".to_string(), - ] + ["left-operand", "right-operand", "body", "loop-condition"] ); }); } From 67a5dbdd935d284a406e898d074b2cc820a98508 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 3 Sep 2023 05:52:24 +0300 Subject: [PATCH 330/347] fix: dealloc calls on zero pointers --- cli/src/tests/helpers/allocations.rs | 4 +++- lib/binding_rust/util.rs | 4 +++- lib/src/array.h | 10 ++++++---- 3 files changed, 12 insertions(+), 6 deletions(-) diff --git a/cli/src/tests/helpers/allocations.rs b/cli/src/tests/helpers/allocations.rs index 2ab80291..0d2331d3 100644 --- a/cli/src/tests/helpers/allocations.rs +++ b/cli/src/tests/helpers/allocations.rs @@ -107,7 +107,9 @@ unsafe extern "C" fn ts_record_calloc(count: usize, size: usize) -> *mut c_void } unsafe extern "C" fn ts_record_realloc(ptr: *mut c_void, size: usize) -> *mut c_void { - record_dealloc(ptr); + if !ptr.is_null() { + record_dealloc(ptr); + } let result = realloc(ptr, size); record_alloc(result); result diff --git a/lib/binding_rust/util.rs b/lib/binding_rust/util.rs index 5eda71f4..d5a73437 100644 --- a/lib/binding_rust/util.rs +++ b/lib/binding_rust/util.rs @@ -37,6 +37,8 @@ impl ExactSizeIterator for CBufferIter {} impl Drop for CBufferIter { fn drop(&mut self) { - unsafe { (FREE_FN)(self.ptr as *mut c_void) }; + if !self.ptr.is_null() { + unsafe { (FREE_FN)(self.ptr as *mut c_void) }; + } } } diff --git a/lib/src/array.h b/lib/src/array.h index e5cd361f..e026f6b2 100644 --- a/lib/src/array.h +++ b/lib/src/array.h @@ -132,10 +132,12 @@ typedef Array(void) VoidArray; #define array__elem_size(self) sizeof(*(self)->contents) static inline void 
array__delete(VoidArray *self) { - ts_free(self->contents); - self->contents = NULL; - self->size = 0; - self->capacity = 0; + if (self->contents) { + ts_free(self->contents); + self->contents = NULL; + self->size = 0; + self->capacity = 0; + } } static inline void array__erase(VoidArray *self, size_t element_size, From 7f7084c2cb64a1617746ac6c7bbdb773131593a7 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 3 Sep 2023 05:29:48 +0300 Subject: [PATCH 331/347] chore(test): panic on zero pointer deallocs for alloc tracked scopes --- cli/src/tests/helpers/allocations.rs | 13 +++++++++---- 1 file changed, 9 insertions(+), 4 deletions(-) diff --git a/cli/src/tests/helpers/allocations.rs b/cli/src/tests/helpers/allocations.rs index 0d2331d3..43537633 100644 --- a/cli/src/tests/helpers/allocations.rs +++ b/cli/src/tests/helpers/allocations.rs @@ -83,6 +83,9 @@ fn record_alloc(ptr: *mut c_void) { } fn record_dealloc(ptr: *mut c_void) { + if ptr.is_null() { + panic!("Zero pointer deallocation!"); + } RECORDER.with(|recorder| { if recorder.enabled.load(SeqCst) { recorder @@ -107,11 +110,13 @@ unsafe extern "C" fn ts_record_calloc(count: usize, size: usize) -> *mut c_void } unsafe extern "C" fn ts_record_realloc(ptr: *mut c_void, size: usize) -> *mut c_void { - if !ptr.is_null() { - record_dealloc(ptr); - } let result = realloc(ptr, size); - record_alloc(result); + if ptr.is_null() { + record_alloc(result); + } else if ptr != result { + record_dealloc(ptr); + record_alloc(result); + } result } From 9cc1daafcab760224a767d1dc37b25a5d5344530 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Sun, 3 Sep 2023 06:47:27 +0300 Subject: [PATCH 332/347] chore(ffi): remove enum name prefixes from all C enum values --- cli/src/main.rs | 4 +-- cli/src/parse.rs | 2 +- lib/binding_rust/bindings.rs | 44 ++++++++++++------------- lib/binding_rust/build.rs | 1 + lib/binding_rust/lib.rs | 63 +++++++++++++++++------------------- script/generate-bindings | 1 + 6 files changed, 57 
insertions(+), 58 deletions(-) diff --git a/cli/src/main.rs b/cli/src/main.rs index fbdb0343..6699d764 100644 --- a/cli/src/main.rs +++ b/cli/src/main.rs @@ -448,8 +448,8 @@ fn run() -> Result<()> { matches .values_of("encoding") .map_or(Ok(None), |mut e| match e.next() { - Some("utf16") => Ok(Some(ffi::TSInputEncoding_TSInputEncodingUTF16)), - Some("utf8") => Ok(Some(ffi::TSInputEncoding_TSInputEncodingUTF8)), + Some("utf16") => Ok(Some(ffi::TSInputEncodingUTF16)), + Some("utf8") => Ok(Some(ffi::TSInputEncodingUTF8)), Some(_) => Err(anyhow!("Invalid encoding. Expected one of: utf8, utf16")), None => Ok(None), })?; diff --git a/cli/src/parse.rs b/cli/src/parse.rs index 3647c2c4..5b1a4b31 100644 --- a/cli/src/parse.rs +++ b/cli/src/parse.rs @@ -88,7 +88,7 @@ pub fn parse_file_at_path(opts: ParseFileOptions) -> Result { } let tree = match opts.encoding { - Some(encoding) if encoding == ffi::TSInputEncoding_TSInputEncodingUTF16 => { + Some(encoding) if encoding == ffi::TSInputEncodingUTF16 => { let source_code_utf16 = source_code .chunks_exact(2) .map(|chunk| u16::from_le_bytes([chunk[0], chunk[1]])) diff --git a/lib/binding_rust/bindings.rs b/lib/binding_rust/bindings.rs index a0e52f6c..c25bc1e4 100644 --- a/lib/binding_rust/bindings.rs +++ b/lib/binding_rust/bindings.rs @@ -35,12 +35,12 @@ pub struct TSQueryCursor { pub struct TSLookaheadIterator { _unused: [u8; 0], } -pub const TSInputEncoding_TSInputEncodingUTF8: TSInputEncoding = 0; -pub const TSInputEncoding_TSInputEncodingUTF16: TSInputEncoding = 1; +pub const TSInputEncodingUTF8: TSInputEncoding = 0; +pub const TSInputEncodingUTF16: TSInputEncoding = 1; pub type TSInputEncoding = ::std::os::raw::c_uint; -pub const TSSymbolType_TSSymbolTypeRegular: TSSymbolType = 0; -pub const TSSymbolType_TSSymbolTypeAnonymous: TSSymbolType = 1; -pub const TSSymbolType_TSSymbolTypeAuxiliary: TSSymbolType = 2; +pub const TSSymbolTypeRegular: TSSymbolType = 0; +pub const TSSymbolTypeAnonymous: TSSymbolType = 1; +pub const 
TSSymbolTypeAuxiliary: TSSymbolType = 2; pub type TSSymbolType = ::std::os::raw::c_uint; #[repr(C)] #[derive(Debug, Copy, Clone)] @@ -70,8 +70,8 @@ pub struct TSInput { >, pub encoding: TSInputEncoding, } -pub const TSLogType_TSLogTypeParse: TSLogType = 0; -pub const TSLogType_TSLogTypeLex: TSLogType = 1; +pub const TSLogTypeParse: TSLogType = 0; +pub const TSLogTypeLex: TSLogType = 1; pub type TSLogType = ::std::os::raw::c_uint; #[repr(C)] #[derive(Debug)] @@ -115,11 +115,11 @@ pub struct TSQueryCapture { pub node: TSNode, pub index: u32, } -pub const TSQuantifier_TSQuantifierZero: TSQuantifier = 0; -pub const TSQuantifier_TSQuantifierZeroOrOne: TSQuantifier = 1; -pub const TSQuantifier_TSQuantifierZeroOrMore: TSQuantifier = 2; -pub const TSQuantifier_TSQuantifierOne: TSQuantifier = 3; -pub const TSQuantifier_TSQuantifierOneOrMore: TSQuantifier = 4; +pub const TSQuantifierZero: TSQuantifier = 0; +pub const TSQuantifierZeroOrOne: TSQuantifier = 1; +pub const TSQuantifierZeroOrMore: TSQuantifier = 2; +pub const TSQuantifierOne: TSQuantifier = 3; +pub const TSQuantifierOneOrMore: TSQuantifier = 4; pub type TSQuantifier = ::std::os::raw::c_uint; #[repr(C)] #[derive(Debug)] @@ -129,9 +129,9 @@ pub struct TSQueryMatch { pub capture_count: u16, pub captures: *const TSQueryCapture, } -pub const TSQueryPredicateStepType_TSQueryPredicateStepTypeDone: TSQueryPredicateStepType = 0; -pub const TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture: TSQueryPredicateStepType = 1; -pub const TSQueryPredicateStepType_TSQueryPredicateStepTypeString: TSQueryPredicateStepType = 2; +pub const TSQueryPredicateStepTypeDone: TSQueryPredicateStepType = 0; +pub const TSQueryPredicateStepTypeCapture: TSQueryPredicateStepType = 1; +pub const TSQueryPredicateStepTypeString: TSQueryPredicateStepType = 2; pub type TSQueryPredicateStepType = ::std::os::raw::c_uint; #[repr(C)] #[derive(Debug)] @@ -139,13 +139,13 @@ pub struct TSQueryPredicateStep { pub type_: TSQueryPredicateStepType, pub 
value_id: u32, } -pub const TSQueryError_TSQueryErrorNone: TSQueryError = 0; -pub const TSQueryError_TSQueryErrorSyntax: TSQueryError = 1; -pub const TSQueryError_TSQueryErrorNodeType: TSQueryError = 2; -pub const TSQueryError_TSQueryErrorField: TSQueryError = 3; -pub const TSQueryError_TSQueryErrorCapture: TSQueryError = 4; -pub const TSQueryError_TSQueryErrorStructure: TSQueryError = 5; -pub const TSQueryError_TSQueryErrorLanguage: TSQueryError = 6; +pub const TSQueryErrorNone: TSQueryError = 0; +pub const TSQueryErrorSyntax: TSQueryError = 1; +pub const TSQueryErrorNodeType: TSQueryError = 2; +pub const TSQueryErrorField: TSQueryError = 3; +pub const TSQueryErrorCapture: TSQueryError = 4; +pub const TSQueryErrorStructure: TSQueryError = 5; +pub const TSQueryErrorLanguage: TSQueryError = 6; pub type TSQueryError = ::std::os::raw::c_uint; extern "C" { #[doc = " Create a new parser."] diff --git a/lib/binding_rust/build.rs b/lib/binding_rust/build.rs index a74bdb27..690d1527 100644 --- a/lib/binding_rust/build.rs +++ b/lib/binding_rust/build.rs @@ -64,6 +64,7 @@ fn generate_bindings() { .allowlist_function("^ts_.*") .allowlist_var("^TREE_SITTER.*") .no_copy(no_copy.join("|")) + .prepend_enum_name(false) .generate() .expect("Failed to generate bindings"); diff --git a/lib/binding_rust/lib.rs b/lib/binding_rust/lib.rs index 81204625..fdd661dd 100644 --- a/lib/binding_rust/lib.rs +++ b/lib/binding_rust/lib.rs @@ -137,11 +137,11 @@ pub enum CaptureQuantifier { impl From for CaptureQuantifier { fn from(value: ffi::TSQuantifier) -> Self { match value { - ffi::TSQuantifier_TSQuantifierZero => CaptureQuantifier::Zero, - ffi::TSQuantifier_TSQuantifierZeroOrOne => CaptureQuantifier::ZeroOrOne, - ffi::TSQuantifier_TSQuantifierZeroOrMore => CaptureQuantifier::ZeroOrMore, - ffi::TSQuantifier_TSQuantifierOne => CaptureQuantifier::One, - ffi::TSQuantifier_TSQuantifierOneOrMore => CaptureQuantifier::OneOrMore, + ffi::TSQuantifierZero => CaptureQuantifier::Zero, + 
ffi::TSQuantifierZeroOrOne => CaptureQuantifier::ZeroOrOne, + ffi::TSQuantifierZeroOrMore => CaptureQuantifier::ZeroOrMore, + ffi::TSQuantifierOne => CaptureQuantifier::One, + ffi::TSQuantifierOneOrMore => CaptureQuantifier::OneOrMore, _ => panic!("Unrecognized quantifier: {}", value), } } @@ -312,14 +312,12 @@ impl Language { /// Check if the node type for the given numerical id is named (as opposed /// to an anonymous node type). pub fn node_kind_is_named(&self, id: u16) -> bool { - unsafe { ffi::ts_language_symbol_type(self.0, id) == ffi::TSSymbolType_TSSymbolTypeRegular } + unsafe { ffi::ts_language_symbol_type(self.0, id) == ffi::TSSymbolTypeRegular } } #[doc(alias = "ts_language_symbol_type")] pub fn node_kind_is_visible(&self, id: u16) -> bool { - unsafe { - ffi::ts_language_symbol_type(self.0, id) <= ffi::TSSymbolType_TSSymbolTypeAnonymous - } + unsafe { ffi::ts_language_symbol_type(self.0, id) <= ffi::TSSymbolTypeAnonymous } } /// Get the number of distinct field names in this language. 
@@ -445,7 +443,7 @@ impl Parser { ) { let callback = (payload as *mut Logger).as_mut().unwrap(); if let Ok(message) = CStr::from_ptr(c_message).to_str() { - let log_type = if c_log_type == ffi::TSLogType_TSLogTypeParse { + let log_type = if c_log_type == ffi::TSLogTypeParse { LogType::Parse } else { LogType::Lex @@ -571,7 +569,7 @@ impl Parser { let c_input = ffi::TSInput { payload: &mut payload as *mut (&mut F, Option) as *mut c_void, read: Some(read::), - encoding: ffi::TSInputEncoding_TSInputEncodingUTF8, + encoding: ffi::TSInputEncodingUTF8, }; let c_old_tree = old_tree.map_or(ptr::null_mut(), |t| t.0.as_ptr()); @@ -627,7 +625,7 @@ impl Parser { let c_input = ffi::TSInput { payload: &mut payload as *mut (&mut F, Option) as *mut c_void, read: Some(read::), - encoding: ffi::TSInputEncoding_TSInputEncodingUTF16, + encoding: ffi::TSInputEncodingUTF16, }; let c_old_tree = old_tree.map_or(ptr::null_mut(), |t| t.0.as_ptr()); @@ -1568,7 +1566,7 @@ impl Query { // On failure, build an error based on the error code and offset. 
if ptr.is_null() { - if error_type == ffi::TSQueryError_TSQueryErrorLanguage { + if error_type == ffi::TSQueryErrorLanguage { return Err(QueryError { row: 0, column: 0, @@ -1600,18 +1598,16 @@ impl Query { let message; match error_type { // Error types that report names - ffi::TSQueryError_TSQueryErrorNodeType - | ffi::TSQueryError_TSQueryErrorField - | ffi::TSQueryError_TSQueryErrorCapture => { + ffi::TSQueryErrorNodeType | ffi::TSQueryErrorField | ffi::TSQueryErrorCapture => { let suffix = source.split_at(offset).1; let end_offset = suffix .find(|c| !char::is_alphanumeric(c) && c != '_' && c != '-') .unwrap_or(suffix.len()); message = suffix.split_at(end_offset).0.to_string(); kind = match error_type { - ffi::TSQueryError_TSQueryErrorNodeType => QueryErrorKind::NodeType, - ffi::TSQueryError_TSQueryErrorField => QueryErrorKind::Field, - ffi::TSQueryError_TSQueryErrorCapture => QueryErrorKind::Capture, + ffi::TSQueryErrorNodeType => QueryErrorKind::NodeType, + ffi::TSQueryErrorField => QueryErrorKind::Field, + ffi::TSQueryErrorCapture => QueryErrorKind::Capture, _ => unreachable!(), }; } @@ -1624,7 +1620,7 @@ impl Query { "Unexpected EOF".to_string() }; kind = match error_type { - ffi::TSQueryError_TSQueryErrorStructure => QueryErrorKind::Structure, + ffi::TSQueryErrorStructure => QueryErrorKind::Structure, _ => QueryErrorKind::Syntax, }; } @@ -1720,20 +1716,21 @@ impl Query { .filter(|(_, c)| *c == '\n') .count(); - let type_done = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeDone; - let type_capture = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture; - let type_string = ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeString; + use ffi::TSQueryPredicateStepType as T; + const TYPE_DONE: T = ffi::TSQueryPredicateStepTypeDone; + const TYPE_CAPTURE: T = ffi::TSQueryPredicateStepTypeCapture; + const TYPE_STRING: T = ffi::TSQueryPredicateStepTypeString; let mut text_predicates = Vec::new(); let mut property_predicates = Vec::new(); let mut 
property_settings = Vec::new(); let mut general_predicates = Vec::new(); - for p in predicate_steps.split(|s| s.type_ == type_done) { + for p in predicate_steps.split(|s| s.type_ == TYPE_DONE) { if p.is_empty() { continue; } - if p[0].type_ != type_string { + if p[0].type_ != TYPE_STRING { return Err(predicate_error( row, format!( @@ -1756,7 +1753,7 @@ impl Query { ), )); } - if p[1].type_ != type_capture { + if p[1].type_ != TYPE_CAPTURE { return Err(predicate_error(row, format!( "First argument to #eq? predicate must be a capture name. Got literal \"{}\".", string_values[p[1].value_id as usize], @@ -1769,7 +1766,7 @@ impl Query { "any-eq?" | "any-not-eq?" => false, _ => unreachable!(), }; - text_predicates.push(if p[2].type_ == type_capture { + text_predicates.push(if p[2].type_ == TYPE_CAPTURE { TextPredicateCapture::EqCapture( p[1].value_id, p[2].value_id, @@ -1793,13 +1790,13 @@ impl Query { p.len() - 1 ))); } - if p[1].type_ != type_capture { + if p[1].type_ != TYPE_CAPTURE { return Err(predicate_error(row, format!( "First argument to #match? predicate must be a capture name. Got literal \"{}\".", string_values[p[1].value_id as usize], ))); } - if p[2].type_ == type_capture { + if p[2].type_ == TYPE_CAPTURE { return Err(predicate_error(row, format!( "Second argument to #match? predicate must be a literal. Got capture @{}.", capture_names[p[2].value_id as usize], @@ -1850,7 +1847,7 @@ impl Query { p.len() - 1 ))); } - if p[1].type_ != type_capture { + if p[1].type_ != TYPE_CAPTURE { return Err(predicate_error(row, format!( "First argument to #any-of? predicate must be a capture name. Got literal \"{}\".", string_values[p[1].value_id as usize], @@ -1860,7 +1857,7 @@ impl Query { let is_positive = operator_name == "any-of?"; let mut values = Vec::new(); for arg in &p[2..] { - if arg.type_ == type_capture { + if arg.type_ == TYPE_CAPTURE { return Err(predicate_error(row, format!( "Arguments to #any-of? predicate must be literals. 
Got capture @{}.", capture_names[arg.value_id as usize], @@ -1884,7 +1881,7 @@ impl Query { args: p[1..] .iter() .map(|a| { - if a.type_ == type_capture { + if a.type_ == TYPE_CAPTURE { QueryPredicateArg::Capture(a.value_id) } else { QueryPredicateArg::String( @@ -2052,7 +2049,7 @@ impl Query { let mut value = None; for arg in args { - if arg.type_ == ffi::TSQueryPredicateStepType_TSQueryPredicateStepTypeCapture { + if arg.type_ == ffi::TSQueryPredicateStepTypeCapture { if capture_id.is_some() { return Err(predicate_error( row, diff --git a/script/generate-bindings b/script/generate-bindings index 52fc43f3..9ced5712 100755 --- a/script/generate-bindings +++ b/script/generate-bindings @@ -35,5 +35,6 @@ bindgen \ --allowlist-function '^ts_.*' \ --allowlist-var "^TREE_SITTER.*" \ --blocklist-type '^__.*' \ + --no-prepend-enum-name \ --no-copy "$no_copy" \ $header_path > $output_path From 46965770fc554acdda414f70b4a1566e66988a5e Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 30 Aug 2023 20:03:03 +0300 Subject: [PATCH 333/347] fix(lib): segmentation fault in `ts_node_parse_state` --- lib/src/node.c | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/lib/src/node.c b/lib/src/node.c index 092e96f8..546b9099 100644 --- a/lib/src/node.c +++ b/lib/src/node.c @@ -489,8 +489,10 @@ TSStateId ts_node_parse_state(TSNode self) { TSStateId ts_node_next_parse_state(TSNode self) { const TSLanguage *language = self.tree->language; uint16_t state = ts_node_parse_state(self); + if (state == TS_TREE_STATE_NONE) { + return TS_TREE_STATE_NONE; + } uint16_t symbol = ts_node_grammar_symbol(self); - return ts_language_next_state(language, state, symbol); } From 6d4aac723f7951dfecedafed5f80e5bc231a5ff0 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Tue, 19 Sep 2023 09:29:13 -0400 Subject: [PATCH 334/347] feat: add some more commonly used functions to exports.json --- lib/binding_web/exports.json | 5 +++++ 1 file changed, 5 insertions(+) diff --git 
a/lib/binding_web/exports.json b/lib/binding_web/exports.json index ad7a6987..bc794480 100644 --- a/lib/binding_web/exports.json +++ b/lib/binding_web/exports.json @@ -18,10 +18,13 @@ "___cxa_atexit", "_abort", "_isalpha", + "_isspace", "_iswalnum", "_iswalpha", + "_iswblank", "_iswdigit", "_iswlower", + "_iswupper", "_iswspace", "_memchr", "_memcmp", @@ -31,7 +34,9 @@ "_strlen", "_strcmp", "_strncpy", + "_tolower", "_towupper", + "_stderr", "_ts_init", "_ts_language_field_count", From 8d0997d5b4f38fbd94c188bb24c1fa5c088a3a4b Mon Sep 17 00:00:00 2001 From: dstoc <539597+dstoc@users.noreply.github.com> Date: Mon, 17 Oct 2022 16:53:34 +1100 Subject: [PATCH 335/347] Add towlower to wasm exports tree-sitter/tree-sitter#1906 --- lib/binding_web/exports.json | 1 + 1 file changed, 1 insertion(+) diff --git a/lib/binding_web/exports.json b/lib/binding_web/exports.json index bc794480..dfc9ff54 100644 --- a/lib/binding_web/exports.json +++ b/lib/binding_web/exports.json @@ -35,6 +35,7 @@ "_strcmp", "_strncpy", "_tolower", + "_towlower", "_towupper", "_stderr", From ef9cabd4b5e1eda9d5d3b9377f2bee4e781dafdf Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Wed, 20 Sep 2023 09:47:24 -0400 Subject: [PATCH 336/347] fix: update javascript tests and use cpp/javascript master for fixtures --- cli/src/tests/highlight_test.rs | 42 +++++------ cli/src/tests/parser_test.rs | 12 ++-- cli/src/tests/query_test.rs | 70 +++++++++---------- cli/src/tests/test_highlight_test.rs | 7 +- script/fetch-fixtures | 4 +- .../error_corpus/javascript_errors.txt | 8 +-- 6 files changed, 72 insertions(+), 71 deletions(-) diff --git a/cli/src/tests/highlight_test.rs b/cli/src/tests/highlight_test.rs index e400b047..12c120ab 100644 --- a/cli/src/tests/highlight_test.rs +++ b/cli/src/tests/highlight_test.rs @@ -62,7 +62,7 @@ lazy_static! 
{ fn test_highlighting_javascript() { let source = "const a = function(b) { return b + c; }"; assert_eq!( - &to_token_vector(&source, &JS_HIGHLIGHT).unwrap(), + &to_token_vector(source, &JS_HIGHLIGHT).unwrap(), &[vec![ ("const", vec!["keyword"]), (" ", vec![]), @@ -72,14 +72,14 @@ fn test_highlighting_javascript() { (" ", vec![]), ("function", vec!["keyword"]), ("(", vec!["punctuation.bracket"]), - ("b", vec!["variable.parameter"]), + ("b", vec!["variable"]), (")", vec!["punctuation.bracket"]), (" ", vec![]), ("{", vec!["punctuation.bracket"]), (" ", vec![]), ("return", vec!["keyword"]), (" ", vec![]), - ("b", vec!["variable.parameter"]), + ("b", vec!["variable"]), (" ", vec![]), ("+", vec!["operator"]), (" ", vec![]), @@ -93,7 +93,7 @@ fn test_highlighting_javascript() { #[test] fn test_highlighting_injected_html_in_javascript() { - let source = vec!["const s = html `
${a < b}
`;"].join("\n"); + let source = ["const s = html `
${a < b}
`;"].join("\n"); assert_eq!( &to_token_vector(&source, &JS_HIGHLIGHT).unwrap(), @@ -157,7 +157,7 @@ fn test_highlighting_injected_javascript_in_html_mini() { #[test] fn test_highlighting_injected_javascript_in_html() { - let source = vec![ + let source = [ "", " "].join("\n"); + let source = ["
<% foo() %>
"].join("\n"); assert_eq!( &to_token_vector(&source, &EJS_HIGHLIGHT).unwrap(), @@ -377,7 +377,7 @@ fn test_highlighting_ejs_with_html_and_javascript() { fn test_highlighting_javascript_with_jsdoc() { // Regression test: the middle comment has no highlights. This should not prevent // later injections from highlighting properly. - let source = vec!["a /* @see a */ b; /* nothing */ c; /* @see b */"].join("\n"); + let source = ["a /* @see a */ b; /* nothing */ c; /* @see b */"].join("\n"); assert_eq!( &to_token_vector(&source, &JS_HIGHLIGHT).unwrap(), @@ -405,7 +405,7 @@ fn test_highlighting_javascript_with_jsdoc() { #[test] fn test_highlighting_with_content_children_included() { - let source = vec!["assert!(", " a.b.c() < D::e::()", ");"].join("\n"); + let source = ["assert!(", " a.b.c() < D::e::()", ");"].join("\n"); assert_eq!( &to_token_vector(&source, &RUST_HIGHLIGHT).unwrap(), @@ -483,7 +483,7 @@ fn test_highlighting_cancellation() { #[test] fn test_highlighting_via_c_api() { - let highlights = vec![ + let highlights = [ "class=tag\0", "class=function\0", "class=string\0", @@ -622,11 +622,11 @@ fn test_highlighting_with_all_captures_applied() { [ \"{\" \"}\" \"(\" \")\" ] @punctuation.bracket "}; let mut rust_highlight_reverse = - HighlightConfiguration::new(language, "rust", &highlights_query, "", "", true).unwrap(); + HighlightConfiguration::new(language, "rust", highlights_query, "", "", true).unwrap(); rust_highlight_reverse.configure(&HIGHLIGHT_NAMES); assert_eq!( - &to_token_vector(&source, &rust_highlight_reverse).unwrap(), + &to_token_vector(source, &rust_highlight_reverse).unwrap(), &[[ ("fn", vec!["keyword"]), (" ", vec![]), @@ -743,20 +743,20 @@ fn to_token_vector<'a>( } HighlightEvent::Source { start, end } => { let s = str::from_utf8(&src[start..end]).unwrap(); - for (i, l) in s.split("\n").enumerate() { + for (i, l) in s.split('\n').enumerate() { let l = l.trim_end_matches('\r'); if i > 0 { lines.push(line); line = Vec::new(); } - if l.len() > 0 { 
+ if !l.is_empty() { line.push((l, highlights.clone())); } } } } } - if line.len() > 0 { + if !line.is_empty() { lines.push(line); } Ok(lines) diff --git a/cli/src/tests/parser_test.rs b/cli/src/tests/parser_test.rs index d490b78f..99616f56 100644 --- a/cli/src/tests/parser_test.rs +++ b/cli/src/tests/parser_test.rs @@ -148,7 +148,7 @@ fn test_parsing_with_custom_utf8_input() { ) ); assert_eq!(root.kind(), "source_file"); - assert_eq!(root.has_error(), false); + assert!(!root.has_error()); assert_eq!(root.child(0).unwrap().kind(), "function_item"); } @@ -187,7 +187,7 @@ fn test_parsing_with_custom_utf16_input() { "(source_file (function_item (visibility_modifier) name: (identifier) parameters: (parameters) body: (block (integer_literal))))" ); assert_eq!(root.kind(), "source_file"); - assert_eq!(root.has_error(), false); + assert!(!root.has_error()); assert_eq!(root.child(0).unwrap().kind(), "function_item"); } @@ -834,7 +834,7 @@ fn test_parsing_with_one_included_range() { concat!( "(program (expression_statement (call_expression ", "function: (member_expression object: (identifier) property: (property_identifier)) ", - "arguments: (arguments (string)))))", + "arguments: (arguments (string (string_fragment))))))", ) ); assert_eq!( @@ -1183,7 +1183,7 @@ fn test_parsing_with_a_newly_included_range() { .set_included_ranges(&[simple_range(range1_start, range1_end)]) .unwrap(); let tree = parser - .parse_with(&mut chunked_input(&source_code, 3), None) + .parse_with(&mut chunked_input(source_code, 3), None) .unwrap(); assert_eq!( tree.root_node().to_sexp(), @@ -1202,7 +1202,7 @@ fn test_parsing_with_a_newly_included_range() { ]) .unwrap(); let tree2 = parser - .parse_with(&mut chunked_input(&source_code, 3), Some(&tree)) + .parse_with(&mut chunked_input(source_code, 3), Some(&tree)) .unwrap(); assert_eq!( tree2.root_node().to_sexp(), @@ -1226,7 +1226,7 @@ fn test_parsing_with_a_newly_included_range() { simple_range(range3_start, range3_end), ]) .unwrap(); - let tree3 = 
parser.parse(&source_code, Some(&tree)).unwrap(); + let tree3 = parser.parse(source_code, Some(&tree)).unwrap(); assert_eq!( tree3.root_node().to_sexp(), concat!( diff --git a/cli/src/tests/query_test.rs b/cli/src/tests/query_test.rs index 5fb33e01..13e4f8d0 100644 --- a/cli/src/tests/query_test.rs +++ b/cli/src/tests/query_test.rs @@ -323,16 +323,16 @@ fn test_query_errors_on_impossible_patterns() { assert_eq!( Query::new( js_lang, - "(binary_expression left: (identifier) left: (identifier))" + "(binary_expression left: (expression (identifier)) left: (expression (identifier)))" ), Err(QueryError { kind: QueryErrorKind::Structure, row: 0, - offset: 38, - column: 38, + offset: 51, + column: 51, message: [ - "(binary_expression left: (identifier) left: (identifier))", - " ^" + "(binary_expression left: (expression (identifier)) left: (expression (identifier)))", + " ^", ] .join("\n"), }) @@ -437,19 +437,19 @@ fn test_query_errors_on_impossible_patterns() { Query::new( js_lang, "(if_statement - condition: (parenthesized_expression (_expression) @cond))", + condition: (parenthesized_expression (expression) @cond))", ) .unwrap(); assert_eq!( - Query::new(js_lang, "(if_statement condition: (_expression))",), + Query::new(js_lang, "(if_statement condition: (expression))",), Err(QueryError { kind: QueryErrorKind::Structure, row: 0, offset: 14, column: 14, message: [ - "(if_statement condition: (_expression))", // + "(if_statement condition: (expression))", // " ^", ] .join("\n") @@ -1726,7 +1726,7 @@ fn test_query_matches_with_too_many_permutations_to_track() { collect_matches(matches, &query, source.as_str())[0], (0, vec![("pre", "hello"), ("post", "hello")]), ); - assert_eq!(cursor.did_exceed_match_limit(), true); + assert!(cursor.did_exceed_match_limit()); }); } @@ -1775,7 +1775,7 @@ fn test_query_sibling_patterns_dont_match_children_of_an_error() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, 
None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let matches = cursor.matches(&query, tree.root_node(), source.as_bytes()); assert_eq!( @@ -1825,7 +1825,7 @@ fn test_query_matches_with_alternatives_and_too_many_permutations_to_track() { collect_matches(matches, &query, source.as_str()), vec![(1, vec![("method", "b")]); 50], ); - assert_eq!(cursor.did_exceed_match_limit(), true); + assert!(cursor.did_exceed_match_limit()); }); } @@ -1956,7 +1956,7 @@ fn test_query_matches_within_byte_range() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); @@ -2086,7 +2086,7 @@ fn test_query_captures_within_byte_range() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let captures = @@ -2122,7 +2122,7 @@ fn test_query_matches_with_unrooted_patterns_intersecting_byte_range() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); // within the type parameter list @@ -2260,14 +2260,14 @@ fn test_query_captures_within_byte_range_assigned_after_iterating() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let mut captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); // Retrieve some captures let mut results = Vec::new(); for (mat, capture_ix) in captures.by_ref().take(5) { - let capture = mat.captures[capture_ix as usize]; + let capture = mat.captures[capture_ix]; results.push(( 
query.capture_names()[capture.index as usize], &source[capture.node.byte_range()], @@ -2290,7 +2290,7 @@ fn test_query_captures_within_byte_range_assigned_after_iterating() { results.clear(); captures.set_byte_range(source.find("Ok").unwrap()..source.len()); for (mat, capture_ix) in captures { - let capture = mat.captures[capture_ix as usize]; + let capture = mat.captures[capture_ix]; results.push(( query.capture_names()[capture.index as usize], &source[capture.node.byte_range()], @@ -2393,7 +2393,7 @@ fn test_query_matches_different_queries_same_cursor() { let mut cursor = QueryCursor::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let matches = cursor.matches(&query1, tree.root_node(), source.as_bytes()); assert_eq!( @@ -2436,7 +2436,7 @@ fn test_query_matches_with_multiple_captures_on_a_node() { let mut cursor = QueryCursor::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let matches = cursor.matches(&query, tree.root_node(), source.as_bytes()); assert_eq!( @@ -2524,7 +2524,7 @@ fn test_query_matches_with_captured_wildcard_at_root() { let mut parser = Parser::new(); let mut cursor = QueryCursor::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let match_capture_names_and_rows = cursor .matches(&query, tree.root_node(), source.as_bytes()) @@ -2790,7 +2790,7 @@ fn test_query_captures_basic() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let matches = cursor.matches(&query, tree.root_node(), source.as_bytes()); @@ -2873,7 +2873,7 @@ fn test_query_captures_with_text_conditions() { let mut parser = 
Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); @@ -3019,7 +3019,7 @@ fn test_query_captures_with_duplicates() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); @@ -3221,11 +3221,11 @@ fn test_query_captures_with_too_many_nested_results() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); cursor.set_match_limit(32); let captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); - let captures = collect_captures(captures, &query, &source); + let captures = collect_captures(captures, &query, source); assert_eq!( &captures[0..4], @@ -3284,7 +3284,7 @@ fn test_query_captures_with_definite_pattern_containing_many_nested_matches() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); @@ -3320,7 +3320,7 @@ fn test_query_captures_ordered_by_both_start_and_end_positions() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); @@ -3361,7 +3361,7 @@ fn 
test_query_captures_with_matches_removed() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let mut captured_strings = Vec::new(); @@ -3405,7 +3405,7 @@ fn test_query_captures_with_matches_removed_before_they_finish() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let mut captured_strings = Vec::new(); @@ -3447,7 +3447,7 @@ fn test_query_captures_and_matches_iterators_are_fused() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let mut captures = cursor.captures(&query, tree.root_node(), source.as_bytes()); @@ -3521,7 +3521,7 @@ fn test_query_text_callback_returns_chunks() { let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); let mut cursor = QueryCursor::new(); let captures = cursor.captures(&query, tree.root_node(), |node: Node| { chunks_in_range(node.byte_range()) @@ -3619,7 +3619,7 @@ fn test_query_lifetime_is_separate_from_nodes_lifetime() { let language = get_language("javascript"); let mut parser = Parser::new(); parser.set_language(language).unwrap(); - let tree = parser.parse(&source, None).unwrap(); + let tree = parser.parse(source, None).unwrap(); fn take_first_node_from_captures<'tree>( source: &str, @@ -3932,10 +3932,10 @@ fn test_query_is_pattern_guaranteed_at_step() { Row { description: "a guaranteed step with a field", language: get_language("javascript"), - pattern: r#"(binary_expression left: (identifier) right: (_))"#, + pattern: 
r#"(binary_expression left: (expression) right: (_))"#, results_by_substring: &[ ("binary_expression", false), - ("(identifier)", false), + ("(expression)", false), ("(_)", true), ], }, @@ -4002,7 +4002,7 @@ fn test_query_is_pattern_guaranteed_at_step() { "#, results_by_substring: &[ ("identifier", false), - ("property_identifier", true), + ("property_identifier", false), ("[", true), ], }, diff --git a/cli/src/tests/test_highlight_test.rs b/cli/src/tests/test_highlight_test.rs index d9b2c43a..06ad7d59 100644 --- a/cli/src/tests/test_highlight_test.rs +++ b/cli/src/tests/test_highlight_test.rs @@ -12,7 +12,7 @@ fn test_highlight_test_with_basic_test() { Some("injections.scm"), &[ "function".to_string(), - "variable.parameter".to_string(), + "variable".to_string(), "keyword".to_string(), ], ); @@ -22,7 +22,7 @@ fn test_highlight_test_with_basic_test() { " // ^ function", " // ^ keyword", " return d + e;", - " // ^ variable.parameter", + " // ^ variable", " // ^ !variable", "};", ] @@ -35,7 +35,7 @@ fn test_highlight_test_with_basic_test() { &[ Assertion::new(1, 5, false, String::from("function")), Assertion::new(1, 11, false, String::from("keyword")), - Assertion::new(4, 9, false, String::from("variable.parameter")), + Assertion::new(4, 9, false, String::from("variable")), Assertion::new(4, 11, true, String::from("variable")), ] ); @@ -53,6 +53,7 @@ fn test_highlight_test_with_basic_test() { (Point::new(1, 19), Point::new(1, 20), Highlight(1)), // "d" (Point::new(4, 2), Point::new(4, 8), Highlight(2)), // "return" (Point::new(4, 9), Point::new(4, 10), Highlight(1)), // "d" + (Point::new(4, 13), Point::new(4, 14), Highlight(1)), // "e" ] ); } diff --git a/script/fetch-fixtures b/script/fetch-fixtures index eb66d314..1eec16ee 100755 --- a/script/fetch-fixtures +++ b/script/fetch-fixtures @@ -23,12 +23,12 @@ fetch_grammar() { fetch_grammar bash master fetch_grammar c master -fetch_grammar cpp 670404d7c689be1c868a46f919ba2a3912f2b7ef +fetch_grammar cpp master 
fetch_grammar embedded-template master fetch_grammar go master fetch_grammar html master fetch_grammar java master -fetch_grammar javascript partial-order-precedences +fetch_grammar javascript master fetch_grammar jsdoc master fetch_grammar json master fetch_grammar php master diff --git a/test/fixtures/error_corpus/javascript_errors.txt b/test/fixtures/error_corpus/javascript_errors.txt index 4359ae68..e2f21176 100644 --- a/test/fixtures/error_corpus/javascript_errors.txt +++ b/test/fixtures/error_corpus/javascript_errors.txt @@ -74,8 +74,8 @@ if ({a: 'b'} {c: 'd'}) { (program (if_statement (parenthesized_expression - (ERROR (object (pair (property_identifier) (string)))) - (object (pair (property_identifier) (string)))) + (ERROR (object (pair (property_identifier) (string (string_fragment))))) + (object (pair (property_identifier) (string (string_fragment))))) (statement_block (expression_statement (assignment_expression @@ -178,12 +178,12 @@ function main(x) { (expression_statement (call_expression (member_expression (identifier) (property_identifier)) - (arguments (string)))) + (arguments (string (string_fragment))))) (expression_statement (binary_expression (identifier) (ERROR) (call_expression (member_expression (identifier) (property_identifier)) - (arguments (string))))) + (arguments (string (string_fragment)))))) (return_statement (object))))) From cc6689534323ad0f142250ed553fb6469ff34bb3 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Thu, 21 Sep 2023 00:52:50 -0400 Subject: [PATCH 337/347] perf: cache the current language configuration to lookup later on --- Cargo.toml | 4 +++ cli/loader/src/lib.rs | 64 +++++++++++++++++++++++-------------------- 2 files changed, 39 insertions(+), 29 deletions(-) diff --git a/Cargo.toml b/Cargo.toml index 03e24caf..bc2aedaa 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -15,3 +15,7 @@ codegen-units = 1 # Maximum size reduction optimizations. [profile.size] inherits = "release" opt-level = "s" # Optimize for size. 
+ +[profile.profile] +inherits = "release" +strip = false diff --git a/cli/loader/src/lib.rs b/cli/loader/src/lib.rs index d260a96c..ed9c5f39 100644 --- a/cli/loader/src/lib.rs +++ b/cli/loader/src/lib.rs @@ -70,12 +70,12 @@ impl Config { } #[cfg(unix)] -const DYLIB_EXTENSION: &'static str = "so"; +const DYLIB_EXTENSION: &str = "so"; #[cfg(windows)] const DYLIB_EXTENSION: &'static str = "dll"; -const BUILD_TARGET: &'static str = env!("BUILD_TARGET"); +const BUILD_TARGET: &str = env!("BUILD_TARGET"); pub struct LanguageConfiguration<'a> { pub scope: Option, @@ -101,6 +101,7 @@ pub struct Loader { languages_by_id: Vec<(PathBuf, OnceCell)>, language_configurations: Vec>, language_configuration_ids_by_file_type: HashMap>, + language_configuration_in_current_path: Option, highlight_names: Box>>, use_all_highlight_names: bool, debug_build: bool, @@ -127,13 +128,14 @@ impl Loader { languages_by_id: Vec::new(), language_configurations: Vec::new(), language_configuration_ids_by_file_type: HashMap::new(), + language_configuration_in_current_path: None, highlight_names: Box::new(Mutex::new(Vec::new())), use_all_highlight_names: true, debug_build: false, } } - pub fn configure_highlights(&mut self, names: &Vec) { + pub fn configure_highlights(&mut self, names: &[String]) { self.use_all_highlight_names = false; let mut highlights = self.highlight_names.lock().unwrap(); highlights.clear(); @@ -149,8 +151,7 @@ impl Loader { eprintln!("Warning: You have not configured any parser directories!"); eprintln!("Please run `tree-sitter init-config` and edit the resulting"); eprintln!("configuration file to indicate where we should look for"); - eprintln!("language grammars."); - eprintln!(""); + eprintln!("language grammars.\n"); } for parser_container_dir in &config.parser_directories { if let Ok(entries) = fs::read_dir(parser_container_dir) { @@ -160,6 +161,7 @@ impl Loader { if parser_dir_name.starts_with("tree-sitter-") { self.find_language_configurations_at_path( 
&parser_container_dir.join(parser_dir_name), + false, ) .ok(); } @@ -171,7 +173,7 @@ impl Loader { } pub fn languages_at_path(&mut self, path: &Path) -> Result> { - if let Ok(configurations) = self.find_language_configurations_at_path(path) { + if let Ok(configurations) = self.find_language_configurations_at_path(path, true) { let mut language_ids = configurations .iter() .map(|c| c.language_id) @@ -342,7 +344,7 @@ impl Loader { self.load_language_from_sources( &grammar_json.name, - &header_path, + header_path, &parser_path, scanner_path.as_deref(), ) @@ -362,7 +364,7 @@ impl Loader { let mut library_path = self.parser_lib_path.join(lib_name); library_path.set_extension(DYLIB_EXTENSION); - let recompile = needs_recompile(&library_path, &parser_path, scanner_path) + let recompile = needs_recompile(&library_path, parser_path, scanner_path) .with_context(|| "Failed to compare source and binary timestamps")?; if recompile { @@ -382,7 +384,7 @@ impl Loader { } if compiler.is_like_msvc() { - command.args(&["/nologo", "/LD", "/I"]).arg(header_path); + command.args(["/nologo", "/LD", "/I"]).arg(header_path); if self.debug_build { command.arg("/Od"); } else { @@ -514,24 +516,20 @@ impl Loader { } } - pub fn find_language_configurations_at_path<'a>( - &'a mut self, + pub fn find_language_configurations_at_path( + &mut self, parser_path: &Path, + set_current_path_config: bool, ) -> Result<&[LanguageConfiguration]> { - #[derive(Deserialize)] + #[derive(Default, Deserialize)] #[serde(untagged)] enum PathsJSON { + #[default] Empty, Single(String), Multiple(Vec), } - impl Default for PathsJSON { - fn default() -> Self { - PathsJSON::Empty - } - } - impl PathsJSON { fn into_vec(self) -> Option> { match self { @@ -614,7 +612,7 @@ impl Loader { let configuration = LanguageConfiguration { root_path: parser_path.to_path_buf(), - language_name: grammar_json.name, + language_name: grammar_json.name.clone(), scope: config_json.scope, language_id, file_types: 
config_json.file_types.unwrap_or(Vec::new()), @@ -627,19 +625,26 @@ impl Loader { highlights_filenames: config_json.highlights.into_vec(), highlight_config: OnceCell::new(), tags_config: OnceCell::new(), - highlight_names: &*self.highlight_names, + highlight_names: &self.highlight_names, use_all_highlight_names: self.use_all_highlight_names, }; for file_type in &configuration.file_types { self.language_configuration_ids_by_file_type .entry(file_type.to_string()) - .or_insert(Vec::new()) + .or_default() .push(self.language_configurations.len()); } self.language_configurations .push(unsafe { mem::transmute(configuration) }); + + if set_current_path_config + && self.language_configuration_in_current_path.is_none() + { + self.language_configuration_in_current_path = + Some(self.language_configurations.len() - 1); + } } } } @@ -668,7 +673,7 @@ impl Loader { tags_filenames: None, highlight_config: OnceCell::new(), tags_config: OnceCell::new(), - highlight_names: &*self.highlight_names, + highlight_names: &self.highlight_names, use_all_highlight_names: self.use_all_highlight_names, }; self.language_configurations @@ -693,11 +698,11 @@ impl Loader { if let Some(scope) = scope { if let Some(config) = self .language_configuration_for_scope(scope) - .with_context(|| format!("Failed to load language for scope '{}'", scope))? + .with_context(|| format!("Failed to load language for scope '{scope}'"))? { Ok(config.0) } else { - return Err(anyhow!("Unknown scope '{}'", scope)); + Err(anyhow!("Unknown scope '{scope}'")) } } else if let Some((lang, _)) = self .language_configuration_for_file_name(path) @@ -709,8 +714,10 @@ impl Loader { })? { Ok(lang) + } else if let Some(id) = self.language_configuration_in_current_path { + Ok(self.language_for_id(self.language_configurations[id].language_id)?) } else if let Some(lang) = self - .languages_at_path(¤t_dir) + .languages_at_path(current_dir) .with_context(|| "Failed to load language in current directory")? 
.first() .cloned() @@ -833,7 +840,7 @@ impl<'a> LanguageConfiguration<'a> { } } } - result.configure(&all_highlight_names.as_slice()); + result.configure(all_highlight_names.as_slice()); Ok(Some(result)) } }) @@ -869,7 +876,6 @@ impl<'a> LanguageConfiguration<'a> { locals_query.len(), ) } - .into() } else { error.into() } @@ -879,9 +885,9 @@ impl<'a> LanguageConfiguration<'a> { .map(Option::as_ref) } - fn include_path_in_query_error<'b>( + fn include_path_in_query_error( mut error: QueryError, - ranges: &'b Vec<(String, Range)>, + ranges: &[(String, Range)], source: &str, start_offset: usize, ) -> Error { From dd52cafdd9537c93bb2d77d68385dab47934d9f5 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 21 Sep 2023 11:28:22 +0300 Subject: [PATCH 338/347] chore: switch fetch-fixtures.cmd to all master branches --- script/fetch-fixtures.cmd | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/script/fetch-fixtures.cmd b/script/fetch-fixtures.cmd index 5e8b6a16..32727b0c 100644 --- a/script/fetch-fixtures.cmd +++ b/script/fetch-fixtures.cmd @@ -2,12 +2,12 @@ call:fetch_grammar bash master call:fetch_grammar c master -call:fetch_grammar cpp 670404d7c689be1c868a46f919ba2a3912f2b7ef +call:fetch_grammar cpp master call:fetch_grammar embedded-template master call:fetch_grammar go master call:fetch_grammar html master call:fetch_grammar java master -call:fetch_grammar javascript partial-order-precedences +call:fetch_grammar javascript master call:fetch_grammar jsdoc master call:fetch_grammar json master call:fetch_grammar php master From 82ddb3ddcc30dd557695d02b189ca17ef1993374 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 5 Oct 2023 07:59:35 +0300 Subject: [PATCH 339/347] cicd: add skips for fragile corpus tests --- cli/src/tests/corpus_test.rs | 59 ++++++++++++++++++++++-------------- 1 file changed, 36 insertions(+), 23 deletions(-) diff --git a/cli/src/tests/corpus_test.rs b/cli/src/tests/corpus_test.rs index 6b2f2a20..ce89743b 100644 
--- a/cli/src/tests/corpus_test.rs +++ b/cli/src/tests/corpus_test.rs @@ -14,71 +14,81 @@ use crate::{ test::{parse_tests, print_diff, print_diff_key, strip_sexp_fields, TestEntry}, util, }; -use std::{env, fs}; +use std::{collections::HashSet, env, fs}; use tree_sitter::{LogType, Node, Parser, Point, Range, Tree}; use tree_sitter_proc_macro::test_with_seed; #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_bash(seed: usize) { - test_language_corpus(seed, "bash"); + test_language_corpus( + "bash", + seed, + Some(&[ + // Fragile tests where edit customization changes + // lead to significant parse tree structure changes. + "bash - corpus - commands - Nested Heredocs", + "bash - corpus - commands - Quoted Heredocs", + "bash - corpus - commands - Heredocs with weird characters", + ]), + ); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_c(seed: usize) { - test_language_corpus(seed, "c"); + test_language_corpus("c", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_cpp(seed: usize) { - test_language_corpus(seed, "cpp"); + test_language_corpus("cpp", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_embedded_template(seed: usize) { - test_language_corpus(seed, "embedded-template"); + test_language_corpus("embedded-template", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_go(seed: usize) { - test_language_corpus(seed, "go"); + test_language_corpus("go", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_html(seed: usize) { - test_language_corpus(seed, "html"); + test_language_corpus("html", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_javascript(seed: usize) { - test_language_corpus(seed, "javascript"); + test_language_corpus("javascript", seed, None); } 
#[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_json(seed: usize) { - test_language_corpus(seed, "json"); + test_language_corpus("json", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_php(seed: usize) { - test_language_corpus(seed, "php"); + test_language_corpus("php", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_python(seed: usize) { - test_language_corpus(seed, "python"); + test_language_corpus("python", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_ruby(seed: usize) { - test_language_corpus(seed, "ruby"); + test_language_corpus("ruby", seed, None); } #[test_with_seed(retry=10, seed=*START_SEED, seed_fn=new_seed)] fn test_corpus_for_rust(seed: usize) { - test_language_corpus(seed, "rust"); + test_language_corpus("rust", seed, None); } -fn test_language_corpus(start_seed: usize, language_name: &str) { +fn test_language_corpus(language_name: &str, start_seed: usize, skipped: Option<&[&str]>) { let grammars_dir = fixtures_dir().join("grammars"); let error_corpus_dir = fixtures_dir().join("error_corpus"); let template_corpus_dir = fixtures_dir().join("template_corpus"); @@ -100,6 +110,8 @@ fn test_language_corpus(start_seed: usize, language_name: &str) { t })); + let skipped = skipped.map(|x| HashSet::<&str>::from_iter(x.iter().map(|x| *x))); + let language = get_language(language_name); let mut failure_count = 0; @@ -112,7 +124,14 @@ fn test_language_corpus(start_seed: usize, language_name: &str) { println!(); for (test_index, test) in tests.iter().enumerate() { - let test_name = format!("{language_name} example - {}", test.name); + let test_name = format!("{language_name} - {}", test.name); + + if let Some(skipped) = skipped.as_ref() { + if skipped.contains(test_name.as_str()) { + println!(" {test_index}. {test_name} - SKIPPED"); + continue; + } + } println!(" {test_index}. 
{test_name}"); @@ -129,10 +148,7 @@ fn test_language_corpus(start_seed: usize, language_name: &str) { } if actual_output != test.output { - println!( - "Incorrect initial parse for {} - {}", - language_name, test.name, - ); + println!("Incorrect initial parse for {test_name}"); print_diff_key(); print_diff(&actual_output, &test.output); println!(""); @@ -219,10 +235,7 @@ fn test_language_corpus(start_seed: usize, language_name: &str) { } if actual_output != test.output { - println!( - "Incorrect parse for {} - {} - seed {}", - language_name, test.name, seed - ); + println!("Incorrect parse for {test_name} - seed {seed}"); print_diff_key(); print_diff(&actual_output, &test.output); println!(""); From d95836eb35872d7eec4f3b7a4e1dd709a814391a Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Thu, 5 Oct 2023 14:39:36 +0300 Subject: [PATCH 340/347] cicd: add en extra check for non matchable skips --- cli/src/tests/corpus_test.rs | 22 +++++++++++++++++----- 1 file changed, 17 insertions(+), 5 deletions(-) diff --git a/cli/src/tests/corpus_test.rs b/cli/src/tests/corpus_test.rs index ce89743b..8a4c54cc 100644 --- a/cli/src/tests/corpus_test.rs +++ b/cli/src/tests/corpus_test.rs @@ -14,7 +14,7 @@ use crate::{ test::{parse_tests, print_diff, print_diff_key, strip_sexp_fields, TestEntry}, util, }; -use std::{collections::HashSet, env, fs}; +use std::{collections::HashMap, env, fs}; use tree_sitter::{LogType, Node, Parser, Point, Range, Tree}; use tree_sitter_proc_macro::test_with_seed; @@ -110,7 +110,7 @@ fn test_language_corpus(language_name: &str, start_seed: usize, skipped: Option< t })); - let skipped = skipped.map(|x| HashSet::<&str>::from_iter(x.iter().map(|x| *x))); + let mut skipped = skipped.map(|x| HashMap::<&str, usize>::from_iter(x.iter().map(|x| (*x, 0)))); let language = get_language(language_name); let mut failure_count = 0; @@ -125,10 +125,10 @@ fn test_language_corpus(language_name: &str, start_seed: usize, skipped: Option< println!(); for (test_index, 
test) in tests.iter().enumerate() { let test_name = format!("{language_name} - {}", test.name); - - if let Some(skipped) = skipped.as_ref() { - if skipped.contains(test_name.as_str()) { + if let Some(skipped) = skipped.as_mut() { + if let Some(counter) = skipped.get_mut(test_name.as_str()) { println!(" {test_index}. {test_name} - SKIPPED"); + *counter += 1; continue; } } @@ -262,6 +262,18 @@ fn test_language_corpus(language_name: &str, start_seed: usize, skipped: Option< if failure_count > 0 { panic!("{} {} corpus tests failed", failure_count, language_name); } + + if let Some(skipped) = skipped.as_mut() { + skipped.retain(|_, v| *v == 0); + + if skipped.len() > 0 { + println!("Non matchable skip definitions:"); + for k in skipped.keys() { + println!(" {k}"); + } + panic!("Non matchable skip definitions needs to be removed"); + } + } } #[test] From c63f1680adb6237cba4a372146497e2e4757c174 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 4 Oct 2023 11:20:18 +0300 Subject: [PATCH 341/347] chore(rust): improve perf for position funcs --- Cargo.lock | 5 +++-- cli/Cargo.toml | 1 + cli/src/parse.rs | 44 ++++++++++++++++++++++++-------------------- 3 files changed, 28 insertions(+), 22 deletions(-) diff --git a/Cargo.lock b/Cargo.lock index 80a4e28d..be8829ac 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -469,9 +469,9 @@ dependencies = [ [[package]] name = "memchr" -version = "2.5.0" +version = "2.6.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2dffe52ecf27772e601905b7522cb4ef790d2cc203488bbd0e2fe85fcb74566d" +checksum = "f665ee40bc4a3c5590afb1e9677db74a508659dfd71e126420da8274909a0167" [[package]] name = "minimal-lexical" @@ -941,6 +941,7 @@ dependencies = [ "indoc", "lazy_static", "log", + "memchr", "path-slash", "pretty_assertions", "rand", diff --git a/cli/Cargo.toml b/cli/Cargo.toml index 0edd3c3d..e62c443a 100644 --- a/cli/Cargo.toml +++ b/cli/Cargo.toml @@ -32,6 +32,7 @@ glob = "0.3.1" html-escape = "0.2.13" indexmap = 
"2.0.0" lazy_static = "1.4.0" +memchr = "2.6.3" path-slash = "0.2.1" regex = "1.9.1" regex-syntax = "0.7.4" diff --git a/cli/src/parse.rs b/cli/src/parse.rs index 5b1a4b31..30ddd238 100644 --- a/cli/src/parse.rs +++ b/cli/src/parse.rs @@ -370,31 +370,35 @@ fn parse_edit_flag(source_code: &Vec, flag: &str) -> Result { }) } -fn offset_for_position(input: &Vec, position: Point) -> usize { - let mut current_position = Point { row: 0, column: 0 }; - for (i, c) in input.iter().enumerate() { - if *c as char == '\n' { - current_position.row += 1; - current_position.column = 0; - } else { - current_position.column += 1; - } - if current_position > position { - return i; +fn offset_for_position(input: &[u8], position: Point) -> usize { + let mut row = 0; + let mut offset = 0; + let mut iter = memchr::memchr_iter(b'\n', input); + loop { + if let Some(pos) = iter.next() { + if row < position.row { + row += 1; + offset = pos; + continue; + } } + offset += 1; + break; } - return input.len(); + offset + position.column } -fn position_for_offset(input: &Vec, offset: usize) -> Point { +fn position_for_offset(input: &[u8], offset: usize) -> Point { let mut result = Point { row: 0, column: 0 }; - for c in &input[0..offset] { - if *c as char == '\n' { - result.row += 1; - result.column = 0; - } else { - result.column += 1; - } + let mut last = 0; + for pos in memchr::memchr_iter(b'\n', &input[..offset]) { + result.row += 1; + last = pos; } + result.column = if result.row > 0 { + offset - last - 1 + } else { + offset + }; result } From a5a75648189612bc15138d92331e98c96f87a748 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Wed, 4 Oct 2023 11:21:48 +0300 Subject: [PATCH 342/347] chore(rust): add error reporting for position funcs --- cli/src/parse.rs | 35 ++++++++++++++++++++++++----------- cli/src/tests/corpus_test.rs | 4 ++-- cli/src/tests/node_test.rs | 2 +- cli/src/tests/parser_test.rs | 13 ++++++++----- cli/src/tests/tree_test.rs | 2 +- 5 files changed, 36 insertions(+), 20 
deletions(-) diff --git a/cli/src/parse.rs b/cli/src/parse.rs index 30ddd238..68279361 100644 --- a/cli/src/parse.rs +++ b/cli/src/parse.rs @@ -115,7 +115,7 @@ pub fn parse_file_at_path(opts: ParseFileOptions) -> Result { for (i, edit) in opts.edits.iter().enumerate() { let edit = parse_edit_flag(&source_code, edit)?; - perform_edit(&mut tree, &mut source_code, &edit); + perform_edit(&mut tree, &mut source_code, &edit)?; tree = parser.parse(&source_code, Some(&tree)).unwrap(); if opts.debug_graph { @@ -309,14 +309,14 @@ pub fn parse_file_at_path(opts: ParseFileOptions) -> Result { Ok(false) } -pub fn perform_edit(tree: &mut Tree, input: &mut Vec, edit: &Edit) -> InputEdit { +pub fn perform_edit(tree: &mut Tree, input: &mut Vec, edit: &Edit) -> Result { let start_byte = edit.position; let old_end_byte = edit.position + edit.deleted_length; let new_end_byte = edit.position + edit.inserted_text.len(); - let start_position = position_for_offset(input, start_byte); - let old_end_position = position_for_offset(input, old_end_byte); + let start_position = position_for_offset(input, start_byte)?; + let old_end_position = position_for_offset(input, old_end_byte)?; input.splice(start_byte..old_end_byte, edit.inserted_text.iter().cloned()); - let new_end_position = position_for_offset(input, new_end_byte); + let new_end_position = position_for_offset(input, new_end_byte)?; let edit = InputEdit { start_byte, old_end_byte, @@ -326,7 +326,7 @@ pub fn perform_edit(tree: &mut Tree, input: &mut Vec, edit: &Edit) -> InputE new_end_position, }; tree.edit(&edit); - edit + Ok(edit) } fn parse_edit_flag(source_code: &Vec, flag: &str) -> Result { @@ -355,7 +355,7 @@ fn parse_edit_flag(source_code: &Vec, flag: &str) -> Result { let row = usize::from_str_radix(row, 10).map_err(|_| error())?; let column = parts.next().ok_or_else(error)?; let column = usize::from_str_radix(column, 10).map_err(|_| error())?; - offset_for_position(source_code, Point { row, column }) + 
offset_for_position(source_code, Point { row, column })? } else { usize::from_str_radix(position, 10).map_err(|_| error())? }; @@ -370,7 +370,7 @@ fn parse_edit_flag(source_code: &Vec, flag: &str) -> Result { }) } -fn offset_for_position(input: &[u8], position: Point) -> usize { +pub fn offset_for_position(input: &[u8], position: Point) -> Result { let mut row = 0; let mut offset = 0; let mut iter = memchr::memchr_iter(b'\n', input); @@ -385,10 +385,23 @@ fn offset_for_position(input: &[u8], position: Point) -> usize { offset += 1; break; } - offset + position.column + if position.row - row > 0 { + return Err(anyhow!("Failed to address a row: {}", position.row)); + } + if let Some(pos) = iter.next() { + if (pos - offset < position.column) || (input[offset] == b'\n' && position.column > 0) { + return Err(anyhow!("Failed to address a column: {}", position.column)); + }; + } else if input.len() - offset < position.column { + return Err(anyhow!("Failed to address a column over the end")); + } + Ok(offset + position.column) } -fn position_for_offset(input: &[u8], offset: usize) -> Point { +pub fn position_for_offset(input: &[u8], offset: usize) -> Result { + if offset > input.len() { + return Err(anyhow!("Failed to address an offset: {offset}")); + } let mut result = Point { row: 0, column: 0 }; let mut last = 0; for pos in memchr::memchr_iter(b'\n', &input[..offset]) { @@ -400,5 +413,5 @@ fn position_for_offset(input: &[u8], offset: usize) -> Point { } else { offset }; - result + Ok(result) } diff --git a/cli/src/tests/corpus_test.rs b/cli/src/tests/corpus_test.rs index 8a4c54cc..589b1839 100644 --- a/cli/src/tests/corpus_test.rs +++ b/cli/src/tests/corpus_test.rs @@ -187,7 +187,7 @@ fn test_language_corpus(language_name: &str, start_seed: usize, skipped: Option< for _ in 0..1 + rand.unsigned(*EDIT_COUNT) { let edit = get_random_edit(&mut rand, &input); undo_stack.push(invert_edit(&input, &edit)); - perform_edit(&mut tree, &mut input, &edit); + perform_edit(&mut tree, 
&mut input, &edit).unwrap(); } if log_seed { @@ -219,7 +219,7 @@ fn test_language_corpus(language_name: &str, start_seed: usize, skipped: Option< // Undo all of the edits and re-parse again. while let Some(edit) = undo_stack.pop() { - perform_edit(&mut tree2, &mut input, &edit); + perform_edit(&mut tree2, &mut input, &edit).unwrap(); } if *LOG_GRAPH_ENABLED { eprintln!("{}\n", String::from_utf8_lossy(&input)); diff --git a/cli/src/tests/node_test.rs b/cli/src/tests/node_test.rs index 43b3d66b..c4548d3e 100644 --- a/cli/src/tests/node_test.rs +++ b/cli/src/tests/node_test.rs @@ -552,7 +552,7 @@ fn test_node_edit() { let edit = get_random_edit(&mut rand, &mut code); let mut tree2 = tree.clone(); - let edit = perform_edit(&mut tree2, &mut code, &edit); + let edit = perform_edit(&mut tree2, &mut code, &edit).unwrap(); for node in nodes_before.iter_mut() { node.edit(&edit); } diff --git a/cli/src/tests/parser_test.rs b/cli/src/tests/parser_test.rs index 99616f56..434a81f9 100644 --- a/cli/src/tests/parser_test.rs +++ b/cli/src/tests/parser_test.rs @@ -342,7 +342,8 @@ fn test_parsing_after_editing_beginning_of_code() { deleted_length: 0, inserted_text: b" || 5".to_vec(), }, - ); + ) + .unwrap(); let mut recorder = ReadRecorder::new(&code); let tree = parser @@ -389,7 +390,8 @@ fn test_parsing_after_editing_end_of_code() { deleted_length: 0, inserted_text: b".d".to_vec(), }, - ); + ) + .unwrap(); let mut recorder = ReadRecorder::new(&code); let tree = parser @@ -464,7 +466,8 @@ h + i deleted_length: 0, inserted_text: b"1234".to_vec(), }, - ); + ) + .unwrap(); assert_eq!( code, @@ -528,12 +531,12 @@ fn test_parsing_after_detecting_error_in_the_middle_of_a_string_token() { let undo = invert_edit(&source, &edit); let mut tree2 = tree.clone(); - perform_edit(&mut tree2, &mut source, &edit); + perform_edit(&mut tree2, &mut source, &edit).unwrap(); tree2 = parser.parse(&source, Some(&tree2)).unwrap(); assert!(tree2.root_node().has_error()); let mut tree3 = tree2.clone(); - 
perform_edit(&mut tree3, &mut source, &undo); + perform_edit(&mut tree3, &mut source, &undo).unwrap(); tree3 = parser.parse(&source, Some(&tree3)).unwrap(); assert_eq!(tree3.root_node().to_sexp(), tree.root_node().to_sexp(),); } diff --git a/cli/src/tests/tree_test.rs b/cli/src/tests/tree_test.rs index 7d091c3f..c63b588b 100644 --- a/cli/src/tests/tree_test.rs +++ b/cli/src/tests/tree_test.rs @@ -663,7 +663,7 @@ fn get_changed_ranges( source_code: &mut Vec, edit: Edit, ) -> Vec { - perform_edit(tree, source_code, &edit); + perform_edit(tree, source_code, &edit).unwrap(); let new_tree = parser.parse(&source_code, Some(tree)).unwrap(); let result = tree.changed_ranges(&new_tree).collect(); *tree = new_tree; From a91a6cc61508a518fd5ff93843cce5bdb5e1c19b Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 16 Oct 2023 16:13:40 +0300 Subject: [PATCH 343/347] cicd: disable failed `linux-riscv64gc` target Related issue #2712 --- .github/workflows/build.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml index 05c08d2c..77dbb9df 100644 --- a/.github/workflows/build.yml +++ b/.github/workflows/build.yml @@ -48,7 +48,7 @@ jobs: - linux-powerpc # - linux-powerpc64 # - linux-powerpc64el # - - linux-riscv64gc # + # - linux-riscv64gc # #2712 - linux-s390x # - linux-sparc64 # - linux-thumbv7neon # @@ -77,7 +77,7 @@ jobs: - { platform: linux-powerpc , target: powerpc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - { platform: linux-powerpc64 , target: powerpc64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - { platform: linux-powerpc64el , target: powerpc64le-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - - { platform: linux-riscv64gc , target: riscv64gc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } + # - { platform: linux-riscv64gc , target: riscv64gc-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } #2712 - { platform: linux-s390x , 
target: s390x-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - { platform: linux-sparc64 , target: sparc64-unknown-linux-gnu , os: ubuntu-latest , use-cross: true } - { platform: linux-thumbv7neon , target: thumbv7neon-unknown-linux-gnueabihf , os: ubuntu-latest , use-cross: true } @@ -102,7 +102,7 @@ jobs: - { platform: linux-powerpc , cc: powerpc-linux-gnu-gcc , ar: powerpc-linux-gnu-ar } - { platform: linux-powerpc64 , cc: powerpc64-linux-gnu-gcc , ar: powerpc64-linux-gnu-ar } - { platform: linux-powerpc64el , cc: powerpc64le-linux-gnu-gcc , ar: powerpc64le-linux-gnu-ar } - - { platform: linux-riscv64gc , cc: riscv64-linux-gnu-gcc , ar: riscv64-linux-gnu-ar } + # - { platform: linux-riscv64gc , cc: riscv64-linux-gnu-gcc , ar: riscv64-linux-gnu-ar } #2712 - { platform: linux-s390x , cc: s390x-linux-gnu-gcc , ar: s390x-linux-gnu-ar } - { platform: linux-sparc64 , cc: sparc64-linux-gnu-gcc , ar: sparc64-linux-gnu-ar } - { platform: linux-thumbv7neon , cc: arm-linux-gnueabihf-gcc , ar: arm-linux-gnueabihf-ar } From 5e62120050ae4db6adf07c3071641f36bcb62eb2 Mon Sep 17 00:00:00 2001 From: Andrew Hlynskyi Date: Mon, 16 Oct 2023 21:45:40 +0300 Subject: [PATCH 344/347] chore: fix local fixture test for C language --- test/fixtures/error_corpus/c_errors.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/fixtures/error_corpus/c_errors.txt b/test/fixtures/error_corpus/c_errors.txt index 4b507590..d44400cf 100644 --- a/test/fixtures/error_corpus/c_errors.txt +++ b/test/fixtures/error_corpus/c_errors.txt @@ -108,7 +108,7 @@ int main() { (function_declarator (identifier) (parameter_list)) (compound_statement (declaration (primitive_type) (identifier)) - (ERROR (primitive_type) (UNEXPECTED '$'))))) + (ERROR (primitive_type) (ERROR) (identifier) (UNEXPECTED '@'))))) ========================================= Extra values in parenthesized expressions From e265929f90b6c961466f96679d222c01b1d53bbf Mon Sep 17 00:00:00 2001 From: Daumantas Kavolis 
Date: Wed, 25 Oct 2023 10:19:03 +0300 Subject: [PATCH 345/347] Fix `goto_previous_sibling` with padded first children --- cli/src/tests/tree_test.rs | 30 ++++++++++++++++++++++++++++++ lib/src/tree_cursor.c | 6 +++++- 2 files changed, 35 insertions(+), 1 deletion(-) diff --git a/cli/src/tests/tree_test.rs b/cli/src/tests/tree_test.rs index c63b588b..161f65e9 100644 --- a/cli/src/tests/tree_test.rs +++ b/cli/src/tests/tree_test.rs @@ -376,6 +376,36 @@ fn test_tree_cursor() { assert_eq!(copy.node().kind(), "struct_item"); } +#[test] +fn test_tree_cursor_previous_sibling() { + let mut parser = Parser::new(); + parser.set_language(get_language("rust")).unwrap(); + + let text = " + // Hi there + // This is fun! + // Another one! +"; + let tree = parser.parse(text, None).unwrap(); + + let mut cursor = tree.walk(); + assert_eq!(cursor.node().kind(), "source_file"); + + assert!(cursor.goto_last_child()); + assert_eq!(cursor.node().kind(), "line_comment"); + assert_eq!(cursor.node().utf8_text(text.as_bytes()).unwrap(), "// Another one!"); + + assert!(cursor.goto_previous_sibling()); + assert_eq!(cursor.node().kind(), "line_comment"); + assert_eq!(cursor.node().utf8_text(text.as_bytes()).unwrap(), "// This is fun!"); + + assert!(cursor.goto_previous_sibling()); + assert_eq!(cursor.node().kind(), "line_comment"); + assert_eq!(cursor.node().utf8_text(text.as_bytes()).unwrap(), "// Hi there"); + + assert!(!cursor.goto_previous_sibling()); +} + #[test] fn test_tree_cursor_fields() { let mut parser = Parser::new(); diff --git a/lib/src/tree_cursor.c b/lib/src/tree_cursor.c index 25eca482..f08b9692 100644 --- a/lib/src/tree_cursor.c +++ b/lib/src/tree_cursor.c @@ -377,7 +377,11 @@ TreeCursorStep ts_tree_cursor_goto_previous_sibling_internal(TSTreeCursor *_self position = parent->position; uint32_t child_index = array_back(&self->stack)->child_index; const Subtree *children = ts_subtree_children((*(parent->subtree))); - for (uint32_t i = 0; i < child_index; ++i) { + + // skip first 
child padding since its position should match the position of the parent + if (child_index > 0) + position = length_add(position, ts_subtree_size(children[0])); + for (uint32_t i = 1; i < child_index; ++i) { position = length_add(position, ts_subtree_total_size(children[i])); } if (child_index > 0) From e26e23fd0e6baad6b5285ba1d990142b1f0ff1aa Mon Sep 17 00:00:00 2001 From: Daumantas Kavolis Date: Wed, 25 Oct 2023 10:24:35 +0300 Subject: [PATCH 346/347] Fix formatting --- cli/src/tests/tree_test.rs | 15 ++++++++++++--- 1 file changed, 12 insertions(+), 3 deletions(-) diff --git a/cli/src/tests/tree_test.rs b/cli/src/tests/tree_test.rs index 161f65e9..f3792138 100644 --- a/cli/src/tests/tree_test.rs +++ b/cli/src/tests/tree_test.rs @@ -393,15 +393,24 @@ fn test_tree_cursor_previous_sibling() { assert!(cursor.goto_last_child()); assert_eq!(cursor.node().kind(), "line_comment"); - assert_eq!(cursor.node().utf8_text(text.as_bytes()).unwrap(), "// Another one!"); + assert_eq!( + cursor.node().utf8_text(text.as_bytes()).unwrap(), + "// Another one!" + ); assert!(cursor.goto_previous_sibling()); assert_eq!(cursor.node().kind(), "line_comment"); - assert_eq!(cursor.node().utf8_text(text.as_bytes()).unwrap(), "// This is fun!"); + assert_eq!( + cursor.node().utf8_text(text.as_bytes()).unwrap(), + "// This is fun!" 
+ ); assert!(cursor.goto_previous_sibling()); assert_eq!(cursor.node().kind(), "line_comment"); - assert_eq!(cursor.node().utf8_text(text.as_bytes()).unwrap(), "// Hi there"); + assert_eq!( + cursor.node().utf8_text(text.as_bytes()).unwrap(), + "// Hi there" + ); assert!(!cursor.goto_previous_sibling()); } From 143ed959c9a4d591538413b59b935fdba1066a5c Mon Sep 17 00:00:00 2001 From: Daumantas Kavolis Date: Wed, 25 Oct 2023 10:47:55 +0300 Subject: [PATCH 347/347] Use single if block --- lib/src/tree_cursor.c | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/lib/src/tree_cursor.c b/lib/src/tree_cursor.c index f08b9692..63d22c8b 100644 --- a/lib/src/tree_cursor.c +++ b/lib/src/tree_cursor.c @@ -378,14 +378,14 @@ TreeCursorStep ts_tree_cursor_goto_previous_sibling_internal(TSTreeCursor *_self uint32_t child_index = array_back(&self->stack)->child_index; const Subtree *children = ts_subtree_children((*(parent->subtree))); - // skip first child padding since its position should match the position of the parent - if (child_index > 0) + if (child_index > 0) { + // skip first child padding since its position should match the position of the parent position = length_add(position, ts_subtree_size(children[0])); - for (uint32_t i = 1; i < child_index; ++i) { - position = length_add(position, ts_subtree_total_size(children[i])); - } - if (child_index > 0) + for (uint32_t i = 1; i < child_index; ++i) { + position = length_add(position, ts_subtree_total_size(children[i])); + } position = length_add(position, ts_subtree_padding(children[child_index])); + } array_back(&self->stack)->position = position;