From 3414d990001fc74d7fe44c1da2011a6385ab8132 Mon Sep 17 00:00:00 2001 From: Amaan Qureshi Date: Sun, 3 Mar 2024 21:23:35 -0500 Subject: [PATCH] feat: move delimiter parsing to the scanner Co-Authored-By: ObserverOfTime --- .github/workflows/ci.yml | 13 + Package.swift | 1 + binding.gyp | 1 + bindings/go/binding.go | 1 + bindings/rust/build.rs | 4 + bindings/rust/lib.rs | 17 + examples/attributes.tst | 39 + examples/invalid.tst | 9 + examples/simple.tst | 17 + examples/suffix.tst | 15 + grammar.js | 76 +- package.json | 3 +- setup.py | 1 + src/grammar.json | 322 ++++----- src/node-types.json | 100 +-- src/parser.c | 1480 +++++++++++++++++++++++++------------- src/scanner.c | 104 +++ 17 files changed, 1426 insertions(+), 777 deletions(-) create mode 100644 examples/attributes.tst create mode 100644 examples/invalid.tst create mode 100644 examples/simple.tst create mode 100644 examples/suffix.tst create mode 100644 src/scanner.c diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 0482d3f..b3d287b 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -36,7 +36,20 @@ jobs: uses: tree-sitter/parser-setup-action@v1.1 with: node-version: ${{vars.NODE_VERSION}} + - name: Check for scanner changes + uses: tj-actions/changed-files@v42 + id: scanner-check + if: runner.os == 'Linux' + with: + files: src/scanner.c + - name: Fuzz scanner + uses: tree-sitter/fuzz-action@v4 + if: steps.scanner-check.outputs.any_changed == 'true' + with: + corpus: examples - name: Run tests uses: tree-sitter/parser-test-action@v1.2 with: test-library: ${{runner.os == 'Linux'}} + corpus-files: examples/* + invalid-files: examples/invalid.tst diff --git a/Package.swift b/Package.swift index e59b1eb..5e38ed3 100644 --- a/Package.swift +++ b/Package.swift @@ -36,6 +36,7 @@ let package = Package( ], sources: [ "src/parser.c", + "src/scanner.c" ], resources: [ .copy("queries") diff --git a/binding.gyp b/binding.gyp index b5ea5c6..a7d3bb9 100644 --- a/binding.gyp +++ b/binding.gyp @@ -11,6 +11,7 @@ "sources": [ "bindings/node/binding.cc", "src/parser.c", + "src/scanner.c", ], "cflags_c": [ "-std=c11", diff --git a/bindings/go/binding.go b/bindings/go/binding.go index a37103d..441c2ec 100644 --- a/bindings/go/binding.go +++ b/bindings/go/binding.go @@ -2,6 +2,7 @@ package tree_sitter_test // #cgo CFLAGS: -std=c11 -fPIC // #include "../../src/parser.c" +// #include "../../src/scanner.c" import "C" import "unsafe" diff --git a/bindings/rust/build.rs b/bindings/rust/build.rs index 07504bf..da068d1 100644 --- a/bindings/rust/build.rs +++ b/bindings/rust/build.rs @@ -8,5 +8,9 @@ fn main() { c_config.file(&parser_path); println!("cargo:rerun-if-changed={}", parser_path.to_str().unwrap()); + let scanner_path = src_dir.join("scanner.c"); + c_config.file(&scanner_path); + println!("cargo:rerun-if-changed={}", scanner_path.to_str().unwrap()); + c_config.compile("tree-sitter-test"); } diff --git a/bindings/rust/lib.rs b/bindings/rust/lib.rs index 9badd8c..c8617c7 100644 --- a/bindings/rust/lib.rs +++ b/bindings/rust/lib.rs @@ -5,6 +5,23 @@ //! //! ``` //! let code = r#" +//! ================== +//! Return statements +//! ================== +//! +//! func x() int { +//! return 1; +//! } +//! +//! --- +//! +//! (source_file +//! (function_definition +//! (identifier) +//! (parameter_list) +//! (primitive_type) +//! (block +//! (return_statement (number))))) //! "#; //! let mut parser = tree_sitter::Parser::new(); //! parser.set_language(&tree_sitter_test::language()).expect("Error loading Test grammar"); diff --git a/examples/attributes.tst b/examples/attributes.tst new file mode 100644 index 0000000..f7ca9e0 --- /dev/null +++ b/examples/attributes.tst @@ -0,0 +1,39 @@ +========================= +Test that will be skipped +:skip +========================= + +int main() {} + +------------------------- + +==================================== +Test that will run on Linux or macOS + +:platform(linux) +:platform(macos) +==================================== + +int main() {} + +------------------------------------ + +======================================================================== +Test that expects an error, and will fail fast if there's no parse error +:fail-fast +:error +======================================================================== + +int main ( {} + +------------------------------------------------------------------------ + +================================================= +Test that will parse with both Typescript and TSX +:language(typescript) +:language(tsx) +================================================= + +console.log('Hello, world!'); + +------------------------------------------------- diff --git a/examples/invalid.tst b/examples/invalid.tst new file mode 100644 index 0000000..a789334 --- /dev/null +++ b/examples/invalid.tst @@ -0,0 +1,9 @@ +==================||| +Invalid suffix +==================||| + +foo + +---|| + +(foo) diff --git a/examples/simple.tst b/examples/simple.tst new file mode 100644 index 0000000..ea10233 --- /dev/null +++ b/examples/simple.tst @@ -0,0 +1,17 @@ +================== +Return statements +================== + +func x() int { + return 1; +} + +--- + +(source_file + (function_definition + (identifier) + (parameter_list) + (primitive_type) + (block + (return_statement (number))))) diff --git a/examples/suffix.tst b/examples/suffix.tst new file mode 100644 index 0000000..fef0a2e --- /dev/null +++ b/examples/suffix.tst @@ -0,0 +1,15 @@ +==================||| +Basic module +==================||| + +---- MODULE Test ---- +increment(n) == n + 1 +==== + +---||| + +(source_file + (module (identifier) + (operator (identifier) + (parameter_list (identifier)) + (plus (identifier_ref) (number))))) diff --git a/grammar.js b/grammar.js index 7cd665c..90a4f9b 100644 --- a/grammar.js +++ b/grammar.js @@ -1,63 +1,69 @@ /// // @ts-check -const I = token.immediate; - module.exports = grammar({ name: "test", - extras: _ => [/\r?\n/], + externals: $ => [ + $._equals_begin, + $._equals_end, + $._dashes, + ], + + extras: _ => [], rules: { - file: $ => repeat($.test), + file: $ => repeat( + choice($.test, $._eol) + ), - test: $ => seq( + test: $ => prec.right(seq( $.header, - alias(repeat1(/./), $.input), + alias($._body, $.input), alias($._dashes, $.separator), - alias(repeat(/./), $.output) - ), + optional(alias($._body, $.output)), + )), + + _line: _ => /[^\r\n]+/, + + _body: $ => repeat1(choice($._line, $._eol)), header: $ => seq( - alias($._equals, $.separator), - alias(repeat1(/[^\r\n]/), $.name), + alias($._equals_begin, $.separator), + alias($._line, $.name), optional($.attributes), - alias($._equals, $.separator) + alias($._equals_end, $.separator), ), attributes: $ => repeat1( - field("attribute", choice( - $.skip, - $.error, - $.fail_fast, - $.language, - $.platform, - )) + choice($.attribute, $._eol) ), - skip: _ => ":skip", - - error: _ => ":error", - - fail_fast: _ => ":fail-fast", + attribute: $ => choice( + ":skip", + ":error", + ":fail-fast", + $._language, + $._platform, + ), - language: $ => seq( + _language: $ => seq( ":language", - I("("), - alias($._lang, $.parameter), - I(")") + "(", + field("language", alias($._lang, $.parameter)), + ")" ), - platform: $ => seq( + _platform: $ => seq( ":platform", - I("("), - alias($._os, $.parameter), - I(")") + "(", + field("platform", alias($._os, $.parameter)), + ")" ), - _lang: _ => I(repeat1(/[\w.-]/)), + _lang: _ => token(repeat1(/[\w.-]/)), - _os: _ => I(choice( + _os: _ => token(choice( "linux", "macos", "ios", @@ -70,8 +76,6 @@ module.exports = grammar({ "windows", )), - _equals: $ => token(prec(1, repeat1("="))), - - _dashes: $ => token(prec(1, seq("---", repeat("-")))) + _eol: _ => /[\r\n]|\r\n/ } }); diff --git a/package.json b/package.json index 8bead94..208728d 100644 --- a/package.json +++ b/package.json @@ -37,7 +37,8 @@ { "scope": "text.test", "highlights": "queries/highlights.scm", - "injections": "queries/injections.scm" + "injections": "queries/injections.scm", + "file-types": ["tst"] } ] } diff --git a/setup.py b/setup.py index 7d72391..bd95a9b 100644 --- a/setup.py +++ b/setup.py @@ -36,6 +36,7 @@ def get_tag(self): sources=[ "bindings/python/tree_sitter_test/binding.c", "src/parser.c", + "src/scanner.c", ], extra_compile_args=( ["-std=c11"] if system() != 'Windows' else [] diff --git a/src/grammar.json b/src/grammar.json index e7dfa10..b77d60d 100644 --- a/src/grammar.json +++ b/src/grammar.json @@ -4,51 +4,86 @@ "file": { "type": "REPEAT", "content": { - "type": "SYMBOL", - "name": "test" + "type": "CHOICE", + "members": [ + { + "type": "SYMBOL", + "name": "test" + }, + { + "type": "SYMBOL", + "name": "_eol" + } + ] } }, "test": { - "type": "SEQ", - "members": [ - { - "type": "SYMBOL", - "name": "header" - }, - { - "type": "ALIAS", - "content": { - "type": "REPEAT1", - "content": { - "type": "PATTERN", - "value": "." - } - }, - "named": true, - "value": "input" - }, - { - "type": "ALIAS", - "content": { + "type": "PREC_RIGHT", + "value": 0, + "content": { + "type": "SEQ", + "members": [ + { "type": "SYMBOL", - "name": "_dashes" + "name": "header" }, - "named": true, - "value": "separator" - }, - { - "type": "ALIAS", - "content": { - "type": "REPEAT", + { + "type": "ALIAS", "content": { - "type": "PATTERN", - "value": "." - } + "type": "SYMBOL", + "name": "_body" + }, + "named": true, + "value": "input" }, - "named": true, - "value": "output" - } - ] + { + "type": "ALIAS", + "content": { + "type": "SYMBOL", + "name": "_dashes" + }, + "named": true, + "value": "separator" + }, + { + "type": "CHOICE", + "members": [ + { + "type": "ALIAS", + "content": { + "type": "SYMBOL", + "name": "_body" + }, + "named": true, + "value": "output" + }, + { + "type": "BLANK" + } + ] + } + ] + } + }, + "_line": { + "type": "PATTERN", + "value": "[^\\r\\n]+" + }, + "_body": { + "type": "REPEAT1", + "content": { + "type": "CHOICE", + "members": [ + { + "type": "SYMBOL", + "name": "_line" + }, + { + "type": "SYMBOL", + "name": "_eol" + } + ] + } }, "header": { "type": "SEQ", @@ -57,7 +92,7 @@ "type": "ALIAS", "content": { "type": "SYMBOL", - "name": "_equals" + "name": "_equals_begin" }, "named": true, "value": "separator" @@ -65,11 +100,8 @@ { "type": "ALIAS", "content": { - "type": "REPEAT1", - "content": { - "type": "PATTERN", - "value": "[^\\r\\n]" - } + "type": "SYMBOL", + "name": "_line" }, "named": true, "value": "name" @@ -90,7 +122,7 @@ "type": "ALIAS", "content": { "type": "SYMBOL", - "name": "_equals" + "name": "_equals_end" }, "named": true, "value": "separator" @@ -100,48 +132,45 @@ "attributes": { "type": "REPEAT1", "content": { - "type": "FIELD", - "name": "attribute", - "content": { - "type": "CHOICE", - "members": [ - { - "type": "SYMBOL", - "name": "skip" - }, - { - "type": "SYMBOL", - "name": "error" - }, - { - "type": "SYMBOL", - "name": "fail_fast" - }, - { - "type": "SYMBOL", - "name": "language" - }, - { - "type": "SYMBOL", - "name": "platform" - } - ] - } + "type": "CHOICE", + "members": [ + { + "type": "SYMBOL", + "name": "attribute" + }, + { + "type": "SYMBOL", + "name": "_eol" + } + ] } }, - "skip": { - "type": "STRING", - "value": ":skip" - }, - "error": { - "type": "STRING", - "value": ":error" - }, - "fail_fast": { - "type": "STRING", - "value": ":fail-fast" + "attribute": { + "type": "CHOICE", + "members": [ + { + "type": "STRING", + "value": ":skip" + }, + { + "type": "STRING", + "value": ":error" + }, + { + "type": "STRING", + "value": ":fail-fast" + }, + { + "type": "SYMBOL", + "name": "_language" + }, + { + "type": "SYMBOL", + "name": "_platform" + } + ] }, - "language": { + "_language": { "type": "SEQ", "members": [ { @@ -149,31 +178,29 @@ "value": ":language" }, { - "type": "IMMEDIATE_TOKEN", - "content": { - "type": "STRING", - "value": "(" - } + "type": "STRING", + "value": "(" }, { - "type": "ALIAS", + "type": "FIELD", + "name": "language", "content": { - "type": "SYMBOL", - "name": "_lang" - }, - "named": true, - "value": "parameter" + "type": "ALIAS", + "content": { + "type": "SYMBOL", + "name": "_lang" + }, + "named": true, + "value": "parameter" + } }, { - "type": "IMMEDIATE_TOKEN", - "content": { - "type": "STRING", - "value": ")" - } + "type": "STRING", + "value": ")" } ] }, - "platform": { + "_platform": { "type": "SEQ", "members": [ { @@ -181,32 +208,30 @@ "value": ":platform" }, { - "type": "IMMEDIATE_TOKEN", - "content": { - "type": "STRING", - "value": "(" - } + "type": "STRING", + "value": "(" }, { - "type": "ALIAS", + "type": "FIELD", + "name": "platform", "content": { - "type": "SYMBOL", - "name": "_os" - }, - "named": true, - "value": "parameter" + "type": "ALIAS", + "content": { + "type": "SYMBOL", + "name": "_os" + }, + "named": true, + "value": "parameter" + } }, { - "type": "IMMEDIATE_TOKEN", - "content": { - "type": "STRING", - "value": ")" - } + "type": "STRING", + "value": ")" } ] }, "_lang": { - "type": "IMMEDIATE_TOKEN", + "type": "TOKEN", "content": { "type": "REPEAT1", "content": { @@ -216,7 +241,7 @@ } }, "_os": { - "type": "IMMEDIATE_TOKEN", + "type": "TOKEN", "content": { "type": "CHOICE", "members": [ @@ -263,53 +288,28 @@ ] } }, - "_equals": { - "type": "TOKEN", - "content": { - "type": "PREC", - "value": 1, - "content": { - "type": "REPEAT1", - "content": { - "type": "STRING", - "value": "=" - } - } - } - }, - "_dashes": { - "type": "TOKEN", - "content": { - "type": "PREC", - "value": 1, - "content": { - "type": "SEQ", - "members": [ - { - "type": "STRING", - "value": "---" - }, - { - "type": "REPEAT", - "content": { - "type": "STRING", - "value": "-" - } - } - ] - } - } + "_eol": { + "type": "PATTERN", + "value": "[\\r\\n]|\\r\\n" } }, - "extras": [ + "extras": [], + "conflicts": [], + "precedences": [], + "externals": [ { - "type": "PATTERN", - "value": "\\r?\\n" + "type": "SYMBOL", + "name": "_equals_begin" + }, + { + "type": "SYMBOL", + "name": "_equals_end" + }, + { + "type": "SYMBOL", + "name": "_dashes" } ], - "conflicts": [], - "precedences": [], - "externals": [], "inline": [], "supertypes": [] } diff --git a/src/node-types.json b/src/node-types.json index 81bf114..2d8fb52 100644 --- a/src/node-types.json +++ b/src/node-types.json @@ -1,36 +1,45 @@ [ { - "type": "attributes", + "type": "attribute", "named": true, "fields": { - "attribute": { - "multiple": true, - "required": true, + "language": { + "multiple": false, + "required": false, "types": [ { - "type": "error", - "named": true - }, - { - "type": "fail_fast", - "named": true - }, - { - "type": "language", + "type": "parameter", "named": true - }, - { - "type": "platform", - "named": true - }, + } + ] + }, + "platform": { + "multiple": false, + "required": false, + "types": [ { - "type": "skip", + "type": "parameter", "named": true } ] } } }, + { + "type": "attributes", + "named": true, + "fields": {}, + "children": { + "multiple": true, + "required": false, + "types": [ + { + "type": "attribute", + "named": true + } + ] + } + }, { "type": "file", "named": true, @@ -74,46 +83,11 @@ "named": true, "fields": {} }, - { - "type": "language", - "named": true, - "fields": {}, - "children": { - "multiple": false, - "required": true, - "types": [ - { - "type": "parameter", - "named": true - } - ] - } - }, - { - "type": "name", - "named": true, - "fields": {} - }, { "type": "output", "named": true, "fields": {} }, - { - "type": "platform", - "named": true, - "fields": {}, - "children": { - "multiple": false, - "required": true, - "types": [ - { - "type": "parameter", - "named": true - } - ] - } - }, { "type": "test", "named": true, @@ -149,6 +123,14 @@ "type": ")", "named": false }, + { + "type": ":error", + "named": false + }, + { + "type": ":fail-fast", + "named": false + }, { "type": ":language", "named": false @@ -158,11 +140,11 @@ "named": false }, { - "type": "error", - "named": true + "type": ":skip", + "named": false }, { - "type": "fail_fast", + "type": "name", "named": true }, { @@ -172,9 +154,5 @@ { "type": "separator", "named": true - }, - { - "type": "skip", - "named": true } ] \ No newline at end of file diff --git a/src/parser.c b/src/parser.c index 6543c2a..ed5e1f2 100644 --- a/src/parser.c +++ b/src/parser.c @@ -7,67 +7,69 @@ #define LANGUAGE_VERSION 14 #define STATE_COUNT 31 #define LARGE_STATE_COUNT 2 -#define SYMBOL_COUNT 24 +#define SYMBOL_COUNT 25 #define ALIAS_COUNT 3 -#define TOKEN_COUNT 14 -#define EXTERNAL_TOKEN_COUNT 0 -#define FIELD_COUNT 1 +#define TOKEN_COUNT 15 +#define EXTERNAL_TOKEN_COUNT 3 +#define FIELD_COUNT 2 #define MAX_ALIAS_SEQUENCE_LENGTH 4 -#define PRODUCTION_ID_COUNT 7 +#define PRODUCTION_ID_COUNT 8 enum ts_symbol_identifiers { - aux_sym_test_token1 = 1, - aux_sym_header_token1 = 2, - sym_skip = 3, - sym_error = 4, - sym_fail_fast = 5, - anon_sym_COLONlanguage = 6, - anon_sym_LPAREN = 7, - anon_sym_RPAREN = 8, - anon_sym_COLONplatform = 9, - sym__lang = 10, - sym__os = 11, - sym__equals = 12, - sym__dashes = 13, - sym_file = 14, - sym_test = 15, - sym_header = 16, - sym_attributes = 17, - sym_language = 18, - sym_platform = 19, - aux_sym_file_repeat1 = 20, - aux_sym_test_repeat1 = 21, - aux_sym_header_repeat1 = 22, - aux_sym_attributes_repeat1 = 23, - alias_sym_input = 24, - alias_sym_name = 25, - alias_sym_output = 26, + sym__line = 1, + anon_sym_COLONskip = 2, + anon_sym_COLONerror = 3, + anon_sym_COLONfail_DASHfast = 4, + anon_sym_COLONlanguage = 5, + anon_sym_LPAREN = 6, + anon_sym_RPAREN = 7, + anon_sym_COLONplatform = 8, + sym__lang = 9, + sym__os = 10, + sym__eol = 11, + sym__equals_begin = 12, + sym__equals_end = 13, + sym__dashes = 14, + sym_file = 15, + sym_test = 16, + aux_sym__body = 17, + sym_header = 18, + sym_attributes = 19, + sym_attribute = 20, + sym__language = 21, + sym__platform = 22, + aux_sym_file_repeat1 = 23, + aux_sym_attributes_repeat1 = 24, + alias_sym_input = 25, + alias_sym_name = 26, + alias_sym_output = 27, }; static const char * const ts_symbol_names[] = { [ts_builtin_sym_end] = "end", - [aux_sym_test_token1] = "test_token1", - [aux_sym_header_token1] = "header_token1", - [sym_skip] = "skip", - [sym_error] = "error", - [sym_fail_fast] = "fail_fast", + [sym__line] = "_line", + [anon_sym_COLONskip] = ":skip", + [anon_sym_COLONerror] = ":error", + [anon_sym_COLONfail_DASHfast] = ":fail-fast", [anon_sym_COLONlanguage] = ":language", [anon_sym_LPAREN] = "(", [anon_sym_RPAREN] = ")", [anon_sym_COLONplatform] = ":platform", [sym__lang] = "parameter", [sym__os] = "parameter", - [sym__equals] = "separator", + [sym__eol] = "_eol", + [sym__equals_begin] = "separator", + [sym__equals_end] = "separator", [sym__dashes] = "separator", [sym_file] = "file", [sym_test] = "test", + [aux_sym__body] = "_body", [sym_header] = "header", [sym_attributes] = "attributes", - [sym_language] = "language", - [sym_platform] = "platform", + [sym_attribute] = "attribute", + [sym__language] = "_language", + [sym__platform] = "_platform", [aux_sym_file_repeat1] = "file_repeat1", - [aux_sym_test_repeat1] = "test_repeat1", - [aux_sym_header_repeat1] = "header_repeat1", [aux_sym_attributes_repeat1] = "attributes_repeat1", [alias_sym_input] = "input", [alias_sym_name] = "name", @@ -76,28 +78,29 @@ static const char * const ts_symbol_names[] = { static const TSSymbol ts_symbol_map[] = { [ts_builtin_sym_end] = ts_builtin_sym_end, - [aux_sym_test_token1] = aux_sym_test_token1, - [aux_sym_header_token1] = aux_sym_header_token1, - [sym_skip] = sym_skip, - [sym_error] = sym_error, - [sym_fail_fast] = sym_fail_fast, + [sym__line] = sym__line, + [anon_sym_COLONskip] = anon_sym_COLONskip, + [anon_sym_COLONerror] = anon_sym_COLONerror, + [anon_sym_COLONfail_DASHfast] = anon_sym_COLONfail_DASHfast, [anon_sym_COLONlanguage] = anon_sym_COLONlanguage, [anon_sym_LPAREN] = anon_sym_LPAREN, [anon_sym_RPAREN] = anon_sym_RPAREN, [anon_sym_COLONplatform] = anon_sym_COLONplatform, [sym__lang] = sym__lang, [sym__os] = sym__lang, - [sym__equals] = sym__equals, - [sym__dashes] = sym__equals, + [sym__eol] = sym__eol, + [sym__equals_begin] = sym__equals_begin, + [sym__equals_end] = sym__equals_begin, + [sym__dashes] = sym__equals_begin, [sym_file] = sym_file, [sym_test] = sym_test, + [aux_sym__body] = aux_sym__body, [sym_header] = sym_header, [sym_attributes] = sym_attributes, - [sym_language] = sym_language, - [sym_platform] = sym_platform, + [sym_attribute] = sym_attribute, + [sym__language] = sym__language, + [sym__platform] = sym__platform, [aux_sym_file_repeat1] = aux_sym_file_repeat1, - [aux_sym_test_repeat1] = aux_sym_test_repeat1, - [aux_sym_header_repeat1] = aux_sym_header_repeat1, [aux_sym_attributes_repeat1] = aux_sym_attributes_repeat1, [alias_sym_input] = alias_sym_input, [alias_sym_name] = alias_sym_name, @@ -109,25 +112,21 @@ static const TSSymbolMetadata ts_symbol_metadata[] = { .visible = false, .named = true, }, - [aux_sym_test_token1] = { + [sym__line] = { .visible = false, - .named = false, - }, - [aux_sym_header_token1] = { - .visible = false, - .named = false, + .named = true, }, - [sym_skip] = { + [anon_sym_COLONskip] = { .visible = true, - .named = true, + .named = false, }, - [sym_error] = { + [anon_sym_COLONerror] = { .visible = true, - .named = true, + .named = false, }, - [sym_fail_fast] = { + [anon_sym_COLONfail_DASHfast] = { .visible = true, - .named = true, + .named = false, }, [anon_sym_COLONlanguage] = { .visible = true, @@ -153,7 +152,15 @@ static const TSSymbolMetadata ts_symbol_metadata[] = { .visible = true, .named = true, }, - [sym__equals] = { + [sym__eol] = { + .visible = false, + .named = true, + }, + [sym__equals_begin] = { + .visible = true, + .named = true, + }, + [sym__equals_end] = { .visible = true, .named = true, }, @@ -169,6 +176,10 @@ static const TSSymbolMetadata ts_symbol_metadata[] = { .visible = true, .named = true, }, + [aux_sym__body] = { + .visible = false, + .named = false, + }, [sym_header] = { .visible = true, .named = true, @@ -177,23 +188,19 @@ static const TSSymbolMetadata ts_symbol_metadata[] = { .visible = true, .named = true, }, - [sym_language] = { - .visible = true, - .named = true, - }, - [sym_platform] = { + [sym_attribute] = { .visible = true, .named = true, }, - [aux_sym_file_repeat1] = { + [sym__language] = { .visible = false, - .named = false, + .named = true, }, - [aux_sym_test_repeat1] = { + [sym__platform] = { .visible = false, - .named = false, + .named = true, }, - [aux_sym_header_repeat1] = { + [aux_sym_file_repeat1] = { .visible = false, .named = false, }, @@ -216,52 +223,53 @@ static const TSSymbolMetadata ts_symbol_metadata[] = { }; enum ts_field_identifiers { - field_attribute = 1, + field_language = 1, + field_platform = 2, }; static const char * const ts_field_names[] = { [0] = NULL, - [field_attribute] = "attribute", + [field_language] = "language", + [field_platform] = "platform", }; static const TSFieldMapSlice ts_field_map_slices[PRODUCTION_ID_COUNT] = { - [1] = {.index = 0, .length = 1}, + [2] = {.index = 0, .length = 1}, [3] = {.index = 1, .length = 1}, - [5] = {.index = 2, .length = 2}, + [6] = {.index = 2, .length = 1}, + [7] = {.index = 3, .length = 1}, }; static const TSFieldMapEntry ts_field_map_entries[] = { [0] = - {field_attribute, 0}, + {field_language, 0, .inherited = true}, [1] = - {field_attribute, 0, .inherited = true}, + {field_platform, 0, .inherited = true}, [2] = - {field_attribute, 0, .inherited = true}, - {field_attribute, 1, .inherited = true}, + {field_language, 2}, + [3] = + {field_platform, 2}, }; static const TSSymbol ts_alias_sequences[PRODUCTION_ID_COUNT][MAX_ALIAS_SEQUENCE_LENGTH] = { [0] = {0}, - [2] = { + [1] = { [1] = alias_sym_name, }, [4] = { [1] = alias_sym_input, }, - [6] = { + [5] = { [1] = alias_sym_input, [3] = alias_sym_output, }, }; static const uint16_t ts_non_terminal_alias_map[] = { - aux_sym_test_repeat1, 3, - aux_sym_test_repeat1, + aux_sym__body, 3, + aux_sym__body, alias_sym_input, alias_sym_output, - aux_sym_header_repeat1, 2, - aux_sym_header_repeat1, - alias_sym_name, 0, }; @@ -282,10 +290,10 @@ static const TSStateId ts_primary_state_ids[STATE_COUNT] = { [13] = 13, [14] = 14, [15] = 15, - [16] = 16, - [17] = 14, - [18] = 18, - [19] = 15, + [16] = 12, + [17] = 17, + [18] = 17, + [19] = 19, [20] = 20, [21] = 21, [22] = 22, @@ -304,368 +312,743 @@ static bool ts_lex(TSLexer *lexer, TSStateId state) { eof = lexer->eof(lexer); switch (state) { case 0: - if (eof) ADVANCE(84); - if (lookahead == '\n') SKIP(82) - if (lookahead == '\r') SKIP(81) - if (lookahead == '(') ADVANCE(93); - if (lookahead == ')') ADVANCE(94); - if (lookahead == ':') ADVANCE(88); - if (lookahead == '=') ADVANCE(98); + if (eof) ADVANCE(76); + if (lookahead == '\n') ADVANCE(129); + if (lookahead == '\r') ADVANCE(130); + if (lookahead == '(') ADVANCE(82); + if (lookahead == ')') ADVANCE(83); + if (lookahead == ':') ADVANCE(16); + if (lookahead == 'a') ADVANCE(105); + if (lookahead == 'd') ADVANCE(116); + if (lookahead == 'f') ADVANCE(117); + if (lookahead == 'i') ADVANCE(110); + if (lookahead == 'l') ADVANCE(100); + if (lookahead == 'm') ADVANCE(85); + if (lookahead == 'n') ADVANCE(93); + if (lookahead == 'o') ADVANCE(115); + if (lookahead == 's') ADVANCE(111); + if (lookahead == 'w') ADVANCE(102); if (lookahead == '-' || lookahead == '.' || ('0' <= lookahead && lookahead <= '9') || ('A' <= lookahead && lookahead <= 'Z') || lookahead == '_' || - ('a' <= lookahead && lookahead <= 'z')) ADVANCE(96); - if (lookahead != 0) ADVANCE(87); + ('b' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 1: - if (lookahead == '\n') SKIP(2) + if (lookahead == '-') ADVANCE(23); END_STATE(); case 2: - if (lookahead == '\n') SKIP(2) - if (lookahead == '\r') SKIP(1) - if (lookahead == ':') ADVANCE(88); - if (lookahead == '=') ADVANCE(98); - if (lookahead != 0) ADVANCE(87); + if (lookahead == 'a') ADVANCE(29); END_STATE(); case 3: - if (lookahead == '\n') SKIP(3) - if (lookahead == '\r') ADVANCE(85); - if (lookahead == '-') ADVANCE(86); - if (lookahead != 0) ADVANCE(85); + if (lookahead == 'a') ADVANCE(40); END_STATE(); case 4: - if (lookahead == '\n') SKIP(5) + if (lookahead == 'a') ADVANCE(66); END_STATE(); case 5: - if (lookahead == '\n') SKIP(5) - if (lookahead == '\r') SKIP(4) - if (lookahead != 0) ADVANCE(87); + if (lookahead == 'a') ADVANCE(64); END_STATE(); case 6: - if (lookahead == '\n') SKIP(6) - if (lookahead == '\r') ADVANCE(85); - if (lookahead != 0) ADVANCE(85); + if (lookahead == 'a') ADVANCE(12); END_STATE(); case 7: - if (lookahead == '(') ADVANCE(93); - if (lookahead == ')') ADVANCE(94); - if (lookahead == '-' || - lookahead == '.' || - ('0' <= lookahead && lookahead <= '9') || - ('A' <= lookahead && lookahead <= 'Z') || - lookahead == '_' || - ('a' <= lookahead && lookahead <= 'z')) ADVANCE(96); + if (lookahead == 'a') ADVANCE(41); + if (lookahead == 'd') ADVANCE(62); + if (lookahead == 'f') ADVANCE(59); + if (lookahead == 'i') ADVANCE(47); + if (lookahead == 'l') ADVANCE(31); + if (lookahead == 'm') ADVANCE(6); + if (lookahead == 'n') ADVANCE(19); + if (lookahead == 'o') ADVANCE(54); + if (lookahead == 's') ADVANCE(52); + if (lookahead == 'w') ADVANCE(33); END_STATE(); case 8: - if (lookahead == '-') ADVANCE(99); + if (lookahead == 'a') ADVANCE(26); END_STATE(); case 9: - if (lookahead == '-') ADVANCE(30); + if (lookahead == 'a') ADVANCE(27); END_STATE(); case 10: - if (lookahead == 'a') ADVANCE(36); + if (lookahead == 'a') ADVANCE(61); END_STATE(); case 11: - if (lookahead == 'a') ADVANCE(47); + if (lookahead == 'b') ADVANCE(65); END_STATE(); case 12: - if (lookahead == 'a') ADVANCE(73); + if (lookahead == 'c') ADVANCE(47); END_STATE(); case 13: - if (lookahead == 'a') ADVANCE(71); + if (lookahead == 'd') ADVANCE(128); END_STATE(); case 14: - if (lookahead == 'a') ADVANCE(20); + if (lookahead == 'd') ADVANCE(46); END_STATE(); case 15: - if (lookahead == 'a') ADVANCE(48); - if (lookahead == 'd') ADVANCE(69); - if (lookahead == 'f') ADVANCE(66); - if (lookahead == 'i') ADVANCE(54); - if (lookahead == 'l') ADVANCE(38); - if (lookahead == 'm') ADVANCE(14); - if (lookahead == 'n') ADVANCE(26); - if (lookahead == 'o') ADVANCE(61); - if (lookahead == 's') ADVANCE(59); - if (lookahead == 'w') ADVANCE(40); + if (lookahead == 'd') ADVANCE(60); END_STATE(); case 16: - if (lookahead == 'a') ADVANCE(33); + if (lookahead == 'e') ADVANCE(58); + if (lookahead == 'f') ADVANCE(2); + if (lookahead == 'l') ADVANCE(3); + if (lookahead == 'p') ADVANCE(37); + if (lookahead == 's') ADVANCE(34); END_STATE(); case 17: - if (lookahead == 'a') ADVANCE(34); + if (lookahead == 'e') ADVANCE(81); END_STATE(); case 18: - if (lookahead == 'a') ADVANCE(68); + if (lookahead == 'e') ADVANCE(11); END_STATE(); case 19: - if (lookahead == 'b') ADVANCE(72); + if (lookahead == 'e') ADVANCE(68); END_STATE(); case 20: - if (lookahead == 'c') ADVANCE(54); + if (lookahead == 'e') ADVANCE(42); END_STATE(); case 21: - if (lookahead == 'd') ADVANCE(97); + if (lookahead == 'e') ADVANCE(18); END_STATE(); case 22: - if (lookahead == 'd') ADVANCE(53); + if (lookahead == 'f') ADVANCE(36); END_STATE(); case 23: - if (lookahead == 'd') ADVANCE(67); + if (lookahead == 'f') ADVANCE(5); END_STATE(); case 24: - if (lookahead == 'e') ADVANCE(92); + if (lookahead == 'f') ADVANCE(49); END_STATE(); case 25: - if (lookahead == 'e') ADVANCE(19); + if (lookahead == 'g') ADVANCE(70); END_STATE(); case 26: - if (lookahead == 'e') ADVANCE(75); + if (lookahead == 'g') ADVANCE(17); END_STATE(); case 27: - if (lookahead == 'e') ADVANCE(49); + if (lookahead == 'g') ADVANCE(51); END_STATE(); case 28: - if (lookahead == 'e') ADVANCE(25); + if (lookahead == 'i') ADVANCE(53); END_STATE(); case 29: - if (lookahead == 'f') ADVANCE(43); + if (lookahead == 'i') ADVANCE(35); END_STATE(); case 30: - if (lookahead == 'f') ADVANCE(13); + if (lookahead == 'i') ADVANCE(63); END_STATE(); case 31: - if (lookahead == 'f') ADVANCE(56); + if (lookahead == 'i') ADVANCE(43); END_STATE(); case 32: - if (lookahead == 'g') ADVANCE(77); + if (lookahead == 'i') ADVANCE(13); END_STATE(); case 33: - if (lookahead == 'g') ADVANCE(24); + if (lookahead == 'i') ADVANCE(44); END_STATE(); case 34: - if (lookahead == 'g') ADVANCE(58); + if (lookahead == 'k') ADVANCE(28); END_STATE(); case 35: - if (lookahead == 'i') ADVANCE(60); + if (lookahead == 'l') ADVANCE(1); END_STATE(); case 36: - if (lookahead == 'i') ADVANCE(42); + if (lookahead == 'l') ADVANCE(73); END_STATE(); case 37: - if (lookahead == 'i') ADVANCE(70); + if (lookahead == 'l') ADVANCE(4); END_STATE(); case 38: - if (lookahead == 'i') ADVANCE(50); + if (lookahead == 'l') ADVANCE(10); END_STATE(); case 39: - if (lookahead == 'i') ADVANCE(21); + if (lookahead == 'm') ADVANCE(84); END_STATE(); case 40: - if (lookahead == 'i') ADVANCE(51); + if (lookahead == 'n') ADVANCE(25); END_STATE(); case 41: - if (lookahead == 'k') ADVANCE(35); + if (lookahead == 'n') ADVANCE(15); END_STATE(); case 42: - if (lookahead == 'l') ADVANCE(9); + if (lookahead == 'n') ADVANCE(11); END_STATE(); case 43: - if (lookahead == 'l') ADVANCE(80); + if (lookahead == 'n') ADVANCE(69); END_STATE(); case 44: - if (lookahead == 'l') ADVANCE(12); + if (lookahead == 'n') ADVANCE(14); END_STATE(); case 45: - if (lookahead == 'l') ADVANCE(18); + if (lookahead == 'n') ADVANCE(22); END_STATE(); case 46: - if (lookahead == 'm') ADVANCE(95); + if (lookahead == 'o') ADVANCE(71); END_STATE(); case 47: - if (lookahead == 'n') ADVANCE(32); + if (lookahead == 'o') ADVANCE(63); END_STATE(); case 48: - if (lookahead == 'n') ADVANCE(23); + if (lookahead == 'o') ADVANCE(56); END_STATE(); case 49: - if (lookahead == 'n') ADVANCE(19); + if (lookahead == 'o') ADVANCE(57); END_STATE(); case 50: - if (lookahead == 'n') ADVANCE(76); + if (lookahead == 'o') ADVANCE(32); END_STATE(); case 51: - if (lookahead == 'n') ADVANCE(22); + if (lookahead == 'o') ADVANCE(45); END_STATE(); case 52: - if (lookahead == 'n') ADVANCE(29); + if (lookahead == 'o') ADVANCE(38); END_STATE(); case 53: - if (lookahead == 'o') ADVANCE(78); + if (lookahead == 'p') ADVANCE(78); END_STATE(); case 54: - if (lookahead == 'o') ADVANCE(70); + if (lookahead == 'p') ADVANCE(20); END_STATE(); case 55: - if (lookahead == 'o') ADVANCE(63); + if (lookahead == 'r') ADVANCE(48); END_STATE(); case 56: - if (lookahead == 'o') ADVANCE(64); + if (lookahead == 'r') ADVANCE(79); END_STATE(); case 57: - if (lookahead == 'o') ADVANCE(39); + if (lookahead == 'r') ADVANCE(39); END_STATE(); case 58: - if (lookahead == 'o') ADVANCE(52); + if (lookahead == 'r') ADVANCE(55); END_STATE(); case 59: - if (lookahead == 'o') ADVANCE(45); + if (lookahead == 'r') ADVANCE(21); END_STATE(); case 60: - if (lookahead == 'p') ADVANCE(89); + if (lookahead == 'r') ADVANCE(50); END_STATE(); case 61: - if (lookahead == 'p') ADVANCE(27); + if (lookahead == 'r') ADVANCE(30); END_STATE(); case 62: - if (lookahead == 'r') ADVANCE(55); + if (lookahead == 'r') ADVANCE(9); END_STATE(); case 63: - if (lookahead == 'r') ADVANCE(90); + if (lookahead == 's') ADVANCE(128); END_STATE(); case 64: - if (lookahead == 'r') ADVANCE(46); + if (lookahead == 's') ADVANCE(67); END_STATE(); case 65: - if (lookahead == 'r') ADVANCE(62); + if (lookahead == 's') ADVANCE(13); END_STATE(); case 66: - if (lookahead == 'r') ADVANCE(28); + if (lookahead == 't') ADVANCE(24); END_STATE(); case 67: - if (lookahead == 'r') ADVANCE(57); + if (lookahead == 't') ADVANCE(80); END_STATE(); case 68: - if (lookahead == 'r') ADVANCE(37); + if (lookahead == 't') ADVANCE(11); END_STATE(); case 69: - if (lookahead == 'r') ADVANCE(17); + if (lookahead == 'u') ADVANCE(72); END_STATE(); case 70: - if (lookahead == 's') ADVANCE(97); + if (lookahead == 'u') ADVANCE(8); END_STATE(); case 71: - if (lookahead == 's') ADVANCE(74); + if (lookahead == 'w') ADVANCE(63); END_STATE(); case 72: - if (lookahead == 's') ADVANCE(21); + if (lookahead == 'x') ADVANCE(128); END_STATE(); case 73: - if (lookahead == 't') ADVANCE(31); + if (lookahead == 'y') ADVANCE(128); END_STATE(); case 74: - if (lookahead == 't') ADVANCE(91); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 75: - if (lookahead == 't') ADVANCE(19); + if (eof) ADVANCE(76); + if (lookahead == '\n') ADVANCE(129); + if (lookahead == '\r') ADVANCE(130); + if (lookahead != 0) ADVANCE(77); END_STATE(); case 76: - if (lookahead == 'u') ADVANCE(79); + ACCEPT_TOKEN(ts_builtin_sym_end); END_STATE(); case 77: - if (lookahead == 'u') ADVANCE(16); + ACCEPT_TOKEN(sym__line); + if (lookahead != 0 && + lookahead != '\n' && + lookahead != '\r') ADVANCE(77); END_STATE(); case 78: - if (lookahead == 'w') ADVANCE(70); + ACCEPT_TOKEN(anon_sym_COLONskip); END_STATE(); case 79: - if (lookahead == 'x') ADVANCE(97); + ACCEPT_TOKEN(anon_sym_COLONerror); END_STATE(); case 80: - if (lookahead == 'y') ADVANCE(97); + ACCEPT_TOKEN(anon_sym_COLONfail_DASHfast); END_STATE(); case 81: - if (eof) ADVANCE(84); - if (lookahead == '\n') SKIP(82) + ACCEPT_TOKEN(anon_sym_COLONlanguage); END_STATE(); case 82: - if (eof) ADVANCE(84); - if (lookahead == '\n') SKIP(82) - if (lookahead == '\r') SKIP(81) - if (lookahead == ':') ADVANCE(88); - if (lookahead == '=') ADVANCE(98); - if (lookahead != 0) ADVANCE(87); + ACCEPT_TOKEN(anon_sym_LPAREN); END_STATE(); case 83: - if (eof) ADVANCE(84); - if (lookahead == '\n') SKIP(83) - if (lookahead == '\r') ADVANCE(85); - if (lookahead == '=') ADVANCE(98); - if (lookahead != 0) ADVANCE(85); + ACCEPT_TOKEN(anon_sym_RPAREN); END_STATE(); case 84: - ACCEPT_TOKEN(ts_builtin_sym_end); + ACCEPT_TOKEN(anon_sym_COLONplatform); END_STATE(); case 85: - ACCEPT_TOKEN(aux_sym_test_token1); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'a') ADVANCE(89); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('b' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 86: - ACCEPT_TOKEN(aux_sym_test_token1); - if (lookahead == '-') ADVANCE(8); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'a') ADVANCE(98); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('b' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 87: - ACCEPT_TOKEN(aux_sym_header_token1); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'a') ADVANCE(119); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('b' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 88: - ACCEPT_TOKEN(aux_sym_header_token1); - if (lookahead == 'e') ADVANCE(65); - if (lookahead == 'f') ADVANCE(10); - if (lookahead == 'l') ADVANCE(11); - if (lookahead == 'p') ADVANCE(44); - if (lookahead == 's') ADVANCE(41); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'b') ADVANCE(121); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 89: - ACCEPT_TOKEN(sym_skip); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'c') ADVANCE(110); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 90: - ACCEPT_TOKEN(sym_error); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'd') ADVANCE(127); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 91: - ACCEPT_TOKEN(sym_fail_fast); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'd') ADVANCE(118); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 92: - ACCEPT_TOKEN(anon_sym_COLONlanguage); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'd') ADVANCE(112); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 93: - ACCEPT_TOKEN(anon_sym_LPAREN); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'e') ADVANCE(122); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 94: - ACCEPT_TOKEN(anon_sym_RPAREN); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'e') ADVANCE(88); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 95: - ACCEPT_TOKEN(anon_sym_COLONplatform); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'e') ADVANCE(107); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 96: ACCEPT_TOKEN(sym__lang); + if (lookahead == 'e') ADVANCE(94); if (lookahead == '-' || lookahead == '.' || ('0' <= lookahead && lookahead <= '9') || ('A' <= lookahead && lookahead <= 'Z') || lookahead == '_' || - ('a' <= lookahead && lookahead <= 'z')) ADVANCE(96); + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 97: - ACCEPT_TOKEN(sym__os); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'f') ADVANCE(103); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 98: - ACCEPT_TOKEN(sym__equals); - if (lookahead == '=') ADVANCE(98); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'g') ADVANCE(114); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); END_STATE(); case 99: - ACCEPT_TOKEN(sym__dashes); - if (lookahead == '-') ADVANCE(99); + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'i') ADVANCE(120); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 100: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'i') ADVANCE(106); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 101: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'i') ADVANCE(90); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 102: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'i') ADVANCE(109); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 103: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'l') ADVANCE(126); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 104: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'l') ADVANCE(87); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 105: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'n') ADVANCE(91); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 106: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'n') ADVANCE(123); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 107: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'n') ADVANCE(88); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 108: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'n') ADVANCE(97); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 109: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'n') ADVANCE(92); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 110: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'o') ADVANCE(120); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 111: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'o') ADVANCE(104); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 112: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'o') ADVANCE(124); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 113: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'o') ADVANCE(101); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 114: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'o') ADVANCE(108); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 115: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'p') ADVANCE(95); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 116: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'r') ADVANCE(86); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 117: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'r') ADVANCE(96); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 118: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'r') ADVANCE(113); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 119: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'r') ADVANCE(99); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 120: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 's') ADVANCE(127); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 121: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 's') ADVANCE(90); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 122: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 't') ADVANCE(88); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 123: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'u') ADVANCE(125); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 124: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'w') ADVANCE(120); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 125: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'x') ADVANCE(127); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 126: + ACCEPT_TOKEN(sym__lang); + if (lookahead == 'y') ADVANCE(127); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 127: + ACCEPT_TOKEN(sym__lang); + if (lookahead == '-' || + lookahead == '.' || + ('0' <= lookahead && lookahead <= '9') || + ('A' <= lookahead && lookahead <= 'Z') || + lookahead == '_' || + ('a' <= lookahead && lookahead <= 'z')) ADVANCE(127); + END_STATE(); + case 128: + ACCEPT_TOKEN(sym__os); + END_STATE(); + case 129: + ACCEPT_TOKEN(sym__eol); + END_STATE(); + case 130: + ACCEPT_TOKEN(sym__eol); + if (lookahead == '\n') ADVANCE(129); END_STATE(); default: return false; @@ -673,364 +1056,416 @@ static bool ts_lex(TSLexer *lexer, TSStateId state) { } static const TSLexMode ts_lex_modes[STATE_COUNT] = { - [0] = {.lex_state = 0}, - [1] = {.lex_state = 0}, - [2] = {.lex_state = 2}, - [3] = {.lex_state = 0}, - [4] = {.lex_state = 0}, - [5] = {.lex_state = 2}, - [6] = {.lex_state = 2}, - [7] = {.lex_state = 0}, - [8] = {.lex_state = 0}, - [9] = {.lex_state = 0}, - [10] = {.lex_state = 0}, - [11] = {.lex_state = 0}, - [12] = {.lex_state = 83}, - [13] = {.lex_state = 83}, - [14] = {.lex_state = 83}, - [15] = {.lex_state = 83}, - [16] = {.lex_state = 3}, - [17] = {.lex_state = 3}, - [18] = {.lex_state = 5}, - [19] = {.lex_state = 3}, - [20] = {.lex_state = 6}, - [21] = {.lex_state = 6}, - [22] = {.lex_state = 6}, + [0] = {.lex_state = 0, .external_lex_state = 1}, + [1] = {.lex_state = 0, .external_lex_state = 2}, + [2] = {.lex_state = 0, .external_lex_state = 3}, + [3] = {.lex_state = 0, .external_lex_state = 3}, + [4] = {.lex_state = 0, .external_lex_state = 3}, + [5] = {.lex_state = 0, .external_lex_state = 3}, + [6] = {.lex_state = 0, .external_lex_state = 3}, + [7] = {.lex_state = 0, .external_lex_state = 3}, + [8] = {.lex_state = 0, .external_lex_state = 3}, + [9] = {.lex_state = 0, .external_lex_state = 3}, + [10] = {.lex_state = 0, .external_lex_state = 2}, + [11] = {.lex_state = 0, .external_lex_state = 2}, + [12] = {.lex_state = 75, .external_lex_state = 2}, + [13] = {.lex_state = 75, .external_lex_state = 2}, + [14] = {.lex_state = 75, .external_lex_state = 2}, + [15] = {.lex_state = 75, .external_lex_state = 4}, + [16] = {.lex_state = 75, .external_lex_state = 4}, + [17] = {.lex_state = 75, .external_lex_state = 2}, + [18] = {.lex_state = 75, .external_lex_state = 4}, + [19] = {.lex_state = 75}, + [20] = {.lex_state = 75}, + [21] = {.lex_state = 75}, + [22] = {.lex_state = 0, .external_lex_state = 3}, [23] = {.lex_state = 7}, - [24] = {.lex_state = 15}, - [25] = {.lex_state = 7}, - [26] = {.lex_state = 7}, - [27] = {.lex_state = 0}, + [24] = {.lex_state = 74}, + [25] = {.lex_state = 0}, + [26] = {.lex_state = 0}, + [27] = {.lex_state = 75}, [28] = {.lex_state = 0}, - [29] = {.lex_state = 7}, - [30] = {.lex_state = 7}, + [29] = {.lex_state = 0}, + [30] = {.lex_state = 0}, }; static const uint16_t ts_parse_table[LARGE_STATE_COUNT][SYMBOL_COUNT] = { [0] = { [ts_builtin_sym_end] = ACTIONS(1), - [aux_sym_header_token1] = ACTIONS(1), - [sym_skip] = ACTIONS(1), - [sym_error] = ACTIONS(1), - [sym_fail_fast] = ACTIONS(1), + [anon_sym_COLONskip] = ACTIONS(1), + [anon_sym_COLONerror] = ACTIONS(1), + [anon_sym_COLONfail_DASHfast] = ACTIONS(1), [anon_sym_COLONlanguage] = ACTIONS(1), [anon_sym_LPAREN] = ACTIONS(1), [anon_sym_RPAREN] = ACTIONS(1), [anon_sym_COLONplatform] = ACTIONS(1), [sym__lang] = ACTIONS(1), - [sym__equals] = ACTIONS(1), + [sym__os] = ACTIONS(1), + [sym__eol] = ACTIONS(1), + [sym__equals_begin] = ACTIONS(1), + [sym__equals_end] = ACTIONS(1), + [sym__dashes] = ACTIONS(1), }, [1] = { - [sym_file] = STATE(27), + [sym_file] = STATE(30), [sym_test] = STATE(10), - [sym_header] = STATE(20), + [sym_header] = STATE(19), [aux_sym_file_repeat1] = STATE(10), [ts_builtin_sym_end] = ACTIONS(3), - [sym__equals] = ACTIONS(5), + [sym__eol] = ACTIONS(5), + [sym__equals_begin] = ACTIONS(7), }, }; static const uint16_t ts_small_parse_table[] = { [0] = 9, - ACTIONS(7), 1, - aux_sym_header_token1, ACTIONS(11), 1, anon_sym_COLONlanguage, ACTIONS(13), 1, anon_sym_COLONplatform, ACTIONS(15), 1, - sym__equals, - STATE(4), 1, - aux_sym_attributes_repeat1, - STATE(5), 1, - aux_sym_header_repeat1, - STATE(28), 1, + sym__eol, + ACTIONS(17), 1, + sym__equals_end, + STATE(6), 1, + sym__platform, + STATE(7), 1, + sym__language, + STATE(22), 1, sym_attributes, - STATE(7), 2, - sym_language, - sym_platform, + STATE(4), 2, + sym_attribute, + aux_sym_attributes_repeat1, ACTIONS(9), 3, - sym_skip, - sym_error, - sym_fail_fast, - [31] = 6, - ACTIONS(20), 1, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, + [31] = 8, + ACTIONS(22), 1, anon_sym_COLONlanguage, - ACTIONS(23), 1, + ACTIONS(25), 1, anon_sym_COLONplatform, - ACTIONS(26), 1, - sym__equals, - STATE(3), 1, + ACTIONS(28), 1, + sym__eol, + ACTIONS(31), 1, + sym__equals_end, + STATE(6), 1, + sym__platform, + STATE(7), 1, + sym__language, + STATE(3), 2, + sym_attribute, aux_sym_attributes_repeat1, - STATE(7), 2, - sym_language, - sym_platform, - ACTIONS(17), 3, - sym_skip, - sym_error, - sym_fail_fast, - [53] = 6, + ACTIONS(19), 3, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, + [59] = 8, ACTIONS(11), 1, anon_sym_COLONlanguage, ACTIONS(13), 1, anon_sym_COLONplatform, - ACTIONS(28), 1, - sym__equals, - STATE(3), 1, + ACTIONS(33), 1, + sym__eol, + ACTIONS(35), 1, + sym__equals_end, + STATE(6), 1, + sym__platform, + STATE(7), 1, + sym__language, + STATE(3), 2, + sym_attribute, aux_sym_attributes_repeat1, - STATE(7), 2, - sym_language, - sym_platform, ACTIONS(9), 3, - sym_skip, - sym_error, - sym_fail_fast, - [75] = 3, - ACTIONS(30), 1, - aux_sym_header_token1, - STATE(5), 1, - aux_sym_header_repeat1, - ACTIONS(33), 6, - sym_skip, - sym_error, - sym_fail_fast, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, + [87] = 1, + ACTIONS(37), 7, + sym__equals_end, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, anon_sym_COLONlanguage, anon_sym_COLONplatform, - sym__equals, - [90] = 2, - ACTIONS(35), 1, - aux_sym_header_token1, - ACTIONS(37), 6, - sym_skip, - sym_error, - sym_fail_fast, + sym__eol, + [97] = 1, + ACTIONS(39), 7, + sym__equals_end, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, anon_sym_COLONlanguage, anon_sym_COLONplatform, - sym__equals, - [102] = 1, - ACTIONS(39), 6, - sym_skip, - sym_error, - sym_fail_fast, + sym__eol, + [107] = 1, + ACTIONS(41), 7, + sym__equals_end, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, anon_sym_COLONlanguage, anon_sym_COLONplatform, - sym__equals, - [111] = 1, - ACTIONS(41), 6, - sym_skip, - sym_error, - sym_fail_fast, + sym__eol, + [117] = 1, + ACTIONS(43), 7, + sym__equals_end, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, anon_sym_COLONlanguage, anon_sym_COLONplatform, - sym__equals, - [120] = 1, - ACTIONS(43), 6, - sym_skip, - sym_error, - sym_fail_fast, + sym__eol, + [127] = 1, + ACTIONS(45), 7, + sym__equals_end, + anon_sym_COLONskip, + anon_sym_COLONerror, + anon_sym_COLONfail_DASHfast, anon_sym_COLONlanguage, anon_sym_COLONplatform, - sym__equals, - [129] = 4, - ACTIONS(5), 1, - sym__equals, - ACTIONS(45), 1, + sym__eol, + [137] = 5, + ACTIONS(7), 1, + sym__equals_begin, + ACTIONS(47), 1, ts_builtin_sym_end, - STATE(20), 1, + ACTIONS(49), 1, + sym__eol, + STATE(19), 1, sym_header, STATE(11), 2, sym_test, aux_sym_file_repeat1, - [143] = 4, - ACTIONS(47), 1, + [154] = 5, + ACTIONS(51), 1, ts_builtin_sym_end, - ACTIONS(49), 1, - sym__equals, - STATE(20), 1, + ACTIONS(53), 1, + sym__eol, + ACTIONS(56), 1, + sym__equals_begin, + STATE(19), 1, sym_header, STATE(11), 2, sym_test, aux_sym_file_repeat1, - [157] = 4, - ACTIONS(52), 1, - ts_builtin_sym_end, - ACTIONS(54), 1, - aux_sym_test_token1, - ACTIONS(56), 1, - sym__equals, - STATE(14), 1, - aux_sym_test_repeat1, - [170] = 4, - ACTIONS(54), 1, - aux_sym_test_token1, - ACTIONS(58), 1, + [171] = 3, + STATE(12), 1, + aux_sym__body, + ACTIONS(59), 2, + sym__equals_begin, ts_builtin_sym_end, - ACTIONS(60), 1, - sym__equals, + ACTIONS(61), 2, + sym__line, + sym__eol, + [183] = 3, STATE(12), 1, - aux_sym_test_repeat1, - [183] = 4, - ACTIONS(62), 1, + aux_sym__body, + ACTIONS(64), 2, + sym__equals_begin, ts_builtin_sym_end, - ACTIONS(64), 1, - aux_sym_test_token1, - ACTIONS(67), 1, - sym__equals, - STATE(14), 1, - aux_sym_test_repeat1, - [196] = 2, - ACTIONS(69), 1, + ACTIONS(66), 2, + sym__line, + sym__eol, + [195] = 3, + STATE(13), 1, + aux_sym__body, + ACTIONS(66), 2, + sym__line, + sym__eol, + ACTIONS(68), 2, + sym__equals_begin, ts_builtin_sym_end, - ACTIONS(71), 2, - aux_sym_test_token1, - sym__equals, - [204] = 3, - ACTIONS(73), 1, - aux_sym_test_token1, - ACTIONS(75), 1, - sym__dashes, - STATE(17), 1, - aux_sym_test_repeat1, - [214] = 3, - ACTIONS(67), 1, + [207] = 3, + ACTIONS(72), 1, sym__dashes, - ACTIONS(77), 1, - aux_sym_test_token1, - STATE(17), 1, - aux_sym_test_repeat1, - [224] = 2, - ACTIONS(80), 1, - aux_sym_header_token1, - STATE(2), 1, - aux_sym_header_repeat1, - [231] = 1, - ACTIONS(71), 2, - aux_sym_test_token1, + STATE(16), 1, + aux_sym__body, + ACTIONS(70), 2, + sym__line, + sym__eol, + [218] = 3, + ACTIONS(59), 1, sym__dashes, - [236] = 2, - ACTIONS(82), 1, - aux_sym_test_token1, STATE(16), 1, - aux_sym_test_repeat1, - [243] = 1, - ACTIONS(84), 1, - aux_sym_test_token1, - [247] = 1, - ACTIONS(86), 1, - aux_sym_test_token1, - [251] = 1, - ACTIONS(88), 1, - sym__lang, + aux_sym__body, + ACTIONS(74), 2, + sym__line, + sym__eol, + [229] = 1, + ACTIONS(77), 4, + sym__equals_begin, + ts_builtin_sym_end, + sym__line, + sym__eol, + [236] = 1, + ACTIONS(77), 3, + sym__dashes, + sym__line, + sym__eol, + [242] = 2, + STATE(15), 1, + aux_sym__body, + ACTIONS(70), 2, + sym__line, + sym__eol, + [250] = 1, + ACTIONS(79), 2, + sym__line, + sym__eol, [255] = 1, - ACTIONS(90), 1, + ACTIONS(81), 2, + sym__line, + sym__eol, + [260] = 1, + ACTIONS(83), 1, + sym__equals_end, + [264] = 1, + ACTIONS(85), 1, sym__os, - [259] = 1, - ACTIONS(92), 1, + [268] = 1, + ACTIONS(87), 1, + sym__lang, + [272] = 1, + ACTIONS(89), 1, anon_sym_RPAREN, - [263] = 1, - ACTIONS(94), 1, + [276] = 1, + ACTIONS(91), 1, anon_sym_RPAREN, - [267] = 1, - ACTIONS(96), 1, - ts_builtin_sym_end, - [271] = 1, - ACTIONS(98), 1, - sym__equals, - [275] = 1, - ACTIONS(100), 1, + [280] = 1, + ACTIONS(93), 1, + sym__line, + [284] = 1, + ACTIONS(95), 1, anon_sym_LPAREN, - [279] = 1, - ACTIONS(102), 1, + [288] = 1, + ACTIONS(97), 1, anon_sym_LPAREN, + [292] = 1, + ACTIONS(99), 1, + ts_builtin_sym_end, }; static const uint32_t ts_small_parse_table_map[] = { [SMALL_STATE(2)] = 0, [SMALL_STATE(3)] = 31, - [SMALL_STATE(4)] = 53, - [SMALL_STATE(5)] = 75, - [SMALL_STATE(6)] = 90, - [SMALL_STATE(7)] = 102, - [SMALL_STATE(8)] = 111, - [SMALL_STATE(9)] = 120, - [SMALL_STATE(10)] = 129, - [SMALL_STATE(11)] = 143, - [SMALL_STATE(12)] = 157, - [SMALL_STATE(13)] = 170, - [SMALL_STATE(14)] = 183, - [SMALL_STATE(15)] = 196, - [SMALL_STATE(16)] = 204, - [SMALL_STATE(17)] = 214, - [SMALL_STATE(18)] = 224, - [SMALL_STATE(19)] = 231, - [SMALL_STATE(20)] = 236, - [SMALL_STATE(21)] = 243, - [SMALL_STATE(22)] = 247, - [SMALL_STATE(23)] = 251, - [SMALL_STATE(24)] = 255, - [SMALL_STATE(25)] = 259, - [SMALL_STATE(26)] = 263, - [SMALL_STATE(27)] = 267, - [SMALL_STATE(28)] = 271, - [SMALL_STATE(29)] = 275, - [SMALL_STATE(30)] = 279, + [SMALL_STATE(4)] = 59, + [SMALL_STATE(5)] = 87, + [SMALL_STATE(6)] = 97, + [SMALL_STATE(7)] = 107, + [SMALL_STATE(8)] = 117, + [SMALL_STATE(9)] = 127, + [SMALL_STATE(10)] = 137, + [SMALL_STATE(11)] = 154, + [SMALL_STATE(12)] = 171, + [SMALL_STATE(13)] = 183, + [SMALL_STATE(14)] = 195, + [SMALL_STATE(15)] = 207, + [SMALL_STATE(16)] = 218, + [SMALL_STATE(17)] = 229, + [SMALL_STATE(18)] = 236, + [SMALL_STATE(19)] = 242, + [SMALL_STATE(20)] = 250, + [SMALL_STATE(21)] = 255, + [SMALL_STATE(22)] = 260, + [SMALL_STATE(23)] = 264, + [SMALL_STATE(24)] = 268, + [SMALL_STATE(25)] = 272, + [SMALL_STATE(26)] = 276, + [SMALL_STATE(27)] = 280, + [SMALL_STATE(28)] = 284, + [SMALL_STATE(29)] = 288, + [SMALL_STATE(30)] = 292, }; static const TSParseActionEntry ts_parse_actions[] = { [0] = {.entry = {.count = 0, .reusable = false}}, [1] = {.entry = {.count = 1, .reusable = false}}, RECOVER(), [3] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_file, 0), - [5] = {.entry = {.count = 1, .reusable = true}}, SHIFT(18), - [7] = {.entry = {.count = 1, .reusable = false}}, SHIFT(6), - [9] = {.entry = {.count = 1, .reusable = true}}, SHIFT(7), - [11] = {.entry = {.count = 1, .reusable = true}}, SHIFT(30), - [13] = {.entry = {.count = 1, .reusable = true}}, SHIFT(29), - [15] = {.entry = {.count = 1, .reusable = true}}, SHIFT(21), - [17] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2, .production_id = 5), SHIFT_REPEAT(7), - [20] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2, .production_id = 5), SHIFT_REPEAT(30), - [23] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2, .production_id = 5), SHIFT_REPEAT(29), - [26] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2, .production_id = 5), - [28] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_attributes, 1, .production_id = 3), - [30] = {.entry = {.count = 2, .reusable = false}}, REDUCE(aux_sym_header_repeat1, 2), SHIFT_REPEAT(6), - [33] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_header_repeat1, 2), - [35] = {.entry = {.count = 1, .reusable = false}}, REDUCE(aux_sym_header_repeat1, 1), - [37] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_header_repeat1, 1), - [39] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 1, .production_id = 1), - [41] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_language, 4), - [43] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_platform, 4), - [45] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_file, 1), - [47] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_file_repeat1, 2), - [49] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_file_repeat1, 2), SHIFT_REPEAT(18), - [52] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_test, 4, .production_id = 6), - [54] = {.entry = {.count = 1, .reusable = false}}, SHIFT(15), - [56] = {.entry = {.count = 1, .reusable = false}}, REDUCE(sym_test, 4, .production_id = 6), - [58] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_test, 3, .production_id = 4), - [60] = {.entry = {.count = 1, .reusable = false}}, REDUCE(sym_test, 3, .production_id = 4), - [62] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_test_repeat1, 2), - [64] = {.entry = {.count = 2, .reusable = false}}, REDUCE(aux_sym_test_repeat1, 2), SHIFT_REPEAT(15), - [67] = {.entry = {.count = 1, .reusable = false}}, REDUCE(aux_sym_test_repeat1, 2), - [69] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_test_repeat1, 1), - [71] = {.entry = {.count = 1, .reusable = false}}, REDUCE(aux_sym_test_repeat1, 1), - [73] = {.entry = {.count = 1, .reusable = false}}, SHIFT(19), - [75] = {.entry = {.count = 1, .reusable = false}}, SHIFT(13), - [77] = {.entry = {.count = 2, .reusable = false}}, REDUCE(aux_sym_test_repeat1, 2), SHIFT_REPEAT(19), - [80] = {.entry = {.count = 1, .reusable = true}}, SHIFT(6), - [82] = {.entry = {.count = 1, .reusable = true}}, SHIFT(19), - [84] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_header, 3, .production_id = 2), - [86] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_header, 4, .production_id = 2), - [88] = {.entry = {.count = 1, .reusable = true}}, SHIFT(25), - [90] = {.entry = {.count = 1, .reusable = true}}, SHIFT(26), - [92] = {.entry = {.count = 1, .reusable = true}}, SHIFT(8), - [94] = {.entry = {.count = 1, .reusable = true}}, SHIFT(9), - [96] = {.entry = {.count = 1, .reusable = true}}, ACCEPT_INPUT(), - [98] = {.entry = {.count = 1, .reusable = true}}, SHIFT(22), - [100] = {.entry = {.count = 1, .reusable = true}}, SHIFT(24), - [102] = {.entry = {.count = 1, .reusable = true}}, SHIFT(23), + [5] = {.entry = {.count = 1, .reusable = true}}, SHIFT(10), + [7] = {.entry = {.count = 1, .reusable = true}}, SHIFT(27), + [9] = {.entry = {.count = 1, .reusable = true}}, SHIFT(5), + [11] = {.entry = {.count = 1, .reusable = true}}, SHIFT(29), + [13] = {.entry = {.count = 1, .reusable = true}}, SHIFT(28), + [15] = {.entry = {.count = 1, .reusable = true}}, SHIFT(4), + [17] = {.entry = {.count = 1, .reusable = true}}, SHIFT(20), + [19] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2), SHIFT_REPEAT(5), + [22] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2), SHIFT_REPEAT(29), + [25] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2), SHIFT_REPEAT(28), + [28] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2), SHIFT_REPEAT(3), + [31] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_attributes_repeat1, 2), + [33] = {.entry = {.count = 1, .reusable = true}}, SHIFT(3), + [35] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_attributes, 1), + [37] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_attribute, 1), + [39] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_attribute, 1, .production_id = 3), + [41] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_attribute, 1, .production_id = 2), + [43] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym__language, 4, .production_id = 6), + [45] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym__platform, 4, .production_id = 7), + [47] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_file, 1), + [49] = {.entry = {.count = 1, .reusable = true}}, SHIFT(11), + [51] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym_file_repeat1, 2), + [53] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_file_repeat1, 2), SHIFT_REPEAT(11), + [56] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym_file_repeat1, 2), SHIFT_REPEAT(27), + [59] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym__body, 2), + [61] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym__body, 2), SHIFT_REPEAT(17), + [64] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_test, 4, .production_id = 5), + [66] = {.entry = {.count = 1, .reusable = true}}, SHIFT(17), + [68] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_test, 3, .production_id = 4), + [70] = {.entry = {.count = 1, .reusable = true}}, SHIFT(18), + [72] = {.entry = {.count = 1, .reusable = true}}, SHIFT(14), + [74] = {.entry = {.count = 2, .reusable = true}}, REDUCE(aux_sym__body, 2), SHIFT_REPEAT(18), + [77] = {.entry = {.count = 1, .reusable = true}}, REDUCE(aux_sym__body, 1), + [79] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_header, 3, .production_id = 1), + [81] = {.entry = {.count = 1, .reusable = true}}, REDUCE(sym_header, 4, .production_id = 1), + [83] = {.entry = {.count = 1, .reusable = true}}, SHIFT(21), + [85] = {.entry = {.count = 1, .reusable = true}}, SHIFT(26), + [87] = {.entry = {.count = 1, .reusable = true}}, SHIFT(25), + [89] = {.entry = {.count = 1, .reusable = true}}, SHIFT(8), + [91] = {.entry = {.count = 1, .reusable = true}}, SHIFT(9), + [93] = {.entry = {.count = 1, .reusable = true}}, SHIFT(2), + [95] = {.entry = {.count = 1, .reusable = true}}, SHIFT(23), + [97] = {.entry = {.count = 1, .reusable = true}}, SHIFT(24), + [99] = {.entry = {.count = 1, .reusable = true}}, ACCEPT_INPUT(), +}; + +enum ts_external_scanner_symbol_identifiers { + ts_external_token__equals_begin = 0, + ts_external_token__equals_end = 1, + ts_external_token__dashes = 2, +}; + +static const TSSymbol ts_external_scanner_symbol_map[EXTERNAL_TOKEN_COUNT] = { + [ts_external_token__equals_begin] = sym__equals_begin, + [ts_external_token__equals_end] = sym__equals_end, + [ts_external_token__dashes] = sym__dashes, +}; + +static const bool ts_external_scanner_states[5][EXTERNAL_TOKEN_COUNT] = { + [1] = { + [ts_external_token__equals_begin] = true, + [ts_external_token__equals_end] = true, + [ts_external_token__dashes] = true, + }, + [2] = { + [ts_external_token__equals_begin] = true, + }, + [3] = { + [ts_external_token__equals_end] = true, + }, + [4] = { + [ts_external_token__dashes] = true, + }, }; #ifdef __cplusplus extern "C" { #endif +void *tree_sitter_test_external_scanner_create(void); +void tree_sitter_test_external_scanner_destroy(void *); +bool tree_sitter_test_external_scanner_scan(void *, TSLexer *, const bool *); +unsigned tree_sitter_test_external_scanner_serialize(void *, char *); +void tree_sitter_test_external_scanner_deserialize(void *, const char *, unsigned); + #ifdef TS_PUBLIC #undef TS_PUBLIC #endif @@ -1067,6 +1502,15 @@ TS_PUBLIC const TSLanguage *tree_sitter_test() { .alias_sequences = &ts_alias_sequences[0][0], .lex_modes = ts_lex_modes, .lex_fn = ts_lex, + .external_scanner = { + &ts_external_scanner_states[0][0], + ts_external_scanner_symbol_map, + tree_sitter_test_external_scanner_create, + tree_sitter_test_external_scanner_destroy, + tree_sitter_test_external_scanner_scan, + tree_sitter_test_external_scanner_serialize, + tree_sitter_test_external_scanner_deserialize, + }, .primary_state_ids = ts_primary_state_ids, }; return &language; diff --git a/src/scanner.c b/src/scanner.c new file mode 100644 index 0000000..2eb3c15 --- /dev/null +++ b/src/scanner.c @@ -0,0 +1,104 @@ +#include "tree_sitter/alloc.h" +#include "tree_sitter/parser.h" + +#include +#include + +enum TokenType { + EQUALS_BEGIN, + EQUALS_END, + DASHES, +}; + +// FIXME: support different characters +typedef struct { + uint32_t length; + wchar_t suffix; + bool initialized; +} Scanner; + +#define MIN_LENGTH 3 + +#define at_eol(lexer) ((lexer)->lookahead == '\r' || (lexer)->lookahead == '\n') + +static inline void advance(TSLexer *lexer) { lexer->advance(lexer, false); } + +static inline void skip(TSLexer *lexer) { lexer->advance(lexer, true); } + +static inline bool scan(TSLexer *lexer, Scanner *scanner, char chr, int symbol) { + uint32_t length; + + for (length = 0; !lexer->eof(lexer) && lexer->lookahead == chr; ++length) { + advance(lexer); + } + + if (length < MIN_LENGTH) return false; + + for (length = 0; !lexer->eof(lexer) && !at_eol(lexer); ++length) { + if (symbol == EQUALS_BEGIN && !scanner->initialized) + scanner->suffix = lexer->lookahead; + if (scanner->suffix != lexer->lookahead) + return false; + + advance(lexer); + } + + if (symbol == EQUALS_BEGIN && !scanner->initialized) + scanner->length = length; + + if (scanner->length != length) return symbol == DASHES; + + if (lexer->lookahead == '\r') skip(lexer); + if (lexer->lookahead == '\n') skip(lexer); + + lexer->result_symbol = symbol; + return true; +} + +void *tree_sitter_test_external_scanner_create() { + Scanner *scanner = ts_malloc(sizeof(Scanner)); + scanner->length = 0; + scanner->suffix = '\0'; + scanner->initialized = false; + return scanner; +} + +unsigned tree_sitter_test_external_scanner_serialize(void *payload, char *buffer) { + Scanner *scanner = (Scanner *)payload; + + if (scanner->length + 1 > TREE_SITTER_SERIALIZATION_BUFFER_SIZE) + return 0; + + memset(buffer, true, 1); + memset(buffer + 1, scanner->suffix, scanner->length); + return scanner->length + 1; +} + +void tree_sitter_test_external_scanner_deserialize(void *payload, const char *buffer, uint32_t length) { + if (length == 0) return; + + Scanner *scanner = (Scanner *)payload; + scanner->length = length - 1; + scanner->suffix = buffer[1]; + scanner->initialized = buffer[0]; +} + +bool tree_sitter_test_external_scanner_scan(void *payload, TSLexer *lexer, const bool *valid_symbols) { + Scanner *scanner = (Scanner *)payload; + + if (valid_symbols[EQUALS_BEGIN]) + return scan(lexer, scanner, '=', EQUALS_BEGIN); + + if (valid_symbols[EQUALS_END]) + return scan(lexer, scanner, '=', EQUALS_END); + + if (valid_symbols[DASHES]) + return scan(lexer, scanner, '-', DASHES); + + return false; +} + +void tree_sitter_test_external_scanner_destroy(void *payload) { + Scanner *scanner = (Scanner *)payload; + ts_free(scanner); +}