local api = vim.api local language = require('vim.treesitter.language') ---@class Query ---@field captures string[] List of captures used in query ---@field info TSQueryInfo Contains used queries, predicates, directives ---@field query userdata Parsed query local Query = {} Query.__index = Query ---@class TSQueryInfo ---@field captures table ---@field patterns table ---@class TSQueryModule local M = {} ---@param files string[] ---@return string[] local function dedupe_files(files) local result = {} ---@type table local seen = {} for _, path in ipairs(files) do if not seen[path] then table.insert(result, path) seen[path] = true end end return result end local function safe_read(filename, read_quantifier) local file, err = io.open(filename, 'r') if not file then error(err) end local content = file:read(read_quantifier) io.close(file) return content end --- Adds {ilang} to {base_langs}, only if {ilang} is different than {lang} --- ---@return boolean true If lang == ilang local function add_included_lang(base_langs, lang, ilang) if lang == ilang then return true end table.insert(base_langs, ilang) return false end ---@deprecated function M.get_query_files(...) vim.deprecate( 'vim.treesitter.query.get_query_files()', 'vim.treesitter.query.get_files()', '0.10' ) return M.get_files(...) end --- Gets the list of files used to make up a query --- ---@param lang string Language to get query for ---@param query_name string Name of the query to load (e.g., "highlights") ---@param is_included (boolean|nil) Internal parameter, most of the time left as `nil` ---@return string[] query_files List of files to load for given query and language function M.get_files(lang, query_name, is_included) local query_path = string.format('queries/%s/%s.scm', lang, query_name) local lang_files = dedupe_files(api.nvim_get_runtime_file(query_path, true)) if #lang_files == 0 then return {} end local base_query = nil ---@type string? local extensions = {} local base_langs = {} ---@type string[] -- Now get the base languages by looking at the first line of every file -- The syntax is the following : -- ;+ inherits: ({language},)*{language} -- -- {language} ::= {lang} | ({lang}) local MODELINE_FORMAT = '^;+%s*inherits%s*:?%s*([a-z_,()]+)%s*$' local EXTENDS_FORMAT = '^;+%s*extends%s*$' for _, filename in ipairs(lang_files) do local file, err = io.open(filename, 'r') if not file then error(err) end local extension = false for modeline in ---@return string function() return file:read('*l') end do if not vim.startswith(modeline, ';') then break end local langlist = modeline:match(MODELINE_FORMAT) if langlist then ---@diagnostic disable-next-line:param-type-mismatch for _, incllang in ipairs(vim.split(langlist, ',', true)) do local is_optional = incllang:match('%(.*%)') if is_optional then if not is_included then if add_included_lang(base_langs, lang, incllang:sub(2, #incllang - 1)) then extension = true end end else if add_included_lang(base_langs, lang, incllang) then extension = true end end end elseif modeline:match(EXTENDS_FORMAT) then extension = true end end if extension then table.insert(extensions, filename) elseif base_query == nil then base_query = filename end io.close(file) end local query_files = {} for _, base_lang in ipairs(base_langs) do local base_files = M.get_files(base_lang, query_name, true) vim.list_extend(query_files, base_files) end vim.list_extend(query_files, { base_query }) vim.list_extend(query_files, extensions) return query_files end ---@param filenames string[] ---@return string local function read_query_files(filenames) local contents = {} for _, filename in ipairs(filenames) do table.insert(contents, safe_read(filename, '*a')) end return table.concat(contents, '') end -- The explicitly set queries from |vim.treesitter.query.set()| ---@type table> local explicit_queries = setmetatable({}, { __index = function(t, k) local lang_queries = {} rawset(t, k, lang_queries) return lang_queries end, }) ---@deprecated function M.set_query(...) vim.deprecate('vim.treesitter.query.set_query()', 'vim.treesitter.query.set()', '0.10') M.set(...) end --- Sets the runtime query named {query_name} for {lang} --- --- This allows users to override any runtime files and/or configuration --- set by plugins. --- ---@param lang string Language to use for the query ---@param query_name string Name of the query (e.g., "highlights") ---@param text string Query text (unparsed). function M.set(lang, query_name, text) explicit_queries[lang][query_name] = M.parse(lang, text) end ---@deprecated function M.get_query(...) vim.deprecate('vim.treesitter.query.get_query()', 'vim.treesitter.query.get()', '0.10') return M.get(...) end --- Returns the runtime query {query_name} for {lang}. --- ---@param lang string Language to use for the query ---@param query_name string Name of the query (e.g. "highlights") --- ---@return Query|nil Parsed query M.get = vim.func._memoize('concat-2', function(lang, query_name) if explicit_queries[lang][query_name] then return explicit_queries[lang][query_name] end local query_files = M.get_files(lang, query_name) local query_string = read_query_files(query_files) if #query_string == 0 then return nil end return M.parse(lang, query_string) end) ---@deprecated function M.parse_query(...) vim.deprecate('vim.treesitter.query.parse_query()', 'vim.treesitter.query.parse()', '0.10') return M.parse(...) end --- Parse {query} as a string. (If the query is in a file, the caller --- should read the contents into a string before calling). --- --- Returns a `Query` (see |lua-treesitter-query|) object which can be used to --- search nodes in the syntax tree for the patterns defined in {query} --- using `iter_*` methods below. --- --- Exposes `info` and `captures` with additional context about {query}. --- - `captures` contains the list of unique capture names defined in --- {query}. --- -` info.captures` also points to `captures`. --- - `info.patterns` contains information about predicates. --- ---@param lang string Language to use for the query ---@param query string Query in s-expr syntax --- ---@return Query Parsed query M.parse = vim.func._memoize('concat-2', function(lang, query) language.add(lang) local self = setmetatable({}, Query) self.query = vim._ts_parse_query(lang, query) self.info = self.query:inspect() self.captures = self.info.captures return self end) ---@deprecated function M.get_range(...) vim.deprecate('vim.treesitter.query.get_range()', 'vim.treesitter.get_range()', '0.10') return vim.treesitter.get_range(...) end ---@deprecated function M.get_node_text(...) vim.deprecate('vim.treesitter.query.get_node_text()', 'vim.treesitter.get_node_text()', '0.10') return vim.treesitter.get_node_text(...) end ---@alias TSMatch table ---@alias TSPredicate fun(match: TSMatch, _, _, predicate: any[]): boolean -- Predicate handler receive the following arguments -- (match, pattern, bufnr, predicate) ---@type table local predicate_handlers = { ['eq?'] = function(match, _, source, predicate) local node = match[predicate[2]] if not node then return true end local node_text = vim.treesitter.get_node_text(node, source) local str ---@type string if type(predicate[3]) == 'string' then -- (#eq? @aa "foo") str = predicate[3] else -- (#eq? @aa @bb) str = vim.treesitter.get_node_text(match[predicate[3]], source) end if node_text ~= str or str == nil then return false end return true end, ['lua-match?'] = function(match, _, source, predicate) local node = match[predicate[2]] if not node then return true end local regex = predicate[3] return string.find(vim.treesitter.get_node_text(node, source), regex) ~= nil end, ['match?'] = (function() local magic_prefixes = { ['\\v'] = true, ['\\m'] = true, ['\\M'] = true, ['\\V'] = true } local function check_magic(str) if string.len(str) < 2 or magic_prefixes[string.sub(str, 1, 2)] then return str end return '\\v' .. str end local compiled_vim_regexes = setmetatable({}, { __index = function(t, pattern) local res = vim.regex(check_magic(pattern)) rawset(t, pattern, res) return res end, }) return function(match, _, source, pred) ---@cast match TSMatch local node = match[pred[2]] if not node then return true end ---@diagnostic disable-next-line no-unknown local regex = compiled_vim_regexes[pred[3]] return regex:match_str(vim.treesitter.get_node_text(node, source)) end end)(), ['contains?'] = function(match, _, source, predicate) local node = match[predicate[2]] if not node then return true end local node_text = vim.treesitter.get_node_text(node, source) for i = 3, #predicate do if string.find(node_text, predicate[i], 1, true) then return true end end return false end, ['any-of?'] = function(match, _, source, predicate) local node = match[predicate[2]] if not node then return true end local node_text = vim.treesitter.get_node_text(node, source) -- Since 'predicate' will not be used by callers of this function, use it -- to store a string set built from the list of words to check against. local string_set = predicate['string_set'] if not string_set then string_set = {} for i = 3, #predicate do ---@diagnostic disable-next-line:no-unknown string_set[predicate[i]] = true end predicate['string_set'] = string_set end return string_set[node_text] end, ['has-ancestor?'] = function(match, _, _, predicate) local node = match[predicate[2]] if not node then return true end local ancestor_types = {} for _, type in ipairs({ unpack(predicate, 3) }) do ancestor_types[type] = true end node = node:parent() while node do if ancestor_types[node:type()] then return true end node = node:parent() end return false end, ['has-parent?'] = function(match, _, _, predicate) local node = match[predicate[2]] if not node then return true end if vim.list_contains({ unpack(predicate, 3) }, node:parent():type()) then return true end return false end, } -- As we provide lua-match? also expose vim-match? predicate_handlers['vim-match?'] = predicate_handlers['match?'] ---@class TSMetadata ---@field range? Range ---@field conceal? string ---@field [integer] TSMetadata ---@field [string] integer|string ---@alias TSDirective fun(match: TSMatch, _, _, predicate: (string|integer)[], metadata: TSMetadata) -- Predicate handler receive the following arguments -- (match, pattern, bufnr, predicate) -- Directives store metadata or perform side effects against a match. -- Directives should always end with a `!`. -- Directive handler receive the following arguments -- (match, pattern, bufnr, predicate, metadata) ---@type table local directive_handlers = { ['set!'] = function(_, _, _, pred, metadata) if #pred >= 3 and type(pred[2]) == 'number' then -- (#set! @capture key value) local capture_id, key, value = pred[2], pred[3], pred[4] if not metadata[capture_id] then metadata[capture_id] = {} end metadata[capture_id][key] = value else -- (#set! key value) local key, value = pred[2], pred[3] metadata[key] = value or true end end, -- Shifts the range of a node. -- Example: (#offset! @_node 0 1 0 -1) ['offset!'] = function(match, _, _, pred, metadata) ---@cast pred integer[] local capture_id = pred[2] if not metadata[capture_id] then metadata[capture_id] = {} end local range = metadata[capture_id].range or { match[capture_id]:range() } local start_row_offset = pred[3] or 0 local start_col_offset = pred[4] or 0 local end_row_offset = pred[5] or 0 local end_col_offset = pred[6] or 0 range[1] = range[1] + start_row_offset range[2] = range[2] + start_col_offset range[3] = range[3] + end_row_offset range[4] = range[4] + end_col_offset -- If this produces an invalid range, we just skip it. if range[1] < range[3] or (range[1] == range[3] and range[2] <= range[4]) then metadata[capture_id].range = range end end, -- Transform the content of the node -- Example: (#gsub! @_node ".*%.(.*)" "%1") ['gsub!'] = function(match, _, bufnr, pred, metadata) assert(#pred == 4) local id = pred[2] assert(type(id) == 'number') local node = match[id] local text = vim.treesitter.get_node_text(node, bufnr, { metadata = metadata[id] }) or '' if not metadata[id] then metadata[id] = {} end local pattern, replacement = pred[3], pred[4] assert(type(pattern) == 'string') assert(type(replacement) == 'string') metadata[id].text = text:gsub(pattern, replacement) end, -- Trim blank lines from end of the node -- Example: (#trim! @fold) -- TODO(clason): generalize to arbitrary whitespace removal ['trim!'] = function(match, _, bufnr, pred, metadata) local capture_id = pred[2] assert(type(capture_id) == 'number') local node = match[capture_id] if not node then return end local start_row, start_col, end_row, end_col = node:range() -- Don't trim if region ends in middle of a line if end_col ~= 0 then return end while end_row >= start_row do -- As we only care when end_col == 0, always inspect one line above end_row. local end_line = api.nvim_buf_get_lines(bufnr, end_row - 1, end_row, true)[1] if end_line ~= '' then break end end_row = end_row - 1 end -- If this produces an invalid range, we just skip it. if start_row < end_row or (start_row == end_row and start_col <= end_col) then metadata[capture_id] = metadata[capture_id] or {} metadata[capture_id].range = { start_row, start_col, end_row, end_col } end end, } --- Adds a new predicate to be used in queries --- ---@param name string Name of the predicate, without leading # ---@param handler function(match:table, pattern:string, bufnr:integer, predicate:string[]) --- - see |vim.treesitter.query.add_directive()| for argument meanings ---@param force boolean|nil function M.add_predicate(name, handler, force) if predicate_handlers[name] and not force then error(string.format('Overriding %s', name)) end predicate_handlers[name] = handler end --- Adds a new directive to be used in queries --- --- Handlers can set match level data by setting directly on the --- metadata object `metadata.key = value`, additionally, handlers --- can set node level data by using the capture id on the --- metadata table `metadata[capture_id].key = value` --- ---@param name string Name of the directive, without leading # ---@param handler function(match:table, pattern:string, bufnr:integer, predicate:string[], metadata:table) --- - match: see |treesitter-query| --- - node-level data are accessible via `match[capture_id]` --- - pattern: see |treesitter-query| --- - predicate: list of strings containing the full directive being called, e.g. --- `(node (#set! conceal "-"))` would get the predicate `{ "#set!", "conceal", "-" }` ---@param force boolean|nil function M.add_directive(name, handler, force) if directive_handlers[name] and not force then error(string.format('Overriding %s', name)) end directive_handlers[name] = handler end --- Lists the currently available directives to use in queries. ---@return string[] List of supported directives. function M.list_directives() return vim.tbl_keys(directive_handlers) end --- Lists the currently available predicates to use in queries. ---@return string[] List of supported predicates. function M.list_predicates() return vim.tbl_keys(predicate_handlers) end local function xor(x, y) return (x or y) and not (x and y) end local function is_directive(name) return string.sub(name, -1) == '!' end ---@private ---@param match TSMatch ---@param pattern string ---@param source integer|string function Query:match_preds(match, pattern, source) local preds = self.info.patterns[pattern] for _, pred in pairs(preds or {}) do -- Here we only want to return if a predicate DOES NOT match, and -- continue on the other case. This way unknown predicates will not be considered, -- which allows some testing and easier user extensibility (#12173). -- Also, tree-sitter strips the leading # from predicates for us. local pred_name ---@type string local is_not ---@type boolean -- Skip over directives... they will get processed after all the predicates. if not is_directive(pred[1]) then if string.sub(pred[1], 1, 4) == 'not-' then pred_name = string.sub(pred[1], 5) is_not = true else pred_name = pred[1] is_not = false end local handler = predicate_handlers[pred_name] if not handler then error(string.format('No handler for %s', pred[1])) return false end local pred_matches = handler(match, pattern, source, pred) if not xor(is_not, pred_matches) then return false end end end return true end ---@private ---@param match TSMatch ---@param metadata TSMetadata function Query:apply_directives(match, pattern, source, metadata) local preds = self.info.patterns[pattern] for _, pred in pairs(preds or {}) do if is_directive(pred[1]) then local handler = directive_handlers[pred[1]] if not handler then error(string.format('No handler for %s', pred[1])) return end handler(match, pattern, source, pred, metadata) end end end --- Returns the start and stop value if set else the node's range. -- When the node's range is used, the stop is incremented by 1 -- to make the search inclusive. ---@param start integer ---@param stop integer ---@param node TSNode ---@return integer, integer local function value_or_node_range(start, stop, node) if start == nil and stop == nil then local node_start, _, node_stop, _ = node:range() return node_start, node_stop + 1 -- Make stop inclusive end return start, stop end --- Iterate over all captures from all matches inside {node} --- --- {source} is needed if the query contains predicates; then the caller --- must ensure to use a freshly parsed tree consistent with the current --- text of the buffer (if relevant). {start} and {stop} can be used to limit --- matches inside a row range (this is typically used with root node --- as the {node}, i.e., to get syntax highlight matches in the current --- viewport). When omitted, the {start} and {stop} row values are used from the given node. --- --- The iterator returns three values: a numeric id identifying the capture, --- the captured node, and metadata from any directives processing the match. --- The following example shows how to get captures by name: --- --- ```lua --- for id, node, metadata in query:iter_captures(tree:root(), bufnr, first, last) do --- local name = query.captures[id] -- name of the capture in the query --- -- typically useful info about the node: --- local type = node:type() -- type of the captured node --- local row1, col1, row2, col2 = node:range() -- range of the capture --- -- ... use the info here ... --- end --- ``` --- ---@param node TSNode under which the search will occur ---@param source (integer|string) Source buffer or string to extract text from ---@param start integer Starting line for the search ---@param stop integer Stopping line for the search (end-exclusive) --- ---@return (fun(end_line: integer|nil): integer, TSNode, TSMetadata): --- capture id, capture node, metadata function Query:iter_captures(node, source, start, stop) if type(source) == 'number' and source == 0 then source = api.nvim_get_current_buf() end start, stop = value_or_node_range(start, stop, node) local raw_iter = node:_rawquery(self.query, true, start, stop) local function iter(end_line) local capture, captured_node, match = raw_iter() local metadata = {} if match ~= nil then local active = self:match_preds(match, match.pattern, source) match.active = active if not active then if end_line and captured_node:range() > end_line then return nil, captured_node, nil end return iter(end_line) -- tail call: try next match end self:apply_directives(match, match.pattern, source, metadata) end return capture, captured_node, metadata end return iter end --- Iterates the matches of self on a given range. --- --- Iterate over all matches within a {node}. The arguments are the same as --- for |Query:iter_captures()| but the iterated values are different: --- an (1-based) index of the pattern in the query, a table mapping --- capture indices to nodes, and metadata from any directives processing the match. --- If the query has more than one pattern, the capture table might be sparse --- and e.g. `pairs()` method should be used over `ipairs`. --- Here is an example iterating over all captures in every match: --- --- ```lua --- for pattern, match, metadata in cquery:iter_matches(tree:root(), bufnr, first, last) do --- for id, node in pairs(match) do --- local name = query.captures[id] --- -- `node` was captured by the `name` capture in the match --- --- local node_data = metadata[id] -- Node level metadata --- --- -- ... use the info here ... --- end --- end --- ``` --- ---@param node TSNode under which the search will occur ---@param source (integer|string) Source buffer or string to search ---@param start integer Starting line for the search ---@param stop integer Stopping line for the search (end-exclusive) ---@param opts table|nil Options: --- - max_start_depth (integer) if non-zero, sets the maximum start depth --- for each match. This is used to prevent traversing too deep into a tree. --- Requires treesitter >= 0.20.9. --- ---@return (fun(): integer, table, table): pattern id, match, metadata function Query:iter_matches(node, source, start, stop, opts) if type(source) == 'number' and source == 0 then source = api.nvim_get_current_buf() end start, stop = value_or_node_range(start, stop, node) local raw_iter = node:_rawquery(self.query, false, start, stop, opts) ---@cast raw_iter fun(): string, any local function iter() local pattern, match = raw_iter() local metadata = {} if match ~= nil then local active = self:match_preds(match, pattern, source) if not active then return iter() -- tail call: try next match end self:apply_directives(match, pattern, source, metadata) end return pattern, match, metadata end return iter end ---@class QueryLinterOpts ---@field langs (string|string[]|nil) ---@field clear (boolean) --- Lint treesitter queries using installed parser, or clear lint errors. --- --- Use |treesitter-parsers| in runtimepath to check the query file in {buf} for errors: --- --- - verify that used nodes are valid identifiers in the grammar. --- - verify that predicates and directives are valid. --- - verify that top-level s-expressions are valid. --- --- The found diagnostics are reported using |diagnostic-api|. --- By default, the parser used for verification is determined by the containing folder --- of the query file, e.g., if the path ends in `/lua/highlights.scm`, the parser for the --- `lua` language will be used. ---@param buf (integer) Buffer handle ---@param opts (QueryLinterOpts|nil) Optional keyword arguments: --- - langs (string|string[]|nil) Language(s) to use for checking the query. --- If multiple languages are specified, queries are validated for all of them --- - clear (boolean) if `true`, just clear current lint errors function M.lint(buf, opts) if opts and opts.clear then require('vim.treesitter._query_linter').clear(buf) else require('vim.treesitter._query_linter').lint(buf, opts) end end --- Omnifunc for completing node names and predicates in treesitter queries. --- --- Use via --- --- ```lua --- vim.bo.omnifunc = 'v:lua.vim.treesitter.query.omnifunc' --- ``` --- function M.omnifunc(findstart, base) return require('vim.treesitter._query_linter').omnifunc(findstart, base) end --- Opens a live editor to query the buffer you started from. --- --- Can also be shown with *:EditQuery*. --- --- If you move the cursor to a capture name ("@foo"), text matching the capture is highlighted in --- the source buffer. The query editor is a scratch buffer, use `:write` to save it. You can find --- example queries at `$VIMRUNTIME/queries/`. --- --- @param lang? string language to open the query editor for. If omitted, inferred from the current buffer's filetype. function M.edit(lang) require('vim.treesitter.dev').edit_query(lang) end return M