mirror of
				https://github.com/neovim/neovim.git
				synced 2025-11-04 09:44:31 +00:00 
			
		
		
		
	fix(treesitter): return correct match table in iter_captures()
This commit is contained in:
		
				
					committed by
					
						
						Lewis Russell
					
				
			
			
				
	
			
			
			
						parent
						
							c4e1930851
						
					
				
				
					commit
					7d97150084
				
			@@ -1166,7 +1166,7 @@ Query:iter_captures({node}, {source}, {start}, {stop})
 | 
				
			|||||||
                  Defaults to `node:end_()`.
 | 
					                  Defaults to `node:end_()`.
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    Return: ~
 | 
					    Return: ~
 | 
				
			||||||
        (`fun(end_line: integer?): integer, TSNode, vim.treesitter.query.TSMetadata, table<integer,TSNode[]>?`)
 | 
					        (`fun(end_line: integer?): integer, TSNode, vim.treesitter.query.TSMetadata, TSQueryMatch`)
 | 
				
			||||||
        capture id, capture node, metadata, match
 | 
					        capture id, capture node, metadata, match
 | 
				
			||||||
 | 
					
 | 
				
			||||||
                                                        *Query:iter_matches()*
 | 
					                                                        *Query:iter_matches()*
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -32,10 +32,11 @@ local M = {}
 | 
				
			|||||||
---     first n arguments passed to {fn}.
 | 
					---     first n arguments passed to {fn}.
 | 
				
			||||||
---
 | 
					---
 | 
				
			||||||
--- @param fn F Function to memoize.
 | 
					--- @param fn F Function to memoize.
 | 
				
			||||||
 | 
					--- @param strong? boolean Do not use a weak table
 | 
				
			||||||
--- @return F # Memoized version of {fn}
 | 
					--- @return F # Memoized version of {fn}
 | 
				
			||||||
--- @nodoc
 | 
					--- @nodoc
 | 
				
			||||||
function M._memoize(hash, fn)
 | 
					function M._memoize(hash, fn, strong)
 | 
				
			||||||
  return require('vim.func._memoize')(hash, fn)
 | 
					  return require('vim.func._memoize')(hash, fn, strong)
 | 
				
			||||||
end
 | 
					end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
return M
 | 
					return M
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -36,15 +36,19 @@ end
 | 
				
			|||||||
--- @generic F: function
 | 
					--- @generic F: function
 | 
				
			||||||
--- @param hash integer|string|fun(...): any
 | 
					--- @param hash integer|string|fun(...): any
 | 
				
			||||||
--- @param fn F
 | 
					--- @param fn F
 | 
				
			||||||
 | 
					--- @param strong? boolean
 | 
				
			||||||
--- @return F
 | 
					--- @return F
 | 
				
			||||||
return function(hash, fn)
 | 
					return function(hash, fn, strong)
 | 
				
			||||||
  vim.validate({
 | 
					  vim.validate({
 | 
				
			||||||
    hash = { hash, { 'number', 'string', 'function' } },
 | 
					    hash = { hash, { 'number', 'string', 'function' } },
 | 
				
			||||||
    fn = { fn, 'function' },
 | 
					    fn = { fn, 'function' },
 | 
				
			||||||
  })
 | 
					  })
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  ---@type table<any,table<any,any>>
 | 
					  ---@type table<any,table<any,any>>
 | 
				
			||||||
  local cache = setmetatable({}, { __mode = 'kv' })
 | 
					  local cache = {}
 | 
				
			||||||
 | 
					  if not strong then
 | 
				
			||||||
 | 
					    setmetatable(cache, { __mode = 'kv' })
 | 
				
			||||||
 | 
					  end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  hash = resolve_hash(hash)
 | 
					  hash = resolve_hash(hash)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -4,7 +4,7 @@ local Range = require('vim.treesitter._range')
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
local ns = api.nvim_create_namespace('treesitter/highlighter')
 | 
					local ns = api.nvim_create_namespace('treesitter/highlighter')
 | 
				
			||||||
 | 
					
 | 
				
			||||||
---@alias vim.treesitter.highlighter.Iter fun(end_line: integer|nil): integer, TSNode, vim.treesitter.query.TSMetadata, table<integer, TSNode[]>
 | 
					---@alias vim.treesitter.highlighter.Iter fun(end_line: integer|nil): integer, TSNode, vim.treesitter.query.TSMetadata, TSQueryMatch
 | 
				
			||||||
 | 
					
 | 
				
			||||||
---@class (private) vim.treesitter.highlighter.Query
 | 
					---@class (private) vim.treesitter.highlighter.Query
 | 
				
			||||||
---@field private _query vim.treesitter.Query?
 | 
					---@field private _query vim.treesitter.Query?
 | 
				
			||||||
@@ -243,7 +243,7 @@ function TSHighlighter:get_query(lang)
 | 
				
			|||||||
  return self._queries[lang]
 | 
					  return self._queries[lang]
 | 
				
			||||||
end
 | 
					end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
--- @param match table<integer,TSNode[]>
 | 
					--- @param match TSQueryMatch
 | 
				
			||||||
--- @param bufnr integer
 | 
					--- @param bufnr integer
 | 
				
			||||||
--- @param capture integer
 | 
					--- @param capture integer
 | 
				
			||||||
--- @param metadata vim.treesitter.query.TSMetadata
 | 
					--- @param metadata vim.treesitter.query.TSMetadata
 | 
				
			||||||
@@ -256,13 +256,15 @@ local function get_url(match, bufnr, capture, metadata)
 | 
				
			|||||||
    return url
 | 
					    return url
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  if not match or not match[url] then
 | 
					  local captures = match:captures()
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  if not captures[url] then
 | 
				
			||||||
    return
 | 
					    return
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  -- Assume there is only one matching node. If there is more than one, take the URL
 | 
					  -- Assume there is only one matching node. If there is more than one, take the URL
 | 
				
			||||||
  -- from the first.
 | 
					  -- from the first.
 | 
				
			||||||
  local other_node = match[url][1]
 | 
					  local other_node = captures[url][1]
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  return vim.treesitter.get_node_text(other_node, bufnr, {
 | 
					  return vim.treesitter.get_node_text(other_node, bufnr, {
 | 
				
			||||||
    metadata = metadata[url],
 | 
					    metadata = metadata[url],
 | 
				
			||||||
@@ -296,6 +298,10 @@ local function on_line_impl(self, buf, line, is_spell_nav)
 | 
				
			|||||||
    end
 | 
					    end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    if state.iter == nil or state.next_row < line then
 | 
					    if state.iter == nil or state.next_row < line then
 | 
				
			||||||
 | 
					      -- Mainly used to skip over folds
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      -- TODO(lewis6991): Creating a new iterator loses the cached predicate results for query
 | 
				
			||||||
 | 
					      -- matches. Move this logic inside iter_captures() so we can maintain the cache.
 | 
				
			||||||
      state.iter =
 | 
					      state.iter =
 | 
				
			||||||
        state.highlighter_query:query():iter_captures(root_node, self.bufnr, line, root_end_row + 1)
 | 
					        state.highlighter_query:query():iter_captures(root_node, self.bufnr, line, root_end_row + 1)
 | 
				
			||||||
    end
 | 
					    end
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -1,5 +1,6 @@
 | 
				
			|||||||
local api = vim.api
 | 
					local api = vim.api
 | 
				
			||||||
local language = require('vim.treesitter.language')
 | 
					local language = require('vim.treesitter.language')
 | 
				
			||||||
 | 
					local memoize = vim.func._memoize
 | 
				
			||||||
 | 
					
 | 
				
			||||||
local M = {}
 | 
					local M = {}
 | 
				
			||||||
 | 
					
 | 
				
			||||||
@@ -212,7 +213,7 @@ end
 | 
				
			|||||||
---@param query_name string Name of the query (e.g. "highlights")
 | 
					---@param query_name string Name of the query (e.g. "highlights")
 | 
				
			||||||
---
 | 
					---
 | 
				
			||||||
---@return vim.treesitter.Query? : Parsed query. `nil` if no query files are found.
 | 
					---@return vim.treesitter.Query? : Parsed query. `nil` if no query files are found.
 | 
				
			||||||
M.get = vim.func._memoize('concat-2', function(lang, query_name)
 | 
					M.get = memoize('concat-2', function(lang, query_name)
 | 
				
			||||||
  if explicit_queries[lang][query_name] then
 | 
					  if explicit_queries[lang][query_name] then
 | 
				
			||||||
    return explicit_queries[lang][query_name]
 | 
					    return explicit_queries[lang][query_name]
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
@@ -245,7 +246,7 @@ end)
 | 
				
			|||||||
---@return vim.treesitter.Query : Parsed query
 | 
					---@return vim.treesitter.Query : Parsed query
 | 
				
			||||||
---
 | 
					---
 | 
				
			||||||
---@see [vim.treesitter.query.get()]
 | 
					---@see [vim.treesitter.query.get()]
 | 
				
			||||||
M.parse = vim.func._memoize('concat-2', function(lang, query)
 | 
					M.parse = memoize('concat-2', function(lang, query)
 | 
				
			||||||
  language.add(lang)
 | 
					  language.add(lang)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  local ts_query = vim._ts_parse_query(lang, query)
 | 
					  local ts_query = vim._ts_parse_query(lang, query)
 | 
				
			||||||
@@ -812,6 +813,12 @@ local function value_or_node_range(start, stop, node)
 | 
				
			|||||||
  return start, stop
 | 
					  return start, stop
 | 
				
			||||||
end
 | 
					end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					--- @param match TSQueryMatch
 | 
				
			||||||
 | 
					--- @return integer
 | 
				
			||||||
 | 
					local function match_id_hash(_, match)
 | 
				
			||||||
 | 
					  return (match:info())
 | 
				
			||||||
 | 
					end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
--- Iterate over all captures from all matches inside {node}
 | 
					--- Iterate over all captures from all matches inside {node}
 | 
				
			||||||
---
 | 
					---
 | 
				
			||||||
--- {source} is needed if the query contains predicates; then the caller
 | 
					--- {source} is needed if the query contains predicates; then the caller
 | 
				
			||||||
@@ -841,7 +848,7 @@ end
 | 
				
			|||||||
---@param start? integer Starting line for the search. Defaults to `node:start()`.
 | 
					---@param start? integer Starting line for the search. Defaults to `node:start()`.
 | 
				
			||||||
---@param stop? integer Stopping line for the search (end-exclusive). Defaults to `node:end_()`.
 | 
					---@param stop? integer Stopping line for the search (end-exclusive). Defaults to `node:end_()`.
 | 
				
			||||||
---
 | 
					---
 | 
				
			||||||
---@return (fun(end_line: integer|nil): integer, TSNode, vim.treesitter.query.TSMetadata, table<integer,TSNode[]>?):
 | 
					---@return (fun(end_line: integer|nil): integer, TSNode, vim.treesitter.query.TSMetadata, TSQueryMatch):
 | 
				
			||||||
---        capture id, capture node, metadata, match
 | 
					---        capture id, capture node, metadata, match
 | 
				
			||||||
---
 | 
					---
 | 
				
			||||||
---@note Captures are only returned if the query pattern of a specific capture contained predicates.
 | 
					---@note Captures are only returned if the query pattern of a specific capture contained predicates.
 | 
				
			||||||
@@ -854,7 +861,8 @@ function Query:iter_captures(node, source, start, stop)
 | 
				
			|||||||
 | 
					
 | 
				
			||||||
  local cursor = vim._create_ts_querycursor(node, self.query, start, stop, { match_limit = 256 })
 | 
					  local cursor = vim._create_ts_querycursor(node, self.query, start, stop, { match_limit = 256 })
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  local max_match_id = -1
 | 
					  local apply_directives = memoize(match_id_hash, self.apply_directives, true)
 | 
				
			||||||
 | 
					  local match_preds = memoize(match_id_hash, self.match_preds, true)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
  local function iter(end_line)
 | 
					  local function iter(end_line)
 | 
				
			||||||
    local capture, captured_node, match = cursor:next_capture()
 | 
					    local capture, captured_node, match = cursor:next_capture()
 | 
				
			||||||
@@ -863,27 +871,18 @@ function Query:iter_captures(node, source, start, stop)
 | 
				
			|||||||
      return
 | 
					      return
 | 
				
			||||||
    end
 | 
					    end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    local captures --- @type table<integer,TSNode[]>?
 | 
					    if not match_preds(self, match, source) then
 | 
				
			||||||
    local match_id, pattern_index = match:info()
 | 
					      local match_id = match:info()
 | 
				
			||||||
 | 
					 | 
				
			||||||
    local metadata = {}
 | 
					 | 
				
			||||||
 | 
					 | 
				
			||||||
    local preds = self.info.patterns[pattern_index] or {}
 | 
					 | 
				
			||||||
 | 
					 | 
				
			||||||
    if #preds > 0 and match_id > max_match_id then
 | 
					 | 
				
			||||||
      captures = match:captures()
 | 
					 | 
				
			||||||
      max_match_id = match_id
 | 
					 | 
				
			||||||
      if not self:match_preds(match, source) then
 | 
					 | 
				
			||||||
      cursor:remove_match(match_id)
 | 
					      cursor:remove_match(match_id)
 | 
				
			||||||
      if end_line and captured_node:range() > end_line then
 | 
					      if end_line and captured_node:range() > end_line then
 | 
				
			||||||
          return nil, captured_node, nil
 | 
					        return nil, captured_node, nil, nil
 | 
				
			||||||
      end
 | 
					      end
 | 
				
			||||||
      return iter(end_line) -- tail call: try next match
 | 
					      return iter(end_line) -- tail call: try next match
 | 
				
			||||||
    end
 | 
					    end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
      metadata = self:apply_directives(match, source)
 | 
					    local metadata = apply_directives(self, match, source)
 | 
				
			||||||
    end
 | 
					
 | 
				
			||||||
    return capture, captured_node, metadata, captures
 | 
					    return capture, captured_node, metadata, match
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
  return iter
 | 
					  return iter
 | 
				
			||||||
end
 | 
					end
 | 
				
			||||||
@@ -972,6 +971,7 @@ function Query:iter_matches(node, source, start, stop, opts)
 | 
				
			|||||||
      return pattern, old_match, metadata
 | 
					      return pattern, old_match, metadata
 | 
				
			||||||
    end
 | 
					    end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    -- TODO(lewis6991): create a new function that returns {match, metadata}
 | 
				
			||||||
    return pattern, captures, metadata
 | 
					    return pattern, captures, metadata
 | 
				
			||||||
  end
 | 
					  end
 | 
				
			||||||
  return iter
 | 
					  return iter
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -281,8 +281,8 @@ local function filter_decl(line)
 | 
				
			|||||||
  -- M.fun = vim._memoize(function(...)
 | 
					  -- M.fun = vim._memoize(function(...)
 | 
				
			||||||
  --   ->
 | 
					  --   ->
 | 
				
			||||||
  -- function M.fun(...)
 | 
					  -- function M.fun(...)
 | 
				
			||||||
  line = line:gsub('^local (.+) = .*_memoize%([^,]+, function%((.*)%)$', 'local function %1(%2)')
 | 
					  line = line:gsub('^local (.+) = memoize%([^,]+, function%((.*)%)$', 'local function %1(%2)')
 | 
				
			||||||
  line = line:gsub('^(.+) = .*_memoize%([^,]+, function%((.*)%)$', 'function %1(%2)')
 | 
					  line = line:gsub('^(.+) = memoize%([^,]+, function%((.*)%)$', 'function %1(%2)')
 | 
				
			||||||
  return line
 | 
					  return line
 | 
				
			||||||
end
 | 
					end
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 
 | 
				
			|||||||
@@ -696,4 +696,82 @@ void ui_refresh(void)
 | 
				
			|||||||
      '((identifier) @id \n(#eq? @id\n@ok.capture\n))'
 | 
					      '((identifier) @id \n(#eq? @id\n@ok.capture\n))'
 | 
				
			||||||
    )
 | 
					    )
 | 
				
			||||||
  end)
 | 
					  end)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  describe('Query:iter_captures', function()
 | 
				
			||||||
 | 
					    it('includes metadata for all captured nodes #23664', function()
 | 
				
			||||||
 | 
					      insert([[
 | 
				
			||||||
 | 
					        const char *sql = "SELECT * FROM Students WHERE name = 'Robert'); DROP TABLE Students;--";
 | 
				
			||||||
 | 
					      ]])
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      local query = [[
 | 
				
			||||||
 | 
					        (declaration
 | 
				
			||||||
 | 
					          type: (_)
 | 
				
			||||||
 | 
					          declarator: (init_declarator
 | 
				
			||||||
 | 
					            declarator: (pointer_declarator
 | 
				
			||||||
 | 
					              declarator: (identifier)) @_id
 | 
				
			||||||
 | 
					            value: (string_literal
 | 
				
			||||||
 | 
					              (string_content) @injection.content))
 | 
				
			||||||
 | 
					          (#set! injection.language "sql")
 | 
				
			||||||
 | 
					          (#contains? @_id "sql"))
 | 
				
			||||||
 | 
					      ]]
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      local result = exec_lua(
 | 
				
			||||||
 | 
					        [=[
 | 
				
			||||||
 | 
					        local query = vim.treesitter.query.parse("c", ...)
 | 
				
			||||||
 | 
					        local parser = vim.treesitter.get_parser(0, "c")
 | 
				
			||||||
 | 
					        local root = parser:parse()[1]:root()
 | 
				
			||||||
 | 
					        local t = {}
 | 
				
			||||||
 | 
					        for id, node, metadata in query:iter_captures(root, 0) do
 | 
				
			||||||
 | 
					          t[query.captures[id]] = metadata
 | 
				
			||||||
 | 
					        end
 | 
				
			||||||
 | 
					        return t
 | 
				
			||||||
 | 
					      ]=],
 | 
				
			||||||
 | 
					        query
 | 
				
			||||||
 | 
					      )
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      eq({
 | 
				
			||||||
 | 
					        ['_id'] = { ['injection.language'] = 'sql' },
 | 
				
			||||||
 | 
					        ['injection.content'] = { ['injection.language'] = 'sql' },
 | 
				
			||||||
 | 
					      }, result)
 | 
				
			||||||
 | 
					    end)
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					    it('only evaluates predicates once per match', function()
 | 
				
			||||||
 | 
					      insert([[
 | 
				
			||||||
 | 
					        void foo(int x, int y);
 | 
				
			||||||
 | 
					      ]])
 | 
				
			||||||
 | 
					      local query = [[
 | 
				
			||||||
 | 
					        (declaration
 | 
				
			||||||
 | 
					          type: (_)
 | 
				
			||||||
 | 
					          declarator: (function_declarator
 | 
				
			||||||
 | 
					            declarator: (identifier) @function.name
 | 
				
			||||||
 | 
					            parameters: (parameter_list
 | 
				
			||||||
 | 
					              (parameter_declaration
 | 
				
			||||||
 | 
					                type: (_)
 | 
				
			||||||
 | 
					                declarator: (identifier) @argument)))
 | 
				
			||||||
 | 
					          (#eq? @function.name "foo"))
 | 
				
			||||||
 | 
					      ]]
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      local result = exec_lua(
 | 
				
			||||||
 | 
					        [[
 | 
				
			||||||
 | 
					        local query = vim.treesitter.query.parse("c", ...)
 | 
				
			||||||
 | 
					        local match_preds = query.match_preds
 | 
				
			||||||
 | 
					        local called = 0
 | 
				
			||||||
 | 
					        function query:match_preds(...)
 | 
				
			||||||
 | 
					          called = called + 1
 | 
				
			||||||
 | 
					          return match_preds(self, ...)
 | 
				
			||||||
 | 
					        end
 | 
				
			||||||
 | 
					        local parser = vim.treesitter.get_parser(0, "c")
 | 
				
			||||||
 | 
					        local root = parser:parse()[1]:root()
 | 
				
			||||||
 | 
					        local captures = {}
 | 
				
			||||||
 | 
					        for id, node in query:iter_captures(root, 0) do
 | 
				
			||||||
 | 
					          captures[#captures + 1] = id
 | 
				
			||||||
 | 
					        end
 | 
				
			||||||
 | 
					        return { called, captures }
 | 
				
			||||||
 | 
					      ]],
 | 
				
			||||||
 | 
					        query
 | 
				
			||||||
 | 
					      )
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					      eq({ 2, { 1, 1, 2, 2 } }, result)
 | 
				
			||||||
 | 
					    end)
 | 
				
			||||||
 | 
					  end)
 | 
				
			||||||
end)
 | 
					end)
 | 
				
			||||||
 
 | 
				
			|||||||
		Reference in New Issue
	
	Block a user