mirror of
https://github.com/neovim/neovim.git
synced 2025-02-25 18:55:25 -06:00
feat(treesitter): add filetype -> lang API
Problem: vim.treesitter does not know how to map a specific filetype to a parser. This creates problems since in a few places (including in vim.treesitter itself), the filetype is incorrectly used in place of lang. Solution: Add an API to enable this: - Add vim.treesitter.language.add() as a replacement for vim.treesitter.language.require_language(). - Optional arguments are now passed via an opts table. - Also takes a filetype (or list of filetypes) so we can keep track of what filetypes are associated with which langs. - Deprecated vim.treesitter.language.require_language(). - Add vim.treesitter.language.get_lang() which returns the associated lang for a given filetype. - Add vim.treesitter.language.register() to associate filetypes to a lang without loading the parser.
This commit is contained in:
parent
344a1ee8e6
commit
8714a4009c
@ -164,6 +164,9 @@ The following new APIs or features were added.
|
|||||||
• |vim.treesitter.query.get_node_text()| now accepts a `metadata` option for
|
• |vim.treesitter.query.get_node_text()| now accepts a `metadata` option for
|
||||||
writing custom directives using |vim.treesitter.query.add_directive()|.
|
writing custom directives using |vim.treesitter.query.add_directive()|.
|
||||||
|
|
||||||
|
• |vim.treesitter.language.add()| as a new replacement for
|
||||||
|
`vim.treesitter.language.require_language`.
|
||||||
|
|
||||||
==============================================================================
|
==============================================================================
|
||||||
CHANGED FEATURES *news-changes*
|
CHANGED FEATURES *news-changes*
|
||||||
|
|
||||||
@ -202,6 +205,8 @@ DEPRECATIONS *news-deprecations*
|
|||||||
The following functions are now deprecated and will be removed in the next
|
The following functions are now deprecated and will be removed in the next
|
||||||
release.
|
release.
|
||||||
|
|
||||||
|
• `vim.treesitter.language.require_language()` has been deprecated in favour
|
||||||
|
of |vim.treesitter.language.add()|.
|
||||||
|
|
||||||
|
|
||||||
vim:tw=78:ts=8:sw=2:et:ft=help:norl:
|
vim:tw=78:ts=8:sw=2:et:ft=help:norl:
|
||||||
|
@ -666,6 +666,36 @@ stop({bufnr}) *vim.treesitter.stop()*
|
|||||||
==============================================================================
|
==============================================================================
|
||||||
Lua module: vim.treesitter.language *lua-treesitter-language*
|
Lua module: vim.treesitter.language *lua-treesitter-language*
|
||||||
|
|
||||||
|
add({lang}, {opts}) *vim.treesitter.language.add()*
|
||||||
|
Asserts that a parser for the language {lang} is installed.
|
||||||
|
|
||||||
|
Parsers are searched in the `parser` runtime directory, or the provided
|
||||||
|
{path}
|
||||||
|
|
||||||
|
Parameters: ~
|
||||||
|
• {lang} (string) Language the parser should parse (alphanumerical and
|
||||||
|
`_` only)
|
||||||
|
• {opts} (table|nil) Options:
|
||||||
|
• filetype (string|string[]) Filetype(s) that lang can be
|
||||||
|
parsed with. Note this is not strictly the same as lang
|
||||||
|
since a single lang can parse multiple filetypes. Defaults
|
||||||
|
to lang.
|
||||||
|
• path (string|nil) Optional path the parser is located at
|
||||||
|
• symbol_name (string|nil) Internal symbol name for the
|
||||||
|
language to load
|
||||||
|
• silent (boolean|nil) Don't throw an error if language not
|
||||||
|
found
|
||||||
|
|
||||||
|
Return: ~
|
||||||
|
(boolean) If the specified language is installed
|
||||||
|
|
||||||
|
get_lang({filetype}) *vim.treesitter.language.get_lang()*
|
||||||
|
Parameters: ~
|
||||||
|
• {filetype} (string)
|
||||||
|
|
||||||
|
Return: ~
|
||||||
|
(string|nil)
|
||||||
|
|
||||||
inspect_language({lang}) *vim.treesitter.language.inspect_language()*
|
inspect_language({lang}) *vim.treesitter.language.inspect_language()*
|
||||||
Inspects the provided language.
|
Inspects the provided language.
|
||||||
|
|
||||||
@ -678,24 +708,12 @@ inspect_language({lang}) *vim.treesitter.language.inspect_language()*
|
|||||||
Return: ~
|
Return: ~
|
||||||
(table)
|
(table)
|
||||||
|
|
||||||
*vim.treesitter.language.require_language()*
|
register({lang}, {filetype}) *vim.treesitter.language.register()*
|
||||||
require_language({lang}, {path}, {silent}, {symbol_name})
|
Register a lang to be used for a filetype (or list of filetypes).
|
||||||
Asserts that a parser for the language {lang} is installed.
|
|
||||||
|
|
||||||
Parsers are searched in the `parser` runtime directory, or the provided
|
|
||||||
{path}
|
|
||||||
|
|
||||||
Parameters: ~
|
Parameters: ~
|
||||||
• {lang} (string) Language the parser should parse
|
• {lang} (string) Language to register
|
||||||
(alphanumerical and `_` only)
|
• {filetype} string|string[] Filetype(s) to associate with lang
|
||||||
• {path} (string|nil) Optional path the parser is located at
|
|
||||||
• {silent} (boolean|nil) Don't throw an error if language not
|
|
||||||
found
|
|
||||||
• {symbol_name} (string|nil) Internal symbol name for the language to
|
|
||||||
load
|
|
||||||
|
|
||||||
Return: ~
|
|
||||||
(boolean) If the specified language is installed
|
|
||||||
|
|
||||||
|
|
||||||
==============================================================================
|
==============================================================================
|
||||||
|
@ -29,6 +29,8 @@ setmetatable(M, {
|
|||||||
end,
|
end,
|
||||||
})
|
})
|
||||||
|
|
||||||
|
---@diagnostic disable:invisible
|
||||||
|
|
||||||
--- Creates a new parser
|
--- Creates a new parser
|
||||||
---
|
---
|
||||||
--- It is not recommended to use this; use |get_parser()| instead.
|
--- It is not recommended to use this; use |get_parser()| instead.
|
||||||
@ -39,16 +41,15 @@ setmetatable(M, {
|
|||||||
---
|
---
|
||||||
---@return LanguageTree object to use for parsing
|
---@return LanguageTree object to use for parsing
|
||||||
function M._create_parser(bufnr, lang, opts)
|
function M._create_parser(bufnr, lang, opts)
|
||||||
language.require_language(lang)
|
|
||||||
if bufnr == 0 then
|
if bufnr == 0 then
|
||||||
bufnr = vim.api.nvim_get_current_buf()
|
bufnr = vim.api.nvim_get_current_buf()
|
||||||
end
|
end
|
||||||
|
|
||||||
vim.fn.bufload(bufnr)
|
vim.fn.bufload(bufnr)
|
||||||
|
|
||||||
local self = LanguageTree.new(bufnr, lang, opts)
|
language.add(lang, { filetype = vim.bo[bufnr].filetype })
|
||||||
|
|
||||||
---@diagnostic disable:invisible
|
local self = LanguageTree.new(bufnr, lang, opts)
|
||||||
|
|
||||||
---@private
|
---@private
|
||||||
local function bytes_cb(_, ...)
|
local function bytes_cb(_, ...)
|
||||||
@ -96,13 +97,16 @@ function M.get_parser(bufnr, lang, opts)
|
|||||||
if bufnr == nil or bufnr == 0 then
|
if bufnr == nil or bufnr == 0 then
|
||||||
bufnr = a.nvim_get_current_buf()
|
bufnr = a.nvim_get_current_buf()
|
||||||
end
|
end
|
||||||
|
if lang == nil then
|
||||||
|
local ft = vim.bo[bufnr].filetype
|
||||||
|
lang = language.get_lang(ft) or ft
|
||||||
|
-- TODO(lewis6991): we should error here and not default to ft
|
||||||
|
-- if not lang then
|
||||||
|
-- error(string.format('filetype %s of buffer %d is not associated with any lang', ft, bufnr))
|
||||||
|
-- end
|
||||||
|
end
|
||||||
|
|
||||||
if parsers[bufnr] == nil then
|
if parsers[bufnr] == nil or parsers[bufnr]:lang() ~= lang then
|
||||||
lang = lang or a.nvim_buf_get_option(bufnr, 'filetype')
|
|
||||||
parsers[bufnr] = M._create_parser(bufnr, lang, opts)
|
|
||||||
elseif lang and parsers[bufnr]:lang() ~= lang then
|
|
||||||
-- Only try to create a new parser if lang is provided
|
|
||||||
-- and it doesn't match the stored parser
|
|
||||||
parsers[bufnr] = M._create_parser(bufnr, lang, opts)
|
parsers[bufnr] = M._create_parser(bufnr, lang, opts)
|
||||||
end
|
end
|
||||||
|
|
||||||
@ -123,7 +127,7 @@ function M.get_string_parser(str, lang, opts)
|
|||||||
str = { str, 'string' },
|
str = { str, 'string' },
|
||||||
lang = { lang, 'string' },
|
lang = { lang, 'string' },
|
||||||
})
|
})
|
||||||
language.require_language(lang)
|
language.add(lang)
|
||||||
|
|
||||||
return LanguageTree.new(str, lang, opts)
|
return LanguageTree.new(str, lang, opts)
|
||||||
end
|
end
|
||||||
|
@ -17,7 +17,7 @@ function M.check()
|
|||||||
|
|
||||||
for _, parser in pairs(parsers) do
|
for _, parser in pairs(parsers) do
|
||||||
local parsername = vim.fn.fnamemodify(parser, ':t:r')
|
local parsername = vim.fn.fnamemodify(parser, ':t:r')
|
||||||
local is_loadable, ret = pcall(ts.language.require_language, parsername)
|
local is_loadable, ret = pcall(ts.language.add, parsername)
|
||||||
|
|
||||||
if not is_loadable or not ret then
|
if not is_loadable or not ret then
|
||||||
health.report_error(
|
health.report_error(
|
||||||
|
@ -2,19 +2,66 @@ local a = vim.api
|
|||||||
|
|
||||||
local M = {}
|
local M = {}
|
||||||
|
|
||||||
|
---@type table<string,string>
|
||||||
|
local ft_to_lang = {}
|
||||||
|
|
||||||
|
---@param filetype string
|
||||||
|
---@return string|nil
|
||||||
|
function M.get_lang(filetype)
|
||||||
|
return ft_to_lang[filetype]
|
||||||
|
end
|
||||||
|
|
||||||
|
---@deprecated
|
||||||
|
function M.require_language(lang, path, silent, symbol_name)
|
||||||
|
return M.add(lang, {
|
||||||
|
silent = silent,
|
||||||
|
path = path,
|
||||||
|
symbol_name = symbol_name,
|
||||||
|
})
|
||||||
|
end
|
||||||
|
|
||||||
|
---@class treesitter.RequireLangOpts
|
||||||
|
---@field path? string
|
||||||
|
---@field silent? boolean
|
||||||
|
---@field filetype? string|string[]
|
||||||
|
---@field symbol_name? string
|
||||||
|
|
||||||
--- Asserts that a parser for the language {lang} is installed.
|
--- Asserts that a parser for the language {lang} is installed.
|
||||||
---
|
---
|
||||||
--- Parsers are searched in the `parser` runtime directory, or the provided {path}
|
--- Parsers are searched in the `parser` runtime directory, or the provided {path}
|
||||||
---
|
---
|
||||||
---@param lang string Language the parser should parse (alphanumerical and `_` only)
|
---@param lang string Language the parser should parse (alphanumerical and `_` only)
|
||||||
---@param path (string|nil) Optional path the parser is located at
|
---@param opts (table|nil) Options:
|
||||||
---@param silent (boolean|nil) Don't throw an error if language not found
|
--- - filetype (string|string[]) Filetype(s) that lang can be parsed with.
|
||||||
---@param symbol_name (string|nil) Internal symbol name for the language to load
|
--- Note this is not strictly the same as lang since a single lang can
|
||||||
|
--- parse multiple filetypes.
|
||||||
|
--- Defaults to lang.
|
||||||
|
--- - path (string|nil) Optional path the parser is located at
|
||||||
|
--- - symbol_name (string|nil) Internal symbol name for the language to load
|
||||||
|
--- - silent (boolean|nil) Don't throw an error if language not found
|
||||||
---@return boolean If the specified language is installed
|
---@return boolean If the specified language is installed
|
||||||
function M.require_language(lang, path, silent, symbol_name)
|
function M.add(lang, opts)
|
||||||
|
---@cast opts treesitter.RequireLangOpts
|
||||||
|
opts = opts or {}
|
||||||
|
local path = opts.path
|
||||||
|
local silent = opts.silent
|
||||||
|
local filetype = opts.filetype or lang
|
||||||
|
local symbol_name = opts.symbol_name
|
||||||
|
|
||||||
|
vim.validate({
|
||||||
|
lang = { lang, 'string' },
|
||||||
|
path = { path, 'string', true },
|
||||||
|
silent = { silent, 'boolean', true },
|
||||||
|
symbol_name = { symbol_name, 'string', true },
|
||||||
|
filetype = { filetype, { 'string', 'table' }, true },
|
||||||
|
})
|
||||||
|
|
||||||
|
M.register(lang, filetype or lang)
|
||||||
|
|
||||||
if vim._ts_has_language(lang) then
|
if vim._ts_has_language(lang) then
|
||||||
return true
|
return true
|
||||||
end
|
end
|
||||||
|
|
||||||
if path == nil then
|
if path == nil then
|
||||||
if not (lang and lang:match('[%w_]+') == lang) then
|
if not (lang and lang:match('[%w_]+') == lang) then
|
||||||
if silent then
|
if silent then
|
||||||
@ -35,9 +82,9 @@ function M.require_language(lang, path, silent, symbol_name)
|
|||||||
end
|
end
|
||||||
|
|
||||||
if silent then
|
if silent then
|
||||||
return pcall(function()
|
if not pcall(vim._ts_add_language, path, lang, symbol_name) then
|
||||||
vim._ts_add_language(path, lang, symbol_name)
|
return false
|
||||||
end)
|
end
|
||||||
else
|
else
|
||||||
vim._ts_add_language(path, lang, symbol_name)
|
vim._ts_add_language(path, lang, symbol_name)
|
||||||
end
|
end
|
||||||
@ -45,6 +92,27 @@ function M.require_language(lang, path, silent, symbol_name)
|
|||||||
return true
|
return true
|
||||||
end
|
end
|
||||||
|
|
||||||
|
--- Register a lang to be used for a filetype (or list of filetypes).
|
||||||
|
---@param lang string Language to register
|
||||||
|
---@param filetype string|string[] Filetype(s) to associate with lang
|
||||||
|
function M.register(lang, filetype)
|
||||||
|
vim.validate({
|
||||||
|
lang = { lang, 'string' },
|
||||||
|
filetype = { filetype, { 'string', 'table' } },
|
||||||
|
})
|
||||||
|
|
||||||
|
local filetypes ---@type string[]
|
||||||
|
if type(filetype) == 'string' then
|
||||||
|
filetypes = { filetype }
|
||||||
|
else
|
||||||
|
filetypes = filetype
|
||||||
|
end
|
||||||
|
|
||||||
|
for _, f in ipairs(filetypes) do
|
||||||
|
ft_to_lang[f] = lang
|
||||||
|
end
|
||||||
|
end
|
||||||
|
|
||||||
--- Inspects the provided language.
|
--- Inspects the provided language.
|
||||||
---
|
---
|
||||||
--- Inspecting provides some useful information on the language like node names, ...
|
--- Inspecting provides some useful information on the language like node names, ...
|
||||||
@ -52,7 +120,7 @@ end
|
|||||||
---@param lang string Language
|
---@param lang string Language
|
||||||
---@return table
|
---@return table
|
||||||
function M.inspect_language(lang)
|
function M.inspect_language(lang)
|
||||||
M.require_language(lang)
|
M.add(lang)
|
||||||
return vim._ts_inspect_language(lang)
|
return vim._ts_inspect_language(lang)
|
||||||
end
|
end
|
||||||
|
|
||||||
|
@ -51,7 +51,7 @@ LanguageTree.__index = LanguageTree
|
|||||||
--- query per language.
|
--- query per language.
|
||||||
---@return LanguageTree parser object
|
---@return LanguageTree parser object
|
||||||
function LanguageTree.new(source, lang, opts)
|
function LanguageTree.new(source, lang, opts)
|
||||||
language.require_language(lang)
|
language.add(lang)
|
||||||
---@type LanguageTreeOpts
|
---@type LanguageTreeOpts
|
||||||
opts = opts or {}
|
opts = opts or {}
|
||||||
|
|
||||||
@ -170,7 +170,7 @@ function LanguageTree:parse()
|
|||||||
local seen_langs = {} ---@type table<string,boolean>
|
local seen_langs = {} ---@type table<string,boolean>
|
||||||
|
|
||||||
for lang, injection_ranges in pairs(injections_by_lang) do
|
for lang, injection_ranges in pairs(injections_by_lang) do
|
||||||
local has_lang = language.require_language(lang, nil, true)
|
local has_lang = language.add(lang, { silent = true })
|
||||||
|
|
||||||
-- Child language trees should just be ignored if not found, since
|
-- Child language trees should just be ignored if not found, since
|
||||||
-- they can depend on the text of a node. Intermediate strings
|
-- they can depend on the text of a node. Intermediate strings
|
||||||
|
@ -252,7 +252,7 @@ end)
|
|||||||
---
|
---
|
||||||
---@return Query Parsed query
|
---@return Query Parsed query
|
||||||
function M.parse_query(lang, query)
|
function M.parse_query(lang, query)
|
||||||
language.require_language(lang)
|
language.add(lang)
|
||||||
local cached = query_cache[lang][query]
|
local cached = query_cache[lang][query]
|
||||||
if cached then
|
if cached then
|
||||||
return cached
|
return cached
|
||||||
|
@ -18,22 +18,23 @@ describe('treesitter language API', function()
|
|||||||
|
|
||||||
-- actual message depends on platform
|
-- actual message depends on platform
|
||||||
matches("Failed to load parser for language 'borklang': uv_dlopen: .+",
|
matches("Failed to load parser for language 'borklang': uv_dlopen: .+",
|
||||||
pcall_err(exec_lua, "parser = vim.treesitter.require_language('borklang', 'borkbork.so')"))
|
pcall_err(exec_lua, "parser = vim.treesitter.add('borklang', { path = 'borkbork.so' })"))
|
||||||
|
|
||||||
-- Should not throw an error when silent
|
-- Should not throw an error when silent
|
||||||
eq(false, exec_lua("return vim.treesitter.require_language('borklang', nil, true)"))
|
eq(false, exec_lua("return vim.treesitter.add('borklang', { silent = true })"))
|
||||||
eq(false, exec_lua("return vim.treesitter.require_language('borklang', 'borkbork.so', true)"))
|
|
||||||
|
eq(false, exec_lua("return vim.treesitter.add('borklang', { path = 'borkbork.so', silent = true })"))
|
||||||
|
|
||||||
eq(".../language.lua:0: no parser for 'borklang' language, see :help treesitter-parsers",
|
eq(".../language.lua:0: no parser for 'borklang' language, see :help treesitter-parsers",
|
||||||
pcall_err(exec_lua, "parser = vim.treesitter.inspect_language('borklang')"))
|
pcall_err(exec_lua, "parser = vim.treesitter.inspect_language('borklang')"))
|
||||||
|
|
||||||
matches("Failed to load parser: uv_dlsym: .+",
|
matches("Failed to load parser: uv_dlsym: .+",
|
||||||
pcall_err(exec_lua, 'vim.treesitter.require_language("c", nil, false, "borklang")'))
|
pcall_err(exec_lua, 'vim.treesitter.add("c", { symbol_name = "borklang" })'))
|
||||||
end)
|
end)
|
||||||
|
|
||||||
it('shows error for invalid language name', function()
|
it('shows error for invalid language name', function()
|
||||||
eq(".../language.lua:0: '/foo/' is not a valid language name",
|
eq(".../language.lua:0: '/foo/' is not a valid language name",
|
||||||
pcall_err(exec_lua, 'vim.treesitter.require_language("/foo/", nil, false)'))
|
pcall_err(exec_lua, 'vim.treesitter.add("/foo/", nil, false)'))
|
||||||
end)
|
end)
|
||||||
|
|
||||||
it('inspects language', function()
|
it('inspects language', function()
|
||||||
|
@ -182,8 +182,9 @@ void ui_refresh(void)
|
|||||||
local firstrun = q(1)
|
local firstrun = q(1)
|
||||||
local manyruns = q(100)
|
local manyruns = q(100)
|
||||||
|
|
||||||
|
local factor = is_os('win') and 3 or 4
|
||||||
-- First run should be at least 4x slower.
|
-- First run should be at least 4x slower.
|
||||||
assert(400 * manyruns < firstrun, ('firstrun: %d ms, manyruns: %d ms'):format(firstrun / 1000, manyruns / 1000))
|
assert(factor * 100 * manyruns < firstrun, ('firstrun: %d ms, manyruns: %d ms'):format(firstrun / 1000, manyruns / 1000))
|
||||||
end)
|
end)
|
||||||
|
|
||||||
it('support query and iter by capture', function()
|
it('support query and iter by capture', function()
|
||||||
|
Loading…
Reference in New Issue
Block a user