snacks.nvim/lua/snacks/picker/core/matcher.lua

566 lines
15 KiB
Lua

local Async = require("snacks.picker.util.async")
---@class snacks.picker.Item
---@field match_tick? number
---@field match_topk? number
---@class snacks.picker.matcher.Config
---@field regex? boolean used internally for positions of sources that use regex
---@field on_match? fun(matcher: snacks.picker.Matcher, item: snacks.picker.Item)
---@field on_done? fun(matcher: snacks.picker.Matcher)
---@class snacks.picker.Matcher
---@field opts snacks.picker.matcher.Config
---@field mods snacks.picker.matcher.Mods[][]
---@field one? snacks.picker.matcher.Mods
---@field pattern string
---@field tick number
---@field task snacks.picker.Async
---@field live? boolean
---@field score snacks.picker.Score
---@field sorting? boolean
---@field file? {path: string, pos: snacks.picker.Pos}
---@field cwd string
---@field frecency? snacks.picker.Frecency
---@field subset? boolean
local M = {}
M.__index = M
M.DEFAULT_SCORE = 1000
M.INVERSE_SCORE = 1000
local BONUS_FRECENCY = 8
local BONUS_CWD = 10
local YIELD_MATCH = 1 -- ms
---@class snacks.picker.matcher.Mods
---@field pattern string
---@field chars string[]
---@field entropy number higher entropy is less likely to match
---@field field? string
---@field ignorecase? boolean
---@field fuzzy? boolean
---@field regex? boolean
---@field word? boolean
---@field exact_suffix? boolean
---@field exact_prefix? boolean
---@field inverse? boolean
---@param opts? snacks.picker.matcher.Config|{}
function M.new(opts)
local self = setmetatable({}, M)
self.opts = vim.tbl_deep_extend("force", {
fuzzy = true,
smartcase = true,
ignorecase = true,
}, opts or {})
self.pattern = ""
self.task = Async.nop()
self.mods = {}
self.sorting = true
self.tick = 0
self.score = require("snacks.picker.core.score").new(self.opts)
self.frecency = self.opts.frecency and require("snacks.picker.core.frecency").new() or nil
return self
end
function M:empty()
return not next(self.mods)
end
function M:running()
return self.task:running()
end
function M:abort()
self.task:abort()
end
function M:close()
self:abort()
self.task = Async.nop()
end
---@param picker snacks.Picker
function M:run(picker)
self.task:abort()
picker.list:clear()
self.cwd = svim.fs.normalize(picker.opts.cwd or (vim.uv or vim.loop).cwd() or ".")
self.sorting = not self:empty() or picker.opts.matcher.sort_empty
-- PERF: fast path for empty pattern
if not (self.sorting or picker.finder.task:running()) then
picker.list.items = picker.finder.items
picker:update({ force = true })
if self.opts.on_done then
self.opts.on_done(self)
end
return
end
---@async
self.task = Async.new(function()
local yield = Async.yielder(YIELD_MATCH)
---@async
---@param item snacks.picker.Item
local function check(item)
if self:update(item) then
picker.list:add(item, self.sorting)
end
yield()
end
local count = #picker.finder.items
-- process topk first
for i = 1, count do
local item = picker.finder.items[i]
if item.match_topk then
item.match_topk = nil
check(item)
else
item.match_topk = nil
end
end
-- process matches next
for i = 1, count do
local item = picker.finder.items[i]
if item.score > 0 and item.match_tick ~= self.tick then
check(item)
end
end
-- if pattern is a subset of the previous pattern, then
-- only process items that didn't match previously
if self.subset then
for i = 1, count do
local item = picker.finder.items[i]
if item.score == 0 and item.match_tick == self.tick - 1 then
item.match_tick = self.tick
end
end
end
-- then the rest
local idx = 0
repeat
while idx < #picker.finder.items do
idx = idx + 1
local item = picker.finder.items[idx]
if item.match_tick ~= self.tick then
check(item)
end
end
-- suspend till we have more items
if picker.finder.task:running() then
Async.suspend()
end
until idx >= #picker.finder.items and not picker.finder.task:running()
picker:update({ force = true })
if self.opts.on_done then
vim.schedule(function()
self.opts.on_done(self)
end)
end
end)
end
---@param pattern string
---@return boolean changed
function M:init(pattern)
pattern = vim.trim(pattern)
if pattern == self.pattern then
return false
end
self.tick = self.tick + 1
self.file = nil
self.mods = {}
self.subset = self.pattern ~= "" and pattern:find(self.pattern, 1, true) == 1 and not pattern:find("[^%s%w]")
self.pattern = pattern
self:abort()
self.one = nil
if pattern == "" then
return true
end
if self.opts.regex then
self.mods = { { self:_prepare(pattern) } }
else
local is_or = false
for _, p in ipairs(vim.split(pattern, " +")) do
if p == "|" then
is_or = true
else
local mods = self:_prepare(p)
if mods.pattern ~= "" then
if is_or and #self.mods > 0 then
table.insert(self.mods[#self.mods], mods)
else
table.insert(self.mods, { mods })
end
end
is_or = false
end
end
end
for _, ors in ipairs(self.mods) do
-- sort by entropy, lower entropy is more likely to match
table.sort(ors, function(a, b)
return a.entropy < b.entropy
end)
end
-- sort by entropy, higher entropy is less likely to match
table.sort(self.mods, function(a, b)
return a[1].entropy > b[1].entropy
end)
if #self.mods == 1 and #self.mods[1] == 1 then
self.one = self.mods[1][1]
end
return true
end
---@param pattern string
---@return snacks.picker.matcher.Mods
function M:_prepare(pattern)
---@type snacks.picker.matcher.Mods
local mods = { pattern = pattern, entropy = 0, chars = {} }
if self.opts.regex then
mods.regex = true
else
local file_patterns = {
"^(.*[/\\].*):(%d*):(%d*)$",
"^(.*[/\\].*):(%d*)$",
"^(.+%.[a-z_]+):(%d*):(%d*)$",
"^(.+%.[a-z_]+):(%d*)$",
}
for _, p in ipairs(file_patterns) do
local file, line, col = pattern:match(p)
if file then
mods.field = "file"
mods.pattern = file .. "$"
self.file = {
path = file,
pos = { tonumber(line) or 1, tonumber(col) or 0 },
}
break
end
end
-- minimum two chars for field pattern
local field, p = pattern:match("^([%w_][%w_]+):(.*)$")
if field then
mods.field = field
mods.pattern = p
end
mods.ignorecase = self.opts.ignorecase
local is_lower = mods.pattern:lower() == mods.pattern
if self.opts.smartcase then
mods.ignorecase = is_lower
end
mods.fuzzy = self.opts.fuzzy
if not mods.fuzzy then
mods.entropy = mods.entropy + 10
end
if mods.pattern:sub(1, 1) == "!" then
mods.fuzzy, mods.inverse = false, true
mods.pattern = mods.pattern:sub(2)
mods.entropy = mods.entropy - 1
end
if mods.pattern:sub(1, 1) == "'" then
mods.fuzzy = false
mods.pattern = mods.pattern:sub(2)
mods.entropy = mods.entropy + 10
if mods.pattern:sub(-1, -1) == "'" then
mods.word = true
mods.pattern = mods.pattern:sub(1, -2)
mods.entropy = mods.entropy + 10
end
elseif mods.pattern:sub(1, 1) == "^" then
mods.fuzzy, mods.exact_prefix = false, true
mods.pattern = mods.pattern:sub(2)
mods.entropy = mods.entropy + 20
end
if mods.pattern:sub(-1, -1) == "$" then
mods.fuzzy = false
mods.exact_suffix = true
mods.pattern = mods.pattern:sub(1, -2)
mods.entropy = mods.entropy + 20
end
local rare_chars = #mods.pattern:gsub("[%w%s]", "")
mods.entropy = mods.entropy + math.min(#mods.pattern, 20) + rare_chars * 2
if not mods.ignorecase and not is_lower then
mods.entropy = mods.entropy * 2
end
if mods.ignorecase then
mods.pattern = mods.pattern:lower()
end
end
for c = 1, #mods.pattern do
mods.chars[c] = mods.pattern:sub(c, c)
end
return mods
end
---@param item snacks.picker.Item
---@return boolean matched
function M:update(item)
if item.match_pos then
item.pos = nil
end
local score = self:match(item)
item.match_tick, item.match_topk = self.tick, nil
if score ~= 0 then
if item.score_add then
score = score + item.score_add
end
if item.score_mul then
score = score * item.score_mul
end
if self.file and not item.pos then
item.pos = self.file.pos
item.match_pos = true
end
if item.file then
if self.frecency then
item.frecency = item.frecency or self.frecency:get(item)
score = score + (1 - 1 / (1 + item.frecency)) * BONUS_FRECENCY
end
if
self.opts.cwd_bonus
and (self.cwd == item.cwd or Snacks.picker.util.path(item):find(self.cwd, 1, true) == 1)
then
score = score + BONUS_CWD
end
end
item.score = score
if self.opts.on_match then
self.opts.on_match(self, item)
end
else
item.score = 0
end
return score > 0
end
--- Matches an item and returns the score.
--- Score is 0 if no match is found.
---@param item snacks.picker.Item
function M:match(item)
if self:empty() then
return M.DEFAULT_SCORE -- empty pattern matches everything
end
local score, s = 0, nil
-- fast path for single pattern
if self.one then
return self:_match(item, self.one) or 0
end
for _, any in ipairs(self.mods) do
-- fast path for single OR pattern
if #any == 1 then
s = self:_match(item, any[1])
else
for _, mods in ipairs(any) do
s = self:_match(item, mods)
if s then
break
end
end
end
if not s then
return 0
end
score = score + s
end
return score
end
--- Returns the fields that are used in the pattern.
---@return string[]
function M:fields()
local ret = {} ---@type table<string,boolean>
for _, any in ipairs(self.mods) do
for _, mods in ipairs(any) do
ret[mods.field or "text"] = true
end
end
return vim.tbl_keys(ret)
end
--- Returns the positions of the matched pattern in the item.
--- All search patterns are combined with OR.
---@param item snacks.picker.Item
function M:positions(item)
local all = {} ---@type snacks.picker.matcher.Mods[]
local ret = {} ---@type table<string,number[]>
for _, any in ipairs(self.mods) do
vim.list_extend(all, any)
end
for _, mods in ipairs(all) do
local _, from, to, str = self:_match(item, mods)
if from and to and str then
local field = mods.field or "text"
ret[field] = ret[field] or {}
local pos = ret[field]
if mods.fuzzy then
vim.list_extend(pos, self:fuzzy_positions(str, mods.chars, from))
else
for c = from, to do
pos[#pos + 1] = c
end
end
end
end
return ret
end
--- Returns the column of the first position of the matched pattern in the item.
---@param buf number
---@param item snacks.picker.Item
---@return snacks.picker.Pos?
function M:bufpos(buf, item)
if not item.pos then
return
end
local line = vim.api.nvim_buf_get_lines(buf, item.pos[1] - 1, item.pos[1], false)[1] or ""
local positions = self:positions({ text = line, idx = 1, score = 0 }).text or {}
table.sort(positions)
return #positions > 0 and { item.pos[1], positions[1] - 1 } or nil
end
---@param str string
---@param pattern string[]
---@param from number
function M:fuzzy_positions(str, pattern, from)
local ret = { from } ---@type number[]
for i = 2, #pattern do
ret[#ret + 1] = string.find(str, pattern[i], ret[#ret] + 1, true)
end
return ret
end
---@param str string
---@param pattern string
---@return number? score, number? from, number? to, string? str
function M:regex(str, pattern)
local ok, re = pcall(vim.regex, pattern)
if not ok then
return
end
local from, to = re:match_str(str)
if from and to then
from = from + 1
return self.score:get(str, from, to), from, to, str
end
end
---@param item snacks.picker.Item
---@param mods snacks.picker.matcher.Mods
---@return number? score, number? from, number? to, string? str
function M:_match(item, mods)
self.score.is_file = item.file ~= nil
local str = item.text
if mods.regex then
return self:regex(str, mods.pattern)
end
if mods.field then
if item[mods.field] == nil then
if mods.inverse then
return M.INVERSE_SCORE
end
return
end
str = tostring(item[mods.field])
end
local str_orig = str
str = mods.ignorecase and str:lower() or str
local from, to ---@type number?, number?
if mods.fuzzy then
return self:fuzzy(str, mods.chars)
end
if mods.exact_prefix then
if str:sub(1, #mods.pattern) == mods.pattern then
from, to = 1, #mods.pattern
end
elseif mods.exact_suffix then
if str:sub(-#mods.pattern) == mods.pattern then
from, to = #str - #mods.pattern + 1, #str
end
else
from, to = str:find(mods.pattern, 1, true)
-- word match
while mods.word and from and to do
local bound_left = self.score:is_left_boundary(str, from)
local bound_right = self.score:is_right_boundary(str, to)
if bound_left and bound_right then
break
end
from, to = str:find(mods.pattern, to + 1, true)
end
end
if mods.inverse then
if not from then
return M.INVERSE_SCORE
end
return
end
if from then
---@cast to number
return self.score:get(str_orig, from, to), from, to, str
end
end
---@param str string
---@param pattern string[]
---@param init? number
---@return number? from, number? to
function M:fuzzy_find(str, pattern, init)
local from = string.find(str, pattern[1], init or 1, true)
if not from then
return
end
self.score:init(str, from)
---@type number?, number
local last, n = from, #pattern
for i = 2, n do
last = string.find(str, pattern[i], last + 1, true)
if last then
self.score:update(last)
else
return
end
end
return from, last
end
--- Does a forward scan followed by a backward scan for each end position,
--- to find the best match.
---@param str string
---@param pattern string[]
---@return number? score, number? from, number? to, string? str
function M:fuzzy(str, pattern)
local from, to = self:fuzzy_find(str, pattern)
if not from then
return
end
---@cast to number
local best_from, best_to, best_score = from, to, self.score.score
while from do
if self.score.score > best_score then
best_from, best_to, best_score = from, to, self.score.score
end
from, to = self:fuzzy_find(str, pattern, from + 1)
end
return best_score, best_from, best_to, str
end
return M