-- mod-version:3
local core = require "core"
local command = require "core.command"
local common = require "core.common"
local config = require "core.config"
local core_syntax = require "core.syntax"
local DocView = require "core.docview"
local Doc = require "core.doc"

-- Indentation settings per document ({ type, size, confirmed }). Keys are
-- weak, so an entry never keeps its document alive on its own.
local cache = setmetatable({}, { __mode = "k" })
-- Comment matchers already built for a syntax, keyed by the syntax table.
local comments_cache = {}
-- Size of the sampling window (counted in non-empty, non-comment lines) used
-- when detecting the indentation of a document.
local auto_detect_max_lines = 150

--- Tells whether the value stored at `idx` is repeated by a direct neighbour.
-- Only positions `idx - 1` and `idx + 1` are compared, so duplicates are only
-- noticed when equal values sit next to each other (e.g. in a sorted list).
-- @param stat array of indentation widths
-- @param idx position to inspect
-- @return true when a neighbour holds the same value, false otherwise
local function indent_occurrences_more_than_once(stat, idx)
  local value = stat[idx]
  local before, after = stat[idx - 1], stat[idx + 1]
  if before and before == value then
    return true
  end
  if after and after == value then
    return true
  end
  return false
end

--- Picks the indentation width that best explains the sampled lines.
-- `stat` is sorted in place, widest sample first, and candidates are tried in
-- that order. A candidate earns one point for every other sample that is an
-- exact multiple of it. It is rejected (score reset to 0) as soon as a
-- narrower sample is found that is either repeated next to itself in the
-- sorted list, or is the last (narrowest) sample and wider than one column.
-- The first candidate that ends with a positive score is returned.
-- @param stat array of leading-space counts, one entry per sampled line
-- @return the chosen width (nil when no candidate qualified) and its score
local function optimal_indent_from_stat(stat)
  if #stat == 0 then return nil, 0 end
  table.sort(stat, function(a, b) return a > b end)
  local count = #stat
  for x = 1, count do
    local indent = stat[x]
    local score = 0
    for y = 1, count do
      if y ~= x and stat[y] % indent == 0 then
        score = score + 1
      elseif
        indent > stat[y]
        and (
          indent_occurrences_more_than_once(stat, y)
          or (y == count and stat[y] > 1)
        )
      then
        -- a narrower width is clearly in use: this candidate is too wide
        score = 0
        break
      end
    end
    -- the widest candidate with any support wins, no need to look further
    if score > 0 then
      return indent, score
    end
  end
  return nil, 0
end

--- Escapes a literal comment token so it can be embedded in a Lua pattern.
-- Each of the characters `* - % [ ] . ( ) + ? ^ $` is prefixed with `%`;
-- every other character is copied unchanged.
-- @param token literal comment marker, e.g. "--" or "/*"
-- @return the token with the characters listed above escaped
local function escape_comment_tokens(token)
  -- The outer parentheses drop gsub's second result (the replacement count).
  return (token:gsub("[%*%-%%%[%]%.%(%)%+%?%^%$]", "%%%0"))
end

--- Anchors a comment opener to the start of a line, allowing leading
-- whitespace. A leading "^" already present in `opener` is dropped first so
-- the result carries a single anchor.
-- @param opener Lua pattern or regex source that opens a comment
-- @param prefix "^%s*" for Lua patterns, "^\\s*" for regexes
-- @return prefix followed by the opener without its own leading "^"
local function anchor_comment_start(opener, prefix)
  if opener:sub(1, 1) == "^" then
    opener = opener:sub(2)
  end
  return prefix .. opener
end

--- Collects the comment and string matchers declared by a syntax.
-- Each entry of the returned list has one of these shapes:
--   {"p", start [, stop]}                 Lua patterns
--   {"r", start [, stop], r = source}     compiled regexes; `r` keeps the
--                                         source text of the start regex
-- Single-line comments get their start anchored to the beginning of the line
-- (leading whitespace allowed). Start/stop pairs of type "string" are kept
-- unanchored; single-pattern strings are ignored. Patterns that embed another
-- syntax contribute that syntax's matchers. When the pattern list yields
-- nothing, `syntax.comment` and `syntax.block_comment` are used instead.
-- Results are stored in `comments_cache`, including empty ones.
-- NOTE(review): `regex` is not defined in this file; presumably the global
-- regex module provided by the editor.
-- @param syntax syntax table (needs a `patterns` array)
-- @param _loop internal recursion depth, callers leave it out
-- @return list of matchers, or nil when there are none
local function get_comment_patterns(syntax, _loop)
  _loop = _loop or 1
  -- recursion guard: embedded syntaxes are followed at most 5 levels deep
  if _loop > 5 then return end

  local cached = comments_cache[syntax]
  if cached then
    -- an empty cached list means "already analysed, nothing found"
    if #cached > 0 then
      return cached
    end
    return nil
  end

  local comments = {}
  for idx = 1, #syntax.patterns do
    local pattern = syntax.patterns[idx]
    if pattern.type == "comment" or pattern.type == "string" then
      local is_comment = pattern.type == "comment"
      if pattern.pattern then
        local is_pair = type(pattern.pattern) == "table"
        local start = is_pair and pattern.pattern[1] or pattern.pattern
        if is_comment then
          start = anchor_comment_start(start, "^%s*")
        end
        if is_pair then
          table.insert(comments, {"p", start, pattern.pattern[2]})
        elseif is_comment then
          table.insert(comments, {"p", start})
        end
      elseif pattern.regex then
        local is_pair = type(pattern.regex) == "table"
        local start = is_pair and pattern.regex[1] or pattern.regex
        if is_comment then
          start = anchor_comment_start(start, "^\\s*")
        end
        if is_pair then
          table.insert(comments, {
            "r", regex.compile(start), regex.compile(pattern.regex[2]), r=start
          })
        elseif is_comment then
          table.insert(comments, {"r", regex.compile(start), r=start})
        end
      end
    elseif pattern.syntax then
      -- embedded syntax: either given inline or looked up by file extension
      local subsyntax = type(pattern.syntax) == 'table' and pattern.syntax
        or core_syntax.get("file"..pattern.syntax, "")
      local sub_comments = get_comment_patterns(subsyntax, _loop + 1)
      if sub_comments then
        for s = 1, #sub_comments do
          table.insert(comments, sub_comments[s])
        end
      end
    end
  end

  if #comments == 0 then
    -- nothing usable in the patterns: fall back to the declared comment tokens
    local single_line_comment = syntax.comment
      and escape_comment_tokens(syntax.comment) or nil
    local block_comment = nil
    if syntax.block_comment then
      block_comment = {
        escape_comment_tokens(syntax.block_comment[1]),
        escape_comment_tokens(syntax.block_comment[2])
      }
    end
    if single_line_comment then
      table.insert(comments, {"p", "^%s*" .. single_line_comment})
    end
    if block_comment then
      table.insert(comments, {"p", "^%s*" .. block_comment[1], block_comment[2]})
    end
  end

  -- An entry counts as a comment when its start carries the whitespace anchor
  -- added above (plain-text search for the literal prefix).
  local function is_anchored(entry)
    if entry[1] == "p" then
      return string.find(entry[2], "^%s*", 1, true) ~= nil
    elseif entry[1] == "r" then
      return string.find(entry["r"], "^\\s*", 1, true) ~= nil
    end
    return false
  end

  -- Put comments first and strings last
  table.sort(comments, function(c1, c2)
    local comment1, comment2 = is_anchored(c1), is_anchored(c2)
    return comment1 and not comment2
  end)

  comments_cache[syntax] = comments
  if #comments > 0 then
    return comments
  end
  return nil
end

--- Iterates over the lines that are neither blank nor part of a comment.
-- Returns a coroutine-backed iterator yielding `index, line`, where `index`
-- counts the yielded lines (1, 2, 3, ...) and is not the position in `lines`.
-- Comment detection relies on the matchers from `get_comment_patterns`; when
-- the syntax has none, every non-blank line is yielded.
-- A block is entered when its start matches and its end is not found later on
-- the same line; all lines up to and including the one matching the end are
-- skipped.
-- @param syntax syntax table of the document
-- @param lines array of line strings
-- @return iterator function usable in a generic `for`
local function get_non_empty_lines(syntax, lines)
  return coroutine.wrap(function()
    local comments = get_comment_patterns(syntax)

    local i = 0
    -- terminator of the block currently open (at most one of them is set)
    local end_regex = nil
    local end_pattern = nil
    local inside_comment = false
    for _, line in ipairs(lines) do
      if line:gsub("^%s+", "") ~= "" then
        local is_comment = false
        if comments then
          if not inside_comment then
            for c = 1, #comments do
              local comment = comments[c]
              local is_pattern = comment[1] == "p"
              local start, ending
              if is_pattern then
                start, ending = line:find(comment[2])
              else
                start, ending = regex.find_offsets(
                  comment[2], line, 1, regex.ANCHORED
                )
              end
              if start then
                if not comment[3] then
                  -- single-line matcher
                  is_comment = true
                else
                  -- start/stop pair: look for the stop after the start match
                  local closed
                  if is_pattern then
                    closed = line:find(comment[3], ending+1)
                  else
                    closed = regex.find_offsets(
                      comment[3], line, ending+1, regex.ANCHORED
                    )
                  end
                  if not closed then
                    is_comment = true
                    inside_comment = true
                    if is_pattern then
                      end_pattern = comment[3]
                    else
                      end_regex = comment[3]
                    end
                  end
                end
                -- the first matcher whose start matches decides for this line
                break
              end
            end
          elseif end_pattern and line:find(end_pattern) then
            is_comment = true
            inside_comment = false
            end_pattern = nil
          elseif end_regex and regex.find_offsets(end_regex, line) then
            is_comment = true
            inside_comment = false
            end_regex = nil
          end
        end
        if not is_comment and not inside_comment then
          i = i + 1
          coroutine.yield(i, line)
        end
      end
    end
  end)
end

--- Samples the beginning of a document and guesses its indentation.
-- Lines starting with spaces contribute their leading-space count to the
-- statistics; lines starting with a tab are simply counted.
-- @param doc document; its `syntax` and `lines` fields are read
-- @return "hard" or "soft", the indent size, and the score backing the guess
--         (number of tab-indented lines for "hard", the score returned by
--         optimal_indent_from_stat for "soft")
local function detect_indent_stat(doc)
  local stat = {}
  local tab_count = 0
  local runs = 1
  local max_lines = auto_detect_max_lines
  for i, text in get_non_empty_lines(doc.syntax, doc.lines) do
    local spaces = text:match("^ +")
    if spaces then table.insert(stat, spaces:len()) end
    local tabs = text:match("^\t+")
    if tabs then tab_count = tab_count + 1 end
    if i == max_lines and runs < 5 and #stat == 0 and tab_count == 0 then
      -- nothing indented found so far: extend the window by another
      -- auto_detect_max_lines lines (this can happen at most 4 times)
      max_lines = max_lines + auto_detect_max_lines
      runs = runs + 1
    elseif i > max_lines then
      -- Stop parsing when the file is very long. More lines are not needed
      -- for a heuristic determination.
      break
    end
  end
  local indent, score = optimal_indent_from_stat(stat)
  if tab_count > score then
    return "hard", config.indent_size, tab_count
  else
    return "soft", indent or config.indent_size, score or 0
  end
end

--- Runs the detection for `doc` and records the outcome.
-- A detection backed by a score below 2 is not trusted: the configured
-- defaults (`config.tab_type`, `config.indent_size`) are stored instead and
-- the entry is marked as not confirmed. The same table is stored in `cache`
-- and in `doc.indent_info`.
-- @param doc document to analyse
local function update_cache(doc)
  local indent_type, indent_size, score = detect_indent_stat(doc)
  local score_threshold = 2
  local confirmed = score >= score_threshold
  if not confirmed then
    -- use default values
    indent_type = config.tab_type
    indent_size = config.indent_size
  end
  local info = { type = indent_type, size = indent_size, confirmed = confirmed }
  cache[doc] = info
  doc.indent_info = info
end

-- Keep the original constructor so the override can delegate to it.
local new = Doc.new
--- Wraps `Doc.new`: after the original constructor has run, the indentation
-- of the new document is detected and cached.
function Doc:new(...)
  new(self, ...)
  update_cache(self)
end

-- Keep the original method so the override can delegate to it.
local clean = Doc.clean
--- Wraps `Doc.clean`: after the original has run, the detection is repeated
-- unless the document's indentation is already confirmed (third result of
-- `get_indent_info`).
function Doc:clean(...)
  clean(self, ...)
  local _, _, confirmed = self:get_indent_info()
  if not confirmed then
    update_cache(self)
  end
end

--- Forces the indentation type of a document and marks it as confirmed.
-- The size is taken from the second result of `doc:get_indent_info()`. The
-- same table is stored in `cache` and in `doc.indent_info`.
-- @param doc document to update
-- @param type indentation type to store ("hard" or "soft" at the call sites
--        in this file)
local function set_indent_type(doc, type)
  local _, indent_size = doc:get_indent_info()
  local info = {
    type = type,
    size = indent_size,
    confirmed = true
  }
  cache[doc] = info
  doc.indent_info = info
end

--- Opens the command view to ask for the indent style of `dv.doc`.
-- Only "tabs" and "spaces" (in any letter case) pass validation; "tabs"
-- selects "hard" indentation, anything else selects "soft".
-- @param dv view whose `doc` field is the document to update
local function set_indent_type_command(dv)
  core.command_view:enter("Specify indent style for this file", {
    submit = function(value)
      local doc = dv.doc
      value = value:lower()
      set_indent_type(doc, value == "tabs" and "hard" or "soft")
    end,
    suggest = function(text)
      return common.fuzzy_match({"tabs", "spaces"}, text)
    end,
    validate = function(text)
      local t = text:lower()
      return t == "tabs" or t == "spaces"
    end
  })
end

--- Forces the indentation size of a document and marks it as confirmed.
-- The type is taken from the first result of `doc:get_indent_info()`. The
-- same table is stored in `cache` and in `doc.indent_info`.
-- @param doc document to update
-- @param size indentation size to store
local function set_indent_size(doc, size)
  local indent_type = doc:get_indent_info()
  local info = {
    type = indent_type,
    size = size,
    confirmed = true
  }
  cache[doc] = info
  doc.indent_info = info
end

--- Opens the command view to ask for the indent size of `dv.doc`.
-- Input is accepted when it converts to a number that is at least 1; the
-- submitted value is rounded down to a whole number before being stored.
-- @param dv view whose `doc` field is the document to update
local function set_indent_size_command(dv)
  core.command_view:enter("Specify indent size for current file", {
    submit = function(value)
      value = math.floor(tonumber(value))
      local doc = dv.doc
      set_indent_size(doc, value)
    end,
    validate = function(value)
      value = tonumber(value)
      return value ~= nil and value >= 1
    end
  })
end

-- Prompt-based commands, registered under the "core.docview" predicate.
command.add("core.docview", {
  ["indent:set-file-indent-type"] = set_indent_type_command,
  ["indent:set-file-indent-size"] = set_indent_size_command
})

-- Registered with a predicate that holds when the active view is a DocView
-- whose document is cached with "soft" (spaces) indentation.
command.add(
  function()
    return core.active_view:is(DocView)
      and cache[core.active_view.doc]
      and cache[core.active_view.doc].type == "soft"
  end, {
  ["indent:switch-file-to-tabs-indentation"] = function()
    set_indent_type(core.active_view.doc, "hard")
  end
})

-- Registered with a predicate that holds when the active view is a DocView
-- whose document is cached with "hard" (tabs) indentation.
command.add(
  function()
    return core.active_view:is(DocView)
      and cache[core.active_view.doc]
      and cache[core.active_view.doc].type == "hard"
  end, {
  ["indent:switch-file-to-spaces-indentation"] = function()
    set_indent_type(core.active_view.doc, "soft")
  end
})