2021-07-28 18:39:09 +02:00
|
|
|
function is_whitespace(char)
|
|
|
|
return char == " " or char == "\t" or char == "\r" or char == "\n"
|
|
|
|
end
|
|
|
|
|
2021-07-28 18:54:44 +02:00
|
|
|
local function table_map(tbl, func)
|
|
|
|
local result = {}
|
|
|
|
for i,value in ipairs(tbl) do
|
|
|
|
local newval = func(value, i)
|
|
|
|
if newval ~= nil then table.insert(result, newval) end
|
|
|
|
end
|
|
|
|
return result
|
|
|
|
end
|
|
|
|
|
2021-07-28 18:39:09 +02:00
|
|
|
function split_shell(text)
|
|
|
|
local text_length = #text
|
|
|
|
local scan_pos = 1
|
|
|
|
local result = { }
|
|
|
|
local acc = {}
|
|
|
|
local mode = "NORMAL" -- NORMAL, INSIDE_QUOTES_SINGLE, INSIDE_QUOTES_DOUBLE
|
|
|
|
|
|
|
|
|
|
|
|
for i=1,text_length do
|
|
|
|
local prevchar = ""
|
|
|
|
local curchar = text:sub(i,i)
|
|
|
|
local nextchar = ""
|
|
|
|
local nextnextchar = ""
|
|
|
|
if i > 1 then prevchar = text:sub(i-1, i-1) end
|
|
|
|
if i < text_length then nextchar = text:sub(i+1, i+1) end
|
|
|
|
if i+1 < text_length then nextnextchar = text:sub(i+2, i+2) end
|
|
|
|
|
|
|
|
if mode == "NORMAL" then
|
|
|
|
if is_whitespace(curchar) and #acc > 0 then
|
|
|
|
table.insert(result, table.concat(acc, ""))
|
|
|
|
acc = {}
|
|
|
|
elseif (curchar == "\"" or curchar == "'") and #acc == 0 and prevchar ~= "\\" then
|
|
|
|
if curchar == "\"" then
|
|
|
|
mode = "INSIDE_QUOTES_DOUBLE"
|
|
|
|
else
|
|
|
|
mode = "INSIDE_QUOTES_SINGLE"
|
|
|
|
end
|
|
|
|
else
|
|
|
|
table.insert(acc, curchar)
|
|
|
|
end
|
|
|
|
elseif mode == "INSIDE_QUOTES_DOUBLE" then
|
|
|
|
if curchar == "\"" and prevchar ~= "\\" and is_whitespace(nextchar) then
|
|
|
|
-- It's the end of a quote!
|
|
|
|
mode = "NORMAL"
|
2021-07-28 18:49:18 +02:00
|
|
|
elseif (curchar == "\\" and (
|
|
|
|
nextchar ~= "\""
|
|
|
|
or (nextchar == "\"" and not is_whitespace(nextnextchar))
|
|
|
|
)) or curchar ~= "\\" then
|
2021-07-28 18:39:09 +02:00
|
|
|
-- It's a regular character
|
|
|
|
table.insert(acc, curchar)
|
|
|
|
end
|
|
|
|
elseif mode == "INSIDE_QUOTES_SINGLE" then
|
|
|
|
if curchar == "'" and prevchar ~= "\\" and is_whitespace(nextchar) then
|
|
|
|
-- It's the end of a quote!
|
|
|
|
mode = "NORMAL"
|
2021-07-28 18:49:18 +02:00
|
|
|
elseif (curchar == "\\" and (
|
|
|
|
nextchar ~= "'"
|
|
|
|
or (nextchar == "'" and not is_whitespace(nextnextchar))
|
|
|
|
)) or curchar ~= "\\" then
|
2021-07-28 18:39:09 +02:00
|
|
|
-- It's a regular character
|
|
|
|
table.insert(acc, curchar)
|
|
|
|
end
|
|
|
|
end
|
|
|
|
end
|
|
|
|
|
|
|
|
if #acc > 0 then
|
|
|
|
table.insert(result, table.concat(acc, ""))
|
|
|
|
end
|
2021-07-28 18:54:44 +02:00
|
|
|
|
|
|
|
-- Unwind all escapes by 1 level
|
|
|
|
return table_map(result, function(str)
|
|
|
|
return str:gsub("\\([\"'\\])", "%1")
|
|
|
|
end)
|
2021-07-28 18:39:09 +02:00
|
|
|
end
|
|
|
|
|
|
|
|
function test(text)
|
|
|
|
print("Source", text)
|
|
|
|
for i,value in ipairs(split_shell(text)) do
|
|
|
|
print("i", i, "→", value)
|
|
|
|
end
|
|
|
|
print("************")
|
|
|
|
end
|
|
|
|
|
|
|
|
test("yay yay yay")
|
|
|
|
test("yay \"yay yay\" yay")
|
|
|
|
test("yay \"yay\\\" yay\" yay")
|
2021-07-28 18:54:44 +02:00
|
|
|
test("yay \"yay 'inside quotes' yay\\\"\" yay")
|
2021-07-28 18:39:09 +02:00
|
|
|
test("yay 'inside quotes' another")
|
2021-07-28 18:49:18 +02:00
|
|
|
test("y\"ay \"yay 'in\\\"side quotes' yay\" y\\\"ay")
|
|
|
|
|
|
|
|
-- for i=1,10000 do
|
|
|
|
-- split_shell("y\"ay \"yay 'in\\\"side quotes' yay\" y\\\"ay")
|
|
|
|
-- end
|