Skip to content

Commit f40b2ea

Browse files
authored
fix: split function accounting for quotes (#158)
* fix #157: split function accounting for quotes Added Util.splitCSVLine() function that splits a CSV-formatted string into an array of tokens, accounting for quotes (single and double) and escape characters. * fix CI warning Warning: "src/util/Util.lua:263:24: (W311) value assigned to variable sep is unused" * update split function - renamed from splitCSVLine to splitEnhanced, since it's not compliant to RFC 4180 and it could be deceiving; - added optional parameters; - now throws error if quotes are not closed; * update Util.splitEnhanced() - fixed its behaviour to comply with Casbin documentation (see the note at https://casbin.org/docs/policy-storage#loading-policy-from-a-csv-file and issue 886 at casbin/casbin): "If your file contains commas and double quotes, you should enclose the field in double quotes and double any embedded double quotes." Therefore I removed the extra behaviour related to single quotes ' and escape character \ and refactored the function. * added example with double quotes * Unit test for Util.splitEnhanced() * fixed basic with regex example * Update basic_policy_with_regex.csv typo * Unit test for regexMatch with {N,M} quantifier * more unit tests for Util.splitEnhanced - check if the last field is a quoted field - throwing error when there are extra characters after the double quote that closes the quoted field. * Update Util.lua - support for quotes in last field; - throws an exception if there are other characters after the double quote that closes the quoted field. * changed "sep" parameter name to "delim" (uniform to Util.split() ) * changed "line" parameter name to "str" (uniform to Util.split() )
1 parent 24bd8d6 commit f40b2ea

File tree

6 files changed

+149
-1
lines changed

6 files changed

+149
-1
lines changed

examples/basic_model_with_regex.conf

+11
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
[request_definition]
2+
r = sub, obj, act
3+
4+
[policy_definition]
5+
p = sub, obj, act
6+
7+
[policy_effect]
8+
e = some(where (p.eft == allow))
9+
10+
[matchers]
11+
m = regexMatch(r.sub, p.sub) && regexMatch(r.obj, p.obj) && regexMatch(r.act, p.act)

examples/basic_policy_with_regex.csv

+3
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
p, ^admin$, .*, .*
2+
p, ^user.*, "^/users/[a-zA-Z0-9]{4,10}$", PUT|POST|PATCH|GET|OPTIONS
3+
p, ^guest$, ^/guest/.*, GET|OPTIONS

src/persist/Adapter.lua

+1-1
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ function Adapter.loadPolicyLine(line, model)
2828
return
2929
end
3030

31-
local tokens = Util.split(line, ",")
31+
local tokens = Util.splitEnhanced(line, ',', true)
3232
local key = tokens[1]
3333
local sec = key:sub(1, 1)
3434

src/util/Util.lua

+81
Original file line numberDiff line numberDiff line change
@@ -252,4 +252,85 @@ function Util.printTable(t)
252252
return s
253253
end
254254

255+
function Util.isOnlyWhitespaces(str)
256+
return str:match("^%s*$") ~= nil
257+
end
258+
259+
function Util.splitEnhanced(str, delim, trimFields)
260+
local result = {}
261+
local i = 1
262+
local quotedField
263+
local escaping = false
264+
local field = ""
265+
266+
if delim == nil then delim = ',' end
267+
if trimFields == nil then trimFields = true end
268+
269+
-- Loop over the characters of the string
270+
while i <= #str do
271+
local char = str:sub(i, i)
272+
273+
-- Check if it's the first character and it's a double quote.
274+
if Util.isOnlyWhitespaces(field) and char == '"' then
275+
-- Then this field is a quoted field
276+
quotedField = true
277+
else
278+
if quotedField then
279+
if escaping then
280+
-- ", End of quoted field
281+
if char == delim then
282+
if trimFields then
283+
field = Util.trim(field)
284+
end
285+
286+
table.insert(result, field)
287+
field = ""
288+
quotedField = false
289+
-- "" Escapes the double quote character
290+
elseif char == '"' then
291+
field = field .. char
292+
escaping = false
293+
-- " followed by some other character (not allowed)
294+
else
295+
error("Quoted fields cannot have extra characters outside double quotes.")
296+
end
297+
else -- Not escaping
298+
if char == '"' then
299+
escaping = true
300+
else
301+
field = field .. char
302+
end
303+
end
304+
305+
else -- Not quotedField
306+
if char == delim then
307+
if trimFields then
308+
field = Util.trim(field)
309+
end
310+
311+
table.insert(result, field)
312+
field = ""
313+
else
314+
field = field .. char
315+
end
316+
end
317+
end
318+
319+
i = i + 1
320+
end
321+
322+
-- Throw error if there are quotes left open
323+
if quotedField and not escaping then
324+
error("Unmatched quotes.")
325+
end
326+
327+
-- Add the last field (since it won't have the delimiter after it)
328+
if trimFields then
329+
field = Util.trim(field)
330+
end
331+
table.insert(result, field)
332+
333+
return result
334+
end
335+
255336
return Util

tests/main/enforcer_spec.lua

+24
Original file line numberDiff line numberDiff line change
@@ -515,4 +515,28 @@ describe("Enforcer tests", function ()
515515
assert.is.True(e:enforce("bob", "data2", "write"))
516516
assert.is.False(e:enforce("bogus", "data2", "write")) -- Non-existent subject
517517
end)
518+
519+
520+
it("regexMatch test", function ()
521+
522+
local model = path .. "/examples/basic_model_with_regex.conf"
523+
local policy = path .. "/examples/basic_policy_with_regex.csv"
524+
local e = Enforcer:new(model, policy)
525+
526+
assert.is.True(e:enforce("admin", "/", "PUT"))
527+
assert.is.True(e:enforce("admin", "/admin", "GET"))
528+
assert.is.True(e:enforce("admin", "/admin/anything", "POST"))
529+
assert.is.False(e:enforce("admin123", "/admin", "PUT"))
530+
531+
assert.is.True(e:enforce("user", "/users/alice", "GET"))
532+
assert.is.True(e:enforce("user", "/users/alice", "PUT"))
533+
assert.is.True(e:enforce("user123", "/users/alice", "PUT"))
534+
assert.is.False(e:enforce("user", "/users/", "PUT"))
535+
assert.is.False(e:enforce("user", "/users/123", "PUT"))
536+
assert.is.False(e:enforce("user", "/users/alice123456789", "PUT"))
537+
assert.is.False(e:enforce("user", "/admin", "PUT"))
538+
539+
assert.is.True(e:enforce("guest", "/guest/test", "GET"))
540+
assert.is.False(e:enforce("guest", "/guest/test", "PUT"))
541+
end)
518542
end)

tests/util/util_spec.lua

+29
Original file line numberDiff line numberDiff line change
@@ -84,6 +84,35 @@ describe("util tests", function()
8484
assert.are.same({"a", "b", "c"}, Util.split(" a, b ,c ", ","))
8585
end)
8686

87+
it("test isOnlyWhitespaces", function()
88+
assert.is.True(Util.isOnlyWhitespaces(" "))
89+
assert.is.True(Util.isOnlyWhitespaces(""))
90+
assert.is.True(Util.isOnlyWhitespaces("\t\t"))
91+
assert.is.False(Util.isOnlyWhitespaces(" abc"))
92+
assert.is.False(Util.isOnlyWhitespaces("abc\t"))
93+
assert.is.False(Util.isOnlyWhitespaces("\""))
94+
end)
95+
96+
it("test splitEnhanced", function()
97+
assert.are.same({"a", "b", "c"}, Util.splitEnhanced("a ,b ,c", ",", true))
98+
assert.are.same({"a", "b", "c"}, Util.splitEnhanced("a,b,c", ",", true))
99+
assert.are.same({"a", "b", "c"}, Util.splitEnhanced("a, b, c", ",", true))
100+
assert.are.same({"a", "b", "c"}, Util.splitEnhanced(" a, b ,c ", ",", true))
101+
102+
assert.are.same({"a", " b", " c"}, Util.splitEnhanced('a, b, c', ",", false))
103+
assert.are.same({"a", "b", "c"}, Util.splitEnhanced('a,b,c', ",", false))
104+
assert.are.same({" a", "b", "c"}, Util.splitEnhanced(' a,b,c', ",", false))
105+
assert.are.same({"a, b", "c"}, Util.splitEnhanced('"a, b", c', ",", true))
106+
assert.are.same({"a, b", "c"}, Util.splitEnhanced('" a, b", c', ",", true))
107+
assert.are.same({"a == \"b\"", "c"}, Util.splitEnhanced('a == "b", c', ",", true))
108+
assert.are.same({"a == \"b\"", "c"}, Util.splitEnhanced('"a == ""b"" ", c', ",", true))
109+
assert.are.same({"a", "b, c"}, Util.splitEnhanced('a, "b, c"', ",", true))
110+
111+
assert.has_error(function () Util.splitEnhanced('a, "b, c" ', ",", true) end, "Quoted fields cannot have extra characters outside double quotes.")
112+
assert.has_error(function () Util.splitEnhanced('"a, b" hello, c', ",", true) end, "Quoted fields cannot have extra characters outside double quotes.")
113+
assert.has_error(function () Util.splitEnhanced('a, b, "c ') end, "Unmatched quotes.")
114+
end)
115+
87116
it("test isInstance", function()
88117
local parent = {}
89118
parent.__index = parent

0 commit comments

Comments
 (0)