Skip to content

Commit

Permalink
feat(router) implement groups captures from regex URIs
Browse files Browse the repository at this point in the history
We now perform efficient matching for URIs based on its property and the
regex being evaluated. We favorise running `ngx.re.find` when the more
expensive `ngx.re.match` is not necessary.

When a regex URI has capture groups, we return them from the router
`exec()` for further processing inside the core, which will be
responsible for passing them along to plugins.

This also has the advantage of being more performant on router cache
hits, since URI stripping is done only once, at matching type, and
cached in the LRU structure. The same way, groups matching is cached as
well.

Implements: #677 (partially)
  • Loading branch information
thibaultcha committed Jul 20, 2017
1 parent 5597b7f commit 5ee1d60
Show file tree
Hide file tree
Showing 2 changed files with 203 additions and 29 deletions.
114 changes: 85 additions & 29 deletions kong/core/router.lua
Original file line number Diff line number Diff line change
Expand Up @@ -82,6 +82,15 @@ local match_api
local reduce


local function has_capturing_groups(subj)
local s = find(subj, "[^\\]%(.-[^\\]%)")
s = s or find(subj, "^%(.-[^\\]%)")
s = s or find(subj, "%(%)")

return s ~= nil
end


local function marshall_api(api)
local api_t = {
api = api,
Expand Down Expand Up @@ -172,16 +181,19 @@ local function marshall_api(api)

else
-- regex URI
local strip_regex = uri .. [[/?(?P<stripped_uri>.*)]]
local strip_regex = uri .. [[/?(?P<stripped_uri>.*)]]
local has_captures = has_capturing_groups(uri)

api_t.uris[uri] = {
has_captures = has_captures,
strip_regex = strip_regex,
}

insert(api_t.uris, {
value = uri,
regex = uri,
strip_regex = strip_regex,
value = uri,
regex = uri,
has_captures = has_captures,
strip_regex = strip_regex,
})
end
end
Expand Down Expand Up @@ -319,31 +331,77 @@ do
end,

[MATCH_RULES.URI] = function(api_t, ctx)
local uri = ctx.uri_regex or ctx.uri_prefix or ctx.uri
do
local uri = ctx.uri_regex or ctx.uri_prefix or ctx.uri
local regex_t = api_t.uris[uri]

if regex_t then
if api_t.strip_uri or regex_t.has_captures then
local m, err = re_match(ctx.uri, regex_t.strip_regex, "ajo")
if err then
log(ERR, "could not evaluate URI prefix/regex: ", err)
return
end

if api_t.uris[uri] then
if api_t.strip_uri then
ctx.strip_uri_regex = api_t.uris[uri].strip_regex
end
if m then
if m.stripped_uri then
ctx.stripped_uri = "/" .. m.stripped_uri
-- remove the stripped_uri group
m[#m] = nil
m.stripped_uri = nil
end

return true
if regex_t.has_captures then
m[0] = nil
ctx.uri_captures = m
end

return true
end
end

-- plain or prefix match from the index without strip_uri
return true
end
end

for i = 1, #api_t.uris do
local regex_t = api_t.uris[i]

local from, _, err = re_find(ctx.uri, regex_t.regex, "ajo")
if err then
log(ERR, "could not evaluate URI prefix/regex: ", err)
return
end
if api_t.strip_uri or regex_t.has_captures then
local m, err = re_match(ctx.uri, regex_t.strip_regex, "ajo")
if err then
log(ERR, "could not evaluate URI prefix/regex: ", err)
return
end

if from then
if api_t.strip_uri then
ctx.strip_uri_regex = regex_t.strip_regex
if m then
if m.stripped_uri then
ctx.stripped_uri = "/" .. m.stripped_uri
-- remove the stripped_uri group
m[#m] = nil
m.stripped_uri = nil
end

if regex_t.has_captures then
m[0] = nil
ctx.uri_captures = m
end

return true
end

return true
else
-- prefix match without strip_uri
local from, _, err = re_find(ctx.uri, regex_t.regex, "ajo")
if err then
log(ERR, "could not evaluate URI prefix/regex: ", err)
return
end

if from then
return true
end
end
end
end,
Expand Down Expand Up @@ -445,6 +503,9 @@ end
local _M = {}


_M.has_capturing_groups = has_capturing_groups


function _M.new(apis)
if type(apis) ~= "table" then
return error("expected arg #1 apis to be a table")
Expand Down Expand Up @@ -667,7 +728,8 @@ function _M.new(apis)
cache:set(cache_key, {
api_t = matched_api,
ctx = {
strip_uri_regex = ctx.strip_uri_regex,
stripped_uri = ctx.stripped_uri,
uri_captures = ctx.uri_captures,
}
})

Expand Down Expand Up @@ -717,14 +779,8 @@ function _M.new(apis)

local uri_root = request_uri == "/"

if not uri_root and ctx.strip_uri_regex then
local m, err = re_match(uri, ctx.strip_uri_regex, "ajo")
if not m then
log(ERR, "could not strip URI: ", err)
return
end

uri = "/" .. m.stripped_uri
if not uri_root and api_t.strip_uri and ctx.stripped_uri then
uri = ctx.stripped_uri
end


Expand Down Expand Up @@ -765,7 +821,7 @@ function _M.new(apis)
ngx.header["Kong-Api-Name"] = api_t.api.name
end

return api_t.api, api_t.upstream, host_header, uri
return api_t.api, api_t.upstream, host_header, uri, ctx.uri_captures
end


Expand Down
118 changes: 118 additions & 0 deletions spec/01-unit/010-router_spec.lua
Original file line number Diff line number Diff line change
Expand Up @@ -1176,6 +1176,85 @@ describe("Router", function()
local _, _, _, uri = router.exec(_ngx)
assert.equal("/hello/world", uri)
end)

it("returns groups captures from a [uri regex]", function()
local use_case = {
{
name = "api-1",
uris = { [[/users/(?P<user_id>\d+)/profile/?(?P<scope>[a-z]*)]] },
},
}

local router = assert(Router.new(use_case))

local _ngx = mock_ngx("GET", "/users/1984/profile", {})
local _, _, _, _, uri_captures = router.exec(_ngx)
assert.equal("1984", uri_captures[1])
assert.equal("1984", uri_captures.user_id)
assert.equal("", uri_captures[2])
assert.equal("", uri_captures.scope)
-- no full match
assert.is_nil(uri_captures[0])
-- no stripped_uri capture
assert.is_nil(uri_captures.stripped_uri)
assert.equal(2, #uri_captures)

-- again, this time from the LRU cache
local _, _, _, _, uri_captures = router.exec(_ngx)
assert.equal("1984", uri_captures[1])
assert.equal("1984", uri_captures.user_id)
assert.equal("", uri_captures[2])
assert.equal("", uri_captures.scope)
-- no full match
assert.is_nil(uri_captures[0])
-- no stripped_uri capture
assert.is_nil(uri_captures.stripped_uri)
assert.equal(2, #uri_captures)

local _ngx = mock_ngx("GET", "/users/1984/profile/email", {})
local _, _, _, _, uri_captures = router.exec(_ngx)
assert.equal("1984", uri_captures[1])
assert.equal("1984", uri_captures.user_id)
assert.equal("email", uri_captures[2])
assert.equal("email", uri_captures.scope)
-- no full match
assert.is_nil(uri_captures[0])
-- no stripped_uri capture
assert.is_nil(uri_captures.stripped_uri)
assert.equal(2, #uri_captures)
end)

it("returns no group capture from a [uri prefix] match", function()
local use_case = {
{
name = "api-1",
uris = { "/hello" },
strip_uri = true,
},
}

local router = assert(Router.new(use_case))

local _ngx = mock_ngx("GET", "/hello/world", {})
local _, _, _, uri, uri_captures = router.exec(_ngx)
assert.equal("/world", uri)
assert.is_nil(uri_captures)
end)

it("returns no group capture from a [uri regex] match without groups", function()
local use_case = {
{
name = "api-1",
uris = { [[/users/\d+/profile]] },
},
}

local router = assert(Router.new(use_case))

local _ngx = mock_ngx("GET", "/users/1984/profile", {})
local _, _, _, _, uri_captures = router.exec(_ngx)
assert.is_nil(uri_captures)
end)
end)

describe("preserve Host header", function()
Expand Down Expand Up @@ -1339,4 +1418,43 @@ describe("Router", function()
end
end)
end)

describe("has_capturing_groups()", function()
-- load the `assert.fail` assertion
require "spec.helpers"

it("detects if a string has capturing groups", function()
local uris = {
["/users/(foo)"] = true,
["/users/()"] = true,
["/users/()/foo"] = true,
["/users/(hello(foo)world)"] = true,
["/users/(hello(foo)world"] = true,
["/users/(foo)/thing/(bar)"] = true,
["/users/\\(foo\\)/thing/(bar)"] = true,
-- 0-indexed capture groups
["()/world"] = true,
["(/hello)/world"] = true,

["/users/\\(foo\\)"] = false,
["/users/\\(\\)"] = false,
-- unbalanced capture groups
["(/hello\\)/world"] = false,
["/users/(foo"] = false,
["/users/\\(foo)"] = false,
["/users/(foo\\)"] = false,
}

for uri, expected_to_match in pairs(uris) do
local has_captures = Router.has_capturing_groups(uri)
if expected_to_match and not has_captures then
assert.fail(uri, "has capturing groups that were not detected")

elseif not expected_to_match and has_captures then
assert.fail(uri, "has no capturing groups but false-positives " ..
"were detected")
end
end
end)
end)
end)

0 comments on commit 5ee1d60

Please sign in to comment.