lua-nginx-module/t/037-gsub.t

677 строки
13 KiB
Plaintext
Исходник Постоянная ссылка Ответственный История

Этот файл содержит неоднозначные символы Юникода!

Этот файл содержит неоднозначные символы Юникода, которые могут быть перепутаны с другими в текущей локали. Если это намеренно, можете спокойно проигнорировать это предупреждение. Используйте кнопку Экранировать, чтобы подсветить эти символы.

# vim:set ft= ts=4 sw=4 et fdm=marker:
# Test driver for ngx.re.gsub: the Perl preamble below configures the run and
# the test blocks themselves live in the __DATA__ section.
use Test::Nginx::Socket::Lua;
#worker_connections(1014);
#master_on();
#workers(2);
# Run the test server with its error log level set to "warn".
log_level('warn');
# Every test block is executed twice.
repeat_each(2);
# Two checks per block plus 16 extra ones. The 16 lines up with the 14
# "no_error_log" sections and the 2 "stap_out" sections visible in this file;
# presumably it must be adjusted whenever such a section is added or removed.
plan tests => repeat_each() * (blocks() * 2 + 16);
#no_diff();
# NOTE(review): per the Test::Nginx docs this switches failed string
# comparisons from Test::LongString output to plain is() -- confirm.
no_long_string();
run_tests();
__DATA__
=== TEST 1: sanity
--- config
    location /re {
        content_by_lua '
            -- Replace each lowercase run in a subject that also carries
            -- non-matching brackets, then print the new string and the
            -- number of substitutions on separate lines.
            local replaced, count = ngx.re.gsub("[hello, world]", "[a-z]+", "howdy")
            ngx.say(replaced)
            ngx.say(count)
        ';
    }
--- request
GET /re
--- response_body
[howdy, howdy]
2
=== TEST 2: trimmed
--- config
    location /re {
        content_by_lua '
            -- Same as the sanity case, but the subject starts and ends
            -- with a match (no surrounding unmatched text).
            local subject = "hello, world"
            local result, nsubs = ngx.re.gsub(subject, "[a-z]+", "howdy")
            ngx.say(result)
            ngx.say(nsubs)
        ';
    }
--- request
GET /re
--- response_body
howdy, howdy
2
=== TEST 3: not matched
--- config
    location /re {
        content_by_lua '
            -- The uppercase-only pattern never matches the lowercase
            -- subject, so the subject comes back unchanged with count 0.
            local subject = "hello, world"
            local unchanged, hits = ngx.re.gsub(subject, "[A-Z]+", "howdy")
            ngx.say(unchanged)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body
hello, world
0
=== TEST 4: replace by function (trimmed)
--- config
    location /re {
        content_by_lua '
            -- Replacement callback: receives the match table and renders
            -- the whole match (index 0) and the first capture (index 1).
            local function bracketed(m)
                return "[" .. m[0] .. "," .. m[1] .. "]"
            end

            local out, total = ngx.re.gsub("hello, world", "([a-z])[a-z]+", bracketed)
            ngx.say(out)
            ngx.say(total)
        ';
    }
--- request
GET /re
--- response_body
[hello,h], [world,w]
2
=== TEST 5: replace by function (not trimmed)
--- config
    location /re {
        content_by_lua '
            -- Callback replacement again, this time with unmatched braces
            -- around the subject that must be copied through verbatim.
            local function bracketed(m)
                return "[" .. m[0] .. "," .. m[1] .. "]"
            end

            local out, total = ngx.re.gsub("{hello, world}", "([a-z])[a-z]+", bracketed)
            ngx.say(out)
            ngx.say(total)
        ';
    }
--- request
GET /re
--- response_body
{[hello,h], [world,w]}
2
=== TEST 6: replace by script (trimmed)
--- config
    location /re {
        content_by_lua '
            -- String template replacement: the template refers to the
            -- whole match and to the first capture group by number.
            local template = "[$0,$1]"
            local rendered, count = ngx.re.gsub("hello, world", "([a-z])[a-z]+", template)
            ngx.say(rendered)
            ngx.say(count)
        ';
    }
--- request
GET /re
--- response_body
[hello,h], [world,w]
2
=== TEST 7: replace by script (not trimmed)
--- config
    location /re {
        content_by_lua '
            -- Template replacement with unmatched braces on both ends of
            -- the subject; they must survive untouched.
            local template = "[$0,$1]"
            local rendered, count = ngx.re.gsub("{hello, world}", "([a-z])[a-z]+", template)
            ngx.say(rendered)
            ngx.say(count)
        ';
    }
--- request
GET /re
--- response_body
{[hello,h], [world,w]}
2
=== TEST 8: set_by_lua
--- config
    location /re {
        # Run gsub from the set_by_lua context and hand the rewritten
        # string back through the nginx variable that echo prints.
        set_by_lua $res '
            local function bracketed(m)
                return "[" .. m[0] .. "," .. m[1] .. "]"
            end

            -- Only the rewritten string is returned; the count is unused.
            local rewritten, count = ngx.re.gsub("{hello, world}", "([a-z])[a-z]+", bracketed)
            return rewritten
        ';
        echo $res;
    }
--- request
GET /re
--- response_body
{[hello,h], [world,w]}
=== TEST 9: look-behind assertion
--- config
    location /re {
        content_by_lua '
            -- Each alternative depends on the text just before the match,
            -- so later matches must still see the earlier subject bytes.
            local pattern = "(?<=foo)bar|(?<=bar)baz"
            local result, hits = ngx.re.gsub("{foobarbaz}", pattern, "h$0")
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body
{foohbarhbaz}
2
=== TEST 10: gsub with a patch matching an empty substring (string template)
--- config
    location /re {
        content_by_lua '
            -- The second alternative is empty, so the pattern matches the
            -- empty string at every position of the 5-byte subject
            -- (6 positions in total).
            local result, hits = ngx.re.gsub("hello", "a|", "b")
            ngx.say("s: ", result)
            ngx.say("n: ", hits)
        ';
    }
--- request
GET /re
--- response_body
s: bhbeblblbob
n: 6
--- no_error_log
[error]
=== TEST 11: gsub with a patch matching an empty substring (string template, empty subj)
--- config
    location /re {
        content_by_lua '
            -- Empty subject plus a pattern that can match the empty
            -- string: exactly one substitution is expected.
            local subject = ""
            local result, hits = ngx.re.gsub(subject, "a|", "b")
            ngx.say("s: ", result)
            ngx.say("n: ", hits)
        ';
    }
--- request
GET /re
--- response_body
s: b
n: 1
--- no_error_log
[error]
=== TEST 12: gsub with a patch matching an empty substring (func)
--- config
    location /re {
        content_by_lua '
            -- Constant callback used for every (empty) match.
            local function always_b()
                return "b"
            end

            local result, hits = ngx.re.gsub("hello", "a|", always_b)
            ngx.say("s: ", result)
            ngx.say("n: ", hits)
        ';
    }
--- request
GET /re
--- response_body
s: bhbeblblbob
n: 6
--- no_error_log
[error]
=== TEST 13: gsub with a patch matching an empty substring (func, empty subj)
--- config
    location /re {
        content_by_lua '
            -- Constant callback applied to the single empty match found
            -- in an empty subject.
            local function always_b()
                return "b"
            end

            local result, hits = ngx.re.gsub("", "a|", always_b)
            ngx.say("s: ", result)
            ngx.say("n: ", hits)
        ';
    }
--- request
GET /re
--- response_body
s: b
n: 1
--- no_error_log
[error]
=== TEST 14: big subject string exceeding the luabuf chunk size (with trailing unmatched data, func repl)
--- config
    location /re {
        content_by_lua '
            local rep = string.rep

            -- 18003-byte subject: two long runs of "b" separated by long
            -- runs of "a", followed by a short unmatched tail.
            local subj = rep("a", 8000) .. rep("b", 1000)
                .. rep("a", 8000) .. rep("b", 1000)
                .. "aaa"

            -- Swap every matched run for an equally long run of "c".
            local function repl(m)
                return rep("c", string.len(m[0]))
            end

            local result, hits = ngx.re.gsub(subj, "b+", repl)
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body eval
("a" x 8000) . ("c" x 1000) . ("a" x 8000) . ("c" x 1000)
. "aaa
2
"
--- no_error_log
[error]
=== TEST 15: big subject string exceeding the luabuf chunk size (without trailing unmatched data, func repl)
--- config
    location /re {
        content_by_lua '
            local rep = string.rep

            -- 18000-byte subject that ends exactly on a matched run.
            local subj = table.concat({
                rep("a", 8000), rep("b", 1000),
                rep("a", 8000), rep("b", 1000),
            })

            -- Swap every matched run for an equally long run of "c".
            local function repl(m)
                return rep("c", string.len(m[0]))
            end

            local result, hits = ngx.re.gsub(subj, "b+", repl)
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body eval
("a" x 8000) . ("c" x 1000) . ("a" x 8000) . ("c" x 1000)
. "\n2\n"
--- no_error_log
[error]
=== TEST 16: big subject string exceeding the luabuf chunk size (with trailing unmatched data, str repl)
--- config
    location /re {
        content_by_lua '
            local rep = string.rep

            -- 18003-byte subject with an unmatched "aaa" tail.
            local subj = rep("a", 8000) .. rep("b", 1000)
                .. rep("a", 8000) .. rep("b", 1000)
                .. "aaa"

            -- For a 1000-byte run the first "b" is dropped, group 1 takes
            -- 998 bytes and group 2 the last one, giving 998 b, a space, b.
            local result, hits = ngx.re.gsub(subj, "b(b+)(b)", "$1 $2")
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body eval
("a" x 8000) . ("b" x 998) . " b" . ("a" x 8000) . ("b" x 998) . " baaa
2
"
--- no_error_log
[error]
=== TEST 17: big subject string exceeding the luabuf chunk size (without trailing unmatched data, str repl)
--- config
    location /re {
        content_by_lua '
            local rep = string.rep

            -- 18000-byte subject that ends exactly on a matched run.
            local subj = table.concat({
                rep("a", 8000), rep("b", 1000),
                rep("a", 8000), rep("b", 1000),
            })

            -- Template built from both capture groups, separated by a space.
            local result, hits = ngx.re.gsub(subj, "b(b+)(b)", "$1 $2")
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body eval
("a" x 8000) . ("b" x 998) . " b" . ("a" x 8000) . ("b" x 998) . " b\n2\n"
--- no_error_log
[error]
=== TEST 18: named pattern repl w/ callback
--- config
    location /re {
        content_by_lua '
            -- The callback reads the capture through its group name
            -- rather than through its numeric index.
            local function by_name(m)
                return "[" .. m[0] .. "," .. m.first .. "]"
            end

            local pattern = "(?<first>[a-z])[a-z]+"
            local result, hits = ngx.re.gsub("hello, world", pattern, by_name)
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body
[hello,h], [world,w]
2
=== TEST 19: $0 without parens
--- config
    location /re {
        content_by_lua '
            -- The pattern has no capture groups at all; the template
            -- only refers to the whole match.
            local pattern = [[\w]]
            local result, hits = ngx.re.gsub("a b c d", pattern, "[$0]")
            ngx.say(result)
            ngx.say(hits)
        ';
    }
--- request
GET /re
--- response_body
[a] [b] [c] [d]
4
--- no_error_log
[error]
=== TEST 20: bad UTF-8
--- config
    location = /t {
        content_by_lua '
            local target = "你好"
            local regex = "你好"

            -- Each of the two characters takes 3 bytes in UTF-8, so keeping
            -- only the first 4 bytes cuts the second character short and
            -- yields an invalid sequence. With the "u" option the call is
            -- expected to fail with -10 (PCRE_ERROR_BADUTF8).
            local broken = string.sub(target, 1, 4)
            local result, hits, err = ngx.re.gsub(broken, regex, "", "u")

            if not result then
                ngx.say("error: ", err)
            else
                ngx.say(result, ": ", hits)
            end
        ';
    }
--- request
GET /t
--- response_body_like chop
error: pcre_exec\(\) failed: -10
--- no_error_log
[error]
=== TEST 21: UTF-8 mode without UTF-8 sequence checks
--- config
    location /re {
        content_by_lua '
            -- The "U" option enables UTF-8 mode but skips validation of
            -- the subject. The probes below expect compile option 0x800
            -- (PCRE_UTF8) and exec option 0x2000 (PCRE_NO_UTF8_CHECK) on
            -- each of the three pcre_exec calls.
            local s, n, err = ngx.re.gsub("你好", ".", "a", "U")
            if s then
                ngx.say("s: ", s)
            else
                -- Report the failure reason instead of an empty body.
                ngx.say("error: ", err)
            end
        ';
    }
--- stap
probe process("$LIBPCRE_PATH").function("pcre_compile") {
    printf("compile opts: %x\n", $options)
}
probe process("$LIBPCRE_PATH").function("pcre_exec") {
    printf("exec opts: %x\n", $options)
}
--- stap_out
compile opts: 800
exec opts: 2000
exec opts: 2000
exec opts: 2000
--- request
GET /re
--- response_body
s: aa
--- no_error_log
[error]
=== TEST 22: UTF-8 mode with UTF-8 sequence checks
--- config
    location /re {
        content_by_lua '
            -- The "u" option enables UTF-8 mode and leaves subject
            -- validation on. The probes below expect compile option 0x800
            -- (PCRE_UTF8) and no extra exec options on each of the three
            -- pcre_exec calls.
            local s, n, err = ngx.re.gsub("你好", ".", "a", "u")
            if s then
                ngx.say("s: ", s)
            else
                -- Report the failure reason instead of an empty body.
                ngx.say("error: ", err)
            end
        ';
    }
--- stap
probe process("$LIBPCRE_PATH").function("pcre_compile") {
    printf("compile opts: %x\n", $options)
}
probe process("$LIBPCRE_PATH").function("pcre_exec") {
    printf("exec opts: %x\n", $options)
}
--- stap_out
compile opts: 800
exec opts: 0
exec opts: 0
exec opts: 0
--- request
GET /re
--- response_body
s: aa
--- no_error_log
[error]
=== TEST 23: just hit match limit
--- http_config
    lua_regex_match_limit 5600;
--- config
    location /re {
        content_by_lua_file html/a.lua;
    }
--- user_files
>>> a.lua
-- With the match limit set to 5600 this pattern is expected to abort on the
-- 70-byte subject with error -8 (PCRE_ERROR_MATCHLIMIT).
local re = [==[(?i:([\s'\"`´\(\)]*)?([\d\w]+)([\s'\"`´\(\)]*)?(?:=|<=>|r?like|sounds\s+like|regexp)([\s'\"`´\(\)]*)?\2|([\s'\"`´\(\)]*)?([\d\w]+)([\s'\"`´\(\)]*)?(?:!=|<=|>=|<>|<|>|\^|is\s+not|not\s+like|not\s+regexp)([\s'\"`´\(\)]*)?(?!\6)([\d\w]+))]==]
-- Kept local so that the chunk does not write a global variable.
local s = string.rep([[ABCDEFG]], 10)
-- Only consumed by the disabled timing code below.
local start = ngx.now()
local res, cnt, err = ngx.re.gsub(s, re, "", "o")
--[[
ngx.update_time()
local elapsed = ngx.now() - start
ngx.say(elapsed, " sec elapsed.")
]]
if err then
    ngx.say("error: ", err)
    return
end
ngx.say("gsub: ", cnt)
--- request
GET /re
--- response_body
error: pcre_exec() failed: -8
=== TEST 24: just not hit match limit
--- http_config
    lua_regex_match_limit 5700;
--- config
    location /re {
        content_by_lua_file html/a.lua;
    }
--- user_files
>>> a.lua
-- With the match limit raised to 5700 the same pattern is expected to run to
-- completion on the 70-byte subject and report zero substitutions.
local re = [==[(?i:([\s'\"`´\(\)]*)?([\d\w]+)([\s'\"`´\(\)]*)?(?:=|<=>|r?like|sounds\s+like|regexp)([\s'\"`´\(\)]*)?\2|([\s'\"`´\(\)]*)?([\d\w]+)([\s'\"`´\(\)]*)?(?:!=|<=|>=|<>|<|>|\^|is\s+not|not\s+like|not\s+regexp)([\s'\"`´\(\)]*)?(?!\6)([\d\w]+))]==]
local subject = string.rep([[ABCDEFG]], 10)
-- Only consumed by the disabled timing code below.
local start = ngx.now()
local res, count, err = ngx.re.gsub(subject, re, "", "o")
--[[
ngx.update_time()
local elapsed = ngx.now() - start
ngx.say(elapsed, " sec elapsed.")
]]
if not err then
    ngx.say("gsub: ", count)
    return
end
ngx.say("error: ", err)
--- request
GET /re
--- response_body
gsub: 0
--- timeout: 10
=== TEST 25: bug: gsub incorrectly swallowed a character is the first character
Original bad result: estCase
--- config
    location /re {
        content_by_lua '
            -- The anchored pattern matches the empty string at offset 0;
            -- the first subject byte must still be copied to the output.
            local result, hits = ngx.re.gsub("TestCase", "^ *", "", "o")
            if result then
                ngx.say(result)
            end
        ';
    }
--- request
GET /re
--- response_body
TestCase
=== TEST 26: bug: gsub incorrectly swallowed a character is not the first character
Original bad result: .b.d
--- config
    location /re {
        content_by_lua '
            -- The look-ahead alternative matches the empty string right
            -- before "c"; that "c" must be kept in the output.
            local pattern = "a|(?=c)"
            local result, hits = ngx.re.gsub("abcd", pattern, ".")
            if result then
                ngx.say(result)
            end
        ';
    }
--- request
GET /re
--- response_body
.b.cd
=== TEST 27: use of ngx.req.get_headers in the user callback
--- config
    location = /t {
        content_by_lua '
            -- The long string body stays at column 0 because its bytes
            -- are compared against the expected response body.
            local data = [[
INNER
INNER
]]

            -- Replacement callback that calls ngx.req.get_headers() while
            -- gsub is still running; the looked-up value is not used.
            local function replace_inner(inner_matches)
                local header = ngx.req.get_headers()["Host"]
                return "INNER_REPLACED"
            end

            local res = ngx.re.gsub(data, "INNER", replace_inner, "s")
            ngx.print(res)
        ';
    }
--- request
GET /t
--- response_body
INNER_REPLACED
INNER_REPLACED
--- no_error_log
[error]
=== TEST 28: use of ngx.var in the user callback
--- config
    location = /t {
        content_by_lua '
            -- The long string body stays at column 0 because its bytes
            -- are compared against the expected response body.
            local data = [[
INNER
INNER
]]

            -- Replacement callback that reads an nginx variable while
            -- gsub is still running; the looked-up value is not used.
            local function replace_inner(inner_matches)
                local header = ngx.var["http_HEADER"]
                return "INNER_REPLACED"
            end

            local res = ngx.re.gsub(data, "INNER", replace_inner, "s")
            ngx.print(res)
        ';
    }
--- request
GET /t
--- response_body
INNER_REPLACED
INNER_REPLACED
--- no_error_log
[error]