2015-12-16 08:07:31 +03:00
|
|
|
# frozen_string_literal: false
|
2003-10-05 10:09:26 +04:00
|
|
|
require 'test/unit'
|
2019-08-19 12:37:22 +03:00
|
|
|
require 'envutil'
|
2003-10-04 08:02:16 +04:00
|
|
|
require 'uri'
|
|
|
|
|
2003-10-05 10:09:26 +04:00
|
|
|
module URI
|
|
|
|
|
|
|
|
|
|
|
|
class TestCommon < Test::Unit::TestCase
|
2003-10-04 08:02:16 +04:00
|
|
|
# Per-test setup hook. The body is intentionally empty: nothing is
# prepared before each test in this class.
def setup
end
|
|
|
|
|
|
|
|
# Per-test teardown hook. The body is intentionally empty: nothing is
# cleaned up after each test in this class.
def teardown
end
|
|
|
|
|
|
|
|
# Checks URI.extract on plain, parenthesised, back-to-back and
# scheme-filtered input.
#
# All calls run inside EnvUtil.suppress_warning.
# NOTE(review): presumably because URI.extract emits an "obsolete"
# warning in verbose mode -- confirm against lib/uri/common.rb.
def test_extract
  EnvUtil.suppress_warning do
    assert_equal(['http://example.com'],
                 URI.extract('http://example.com'))
    # A leading "(" is not part of the URI ...
    assert_equal(['http://example.com'],
                 URI.extract('(http://example.com)'))
    # ... but a trailing ")" after a path is kept.
    assert_equal(['http://example.com/foo)'],
                 URI.extract('(http://example.com/foo)'))
    # Two URIs with no separator are returned as a single match.
    assert_equal(['http://example.jphttp://example.jp'],
                 URI.extract('http://example.jphttp://example.jp'), "[ruby-list:36086]")
    assert_equal(['http://example.jphttp://example.jp'],
                 URI.extract('http://example.jphttp://example.jp', ['http']), "[ruby-list:36086]")
    # Only the requested schemes are returned; order is not asserted.
    assert_equal(['http://', 'mailto:'].sort,
                 URI.extract('ftp:// http:// mailto: https://', ['http', 'mailto']).sort)
    # reported by Doug Kearns <djkea2@mugca.its.monash.edu.au>
    assert_equal(['From:', 'mailto:xxx@xxx.xxx.xxx]'].sort,
                 URI.extract('From: XXX [mailto:xxx@xxx.xxx.xxx]').sort)
  end
end
|
2003-12-08 07:09:02 +03:00
|
|
|
|
|
|
|
# Checks URI.regexp: it returns a Regexp (with or without a scheme
# list), equal patterns compare equal, and slicing a string with it
# yields the first URI-like substring or nil.
#
# All calls run inside EnvUtil.suppress_warning.
# NOTE(review): presumably because URI.regexp emits an "obsolete"
# warning in verbose mode -- confirm against lib/uri/common.rb.
def test_regexp
  EnvUtil.suppress_warning do
    assert_instance_of Regexp, URI.regexp
    assert_instance_of Regexp, URI.regexp(['http'])
    assert_equal URI.regexp, URI.regexp
    assert_equal 'http://', 'x http:// x'.slice(URI.regexp)
    assert_equal 'http://', 'x http:// x'.slice(URI.regexp(['http']))
    assert_equal 'http://', 'x http:// x ftp://'.slice(URI.regexp(['http']))
    # No-match cases: assert_nil states the intent directly instead of
    # comparing against nil with assert_equal.
    assert_nil 'http://'.slice(URI.regexp([]))
    assert_nil ''.slice(URI.regexp)
    assert_nil 'xxxx'.slice(URI.regexp)
    assert_nil ':'.slice(URI.regexp)
    assert_equal 'From:', 'From:'.slice(URI.regexp)
  end
end
|
2004-07-05 18:06:10 +04:00
|
|
|
|
|
|
|
# Checks the Kernel#URI conversion method: called bare or as
# Kernel::URI it must equal URI.parse of the same string, and calling
# it with an explicit receiver must raise NoMethodError.
def test_kernel_uri
  expected = URI.parse("http://www.ruby-lang.org/")
  assert_equal(expected, URI("http://www.ruby-lang.org/"))
  assert_equal(expected, Kernel::URI("http://www.ruby-lang.org/"))
  assert_raise(NoMethodError) { Object.new.URI("http://www.ruby-lang.org/") }
end
|
2010-03-12 12:00:48 +03:00
|
|
|
|
2010-03-17 18:35:38 +03:00
|
|
|
# Checks URI.encode_www_form_component:
# * escaping of the ASCII range (space becomes "+"),
# * strings tagged with non-UTF-8 encodings and no target encoding,
# * an explicit target encoding for UTF-8 and Shift_JIS input,
# * input containing invalid byte sequences.
def test_encode_www_form_component
  assert_equal("%00+%21%22%23%24%25%26%27%28%29*%2B%2C-.%2F09%3A%3B%3C%3D%3E%3F%40" \
               "AZ%5B%5C%5D%5E_%60az%7B%7C%7D%7E",
               URI.encode_www_form_component("\x00 !\"\#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~"))

  # No target encoding given: the expected values are the raw bytes, escaped.
  assert_equal("%95A", URI.encode_www_form_component(
                 "\x95\x41".force_encoding(Encoding::Shift_JIS)))
  assert_equal("0B", URI.encode_www_form_component(
                 "\x30\x42".force_encoding(Encoding::UTF_16BE)))
  assert_equal("%1B%24B%24%22%1B%28B", URI.encode_www_form_component(
                 "\e$B$\"\e(B".force_encoding(Encoding::ISO_2022_JP)))

  # UTF-8 input with an explicit target encoding.
  assert_equal("%E3%81%82", URI.encode_www_form_component(
                 "\u3042", Encoding::ASCII_8BIT))
  assert_equal("%82%A0", URI.encode_www_form_component(
                 "\u3042", Encoding::Windows_31J))
  assert_equal("%E3%81%82", URI.encode_www_form_component(
                 "\u3042", Encoding::UTF_8))

  # Shift_JIS input with an explicit target encoding.
  assert_equal("%82%A0", URI.encode_www_form_component(
                 "\u3042".encode("sjis"), Encoding::ASCII_8BIT))
  assert_equal("%A4%A2", URI.encode_www_form_component(
                 "\u3042".encode("sjis"), Encoding::EUC_JP))
  assert_equal("%E3%81%82", URI.encode_www_form_component(
                 "\u3042".encode("sjis"), Encoding::UTF_8))
  assert_equal("B0", URI.encode_www_form_component(
                 "\u3042".encode("sjis"), Encoding::UTF_16LE))
  # U+02DA with WINDOWS_1252 as target: the expected value is the
  # escaped numeric character reference "&#730;".
  assert_equal("%26%23730%3B", URI.encode_www_form_component(
                 "\u02DA", Encoding::WINDOWS_1252))

  # invalid byte sequences: expected output contains escaped U+FFFD
  assert_equal("%EF%BF%BD%EF%BF%BD", URI.encode_www_form_component(
                 "\xE3\x81\xFF", "utf-8"))
  assert_equal("%E6%9F%8A%EF%BF%BD%EF%BF%BD", URI.encode_www_form_component(
                 "\x95\x41\xff\xff".force_encoding(Encoding::Shift_JIS), "utf-8"))
end
|
|
|
|
|
2010-03-17 18:35:38 +03:00
|
|
|
# Checks URI.decode_www_form_component: decoding of the ASCII range,
# an explicit result encoding, input that already contains raw
# non-ASCII bytes, rejection of malformed percent escapes, and a
# 1 MiB input that must not raise.
def test_decode_www_form_component
  # The input starts with "%20+", and both forms decode to a space, so
  # the expected string must begin with TWO spaces.
  assert_equal("  !\"\#$%&'()*+,-./09:;<=>?@AZ[\\]^_`az{|}~",
               URI.decode_www_form_component(
                 "%20+%21%22%23%24%25%26%27%28%29*%2B%2C-.%2F09%3A%3B%3C%3D%3E%3F%40" \
                 "AZ%5B%5C%5D%5E_%60az%7B%7C%7D%7E"))
  assert_equal("\xA1\xA2".force_encoding(Encoding::EUC_JP),
               URI.decode_www_form_component("%A1%A2", "EUC-JP"))
  assert_equal("\xE3\x81\x82\xE3\x81\x82".force_encoding("UTF-8"),
               URI.decode_www_form_component("\xE3\x81\x82%E3%81%82".force_encoding("UTF-8")))

  # Truncated or non-hex percent escapes are rejected.
  assert_raise(ArgumentError){URI.decode_www_form_component("%")}
  assert_raise(ArgumentError){URI.decode_www_form_component("%a")}
  assert_raise(ArgumentError){URI.decode_www_form_component("x%a_")}
  assert_nothing_raised(ArgumentError){URI.decode_www_form_component("x"*(1024*1024))}
end
|
|
|
|
|
|
|
|
# Checks URI.encode_www_form with hashes and arrays of pairs: string,
# symbol and integer members, non-ASCII text, an explicit target
# encoding, nil and empty values, reserved characters, and array
# values that repeat a key.
def test_encode_www_form
  assert_equal("a=1", URI.encode_www_form("a" => "1"))
  assert_equal("a=1", URI.encode_www_form(a: 1))
  assert_equal("a=1", URI.encode_www_form([["a", "1"]]))
  assert_equal("a=1", URI.encode_www_form([[:a, 1]]))
  expected = "a=1&%E3%81%82=%E6%BC%A2"
  assert_equal(expected, URI.encode_www_form("a" => "1", "\u3042" => "\u6F22"))
  assert_equal(expected, URI.encode_www_form(a: 1, :"\u3042" => "\u6F22"))
  assert_equal(expected, URI.encode_www_form([["a", "1"], ["\u3042", "\u6F22"]]))
  assert_equal(expected, URI.encode_www_form([[:a, 1], [:"\u3042", "\u6F22"]]))
  assert_equal("a=1&%82%A0=%8A%BF",
               URI.encode_www_form({"a" => "1", "\u3042" => "\u6F22"}, "sjis"))

  # Escaping and nil/empty handling: a nil value emits the bare key,
  # an empty string emits "key=".
  assert_equal('+a+=+1+', URI.encode_www_form([[' a ', ' 1 ']]))
  assert_equal('text=x%0Ay', URI.encode_www_form([['text', "x\u000Ay"]]))
  assert_equal('constellation=Bo%C3%B6tes', URI.encode_www_form([['constellation', "Bo\u00F6tes"]]))
  assert_equal('name=%00value', URI.encode_www_form([['name', "\u0000value"]]))
  assert_equal('Cipher=c%3D%28m%5Ee%29%25n', URI.encode_www_form([['Cipher', 'c=(m^e)%n']]))
  assert_equal('&', URI.encode_www_form([['', nil], ['', nil]]))
  assert_equal('&=', URI.encode_www_form([['', nil], ['', '']]))
  assert_equal('=&', URI.encode_www_form([['', ''], ['', nil]]))
  assert_equal('=&=', URI.encode_www_form([['', ''], ['', '']]))
  assert_equal('', URI.encode_www_form([['', nil]]))
  assert_equal('', URI.encode_www_form([]))
  assert_equal('=', URI.encode_www_form([['', '']]))
  assert_equal('a%26b=1&c=2%3B3&e=4', URI.encode_www_form([['a&b', '1'], ['c', '2;3'], ['e', '4']]))
  assert_equal('image&title&price', URI.encode_www_form([['image', nil], ['title', nil], ['price', nil]]))

  # An array value expands to one "key=value" pair per element.
  assert_equal("q=ruby&lang=en", URI.encode_www_form([["q", "ruby"], ["lang", "en"]]))
  assert_equal("q=ruby&lang=en", URI.encode_www_form("q" => "ruby", "lang" => "en"))
  assert_equal("q=ruby&q=perl&lang=en", URI.encode_www_form("q" => ["ruby", "perl"], "lang" => "en"))
  assert_equal("q=ruby&q=perl&lang=en", URI.encode_www_form([["q", "ruby"], ["q", "perl"], ["lang", "en"]]))
end
|
2010-03-17 18:35:38 +03:00
|
|
|
|
|
|
|
# Checks URI.decode_www_form: repeated keys, ";" kept as data, empty
# pairs, rejection of non-ASCII input, percent-decoding (including
# malformed escapes), a leading "?", an explicit encoding, and the
# use__charset_: and isindex: options.
#
# Expected Windows-31J strings are built with the private helper #s.
def test_decode_www_form
  assert_equal([%w[a 1], %w[a 2]], URI.decode_www_form("a=1&a=2"))
  assert_equal([%w[a 1;a=2]], URI.decode_www_form("a=1;a=2"))
  assert_equal([%w[a 1], ['', ''], %w[a 2]], URI.decode_www_form("a=1&&a=2"))
  assert_raise(ArgumentError){URI.decode_www_form("\u3042")}
  assert_equal([%w[a 1], ["\u3042", "\u6F22"]],
               URI.decode_www_form("a=1&%E3%81%82=%E6%BC%A2"))
  # Incomplete sequences are expected to come back as U+FFFD.
  assert_equal([%w[a 1], ["\uFFFD%8", "\uFFFD"]],
               URI.decode_www_form("a=1&%E3%81%8=%E6%BC"))
  assert_equal([%w[?a 1], %w[a 2]], URI.decode_www_form("?a=1&a=2"))
  assert_equal([], URI.decode_www_form(""))
  assert_equal([%w[% 1]], URI.decode_www_form("%=1"))
  assert_equal([%w[a %]], URI.decode_www_form("a=%"))
  assert_equal([%w[a 1], %w[% 2]], URI.decode_www_form("a=1&%=2"))
  assert_equal([%w[a 1], %w[b %]], URI.decode_www_form("a=1&b=%"))
  assert_equal([['a', ''], ['b', '']], URI.decode_www_form("a&b"))
  bug4098 = '[ruby-core:33464]'
  assert_equal([['a', 'AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA'], ['b', '']], URI.decode_www_form("a=AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA&b"), bug4098)

  # An unknown encoding name raises; "sjis" is accepted.
  assert_raise(ArgumentError){ URI.decode_www_form("a=1&%82%A0=%8A%BF", "x-sjis") }
  assert_equal([["a", "1"], [s("\x82\xA0"), s("\x8a\xBF")]],
               URI.decode_www_form("a=1&%82%A0=%8A%BF", "sjis"))
  assert_equal([["a", "1"], [s("\x82\xA0"), s("\x8a\xBF")], %w[_charset_ sjis], [s("\x82\xA1"), s("\x8a\xC0")]],
               URI.decode_www_form("a=1&%82%A0=%8A%BF&_charset_=sjis&%82%A1=%8A%C0", use__charset_: true))
  assert_equal([["", "isindex"], ["a", "1"]],
               URI.decode_www_form("isindex&a=1", isindex: true))
end
|
2013-04-25 09:27:41 +04:00
|
|
|
|
|
|
|
private
|
|
|
|
# Returns a copy of +str+ tagged as Windows-31J; the bytes are
# relabelled, not transcoded. Working on a duplicate leaves the
# caller's string untouched and also accepts frozen strings.
def s(str)
  str.dup.force_encoding(Encoding::Windows_31J)
end
|
2003-10-04 08:02:16 +04:00
|
|
|
end
|
|
|
|
|
2003-10-05 10:09:26 +04:00
|
|
|
|
2003-10-04 08:02:16 +04:00
|
|
|
end
|