git/t/unit-tests/t-urlmatch-normalization.c

272 lines
10 KiB
C

#include "test-lib.h"
#include "urlmatch.h"
static void check_url_normalizable(const char *url, unsigned int normalizable)
{
char *url_norm = url_normalize(url, NULL);
if (!check_int(normalizable, ==, url_norm ? 1 : 0))
test_msg("input url: %s", url);
free(url_norm);
}
static void check_normalized_url(const char *url, const char *expect)
{
char *url_norm = url_normalize(url, NULL);
if (!check_str(url_norm, expect))
test_msg("input url: %s", url);
free(url_norm);
}
static void compare_normalized_urls(const char *url1, const char *url2,
unsigned int equal)
{
char *url1_norm = url_normalize(url1, NULL);
char *url2_norm = url_normalize(url2, NULL);
if (equal) {
if (!check_str(url1_norm, url2_norm))
test_msg("input url1: %s\n input url2: %s", url1,
url2);
} else if (!check_int(strcmp(url1_norm, url2_norm), !=, 0)) {
test_msg(" normalized url1: %s\n normalized url2: %s\n"
" input url1: %s\n input url2: %s",
url1_norm, url2_norm, url1, url2);
}
free(url1_norm);
free(url2_norm);
}
static void check_normalized_url_length(const char *url, size_t len)
{
struct url_info info;
char *url_norm = url_normalize(url, &info);
if (!check_int(info.url_len, ==, len))
test_msg(" input url: %s\n normalized url: %s", url,
url_norm);
free(url_norm);
}
/* Note that only "file:" URLs should be allowed without a host */
static void t_url_scheme(void)
{
check_url_normalizable("", 0);
check_url_normalizable("_", 0);
check_url_normalizable("scheme", 0);
check_url_normalizable("scheme:", 0);
check_url_normalizable("scheme:/", 0);
check_url_normalizable("scheme://", 0);
check_url_normalizable("file", 0);
check_url_normalizable("file:", 0);
check_url_normalizable("file:/", 0);
check_url_normalizable("file://", 1);
check_url_normalizable("://acme.co", 0);
check_url_normalizable("x_test://acme.co", 0);
check_url_normalizable("-test://acme.co", 0);
check_url_normalizable("0test://acme.co", 0);
check_url_normalizable("+test://acme.co", 0);
check_url_normalizable(".test://acme.co", 0);
check_url_normalizable("schem%6e://", 0);
check_url_normalizable("x-Test+v1.0://acme.co", 1);
check_normalized_url("AbCdeF://x.Y", "abcdef://x.y/");
}
static void t_url_authority(void)
{
check_url_normalizable("scheme://user:pass@", 0);
check_url_normalizable("scheme://?", 0);
check_url_normalizable("scheme://#", 0);
check_url_normalizable("scheme:///", 0);
check_url_normalizable("scheme://:", 0);
check_url_normalizable("scheme://:555", 0);
check_url_normalizable("file://user:pass@", 1);
check_url_normalizable("file://?", 1);
check_url_normalizable("file://#", 1);
check_url_normalizable("file:///", 1);
check_url_normalizable("file://:", 1);
check_url_normalizable("file://:555", 0);
check_url_normalizable("scheme://user:pass@host", 1);
check_url_normalizable("scheme://@host", 1);
check_url_normalizable("scheme://%00@host", 1);
check_url_normalizable("scheme://%%@host", 0);
check_url_normalizable("scheme://host_", 1);
check_url_normalizable("scheme://user:pass@host/", 1);
check_url_normalizable("scheme://@host/", 1);
check_url_normalizable("scheme://host/", 1);
check_url_normalizable("scheme://host?x", 1);
check_url_normalizable("scheme://host#x", 1);
check_url_normalizable("scheme://host/@", 1);
check_url_normalizable("scheme://host?@x", 1);
check_url_normalizable("scheme://host#@x", 1);
check_url_normalizable("scheme://[::1]", 1);
check_url_normalizable("scheme://[::1]/", 1);
check_url_normalizable("scheme://hos%41/", 0);
check_url_normalizable("scheme://[invalid....:/", 1);
check_url_normalizable("scheme://invalid....:]/", 1);
check_url_normalizable("scheme://invalid....:[/", 0);
check_url_normalizable("scheme://invalid....:[", 0);
}
static void t_url_port(void)
{
check_url_normalizable("xyz://q@some.host:", 1);
check_url_normalizable("xyz://q@some.host:456/", 1);
check_url_normalizable("xyz://q@some.host:0", 0);
check_url_normalizable("xyz://q@some.host:0000000", 0);
check_url_normalizable("xyz://q@some.host:0000001?", 1);
check_url_normalizable("xyz://q@some.host:065535#", 1);
check_url_normalizable("xyz://q@some.host:65535", 1);
check_url_normalizable("xyz://q@some.host:65536", 0);
check_url_normalizable("xyz://q@some.host:99999", 0);
check_url_normalizable("xyz://q@some.host:100000", 0);
check_url_normalizable("xyz://q@some.host:100001", 0);
check_url_normalizable("http://q@some.host:80", 1);
check_url_normalizable("https://q@some.host:443", 1);
check_url_normalizable("http://q@some.host:80/", 1);
check_url_normalizable("https://q@some.host:443?", 1);
check_url_normalizable("http://q@:8008", 0);
check_url_normalizable("http://:8080", 0);
check_url_normalizable("http://:", 0);
check_url_normalizable("xyz://q@some.host:456/", 1);
check_url_normalizable("xyz://[::1]:456/", 1);
check_url_normalizable("xyz://[::1]:/", 1);
check_url_normalizable("xyz://[::1]:000/", 0);
check_url_normalizable("xyz://[::1]:0%300/", 0);
check_url_normalizable("xyz://[::1]:0x80/", 0);
check_url_normalizable("xyz://[::1]:4294967297/", 0);
check_url_normalizable("xyz://[::1]:030f/", 0);
}
static void t_url_port_normalization(void)
{
check_normalized_url("http://x:800", "http://x:800/");
check_normalized_url("http://x:0800", "http://x:800/");
check_normalized_url("http://x:00000800", "http://x:800/");
check_normalized_url("http://x:065535", "http://x:65535/");
check_normalized_url("http://x:1", "http://x:1/");
check_normalized_url("http://x:80", "http://x/");
check_normalized_url("http://x:080", "http://x/");
check_normalized_url("http://x:000000080", "http://x/");
check_normalized_url("https://x:443", "https://x/");
check_normalized_url("https://x:0443", "https://x/");
check_normalized_url("https://x:000000443", "https://x/");
}
static void t_url_general_escape(void)
{
check_url_normalizable("http://x.y?%fg", 0);
check_normalized_url("X://W/%7e%41^%3a", "x://w/~A%5E%3A");
check_normalized_url("X://W/:/?#[]@", "x://w/:/?#[]@");
check_normalized_url("X://W/$&()*+,;=", "x://w/$&()*+,;=");
check_normalized_url("X://W/'", "x://w/'");
check_normalized_url("X://W?!", "x://w/?!");
}
static void t_url_high_bit(void)
{
check_normalized_url(
"x://q/\x01\x02\x03\x04\x05\x06\x07\x08\x0e\x0f\x10\x11\x12",
"x://q/%01%02%03%04%05%06%07%08%0E%0F%10%11%12");
check_normalized_url(
"x://q/\x13\x14\x15\x16\x17\x18\x19\x1b\x1c\x1d\x1e\x1f\x7f",
"x://q/%13%14%15%16%17%18%19%1B%1C%1D%1E%1F%7F");
check_normalized_url(
"x://q/\x80\x81\x82\x83\x84\x85\x86\x87\x88\x89\x8a\x8b\x8c\x8d\x8e\x8f",
"x://q/%80%81%82%83%84%85%86%87%88%89%8A%8B%8C%8D%8E%8F");
check_normalized_url(
"x://q/\x90\x91\x92\x93\x94\x95\x96\x97\x98\x99\x9a\x9b\x9c\x9d\x9e\x9f",
"x://q/%90%91%92%93%94%95%96%97%98%99%9A%9B%9C%9D%9E%9F");
check_normalized_url(
"x://q/\xa0\xa1\xa2\xa3\xa4\xa5\xa6\xa7\xa8\xa9\xaa\xab\xac\xad\xae\xaf",
"x://q/%A0%A1%A2%A3%A4%A5%A6%A7%A8%A9%AA%AB%AC%AD%AE%AF");
check_normalized_url(
"x://q/\xb0\xb1\xb2\xb3\xb4\xb5\xb6\xb7\xb8\xb9\xba\xbb\xbc\xbd\xbe\xbf",
"x://q/%B0%B1%B2%B3%B4%B5%B6%B7%B8%B9%BA%BB%BC%BD%BE%BF");
check_normalized_url(
"x://q/\xc0\xc1\xc2\xc3\xc4\xc5\xc6\xc7\xc8\xc9\xca\xcb\xcc\xcd\xce\xcf",
"x://q/%C0%C1%C2%C3%C4%C5%C6%C7%C8%C9%CA%CB%CC%CD%CE%CF");
check_normalized_url(
"x://q/\xd0\xd1\xd2\xd3\xd4\xd5\xd6\xd7\xd8\xd9\xda\xdb\xdc\xdd\xde\xdf",
"x://q/%D0%D1%D2%D3%D4%D5%D6%D7%D8%D9%DA%DB%DC%DD%DE%DF");
check_normalized_url(
"x://q/\xe0\xe1\xe2\xe3\xe4\xe5\xe6\xe7\xe8\xe9\xea\xeb\xec\xed\xee\xef",
"x://q/%E0%E1%E2%E3%E4%E5%E6%E7%E8%E9%EA%EB%EC%ED%EE%EF");
check_normalized_url(
"x://q/\xf0\xf1\xf2\xf3\xf4\xf5\xf6\xf7\xf8\xf9\xfa\xfb\xfc\xfd\xfe\xff",
"x://q/%F0%F1%F2%F3%F4%F5%F6%F7%F8%F9%FA%FB%FC%FD%FE%FF");
}
static void t_url_utf8_escape(void)
{
check_normalized_url(
"x://q/\xc2\x80\xdf\xbf\xe0\xa0\x80\xef\xbf\xbd\xf0\x90\x80\x80\xf0\xaf\xbf\xbd",
"x://q/%C2%80%DF%BF%E0%A0%80%EF%BF%BD%F0%90%80%80%F0%AF%BF%BD");
}
static void t_url_username_pass(void)
{
check_normalized_url("x://%41%62(^):%70+d@foo", "x://Ab(%5E):p+d@foo/");
}
static void t_url_length(void)
{
check_normalized_url_length("Http://%4d%65:%4d^%70@The.Host", 25);
check_normalized_url_length("http://%41:%42@x.y/%61/", 17);
check_normalized_url_length("http://@x.y/^", 15);
}
static void t_url_dots(void)
{
check_normalized_url("x://y/.", "x://y/");
check_normalized_url("x://y/./", "x://y/");
check_normalized_url("x://y/a/.", "x://y/a");
check_normalized_url("x://y/a/./", "x://y/a/");
check_normalized_url("x://y/.?", "x://y/?");
check_normalized_url("x://y/./?", "x://y/?");
check_normalized_url("x://y/a/.?", "x://y/a?");
check_normalized_url("x://y/a/./?", "x://y/a/?");
check_normalized_url("x://y/a/./b/.././../c", "x://y/c");
check_normalized_url("x://y/a/./b/../.././c/", "x://y/c/");
check_normalized_url("x://y/a/./b/.././../c/././.././.", "x://y/");
check_url_normalizable("x://y/a/./b/.././../c/././.././..", 0);
check_normalized_url("x://y/a/./?/././..", "x://y/a/?/././..");
check_normalized_url("x://y/%2e/", "x://y/");
check_normalized_url("x://y/%2E/", "x://y/");
check_normalized_url("x://y/a/%2e./", "x://y/");
check_normalized_url("x://y/b/.%2E/", "x://y/");
check_normalized_url("x://y/c/%2e%2E/", "x://y/");
}
/*
* "http://@foo" specifies an empty user name but does not specify a password.
* "http://foo" specifies neither a user name nor a password.
* So they should not be equivalent.
*/
static void t_url_equivalents(void)
{
compare_normalized_urls("httP://x", "Http://X/", 1);
compare_normalized_urls("Http://%4d%65:%4d^%70@The.Host", "hTTP://Me:%4D^p@the.HOST:80/", 1);
compare_normalized_urls("https://@x.y/^", "httpS://x.y:443/^", 0);
compare_normalized_urls("https://@x.y/^", "httpS://@x.y:0443/^", 1);
compare_normalized_urls("https://@x.y/^/../abc", "httpS://@x.y:0443/abc", 1);
compare_normalized_urls("https://@x.y/^/..", "httpS://@x.y:0443/", 1);
}
int cmd_main(int argc UNUSED, const char **argv UNUSED)
{
TEST(t_url_scheme(), "url scheme");
TEST(t_url_authority(), "url authority");
TEST(t_url_port(), "url port checks");
TEST(t_url_port_normalization(), "url port normalization");
TEST(t_url_general_escape(), "url general escapes");
TEST(t_url_high_bit(), "url high-bit escapes");
TEST(t_url_utf8_escape(), "url utf8 escapes");
TEST(t_url_username_pass(), "url username/password escapes");
TEST(t_url_length(), "url normalized lengths");
TEST(t_url_dots(), "url . and .. segments");
TEST(t_url_equivalents(), "url equivalents");
return test_done();
}