// LayoutTests/fast/url/script-tests/path.js - platform/external/webkit - Git at Google

 // Layout test: canonicalization of the path component of a URL.
 //
 // Each entry of `cases` is a pair [input path, expected canonical path].
 // The driver loop at the bottom prefixes both halves with
 // "http://example.com" and hands two source-text strings to shouldBe():
 //   actual:   canonicalize('http://example.com<input>')
 //   expected: 'http://example.com<expected>'
 // description(), shouldBe() and canonicalize() are not defined in this
 // script; they are expected to be provided by the surrounding test harness.
 //
 // NOTE: the input is spliced unquoted into a single-quoted literal inside the
 // string passed to shouldBe(), so characters such as backslashes go through
 // one extra level of string-literal interpretation (presumably when the
 // harness evaluates the string). Keep the escapes below exactly as they are.
 description("Canonicalization of paths.");

 var cases = [
   // ----- dot-segment tests -----
   ["/././foo", "/foo"],
   ["/./.foo", "/.foo"],
   ["/foo/.", "/foo/"],
   ["/foo/./", "/foo/"],
   // Double dots followed by a slash or the end of the string count.
   ["/foo/bar/..", "/foo/"],
   ["/foo/bar/../", "/foo/"],
   // Don't count double dots when they aren't followed by a slash.
   ["/foo/..bar", "/foo/..bar"],
   // Some in the middle.
   ["/foo/bar/../ton", "/foo/ton"],
   ["/foo/bar/../ton/../../a", "/a"],
   // We should not be able to go above the root.
   ["/foo/../../..", "/"],
   ["/foo/../../../ton", "/ton"],
   // Escaped dots should be unescaped and treated the same as dots.
   ["/foo/%2e", "/foo/"],
   ["/foo/%2e%2", "/foo/.%2"],
   ["/foo/%2e./%2e%2e/.%2e/%2e.bar", "/..bar"],
   // Multiple slashes in a row should be preserved and treated like empty
   // directory names.
   ["////../..", "//"],
   ["/foo/bar//../..", "/foo/"],
   ["/foo/bar//..", "/foo/bar/"],
   // (Repeats an earlier case; kept so the number and order of results
   // produced by this test stay unchanged.)
   ["/foo/bar/..", "/foo/"],

   // ----- escaping tests -----
   ["/foo", "/foo"],
   // Valid escape sequence.
   ["/%20foo", "/%20foo"],
   // Invalid escape sequences should be passed through unchanged.
   ["/foo%", "/foo%"],
   ["/foo%2", "/foo%2"],
   // Invalid escape sequence: bad characters should be treated the same as
   // the surrounding text, not as escaped (in this case, UTF-8).
   ["/foo%2zbar", "/foo%2zbar"],
   // The byte-oriented variant is disabled because it requires UTF-8 input:
   // ["/foo%2\xc2\xa9zbar", "/foo%2%C2%A9zbar"],
   // The active variant feeds the code units U+00C2 U+00A9 instead, each of
   // which is expected to be escaped as its own UTF-8 sequence.
   ["/foo%2\u00c2\u00a9zbar", "/foo%2%C3%82%C2%A9zbar"],
   // Regular characters that are escaped should be unescaped.
   ["/foo%41%7a", "/fooAz"],
   // Funny characters that are unescaped should be escaped.
   ["/foo\u0009\u0091%91", "/foo%09%C2%91%91"],
   // An escaped NUL stays escaped, while the ordinary escaped character
   // after it (%51 -> Q) is still unescaped. (An older version of this
   // comment said the input should cause a failure; the expectation here is
   // a canonical string, not a failure.)
   ["/foo%00%51", "/foo%00Q"],
   // Some characters should be passed through unchanged regardless of esc.
   ["/(%28:%3A%29)", "/(%28:%3A%29)"],
   // Characters that are properly escaped should not have the case changed
   // of hex letters.
   ["/%3A%3a%3C%3c", "/%3A%3a%3C%3c"],
   // Funny characters that are unescaped should be escaped.
   ["/foo\tbar", "/foo%09bar"],
   // Backslashes should get converted to forward slashes.
   ["\\\\foo\\\\bar", "/foo/bar"],
   // Hashes found in paths (possibly only when the caller explicitly sets
   // the path on an already-parsed URL) should be escaped.
   // (Disabled because requires ability to set path directly.)
   // ["/foo#bar", "/foo%23bar"],
   // %7f should be allowed and %3D should not be unescaped (these were wrong
   // in a previous version).
   ["/%7Ffp3%3Eju%3Dduvgw%3Dd", "/%7Ffp3%3Eju%3Dduvgw%3Dd"],
   // @ should be passed through unchanged (escaped or unescaped).
   ["/@asdf%40", "/@asdf%40"],

   // ----- encoding tests -----
   // Basic conversions.
   ["/\u4f60\u597d\u4f60\u597d", "/%E4%BD%A0%E5%A5%BD%E4%BD%A0%E5%A5%BD"],
   // An invalid Unicode character (here the noncharacter U+FDD0) is expected
   // to come out as the escaped replacement character U+FFFD (%EF%BF%BD).
   // Original note: we only do validation on UTF-16 input, so this doesn't
   // happen on 8-bit.
   ["/\ufdd0zyx", "/%EF%BF%BDzyx"]
 ];

 // Declared explicitly so they are no longer implicit globals; at script top
 // level `var` still creates global bindings, so anything reading them by
 // name keeps working.
 var test_vector;
 var expected_result;

 // Run every vector exactly once.
 for (var i = 0; i < cases.length; ++i) {
   test_vector = cases[i][0];
   expected_result = cases[i][1];
   shouldBe("canonicalize('http://example.com" + test_vector + "')",
            "'http://example.com" + expected_result + "'");
 }

 // Flag set once the whole script has run to the end.
 var successfullyParsed = true;