| description("Canonicalization of paths."); |
| |
| cases = [ |
| ["/././foo", "/foo"], |
| ["/./.foo", "/.foo"], |
| ["/foo/.", "/foo/"], |
| ["/foo/./", "/foo/"], |
| // double dots followed by a slash or the end of the string count |
| ["/foo/bar/..", "/foo/"], |
| ["/foo/bar/../", "/foo/"], |
| // don't count double dots when they aren't followed by a slash |
| ["/foo/..bar", "/foo/..bar"], |
| // some in the middle |
| ["/foo/bar/../ton", "/foo/ton"], |
| ["/foo/bar/../ton/../../a", "/a"], |
| // we should not be able to go above the root |
| ["/foo/../../..", "/"], |
| ["/foo/../../../ton", "/ton"], |
| // escaped dots should be unescaped and treated the same as dots |
| ["/foo/%2e", "/foo/"], |
| ["/foo/%2e%2", "/foo/.%2"], |
| ["/foo/%2e./%2e%2e/.%2e/%2e.bar", "/..bar"], |
| // Multiple slashes in a row should be preserved and treated like empty |
| // directory names. |
| ["////../..", "//"], |
| ["/foo/bar//../..", "/foo/"], |
| ["/foo/bar//..", "/foo/bar/"], |
| ["/foo/bar/..", "/foo/"], |
| |
| // ----- escaping tests ----- |
| ["/foo", "/foo"], |
| // Valid escape sequence |
| ["/%20foo", "/%20foo"], |
| // Invalid escape sequence we should pass through unchanged. |
| ["/foo%", "/foo%"], |
| ["/foo%2", "/foo%2"], |
| // Invalid escape sequence: bad characters should be treated the same as |
| // the sourrounding text, not as escaped (in this case, UTF-8). |
| ["/foo%2zbar", "/foo%2zbar"], |
| // (Disabled because requires UTF8) |
| // ["/foo%2\xc2\xa9zbar", "/foo%2%C2%A9zbar"], |
| ["/foo%2\u00c2\u00a9zbar", "/foo%2%C3%82%C2%A9zbar"], |
| // Regular characters that are escaped should be unescaped |
| ["/foo%41%7a", "/fooAz"], |
| // Funny characters that are unescaped should be escaped |
| ["/foo\u0009\u0091%91", "/foo%09%C2%91%91"], |
| // Invalid characters that are escaped should cause a failure. |
| ["/foo%00%51", "/foo%00Q"], |
| // Some characters should be passed through unchanged regardless of esc. |
| ["/(%28:%3A%29)", "/(%28:%3A%29)"], |
| // Characters that are properly escaped should not have the case changed |
| // of hex letters. |
| ["/%3A%3a%3C%3c", "/%3A%3a%3C%3c"], |
| // Funny characters that are unescaped should be escaped |
| ["/foo\tbar", "/foo%09bar"], |
| // Backslashes should get converted to forward slashes |
| ["\\\\foo\\\\bar", "/foo/bar"], |
| // Hashes found in paths (possibly only when the caller explicitly sets |
| // the path on an already-parsed URL) should be escaped. |
| // (Disabled because requires ability to set path directly.) |
| // ["/foo#bar", "/foo%23bar"], |
| // %7f should be allowed and %3D should not be unescaped (these were wrong |
| // in a previous version). |
| ["/%7Ffp3%3Eju%3Dduvgw%3Dd", "/%7Ffp3%3Eju%3Dduvgw%3Dd"], |
| // @ should be passed through unchanged (escaped or unescaped). |
| ["/@asdf%40", "/@asdf%40"], |
| |
| // ----- encoding tests ----- |
| // Basic conversions |
| ["/\u4f60\u597d\u4f60\u597d", "/%E4%BD%A0%E5%A5%BD%E4%BD%A0%E5%A5%BD"], |
| // Invalid unicode characters should fail. We only do validation on |
| // UTF-16 input, so this doesn't happen on 8-bit. |
| ["/\ufdd0zyx", "/%EF%BF%BDzyx"], |
| |
| ]; |
| |
| for (var i = 0; i < cases.length; ++i) { |
| test_vector = cases[i][0]; |
| expected_result = cases[i][1]; |
| shouldBe("canonicalize('http://example.com" + test_vector + "')", |
| "'http://example.com" + expected_result + "'"); |
| } |
| |
| var successfullyParsed = true; |