aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorRuss Cox <rsc@golang.org>2015-08-05 22:12:16 -0400
committerRuss Cox <rsc@golang.org>2015-08-06 02:59:16 +0000
commitfced03a5c6dd22dd486106e3dd116510c28c6e4a (patch)
treea5bcc2f104eb3da8ccacd905b38dc1a8dc72ad0a
parente8be9a170c3044d7460a6b2c8349a723b1a21dd2 (diff)
downloadgo-fced03a5c6dd22dd486106e3dd116510c28c6e4a.tar.gz
go-fced03a5c6dd22dd486106e3dd116510c28c6e4a.zip
net/url: allow all valid host chars in RawPath
The old code was only allowing the chars we choose not to escape. We sometimes prefer to escape chars that do not strictly need it. Allowing those to be used in RawPath lets people override that preference, which is in fact the whole point of RawPath (new in Go 1.5). While we are here, also allow [ ] in RawPath. This is not strictly spec-compliant, but it is what modern browers do and what at least some people expect, and the [ ] do not cause any ambiguity (the usual reason they would be escaped, as they are part of the RFC gen-delims class). The argument for allowing them now instead of waiting until Go 1.6 is that this way RawPath has one fixed meaning at the time it is introduced, that we should not need to change or expand. Fixes #5684. Change-Id: If9c82a18f522d7ee1d10310a22821ada9286ee5c Reviewed-on: https://go-review.googlesource.com/13258 Reviewed-by: Andrew Gerrand <adg@golang.org>
-rw-r--r--src/net/url/url.go18
-rw-r--r--src/net/url/url_test.go24
2 files changed, 39 insertions, 3 deletions
diff --git a/src/net/url/url.go b/src/net/url/url.go
index efbb4c36e9..8ffad663d5 100644
--- a/src/net/url/url.go
+++ b/src/net/url/url.go
@@ -550,8 +550,22 @@ func (u *URL) EscapedPath() string {
// It must not contain any bytes that require escaping during path encoding.
func validEncodedPath(s string) bool {
for i := 0; i < len(s); i++ {
- if s[i] != '%' && shouldEscape(s[i], encodePath) {
- return false
+ // RFC 3986, Appendix A.
+ // pchar = unreserved / pct-encoded / sub-delims / ":" / "@".
+ // shouldEscape is not quite compliant with the RFC,
+ // so we check the sub-delims ourselves and let
+ // shouldEscape handle the others.
+ switch s[i] {
+ case '!', '$', '&', '\'', '(', ')', '*', '+', ',', ';', '=', ':', '@':
+ // ok
+ case '[', ']':
+ // ok - not specified in RFC 3986 but left alone by modern browsers
+ case '%':
+ // ok - percent encoded, will decode
+ default:
+ if shouldEscape(s[i], encodePath) {
+ return false
+ }
}
}
return true
diff --git a/src/net/url/url_test.go b/src/net/url/url_test.go
index 80a2b80efa..ff6e9e4541 100644
--- a/src/net/url/url_test.go
+++ b/src/net/url/url_test.go
@@ -392,7 +392,7 @@ var urltests = []URLTest{
},
"",
},
- // worst case host
+ // worst case host, still round trips
{
"scheme://!$&'()*+,;=hello!:port/path",
&URL{
@@ -402,6 +402,28 @@ var urltests = []URLTest{
},
"",
},
+ // worst case path, still round trips
+ {
+ "http://host/!$&'()*+,;=:@[hello]",
+ &URL{
+ Scheme: "http",
+ Host: "host",
+ Path: "/!$&'()*+,;=:@[hello]",
+ RawPath: "/!$&'()*+,;=:@[hello]",
+ },
+ "",
+ },
+ // golang.org/issue/5684
+ {
+ "http://example.com/oid/[order_id]",
+ &URL{
+ Scheme: "http",
+ Host: "example.com",
+ Path: "/oid/[order_id]",
+ RawPath: "/oid/[order_id]",
+ },
+ "",
+ },
}
// more useful string for debugging than fmt's struct printer