Revert "net/url, net/http/httputil: accept invalid percent encodings"

author Damien Neil <dneil@google.com>

Tue, 22 Nov 2022 17:22:13 +0000 (09:22 -0800)

committer Damien Neil <dneil@google.com>

Tue, 22 Nov 2022 18:25:01 +0000 (18:25 +0000)
author Damien Neil <dneil@google.com>
Tue, 22 Nov 2022 17:22:13 +0000 (09:22 -0800)
committer Damien Neil <dneil@google.com>
Tue, 22 Nov 2022 18:25:01 +0000 (18:25 +0000)
diff --git a/src/net/http/httputil/reverseproxy.go b/src/net/http/httputil/reverseproxy.go

index ad0221ff334ef2cf7da96bd4f0c0023656ee4f44..190279ca007d6c49228ff8d55571184b1276a888 100644 (file)
--- a/src/net/http/httputil/reverseproxy.go
+++ b/src/net/http/httputil/reverseproxy.go
@@ -816,9 +816,34 @@ func (c switchProtocolCopier) copyToBackend(errc chan<- error) {
  }
  
  func cleanQueryParams(s string) string {
-       if strings.Contains(s, ";") {
+       reencode := func(s string) string {
                 v, _ := url.ParseQuery(s)
                 return v.Encode()
         }
+       for i := 0; i < len(s); {
+               switch s[i] {
+               case ';':
+                       return reencode(s)
+               case '%':
+                       if i+2 >= len(s) || !ishex(s[i+1]) || !ishex(s[i+2]) {
+                               return reencode(s)
+                       }
+                       i += 3
+               default:
+                       i++
+               }
+       }
         return s
  }
+
+func ishex(c byte) bool {
+       switch {
+       case '0' <= c && c <= '9':
+               return true
+       case 'a' <= c && c <= 'f':
+               return true
+       case 'A' <= c && c <= 'F':
+               return true
+       }
+       return false
+}
diff --git a/src/net/http/httputil/reverseproxy_test.go b/src/net/http/httputil/reverseproxy_test.go

index 5a0237494c7d30852ebc483b3e32f14e458cd0bd..5b882d3a45638c54aee1bbba4fdfad13fe8b9502 100644 (file)
--- a/src/net/http/httputil/reverseproxy_test.go
+++ b/src/net/http/httputil/reverseproxy_test.go
@@ -1831,7 +1831,7 @@ func testReverseProxyQueryParameterSmuggling(t *testing.T, wantCleanQuery bool,
                 cleanQuery: "a=1",
         }, {
                 rawQuery:   "a=1&a=%zz&b=3",
-               cleanQuery: "a=1&a=%zz&b=3",
+               cleanQuery: "a=1&b=3",
         }} {
                 res, err := frontend.Client().Get(frontend.URL + "?" + test.rawQuery)
                 if err != nil {
diff --git a/src/net/url/url.go b/src/net/url/url.go

index e959ed4ee6c7d32992edd107af19130acc48f494..d530a50d40d19fe2467e021308a808e009877d41 100644 (file)
--- a/src/net/url/url.go
+++ b/src/net/url/url.go
@@ -198,24 +198,20 @@ func PathUnescape(s string) (string, error) {
  // unescape unescapes a string; the mode specifies
  // which section of the URL string is being unescaped.
  func unescape(s string, mode encoding) (string, error) {
-       isPercentEscape := func(s string, i int) bool {
-               return i+2 < len(s) && ishex(s[i+1]) && ishex(s[i+2])
-       }
-
         // Count %, check that they're well-formed.
         n := 0
         hasPlus := false
         for i := 0; i < len(s); {
                 switch s[i] {
                 case '%':
-                       if !isPercentEscape(s, i) {
-                               // https://url.spec.whatwg.org/#percent-encoded-bytes
-                               // says that % followed by non-hex characters
-                               // should be accepted with no error.
-                               i++
-                               continue
-                       }
                         n++
+                       if i+2 >= len(s) || !ishex(s[i+1]) || !ishex(s[i+2]) {
+                               s = s[i:]
+                               if len(s) > 3 {
+                                       s = s[:3]
+                               }
+                               return "", EscapeError(s)
+                       }
                         // Per https://tools.ietf.org/html/rfc3986#page-21
                         // in the host component %-encoding can only be used
                         // for non-ASCII bytes.
@@ -259,12 +255,8 @@ func unescape(s string, mode encoding) (string, error) {
         for i := 0; i < len(s); i++ {
                 switch s[i] {
                 case '%':
-                       if !isPercentEscape(s, i) {
-                               t.WriteByte('%')
-                       } else {
-                               t.WriteByte(unhex(s[i+1])<<4 | unhex(s[i+2]))
-                               i += 2
-                       }
+                       t.WriteByte(unhex(s[i+1])<<4 | unhex(s[i+2]))
+                       i += 2
                 case '+':
                         if mode == encodeQueryComponent {
                                 t.WriteByte(' ')
diff --git a/src/net/url/url_test.go b/src/net/url/url_test.go

index 899ec99e434976e0f8f019a304e7c5f017b2b59d..577cf631c835e1986ff65107dc1cd9fc32651cd3 100644 (file)
--- a/src/net/url/url_test.go
+++ b/src/net/url/url_test.go
@@ -704,11 +704,9 @@ var parseRequestURLTests = []struct {
         // These two cases are valid as textual representations as
         // described in RFC 4007, but are not valid as address
         // literals with IPv6 zone identifiers in URIs as described in
-       // RFC 6874. However, this seems to be overridden by
-       // https://url.spec.whatwg.org/#percent-encoded-bytes
-       // which permits unencoded % characters.
-       {"http://[fe80::1%en0]/", true},
-       {"http://[fe80::1%en0]:8080/", true},
+       // RFC 6874.
+       {"http://[fe80::1%en0]/", false},
+       {"http://[fe80::1%en0]:8080/", false},
  }
  
  func TestParseRequestURI(t *testing.T) {
@@ -898,28 +896,28 @@ var unescapeTests = []EscapeTest{
         },
         {
                 "%", // not enough characters after %
-               "%",
-               nil,
+               "",
+               EscapeError("%"),
         },
         {
                 "%a", // not enough characters after %
-               "%a",
-               nil,
+               "",
+               EscapeError("%a"),
         },
         {
                 "%1", // not enough characters after %
-               "%1",
-               nil,
+               "",
+               EscapeError("%1"),
         },
         {
                 "123%45%6", // not enough characters after %
-               "123E%6",
-               nil,
+               "",
+               EscapeError("%6"),
         },
         {
                 "%zzzzz", // invalid hex digits
-               "%zzzzz",
-               nil,
+               "",
+               EscapeError("%zz"),
         },
         {
                 "a+b",
@@ -1593,6 +1591,16 @@ func TestRequestURI(t *testing.T) {
         }
  }
  
+func TestParseFailure(t *testing.T) {
+       // Test that the first parse error is returned.
+       const url = "%gh&%ij"
+       _, err := ParseQuery(url)
+       errStr := fmt.Sprint(err)
+       if !strings.Contains(errStr, "%gh") {
+               t.Errorf(`ParseQuery(%q) returned error %q, want something containing %q"`, url, errStr, "%gh")
+       }
+}
+
  func TestParseErrors(t *testing.T) {
         tests := []struct {
                 in      string
@@ -2110,7 +2118,6 @@ func TestJoinPath(t *testing.T) {
                 {
                         base: "http://[fe80::1%en0]:8080/",
                         elem: []string{"/go"},
-                       out:  "http://[fe80::1%25en0]:8080/go",
                 },
                 {
                         base: "https://go.googlesource.com",
author	Damien Neil <dneil@google.com>
	Tue, 22 Nov 2022 17:22:13 +0000 (09:22 -0800)
committer	Damien Neil <dneil@google.com>
	Tue, 22 Nov 2022 18:25:01 +0000 (18:25 +0000)
src/net/http/httputil/reverseproxy.go		patch \| blob \| history
src/net/http/httputil/reverseproxy_test.go		patch \| blob \| history
src/net/url/url.go		patch \| blob \| history
src/net/url/url_test.go		patch \| blob \| history