Violate RFC 2396 and 3986 URI handling requirements.

author Amos Jeffries <squid3@treenet.co.nz>

Thu, 16 Jul 2015 05:09:30 +0000 (22:09 -0700)

committer Amos Jeffries <squid3@treenet.co.nz>

Thu, 16 Jul 2015 05:09:30 +0000 (22:09 -0700)
author Amos Jeffries <squid3@treenet.co.nz>
Thu, 16 Jul 2015 05:09:30 +0000 (22:09 -0700)
committer Amos Jeffries <squid3@treenet.co.nz>
Thu, 16 Jul 2015 05:09:30 +0000 (22:09 -0700)
diff --git a/src/http/one/Parser.cc b/src/http/one/Parser.cc

index 7352e606fa576e43ccd357beaed5da35c5f96f23..dca2c768102114a27ae4c26b1fbfb02bd23b4efe 100644 (file)
--- a/src/http/one/Parser.cc
+++ b/src/http/one/Parser.cc
@@ -43,7 +43,8 @@ Http::One::Parser::grabMimeBlock(const char *which, const size_t limit)
  {
      // MIME headers block exist in (only) HTTP/1.x and ICY
      const bool expectMime = (msgProtocol_.protocol == AnyP::PROTO_HTTP && msgProtocol_.major == 1) ||
-                            msgProtocol_.protocol == AnyP::PROTO_ICY;
+                            msgProtocol_.protocol == AnyP::PROTO_ICY ||
+                            hackExpectsMime_;
  
      if (expectMime) {
          /* NOTE: HTTP/0.9 messages do not have a mime header block.
diff --git a/src/http/one/Parser.h b/src/http/one/Parser.h

index e59202a3713edc1f72c18ef71983ea0a35753cb8..d63b3be9d53f5533ac8acbb8c8b6bb7aa607aff5 100644 (file)
--- a/src/http/one/Parser.h
+++ b/src/http/one/Parser.h
@@ -41,7 +41,7 @@ class Parser : public RefCountable
  public:
      typedef SBuf::size_type size_type;
  
-    Parser() : parseStatusCode(Http::scNone), parsingStage_(HTTP_PARSE_NONE) {}
+    Parser() : parseStatusCode(Http::scNone), parsingStage_(HTTP_PARSE_NONE), hackExpectsMime_(false) {}
      virtual ~Parser() {}
  
      /// Set this parser back to a default state.
@@ -131,6 +131,9 @@ protected:
  
      /// buffer holding the mime headers (if any)
      SBuf mimeHeaderBlock_;
+
+    /// Whether the invalid-HTTP-as-HTTP/0.9 hack expects a mime header block
+    bool hackExpectsMime_;
  };
  
  } // namespace One
diff --git a/src/http/one/RequestParser.cc b/src/http/one/RequestParser.cc

index 97545d8b29b92ed01b7a460c3f0ac3701321aab3..6da9f151066be89752eb6e0866bec9958c32e09b 100644 (file)
--- a/src/http/one/RequestParser.cc
+++ b/src/http/one/RequestParser.cc
@@ -261,6 +261,7 @@ Http::One::RequestParser::parseRequestFirstLine()
          WspDelim += CharacterSet::HTAB
                      + CharacterSet("VT,FF","\x0B\x0C")
                      + CharacterSet::CR;
+        debugs(74, 5, "using Parser relaxed WSP characters");
      }
  
      // only search for method if we have not yet found one
@@ -288,6 +289,8 @@ Http::One::RequestParser::parseRequestFirstLine()
      if (Config.onoff.relaxed_header_parser) {
          // whitespace tolerant
  
+        int warnOnError = (Config.onoff.relaxed_header_parser <= 0 ? DBG_IMPORTANT : 2);
+
          // NOTES:
          // * this would be static, except WspDelim changes with reconfigure
          // * HTTP-version charset is included by uriValidCharacters()
@@ -305,7 +308,7 @@ Http::One::RequestParser::parseRequestFirstLine()
                  uri_ = rTok.remaining();
                  msgProtocol_ = Http::ProtocolVersion(1, (*digit.rawContent() - '0'));
                  if (uri_.isEmpty()) {
-                    debugs(33, 5, "invalid request-line. missing URL");
+                    debugs(33, warnOnError, "invalid request-line. missing URL");
                      parseStatusCode = Http::scBadRequest;
                      return -1;
                  }
@@ -325,11 +328,77 @@ Http::One::RequestParser::parseRequestFirstLine()
                  return 1;
              }
  
-            debugs(33, 5, "invalid request-line. not HTTP");
+            debugs(33, warnOnError, "invalid request-line. not HTTP");
              parseStatusCode = Http::scBadRequest;
              return -1;
          }
  
+        if (!tok.atEnd()) {
+
+#if USE_HTTP_VIOLATIONS
+            /*
+             * RFC 3986 explicitly lists the characters permitted in URI.
+             * A non-permitted character was found somewhere in the request-line.
+             * However, as long as we can find the LF, accept the characters
+             * which we know are invalid in any URI but actively used.
+             */
+            LfDelim.add('\0'); // Java
+            LfDelim.add(' ');  // IIS
+            LfDelim.add('\"'); // Bing
+            LfDelim.add('\\'); // MSIE, Firefox
+            LfDelim.add('|');  // Amazon
+            LfDelim.add('^');  // Microsoft News
+
+            // other ASCII characters for which RFC 2396 has explicitly disallowed use
+            // since 1998 and which were not later permitted by RFC 3986 in 2005.
+            LfDelim.add('<');  // HTML embedded in URL
+            LfDelim.add('>');  // HTML embedded in URL
+            LfDelim.add('`');  // Shell Script embedded in URL
+            LfDelim.add('{');  // JSON or Javascript embedded in URL
+            LfDelim.add('}');  // JSON or Javascript embedded in URL
+
+            // reset the tokenizer from anything the above did, then seek the LF character.
+            tok.reset(buf_);
+
+            if (tok.prefix(line, LfDelim) && tok.skip('\n')) {
+
+                Http1::Tokenizer rTok(line);
+
+                // strip terminating CR (if any)
+                SBuf nil;
+                (void)rTok.suffix(nil,CharacterSet::CR); // optional CR in terminator
+                line = rTok.remaining();
+
+                // strip terminating 'WSP HTTP-version' (if any)
+                if (rTok.suffix(nil,CharacterSet::DIGIT) && rTok.skipSuffix(Http1magic) && rTok.suffix(nil,WspDelim)) {
+                    hackExpectsMime_ = true; // client thinks it's speaking HTTP, probably sent a mime block.
+                    uri_ = rTok.remaining();
+                } else
+                    uri_ = line; // no HTTP/1.x label found. Use the whole line.
+
+                if (uri_.isEmpty()) {
+                    debugs(33, warnOnError, "invalid request-line. missing URL");
+                    parseStatusCode = Http::scBadRequest;
+                    return -1;
+                }
+
+                debugs(33, warnOnError, "invalid request-line. treating as HTTP/0.9" << (hackExpectsMime_?" (with mime)":""));
+                msgProtocol_ = Http::ProtocolVersion(0,9);
+                parseStatusCode = Http::scOkay;
+                buf_ = tok.remaining(); // incremental parse checkpoint
+                return 1;
+
+            } else if (tok.atEnd()) {
+                debugs(74, 5, "Parser needs more data");
+                return 0;
+            }
+            // else, drop back to invalid request-line handling
+#endif
+            const SBuf t = tok.remaining();
+            debugs(33, warnOnError, "invalid request-line characters." << Raw("data", t.rawContent(), t.length()));
+            parseStatusCode = Http::scBadRequest;
+            return -1;
+        }
          debugs(74, 5, "Parser needs more data");
          return 0;
      }
author	Amos Jeffries <squid3@treenet.co.nz>
	Thu, 16 Jul 2015 05:09:30 +0000 (22:09 -0700)
committer	Amos Jeffries <squid3@treenet.co.nz>
	Thu, 16 Jul 2015 05:09:30 +0000 (22:09 -0700)
src/http/one/Parser.cc		patch \| blob \| blame \| history
src/http/one/Parser.h		patch \| blob \| blame \| history
src/http/one/RequestParser.cc		patch \| blob \| blame \| history