]> git.ipfire.org Git - thirdparty/squid.git/blob - src/http.cc
Supply AccessLogEntry (ALE) for more fast ACL checks. (#182)
[thirdparty/squid.git] / src / http.cc
1 /*
2 * Copyright (C) 1996-2018 The Squid Software Foundation and contributors
3 *
4 * Squid software is distributed under GPLv2+ license and includes
5 * contributions from numerous individuals and organizations.
6 * Please see the COPYING and CONTRIBUTORS files for details.
7 */
8
9 /* DEBUG: section 11 Hypertext Transfer Protocol (HTTP) */
10
11 /*
12 * Anonymizing patch by lutz@as-node.jena.thur.de
13 * have a look into http-anon.c to get more informations.
14 */
15
16 #include "squid.h"
17 #include "acl/FilledChecklist.h"
18 #include "base/AsyncJobCalls.h"
19 #include "base/TextException.h"
20 #include "base64.h"
21 #include "CachePeer.h"
22 #include "client_side.h"
23 #include "comm/Connection.h"
24 #include "comm/Read.h"
25 #include "comm/Write.h"
26 #include "CommRead.h"
27 #include "err_detail_type.h"
28 #include "errorpage.h"
29 #include "fd.h"
30 #include "fde.h"
31 #include "globals.h"
32 #include "http.h"
33 #include "http/one/ResponseParser.h"
34 #include "http/one/TeChunkedParser.h"
35 #include "http/Stream.h"
36 #include "HttpControlMsg.h"
37 #include "HttpHdrCc.h"
38 #include "HttpHdrContRange.h"
39 #include "HttpHdrSc.h"
40 #include "HttpHdrScTarget.h"
41 #include "HttpHeaderTools.h"
42 #include "HttpReply.h"
43 #include "HttpRequest.h"
44 #include "log/access_log.h"
45 #include "MemBuf.h"
46 #include "MemObject.h"
47 #include "neighbors.h"
48 #include "peer_proxy_negotiate_auth.h"
49 #include "profiler/Profiler.h"
50 #include "refresh.h"
51 #include "RefreshPattern.h"
52 #include "rfc1738.h"
53 #include "SquidConfig.h"
54 #include "SquidTime.h"
55 #include "StatCounters.h"
56 #include "Store.h"
57 #include "StrList.h"
58 #include "tools.h"
59 #include "URL.h"
60 #include "util.h"
61
62 #if USE_AUTH
63 #include "auth/UserRequest.h"
64 #endif
65 #if USE_DELAY_POOLS
66 #include "DelayPools.h"
67 #endif
68
/// Opens a try block. Must be paired with SQUID_EXIT_THROWING_CODE(), which
/// supplies the closing brace and the catch handler.
#define SQUID_ENTER_THROWING_CODE() try {
/// Closes the try block opened by SQUID_ENTER_THROWING_CODE().
/// Sets status to true when the enclosed code finished without throwing.
/// If a std::exception was thrown, logs its what() text and sets status to false.
#define SQUID_EXIT_THROWING_CODE(status) \
    status = true; \
    } \
    catch (const std::exception &e) { \
    debugs (11, 1, "Exception error:" << e.what()); \
    status = false; \
    }
77
78 CBDATA_CLASS_INIT(HttpStateData);
79
80 static const char *const crlf = "\r\n";
81
82 static void httpMaybeRemovePublic(StoreEntry *, Http::StatusCode);
83 static void copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, const HttpRequest * request,
84 HttpHeader * hdr_out, const int we_do_ranges, const Http::StateFlags &);
85
86 HttpStateData::HttpStateData(FwdState *theFwdState) :
87 AsyncJob("HttpStateData"),
88 Client(theFwdState),
89 lastChunk(0),
90 httpChunkDecoder(NULL),
91 payloadSeen(0),
92 payloadTruncated(0),
93 sawDateGoBack(false)
94 {
95 debugs(11,5,HERE << "HttpStateData " << this << " created");
96 ignoreCacheControl = false;
97 surrogateNoStore = false;
98 serverConnection = fwd->serverConnection();
99
100 if (fwd->serverConnection() != NULL)
101 _peer = cbdataReference(fwd->serverConnection()->getPeer()); /* might be NULL */
102
103 if (_peer) {
104 request->flags.proxying = true;
105 /*
106 * This NEIGHBOR_PROXY_ONLY check probably shouldn't be here.
107 * We might end up getting the object from somewhere else if,
108 * for example, the request to this neighbor fails.
109 */
110 if (_peer->options.proxy_only)
111 entry->releaseRequest(true);
112
113 #if USE_DELAY_POOLS
114 entry->setNoDelay(_peer->options.no_delay);
115 #endif
116 }
117
118 /*
119 * register the handler to free HTTP state data when the FD closes
120 */
121 typedef CommCbMemFunT<HttpStateData, CommCloseCbParams> Dialer;
122 closeHandler = JobCallback(9, 5, Dialer, this, HttpStateData::httpStateConnClosed);
123 comm_add_close_handler(serverConnection->fd, closeHandler);
124 }
125
126 HttpStateData::~HttpStateData()
127 {
128 /*
129 * don't forget that ~Client() gets called automatically
130 */
131
132 if (httpChunkDecoder)
133 delete httpChunkDecoder;
134
135 cbdataReferenceDone(_peer);
136
137 debugs(11,5, HERE << "HttpStateData " << this << " destroyed; " << serverConnection);
138 }
139
140 const Comm::ConnectionPointer &
141 HttpStateData::dataConnection() const
142 {
143 return serverConnection;
144 }
145
146 void
147 HttpStateData::httpStateConnClosed(const CommCloseCbParams &params)
148 {
149 debugs(11, 5, "httpStateFree: FD " << params.fd << ", httpState=" << params.data);
150 doneWithFwd = "httpStateConnClosed()"; // assume FwdState is monitoring too
151 mustStop("HttpStateData::httpStateConnClosed");
152 }
153
154 void
155 HttpStateData::httpTimeout(const CommTimeoutCbParams &)
156 {
157 debugs(11, 4, serverConnection << ": '" << entry->url() << "'");
158
159 if (entry->store_status == STORE_PENDING) {
160 fwd->fail(new ErrorState(ERR_READ_TIMEOUT, Http::scGatewayTimeout, fwd->request));
161 }
162
163 closeServer();
164 mustStop("HttpStateData::httpTimeout");
165 }
166
167 static StoreEntry *
168 findPreviouslyCachedEntry(StoreEntry *newEntry) {
169 assert(newEntry->mem_obj);
170 return newEntry->mem_obj->request ?
171 storeGetPublicByRequest(newEntry->mem_obj->request.getRaw()) :
172 storeGetPublic(newEntry->mem_obj->storeId(), newEntry->mem_obj->method);
173 }
174
175 /// Remove an existing public store entry if the incoming response (to be
176 /// stored in a currently private entry) is going to invalidate it.
177 static void
178 httpMaybeRemovePublic(StoreEntry * e, Http::StatusCode status)
179 {
180 int remove = 0;
181 int forbidden = 0;
182
183 // If the incoming response already goes into a public entry, then there is
184 // nothing to remove. This protects ready-for-collapsing entries as well.
185 if (!EBIT_TEST(e->flags, KEY_PRIVATE))
186 return;
187
188 // If the new/incoming response cannot be stored, then it does not
189 // compete with the old stored response for the public key, and the
190 // old stored response should be left as is.
191 if (e->mem_obj->request && !e->mem_obj->request->flags.cachable)
192 return;
193
194 switch (status) {
195
196 case Http::scOkay:
197
198 case Http::scNonAuthoritativeInformation:
199
200 case Http::scMultipleChoices:
201
202 case Http::scMovedPermanently:
203
204 case Http::scFound:
205
206 case Http::scSeeOther:
207
208 case Http::scGone:
209
210 case Http::scNotFound:
211 remove = 1;
212
213 break;
214
215 case Http::scForbidden:
216
217 case Http::scMethodNotAllowed:
218 forbidden = 1;
219
220 break;
221
222 #if WORK_IN_PROGRESS
223
224 case Http::scUnauthorized:
225 forbidden = 1;
226
227 break;
228
229 #endif
230
231 default:
232 #if QUESTIONABLE
233 /*
234 * Any 2xx response should eject previously cached entities...
235 */
236
237 if (status >= 200 && status < 300)
238 remove = 1;
239
240 #endif
241
242 break;
243 }
244
245 if (!remove && !forbidden)
246 return;
247
248 StoreEntry *pe = findPreviouslyCachedEntry(e);
249
250 if (pe != NULL) {
251 assert(e != pe);
252 #if USE_HTCP
253 neighborsHtcpClear(e, nullptr, e->mem_obj->request.getRaw(), e->mem_obj->method, HTCP_CLR_INVALIDATION);
254 #endif
255 pe->release(true);
256 }
257
258 /** \par
259 * Also remove any cached HEAD response in case the object has
260 * changed.
261 */
262 if (e->mem_obj->request)
263 pe = storeGetPublicByRequestMethod(e->mem_obj->request.getRaw(), Http::METHOD_HEAD);
264 else
265 pe = storeGetPublic(e->mem_obj->storeId(), Http::METHOD_HEAD);
266
267 if (pe != NULL) {
268 assert(e != pe);
269 #if USE_HTCP
270 neighborsHtcpClear(e, nullptr, e->mem_obj->request.getRaw(), HttpRequestMethod(Http::METHOD_HEAD), HTCP_CLR_INVALIDATION);
271 #endif
272 pe->release(true);
273 }
274 }
275
276 void
277 HttpStateData::processSurrogateControl(HttpReply *reply)
278 {
279 if (request->flags.accelerated && reply->surrogate_control) {
280 HttpHdrScTarget *sctusable = reply->surrogate_control->getMergedTarget(Config.Accel.surrogate_id);
281
282 if (sctusable) {
283 if (sctusable->hasNoStore() ||
284 (Config.onoff.surrogate_is_remote
285 && sctusable->noStoreRemote())) {
286 surrogateNoStore = true;
287 // Be conservative for now and make it non-shareable because
288 // there is no enough information here to make the decision.
289 entry->makePrivate(false);
290 }
291
292 /* The HttpHeader logic cannot tell if the header it's parsing is a reply to an
293 * accelerated request or not...
294 * Still, this is an abstraction breach. - RC
295 */
296 if (sctusable->hasMaxAge()) {
297 if (sctusable->maxAge() < sctusable->maxStale())
298 reply->expires = reply->date + sctusable->maxAge();
299 else
300 reply->expires = reply->date + sctusable->maxStale();
301
302 /* And update the timestamps */
303 entry->timestampsSet();
304 }
305
306 /* We ignore cache-control directives as per the Surrogate specification */
307 ignoreCacheControl = true;
308
309 delete sctusable;
310 }
311 }
312 }
313
314 HttpStateData::ReuseDecision::Answers
315 HttpStateData::reusableReply(HttpStateData::ReuseDecision &decision)
316 {
317 HttpReply const *rep = finalReply();
318 HttpHeader const *hdr = &rep->header;
319 const char *v;
320 #if USE_HTTP_VIOLATIONS
321
322 const RefreshPattern *R = NULL;
323
324 /* This strange looking define first looks up the refresh pattern
325 * and then checks if the specified flag is set. The main purpose
326 * of this is to simplify the refresh pattern lookup and USE_HTTP_VIOLATIONS
327 * condition
328 */
329 #define REFRESH_OVERRIDE(flag) \
330 ((R = (R ? R : refreshLimits(entry->mem_obj->storeId()))) , \
331 (R && R->flags.flag))
332 #else
333 #define REFRESH_OVERRIDE(flag) 0
334 #endif
335
336 if (EBIT_TEST(entry->flags, RELEASE_REQUEST))
337 return decision.make(ReuseDecision::doNotCacheButShare, "the entry has been released");
338
339 // RFC 7234 section 4: a cache MUST use the most recent response
340 // (as determined by the Date header field)
341 // TODO: whether such responses could be shareable?
342 if (sawDateGoBack)
343 return decision.make(ReuseDecision::reuseNot, "the response has an older date header");
344
345 // Check for Surrogate/1.0 protocol conditions
346 // NP: reverse-proxy traffic our parent server has instructed us never to cache
347 if (surrogateNoStore)
348 return decision.make(ReuseDecision::reuseNot, "Surrogate-Control:no-store");
349
350 // RFC 2616: HTTP/1.1 Cache-Control conditions
351 if (!ignoreCacheControl) {
352 // XXX: check to see if the request headers alone were enough to prevent caching earlier
353 // (ie no-store request header) no need to check those all again here if so.
354 // for now we are not reliably doing that so we waste CPU re-checking request CC
355
356 // RFC 2616 section 14.9.2 - MUST NOT cache any response with request CC:no-store
357 if (request && request->cache_control && request->cache_control->hasNoStore() &&
358 !REFRESH_OVERRIDE(ignore_no_store))
359 return decision.make(ReuseDecision::reuseNot,
360 "client request Cache-Control:no-store");
361
362 // NP: request CC:no-cache only means cache READ is forbidden. STORE is permitted.
363 if (rep->cache_control && rep->cache_control->hasNoCacheWithParameters()) {
364 /* TODO: we are allowed to cache when no-cache= has parameters.
365 * Provided we strip away any of the listed headers unless they are revalidated
366 * successfully (ie, must revalidate AND these headers are prohibited on stale replies).
367 * That is a bit tricky for squid right now so we avoid caching entirely.
368 */
369 return decision.make(ReuseDecision::reuseNot,
370 "server reply Cache-Control:no-cache has parameters");
371 }
372
373 // NP: request CC:private is undefined. We ignore.
374 // NP: other request CC flags are limiters on HIT/MISS. We don't care about here.
375
376 // RFC 2616 section 14.9.2 - MUST NOT cache any response with CC:no-store
377 if (rep->cache_control && rep->cache_control->hasNoStore() &&
378 !REFRESH_OVERRIDE(ignore_no_store))
379 return decision.make(ReuseDecision::reuseNot,
380 "server reply Cache-Control:no-store");
381
382 // RFC 2616 section 14.9.1 - MUST NOT cache any response with CC:private in a shared cache like Squid.
383 // CC:private overrides CC:public when both are present in a response.
384 // TODO: add a shared/private cache configuration possibility.
385 if (rep->cache_control &&
386 rep->cache_control->hasPrivate() &&
387 !REFRESH_OVERRIDE(ignore_private)) {
388 /* TODO: we are allowed to cache when private= has parameters.
389 * Provided we strip away any of the listed headers unless they are revalidated
390 * successfully (ie, must revalidate AND these headers are prohibited on stale replies).
391 * That is a bit tricky for squid right now so we avoid caching entirely.
392 */
393 return decision.make(ReuseDecision::reuseNot,
394 "server reply Cache-Control:private");
395 }
396 }
397
398 // RFC 2068, sec 14.9.4 - MUST NOT cache any response with Authentication UNLESS certain CC controls are present
399 // allow HTTP violations to IGNORE those controls (ie re-block caching Auth)
400 if (request && (request->flags.auth || request->flags.authSent)) {
401 if (!rep->cache_control)
402 return decision.make(ReuseDecision::reuseNot,
403 "authenticated and server reply missing Cache-Control");
404
405 if (ignoreCacheControl)
406 return decision.make(ReuseDecision::reuseNot,
407 "authenticated and ignoring Cache-Control");
408
409 bool mayStore = false;
410 // HTTPbis pt6 section 3.2: a response CC:public is present
411 if (rep->cache_control->hasPublic()) {
412 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:public");
413 mayStore = true;
414
415 // HTTPbis pt6 section 3.2: a response CC:must-revalidate is present
416 } else if (rep->cache_control->hasMustRevalidate()) {
417 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:must-revalidate");
418 mayStore = true;
419
420 #if USE_HTTP_VIOLATIONS
421 // NP: given the must-revalidate exception we should also be able to exempt no-cache.
422 // HTTPbis WG verdict on this is that it is omitted from the spec due to being 'unexpected' by
423 // some. The caching+revalidate is not exactly unsafe though with Squids interpretation of no-cache
424 // (without parameters) as equivalent to must-revalidate in the reply.
425 } else if (rep->cache_control->hasNoCacheWithoutParameters()) {
426 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:no-cache (equivalent to must-revalidate)");
427 mayStore = true;
428 #endif
429
430 // HTTPbis pt6 section 3.2: a response CC:s-maxage is present
431 } else if (rep->cache_control->hasSMaxAge()) {
432 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:s-maxage");
433 mayStore = true;
434 }
435
436 if (!mayStore)
437 return decision.make(ReuseDecision::reuseNot, "authenticated transaction");
438
439 // NP: response CC:no-cache is equivalent to CC:must-revalidate,max-age=0. We MAY cache, and do so.
440 // NP: other request CC flags are limiters on HIT/MISS/REFRESH. We don't care about here.
441 }
442
443 /* HACK: The "multipart/x-mixed-replace" content type is used for
444 * continuous push replies. These are generally dynamic and
445 * probably should not be cachable
446 */
447 if ((v = hdr->getStr(Http::HdrType::CONTENT_TYPE)))
448 if (!strncasecmp(v, "multipart/x-mixed-replace", 25))
449 return decision.make(ReuseDecision::reuseNot, "Content-Type:multipart/x-mixed-replace");
450
451 // TODO: if possible, provide more specific message for each status code
452 static const char *shareableError = "shareable error status code";
453 static const char *nonShareableError = "non-shareable error status code";
454 ReuseDecision::Answers statusAnswer = ReuseDecision::reuseNot;
455 const char *statusReason = nonShareableError;
456
457 switch (rep->sline.status()) {
458
459 /* There are several situations when a non-cacheable response may be
460 * still shareable (e.g., among collapsed clients). We assume that these
461 * are 3xx and 5xx responses, indicating server problems and some of
462 * 4xx responses, common for all clients with a given cache key (e.g.,
463 * 404 Not Found or 414 URI Too Long). On the other hand, we should not
464 * share non-cacheable client-specific errors, such as 400 Bad Request
465 * or 406 Not Acceptable.
466 */
467
468 /* Responses that are cacheable */
469
470 case Http::scOkay:
471
472 case Http::scNonAuthoritativeInformation:
473
474 case Http::scMultipleChoices:
475
476 case Http::scMovedPermanently:
477 case Http::scPermanentRedirect:
478
479 case Http::scGone:
480 /*
481 * Don't cache objects that need to be refreshed on next request,
482 * unless we know how to refresh it.
483 */
484
485 if (refreshIsCachable(entry) || REFRESH_OVERRIDE(store_stale))
486 decision.make(ReuseDecision::cachePositively, "refresh check returned cacheable");
487 else
488 decision.make(ReuseDecision::doNotCacheButShare, "refresh check returned non-cacheable");
489 break;
490
491 /* Responses that only are cacheable if the server says so */
492
493 case Http::scFound:
494 case Http::scTemporaryRedirect:
495 if (rep->date <= 0)
496 decision.make(ReuseDecision::doNotCacheButShare, "Date is missing/invalid");
497 else if (rep->expires > rep->date)
498 decision.make(ReuseDecision::cachePositively, "Expires > Date");
499 else
500 decision.make(ReuseDecision::doNotCacheButShare, "Expires <= Date");
501 break;
502
503 /* These responses can be negatively cached. Most can also be shared. */
504 case Http::scNoContent:
505 case Http::scUseProxy:
506 case Http::scForbidden:
507 case Http::scNotFound:
508 case Http::scMethodNotAllowed:
509 case Http::scUriTooLong:
510 case Http::scInternalServerError:
511 case Http::scNotImplemented:
512 case Http::scBadGateway:
513 case Http::scServiceUnavailable:
514 case Http::scGatewayTimeout:
515 case Http::scMisdirectedRequest:
516 statusAnswer = ReuseDecision::doNotCacheButShare;
517 statusReason = shareableError;
518 // fall through to the actual decision making below
519
520 case Http::scBadRequest: // no sharing; perhaps the server did not like something specific to this request
521 #if USE_HTTP_VIOLATIONS
522 if (Config.negativeTtl > 0)
523 decision.make(ReuseDecision::cacheNegatively, "Config.negativeTtl > 0");
524 else
525 #endif
526 decision.make(statusAnswer, statusReason);
527 break;
528
529 /* these responses can never be cached, some
530 of them can be shared though */
531 case Http::scSeeOther:
532 case Http::scNotModified:
533 case Http::scUnauthorized:
534 case Http::scProxyAuthenticationRequired:
535 case Http::scPaymentRequired:
536 case Http::scInsufficientStorage:
537 // TODO: use more specific reason for non-error status codes
538 decision.make(ReuseDecision::doNotCacheButShare, shareableError);
539 break;
540
541 case Http::scPartialContent: /* Not yet supported. TODO: make shareable for suitable ranges */
542 case Http::scNotAcceptable:
543 case Http::scRequestTimeout: // TODO: is this shareable?
544 case Http::scConflict: // TODO: is this shareable?
545 case Http::scLengthRequired:
546 case Http::scPreconditionFailed:
547 case Http::scPayloadTooLarge:
548 case Http::scUnsupportedMediaType:
549 case Http::scUnprocessableEntity:
550 case Http::scLocked: // TODO: is this shareable?
551 case Http::scFailedDependency:
552 case Http::scRequestedRangeNotSatisfied:
553 case Http::scExpectationFailed:
554 case Http::scInvalidHeader: /* Squid header parsing error */
555 case Http::scHeaderTooLarge:
556 decision.make(ReuseDecision::reuseNot, nonShareableError);
557 break;
558
559 default:
560 /* RFC 2616 section 6.1.1: an unrecognized response MUST NOT be cached. */
561 decision.make(ReuseDecision::reuseNot, "unknown status code");
562 break;
563 }
564
565 return decision.answer;
566 }
567
568 /// assemble a variant key (vary-mark) from the given Vary header and HTTP request
569 static void
570 assembleVaryKey(String &vary, SBuf &vstr, const HttpRequest &request)
571 {
572 static const SBuf asterisk("*");
573 const char *pos = nullptr;
574 const char *item = nullptr;
575 int ilen = 0;
576
577 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
578 SBuf name(item, ilen);
579 if (name == asterisk) {
580 vstr = asterisk;
581 break;
582 }
583 name.toLower();
584 if (!vstr.isEmpty())
585 vstr.append(", ", 2);
586 vstr.append(name);
587 String hdr(request.header.getByName(name));
588 const char *value = hdr.termedBuf();
589 if (value) {
590 value = rfc1738_escape_part(value);
591 vstr.append("=\"", 2);
592 vstr.append(value);
593 vstr.append("\"", 1);
594 }
595
596 hdr.clean();
597 }
598 }
599
600 /*
601 * For Vary, store the relevant request headers as
602 * virtual headers in the reply
603 * Returns an empty SBuf if the variance cannot be stored
604 */
605 SBuf
606 httpMakeVaryMark(HttpRequest * request, HttpReply const * reply)
607 {
608 SBuf vstr;
609 String vary;
610
611 vary = reply->header.getList(Http::HdrType::VARY);
612 assembleVaryKey(vary, vstr, *request);
613
614 #if X_ACCELERATOR_VARY
615 vary.clean();
616 vary = reply->header.getList(Http::HdrType::HDR_X_ACCELERATOR_VARY);
617 assembleVaryKey(vary, vstr, *request);
618 #endif
619
620 debugs(11, 3, vstr);
621 return vstr;
622 }
623
624 void
625 HttpStateData::keepaliveAccounting(HttpReply *reply)
626 {
627 if (flags.keepalive)
628 if (_peer)
629 ++ _peer->stats.n_keepalives_sent;
630
631 if (reply->keep_alive) {
632 if (_peer)
633 ++ _peer->stats.n_keepalives_recv;
634
635 if (Config.onoff.detect_broken_server_pconns
636 && reply->bodySize(request->method) == -1 && !flags.chunked) {
637 debugs(11, DBG_IMPORTANT, "keepaliveAccounting: Impossible keep-alive header from '" << entry->url() << "'" );
638 // debugs(11, 2, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------" );
639 flags.keepalive_broken = true;
640 }
641 }
642 }
643
644 void
645 HttpStateData::checkDateSkew(HttpReply *reply)
646 {
647 if (reply->date > -1 && !_peer) {
648 int skew = abs((int)(reply->date - squid_curtime));
649
650 if (skew > 86400)
651 debugs(11, 3, "" << request->url.host() << "'s clock is skewed by " << skew << " seconds!");
652 }
653 }
654
/**
 * Parses the server response status line and headers accumulated in inBuf
 * and, once they are complete, installs the resulting HttpReply as the
 * virgin reply. Returns without parsing anything if inBuf is empty, and
 * returns early if the parser needs more data and EOF has not been seen.
 * 1xx replies are handed to handle1xx() instead of becoming the virgin reply.
 *
 * Legacy note: this creates the error page itself. It is likely that the
 * forward-ported reply header max size patch generates non-HTTP-conformant
 * error pages, in which case the errors should be 'BAD_GATEWAY' etc.
 */
void
HttpStateData::processReplyHeader()
{
    /** Creates a blank header. If this routine is made incremental, this will not do */

    /* NP: all exit points to this function MUST call ctx_exit(ctx) */
    Ctx ctx = ctx_enter(entry->mem_obj->urlXXX());

    debugs(11, 3, "processReplyHeader: key '" << entry->getMD5Text() << "'");

    // headers must be parsed only once per reply
    assert(!flags.headers_parsed);

    // nothing to parse yet
    if (!inBuf.length()) {
        ctx_exit(ctx);
        return;
    }

    /* Attempt to parse the first line; this will define where the protocol, status, reason-phrase and header begin */
    {
        // the parser is created on first use and reused across calls until parsing completes
        if (hp == NULL)
            hp = new Http1::ResponseParser;

        bool parsedOk = hp->parse(inBuf);

        // sync the buffers after parsing.
        inBuf = hp->remaining();

        if (hp->needsMoreData()) {
            if (eof) { // no more data coming
                /* Bug 2879: Replies may terminate with \r\n then EOF instead of \r\n\r\n.
                 * We also may receive truncated responses.
                 * Ensure here that we have at minimum two \r\n when EOF is seen.
                 */
                inBuf.append("\r\n\r\n", 4);
                // retry the parse
                parsedOk = hp->parse(inBuf);
                // sync the buffers after parsing.
                inBuf = hp->remaining();
            } else {
                debugs(33, 5, "Incomplete response, waiting for end of response headers");
                ctx_exit(ctx);
                return;
            }
        }

        if (!parsedOk) {
            // unrecoverable parsing error
            // TODO: Use Raw! XXX: inBuf no longer has the [beginning of the] malformed header.
            debugs(11, 3, "Non-HTTP-compliant header:\n---------\n" << inBuf << "\n----------");
            flags.headers_parsed = true;
            // install a reply that carries only the status code reported by the parser
            HttpReply *newrep = new HttpReply;
            newrep->sline.set(Http::ProtocolVersion(), hp->parseStatusCode);
            setVirginReply(newrep);
            ctx_exit(ctx);
            return;
        }
    }

    /* We know the whole response is in parser now */
    debugs(11, 2, "HTTP Server " << serverConnection);
    debugs(11, 2, "HTTP Server RESPONSE:\n---------\n" <<
           hp->messageProtocol() << " " << hp->messageStatus() << " " << hp->reasonPhrase() << "\n" <<
           hp->mimeHeader() <<
           "----------");

    // reset payload tracking to begin after message headers
    payloadSeen = inBuf.length();

    HttpReply *newrep = new HttpReply;
    // XXX: RFC 7230 indicates we MAY ignore the reason phrase,
    // and use an empty string on unknown status.
    // We do that now to avoid performance regression from using SBuf::c_str()
    newrep->sline.set(Http::ProtocolVersion(1,1), hp->messageStatus() /* , hp->reasonPhrase() */);
    // overwrite the placeholder version with what the parser actually saw
    newrep->sline.protocol = newrep->sline.version.protocol = hp->messageProtocol().protocol;
    newrep->sline.version.major = hp->messageProtocol().major;
    newrep->sline.version.minor = hp->messageProtocol().minor;

    // parse headers
    if (!newrep->parseHeader(*hp)) {
        // XXX: when Http::ProtocolVersion is a function, remove this hack. just set with messageProtocol()
        newrep->sline.set(Http::ProtocolVersion(), Http::scInvalidHeader);
        newrep->sline.version.protocol = hp->messageProtocol().protocol;
        newrep->sline.version.major = hp->messageProtocol().major;
        newrep->sline.version.minor = hp->messageProtocol().minor;
        debugs(11, 2, "error parsing response headers mime block");
    }

    // done with Parser, now process using the HttpReply
    hp = NULL;

    // record whether the reply came from an https or http URL
    newrep->sources |= request->url.getScheme() == AnyP::PROTO_HTTPS ? Http::Message::srcHttps : Http::Message::srcHttp;

    newrep->removeStaleWarnings();

    // 1xx control messages are handled separately and never become the virgin reply here
    if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->sline.status() >= 100 && newrep->sline.status() < 200) {
        handle1xx(newrep);
        ctx_exit(ctx);
        return;
    }

    // set up chunked decoding when the HTTP reply says its body is chunked
    flags.chunked = false;
    if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->header.chunked()) {
        flags.chunked = true;
        httpChunkDecoder = new Http1::TeChunkedParser;
    }

    if (!peerSupportsConnectionPinning())
        request->flags.connectionAuthDisabled = true;

    HttpReply *vrep = setVirginReply(newrep);
    flags.headers_parsed = true;

    keepaliveAccounting(vrep);

    checkDateSkew(vrep);

    processSurrogateControl (vrep);

    request->hier.peer_reply_status = newrep->sline.status();

    ctx_exit(ctx);
}
783
784 /// ignore or start forwarding the 1xx response (a.k.a., control message)
785 void
786 HttpStateData::handle1xx(HttpReply *reply)
787 {
788 HttpReply::Pointer msg(reply); // will destroy reply if unused
789
790 // one 1xx at a time: we must not be called while waiting for previous 1xx
791 Must(!flags.handling1xx);
792 flags.handling1xx = true;
793
794 if (!request->canHandle1xx() || request->forcedBodyContinuation) {
795 debugs(11, 2, "ignoring 1xx because it is " << (request->forcedBodyContinuation ? "already sent" : "not supported by client"));
796 proceedAfter1xx();
797 return;
798 }
799
800 #if USE_HTTP_VIOLATIONS
801 // check whether the 1xx response forwarding is allowed by squid.conf
802 if (Config.accessList.reply) {
803 ACLFilledChecklist ch(Config.accessList.reply, originalRequest().getRaw());
804 ch.al = fwd->al;
805 ch.reply = reply;
806 ch.syncAle(originalRequest().getRaw(), nullptr);
807 HTTPMSGLOCK(ch.reply);
808 if (!ch.fastCheck().allowed()) { // TODO: support slow lookups?
809 debugs(11, 3, HERE << "ignoring denied 1xx");
810 proceedAfter1xx();
811 return;
812 }
813 }
814 #endif // USE_HTTP_VIOLATIONS
815
816 debugs(11, 2, HERE << "forwarding 1xx to client");
817
818 // the Sink will use this to call us back after writing 1xx to the client
819 typedef NullaryMemFunT<HttpStateData> CbDialer;
820 const AsyncCall::Pointer cb = JobCallback(11, 3, CbDialer, this,
821 HttpStateData::proceedAfter1xx);
822 CallJobHere1(11, 4, request->clientConnectionManager, ConnStateData,
823 ConnStateData::sendControlMsg, HttpControlMsg(msg, cb));
824 // If the call is not fired, then the Sink is gone, and HttpStateData
825 // will terminate due to an aborted store entry or another similar error.
826 // If we get stuck, it is not handle1xx fault if we could get stuck
827 // for similar reasons without a 1xx response.
828 }
829
830 /// restores state and resumes processing after 1xx is ignored or forwarded
831 void
832 HttpStateData::proceedAfter1xx()
833 {
834 Must(flags.handling1xx);
835 debugs(11, 2, "continuing with " << payloadSeen << " bytes in buffer after 1xx");
836 CallJobHere(11, 3, this, HttpStateData, HttpStateData::processReply);
837 }
838
839 /**
840 * returns true if the peer can support connection pinning
841 */
842 bool
843 HttpStateData::peerSupportsConnectionPinning() const
844 {
845 if (!_peer)
846 return true;
847
848 /*If this peer does not support connection pinning (authenticated
849 connections) return false
850 */
851 if (!_peer->connection_auth)
852 return false;
853
854 const HttpReplyPointer rep(entry->mem_obj->getReply());
855
856 /*The peer supports connection pinning and the http reply status
857 is not unauthorized, so the related connection can be pinned
858 */
859 if (rep->sline.status() != Http::scUnauthorized)
860 return true;
861
862 /*The server respond with Http::scUnauthorized and the peer configured
863 with "connection-auth=on" we know that the peer supports pinned
864 connections
865 */
866 if (_peer->connection_auth == 1)
867 return true;
868
869 /*At this point peer has configured with "connection-auth=auto"
870 parameter so we need some extra checks to decide if we are going
871 to allow pinned connections or not
872 */
873
874 /*if the peer configured with originserver just allow connection
875 pinning (squid 2.6 behaviour)
876 */
877 if (_peer->options.originserver)
878 return true;
879
880 /*if the connections it is already pinned it is OK*/
881 if (request->flags.pinned)
882 return true;
883
884 /*Allow pinned connections only if the Proxy-support header exists in
885 reply and has in its list the "Session-Based-Authentication"
886 which means that the peer supports connection pinning.
887 */
888 if (rep->header.hasListMember(Http::HdrType::PROXY_SUPPORT, "Session-Based-Authentication", ','))
889 return true;
890
891 return false;
892 }
893
894 // Called when we parsed (and possibly adapted) the headers but
895 // had not starting storing (a.k.a., sending) the body yet.
896 void
897 HttpStateData::haveParsedReplyHeaders()
898 {
899 Client::haveParsedReplyHeaders();
900
901 Ctx ctx = ctx_enter(entry->mem_obj->urlXXX());
902 HttpReply *rep = finalReply();
903 const Http::StatusCode statusCode = rep->sline.status();
904
905 entry->timestampsSet();
906
907 /* Check if object is cacheable or not based on reply code */
908 debugs(11, 3, "HTTP CODE: " << statusCode);
909
910 if (StoreEntry *oldEntry = findPreviouslyCachedEntry(entry)) {
911 oldEntry->lock("HttpStateData::haveParsedReplyHeaders");
912 sawDateGoBack = rep->olderThan(oldEntry->getReply());
913 oldEntry->unlock("HttpStateData::haveParsedReplyHeaders");
914 }
915
916 if (neighbors_do_private_keys && !sawDateGoBack)
917 httpMaybeRemovePublic(entry, rep->sline.status());
918
919 bool varyFailure = false;
920 if (rep->header.has(Http::HdrType::VARY)
921 #if X_ACCELERATOR_VARY
922 || rep->header.has(Http::HdrType::HDR_X_ACCELERATOR_VARY)
923 #endif
924 ) {
925 const SBuf vary(httpMakeVaryMark(request.getRaw(), rep));
926
927 if (vary.isEmpty()) {
928 // TODO: check whether such responses are shareable.
929 // Do not share for now.
930 entry->makePrivate(false);
931 if (!fwd->reforwardableStatus(rep->sline.status()))
932 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
933 varyFailure = true;
934 } else {
935 entry->mem_obj->vary_headers = vary;
936
937 // RFC 7231 section 7.1.4
938 // Vary:* can be cached, but has mandatory revalidation
939 static const SBuf asterisk("*");
940 if (vary == asterisk)
941 EBIT_SET(entry->flags, ENTRY_REVALIDATE_ALWAYS);
942 }
943 }
944
945 if (!varyFailure) {
946 /*
947 * If its not a reply that we will re-forward, then
948 * allow the client to get it.
949 */
950 if (!fwd->reforwardableStatus(rep->sline.status()))
951 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
952
953 ReuseDecision decision(entry, statusCode);
954
955 switch (reusableReply(decision)) {
956
957 case ReuseDecision::reuseNot:
958 entry->makePrivate(false);
959 break;
960
961 case ReuseDecision::cachePositively:
962 if (!entry->makePublic()) {
963 decision.make(ReuseDecision::doNotCacheButShare, "public key creation error");
964 entry->makePrivate(true);
965 }
966 break;
967
968 case ReuseDecision::cacheNegatively:
969 if (!entry->cacheNegatively()) {
970 decision.make(ReuseDecision::doNotCacheButShare, "public key creation error");
971 entry->makePrivate(true);
972 }
973 break;
974
975 case ReuseDecision::doNotCacheButShare:
976 entry->makePrivate(true);
977 break;
978
979 default:
980 assert(0);
981 break;
982 }
983 debugs(11, 3, "decided: " << decision);
984 }
985
986 if (!ignoreCacheControl) {
987 if (rep->cache_control) {
988 // We are required to revalidate on many conditions.
989 // For security reasons we do so even if storage was caused by refresh_pattern ignore-* option
990
991 // CC:must-revalidate or CC:proxy-revalidate
992 const bool ccMustRevalidate = (rep->cache_control->hasProxyRevalidate() || rep->cache_control->hasMustRevalidate());
993
994 // CC:no-cache (only if there are no parameters)
995 const bool ccNoCacheNoParams = rep->cache_control->hasNoCacheWithoutParameters();
996
997 // CC:s-maxage=N
998 const bool ccSMaxAge = rep->cache_control->hasSMaxAge();
999
1000 // CC:private (yes, these can sometimes be stored)
1001 const bool ccPrivate = rep->cache_control->hasPrivate();
1002
1003 if (ccNoCacheNoParams || ccPrivate)
1004 EBIT_SET(entry->flags, ENTRY_REVALIDATE_ALWAYS);
1005 else if (ccMustRevalidate || ccSMaxAge)
1006 EBIT_SET(entry->flags, ENTRY_REVALIDATE_STALE);
1007 }
1008 #if USE_HTTP_VIOLATIONS // response header Pragma::no-cache is undefined in HTTP
1009 else {
1010 // Expensive calculation. So only do it IF the CC: header is not present.
1011
1012 /* HACK: Pragma: no-cache in _replies_ is not documented in HTTP,
1013 * but servers like "Active Imaging Webcast/2.0" sure do use it */
1014 if (rep->header.has(Http::HdrType::PRAGMA) &&
1015 rep->header.hasListMember(Http::HdrType::PRAGMA,"no-cache",','))
1016 EBIT_SET(entry->flags, ENTRY_REVALIDATE_ALWAYS);
1017 }
1018 #endif
1019 }
1020
1021 #if HEADERS_LOG
1022 headersLog(1, 0, request->method, rep);
1023
1024 #endif
1025
1026 ctx_exit(ctx);
1027 }
1028
1029 HttpStateData::ConnectionStatus
1030 HttpStateData::statusIfComplete() const
1031 {
1032 const HttpReply *rep = virginReply();
1033 /** \par
1034 * If the reply wants to close the connection, it takes precedence */
1035
1036 static SBuf close("close", 5);
1037 if (httpHeaderHasConnDir(&rep->header, close))
1038 return COMPLETE_NONPERSISTENT_MSG;
1039
1040 /** \par
1041 * If we didn't send a keep-alive request header, then this
1042 * can not be a persistent connection.
1043 */
1044 if (!flags.keepalive)
1045 return COMPLETE_NONPERSISTENT_MSG;
1046
1047 /** \par
1048 * If we haven't sent the whole request then this can not be a persistent
1049 * connection.
1050 */
1051 if (!flags.request_sent) {
1052 debugs(11, 2, "Request not yet fully sent " << request->method << ' ' << entry->url());
1053 return COMPLETE_NONPERSISTENT_MSG;
1054 }
1055
1056 /** \par
1057 * What does the reply have to say about keep-alive?
1058 */
1059 /**
1060 \bug XXX BUG?
1061 * If the origin server (HTTP/1.0) does not send a keep-alive
1062 * header, but keeps the connection open anyway, what happens?
1063 * We'll return here and http.c waits for an EOF before changing
1064 * store_status to STORE_OK. Combine this with ENTRY_FWD_HDR_WAIT
1065 * and an error status code, and we might have to wait until
1066 * the server times out the socket.
1067 */
1068 if (!rep->keep_alive)
1069 return COMPLETE_NONPERSISTENT_MSG;
1070
1071 return COMPLETE_PERSISTENT_MSG;
1072 }
1073
1074 HttpStateData::ConnectionStatus
1075 HttpStateData::persistentConnStatus() const
1076 {
1077 debugs(11, 3, HERE << serverConnection << " eof=" << eof);
1078 if (eof) // already reached EOF
1079 return COMPLETE_NONPERSISTENT_MSG;
1080
1081 /* If server fd is closing (but we have not been notified yet), stop Comm
1082 I/O to avoid assertions. TODO: Change Comm API to handle callers that
1083 want more I/O after async closing (usually initiated by others). */
1084 // XXX: add canReceive or s/canSend/canTalkToServer/
1085 if (!Comm::IsConnOpen(serverConnection))
1086 return COMPLETE_NONPERSISTENT_MSG;
1087
1088 /** \par
1089 * In chunked response we do not know the content length but we are absolutely
1090 * sure about the end of response, so we are calling the statusIfComplete to
1091 * decide if we can be persistant
1092 */
1093 if (lastChunk && flags.chunked)
1094 return statusIfComplete();
1095
1096 const HttpReply *vrep = virginReply();
1097 debugs(11, 5, "persistentConnStatus: content_length=" << vrep->content_length);
1098
1099 const int64_t clen = vrep->bodySize(request->method);
1100
1101 debugs(11, 5, "persistentConnStatus: clen=" << clen);
1102
1103 /* If the body size is unknown we must wait for EOF */
1104 if (clen < 0)
1105 return INCOMPLETE_MSG;
1106
1107 /** \par
1108 * If the body size is known, we must wait until we've gotten all of it. */
1109 if (clen > 0) {
1110 debugs(11,5, "payloadSeen=" << payloadSeen << " content_length=" << vrep->content_length);
1111
1112 if (payloadSeen < vrep->content_length)
1113 return INCOMPLETE_MSG;
1114
1115 if (payloadTruncated > 0) // already read more than needed
1116 return COMPLETE_NONPERSISTENT_MSG; // disable pconns
1117 }
1118
1119 /** \par
1120 * If there is no message body or we got it all, we can be persistent */
1121 return statusIfComplete();
1122 }
1123
1124 static void
1125 readDelayed(void *context, CommRead const &)
1126 {
1127 HttpStateData *state = static_cast<HttpStateData*>(context);
1128 state->flags.do_next_read = true;
1129 state->maybeReadVirginBody();
1130 }
1131
1132 void
1133 HttpStateData::readReply(const CommIoCbParams &io)
1134 {
1135 Must(!flags.do_next_read); // XXX: should have been set false by mayReadVirginBody()
1136 flags.do_next_read = false;
1137
1138 debugs(11, 5, io.conn);
1139
1140 // Bail out early on Comm::ERR_CLOSING - close handlers will tidy up for us
1141 if (io.flag == Comm::ERR_CLOSING) {
1142 debugs(11, 3, "http socket closing");
1143 return;
1144 }
1145
1146 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1147 abortTransaction("store entry aborted while reading reply");
1148 return;
1149 }
1150
1151 Must(Comm::IsConnOpen(serverConnection));
1152 Must(io.conn->fd == serverConnection->fd);
1153
1154 /*
1155 * Don't reset the timeout value here. The value should be
1156 * counting Config.Timeout.request and applies to the request
1157 * as a whole, not individual read() calls.
1158 * Plus, it breaks our lame *HalfClosed() detection
1159 */
1160
1161 Must(maybeMakeSpaceAvailable(true));
1162 CommIoCbParams rd(this); // will be expanded with ReadNow results
1163 rd.conn = io.conn;
1164 rd.size = entry->bytesWanted(Range<size_t>(0, inBuf.spaceSize()));
1165
1166 if (rd.size <= 0) {
1167 assert(entry->mem_obj);
1168 AsyncCall::Pointer nilCall;
1169 entry->mem_obj->delayRead(DeferredRead(readDelayed, this, CommRead(io.conn, NULL, 0, nilCall)));
1170 return;
1171 }
1172
1173 switch (Comm::ReadNow(rd, inBuf)) {
1174 case Comm::INPROGRESS:
1175 if (inBuf.isEmpty())
1176 debugs(33, 2, io.conn << ": no data to process, " << xstrerr(rd.xerrno));
1177 flags.do_next_read = true;
1178 maybeReadVirginBody();
1179 return;
1180
1181 case Comm::OK:
1182 {
1183 payloadSeen += rd.size;
1184 #if USE_DELAY_POOLS
1185 DelayId delayId = entry->mem_obj->mostBytesAllowed();
1186 delayId.bytesIn(rd.size);
1187 #endif
1188
1189 statCounter.server.all.kbytes_in += rd.size;
1190 statCounter.server.http.kbytes_in += rd.size;
1191 ++ IOStats.Http.reads;
1192
1193 int bin = 0;
1194 for (int clen = rd.size - 1; clen; ++bin)
1195 clen >>= 1;
1196
1197 ++ IOStats.Http.read_hist[bin];
1198
1199 request->hier.notePeerRead();
1200 }
1201
1202 /* Continue to process previously read data */
1203 break;
1204
1205 case Comm::ENDFILE: // close detected by 0-byte read
1206 eof = 1;
1207 flags.do_next_read = false;
1208
1209 /* Continue to process previously read data */
1210 break;
1211
1212 // case Comm::COMM_ERROR:
1213 default: // no other flags should ever occur
1214 debugs(11, 2, io.conn << ": read failure: " << xstrerr(rd.xerrno));
1215 ErrorState *err = new ErrorState(ERR_READ_ERROR, Http::scBadGateway, fwd->request);
1216 err->xerrno = rd.xerrno;
1217 fwd->fail(err);
1218 flags.do_next_read = false;
1219 closeServer();
1220 mustStop("HttpStateData::readReply");
1221 return;
1222 }
1223
1224 /* Process next response from buffer */
1225 processReply();
1226 }
1227
1228 /// processes the already read and buffered response data, possibly after
1229 /// waiting for asynchronous 1xx control message processing
1230 void
1231 HttpStateData::processReply()
1232 {
1233
1234 if (flags.handling1xx) { // we came back after handling a 1xx response
1235 debugs(11, 5, HERE << "done with 1xx handling");
1236 flags.handling1xx = false;
1237 Must(!flags.headers_parsed);
1238 }
1239
1240 if (!flags.headers_parsed) { // have not parsed headers yet?
1241 PROF_start(HttpStateData_processReplyHeader);
1242 processReplyHeader();
1243 PROF_stop(HttpStateData_processReplyHeader);
1244
1245 if (!continueAfterParsingHeader()) // parsing error or need more data
1246 return; // TODO: send errors to ICAP
1247
1248 adaptOrFinalizeReply(); // may write to, abort, or "close" the entry
1249 }
1250
1251 // kick more reads if needed and/or process the response body, if any
1252 PROF_start(HttpStateData_processReplyBody);
1253 processReplyBody(); // may call serverComplete()
1254 PROF_stop(HttpStateData_processReplyBody);
1255 }
1256
1257 /**
1258 \retval true if we can continue with processing the body or doing ICAP.
1259 */
1260 bool
1261 HttpStateData::continueAfterParsingHeader()
1262 {
1263 if (flags.handling1xx) {
1264 debugs(11, 5, HERE << "wait for 1xx handling");
1265 Must(!flags.headers_parsed);
1266 return false;
1267 }
1268
1269 if (!flags.headers_parsed && !eof) {
1270 debugs(11, 9, "needs more at " << inBuf.length());
1271 flags.do_next_read = true;
1272 /** \retval false If we have not finished parsing the headers and may get more data.
1273 * Schedules more reads to retrieve the missing data.
1274 */
1275 maybeReadVirginBody(); // schedules all kinds of reads; TODO: rename
1276 return false;
1277 }
1278
1279 /** If we are done with parsing, check for errors */
1280
1281 err_type error = ERR_NONE;
1282
1283 if (flags.headers_parsed) { // parsed headers, possibly with errors
1284 // check for header parsing errors
1285 if (HttpReply *vrep = virginReply()) {
1286 const Http::StatusCode s = vrep->sline.status();
1287 const AnyP::ProtocolVersion &v = vrep->sline.version;
1288 if (s == Http::scInvalidHeader && v != Http::ProtocolVersion(0,9)) {
1289 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Bad header encountered from " << entry->url() << " AKA " << request->url);
1290 error = ERR_INVALID_RESP;
1291 } else if (s == Http::scHeaderTooLarge) {
1292 fwd->dontRetry(true);
1293 error = ERR_TOO_BIG;
1294 } else if (vrep->header.conflictingContentLength()) {
1295 fwd->dontRetry(true);
1296 error = ERR_INVALID_RESP;
1297 } else {
1298 return true; // done parsing, got reply, and no error
1299 }
1300 } else {
1301 // parsed headers but got no reply
1302 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: No reply at all for " << entry->url() << " AKA " << request->url);
1303 error = ERR_INVALID_RESP;
1304 }
1305 } else {
1306 assert(eof);
1307 if (inBuf.length()) {
1308 error = ERR_INVALID_RESP;
1309 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Headers did not parse at all for " << entry->url() << " AKA " << request->url);
1310 } else {
1311 error = ERR_ZERO_SIZE_OBJECT;
1312 debugs(11, (request->flags.accelerated?DBG_IMPORTANT:2), "WARNING: HTTP: Invalid Response: No object data received for " << entry->url() << " AKA " << request->url);
1313 }
1314 }
1315
1316 assert(error != ERR_NONE);
1317 entry->reset();
1318 fwd->fail(new ErrorState(error, Http::scBadGateway, fwd->request));
1319 flags.do_next_read = false;
1320 closeServer();
1321 mustStop("HttpStateData::continueAfterParsingHeader");
1322 return false; // quit on error
1323 }
1324
1325 /** truncate what we read if we read too much so that writeReplyBody()
1326 writes no more than what we should have read */
1327 void
1328 HttpStateData::truncateVirginBody()
1329 {
1330 assert(flags.headers_parsed);
1331
1332 HttpReply *vrep = virginReply();
1333 int64_t clen = -1;
1334 if (!vrep->expectingBody(request->method, clen) || clen < 0)
1335 return; // no body or a body of unknown size, including chunked
1336
1337 if (payloadSeen - payloadTruncated <= clen)
1338 return; // we did not read too much or already took care of the extras
1339
1340 if (const int64_t extras = payloadSeen - payloadTruncated - clen) {
1341 // server sent more that the advertised content length
1342 debugs(11, 5, "payloadSeen=" << payloadSeen <<
1343 " clen=" << clen << '/' << vrep->content_length <<
1344 " trucated=" << payloadTruncated << '+' << extras);
1345
1346 inBuf.chop(0, inBuf.length() - extras);
1347 payloadTruncated += extras;
1348 }
1349 }
1350
1351 /**
1352 * Call this when there is data from the origin server
1353 * which should be sent to either StoreEntry, or to ICAP...
1354 */
1355 void
1356 HttpStateData::writeReplyBody()
1357 {
1358 truncateVirginBody(); // if needed
1359 const char *data = inBuf.rawContent();
1360 int len = inBuf.length();
1361 addVirginReplyBody(data, len);
1362 inBuf.consume(len);
1363 }
1364
1365 bool
1366 HttpStateData::decodeAndWriteReplyBody()
1367 {
1368 const char *data = NULL;
1369 int len;
1370 bool wasThereAnException = false;
1371 assert(flags.chunked);
1372 assert(httpChunkDecoder);
1373 SQUID_ENTER_THROWING_CODE();
1374 MemBuf decodedData;
1375 decodedData.init();
1376 httpChunkDecoder->setPayloadBuffer(&decodedData);
1377 const bool doneParsing = httpChunkDecoder->parse(inBuf);
1378 inBuf = httpChunkDecoder->remaining(); // sync buffers after parse
1379 len = decodedData.contentSize();
1380 data=decodedData.content();
1381 addVirginReplyBody(data, len);
1382 if (doneParsing) {
1383 lastChunk = 1;
1384 flags.do_next_read = false;
1385 }
1386 SQUID_EXIT_THROWING_CODE(wasThereAnException);
1387 return wasThereAnException;
1388 }
1389
1390 /**
1391 * processReplyBody has two purposes:
1392 * 1 - take the reply body data, if any, and put it into either
1393 * the StoreEntry, or give it over to ICAP.
1394 * 2 - see if we made it to the end of the response (persistent
1395 * connections and such)
1396 */
1397 void
1398 HttpStateData::processReplyBody()
1399 {
1400 if (!flags.headers_parsed) {
1401 flags.do_next_read = true;
1402 maybeReadVirginBody();
1403 return;
1404 }
1405
1406 #if USE_ADAPTATION
1407 debugs(11,5, HERE << "adaptationAccessCheckPending=" << adaptationAccessCheckPending);
1408 if (adaptationAccessCheckPending)
1409 return;
1410
1411 #endif
1412
1413 /*
1414 * At this point the reply headers have been parsed and consumed.
1415 * That means header content has been removed from readBuf and
1416 * it contains only body data.
1417 */
1418 if (entry->isAccepting()) {
1419 if (flags.chunked) {
1420 if (!decodeAndWriteReplyBody()) {
1421 flags.do_next_read = false;
1422 serverComplete();
1423 return;
1424 }
1425 } else
1426 writeReplyBody();
1427 }
1428
1429 // storing/sending methods like earlier adaptOrFinalizeReply() or
1430 // above writeReplyBody() may release/abort the store entry.
1431 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1432 // TODO: In some cases (e.g., 304), we should keep persistent conn open.
1433 // Detect end-of-reply (and, hence, pool our idle pconn) earlier (ASAP).
1434 abortTransaction("store entry aborted while storing reply");
1435 return;
1436 } else
1437 switch (persistentConnStatus()) {
1438 case INCOMPLETE_MSG: {
1439 debugs(11, 5, "processReplyBody: INCOMPLETE_MSG from " << serverConnection);
1440 /* Wait for more data or EOF condition */
1441 AsyncCall::Pointer nil;
1442 if (flags.keepalive_broken) {
1443 commSetConnTimeout(serverConnection, 10, nil);
1444 } else {
1445 commSetConnTimeout(serverConnection, Config.Timeout.read, nil);
1446 }
1447
1448 flags.do_next_read = true;
1449 }
1450 break;
1451
1452 case COMPLETE_PERSISTENT_MSG: {
1453 debugs(11, 5, "processReplyBody: COMPLETE_PERSISTENT_MSG from " << serverConnection);
1454
1455 // TODO: Remove serverConnectionSaved but preserve exception safety.
1456
1457 commUnsetConnTimeout(serverConnection);
1458 flags.do_next_read = false;
1459
1460 comm_remove_close_handler(serverConnection->fd, closeHandler);
1461 closeHandler = NULL;
1462
1463 Ip::Address client_addr; // XXX: Remove as unused. Why was it added?
1464 if (request->flags.spoofClientIp)
1465 client_addr = request->client_addr;
1466
1467 auto serverConnectionSaved = serverConnection;
1468 fwd->unregister(serverConnection);
1469 serverConnection = nullptr;
1470
1471 bool ispinned = false; // TODO: Rename to isOrShouldBePinned
1472 if (request->flags.pinned) {
1473 ispinned = true;
1474 } else if (request->flags.connectionAuth && request->flags.authSent) {
1475 ispinned = true;
1476 }
1477
1478 if (ispinned) {
1479 if (request->clientConnectionManager.valid()) {
1480 CallJobHere1(11, 4, request->clientConnectionManager,
1481 ConnStateData,
1482 notePinnedConnectionBecameIdle,
1483 ConnStateData::PinnedIdleContext(serverConnectionSaved, request));
1484 } else {
1485 // must not pool/share ispinned connections, even orphaned ones
1486 serverConnectionSaved->close();
1487 }
1488 } else {
1489 fwd->pconnPush(serverConnectionSaved, request->url.host());
1490 }
1491
1492 serverComplete();
1493 return;
1494 }
1495
1496 case COMPLETE_NONPERSISTENT_MSG:
1497 debugs(11, 5, "processReplyBody: COMPLETE_NONPERSISTENT_MSG from " << serverConnection);
1498 serverComplete();
1499 return;
1500 }
1501
1502 maybeReadVirginBody();
1503 }
1504
1505 bool
1506 HttpStateData::mayReadVirginReplyBody() const
1507 {
1508 // TODO: Be more precise here. For example, if/when reading trailer, we may
1509 // not be doneWithServer() yet, but we should return false. Similarly, we
1510 // could still be writing the request body after receiving the whole reply.
1511 return !doneWithServer();
1512 }
1513
1514 void
1515 HttpStateData::maybeReadVirginBody()
1516 {
1517 // too late to read
1518 if (!Comm::IsConnOpen(serverConnection) || fd_table[serverConnection->fd].closing())
1519 return;
1520
1521 if (!maybeMakeSpaceAvailable(false))
1522 return;
1523
1524 // XXX: get rid of the do_next_read flag
1525 // check for the proper reasons preventing read(2)
1526 if (!flags.do_next_read)
1527 return;
1528
1529 flags.do_next_read = false;
1530
1531 // must not already be waiting for read(2) ...
1532 assert(!Comm::MonitorsRead(serverConnection->fd));
1533
1534 // wait for read(2) to be possible.
1535 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
1536 AsyncCall::Pointer call = JobCallback(11, 5, Dialer, this, HttpStateData::readReply);
1537 Comm::Read(serverConnection, call);
1538 }
1539
1540 bool
1541 HttpStateData::maybeMakeSpaceAvailable(bool doGrow)
1542 {
1543 // how much we are allowed to buffer
1544 const int limitBuffer = (flags.headers_parsed ? Config.readAheadGap : Config.maxReplyHeaderSize);
1545
1546 if (limitBuffer < 0 || inBuf.length() >= (SBuf::size_type)limitBuffer) {
1547 // when buffer is at or over limit already
1548 debugs(11, 7, "wont read up to " << limitBuffer << ". buffer has (" << inBuf.length() << "/" << inBuf.spaceSize() << ") from " << serverConnection);
1549 debugs(11, DBG_DATA, "buffer has {" << inBuf << "}");
1550 // Process next response from buffer
1551 processReply();
1552 return false;
1553 }
1554
1555 // how much we want to read
1556 const size_t read_size = calcBufferSpaceToReserve(inBuf.spaceSize(), (limitBuffer - inBuf.length()));
1557
1558 if (!read_size) {
1559 debugs(11, 7, "wont read up to " << read_size << " into buffer (" << inBuf.length() << "/" << inBuf.spaceSize() << ") from " << serverConnection);
1560 return false;
1561 }
1562
1563 // just report whether we could grow or not, dont actually do it
1564 if (doGrow)
1565 return (read_size >= 2);
1566
1567 // we may need to grow the buffer
1568 inBuf.reserveSpace(read_size);
1569 debugs(11, 8, (!flags.do_next_read ? "wont" : "may") <<
1570 " read up to " << read_size << " bytes info buf(" << inBuf.length() << "/" << inBuf.spaceSize() <<
1571 ") from " << serverConnection);
1572
1573 return (inBuf.spaceSize() >= 2); // only read if there is 1+ bytes of space available
1574 }
1575
1576 /// called after writing the very last request byte (body, last-chunk, etc)
1577 void
1578 HttpStateData::wroteLast(const CommIoCbParams &io)
1579 {
1580 debugs(11, 5, HERE << serverConnection << ": size " << io.size << ": errflag " << io.flag << ".");
1581 #if URL_CHECKSUM_DEBUG
1582
1583 entry->mem_obj->checkUrlChecksum();
1584 #endif
1585
1586 // XXX: Keep in sync with Client::sentRequestBody().
1587 // TODO: Extract common parts.
1588
1589 if (io.size > 0) {
1590 fd_bytes(io.fd, io.size, FD_WRITE);
1591 statCounter.server.all.kbytes_out += io.size;
1592 statCounter.server.http.kbytes_out += io.size;
1593 }
1594
1595 if (io.flag == Comm::ERR_CLOSING)
1596 return;
1597
1598 // both successful and failed writes affect response times
1599 request->hier.notePeerWrite();
1600
1601 if (io.flag) {
1602 ErrorState *err = new ErrorState(ERR_WRITE_ERROR, Http::scBadGateway, fwd->request);
1603 err->xerrno = io.xerrno;
1604 fwd->fail(err);
1605 closeServer();
1606 mustStop("HttpStateData::wroteLast");
1607 return;
1608 }
1609
1610 sendComplete();
1611 }
1612
1613 /// successfully wrote the entire request (including body, last-chunk, etc.)
1614 void
1615 HttpStateData::sendComplete()
1616 {
1617 /*
1618 * Set the read timeout here because it hasn't been set yet.
1619 * We only set the read timeout after the request has been
1620 * fully written to the peer. If we start the timeout
1621 * after connection establishment, then we are likely to hit
1622 * the timeout for POST/PUT requests that have very large
1623 * request bodies.
1624 */
1625 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
1626 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
1627 TimeoutDialer, this, HttpStateData::httpTimeout);
1628
1629 commSetConnTimeout(serverConnection, Config.Timeout.read, timeoutCall);
1630 flags.request_sent = true;
1631 }
1632
1633 void
1634 HttpStateData::closeServer()
1635 {
1636 debugs(11,5, HERE << "closing HTTP server " << serverConnection << " this " << this);
1637
1638 if (Comm::IsConnOpen(serverConnection)) {
1639 fwd->unregister(serverConnection);
1640 comm_remove_close_handler(serverConnection->fd, closeHandler);
1641 closeHandler = NULL;
1642 serverConnection->close();
1643 }
1644 }
1645
1646 bool
1647 HttpStateData::doneWithServer() const
1648 {
1649 return !Comm::IsConnOpen(serverConnection);
1650 }
1651
1652 /*
1653 * Fixup authentication request headers for special cases
1654 */
1655 static void
1656 httpFixupAuthentication(HttpRequest * request, const HttpHeader * hdr_in, HttpHeader * hdr_out, const Http::StateFlags &flags)
1657 {
1658 Http::HdrType header = flags.originpeer ? Http::HdrType::AUTHORIZATION : Http::HdrType::PROXY_AUTHORIZATION;
1659
1660 /* Nothing to do unless we are forwarding to a peer */
1661 if (!request->flags.proxying)
1662 return;
1663
1664 /* Needs to be explicitly enabled */
1665 if (!request->peer_login)
1666 return;
1667
1668 /* Maybe already dealt with? */
1669 if (hdr_out->has(header))
1670 return;
1671
1672 /* Nothing to do here for PASSTHRU */
1673 if (strcmp(request->peer_login, "PASSTHRU") == 0)
1674 return;
1675
1676 /* PROXYPASS is a special case, single-signon to servers with the proxy password (basic only) */
1677 if (flags.originpeer && strcmp(request->peer_login, "PROXYPASS") == 0 && hdr_in->has(Http::HdrType::PROXY_AUTHORIZATION)) {
1678 const char *auth = hdr_in->getStr(Http::HdrType::PROXY_AUTHORIZATION);
1679
1680 if (auth && strncasecmp(auth, "basic ", 6) == 0) {
1681 hdr_out->putStr(header, auth);
1682 return;
1683 }
1684 }
1685
1686 char loginbuf[base64_encode_len(MAX_LOGIN_SZ)];
1687 size_t blen;
1688 struct base64_encode_ctx ctx;
1689 base64_encode_init(&ctx);
1690
1691 /* Special mode to pass the username to the upstream cache */
1692 if (*request->peer_login == '*') {
1693 const char *username = "-";
1694
1695 if (request->extacl_user.size())
1696 username = request->extacl_user.termedBuf();
1697 #if USE_AUTH
1698 else if (request->auth_user_request != NULL)
1699 username = request->auth_user_request->username();
1700 #endif
1701
1702 blen = base64_encode_update(&ctx, loginbuf, strlen(username), reinterpret_cast<const uint8_t*>(username));
1703 blen += base64_encode_update(&ctx, loginbuf+blen, strlen(request->peer_login +1), reinterpret_cast<const uint8_t*>(request->peer_login +1));
1704 blen += base64_encode_final(&ctx, loginbuf+blen);
1705 httpHeaderPutStrf(hdr_out, header, "Basic %.*s", (int)blen, loginbuf);
1706 return;
1707 }
1708
1709 /* external_acl provided credentials */
1710 if (request->extacl_user.size() && request->extacl_passwd.size() &&
1711 (strcmp(request->peer_login, "PASS") == 0 ||
1712 strcmp(request->peer_login, "PROXYPASS") == 0)) {
1713
1714 blen = base64_encode_update(&ctx, loginbuf, request->extacl_user.size(), reinterpret_cast<const uint8_t*>(request->extacl_user.rawBuf()));
1715 blen += base64_encode_update(&ctx, loginbuf+blen, 1, reinterpret_cast<const uint8_t*>(":"));
1716 blen += base64_encode_update(&ctx, loginbuf+blen, request->extacl_passwd.size(), reinterpret_cast<const uint8_t*>(request->extacl_passwd.rawBuf()));
1717 blen += base64_encode_final(&ctx, loginbuf+blen);
1718 httpHeaderPutStrf(hdr_out, header, "Basic %.*s", (int)blen, loginbuf);
1719 return;
1720 }
1721 // if no external user credentials are available to fake authentication with PASS acts like PASSTHRU
1722 if (strcmp(request->peer_login, "PASS") == 0)
1723 return;
1724
1725 /* Kerberos login to peer */
1726 #if HAVE_AUTH_MODULE_NEGOTIATE && HAVE_KRB5 && HAVE_GSSAPI
1727 if (strncmp(request->peer_login, "NEGOTIATE",strlen("NEGOTIATE")) == 0) {
1728 char *Token=NULL;
1729 char *PrincipalName=NULL,*p;
1730 int negotiate_flags = 0;
1731
1732 if ((p=strchr(request->peer_login,':')) != NULL ) {
1733 PrincipalName=++p;
1734 }
1735 if (request->flags.auth_no_keytab) {
1736 negotiate_flags |= PEER_PROXY_NEGOTIATE_NOKEYTAB;
1737 }
1738 Token = peer_proxy_negotiate_auth(PrincipalName, request->peer_host, negotiate_flags);
1739 if (Token) {
1740 httpHeaderPutStrf(hdr_out, header, "Negotiate %s",Token);
1741 }
1742 return;
1743 }
1744 #endif /* HAVE_KRB5 && HAVE_GSSAPI */
1745
1746 blen = base64_encode_update(&ctx, loginbuf, strlen(request->peer_login), reinterpret_cast<const uint8_t*>(request->peer_login));
1747 blen += base64_encode_final(&ctx, loginbuf+blen);
1748 httpHeaderPutStrf(hdr_out, header, "Basic %.*s", (int)blen, loginbuf);
1749 return;
1750 }
1751
1752 /*
1753 * build request headers and append them to a given MemBuf
1754 * used by buildRequestPrefix()
1755 * note: initialised the HttpHeader, the caller is responsible for Clean()-ing
1756 */
1757 void
1758 HttpStateData::httpBuildRequestHeader(HttpRequest * request,
1759 StoreEntry * entry,
1760 const AccessLogEntryPointer &al,
1761 HttpHeader * hdr_out,
1762 const Http::StateFlags &flags)
1763 {
1764 /* building buffer for complex strings */
1765 #define BBUF_SZ (MAX_URL+32)
1766 LOCAL_ARRAY(char, bbuf, BBUF_SZ);
1767 LOCAL_ARRAY(char, ntoabuf, MAX_IPSTRLEN);
1768 const HttpHeader *hdr_in = &request->header;
1769 const HttpHeaderEntry *e = NULL;
1770 HttpHeaderPos pos = HttpHeaderInitPos;
1771 assert (hdr_out->owner == hoRequest);
1772
1773 /* use our IMS header if the cached entry has Last-Modified time */
1774 if (request->lastmod > -1)
1775 hdr_out->putTime(Http::HdrType::IF_MODIFIED_SINCE, request->lastmod);
1776
1777 // Add our own If-None-Match field if the cached entry has a strong ETag.
1778 // copyOneHeaderFromClientsideRequestToUpstreamRequest() adds client ones.
1779 if (request->etag.size() > 0) {
1780 hdr_out->addEntry(new HttpHeaderEntry(Http::HdrType::IF_NONE_MATCH, SBuf(),
1781 request->etag.termedBuf()));
1782 }
1783
1784 bool we_do_ranges = decideIfWeDoRanges (request);
1785
1786 String strConnection (hdr_in->getList(Http::HdrType::CONNECTION));
1787
1788 while ((e = hdr_in->getEntry(&pos)))
1789 copyOneHeaderFromClientsideRequestToUpstreamRequest(e, strConnection, request, hdr_out, we_do_ranges, flags);
1790
1791 /* Abstraction break: We should interpret multipart/byterange responses
1792 * into offset-length data, and this works around our inability to do so.
1793 */
1794 if (!we_do_ranges && request->multipartRangeRequest()) {
1795 /* don't cache the result */
1796 request->flags.cachable = false;
1797 /* pretend it's not a range request */
1798 request->ignoreRange("want to request the whole object");
1799 request->flags.isRanged = false;
1800 }
1801
1802 hdr_out->addVia(request->http_ver, hdr_in);
1803
1804 if (request->flags.accelerated) {
1805 /* Append Surrogate-Capabilities */
1806 String strSurrogate(hdr_in->getList(Http::HdrType::SURROGATE_CAPABILITY));
1807 #if USE_SQUID_ESI
1808 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0 ESI/1.0\"", Config.Accel.surrogate_id);
1809 #else
1810 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0\"", Config.Accel.surrogate_id);
1811 #endif
1812 strListAdd(&strSurrogate, bbuf, ',');
1813 hdr_out->putStr(Http::HdrType::SURROGATE_CAPABILITY, strSurrogate.termedBuf());
1814 }
1815
1816 /** \pre Handle X-Forwarded-For */
1817 if (strcmp(opt_forwarded_for, "delete") != 0) {
1818
1819 String strFwd = hdr_in->getList(Http::HdrType::X_FORWARDED_FOR);
1820
1821 // if we cannot double strFwd size, then it grew past 50% of the limit
1822 if (!strFwd.canGrowBy(strFwd.size())) {
1823 // There is probably a forwarding loop with Via detection disabled.
1824 // If we do nothing, String will assert on overflow soon.
1825 // TODO: Terminate all transactions with huge XFF?
1826 strFwd = "error";
1827
1828 static int warnedCount = 0;
1829 if (warnedCount++ < 100) {
1830 const SBuf url(entry ? SBuf(entry->url()) : request->effectiveRequestUri());
1831 debugs(11, DBG_IMPORTANT, "Warning: likely forwarding loop with " << url);
1832 }
1833 }
1834
1835 if (strcmp(opt_forwarded_for, "on") == 0) {
1836 /** If set to ON - append client IP or 'unknown'. */
1837 if ( request->client_addr.isNoAddr() )
1838 strListAdd(&strFwd, "unknown", ',');
1839 else
1840 strListAdd(&strFwd, request->client_addr.toStr(ntoabuf, MAX_IPSTRLEN), ',');
1841 } else if (strcmp(opt_forwarded_for, "off") == 0) {
1842 /** If set to OFF - append 'unknown'. */
1843 strListAdd(&strFwd, "unknown", ',');
1844 } else if (strcmp(opt_forwarded_for, "transparent") == 0) {
1845 /** If set to TRANSPARENT - pass through unchanged. */
1846 } else if (strcmp(opt_forwarded_for, "truncate") == 0) {
1847 /** If set to TRUNCATE - drop existing list and replace with client IP or 'unknown'. */
1848 if ( request->client_addr.isNoAddr() )
1849 strFwd = "unknown";
1850 else
1851 strFwd = request->client_addr.toStr(ntoabuf, MAX_IPSTRLEN);
1852 }
1853 if (strFwd.size() > 0)
1854 hdr_out->putStr(Http::HdrType::X_FORWARDED_FOR, strFwd.termedBuf());
1855 }
1856 /** If set to DELETE - do not copy through. */
1857
1858 /* append Host if not there already */
1859 if (!hdr_out->has(Http::HdrType::HOST)) {
1860 if (request->peer_domain) {
1861 hdr_out->putStr(Http::HdrType::HOST, request->peer_domain);
1862 } else {
1863 SBuf authority = request->url.authority();
1864 hdr_out->putStr(Http::HdrType::HOST, authority.c_str());
1865 }
1866 }
1867
1868 /* append Authorization if known in URL, not in header and going direct */
1869 if (!hdr_out->has(Http::HdrType::AUTHORIZATION)) {
1870 if (!request->flags.proxying && !request->url.userInfo().isEmpty()) {
1871 static char result[base64_encode_len(MAX_URL*2)]; // should be big enough for a single URI segment
1872 struct base64_encode_ctx ctx;
1873 base64_encode_init(&ctx);
1874 size_t blen = base64_encode_update(&ctx, result, request->url.userInfo().length(), reinterpret_cast<const uint8_t*>(request->url.userInfo().rawContent()));
1875 blen += base64_encode_final(&ctx, result+blen);
1876 result[blen] = '\0';
1877 if (blen)
1878 httpHeaderPutStrf(hdr_out, Http::HdrType::AUTHORIZATION, "Basic %.*s", (int)blen, result);
1879 }
1880 }
1881
1882 /* Fixup (Proxy-)Authorization special cases. Plain relaying dealt with above */
1883 httpFixupAuthentication(request, hdr_in, hdr_out, flags);
1884
1885 /* append Cache-Control, add max-age if not there already */
1886 {
1887 HttpHdrCc *cc = hdr_in->getCc();
1888
1889 if (!cc)
1890 cc = new HttpHdrCc();
1891
1892 #if 0 /* see bug 2330 */
1893 /* Set no-cache if determined needed but not found */
1894 if (request->flags.nocache)
1895 EBIT_SET(cc->mask, HttpHdrCcType::CC_NO_CACHE);
1896 #endif
1897
1898 /* Add max-age only without no-cache */
1899 if (!cc->hasMaxAge() && !cc->hasNoCache()) {
1900 // XXX: performance regression. c_str() reallocates
1901 SBuf tmp(request->effectiveRequestUri());
1902 cc->maxAge(getMaxAge(entry ? entry->url() : tmp.c_str()));
1903 }
1904
1905 /* Enforce sibling relations */
1906 if (flags.only_if_cached)
1907 cc->onlyIfCached(true);
1908
1909 hdr_out->putCc(cc);
1910
1911 delete cc;
1912 }
1913
1914 /* maybe append Connection: keep-alive */
1915 if (flags.keepalive) {
1916 hdr_out->putStr(Http::HdrType::CONNECTION, "keep-alive");
1917 }
1918
1919 /* append Front-End-Https */
1920 if (flags.front_end_https) {
1921 if (flags.front_end_https == 1 || request->url.getScheme() == AnyP::PROTO_HTTPS)
1922 hdr_out->putStr(Http::HdrType::FRONT_END_HTTPS, "On");
1923 }
1924
1925 if (flags.chunked_request) {
1926 // Do not just copy the original value so that if the client-side
1927 // starts decode other encodings, this code may remain valid.
1928 hdr_out->putStr(Http::HdrType::TRANSFER_ENCODING, "chunked");
1929 }
1930
1931 /* Now mangle the headers. */
1932 httpHdrMangleList(hdr_out, request, al, ROR_REQUEST);
1933
1934 strConnection.clean();
1935 }
1936
1937 /**
1938 * Decides whether a particular header may be cloned from the received Clients request
1939 * to our outgoing fetch request.
1940 */
1941 void
1942 copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, const HttpRequest * request, HttpHeader * hdr_out, const int we_do_ranges, const Http::StateFlags &flags)
1943 {
1944 debugs(11, 5, "httpBuildRequestHeader: " << e->name << ": " << e->value );
1945
1946 switch (e->id) {
1947
1948 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid should not pass on. */
1949
1950 case Http::HdrType::PROXY_AUTHORIZATION:
1951 /** \par Proxy-Authorization:
1952 * Only pass on proxy authentication to peers for which
1953 * authentication forwarding is explicitly enabled
1954 */
1955 if (!flags.originpeer && flags.proxying && request->peer_login &&
1956 (strcmp(request->peer_login, "PASS") == 0 ||
1957 strcmp(request->peer_login, "PROXYPASS") == 0 ||
1958 strcmp(request->peer_login, "PASSTHRU") == 0)) {
1959 hdr_out->addEntry(e->clone());
1960 }
1961 break;
1962
1963 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid does not pass on. */
1964
1965 case Http::HdrType::CONNECTION: /** \par Connection: */
1966 case Http::HdrType::TE: /** \par TE: */
1967 case Http::HdrType::KEEP_ALIVE: /** \par Keep-Alive: */
1968 case Http::HdrType::PROXY_AUTHENTICATE: /** \par Proxy-Authenticate: */
1969 case Http::HdrType::TRAILER: /** \par Trailer: */
1970 case Http::HdrType::UPGRADE: /** \par Upgrade: */
1971 case Http::HdrType::TRANSFER_ENCODING: /** \par Transfer-Encoding: */
1972 break;
1973
1974 /** \par OTHER headers I haven't bothered to track down yet. */
1975
1976 case Http::HdrType::AUTHORIZATION:
1977 /** \par WWW-Authorization:
1978 * Pass on WWW authentication */
1979
1980 if (!flags.originpeer) {
1981 hdr_out->addEntry(e->clone());
1982 } else {
1983 /** \note In accelerators, only forward authentication if enabled
1984 * (see also httpFixupAuthentication for special cases)
1985 */
1986 if (request->peer_login &&
1987 (strcmp(request->peer_login, "PASS") == 0 ||
1988 strcmp(request->peer_login, "PASSTHRU") == 0 ||
1989 strcmp(request->peer_login, "PROXYPASS") == 0)) {
1990 hdr_out->addEntry(e->clone());
1991 }
1992 }
1993
1994 break;
1995
1996 case Http::HdrType::HOST:
1997 /** \par Host:
1998 * Normally Squid rewrites the Host: header.
1999 * However, there is one case when we don't: If the URL
2000 * went through our redirector and the admin configured
2001 * 'redir_rewrites_host' to be off.
2002 */
2003 if (request->peer_domain)
2004 hdr_out->putStr(Http::HdrType::HOST, request->peer_domain);
2005 else if (request->flags.redirected && !Config.onoff.redir_rewrites_host)
2006 hdr_out->addEntry(e->clone());
2007 else {
2008 SBuf authority = request->url.authority();
2009 hdr_out->putStr(Http::HdrType::HOST, authority.c_str());
2010 }
2011
2012 break;
2013
2014 case Http::HdrType::IF_MODIFIED_SINCE:
2015 /** \par If-Modified-Since:
2016 * append unless we added our own,
2017 * but only if cache_miss_revalidate is enabled, or
2018 * the request is not cacheable, or
2019 * the request contains authentication credentials.
2020 * \note at most one client's If-Modified-Since header can pass through
2021 */
2022 // XXX: need to check and cleanup the auth case so cacheable auth requests get cached.
2023 if (hdr_out->has(Http::HdrType::IF_MODIFIED_SINCE))
2024 break;
2025 else if (Config.onoff.cache_miss_revalidate || !request->flags.cachable || request->flags.auth)
2026 hdr_out->addEntry(e->clone());
2027 break;
2028
2029 case Http::HdrType::IF_NONE_MATCH:
2030 /** \par If-None-Match:
2031 * append if the wildcard '*' special case value is present, or
2032 * cache_miss_revalidate is disabled, or
2033 * the request is not cacheable in this proxy, or
2034 * the request contains authentication credentials.
2035 * \note this header lists a set of responses for the server to elide sending. Squid added values are extending that set.
2036 */
2037 // XXX: need to check and cleanup the auth case so cacheable auth requests get cached.
2038 if (hdr_out->hasListMember(Http::HdrType::IF_MATCH, "*", ',') || Config.onoff.cache_miss_revalidate || !request->flags.cachable || request->flags.auth)
2039 hdr_out->addEntry(e->clone());
2040 break;
2041
2042 case Http::HdrType::MAX_FORWARDS:
2043 /** \par Max-Forwards:
2044 * pass only on TRACE or OPTIONS requests */
2045 if (request->method == Http::METHOD_TRACE || request->method == Http::METHOD_OPTIONS) {
2046 const int64_t hops = e->getInt64();
2047
2048 if (hops > 0)
2049 hdr_out->putInt64(Http::HdrType::MAX_FORWARDS, hops - 1);
2050 }
2051
2052 break;
2053
2054 case Http::HdrType::VIA:
2055 /** \par Via:
2056 * If Via is disabled then forward any received header as-is.
2057 * Otherwise leave for explicit updated addition later. */
2058
2059 if (!Config.onoff.via)
2060 hdr_out->addEntry(e->clone());
2061
2062 break;
2063
2064 case Http::HdrType::RANGE:
2065
2066 case Http::HdrType::IF_RANGE:
2067
2068 case Http::HdrType::REQUEST_RANGE:
2069 /** \par Range:, If-Range:, Request-Range:
2070 * Only pass if we accept ranges */
2071 if (!we_do_ranges)
2072 hdr_out->addEntry(e->clone());
2073
2074 break;
2075
2076 case Http::HdrType::PROXY_CONNECTION: // SHOULD ignore. But doing so breaks things.
2077 break;
2078
2079 case Http::HdrType::CONTENT_LENGTH:
2080 // pass through unless we chunk; also, keeping this away from default
2081 // prevents request smuggling via Connection: Content-Length tricks
2082 if (!flags.chunked_request)
2083 hdr_out->addEntry(e->clone());
2084 break;
2085
2086 case Http::HdrType::X_FORWARDED_FOR:
2087
2088 case Http::HdrType::CACHE_CONTROL:
2089 /** \par X-Forwarded-For:, Cache-Control:
2090 * handled specially by Squid, so leave off for now.
2091 * append these after the loop if needed */
2092 break;
2093
2094 case Http::HdrType::FRONT_END_HTTPS:
2095 /** \par Front-End-Https:
2096 * Pass thru only if peer is configured with front-end-https */
2097 if (!flags.front_end_https)
2098 hdr_out->addEntry(e->clone());
2099
2100 break;
2101
2102 default:
2103 /** \par default.
2104 * pass on all other header fields
2105 * which are NOT listed by the special Connection: header. */
2106 if (strConnection.size()>0 && strListIsMember(&strConnection, e->name, ',')) {
2107 debugs(11, 2, "'" << e->name << "' header cropped by Connection: definition");
2108 return;
2109 }
2110
2111 hdr_out->addEntry(e->clone());
2112 }
2113 }
2114
2115 bool
2116 HttpStateData::decideIfWeDoRanges (HttpRequest * request)
2117 {
2118 bool result = true;
2119 /* decide if we want to do Ranges ourselves
2120 * and fetch the whole object now)
2121 * We want to handle Ranges ourselves iff
2122 * - we can actually parse client Range specs
2123 * - the specs are expected to be simple enough (e.g. no out-of-order ranges)
2124 * - reply will be cachable
2125 * (If the reply will be uncachable we have to throw it away after
2126 * serving this request, so it is better to forward ranges to
2127 * the server and fetch only the requested content)
2128 */
2129
2130 int64_t roffLimit = request->getRangeOffsetLimit();
2131
2132 if (NULL == request->range || !request->flags.cachable
2133 || request->range->offsetLimitExceeded(roffLimit) || request->flags.connectionAuth)
2134 result = false;
2135
2136 debugs(11, 8, "decideIfWeDoRanges: range specs: " <<
2137 request->range << ", cachable: " <<
2138 request->flags.cachable << "; we_do_ranges: " << result);
2139
2140 return result;
2141 }
2142
2143 /* build request prefix and append it to a given MemBuf;
2144 * return the length of the prefix */
2145 mb_size_t
2146 HttpStateData::buildRequestPrefix(MemBuf * mb)
2147 {
2148 const int offset = mb->size;
2149 /* Uses a local httpver variable to print the HTTP label
2150 * since the HttpRequest may have an older version label.
2151 * XXX: This could create protocol bugs as the headers sent and
2152 * flow control should all be based on the HttpRequest version
2153 * not the one we are sending. Needs checking.
2154 */
2155 const AnyP::ProtocolVersion httpver = Http::ProtocolVersion();
2156 const SBuf url(_peer && !_peer->options.originserver ? request->effectiveRequestUri() : request->url.path());
2157 mb->appendf(SQUIDSBUFPH " " SQUIDSBUFPH " %s/%d.%d\r\n",
2158 SQUIDSBUFPRINT(request->method.image()),
2159 SQUIDSBUFPRINT(url),
2160 AnyP::ProtocolType_str[httpver.protocol],
2161 httpver.major,httpver.minor);
2162 /* build and pack headers */
2163 {
2164 HttpHeader hdr(hoRequest);
2165 httpBuildRequestHeader(request.getRaw(), entry, fwd->al, &hdr, flags);
2166
2167 if (request->flags.pinned && request->flags.connectionAuth)
2168 request->flags.authSent = true;
2169 else if (hdr.has(Http::HdrType::AUTHORIZATION))
2170 request->flags.authSent = true;
2171
2172 hdr.packInto(mb);
2173 hdr.clean();
2174 }
2175 /* append header terminator */
2176 mb->append(crlf, 2);
2177 return mb->size - offset;
2178 }
2179
2180 /* This will be called when connect completes. Write request. */
2181 bool
2182 HttpStateData::sendRequest()
2183 {
2184 MemBuf mb;
2185
2186 debugs(11, 5, HERE << serverConnection << ", request " << request << ", this " << this << ".");
2187
2188 if (!Comm::IsConnOpen(serverConnection)) {
2189 debugs(11,3, HERE << "cannot send request to closing " << serverConnection);
2190 assert(closeHandler != NULL);
2191 return false;
2192 }
2193
2194 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
2195 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
2196 TimeoutDialer, this, HttpStateData::httpTimeout);
2197 commSetConnTimeout(serverConnection, Config.Timeout.lifetime, timeoutCall);
2198 flags.do_next_read = true;
2199 maybeReadVirginBody();
2200
2201 if (request->body_pipe != NULL) {
2202 if (!startRequestBodyFlow()) // register to receive body data
2203 return false;
2204 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2205 requestSender = JobCallback(11,5,
2206 Dialer, this, HttpStateData::sentRequestBody);
2207
2208 Must(!flags.chunked_request);
2209 // use chunked encoding if we do not know the length
2210 if (request->content_length < 0)
2211 flags.chunked_request = true;
2212 } else {
2213 assert(!requestBodySource);
2214 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2215 requestSender = JobCallback(11,5,
2216 Dialer, this, HttpStateData::wroteLast);
2217 }
2218
2219 flags.originpeer = (_peer != NULL && _peer->options.originserver);
2220 flags.proxying = (_peer != NULL && !flags.originpeer);
2221
2222 /*
2223 * Is keep-alive okay for all request methods?
2224 */
2225 if (request->flags.mustKeepalive)
2226 flags.keepalive = true;
2227 else if (request->flags.pinned)
2228 flags.keepalive = request->persistent();
2229 else if (!Config.onoff.server_pconns)
2230 flags.keepalive = false;
2231 else if (_peer == NULL)
2232 flags.keepalive = true;
2233 else if (_peer->stats.n_keepalives_sent < 10)
2234 flags.keepalive = true;
2235 else if ((double) _peer->stats.n_keepalives_recv /
2236 (double) _peer->stats.n_keepalives_sent > 0.50)
2237 flags.keepalive = true;
2238
2239 if (_peer) {
2240 /*The old code here was
2241 if (neighborType(_peer, request->url) == PEER_SIBLING && ...
2242 which is equivalent to:
2243 if (neighborType(_peer, URL()) == PEER_SIBLING && ...
2244 or better:
2245 if (((_peer->type == PEER_MULTICAST && p->options.mcast_siblings) ||
2246 _peer->type == PEER_SIBLINGS ) && _peer->options.allow_miss)
2247 flags.only_if_cached = 1;
2248
2249 But I suppose it was a bug
2250 */
2251 if (neighborType(_peer, request->url) == PEER_SIBLING && !_peer->options.allow_miss)
2252 flags.only_if_cached = true;
2253
2254 flags.front_end_https = _peer->front_end_https;
2255 }
2256
2257 mb.init();
2258 request->peer_host=_peer?_peer->host:NULL;
2259 buildRequestPrefix(&mb);
2260
2261 debugs(11, 2, "HTTP Server " << serverConnection);
2262 debugs(11, 2, "HTTP Server REQUEST:\n---------\n" << mb.buf << "\n----------");
2263
2264 Comm::Write(serverConnection, &mb, requestSender);
2265 return true;
2266 }
2267
2268 bool
2269 HttpStateData::getMoreRequestBody(MemBuf &buf)
2270 {
2271 // parent's implementation can handle the no-encoding case
2272 if (!flags.chunked_request)
2273 return Client::getMoreRequestBody(buf);
2274
2275 MemBuf raw;
2276
2277 Must(requestBodySource != NULL);
2278 if (!requestBodySource->getMoreData(raw))
2279 return false; // no request body bytes to chunk yet
2280
2281 // optimization: pre-allocate buffer size that should be enough
2282 const mb_size_t rawDataSize = raw.contentSize();
2283 // we may need to send: hex-chunk-size CRLF raw-data CRLF last-chunk
2284 buf.init(16 + 2 + rawDataSize + 2 + 5, raw.max_capacity);
2285
2286 buf.appendf("%x\r\n", static_cast<unsigned int>(rawDataSize));
2287 buf.append(raw.content(), rawDataSize);
2288 buf.append("\r\n", 2);
2289
2290 Must(rawDataSize > 0); // we did not accidently created last-chunk above
2291
2292 // Do not send last-chunk unless we successfully received everything
2293 if (receivedWholeRequestBody) {
2294 Must(!flags.sentLastChunk);
2295 flags.sentLastChunk = true;
2296 buf.append("0\r\n\r\n", 5);
2297 }
2298
2299 return true;
2300 }
2301
2302 void
2303 httpStart(FwdState *fwd)
2304 {
2305 debugs(11, 3, fwd->request->method << ' ' << fwd->entry->url());
2306 AsyncJob::Start(new HttpStateData(fwd));
2307 }
2308
2309 void
2310 HttpStateData::start()
2311 {
2312 if (!sendRequest()) {
2313 debugs(11, 3, "httpStart: aborted");
2314 mustStop("HttpStateData::start failed");
2315 return;
2316 }
2317
2318 ++ statCounter.server.all.requests;
2319 ++ statCounter.server.http.requests;
2320
2321 /*
2322 * We used to set the read timeout here, but not any more.
2323 * Now its set in httpSendComplete() after the full request,
2324 * including request body, has been written to the server.
2325 */
2326 }
2327
2328 /// if broken posts are enabled for the request, try to fix and return true
2329 bool
2330 HttpStateData::finishingBrokenPost()
2331 {
2332 #if USE_HTTP_VIOLATIONS
2333 if (!Config.accessList.brokenPosts) {
2334 debugs(11, 5, HERE << "No brokenPosts list");
2335 return false;
2336 }
2337
2338 ACLFilledChecklist ch(Config.accessList.brokenPosts, originalRequest().getRaw());
2339 ch.al = fwd->al;
2340 ch.syncAle(originalRequest().getRaw(), nullptr);
2341 if (!ch.fastCheck().allowed()) {
2342 debugs(11, 5, HERE << "didn't match brokenPosts");
2343 return false;
2344 }
2345
2346 if (!Comm::IsConnOpen(serverConnection)) {
2347 debugs(11, 3, HERE << "ignoring broken POST for closed " << serverConnection);
2348 assert(closeHandler != NULL);
2349 return true; // prevent caller from proceeding as if nothing happened
2350 }
2351
2352 debugs(11, 3, "finishingBrokenPost: fixing broken POST");
2353 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2354 requestSender = JobCallback(11,5,
2355 Dialer, this, HttpStateData::wroteLast);
2356 Comm::Write(serverConnection, "\r\n", 2, requestSender, NULL);
2357 return true;
2358 #else
2359 return false;
2360 #endif /* USE_HTTP_VIOLATIONS */
2361 }
2362
2363 /// if needed, write last-chunk to end the request body and return true
2364 bool
2365 HttpStateData::finishingChunkedRequest()
2366 {
2367 if (flags.sentLastChunk) {
2368 debugs(11, 5, HERE << "already sent last-chunk");
2369 return false;
2370 }
2371
2372 Must(receivedWholeRequestBody); // or we should not be sending last-chunk
2373 flags.sentLastChunk = true;
2374
2375 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2376 requestSender = JobCallback(11,5, Dialer, this, HttpStateData::wroteLast);
2377 Comm::Write(serverConnection, "0\r\n\r\n", 5, requestSender, NULL);
2378 return true;
2379 }
2380
2381 void
2382 HttpStateData::doneSendingRequestBody()
2383 {
2384 Client::doneSendingRequestBody();
2385 debugs(11,5, HERE << serverConnection);
2386
2387 // do we need to write something after the last body byte?
2388 if (flags.chunked_request && finishingChunkedRequest())
2389 return;
2390 if (!flags.chunked_request && finishingBrokenPost())
2391 return;
2392
2393 sendComplete();
2394 }
2395
2396 // more origin request body data is available
2397 void
2398 HttpStateData::handleMoreRequestBodyAvailable()
2399 {
2400 if (eof || !Comm::IsConnOpen(serverConnection)) {
2401 // XXX: we should check this condition in other callbacks then!
2402 // TODO: Check whether this can actually happen: We should unsubscribe
2403 // as a body consumer when the above condition(s) are detected.
2404 debugs(11, DBG_IMPORTANT, HERE << "Transaction aborted while reading HTTP body");
2405 return;
2406 }
2407
2408 assert(requestBodySource != NULL);
2409
2410 if (requestBodySource->buf().hasContent()) {
2411 // XXX: why does not this trigger a debug message on every request?
2412
2413 if (flags.headers_parsed && !flags.abuse_detected) {
2414 flags.abuse_detected = true;
2415 debugs(11, DBG_IMPORTANT, "http handleMoreRequestBodyAvailable: Likely proxy abuse detected '" << request->client_addr << "' -> '" << entry->url() << "'" );
2416
2417 if (virginReply()->sline.status() == Http::scInvalidHeader) {
2418 closeServer();
2419 mustStop("HttpStateData::handleMoreRequestBodyAvailable");
2420 return;
2421 }
2422 }
2423 }
2424
2425 HttpStateData::handleMoreRequestBodyAvailable();
2426 }
2427
2428 // premature end of the request body
2429 void
2430 HttpStateData::handleRequestBodyProducerAborted()
2431 {
2432 Client::handleRequestBodyProducerAborted();
2433 if (entry->isEmpty()) {
2434 debugs(11, 3, "request body aborted: " << serverConnection);
2435 // We usually get here when ICAP REQMOD aborts during body processing.
2436 // We might also get here if client-side aborts, but then our response
2437 // should not matter because either client-side will provide its own or
2438 // there will be no response at all (e.g., if the the client has left).
2439 ErrorState *err = new ErrorState(ERR_ICAP_FAILURE, Http::scInternalServerError, fwd->request);
2440 err->detailError(ERR_DETAIL_SRV_REQMOD_REQ_BODY);
2441 fwd->fail(err);
2442 }
2443
2444 abortTransaction("request body producer aborted");
2445 }
2446
2447 // called when we wrote request headers(!) or a part of the body
2448 void
2449 HttpStateData::sentRequestBody(const CommIoCbParams &io)
2450 {
2451 if (io.size > 0)
2452 statCounter.server.http.kbytes_out += io.size;
2453
2454 Client::sentRequestBody(io);
2455 }
2456
2457 void
2458 HttpStateData::abortAll(const char *reason)
2459 {
2460 debugs(11,5, HERE << "aborting transaction for " << reason <<
2461 "; " << serverConnection << ", this " << this);
2462 mustStop(reason);
2463 }
2464
2465 HttpStateData::ReuseDecision::ReuseDecision(const StoreEntry *e, const Http::StatusCode code)
2466 : answer(HttpStateData::ReuseDecision::reuseNot), reason(nullptr), entry(e), statusCode(code) {}
2467
2468 HttpStateData::ReuseDecision::Answers
2469 HttpStateData::ReuseDecision::make(const HttpStateData::ReuseDecision::Answers ans, const char *why)
2470 {
2471 answer = ans;
2472 reason = why;
2473 return answer;
2474 }
2475
2476 std::ostream &operator <<(std::ostream &os, const HttpStateData::ReuseDecision &d)
2477 {
2478 static const char *ReuseMessages[] = {
2479 "do not cache and do not share", // reuseNot
2480 "cache positively and share", // cachePositively
2481 "cache negatively and share", // cacheNegatively
2482 "do not cache but share" // doNotCacheButShare
2483 };
2484
2485 assert(d.answer >= HttpStateData::ReuseDecision::reuseNot &&
2486 d.answer <= HttpStateData::ReuseDecision::doNotCacheButShare);
2487 return os << ReuseMessages[d.answer] << " because " << d.reason <<
2488 "; HTTP status " << d.statusCode << " " << *(d.entry);
2489 }
2490