]> git.ipfire.org Git - thirdparty/squid.git/blob - src/http.cc
Cleanup: base64 coder de-duplication and upgrade
[thirdparty/squid.git] / src / http.cc
1
2 /*
3 * $Id$
4 *
5 * DEBUG: section 11 Hypertext Transfer Protocol (HTTP)
6 * AUTHOR: Harvest Derived
7 *
8 * SQUID Web Proxy Cache http://www.squid-cache.org/
9 * ----------------------------------------------------------
10 *
11 * Squid is the result of efforts by numerous individuals from
12 * the Internet community; see the CONTRIBUTORS file for full
13 * details. Many organizations have provided support for Squid's
14 * development; see the SPONSORS file for full details. Squid is
15 * Copyrighted (C) 2001 by the Regents of the University of
16 * California; see the COPYRIGHT file for full details. Squid
17 * incorporates software developed and/or copyrighted by other
18 * sources; see the CREDITS file for full details.
19 *
20 * This program is free software; you can redistribute it and/or modify
21 * it under the terms of the GNU General Public License as published by
22 * the Free Software Foundation; either version 2 of the License, or
23 * (at your option) any later version.
24 *
25 * This program is distributed in the hope that it will be useful,
26 * but WITHOUT ANY WARRANTY; without even the implied warranty of
27 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
28 * GNU General Public License for more details.
29 *
30 * You should have received a copy of the GNU General Public License
31 * along with this program; if not, write to the Free Software
32 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
33 *
34 */
35
36 /*
37 * Anonymizing patch by lutz@as-node.jena.thur.de
38 * have a look into http-anon.c to get more informations.
39 */
40
41 #include "squid.h"
42
43 #include "acl/FilledChecklist.h"
44 #if USE_AUTH
45 #include "auth/UserRequest.h"
46 #endif
47 #include "base/AsyncJobCalls.h"
48 #include "base/TextException.h"
49 #include "base64.h"
50 #include "comm/Write.h"
51 #if USE_DELAY_POOLS
52 #include "DelayPools.h"
53 #endif
54 #include "err_detail_type.h"
55 #include "errorpage.h"
56 #include "http.h"
57 #include "HttpControlMsg.h"
58 #include "HttpHdrContRange.h"
59 #include "HttpHdrSc.h"
60 #include "HttpHdrScTarget.h"
61 #include "HttpReply.h"
62 #include "HttpRequest.h"
63 #include "MemBuf.h"
64 #include "MemObject.h"
65 #include "protos.h"
66 #include "rfc1738.h"
67 #include "SquidTime.h"
68 #include "Store.h"
69
70
/*
 * Exception-guard macro pair. SQUID_ENTER_THROWING_CODE() opens a try block;
 * SQUID_EXIT_THROWING_CODE(status) closes it, setting `status` to true when
 * the guarded code finished normally, or logging the std::exception message
 * at debug section 11, level 1 and setting `status` to false otherwise.
 * The two macros must always be used together, in that order.
 */
#define SQUID_ENTER_THROWING_CODE() try {
#define SQUID_EXIT_THROWING_CODE(status) \
    status = true; \
    } \
    catch (const std::exception &e) { \
        debugs (11, 1, "Exception error:" << e.what()); \
        status = false; \
    }

// NOTE(review): CBDATA_CLASS_INIT is defined elsewhere; presumably it
// registers HttpStateData with Squid's cbdata machinery -- confirm.
CBDATA_CLASS_INIT(HttpStateData);

/// the CR LF byte sequence
static const char *const crlf = "\r\n";

// Forward declarations of file-local helpers.
// httpMaybeRemovePublic() is defined further down in this file.
static void httpMaybeRemovePublic(StoreEntry *, http_status);
// NOTE(review): the definition of this helper is not in the visible part of
// the file; judging by its name it copies one client request header into the
// outgoing upstream request -- confirm against the definition.
static void copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, HttpRequest * request, const HttpRequest * orig_request,
        HttpHeader * hdr_out, const int we_do_ranges, const http_state_flags);
87
88 HttpStateData::HttpStateData(FwdState *theFwdState) : AsyncJob("HttpStateData"), ServerStateData(theFwdState),
89 lastChunk(0), header_bytes_read(0), reply_bytes_read(0),
90 body_bytes_truncated(0), httpChunkDecoder(NULL)
91 {
92 debugs(11,5,HERE << "HttpStateData " << this << " created");
93 ignoreCacheControl = false;
94 surrogateNoStore = false;
95 fd = fwd->server_fd;
96 readBuf = new MemBuf;
97 readBuf->init(16*1024, 256*1024);
98 orig_request = HTTPMSGLOCK(fwd->request);
99
100 // reset peer response time stats for %<pt
101 orig_request->hier.peer_http_request_sent.tv_sec = 0;
102 orig_request->hier.peer_http_request_sent.tv_usec = 0;
103
104 if (fwd->servers)
105 _peer = fwd->servers->_peer; /* might be NULL */
106
107 if (_peer) {
108 const char *url;
109
110 if (_peer->options.originserver)
111 url = orig_request->urlpath.termedBuf();
112 else
113 url = entry->url();
114
115 HttpRequest * proxy_req = new HttpRequest(orig_request->method,
116 orig_request->protocol, url);
117
118 proxy_req->SetHost(_peer->host);
119
120 proxy_req->port = _peer->http_port;
121
122 proxy_req->flags = orig_request->flags;
123
124 proxy_req->lastmod = orig_request->lastmod;
125
126 proxy_req->flags.proxying = 1;
127
128 HTTPMSGUNLOCK(request);
129
130 request = HTTPMSGLOCK(proxy_req);
131
132 /*
133 * This NEIGHBOR_PROXY_ONLY check probably shouldn't be here.
134 * We might end up getting the object from somewhere else if,
135 * for example, the request to this neighbor fails.
136 */
137 if (_peer->options.proxy_only)
138 entry->releaseRequest();
139
140 #if USE_DELAY_POOLS
141 entry->setNoDelay(_peer->options.no_delay);
142 #endif
143 }
144
145 /*
146 * register the handler to free HTTP state data when the FD closes
147 */
148 typedef CommCbMemFunT<HttpStateData, CommCloseCbParams> Dialer;
149 closeHandler = JobCallback(9, 5,
150 Dialer, this, HttpStateData::httpStateConnClosed);
151 comm_add_close_handler(fd, closeHandler);
152 }
153
154 HttpStateData::~HttpStateData()
155 {
156 /*
157 * don't forget that ~ServerStateData() gets called automatically
158 */
159
160 if (!readBuf->isNull())
161 readBuf->clean();
162
163 delete readBuf;
164
165 if (httpChunkDecoder)
166 delete httpChunkDecoder;
167
168 HTTPMSGUNLOCK(orig_request);
169
170 debugs(11,5, HERE << "HttpStateData " << this << " destroyed; FD " << fd);
171 }
172
173 int
174 HttpStateData::dataDescriptor() const
175 {
176 return fd;
177 }
178 /*
179 static void
180 httpStateFree(int fd, void *data)
181 {
182 HttpStateData *httpState = static_cast<HttpStateData *>(data);
183 debugs(11, 5, "httpStateFree: FD " << fd << ", httpState=" << data);
184 delete httpState;
185 }*/
186
187 void
188 HttpStateData::httpStateConnClosed(const CommCloseCbParams &params)
189 {
190 debugs(11, 5, "httpStateFree: FD " << params.fd << ", httpState=" << params.data);
191 deleteThis("HttpStateData::httpStateConnClosed");
192 }
193
194 int
195 httpCachable(const HttpRequestMethod& method)
196 {
197 /* GET and HEAD are cachable. Others are not. */
198
199 // TODO: replase to HttpRequestMethod::isCachable() ?
200 if (method != METHOD_GET && method != METHOD_HEAD)
201 return 0;
202
203 /* else cachable */
204 return 1;
205 }
206
207 void
208 HttpStateData::httpTimeout(const CommTimeoutCbParams &params)
209 {
210 debugs(11, 4, "httpTimeout: FD " << fd << ": '" << entry->url() << "'" );
211
212 if (entry->store_status == STORE_PENDING) {
213 fwd->fail(errorCon(ERR_READ_TIMEOUT, HTTP_GATEWAY_TIMEOUT, fwd->request));
214 }
215
216 comm_close(fd);
217 }
218
219 static void
220 httpMaybeRemovePublic(StoreEntry * e, http_status status)
221 {
222 int remove = 0;
223 int forbidden = 0;
224 StoreEntry *pe;
225
226 if (!EBIT_TEST(e->flags, KEY_PRIVATE))
227 return;
228
229 switch (status) {
230
231 case HTTP_OK:
232
233 case HTTP_NON_AUTHORITATIVE_INFORMATION:
234
235 case HTTP_MULTIPLE_CHOICES:
236
237 case HTTP_MOVED_PERMANENTLY:
238
239 case HTTP_MOVED_TEMPORARILY:
240
241 case HTTP_GONE:
242
243 case HTTP_NOT_FOUND:
244 remove = 1;
245
246 break;
247
248 case HTTP_FORBIDDEN:
249
250 case HTTP_METHOD_NOT_ALLOWED:
251 forbidden = 1;
252
253 break;
254
255 #if WORK_IN_PROGRESS
256
257 case HTTP_UNAUTHORIZED:
258 forbidden = 1;
259
260 break;
261
262 #endif
263
264 default:
265 #if QUESTIONABLE
266 /*
267 * Any 2xx response should eject previously cached entities...
268 */
269
270 if (status >= 200 && status < 300)
271 remove = 1;
272
273 #endif
274
275 break;
276 }
277
278 if (!remove && !forbidden)
279 return;
280
281 assert(e->mem_obj);
282
283 if (e->mem_obj->request)
284 pe = storeGetPublicByRequest(e->mem_obj->request);
285 else
286 pe = storeGetPublic(e->mem_obj->url, e->mem_obj->method);
287
288 if (pe != NULL) {
289 assert(e != pe);
290 #if USE_HTCP
291 neighborsHtcpClear(e, NULL, e->mem_obj->request, e->mem_obj->method, HTCP_CLR_INVALIDATION);
292 #endif
293 pe->release();
294 }
295
296 /** \par
297 * Also remove any cached HEAD response in case the object has
298 * changed.
299 */
300 if (e->mem_obj->request)
301 pe = storeGetPublicByRequestMethod(e->mem_obj->request, METHOD_HEAD);
302 else
303 pe = storeGetPublic(e->mem_obj->url, METHOD_HEAD);
304
305 if (pe != NULL) {
306 assert(e != pe);
307 #if USE_HTCP
308 neighborsHtcpClear(e, NULL, e->mem_obj->request, HttpRequestMethod(METHOD_HEAD), HTCP_CLR_INVALIDATION);
309 #endif
310 pe->release();
311 }
312 }
313
314 void
315 HttpStateData::processSurrogateControl(HttpReply *reply)
316 {
317 if (request->flags.accelerated && reply->surrogate_control) {
318 HttpHdrScTarget *sctusable = httpHdrScGetMergedTarget(reply->surrogate_control, Config.Accel.surrogate_id);
319
320 if (sctusable) {
321 if (EBIT_TEST(sctusable->mask, SC_NO_STORE) ||
322 (Config.onoff.surrogate_is_remote
323 && EBIT_TEST(sctusable->mask, SC_NO_STORE_REMOTE))) {
324 surrogateNoStore = true;
325 entry->makePrivate();
326 }
327
328 /* The HttpHeader logic cannot tell if the header it's parsing is a reply to an
329 * accelerated request or not...
330 * Still, this is an abstraction breach. - RC
331 */
332 if (sctusable->max_age != -1) {
333 if (sctusable->max_age < sctusable->max_stale)
334 reply->expires = reply->date + sctusable->max_age;
335 else
336 reply->expires = reply->date + sctusable->max_stale;
337
338 /* And update the timestamps */
339 entry->timestampsSet();
340 }
341
342 /* We ignore cache-control directives as per the Surrogate specification */
343 ignoreCacheControl = true;
344
345 httpHdrScTargetDestroy(sctusable);
346 }
347 }
348 }
349
350 int
351 HttpStateData::cacheableReply()
352 {
353 HttpReply const *rep = finalReply();
354 HttpHeader const *hdr = &rep->header;
355 const int cc_mask = (rep->cache_control) ? rep->cache_control->mask : 0;
356 const char *v;
357 #if USE_HTTP_VIOLATIONS
358
359 const refresh_t *R = NULL;
360
361 /* This strange looking define first looks up the refresh pattern
362 * and then checks if the specified flag is set. The main purpose
363 * of this is to simplify the refresh pattern lookup and USE_HTTP_VIOLATIONS
364 * condition
365 */
366 #define REFRESH_OVERRIDE(flag) \
367 ((R = (R ? R : refreshLimits(entry->mem_obj->url))) , \
368 (R && R->flags.flag))
369 #else
370 #define REFRESH_OVERRIDE(flag) 0
371 #endif
372
373 if (surrogateNoStore)
374 return 0;
375
376 // RFC 2616: do not cache replies to responses with no-store CC directive
377 if (request && request->cache_control &&
378 EBIT_TEST(request->cache_control->mask, CC_NO_STORE) &&
379 !REFRESH_OVERRIDE(ignore_no_store))
380 return 0;
381
382 if (!ignoreCacheControl) {
383 if (EBIT_TEST(cc_mask, CC_PRIVATE)) {
384 if (!REFRESH_OVERRIDE(ignore_private))
385 return 0;
386 }
387
388 if (EBIT_TEST(cc_mask, CC_NO_CACHE)) {
389 if (!REFRESH_OVERRIDE(ignore_no_cache))
390 return 0;
391 }
392
393 if (EBIT_TEST(cc_mask, CC_NO_STORE)) {
394 if (!REFRESH_OVERRIDE(ignore_no_store))
395 return 0;
396 }
397 }
398
399 if (request->flags.auth || request->flags.auth_sent) {
400 /*
401 * Responses to requests with authorization may be cached
402 * only if a Cache-Control: public reply header is present.
403 * RFC 2068, sec 14.9.4
404 */
405
406 if (!EBIT_TEST(cc_mask, CC_PUBLIC)) {
407 if (!REFRESH_OVERRIDE(ignore_auth))
408 return 0;
409 }
410 }
411
412 /* Pragma: no-cache in _replies_ is not documented in HTTP,
413 * but servers like "Active Imaging Webcast/2.0" sure do use it */
414 if (hdr->has(HDR_PRAGMA)) {
415 String s = hdr->getList(HDR_PRAGMA);
416 const int no_cache = strListIsMember(&s, "no-cache", ',');
417 s.clean();
418
419 if (no_cache) {
420 if (!REFRESH_OVERRIDE(ignore_no_cache))
421 return 0;
422 }
423 }
424
425 /*
426 * The "multipart/x-mixed-replace" content type is used for
427 * continuous push replies. These are generally dynamic and
428 * probably should not be cachable
429 */
430 if ((v = hdr->getStr(HDR_CONTENT_TYPE)))
431 if (!strncasecmp(v, "multipart/x-mixed-replace", 25))
432 return 0;
433
434 switch (rep->sline.status) {
435 /* Responses that are cacheable */
436
437 case HTTP_OK:
438
439 case HTTP_NON_AUTHORITATIVE_INFORMATION:
440
441 case HTTP_MULTIPLE_CHOICES:
442
443 case HTTP_MOVED_PERMANENTLY:
444
445 case HTTP_GONE:
446 /*
447 * Don't cache objects that need to be refreshed on next request,
448 * unless we know how to refresh it.
449 */
450
451 if (!refreshIsCachable(entry) && !REFRESH_OVERRIDE(store_stale)) {
452 debugs(22, 3, "refreshIsCachable() returned non-cacheable..");
453 return 0;
454 } else
455 return 1;
456
457 /* NOTREACHED */
458 break;
459
460 /* Responses that only are cacheable if the server says so */
461
462 case HTTP_MOVED_TEMPORARILY:
463 case HTTP_TEMPORARY_REDIRECT:
464 if (rep->expires > rep->date && rep->date > 0)
465 return 1;
466 else
467 return 0;
468
469 /* NOTREACHED */
470 break;
471
472 /* Errors can be negatively cached */
473
474 case HTTP_NO_CONTENT:
475
476 case HTTP_USE_PROXY:
477
478 case HTTP_BAD_REQUEST:
479
480 case HTTP_FORBIDDEN:
481
482 case HTTP_NOT_FOUND:
483
484 case HTTP_METHOD_NOT_ALLOWED:
485
486 case HTTP_REQUEST_URI_TOO_LARGE:
487
488 case HTTP_INTERNAL_SERVER_ERROR:
489
490 case HTTP_NOT_IMPLEMENTED:
491
492 case HTTP_BAD_GATEWAY:
493
494 case HTTP_SERVICE_UNAVAILABLE:
495
496 case HTTP_GATEWAY_TIMEOUT:
497 return -1;
498
499 /* NOTREACHED */
500 break;
501
502 /* Some responses can never be cached */
503
504 case HTTP_PARTIAL_CONTENT: /* Not yet supported */
505
506 case HTTP_SEE_OTHER:
507
508 case HTTP_NOT_MODIFIED:
509
510 case HTTP_UNAUTHORIZED:
511
512 case HTTP_PROXY_AUTHENTICATION_REQUIRED:
513
514 case HTTP_INVALID_HEADER: /* Squid header parsing error */
515
516 case HTTP_HEADER_TOO_LARGE:
517
518 case HTTP_PAYMENT_REQUIRED:
519 case HTTP_NOT_ACCEPTABLE:
520 case HTTP_REQUEST_TIMEOUT:
521 case HTTP_CONFLICT:
522 case HTTP_LENGTH_REQUIRED:
523 case HTTP_PRECONDITION_FAILED:
524 case HTTP_REQUEST_ENTITY_TOO_LARGE:
525 case HTTP_UNSUPPORTED_MEDIA_TYPE:
526 case HTTP_UNPROCESSABLE_ENTITY:
527 case HTTP_LOCKED:
528 case HTTP_FAILED_DEPENDENCY:
529 case HTTP_INSUFFICIENT_STORAGE:
530 case HTTP_REQUESTED_RANGE_NOT_SATISFIABLE:
531 case HTTP_EXPECTATION_FAILED:
532
533 return 0;
534
535 default:
536 /* RFC 2616 section 6.1.1: an unrecognized response MUST NOT be cached. */
537 debugs (11, 3, HERE << "Unknown HTTP status code " << rep->sline.status << ". Not cacheable.");
538
539 return 0;
540
541 /* NOTREACHED */
542 break;
543 }
544
545 /* NOTREACHED */
546 }
547
548 /*
549 * For Vary, store the relevant request headers as
550 * virtual headers in the reply
551 * Returns false if the variance cannot be stored
552 */
553 const char *
554 httpMakeVaryMark(HttpRequest * request, HttpReply const * reply)
555 {
556 String vary, hdr;
557 const char *pos = NULL;
558 const char *item;
559 const char *value;
560 int ilen;
561 static String vstr;
562
563 vstr.clean();
564 vary = reply->header.getList(HDR_VARY);
565
566 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
567 char *name = (char *)xmalloc(ilen + 1);
568 xstrncpy(name, item, ilen + 1);
569 Tolower(name);
570
571 if (strcmp(name, "*") == 0) {
572 /* Can not handle "Vary: *" withtout ETag support */
573 safe_free(name);
574 vstr.clean();
575 break;
576 }
577
578 strListAdd(&vstr, name, ',');
579 hdr = request->header.getByName(name);
580 safe_free(name);
581 value = hdr.termedBuf();
582
583 if (value) {
584 value = rfc1738_escape_part(value);
585 vstr.append("=\"", 2);
586 vstr.append(value);
587 vstr.append("\"", 1);
588 }
589
590 hdr.clean();
591 }
592
593 vary.clean();
594 #if X_ACCELERATOR_VARY
595
596 pos = NULL;
597 vary = reply->header.getList(HDR_X_ACCELERATOR_VARY);
598
599 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
600 char *name = (char *)xmalloc(ilen + 1);
601 xstrncpy(name, item, ilen + 1);
602 Tolower(name);
603 strListAdd(&vstr, name, ',');
604 hdr = request->header.getByName(name);
605 safe_free(name);
606 value = hdr.termedBuf();
607
608 if (value) {
609 value = rfc1738_escape_part(value);
610 vstr.append("=\"", 2);
611 vstr.append(value);
612 vstr.append("\"", 1);
613 }
614
615 hdr.clean();
616 }
617
618 vary.clean();
619 #endif
620
621 debugs(11, 3, "httpMakeVaryMark: " << vstr);
622 return vstr.termedBuf();
623 }
624
625 void
626 HttpStateData::keepaliveAccounting(HttpReply *reply)
627 {
628 if (flags.keepalive)
629 if (_peer)
630 _peer->stats.n_keepalives_sent++;
631
632 if (reply->keep_alive) {
633 if (_peer)
634 _peer->stats.n_keepalives_recv++;
635
636 if (Config.onoff.detect_broken_server_pconns
637 && reply->bodySize(request->method) == -1 && !flags.chunked) {
638 debugs(11, 1, "keepaliveAccounting: Impossible keep-alive header from '" << entry->url() << "'" );
639 // debugs(11, 2, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------" );
640 flags.keepalive_broken = 1;
641 }
642 }
643 }
644
645 void
646 HttpStateData::checkDateSkew(HttpReply *reply)
647 {
648 if (reply->date > -1 && !_peer) {
649 int skew = abs((int)(reply->date - squid_curtime));
650
651 if (skew > 86400)
652 debugs(11, 3, "" << request->GetHost() << "'s clock is skewed by " << skew << " seconds!");
653 }
654 }
655
656 /**
657 * This creates the error page itself.. its likely
658 * that the forward ported reply header max size patch
659 * generates non http conformant error pages - in which
660 * case the errors where should be 'BAD_GATEWAY' etc
661 */
662 void
663 HttpStateData::processReplyHeader()
664 {
665 /** Creates a blank header. If this routine is made incremental, this will not do */
666
667 /* NP: all exit points to this function MUST call ctx_exit(ctx) */
668 Ctx ctx = ctx_enter(entry->mem_obj->url);
669
670 debugs(11, 3, "processReplyHeader: key '" << entry->getMD5Text() << "'");
671
672 assert(!flags.headers_parsed);
673
674 if (!readBuf->hasContent()) {
675 ctx_exit(ctx);
676 return;
677 }
678
679 http_status error = HTTP_STATUS_NONE;
680
681 HttpReply *newrep = new HttpReply;
682 const bool parsed = newrep->parse(readBuf, eof, &error);
683
684 if (!parsed && readBuf->contentSize() > 5 && strncmp(readBuf->content(), "HTTP/", 5) != 0 && strncmp(readBuf->content(), "ICY", 3) != 0) {
685 MemBuf *mb;
686 HttpReply *tmprep = new HttpReply;
687 tmprep->setHeaders(HTTP_OK, "Gatewaying", NULL, -1, -1, -1);
688 tmprep->header.putExt("X-Transformed-From", "HTTP/0.9");
689 mb = tmprep->pack();
690 newrep->parse(mb, eof, &error);
691 delete mb;
692 delete tmprep;
693 } else {
694 if (!parsed && error > 0) { // unrecoverable parsing error
695 debugs(11, 3, "processReplyHeader: Non-HTTP-compliant header: '" << readBuf->content() << "'");
696 flags.headers_parsed = 1;
697 newrep->sline.version = HttpVersion(1,1);
698 newrep->sline.status = error;
699 HttpReply *vrep = setVirginReply(newrep);
700 entry->replaceHttpReply(vrep);
701 ctx_exit(ctx);
702 return;
703 }
704
705 if (!parsed) { // need more data
706 assert(!error);
707 assert(!eof);
708 delete newrep;
709 ctx_exit(ctx);
710 return;
711 }
712
713 debugs(11, 9, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------");
714
715 header_bytes_read = headersEnd(readBuf->content(), readBuf->contentSize());
716 readBuf->consume(header_bytes_read);
717 }
718
719 newrep->removeStaleWarnings();
720
721 if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->sline.status >= 100 && newrep->sline.status < 200) {
722 handle1xx(newrep);
723 ctx_exit(ctx);
724 return;
725 }
726
727 flags.chunked = 0;
728 if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->header.chunked()) {
729 flags.chunked = 1;
730 httpChunkDecoder = new ChunkedCodingParser;
731 }
732
733 if (!peerSupportsConnectionPinning())
734 orig_request->flags.connection_auth_disabled = 1;
735
736 HttpReply *vrep = setVirginReply(newrep);
737 flags.headers_parsed = 1;
738
739 keepaliveAccounting(vrep);
740
741 checkDateSkew(vrep);
742
743 processSurrogateControl (vrep);
744
745 /** \todo IF the reply is a 1.0 reply, AND it has a Connection: Header
746 * Parse the header and remove all referenced headers
747 */
748
749 orig_request->hier.peer_reply_status = newrep->sline.status;
750
751 ctx_exit(ctx);
752 }
753
754 /// ignore or start forwarding the 1xx response (a.k.a., control message)
755 void
756 HttpStateData::handle1xx(HttpReply *reply)
757 {
758 HttpMsgPointerT<HttpReply> msg(reply); // will destroy reply if unused
759
760 // one 1xx at a time: we must not be called while waiting for previous 1xx
761 Must(!flags.handling1xx);
762 flags.handling1xx = true;
763
764 if (!orig_request->canHandle1xx()) {
765 debugs(11, 2, HERE << "ignoring client-unsupported 1xx");
766 proceedAfter1xx();
767 return;
768 }
769
770 #if USE_HTTP_VIOLATIONS
771 // check whether the 1xx response forwarding is allowed by squid.conf
772 if (Config.accessList.reply) {
773 ACLFilledChecklist ch(Config.accessList.reply, originalRequest(), NULL);
774 ch.reply = HTTPMSGLOCK(reply);
775 if (!ch.fastCheck()) { // TODO: support slow lookups?
776 debugs(11, 3, HERE << "ignoring denied 1xx");
777 proceedAfter1xx();
778 return;
779 }
780 }
781 #endif // USE_HTTP_VIOLATIONS
782
783 debugs(11, 2, HERE << "forwarding 1xx to client");
784
785 // the Sink will use this to call us back after writing 1xx to the client
786 typedef NullaryMemFunT<HttpStateData> CbDialer;
787 const AsyncCall::Pointer cb = JobCallback(11, 3, CbDialer, this,
788 HttpStateData::proceedAfter1xx);
789 CallJobHere1(11, 4, orig_request->clientConnection, ConnStateData,
790 ConnStateData::sendControlMsg, HttpControlMsg(msg, cb));
791 // If the call is not fired, then the Sink is gone, and HttpStateData
792 // will terminate due to an aborted store entry or another similar error.
793 // If we get stuck, it is not handle1xx fault if we could get stuck
794 // for similar reasons without a 1xx response.
795 }
796
797 /// restores state and resumes processing after 1xx is ignored or forwarded
798 void
799 HttpStateData::proceedAfter1xx()
800 {
801 Must(flags.handling1xx);
802
803 debugs(11, 2, HERE << "consuming " << header_bytes_read <<
804 " header and " << reply_bytes_read << " body bytes read after 1xx");
805 header_bytes_read = 0;
806 reply_bytes_read = 0;
807
808 CallJobHere(11, 3, this, HttpStateData, HttpStateData::processReply);
809 }
810
811
812 /**
813 * returns true if the peer can support connection pinning
814 */
815 bool HttpStateData::peerSupportsConnectionPinning() const
816 {
817 const HttpReply *rep = entry->mem_obj->getReply();
818 const HttpHeader *hdr = &rep->header;
819 bool rc;
820 String header;
821
822 if (!_peer)
823 return true;
824
825 /*If this peer does not support connection pinning (authenticated
826 connections) return false
827 */
828 if (!_peer->connection_auth)
829 return false;
830
831 /*The peer supports connection pinning and the http reply status
832 is not unauthorized, so the related connection can be pinned
833 */
834 if (rep->sline.status != HTTP_UNAUTHORIZED)
835 return true;
836
837 /*The server respond with HTTP_UNAUTHORIZED and the peer configured
838 with "connection-auth=on" we know that the peer supports pinned
839 connections
840 */
841 if (_peer->connection_auth == 1)
842 return true;
843
844 /*At this point peer has configured with "connection-auth=auto"
845 parameter so we need some extra checks to decide if we are going
846 to allow pinned connections or not
847 */
848
849 /*if the peer configured with originserver just allow connection
850 pinning (squid 2.6 behaviour)
851 */
852 if (_peer->options.originserver)
853 return true;
854
855 /*if the connections it is already pinned it is OK*/
856 if (request->flags.pinned)
857 return true;
858
859 /*Allow pinned connections only if the Proxy-support header exists in
860 reply and has in its list the "Session-Based-Authentication"
861 which means that the peer supports connection pinning.
862 */
863 if (!hdr->has(HDR_PROXY_SUPPORT))
864 return false;
865
866 header = hdr->getStrOrList(HDR_PROXY_SUPPORT);
867 /* XXX This ought to be done in a case-insensitive manner */
868 rc = (strstr(header.termedBuf(), "Session-Based-Authentication") != NULL);
869
870 return rc;
871 }
872
873 // Called when we parsed (and possibly adapted) the headers but
874 // had not starting storing (a.k.a., sending) the body yet.
875 void
876 HttpStateData::haveParsedReplyHeaders()
877 {
878 ServerStateData::haveParsedReplyHeaders();
879
880 Ctx ctx = ctx_enter(entry->mem_obj->url);
881 HttpReply *rep = finalReply();
882
883 if (rep->sline.status == HTTP_PARTIAL_CONTENT &&
884 rep->content_range)
885 currentOffset = rep->content_range->spec.offset;
886
887 entry->timestampsSet();
888
889 /* Check if object is cacheable or not based on reply code */
890 debugs(11, 3, "haveParsedReplyHeaders: HTTP CODE: " << rep->sline.status);
891
892 if (neighbors_do_private_keys)
893 httpMaybeRemovePublic(entry, rep->sline.status);
894
895 if (rep->header.has(HDR_VARY)
896 #if X_ACCELERATOR_VARY
897 || rep->header.has(HDR_X_ACCELERATOR_VARY)
898 #endif
899 ) {
900 const char *vary = httpMakeVaryMark(orig_request, rep);
901
902 if (!vary) {
903 entry->makePrivate();
904 if (!fwd->reforwardableStatus(rep->sline.status))
905 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
906 goto no_cache;
907 }
908
909 entry->mem_obj->vary_headers = xstrdup(vary);
910 }
911
912 /*
913 * If its not a reply that we will re-forward, then
914 * allow the client to get it.
915 */
916 if (!fwd->reforwardableStatus(rep->sline.status))
917 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
918
919 switch (cacheableReply()) {
920
921 case 1:
922 entry->makePublic();
923 break;
924
925 case 0:
926 entry->makePrivate();
927 break;
928
929 case -1:
930
931 #if USE_HTTP_VIOLATIONS
932 if (Config.negativeTtl > 0)
933 entry->cacheNegatively();
934 else
935 #endif
936 entry->makePrivate();
937
938 break;
939
940 default:
941 assert(0);
942
943 break;
944 }
945
946 no_cache:
947
948 if (!ignoreCacheControl && rep->cache_control) {
949 if (EBIT_TEST(rep->cache_control->mask, CC_PROXY_REVALIDATE) ||
950 EBIT_TEST(rep->cache_control->mask, CC_MUST_REVALIDATE) ||
951 EBIT_TEST(rep->cache_control->mask, CC_S_MAXAGE))
952 EBIT_SET(entry->flags, ENTRY_REVALIDATE);
953 }
954
955 #if HEADERS_LOG
956 headersLog(1, 0, request->method, rep);
957
958 #endif
959
960 ctx_exit(ctx);
961 }
962
963 HttpStateData::ConnectionStatus
964 HttpStateData::statusIfComplete() const
965 {
966 const HttpReply *rep = virginReply();
967 /** \par
968 * If the reply wants to close the connection, it takes precedence */
969
970 if (httpHeaderHasConnDir(&rep->header, "close"))
971 return COMPLETE_NONPERSISTENT_MSG;
972
973 /** \par
974 * If we didn't send a keep-alive request header, then this
975 * can not be a persistent connection.
976 */
977 if (!flags.keepalive)
978 return COMPLETE_NONPERSISTENT_MSG;
979
980 /** \par
981 * If we haven't sent the whole request then this can not be a persistent
982 * connection.
983 */
984 if (!flags.request_sent) {
985 debugs(11, 2, "statusIfComplete: Request not yet fully sent \"" << RequestMethodStr(orig_request->method) << " " << entry->url() << "\"" );
986 return COMPLETE_NONPERSISTENT_MSG;
987 }
988
989 /** \par
990 * What does the reply have to say about keep-alive?
991 */
992 /**
993 \bug XXX BUG?
994 * If the origin server (HTTP/1.0) does not send a keep-alive
995 * header, but keeps the connection open anyway, what happens?
996 * We'll return here and http.c waits for an EOF before changing
997 * store_status to STORE_OK. Combine this with ENTRY_FWD_HDR_WAIT
998 * and an error status code, and we might have to wait until
999 * the server times out the socket.
1000 */
1001 if (!rep->keep_alive)
1002 return COMPLETE_NONPERSISTENT_MSG;
1003
1004 return COMPLETE_PERSISTENT_MSG;
1005 }
1006
1007 HttpStateData::ConnectionStatus
1008 HttpStateData::persistentConnStatus() const
1009 {
1010 debugs(11, 3, "persistentConnStatus: FD " << fd << " eof=" << eof);
1011 if (eof) // already reached EOF
1012 return COMPLETE_NONPERSISTENT_MSG;
1013
1014 /* If server fd is closing (but we have not been notified yet), stop Comm
1015 I/O to avoid assertions. TODO: Change Comm API to handle callers that
1016 want more I/O after async closing (usually initiated by others). */
1017 // XXX: add canReceive or s/canSend/canTalkToServer/
1018 if (!canSend(fd))
1019 return COMPLETE_NONPERSISTENT_MSG;
1020
1021 /** \par
1022 * In chunked response we do not know the content length but we are absolutely
1023 * sure about the end of response, so we are calling the statusIfComplete to
1024 * decide if we can be persistant
1025 */
1026 if (lastChunk && flags.chunked)
1027 return statusIfComplete();
1028
1029 const HttpReply *vrep = virginReply();
1030 debugs(11, 5, "persistentConnStatus: content_length=" << vrep->content_length);
1031
1032 const int64_t clen = vrep->bodySize(request->method);
1033
1034 debugs(11, 5, "persistentConnStatus: clen=" << clen);
1035
1036 /* If the body size is unknown we must wait for EOF */
1037 if (clen < 0)
1038 return INCOMPLETE_MSG;
1039
1040 /** \par
1041 * If the body size is known, we must wait until we've gotten all of it. */
1042 if (clen > 0) {
1043 // old technique:
1044 // if (entry->mem_obj->endOffset() < vrep->content_length + vrep->hdr_sz)
1045 const int64_t body_bytes_read = reply_bytes_read - header_bytes_read;
1046 debugs(11,5, "persistentConnStatus: body_bytes_read=" <<
1047 body_bytes_read << " content_length=" << vrep->content_length);
1048
1049 if (body_bytes_read < vrep->content_length)
1050 return INCOMPLETE_MSG;
1051
1052 if (body_bytes_truncated > 0) // already read more than needed
1053 return COMPLETE_NONPERSISTENT_MSG; // disable pconns
1054 }
1055
1056 /** \par
1057 * If there is no message body or we got it all, we can be persistent */
1058 return statusIfComplete();
1059 }
1060
1061 /*
1062 * This is the callback after some data has been read from the network
1063 */
1064 /*
1065 void
1066 HttpStateData::ReadReplyWrapper(int fd, char *buf, size_t len, comm_err_t flag, int xerrno, void *data)
1067 {
1068 HttpStateData *httpState = static_cast<HttpStateData *>(data);
1069 assert (fd == httpState->fd);
1070 // assert(buf == readBuf->content());
1071 PROF_start(HttpStateData_readReply);
1072 httpState->readReply(len, flag, xerrno);
1073 PROF_stop(HttpStateData_readReply);
1074 }
1075 */
1076
1077 /* XXX this function is too long! */
1078 void
1079 HttpStateData::readReply(const CommIoCbParams &io)
1080 {
1081 int bin;
1082 int clen;
1083 int len = io.size;
1084
1085 assert(fd == io.fd);
1086
1087 flags.do_next_read = 0;
1088
1089 debugs(11, 5, "httpReadReply: FD " << fd << ": len " << len << ".");
1090
1091 // Bail out early on COMM_ERR_CLOSING - close handlers will tidy up for us
1092 if (io.flag == COMM_ERR_CLOSING) {
1093 debugs(11, 3, "http socket closing");
1094 return;
1095 }
1096
1097 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1098 maybeReadVirginBody();
1099 return;
1100 }
1101
1102 // handle I/O errors
1103 if (io.flag != COMM_OK || len < 0) {
1104 debugs(11, 2, "httpReadReply: FD " << fd << ": read failure: " << xstrerror() << ".");
1105
1106 if (ignoreErrno(io.xerrno)) {
1107 flags.do_next_read = 1;
1108 } else {
1109 ErrorState *err;
1110 err = errorCon(ERR_READ_ERROR, HTTP_BAD_GATEWAY, fwd->request);
1111 err->xerrno = io.xerrno;
1112 fwd->fail(err);
1113 flags.do_next_read = 0;
1114 comm_close(fd);
1115 }
1116
1117 return;
1118 }
1119
1120 // update I/O stats
1121 if (len > 0) {
1122 readBuf->appended(len);
1123 reply_bytes_read += len;
1124 #if USE_DELAY_POOLS
1125 DelayId delayId = entry->mem_obj->mostBytesAllowed();
1126 delayId.bytesIn(len);
1127 #endif
1128
1129 kb_incr(&statCounter.server.all.kbytes_in, len);
1130 kb_incr(&statCounter.server.http.kbytes_in, len);
1131 IOStats.Http.reads++;
1132
1133 for (clen = len - 1, bin = 0; clen; bin++)
1134 clen >>= 1;
1135
1136 IOStats.Http.read_hist[bin]++;
1137
1138 // update peer response time stats (%<pt)
1139 const timeval &sent = orig_request->hier.peer_http_request_sent;
1140 orig_request->hier.peer_response_time =
1141 sent.tv_sec ? tvSubMsec(sent, current_time) : -1;
1142 }
1143
1144 /** \par
1145 * Here the RFC says we should ignore whitespace between replies, but we can't as
1146 * doing so breaks HTTP/0.9 replies beginning with witespace, and in addition
1147 * the response splitting countermeasures is extremely likely to trigger on this,
1148 * not allowing connection reuse in the first place.
1149 */
1150 #if DONT_DO_THIS
1151 if (!flags.headers_parsed && len > 0 && fd_table[fd].uses > 1) {
1152 /* Skip whitespace between replies */
1153
1154 while (len > 0 && xisspace(*buf))
1155 memmove(buf, buf + 1, len--);
1156
1157 if (len == 0) {
1158 /* Continue to read... */
1159 /* Timeout NOT increased. This whitespace was from previous reply */
1160 flags.do_next_read = 1;
1161 maybeReadVirginBody();
1162 return;
1163 }
1164 }
1165
1166 #endif
1167
1168 if (len == 0) { // reached EOF?
1169 eof = 1;
1170 flags.do_next_read = 0;
1171
1172 /* Bug 2879: Replies may terminate with \r\n then EOF instead of \r\n\r\n
1173 * Ensure here that we have at minimum two \r\n when EOF is seen.
1174 * TODO: Add eof parameter to headersEnd() and move this hack there.
1175 */
1176 if (readBuf->contentSize() && !flags.headers_parsed) {
1177 /*
1178 * Yes Henrik, there is a point to doing this. When we
1179 * called httpProcessReplyHeader() before, we didn't find
1180 * the end of headers, but now we are definately at EOF, so
1181 * we want to process the reply headers.
1182 */
1183 /* Fake an "end-of-headers" to work around such broken servers */
1184 readBuf->append("\r\n", 2);
1185 }
1186 }
1187
1188 processReply();
1189 }
1190
1191 /// processes the already read and buffered response data, possibly after
1192 /// waiting for asynchronous 1xx control message processing
1193 void
1194 HttpStateData::processReply()
1195 {
1196
1197 if (flags.handling1xx) { // we came back after handling a 1xx response
1198 debugs(11, 5, HERE << "done with 1xx handling");
1199 flags.handling1xx = false;
1200 Must(!flags.headers_parsed);
1201 }
1202
1203 if (!flags.headers_parsed) { // have not parsed headers yet?
1204 PROF_start(HttpStateData_processReplyHeader);
1205 processReplyHeader();
1206 PROF_stop(HttpStateData_processReplyHeader);
1207
1208 if (!continueAfterParsingHeader()) // parsing error or need more data
1209 return; // TODO: send errors to ICAP
1210
1211 adaptOrFinalizeReply();
1212 }
1213
1214 // kick more reads if needed and/or process the response body, if any
1215 PROF_start(HttpStateData_processReplyBody);
1216 processReplyBody(); // may call serverComplete()
1217 PROF_stop(HttpStateData_processReplyBody);
1218 }
1219
1220 /**
1221 \retval true if we can continue with processing the body or doing ICAP.
1222 */
1223 bool
1224 HttpStateData::continueAfterParsingHeader()
1225 {
1226 if (flags.handling1xx) {
1227 debugs(11, 5, HERE << "wait for 1xx handling");
1228 Must(!flags.headers_parsed);
1229 return false;
1230 }
1231
1232 if (!flags.headers_parsed && !eof) {
1233 debugs(11, 9, HERE << "needs more at " << readBuf->contentSize());
1234 flags.do_next_read = 1;
1235 /** \retval false If we have not finished parsing the headers and may get more data.
1236 * Schedules more reads to retrieve the missing data.
1237 */
1238 maybeReadVirginBody(); // schedules all kinds of reads; TODO: rename
1239 return false;
1240 }
1241
1242 /** If we are done with parsing, check for errors */
1243
1244 err_type error = ERR_NONE;
1245
1246 if (flags.headers_parsed) { // parsed headers, possibly with errors
1247 // check for header parsing errors
1248 if (HttpReply *vrep = virginReply()) {
1249 const http_status s = vrep->sline.status;
1250 const HttpVersion &v = vrep->sline.version;
1251 if (s == HTTP_INVALID_HEADER && v != HttpVersion(0,9)) {
1252 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Bad header encountered from " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1253 error = ERR_INVALID_RESP;
1254 } else if (s == HTTP_HEADER_TOO_LARGE) {
1255 fwd->dontRetry(true);
1256 error = ERR_TOO_BIG;
1257 } else {
1258 return true; // done parsing, got reply, and no error
1259 }
1260 } else {
1261 // parsed headers but got no reply
1262 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: No reply at all for " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1263 error = ERR_INVALID_RESP;
1264 }
1265 } else {
1266 assert(eof);
1267 if (readBuf->hasContent()) {
1268 error = ERR_INVALID_RESP;
1269 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Headers did not parse at all for " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1270 } else {
1271 error = ERR_ZERO_SIZE_OBJECT;
1272 debugs(11, (orig_request->flags.accelerated?DBG_IMPORTANT:2), "WARNING: HTTP: Invalid Response: No object data received for " <<
1273 entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1274 }
1275 }
1276
1277 assert(error != ERR_NONE);
1278 entry->reset();
1279 fwd->fail(errorCon(error, HTTP_BAD_GATEWAY, fwd->request));
1280 flags.do_next_read = 0;
1281 comm_close(fd);
1282 return false; // quit on error
1283 }
1284
1285 /** truncate what we read if we read too much so that writeReplyBody()
1286 writes no more than what we should have read */
1287 void
1288 HttpStateData::truncateVirginBody()
1289 {
1290 assert(flags.headers_parsed);
1291
1292 HttpReply *vrep = virginReply();
1293 int64_t clen = -1;
1294 if (!vrep->expectingBody(request->method, clen) || clen < 0)
1295 return; // no body or a body of unknown size, including chunked
1296
1297 const int64_t body_bytes_read = reply_bytes_read - header_bytes_read;
1298 if (body_bytes_read - body_bytes_truncated <= clen)
1299 return; // we did not read too much or already took care of the extras
1300
1301 if (const int64_t extras = body_bytes_read - body_bytes_truncated - clen) {
1302 // server sent more that the advertised content length
1303 debugs(11,5, HERE << "body_bytes_read=" << body_bytes_read <<
1304 " clen=" << clen << '/' << vrep->content_length <<
1305 " body_bytes_truncated=" << body_bytes_truncated << '+' << extras);
1306
1307 readBuf->truncate(extras);
1308 body_bytes_truncated += extras;
1309 }
1310 }
1311
1312 /**
1313 * Call this when there is data from the origin server
1314 * which should be sent to either StoreEntry, or to ICAP...
1315 */
1316 void
1317 HttpStateData::writeReplyBody()
1318 {
1319 truncateVirginBody(); // if needed
1320 const char *data = readBuf->content();
1321 int len = readBuf->contentSize();
1322 addVirginReplyBody(data, len);
1323 readBuf->consume(len);
1324 }
1325
1326 bool
1327 HttpStateData::decodeAndWriteReplyBody()
1328 {
1329 const char *data = NULL;
1330 int len;
1331 bool wasThereAnException = false;
1332 assert(flags.chunked);
1333 assert(httpChunkDecoder);
1334 SQUID_ENTER_THROWING_CODE();
1335 MemBuf decodedData;
1336 decodedData.init();
1337 const bool doneParsing = httpChunkDecoder->parse(readBuf,&decodedData);
1338 len = decodedData.contentSize();
1339 data=decodedData.content();
1340 addVirginReplyBody(data, len);
1341 if (doneParsing) {
1342 lastChunk = 1;
1343 flags.do_next_read = 0;
1344 }
1345 SQUID_EXIT_THROWING_CODE(wasThereAnException);
1346 return wasThereAnException;
1347 }
1348
1349 /**
1350 * processReplyBody has two purposes:
1351 * 1 - take the reply body data, if any, and put it into either
1352 * the StoreEntry, or give it over to ICAP.
1353 * 2 - see if we made it to the end of the response (persistent
1354 * connections and such)
1355 */
1356 void
1357 HttpStateData::processReplyBody()
1358 {
1359 AsyncCall::Pointer call;
1360 Ip::Address client_addr;
1361 bool ispinned = false;
1362
1363 if (!flags.headers_parsed) {
1364 flags.do_next_read = 1;
1365 maybeReadVirginBody();
1366 return;
1367 }
1368
1369 #if USE_ADAPTATION
1370 debugs(11,5, HERE << "adaptationAccessCheckPending=" << adaptationAccessCheckPending);
1371 if (adaptationAccessCheckPending)
1372 return;
1373
1374 #endif
1375
1376 /*
1377 * At this point the reply headers have been parsed and consumed.
1378 * That means header content has been removed from readBuf and
1379 * it contains only body data.
1380 */
1381 if (flags.chunked) {
1382 if (!decodeAndWriteReplyBody()) {
1383 flags.do_next_read = 0;
1384 serverComplete();
1385 return;
1386 }
1387 } else
1388 writeReplyBody();
1389
1390 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1391 /*
1392 * The above writeReplyBody() call could ABORT this entry,
1393 * in that case, the server FD should already be closed.
1394 * there's nothing for us to do.
1395 */
1396 (void) 0;
1397 } else
1398 switch (persistentConnStatus()) {
1399 case INCOMPLETE_MSG:
1400 debugs(11, 5, "processReplyBody: INCOMPLETE_MSG");
1401 /* Wait for more data or EOF condition */
1402 if (flags.keepalive_broken) {
1403 call = NULL;
1404 commSetTimeout(fd, 10, call);
1405 } else {
1406 call = NULL;
1407 commSetTimeout(fd, Config.Timeout.read, call);
1408 }
1409
1410 flags.do_next_read = 1;
1411 break;
1412
1413 case COMPLETE_PERSISTENT_MSG:
1414 debugs(11, 5, "processReplyBody: COMPLETE_PERSISTENT_MSG");
1415 /* yes we have to clear all these! */
1416 call = NULL;
1417 commSetTimeout(fd, -1, call);
1418 flags.do_next_read = 0;
1419
1420 comm_remove_close_handler(fd, closeHandler);
1421 closeHandler = NULL;
1422 fwd->unregister(fd);
1423
1424 if (orig_request->flags.spoof_client_ip)
1425 client_addr = orig_request->client_addr;
1426
1427
1428 if (request->flags.pinned) {
1429 ispinned = true;
1430 } else if (request->flags.connection_auth && request->flags.auth_sent) {
1431 ispinned = true;
1432 }
1433
1434 if (orig_request->pinnedConnection() && ispinned) {
1435 orig_request->pinnedConnection()->pinConnection(fd, orig_request, _peer,
1436 (request->flags.connection_auth != 0));
1437 } else {
1438 fwd->pconnPush(fd, _peer, request, orig_request->GetHost(), client_addr);
1439 }
1440
1441 fd = -1;
1442
1443 serverComplete();
1444 return;
1445
1446 case COMPLETE_NONPERSISTENT_MSG:
1447 debugs(11, 5, "processReplyBody: COMPLETE_NONPERSISTENT_MSG");
1448 serverComplete();
1449 return;
1450 }
1451
1452 maybeReadVirginBody();
1453 }
1454
1455 void
1456 HttpStateData::maybeReadVirginBody()
1457 {
1458 // we may need to grow the buffer if headers do not fit
1459 const int minRead = flags.headers_parsed ? 0 :1024;
1460 const int read_size = replyBodySpace(*readBuf, minRead);
1461
1462 debugs(11,9, HERE << (flags.do_next_read ? "may" : "wont") <<
1463 " read up to " << read_size << " bytes from FD " << fd);
1464
1465 /*
1466 * why <2? Because delayAwareRead() won't actually read if
1467 * you ask it to read 1 byte. The delayed read request
1468 * just gets re-queued until the client side drains, then
1469 * the I/O thread hangs. Better to not register any read
1470 * handler until we get a notification from someone that
1471 * its okay to read again.
1472 */
1473 if (read_size < 2)
1474 return;
1475
1476 if (flags.do_next_read) {
1477 flags.do_next_read = 0;
1478 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
1479 entry->delayAwareRead(fd, readBuf->space(read_size), read_size,
1480 JobCallback(11, 5, Dialer, this, HttpStateData::readReply));
1481 }
1482 }
1483
1484 /// called after writing the very last request byte (body, last-chunk, etc)
1485 void
1486 HttpStateData::wroteLast(const CommIoCbParams &io)
1487 {
1488 debugs(11, 5, HERE << "FD " << fd << ": size " << io.size << ": errflag " << io.flag << ".");
1489 #if URL_CHECKSUM_DEBUG
1490
1491 entry->mem_obj->checkUrlChecksum();
1492 #endif
1493
1494 if (io.size > 0) {
1495 fd_bytes(fd, io.size, FD_WRITE);
1496 kb_incr(&statCounter.server.all.kbytes_out, io.size);
1497 kb_incr(&statCounter.server.http.kbytes_out, io.size);
1498 }
1499
1500 if (io.flag == COMM_ERR_CLOSING)
1501 return;
1502
1503 if (io.flag) {
1504 ErrorState *err;
1505 err = errorCon(ERR_WRITE_ERROR, HTTP_BAD_GATEWAY, fwd->request);
1506 err->xerrno = io.xerrno;
1507 fwd->fail(err);
1508 comm_close(fd);
1509 return;
1510 }
1511
1512 sendComplete();
1513 }
1514
1515 /// successfully wrote the entire request (including body, last-chunk, etc.)
1516 void
1517 HttpStateData::sendComplete()
1518 {
1519 /*
1520 * Set the read timeout here because it hasn't been set yet.
1521 * We only set the read timeout after the request has been
1522 * fully written to the server-side. If we start the timeout
1523 * after connection establishment, then we are likely to hit
1524 * the timeout for POST/PUT requests that have very large
1525 * request bodies.
1526 */
1527 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
1528 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
1529 TimeoutDialer, this, HttpStateData::httpTimeout);
1530
1531 commSetTimeout(fd, Config.Timeout.read, timeoutCall);
1532
1533 flags.request_sent = 1;
1534
1535 orig_request->hier.peer_http_request_sent = current_time;
1536 }
1537
1538 // Close the HTTP server connection. Used by serverComplete().
1539 void
1540 HttpStateData::closeServer()
1541 {
1542 debugs(11,5, HERE << "closing HTTP server FD " << fd << " this " << this);
1543
1544 if (fd >= 0) {
1545 fwd->unregister(fd);
1546 comm_remove_close_handler(fd, closeHandler);
1547 closeHandler = NULL;
1548 comm_close(fd);
1549 fd = -1;
1550 }
1551 }
1552
1553 bool
1554 HttpStateData::doneWithServer() const
1555 {
1556 return fd < 0;
1557 }
1558
1559
1560 /*
1561 * Fixup authentication request headers for special cases
1562 */
1563 static void
1564 httpFixupAuthentication(HttpRequest * request, HttpRequest * orig_request, const HttpHeader * hdr_in, HttpHeader * hdr_out, http_state_flags flags)
1565 {
1566 http_hdr_type header = flags.originpeer ? HDR_AUTHORIZATION : HDR_PROXY_AUTHORIZATION;
1567
1568 /* Nothing to do unless we are forwarding to a peer */
1569 if (!request->flags.proxying)
1570 return;
1571
1572 /* Needs to be explicitly enabled */
1573 if (!orig_request->peer_login)
1574 return;
1575
1576 /* Maybe already dealt with? */
1577 if (hdr_out->has(header))
1578 return;
1579
1580 /* Nothing to do here for PASSTHRU */
1581 if (strcmp(orig_request->peer_login, "PASSTHRU") == 0)
1582 return;
1583
1584 /* PROXYPASS is a special case, single-signon to servers with the proxy password (basic only) */
1585 if (flags.originpeer && strcmp(orig_request->peer_login, "PROXYPASS") == 0 && hdr_in->has(HDR_PROXY_AUTHORIZATION)) {
1586 const char *auth = hdr_in->getStr(HDR_PROXY_AUTHORIZATION);
1587
1588 if (auth && strncasecmp(auth, "basic ", 6) == 0) {
1589 hdr_out->putStr(header, auth);
1590 return;
1591 }
1592 }
1593
1594 /* Special mode to pass the username to the upstream cache */
1595 if (*orig_request->peer_login == '*') {
1596 char loginbuf[256];
1597 const char *username = "-";
1598
1599 if (orig_request->extacl_user.size())
1600 username = orig_request->extacl_user.termedBuf();
1601 #if USE_AUTH
1602 else if (orig_request->auth_user_request != NULL)
1603 username = orig_request->auth_user_request->username();
1604 #endif
1605
1606 snprintf(loginbuf, sizeof(loginbuf), "%s%s", username, orig_request->peer_login + 1);
1607
1608 httpHeaderPutStrf(hdr_out, header, "Basic %s",
1609 old_base64_encode(loginbuf));
1610 return;
1611 }
1612
1613 /* external_acl provided credentials */
1614 if (orig_request->extacl_user.size() && orig_request->extacl_passwd.size() &&
1615 (strcmp(orig_request->peer_login, "PASS") == 0 ||
1616 strcmp(orig_request->peer_login, "PROXYPASS") == 0)) {
1617 char loginbuf[256];
1618 snprintf(loginbuf, sizeof(loginbuf), SQUIDSTRINGPH ":" SQUIDSTRINGPH,
1619 SQUIDSTRINGPRINT(orig_request->extacl_user),
1620 SQUIDSTRINGPRINT(orig_request->extacl_passwd));
1621 httpHeaderPutStrf(hdr_out, header, "Basic %s",
1622 old_base64_encode(loginbuf));
1623 return;
1624 }
1625
1626 /* Kerberos login to peer */
1627 #if HAVE_AUTH_MODULE_NEGOTIATE && HAVE_KRB5 && HAVE_GSSAPI
1628 if (strncmp(orig_request->peer_login, "NEGOTIATE",strlen("NEGOTIATE")) == 0) {
1629 char *Token=NULL;
1630 char *PrincipalName=NULL,*p;
1631 if ((p=strchr(orig_request->peer_login,':')) != NULL ) {
1632 PrincipalName=++p;
1633 }
1634 Token = peer_proxy_negotiate_auth(PrincipalName,request->peer_host);
1635 if (Token) {
1636 httpHeaderPutStrf(hdr_out, HDR_PROXY_AUTHORIZATION, "Negotiate %s",Token);
1637 }
1638 return;
1639 }
1640 #endif /* HAVE_KRB5 && HAVE_GSSAPI */
1641
1642 httpHeaderPutStrf(hdr_out, header, "Basic %s",
1643 old_base64_encode(orig_request->peer_login));
1644 return;
1645 }
1646
1647 /*
1648 * build request headers and append them to a given MemBuf
1649 * used by buildRequestPrefix()
1650 * note: initialised the HttpHeader, the caller is responsible for Clean()-ing
1651 */
1652 void
1653 HttpStateData::httpBuildRequestHeader(HttpRequest * request,
1654 HttpRequest * orig_request,
1655 StoreEntry * entry,
1656 HttpHeader * hdr_out,
1657 const http_state_flags flags)
1658 {
1659 /* building buffer for complex strings */
1660 #define BBUF_SZ (MAX_URL+32)
1661 LOCAL_ARRAY(char, bbuf, BBUF_SZ);
1662 LOCAL_ARRAY(char, ntoabuf, MAX_IPSTRLEN);
1663 const HttpHeader *hdr_in = &orig_request->header;
1664 const HttpHeaderEntry *e = NULL;
1665 HttpHeaderPos pos = HttpHeaderInitPos;
1666 assert (hdr_out->owner == hoRequest);
1667
1668 /* append our IMS header */
1669 if (request->lastmod > -1)
1670 hdr_out->putTime(HDR_IF_MODIFIED_SINCE, request->lastmod);
1671
1672 bool we_do_ranges = decideIfWeDoRanges (orig_request);
1673
1674 String strConnection (hdr_in->getList(HDR_CONNECTION));
1675
1676 while ((e = hdr_in->getEntry(&pos)))
1677 copyOneHeaderFromClientsideRequestToUpstreamRequest(e, strConnection, request, orig_request, hdr_out, we_do_ranges, flags);
1678
1679 /* Abstraction break: We should interpret multipart/byterange responses
1680 * into offset-length data, and this works around our inability to do so.
1681 */
1682 if (!we_do_ranges && orig_request->multipartRangeRequest()) {
1683 /* don't cache the result */
1684 orig_request->flags.cachable = 0;
1685 /* pretend it's not a range request */
1686 delete orig_request->range;
1687 orig_request->range = NULL;
1688 orig_request->flags.range = 0;
1689 }
1690
1691 /* append Via */
1692 if (Config.onoff.via) {
1693 String strVia;
1694 strVia = hdr_in->getList(HDR_VIA);
1695 snprintf(bbuf, BBUF_SZ, "%d.%d %s",
1696 orig_request->http_ver.major,
1697 orig_request->http_ver.minor, ThisCache);
1698 strListAdd(&strVia, bbuf, ',');
1699 hdr_out->putStr(HDR_VIA, strVia.termedBuf());
1700 strVia.clean();
1701 }
1702
1703 if (orig_request->flags.accelerated) {
1704 /* Append Surrogate-Capabilities */
1705 String strSurrogate(hdr_in->getList(HDR_SURROGATE_CAPABILITY));
1706 #if USE_SQUID_ESI
1707 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0 ESI/1.0\"", Config.Accel.surrogate_id);
1708 #else
1709 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0\"", Config.Accel.surrogate_id);
1710 #endif
1711 strListAdd(&strSurrogate, bbuf, ',');
1712 hdr_out->putStr(HDR_SURROGATE_CAPABILITY, strSurrogate.termedBuf());
1713 }
1714
1715 /** \pre Handle X-Forwarded-For */
1716 if (strcmp(opt_forwarded_for, "delete") != 0) {
1717
1718 String strFwd = hdr_in->getList(HDR_X_FORWARDED_FOR);
1719
1720 if (strFwd.size() > 65536/2) {
1721 // There is probably a forwarding loop with Via detection disabled.
1722 // If we do nothing, String will assert on overflow soon.
1723 // TODO: Terminate all transactions with huge XFF?
1724 strFwd = "error";
1725
1726 static int warnedCount = 0;
1727 if (warnedCount++ < 100) {
1728 const char *url = entry ? entry->url() : urlCanonical(orig_request);
1729 debugs(11, 1, "Warning: likely forwarding loop with " << url);
1730 }
1731 }
1732
1733 if (strcmp(opt_forwarded_for, "on") == 0) {
1734 /** If set to ON - append client IP or 'unknown'. */
1735 if ( orig_request->client_addr.IsNoAddr() )
1736 strListAdd(&strFwd, "unknown", ',');
1737 else
1738 strListAdd(&strFwd, orig_request->client_addr.NtoA(ntoabuf, MAX_IPSTRLEN), ',');
1739 } else if (strcmp(opt_forwarded_for, "off") == 0) {
1740 /** If set to OFF - append 'unknown'. */
1741 strListAdd(&strFwd, "unknown", ',');
1742 } else if (strcmp(opt_forwarded_for, "transparent") == 0) {
1743 /** If set to TRANSPARENT - pass through unchanged. */
1744 } else if (strcmp(opt_forwarded_for, "truncate") == 0) {
1745 /** If set to TRUNCATE - drop existing list and replace with client IP or 'unknown'. */
1746 if ( orig_request->client_addr.IsNoAddr() )
1747 strFwd = "unknown";
1748 else
1749 strFwd = orig_request->client_addr.NtoA(ntoabuf, MAX_IPSTRLEN);
1750 }
1751 if (strFwd.size() > 0)
1752 hdr_out->putStr(HDR_X_FORWARDED_FOR, strFwd.termedBuf());
1753 }
1754 /** If set to DELETE - do not copy through. */
1755
1756 /* append Host if not there already */
1757 if (!hdr_out->has(HDR_HOST)) {
1758 if (orig_request->peer_domain) {
1759 hdr_out->putStr(HDR_HOST, orig_request->peer_domain);
1760 } else if (orig_request->port == urlDefaultPort(orig_request->protocol)) {
1761 /* use port# only if not default */
1762 hdr_out->putStr(HDR_HOST, orig_request->GetHost());
1763 } else {
1764 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
1765 orig_request->GetHost(),
1766 (int) orig_request->port);
1767 }
1768 }
1769
1770 /* append Authorization if known in URL, not in header and going direct */
1771 if (!hdr_out->has(HDR_AUTHORIZATION)) {
1772 if (!request->flags.proxying && *request->login) {
1773 httpHeaderPutStrf(hdr_out, HDR_AUTHORIZATION, "Basic %s",
1774 old_base64_encode(request->login));
1775 }
1776 }
1777
1778 /* Fixup (Proxy-)Authorization special cases. Plain relaying dealt with above */
1779 httpFixupAuthentication(request, orig_request, hdr_in, hdr_out, flags);
1780
1781 /* append Cache-Control, add max-age if not there already */
1782 {
1783 HttpHdrCc *cc = hdr_in->getCc();
1784
1785 if (!cc)
1786 cc = httpHdrCcCreate();
1787
1788 #if 0 /* see bug 2330 */
1789 /* Set no-cache if determined needed but not found */
1790 if (orig_request->flags.nocache)
1791 EBIT_SET(cc->mask, CC_NO_CACHE);
1792 #endif
1793
1794 /* Add max-age only without no-cache */
1795 if (!EBIT_TEST(cc->mask, CC_MAX_AGE) && !EBIT_TEST(cc->mask, CC_NO_CACHE)) {
1796 const char *url =
1797 entry ? entry->url() : urlCanonical(orig_request);
1798 httpHdrCcSetMaxAge(cc, getMaxAge(url));
1799
1800 if (request->urlpath.size())
1801 assert(strstr(url, request->urlpath.termedBuf()));
1802 }
1803
1804 /* Enforce sibling relations */
1805 if (flags.only_if_cached)
1806 EBIT_SET(cc->mask, CC_ONLY_IF_CACHED);
1807
1808 hdr_out->putCc(cc);
1809
1810 httpHdrCcDestroy(cc);
1811 }
1812
1813 /* maybe append Connection: keep-alive */
1814 if (flags.keepalive) {
1815 hdr_out->putStr(HDR_CONNECTION, "keep-alive");
1816 }
1817
1818 /* append Front-End-Https */
1819 if (flags.front_end_https) {
1820 if (flags.front_end_https == 1 || request->protocol == AnyP::PROTO_HTTPS)
1821 hdr_out->putStr(HDR_FRONT_END_HTTPS, "On");
1822 }
1823
1824 if (flags.chunked_request) {
1825 // Do not just copy the original value so that if the client-side
1826 // starts decode other encodings, this code may remain valid.
1827 hdr_out->putStr(HDR_TRANSFER_ENCODING, "chunked");
1828 }
1829
1830 /* Now mangle the headers. */
1831 if (Config2.onoff.mangle_request_headers)
1832 httpHdrMangleList(hdr_out, request, ROR_REQUEST);
1833
1834 strConnection.clean();
1835 }
1836
1837 /**
1838 * Decides whether a particular header may be cloned from the received Clients request
1839 * to our outgoing fetch request.
1840 */
1841 void
1842 copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, HttpRequest * request, const HttpRequest * orig_request, HttpHeader * hdr_out, const int we_do_ranges, const http_state_flags flags)
1843 {
1844 debugs(11, 5, "httpBuildRequestHeader: " << e->name << ": " << e->value );
1845
1846 switch (e->id) {
1847
1848 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid should not pass on. */
1849
1850 case HDR_PROXY_AUTHORIZATION:
1851 /** \par Proxy-Authorization:
1852 * Only pass on proxy authentication to peers for which
1853 * authentication forwarding is explicitly enabled
1854 */
1855 if (!flags.originpeer && flags.proxying && orig_request->peer_login &&
1856 (strcmp(orig_request->peer_login, "PASS") == 0 ||
1857 strcmp(orig_request->peer_login, "PROXYPASS") == 0 ||
1858 strcmp(orig_request->peer_login, "PASSTHRU") == 0)) {
1859 hdr_out->addEntry(e->clone());
1860 }
1861 break;
1862
1863 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid does not pass on. */
1864
1865 case HDR_CONNECTION: /** \par Connection: */
1866 case HDR_TE: /** \par TE: */
1867 case HDR_KEEP_ALIVE: /** \par Keep-Alive: */
1868 case HDR_PROXY_AUTHENTICATE: /** \par Proxy-Authenticate: */
1869 case HDR_TRAILER: /** \par Trailer: */
1870 case HDR_UPGRADE: /** \par Upgrade: */
1871 case HDR_TRANSFER_ENCODING: /** \par Transfer-Encoding: */
1872 break;
1873
1874
1875 /** \par OTHER headers I haven't bothered to track down yet. */
1876
1877 case HDR_AUTHORIZATION:
1878 /** \par WWW-Authorization:
1879 * Pass on WWW authentication */
1880
1881 if (!flags.originpeer) {
1882 hdr_out->addEntry(e->clone());
1883 } else {
1884 /** \note In accelerators, only forward authentication if enabled
1885 * (see also httpFixupAuthentication for special cases)
1886 */
1887 if (orig_request->peer_login &&
1888 (strcmp(orig_request->peer_login, "PASS") == 0 ||
1889 strcmp(orig_request->peer_login, "PASSTHRU") == 0 ||
1890 strcmp(orig_request->peer_login, "PROXYPASS") == 0)) {
1891 hdr_out->addEntry(e->clone());
1892 }
1893 }
1894
1895 break;
1896
1897 case HDR_HOST:
1898 /** \par Host:
1899 * Normally Squid rewrites the Host: header.
1900 * However, there is one case when we don't: If the URL
1901 * went through our redirector and the admin configured
1902 * 'redir_rewrites_host' to be off.
1903 */
1904 if (orig_request->peer_domain)
1905 hdr_out->putStr(HDR_HOST, orig_request->peer_domain);
1906 else if (request->flags.redirected && !Config.onoff.redir_rewrites_host)
1907 hdr_out->addEntry(e->clone());
1908 else {
1909 /* use port# only if not default */
1910
1911 if (orig_request->port == urlDefaultPort(orig_request->protocol)) {
1912 hdr_out->putStr(HDR_HOST, orig_request->GetHost());
1913 } else {
1914 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
1915 orig_request->GetHost(),
1916 (int) orig_request->port);
1917 }
1918 }
1919
1920 break;
1921
1922 case HDR_IF_MODIFIED_SINCE:
1923 /** \par If-Modified-Since:
1924 * append unless we added our own;
1925 * \note at most one client's ims header can pass through */
1926
1927 if (!hdr_out->has(HDR_IF_MODIFIED_SINCE))
1928 hdr_out->addEntry(e->clone());
1929
1930 break;
1931
1932 case HDR_MAX_FORWARDS:
1933 /** \par Max-Forwards:
1934 * pass only on TRACE or OPTIONS requests */
1935 if (orig_request->method == METHOD_TRACE || orig_request->method == METHOD_OPTIONS) {
1936 const int64_t hops = e->getInt64();
1937
1938 if (hops > 0)
1939 hdr_out->putInt64(HDR_MAX_FORWARDS, hops - 1);
1940 }
1941
1942 break;
1943
1944 case HDR_VIA:
1945 /** \par Via:
1946 * If Via is disabled then forward any received header as-is.
1947 * Otherwise leave for explicit updated addition later. */
1948
1949 if (!Config.onoff.via)
1950 hdr_out->addEntry(e->clone());
1951
1952 break;
1953
1954 case HDR_RANGE:
1955
1956 case HDR_IF_RANGE:
1957
1958 case HDR_REQUEST_RANGE:
1959 /** \par Range:, If-Range:, Request-Range:
1960 * Only pass if we accept ranges */
1961 if (!we_do_ranges)
1962 hdr_out->addEntry(e->clone());
1963
1964 break;
1965
1966 case HDR_PROXY_CONNECTION: // SHOULD ignore. But doing so breaks things.
1967 break;
1968
1969 case HDR_CONTENT_LENGTH:
1970 // pass through unless we chunk; also, keeping this away from default
1971 // prevents request smuggling via Connection: Content-Length tricks
1972 if (!flags.chunked_request)
1973 hdr_out->addEntry(e->clone());
1974 break;
1975
1976 case HDR_X_FORWARDED_FOR:
1977
1978 case HDR_CACHE_CONTROL:
1979 /** \par X-Forwarded-For:, Cache-Control:
1980 * handled specially by Squid, so leave off for now.
1981 * append these after the loop if needed */
1982 break;
1983
1984 case HDR_FRONT_END_HTTPS:
1985 /** \par Front-End-Https:
1986 * Pass thru only if peer is configured with front-end-https */
1987 if (!flags.front_end_https)
1988 hdr_out->addEntry(e->clone());
1989
1990 break;
1991
1992 default:
1993 /** \par default.
1994 * pass on all other header fields
1995 * which are NOT listed by the special Connection: header. */
1996
1997 if (strConnection.size()>0 && strListIsMember(&strConnection, e->name.termedBuf(), ',')) {
1998 debugs(11, 2, "'" << e->name << "' header cropped by Connection: definition");
1999 return;
2000 }
2001
2002 hdr_out->addEntry(e->clone());
2003 }
2004 }
2005
2006 bool
2007 HttpStateData::decideIfWeDoRanges (HttpRequest * orig_request)
2008 {
2009 bool result = true;
2010 /* decide if we want to do Ranges ourselves
2011 * and fetch the whole object now)
2012 * We want to handle Ranges ourselves iff
2013 * - we can actually parse client Range specs
2014 * - the specs are expected to be simple enough (e.g. no out-of-order ranges)
2015 * - reply will be cachable
2016 * (If the reply will be uncachable we have to throw it away after
2017 * serving this request, so it is better to forward ranges to
2018 * the server and fetch only the requested content)
2019 */
2020
2021 int64_t roffLimit = orig_request->getRangeOffsetLimit();
2022
2023 if (NULL == orig_request->range || !orig_request->flags.cachable
2024 || orig_request->range->offsetLimitExceeded(roffLimit) || orig_request->flags.connection_auth)
2025 result = false;
2026
2027 debugs(11, 8, "decideIfWeDoRanges: range specs: " <<
2028 orig_request->range << ", cachable: " <<
2029 orig_request->flags.cachable << "; we_do_ranges: " << result);
2030
2031 return result;
2032 }
2033
2034 /* build request prefix and append it to a given MemBuf;
2035 * return the length of the prefix */
2036 mb_size_t
2037 HttpStateData::buildRequestPrefix(HttpRequest * aRequest,
2038 HttpRequest * original_request,
2039 StoreEntry * sentry,
2040 MemBuf * mb)
2041 {
2042 const int offset = mb->size;
2043 HttpVersion httpver(1,1);
2044 mb->Printf("%s %s HTTP/%d.%d\r\n",
2045 RequestMethodStr(aRequest->method),
2046 aRequest->urlpath.size() ? aRequest->urlpath.termedBuf() : "/",
2047 httpver.major,httpver.minor);
2048 /* build and pack headers */
2049 {
2050 HttpHeader hdr(hoRequest);
2051 Packer p;
2052 httpBuildRequestHeader(aRequest, original_request, sentry, &hdr, flags);
2053
2054 if (aRequest->flags.pinned && aRequest->flags.connection_auth)
2055 aRequest->flags.auth_sent = 1;
2056 else if (hdr.has(HDR_AUTHORIZATION))
2057 aRequest->flags.auth_sent = 1;
2058
2059 packerToMemInit(&p, mb);
2060 hdr.packInto(&p);
2061 hdr.clean();
2062 packerClean(&p);
2063 }
2064 /* append header terminator */
2065 mb->append(crlf, 2);
2066 return mb->size - offset;
2067 }
2068
2069 /* This will be called when connect completes. Write request. */
2070 bool
2071 HttpStateData::sendRequest()
2072 {
2073 MemBuf mb;
2074
2075 debugs(11, 5, "httpSendRequest: FD " << fd << ", request " << request << ", this " << this << ".");
2076
2077 if (!canSend(fd)) {
2078 debugs(11,3, HERE << "cannot send request to closing FD " << fd);
2079 assert(closeHandler != NULL);
2080 return false;
2081 }
2082
2083 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
2084 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
2085 TimeoutDialer, this, HttpStateData::httpTimeout);
2086 commSetTimeout(fd, Config.Timeout.lifetime, timeoutCall);
2087 flags.do_next_read = 1;
2088 maybeReadVirginBody();
2089
2090 if (orig_request->body_pipe != NULL) {
2091 if (!startRequestBodyFlow()) // register to receive body data
2092 return false;
2093 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2094 requestSender = JobCallback(11,5,
2095 Dialer, this, HttpStateData::sentRequestBody);
2096
2097 Must(!flags.chunked_request);
2098 // use chunked encoding if we do not know the length
2099 if (orig_request->content_length < 0)
2100 flags.chunked_request = 1;
2101 } else {
2102 assert(!requestBodySource);
2103 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2104 requestSender = JobCallback(11,5,
2105 Dialer, this, HttpStateData::wroteLast);
2106 }
2107
2108 if (_peer != NULL) {
2109 if (_peer->options.originserver) {
2110 flags.proxying = 0;
2111 flags.originpeer = 1;
2112 } else {
2113 flags.proxying = 1;
2114 flags.originpeer = 0;
2115 }
2116 } else {
2117 flags.proxying = 0;
2118 flags.originpeer = 0;
2119 }
2120
2121 /*
2122 * Is keep-alive okay for all request methods?
2123 */
2124 if (orig_request->flags.must_keepalive)
2125 flags.keepalive = 1;
2126 else if (!Config.onoff.server_pconns)
2127 flags.keepalive = 0;
2128 else if (_peer == NULL)
2129 flags.keepalive = 1;
2130 else if (_peer->stats.n_keepalives_sent < 10)
2131 flags.keepalive = 1;
2132 else if ((double) _peer->stats.n_keepalives_recv /
2133 (double) _peer->stats.n_keepalives_sent > 0.50)
2134 flags.keepalive = 1;
2135
2136 if (_peer) {
2137 if (neighborType(_peer, request) == PEER_SIBLING &&
2138 !_peer->options.allow_miss)
2139 flags.only_if_cached = 1;
2140
2141 flags.front_end_https = _peer->front_end_https;
2142 }
2143
2144 mb.init();
2145 request->peer_host=_peer?_peer->host:NULL;
2146 buildRequestPrefix(request, orig_request, entry, &mb);
2147 debugs(11, 6, "httpSendRequest: FD " << fd << ":\n" << mb.buf);
2148 Comm::Write(fd, &mb, requestSender);
2149
2150 return true;
2151 }
2152
2153 bool
2154 HttpStateData::getMoreRequestBody(MemBuf &buf)
2155 {
2156 // parent's implementation can handle the no-encoding case
2157 if (!flags.chunked_request)
2158 return ServerStateData::getMoreRequestBody(buf);
2159
2160 MemBuf raw;
2161
2162 Must(requestBodySource != NULL);
2163 if (!requestBodySource->getMoreData(raw))
2164 return false; // no request body bytes to chunk yet
2165
2166 // optimization: pre-allocate buffer size that should be enough
2167 const mb_size_t rawDataSize = raw.contentSize();
2168 // we may need to send: hex-chunk-size CRLF raw-data CRLF last-chunk
2169 buf.init(16 + 2 + rawDataSize + 2 + 5, raw.max_capacity);
2170
2171 buf.Printf("%x\r\n", static_cast<unsigned int>(rawDataSize));
2172 buf.append(raw.content(), rawDataSize);
2173 buf.Printf("\r\n");
2174
2175 Must(rawDataSize > 0); // we did not accidently created last-chunk above
2176
2177 // Do not send last-chunk unless we successfully received everything
2178 if (receivedWholeRequestBody) {
2179 Must(!flags.sentLastChunk);
2180 flags.sentLastChunk = true;
2181 buf.append("0\r\n\r\n", 5);
2182 }
2183
2184 return true;
2185 }
2186
2187 void
2188 httpStart(FwdState *fwd)
2189 {
2190 debugs(11, 3, "httpStart: \"" << RequestMethodStr(fwd->request->method) << " " << fwd->entry->url() << "\"" );
2191 HttpStateData *httpState = new HttpStateData(fwd);
2192
2193 if (!httpState->sendRequest()) {
2194 debugs(11, 3, "httpStart: aborted");
2195 delete httpState;
2196 return;
2197 }
2198
2199 statCounter.server.all.requests++;
2200 statCounter.server.http.requests++;
2201
2202 /*
2203 * We used to set the read timeout here, but not any more.
2204 * Now its set in httpSendComplete() after the full request,
2205 * including request body, has been written to the server.
2206 */
2207 }
2208
2209 /// if broken posts are enabled for the request, try to fix and return true
2210 bool
2211 HttpStateData::finishingBrokenPost()
2212 {
2213 #if USE_HTTP_VIOLATIONS
2214 if (!Config.accessList.brokenPosts) {
2215 debugs(11, 5, HERE << "No brokenPosts list");
2216 return false;
2217 }
2218
2219 ACLFilledChecklist ch(Config.accessList.brokenPosts, originalRequest(), NULL);
2220 if (!ch.fastCheck()) {
2221 debugs(11, 5, HERE << "didn't match brokenPosts");
2222 return false;
2223 }
2224
2225 if (!canSend(fd)) {
2226 debugs(11,2, HERE << "ignoring broken POST for closing FD " << fd);
2227 assert(closeHandler != NULL);
2228 return true; // prevent caller from proceeding as if nothing happened
2229 }
2230
2231 debugs(11, 2, "finishingBrokenPost: fixing broken POST");
2232 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2233 requestSender = JobCallback(11,5,
2234 Dialer, this, HttpStateData::wroteLast);
2235 Comm::Write(fd, "\r\n", 2, requestSender, NULL);
2236 return true;
2237 #else
2238 return false;
2239 #endif /* USE_HTTP_VIOLATIONS */
2240 }
2241
2242 /// if needed, write last-chunk to end the request body and return true
2243 bool
2244 HttpStateData::finishingChunkedRequest()
2245 {
2246 if (flags.sentLastChunk) {
2247 debugs(11, 5, HERE << "already sent last-chunk");
2248 return false;
2249 }
2250
2251 Must(receivedWholeRequestBody); // or we should not be sending last-chunk
2252 flags.sentLastChunk = true;
2253
2254 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2255 requestSender = JobCallback(11,5,
2256 Dialer, this, HttpStateData::wroteLast);
2257 Comm::Write(fd, "0\r\n\r\n", 5, requestSender, NULL);
2258 return true;
2259 }
2260
2261 void
2262 HttpStateData::doneSendingRequestBody()
2263 {
2264 ServerStateData::doneSendingRequestBody();
2265 debugs(11,5, HERE << "doneSendingRequestBody: FD " << fd);
2266
2267 // do we need to write something after the last body byte?
2268 if (flags.chunked_request && finishingChunkedRequest())
2269 return;
2270 if (!flags.chunked_request && finishingBrokenPost())
2271 return;
2272
2273 sendComplete();
2274 }
2275
2276 // more origin request body data is available
2277 void
2278 HttpStateData::handleMoreRequestBodyAvailable()
2279 {
2280 if (eof || fd < 0) {
2281 // XXX: we should check this condition in other callbacks then!
2282 // TODO: Check whether this can actually happen: We should unsubscribe
2283 // as a body consumer when the above condition(s) are detected.
2284 debugs(11, 1, HERE << "Transaction aborted while reading HTTP body");
2285 return;
2286 }
2287
2288 assert(requestBodySource != NULL);
2289
2290 if (requestBodySource->buf().hasContent()) {
2291 // XXX: why does not this trigger a debug message on every request?
2292
2293 if (flags.headers_parsed && !flags.abuse_detected) {
2294 flags.abuse_detected = 1;
2295 debugs(11, 1, "http handleMoreRequestBodyAvailable: Likely proxy abuse detected '" << orig_request->client_addr << "' -> '" << entry->url() << "'" );
2296
2297 if (virginReply()->sline.status == HTTP_INVALID_HEADER) {
2298 comm_close(fd);
2299 return;
2300 }
2301 }
2302 }
2303
2304 HttpStateData::handleMoreRequestBodyAvailable();
2305 }
2306
2307 // premature end of the request body
2308 void
2309 HttpStateData::handleRequestBodyProducerAborted()
2310 {
2311 ServerStateData::handleRequestBodyProducerAborted();
2312 if (entry->isEmpty()) {
2313 debugs(11, 3, "request body aborted: FD " << fd);
2314 ErrorState *err;
2315 // We usually get here when ICAP REQMOD aborts during body processing.
2316 // We might also get here if client-side aborts, but then our response
2317 // should not matter because either client-side will provide its own or
2318 // there will be no response at all (e.g., if the the client has left).
2319 err = errorCon(ERR_ICAP_FAILURE, HTTP_INTERNAL_SERVER_ERROR, fwd->request);
2320 err->xerrno = ERR_DETAIL_SRV_REQMOD_REQ_BODY;
2321 fwd->fail(err);
2322 }
2323
2324 abortTransaction("request body producer aborted");
2325 }
2326
2327 // called when we wrote request headers(!) or a part of the body
2328 void
2329 HttpStateData::sentRequestBody(const CommIoCbParams &io)
2330 {
2331 if (io.size > 0)
2332 kb_incr(&statCounter.server.http.kbytes_out, io.size);
2333
2334 ServerStateData::sentRequestBody(io);
2335 }
2336
2337 // Quickly abort the transaction
2338 // TODO: destruction should be sufficient as the destructor should cleanup,
2339 // including canceling close handlers
2340 void
2341 HttpStateData::abortTransaction(const char *reason)
2342 {
2343 debugs(11,5, HERE << "aborting transaction for " << reason <<
2344 "; FD " << fd << ", this " << this);
2345
2346 if (fd >= 0) {
2347 comm_close(fd);
2348 return;
2349 }
2350
2351 fwd->handleUnregisteredServerEnd();
2352 deleteThis("HttpStateData::abortTransaction");
2353 }
2354
2355 HttpRequest *
2356 HttpStateData::originalRequest()
2357 {
2358 return orig_request;
2359 }