]> git.ipfire.org Git - thirdparty/squid.git/blame - src/http.cc
Fix assert in StoreEntry::write() when aborted entry is written.
[thirdparty/squid.git] / src / http.cc
CommitLineData
da2b3a17 1
30a4f2a8 2/*
262a0e14 3 * $Id$
30a4f2a8 4 *
5 * DEBUG: section 11 Hypertext Transfer Protocol (HTTP)
6 * AUTHOR: Harvest Derived
7 *
2b6662ba 8 * SQUID Web Proxy Cache http://www.squid-cache.org/
e25c139f 9 * ----------------------------------------------------------
30a4f2a8 10 *
2b6662ba 11 * Squid is the result of efforts by numerous individuals from
12 * the Internet community; see the CONTRIBUTORS file for full
13 * details. Many organizations have provided support for Squid's
14 * development; see the SPONSORS file for full details. Squid is
15 * Copyrighted (C) 2001 by the Regents of the University of
16 * California; see the COPYRIGHT file for full details. Squid
17 * incorporates software developed and/or copyrighted by other
18 * sources; see the CREDITS file for full details.
30a4f2a8 19 *
20 * This program is free software; you can redistribute it and/or modify
21 * it under the terms of the GNU General Public License as published by
22 * the Free Software Foundation; either version 2 of the License, or
23 * (at your option) any later version.
9e008dda 24 *
30a4f2a8 25 * This program is distributed in the hope that it will be useful,
26 * but WITHOUT ANY WARRANTY; without even the implied warranty of
27 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
28 * GNU General Public License for more details.
9e008dda 29 *
30a4f2a8 30 * You should have received a copy of the GNU General Public License
31 * along with this program; if not, write to the Free Software
cbdec147 32 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
e25c139f 33 *
30a4f2a8 34 */
019dd986 35
4a83b852 36/*
37 * Anonymizing patch by lutz@as-node.jena.thur.de
de3bdb4c 38 * have a look into http-anon.c for more information.
4a83b852 39 */
40
44a47c6e 41#include "squid.h"
9ca29d23
AJ
42
43#include "acl/FilledChecklist.h"
2f1431ea 44#if USE_AUTH
9ca29d23 45#include "auth/UserRequest.h"
2f1431ea 46#endif
655daa06 47#include "base/AsyncJobCalls.h"
3d93a84d 48#include "base/TextException.h"
25f98340 49#include "base64.h"
ec41b64c 50#include "comm/Write.h"
9a0a18de 51#if USE_DELAY_POOLS
9ca29d23
AJ
52#include "DelayPools.h"
53#endif
8b997339 54#include "err_detail_type.h"
aa839030 55#include "errorpage.h"
e6ccf245 56#include "http.h"
655daa06 57#include "HttpControlMsg.h"
528b2c61 58#include "HttpHdrContRange.h"
b19dd748 59#include "HttpHdrSc.h"
60#include "HttpHdrScTarget.h"
9ca29d23
AJ
61#include "HttpReply.h"
62#include "HttpRequest.h"
63#include "MemBuf.h"
64#include "MemObject.h"
65#include "protos.h"
1fa9b1a7 66#include "rfc1738.h"
985c86bc 67#include "SquidTime.h"
9ca29d23 68#include "Store.h"
af0bb8e5 69
9ca29d23 70
/*
 * Bracket a region of code that may throw std::exception.
 *
 * SQUID_ENTER_THROWING_CODE() opens a try block and
 * SQUID_EXIT_THROWING_CODE(status) closes it. `status` must be an
 * assignable boolean lvalue: it is set to true when the region completes
 * normally and to false when a std::exception was caught (the exception
 * text is logged at debug section 11, level 1). The two macros must always
 * be used as a pair within the same scope.
 */
#define SQUID_ENTER_THROWING_CODE() try {
#define SQUID_EXIT_THROWING_CODE(status) \
        status = true; \
    } \
    catch (const std::exception &e) { \
        debugs (11, 1, "Exception error:" << e.what()); \
        status = false; \
    }
e6ccf245 79
2afaba07 80CBDATA_CLASS_INIT(HttpStateData);
090089c4 81
6bf8443a 82static const char *const crlf = "\r\n";
4db43fab 83
f9cece6e 84static void httpMaybeRemovePublic(StoreEntry *, http_status);
9e498bfb
AJ
85static void copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, HttpRequest * request, const HttpRequest * orig_request,
86 HttpHeader * hdr_out, const int we_do_ranges, const http_state_flags);
528b2c61 87
dc56a9b1 88HttpStateData::HttpStateData(FwdState *theFwdState) : AsyncJob("HttpStateData"), ServerStateData(theFwdState),
e1381638
AJ
89 lastChunk(0), header_bytes_read(0), reply_bytes_read(0),
90 body_bytes_truncated(0), httpChunkDecoder(NULL)
2bb867b5 91{
92 debugs(11,5,HERE << "HttpStateData " << this << " created");
a3d50c30 93 ignoreCacheControl = false;
94 surrogateNoStore = false;
a3d50c30 95 fd = fwd->server_fd;
96 readBuf = new MemBuf;
9cfb5f4d 97 readBuf->init(16*1024, 256*1024);
6dd9f4bd 98 orig_request = HTTPMSGLOCK(fwd->request);
a3d50c30 99
3ff65596
AR
100 // reset peer response time stats for %<pt
101 orig_request->hier.peer_http_request_sent.tv_sec = 0;
102 orig_request->hier.peer_http_request_sent.tv_usec = 0;
103
a3d50c30 104 if (fwd->servers)
105 _peer = fwd->servers->_peer; /* might be NULL */
106
107 if (_peer) {
108 const char *url;
109
110 if (_peer->options.originserver)
d53b3f6d 111 url = orig_request->urlpath.termedBuf();
a3d50c30 112 else
3900307b 113 url = entry->url();
a3d50c30 114
5cafad19 115 HttpRequest * proxy_req = new HttpRequest(orig_request->method,
9e008dda 116 orig_request->protocol, url);
a3d50c30 117
cc192b50 118 proxy_req->SetHost(_peer->host);
a3d50c30 119
120 proxy_req->port = _peer->http_port;
121
122 proxy_req->flags = orig_request->flags;
123
124 proxy_req->lastmod = orig_request->lastmod;
125
126 proxy_req->flags.proxying = 1;
127
6dd9f4bd 128 HTTPMSGUNLOCK(request);
253caccb 129
6dd9f4bd 130 request = HTTPMSGLOCK(proxy_req);
a3d50c30 131
132 /*
133 * This NEIGHBOR_PROXY_ONLY check probably shouldn't be here.
134 * We might end up getting the object from somewhere else if,
135 * for example, the request to this neighbor fails.
136 */
137 if (_peer->options.proxy_only)
d88e3c49 138 entry->releaseRequest();
a3d50c30 139
9a0a18de 140#if USE_DELAY_POOLS
a3d50c30 141 entry->setNoDelay(_peer->options.no_delay);
a3d50c30 142#endif
a3d50c30 143 }
144
145 /*
146 * register the handler to free HTTP state data when the FD closes
147 */
dc56a9b1 148 typedef CommCbMemFunT<HttpStateData, CommCloseCbParams> Dialer;
4299f876 149 closeHandler = JobCallback(9, 5,
4cb2536f 150 Dialer, this, HttpStateData::httpStateConnClosed);
dc56a9b1 151 comm_add_close_handler(fd, closeHandler);
2bb867b5 152}
b8d8561b 153
2afaba07 154HttpStateData::~HttpStateData()
f5558c95 155{
253caccb 156 /*
3b299123 157 * don't forget that ~ServerStateData() gets called automatically
253caccb 158 */
159
2afaba07 160 if (!readBuf->isNull())
161 readBuf->clean();
62e76326 162
2afaba07 163 delete readBuf;
164
9e008dda
AJ
165 if (httpChunkDecoder)
166 delete httpChunkDecoder;
af0bb8e5 167
6dd9f4bd 168 HTTPMSGUNLOCK(orig_request);
2afaba07 169
5f8252d2 170 debugs(11,5, HERE << "HttpStateData " << this << " destroyed; FD " << fd);
171}
172
173int
fc68f6b1 174HttpStateData::dataDescriptor() const
175{
5f8252d2 176 return fd;
2afaba07 177}
dc56a9b1 178/*
2afaba07 179static void
180httpStateFree(int fd, void *data)
181{
182 HttpStateData *httpState = static_cast<HttpStateData *>(data);
bf8fe701 183 debugs(11, 5, "httpStateFree: FD " << fd << ", httpState=" << data);
5f8252d2 184 delete httpState;
dc56a9b1 185}*/
186
9e008dda 187void
dc56a9b1 188HttpStateData::httpStateConnClosed(const CommCloseCbParams &params)
189{
190 debugs(11, 5, "httpStateFree: FD " << params.fd << ", httpState=" << params.data);
191 deleteThis("HttpStateData::httpStateConnClosed");
f5558c95 192}
193
b8d8561b 194int
60745f24 195httpCachable(const HttpRequestMethod& method)
090089c4 196{
090089c4 197 /* GET and HEAD are cachable. Others are not. */
62e76326 198
9e008dda 199 // TODO: replase to HttpRequestMethod::isCachable() ?
6eb42cae 200 if (method != METHOD_GET && method != METHOD_HEAD)
62e76326 201 return 0;
202
090089c4 203 /* else cachable */
204 return 1;
205}
206
dc56a9b1 207void
208HttpStateData::httpTimeout(const CommTimeoutCbParams &params)
090089c4 209{
bf8fe701 210 debugs(11, 4, "httpTimeout: FD " << fd << ": '" << entry->url() << "'" );
62e76326 211
12158bdc 212 if (entry->store_status == STORE_PENDING) {
dc56a9b1 213 fwd->fail(errorCon(ERR_READ_TIMEOUT, HTTP_GATEWAY_TIMEOUT, fwd->request));
9b312a19 214 }
62e76326 215
0d4d4170 216 comm_close(fd);
090089c4 217}
218
f9cece6e 219static void
220httpMaybeRemovePublic(StoreEntry * e, http_status status)
221{
914b89a2 222 int remove = 0;
7e3ce7b9 223 int forbidden = 0;
f9cece6e 224 StoreEntry *pe;
62e76326 225
d46a87a8 226 if (!EBIT_TEST(e->flags, KEY_PRIVATE))
62e76326 227 return;
228
f9cece6e 229 switch (status) {
62e76326 230
f9cece6e 231 case HTTP_OK:
62e76326 232
f9cece6e 233 case HTTP_NON_AUTHORITATIVE_INFORMATION:
62e76326 234
f9cece6e 235 case HTTP_MULTIPLE_CHOICES:
62e76326 236
f9cece6e 237 case HTTP_MOVED_PERMANENTLY:
62e76326 238
f9cece6e 239 case HTTP_MOVED_TEMPORARILY:
62e76326 240
f9cece6e 241 case HTTP_GONE:
62e76326 242
7e3ce7b9 243 case HTTP_NOT_FOUND:
914b89a2 244 remove = 1;
62e76326 245
246 break;
247
7e3ce7b9 248 case HTTP_FORBIDDEN:
62e76326 249
7e3ce7b9 250 case HTTP_METHOD_NOT_ALLOWED:
62e76326 251 forbidden = 1;
252
253 break;
254
f9cece6e 255#if WORK_IN_PROGRESS
62e76326 256
c8fd0193 257 case HTTP_UNAUTHORIZED:
62e76326 258 forbidden = 1;
259
260 break;
261
f9cece6e 262#endif
62e76326 263
f9cece6e 264 default:
7e3ce7b9 265#if QUESTIONABLE
62e76326 266 /*
267 * Any 2xx response should eject previously cached entities...
268 */
abb929f0 269
62e76326 270 if (status >= 200 && status < 300)
914b89a2 271 remove = 1;
62e76326 272
7e3ce7b9 273#endif
62e76326 274
275 break;
f9cece6e 276 }
62e76326 277
914b89a2 278 if (!remove && !forbidden)
62e76326 279 return;
280
f9cece6e 281 assert(e->mem_obj);
62e76326 282
f66a9ef4 283 if (e->mem_obj->request)
62e76326 284 pe = storeGetPublicByRequest(e->mem_obj->request);
f66a9ef4 285 else
62e76326 286 pe = storeGetPublic(e->mem_obj->url, e->mem_obj->method);
287
f66a9ef4 288 if (pe != NULL) {
62e76326 289 assert(e != pe);
d9129474 290#if USE_HTCP
8dceeee3 291 neighborsHtcpClear(e, NULL, e->mem_obj->request, e->mem_obj->method, HTCP_CLR_INVALIDATION);
d9129474 292#endif
5f33b71d 293 pe->release();
0856d155 294 }
62e76326 295
914b89a2 296 /** \par
7e3ce7b9 297 * Also remove any cached HEAD response in case the object has
298 * changed.
299 */
f66a9ef4 300 if (e->mem_obj->request)
62e76326 301 pe = storeGetPublicByRequestMethod(e->mem_obj->request, METHOD_HEAD);
f66a9ef4 302 else
62e76326 303 pe = storeGetPublic(e->mem_obj->url, METHOD_HEAD);
304
f66a9ef4 305 if (pe != NULL) {
62e76326 306 assert(e != pe);
d9129474 307#if USE_HTCP
8dceeee3 308 neighborsHtcpClear(e, NULL, e->mem_obj->request, HttpRequestMethod(METHOD_HEAD), HTCP_CLR_INVALIDATION);
d9129474 309#endif
5f33b71d 310 pe->release();
7e3ce7b9 311 }
f9cece6e 312}
313
43ae1d95 314void
315HttpStateData::processSurrogateControl(HttpReply *reply)
316{
43ae1d95 317 if (request->flags.accelerated && reply->surrogate_control) {
45cca89d 318 HttpHdrScTarget *sctusable = httpHdrScGetMergedTarget(reply->surrogate_control, Config.Accel.surrogate_id);
43ae1d95 319
320 if (sctusable) {
321 if (EBIT_TEST(sctusable->mask, SC_NO_STORE) ||
322 (Config.onoff.surrogate_is_remote
323 && EBIT_TEST(sctusable->mask, SC_NO_STORE_REMOTE))) {
324 surrogateNoStore = true;
5ed72359 325 entry->makePrivate();
43ae1d95 326 }
327
328 /* The HttpHeader logic cannot tell if the header it's parsing is a reply to an
329 * accelerated request or not...
45cca89d 330 * Still, this is an abstraction breach. - RC
43ae1d95 331 */
332 if (sctusable->max_age != -1) {
333 if (sctusable->max_age < sctusable->max_stale)
334 reply->expires = reply->date + sctusable->max_age;
335 else
336 reply->expires = reply->date + sctusable->max_stale;
337
338 /* And update the timestamps */
3900307b 339 entry->timestampsSet();
43ae1d95 340 }
341
342 /* We ignore cache-control directives as per the Surrogate specification */
343 ignoreCacheControl = true;
344
345 httpHdrScTargetDestroy(sctusable);
346 }
347 }
43ae1d95 348}
349
924f73bc 350int
351HttpStateData::cacheableReply()
c54e9052 352{
585ab260 353 HttpReply const *rep = finalReply();
528b2c61 354 HttpHeader const *hdr = &rep->header;
d8b249ef 355 const int cc_mask = (rep->cache_control) ? rep->cache_control->mask : 0;
c68e9c6b 356 const char *v;
626096be 357#if USE_HTTP_VIOLATIONS
62e76326 358
38f9c547 359 const refresh_t *R = NULL;
b6445726 360
346be6ad 361 /* This strange looking define first looks up the refresh pattern
b6445726 362 * and then checks if the specified flag is set. The main purpose
626096be 363 * of this is to simplify the refresh pattern lookup and USE_HTTP_VIOLATIONS
b6445726 364 * condition
365 */
366#define REFRESH_OVERRIDE(flag) \
5f8252d2 367 ((R = (R ? R : refreshLimits(entry->mem_obj->url))) , \
368 (R && R->flags.flag))
b445957e 369#else
370#define REFRESH_OVERRIDE(flag) 0
38f9c547 371#endif
43ae1d95 372
38f9c547 373 if (surrogateNoStore)
62e76326 374 return 0;
375
8466a4af
AR
376 // RFC 2616: do not cache replies to responses with no-store CC directive
377 if (request && request->cache_control &&
ab745b44
A
378 EBIT_TEST(request->cache_control->mask, CC_NO_STORE) &&
379 !REFRESH_OVERRIDE(ignore_no_store))
8466a4af
AR
380 return 0;
381
924f73bc 382 if (!ignoreCacheControl) {
38f9c547 383 if (EBIT_TEST(cc_mask, CC_PRIVATE)) {
b6445726 384 if (!REFRESH_OVERRIDE(ignore_private))
38f9c547 385 return 0;
386 }
387
388 if (EBIT_TEST(cc_mask, CC_NO_CACHE)) {
b6445726 389 if (!REFRESH_OVERRIDE(ignore_no_cache))
38f9c547 390 return 0;
391 }
392
393 if (EBIT_TEST(cc_mask, CC_NO_STORE)) {
b6445726 394 if (!REFRESH_OVERRIDE(ignore_no_store))
38f9c547 395 return 0;
396 }
43ae1d95 397 }
398
d67acb4e 399 if (request->flags.auth || request->flags.auth_sent) {
62e76326 400 /*
401 * Responses to requests with authorization may be cached
402 * only if a Cache-Control: public reply header is present.
403 * RFC 2068, sec 14.9.4
404 */
405
38f9c547 406 if (!EBIT_TEST(cc_mask, CC_PUBLIC)) {
b6445726 407 if (!REFRESH_OVERRIDE(ignore_auth))
38f9c547 408 return 0;
409 }
a6dfe2d9 410 }
62e76326 411
c68e9c6b 412 /* Pragma: no-cache in _replies_ is not documented in HTTP,
413 * but servers like "Active Imaging Webcast/2.0" sure do use it */
a9925b40 414 if (hdr->has(HDR_PRAGMA)) {
30abd221 415 String s = hdr->getList(HDR_PRAGMA);
62e76326 416 const int no_cache = strListIsMember(&s, "no-cache", ',');
30abd221 417 s.clean();
62e76326 418
38f9c547 419 if (no_cache) {
b6445726 420 if (!REFRESH_OVERRIDE(ignore_no_cache))
38f9c547 421 return 0;
422 }
c68e9c6b 423 }
62e76326 424
c68e9c6b 425 /*
426 * The "multipart/x-mixed-replace" content type is used for
427 * continuous push replies. These are generally dynamic and
428 * probably should not be cachable
429 */
a9925b40 430 if ((v = hdr->getStr(HDR_CONTENT_TYPE)))
62e76326 431 if (!strncasecmp(v, "multipart/x-mixed-replace", 25))
432 return 0;
433
585ab260 434 switch (rep->sline.status) {
62e76326 435 /* Responses that are cacheable */
436
19a04dac 437 case HTTP_OK:
62e76326 438
19a04dac 439 case HTTP_NON_AUTHORITATIVE_INFORMATION:
62e76326 440
19a04dac 441 case HTTP_MULTIPLE_CHOICES:
62e76326 442
19a04dac 443 case HTTP_MOVED_PERMANENTLY:
62e76326 444
19a04dac 445 case HTTP_GONE:
62e76326 446 /*
447 * Don't cache objects that need to be refreshed on next request,
448 * unless we know how to refresh it.
449 */
450
3d8b6ba4 451 if (!refreshIsCachable(entry) && !REFRESH_OVERRIDE(store_stale)) {
bf8fe701 452 debugs(22, 3, "refreshIsCachable() returned non-cacheable..");
62e76326 453 return 0;
ca34dacd 454 } else
62e76326 455 return 1;
456
62e76326 457 /* NOTREACHED */
458 break;
459
460 /* Responses that only are cacheable if the server says so */
461
19a04dac 462 case HTTP_MOVED_TEMPORARILY:
f18c86fd 463 case HTTP_TEMPORARY_REDIRECT:
6a2bf8f4 464 if (rep->expires > rep->date && rep->date > 0)
62e76326 465 return 1;
466 else
467 return 0;
468
469 /* NOTREACHED */
470 break;
471
472 /* Errors can be negatively cached */
473
19a04dac 474 case HTTP_NO_CONTENT:
62e76326 475
19a04dac 476 case HTTP_USE_PROXY:
62e76326 477
19a04dac 478 case HTTP_BAD_REQUEST:
62e76326 479
19a04dac 480 case HTTP_FORBIDDEN:
62e76326 481
19a04dac 482 case HTTP_NOT_FOUND:
62e76326 483
19a04dac 484 case HTTP_METHOD_NOT_ALLOWED:
62e76326 485
19a04dac 486 case HTTP_REQUEST_URI_TOO_LARGE:
62e76326 487
19a04dac 488 case HTTP_INTERNAL_SERVER_ERROR:
62e76326 489
19a04dac 490 case HTTP_NOT_IMPLEMENTED:
62e76326 491
19a04dac 492 case HTTP_BAD_GATEWAY:
62e76326 493
19a04dac 494 case HTTP_SERVICE_UNAVAILABLE:
62e76326 495
19a04dac 496 case HTTP_GATEWAY_TIMEOUT:
62e76326 497 return -1;
498
499 /* NOTREACHED */
500 break;
501
502 /* Some responses can never be cached */
503
0cdcddb9 504 case HTTP_PARTIAL_CONTENT: /* Not yet supported */
62e76326 505
19a04dac 506 case HTTP_SEE_OTHER:
62e76326 507
19a04dac 508 case HTTP_NOT_MODIFIED:
62e76326 509
19a04dac 510 case HTTP_UNAUTHORIZED:
62e76326 511
19a04dac 512 case HTTP_PROXY_AUTHENTICATION_REQUIRED:
62e76326 513
0cdcddb9 514 case HTTP_INVALID_HEADER: /* Squid header parsing error */
4eb368f9 515
516 case HTTP_HEADER_TOO_LARGE:
b004a7fc 517
518 case HTTP_PAYMENT_REQUIRED:
519 case HTTP_NOT_ACCEPTABLE:
520 case HTTP_REQUEST_TIMEOUT:
521 case HTTP_CONFLICT:
522 case HTTP_LENGTH_REQUIRED:
523 case HTTP_PRECONDITION_FAILED:
524 case HTTP_REQUEST_ENTITY_TOO_LARGE:
525 case HTTP_UNSUPPORTED_MEDIA_TYPE:
526 case HTTP_UNPROCESSABLE_ENTITY:
527 case HTTP_LOCKED:
528 case HTTP_FAILED_DEPENDENCY:
529 case HTTP_INSUFFICIENT_STORAGE:
cc7c3c84 530 case HTTP_REQUESTED_RANGE_NOT_SATISFIABLE:
531 case HTTP_EXPECTATION_FAILED:
b004a7fc 532
62e76326 533 return 0;
534
41217979
AJ
535 default:
536 /* RFC 2616 section 6.1.1: an unrecognized response MUST NOT be cached. */
537 debugs (11, 3, HERE << "Unknown HTTP status code " << rep->sline.status << ". Not cacheable.");
62e76326 538
539 return 0;
540
541 /* NOTREACHED */
542 break;
c54e9052 543 }
62e76326 544
79d39a72 545 /* NOTREACHED */
c54e9052 546}
090089c4 547
f66a9ef4 548/*
9e008dda 549 * For Vary, store the relevant request headers as
f66a9ef4 550 * virtual headers in the reply
551 * Returns false if the variance cannot be stored
552 */
553const char *
190154cf 554httpMakeVaryMark(HttpRequest * request, HttpReply const * reply)
f66a9ef4 555{
30abd221 556 String vary, hdr;
f66a9ef4 557 const char *pos = NULL;
558 const char *item;
559 const char *value;
560 int ilen;
30abd221 561 static String vstr;
f66a9ef4 562
30abd221 563 vstr.clean();
a9925b40 564 vary = reply->header.getList(HDR_VARY);
62e76326 565
f66a9ef4 566 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
62e76326 567 char *name = (char *)xmalloc(ilen + 1);
568 xstrncpy(name, item, ilen + 1);
569 Tolower(name);
9776e3cc 570
571 if (strcmp(name, "*") == 0) {
572 /* Can not handle "Vary: *" withtout ETag support */
573 safe_free(name);
30abd221 574 vstr.clean();
9776e3cc 575 break;
576 }
577
62e76326 578 strListAdd(&vstr, name, ',');
a9925b40 579 hdr = request->header.getByName(name);
62e76326 580 safe_free(name);
d53b3f6d 581 value = hdr.termedBuf();
62e76326 582
583 if (value) {
584 value = rfc1738_escape_part(value);
585 vstr.append("=\"", 2);
586 vstr.append(value);
587 vstr.append("\"", 1);
588 }
589
30abd221 590 hdr.clean();
f66a9ef4 591 }
62e76326 592
30abd221 593 vary.clean();
f66a9ef4 594#if X_ACCELERATOR_VARY
62e76326 595
aa38be4a 596 pos = NULL;
a9925b40 597 vary = reply->header.getList(HDR_X_ACCELERATOR_VARY);
62e76326 598
f66a9ef4 599 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
62e76326 600 char *name = (char *)xmalloc(ilen + 1);
601 xstrncpy(name, item, ilen + 1);
602 Tolower(name);
603 strListAdd(&vstr, name, ',');
a9925b40 604 hdr = request->header.getByName(name);
62e76326 605 safe_free(name);
d53b3f6d 606 value = hdr.termedBuf();
62e76326 607
608 if (value) {
609 value = rfc1738_escape_part(value);
610 vstr.append("=\"", 2);
611 vstr.append(value);
612 vstr.append("\"", 1);
613 }
614
30abd221 615 hdr.clean();
f66a9ef4 616 }
62e76326 617
30abd221 618 vary.clean();
f66a9ef4 619#endif
62e76326 620
d53b3f6d
FC
621 debugs(11, 3, "httpMakeVaryMark: " << vstr);
622 return vstr.termedBuf();
f66a9ef4 623}
624
2afaba07 625void
626HttpStateData::keepaliveAccounting(HttpReply *reply)
627{
628 if (flags.keepalive)
629 if (_peer)
630 _peer->stats.n_keepalives_sent++;
631
632 if (reply->keep_alive) {
633 if (_peer)
634 _peer->stats.n_keepalives_recv++;
635
af6a12ee
AJ
636 if (Config.onoff.detect_broken_server_pconns
637 && reply->bodySize(request->method) == -1 && !flags.chunked) {
bf8fe701 638 debugs(11, 1, "keepaliveAccounting: Impossible keep-alive header from '" << entry->url() << "'" );
639 // debugs(11, 2, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------" );
2afaba07 640 flags.keepalive_broken = 1;
641 }
642 }
643}
644
645void
646HttpStateData::checkDateSkew(HttpReply *reply)
647{
648 if (reply->date > -1 && !_peer) {
649 int skew = abs((int)(reply->date - squid_curtime));
650
651 if (skew > 86400)
cc192b50 652 debugs(11, 3, "" << request->GetHost() << "'s clock is skewed by " << skew << " seconds!");
2afaba07 653 }
654}
655
073ba374 656/**
4eb368f9 657 * This creates the error page itself.. its likely
658 * that the forward ported reply header max size patch
659 * generates non http conformant error pages - in which
660 * case the errors where should be 'BAD_GATEWAY' etc
661 */
b8d8561b 662void
2afaba07 663HttpStateData::processReplyHeader()
f5558c95 664{
073ba374 665 /** Creates a blank header. If this routine is made incremental, this will not do */
859f1666
AJ
666
667 /* NP: all exit points to this function MUST call ctx_exit(ctx) */
82384411 668 Ctx ctx = ctx_enter(entry->mem_obj->url);
859f1666 669
bf8fe701 670 debugs(11, 3, "processReplyHeader: key '" << entry->getMD5Text() << "'");
62e76326 671
1a98175f 672 assert(!flags.headers_parsed);
62e76326 673
859f1666
AJ
674 if (!readBuf->hasContent()) {
675 ctx_exit(ctx);
b73a07d6 676 return;
859f1666 677 }
b73a07d6 678
2afaba07 679 http_status error = HTTP_STATUS_NONE;
62e76326 680
585ab260 681 HttpReply *newrep = new HttpReply;
4a56ee8d 682 const bool parsed = newrep->parse(readBuf, eof, &error);
62e76326 683
e77d7ef0 684 if (!parsed && readBuf->contentSize() > 5 && strncmp(readBuf->content(), "HTTP/", 5) != 0 && strncmp(readBuf->content(), "ICY", 3) != 0) {
9e008dda
AJ
685 MemBuf *mb;
686 HttpReply *tmprep = new HttpReply;
11992b6f 687 tmprep->setHeaders(HTTP_OK, "Gatewaying", NULL, -1, -1, -1);
9e008dda
AJ
688 tmprep->header.putExt("X-Transformed-From", "HTTP/0.9");
689 mb = tmprep->pack();
690 newrep->parse(mb, eof, &error);
ddbe383d 691 delete mb;
9e008dda
AJ
692 delete tmprep;
693 } else {
694 if (!parsed && error > 0) { // unrecoverable parsing error
695 debugs(11, 3, "processReplyHeader: Non-HTTP-compliant header: '" << readBuf->content() << "'");
696 flags.headers_parsed = 1;
871c031f 697 newrep->sline.version = HttpVersion(1,1);
9e008dda
AJ
698 newrep->sline.status = error;
699 HttpReply *vrep = setVirginReply(newrep);
700 entry->replaceHttpReply(vrep);
701 ctx_exit(ctx);
702 return;
703 }
704
705 if (!parsed) { // need more data
706 assert(!error);
707 assert(!eof);
708 delete newrep;
709 ctx_exit(ctx);
710 return;
711 }
712
713 debugs(11, 9, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------");
714
715 header_bytes_read = headersEnd(readBuf->content(), readBuf->contentSize());
716 readBuf->consume(header_bytes_read);
f5558c95 717 }
62e76326 718
c679653d
AR
719 newrep->removeStaleWarnings();
720
0c3d3f65 721 if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->sline.status >= 100 && newrep->sline.status < 200) {
655daa06 722 handle1xx(newrep);
3d9e71e6 723 ctx_exit(ctx);
3d9e71e6
AJ
724 return;
725 }
726
af0bb8e5 727 flags.chunked = 0;
0c3d3f65 728 if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->header.chunked()) {
9e008dda
AJ
729 flags.chunked = 1;
730 httpChunkDecoder = new ChunkedCodingParser;
af0bb8e5 731 }
732
9e008dda
AJ
733 if (!peerSupportsConnectionPinning())
734 orig_request->flags.connection_auth_disabled = 1;
d67acb4e 735
585ab260 736 HttpReply *vrep = setVirginReply(newrep);
6965ab28 737 flags.headers_parsed = 1;
738
585ab260 739 keepaliveAccounting(vrep);
47ac2ebe 740
585ab260 741 checkDateSkew(vrep);
47ac2ebe 742
585ab260 743 processSurrogateControl (vrep);
528b2c61 744
073ba374 745 /** \todo IF the reply is a 1.0 reply, AND it has a Connection: Header
528b2c61 746 * Parse the header and remove all referenced headers
747 */
748
3ff65596
AR
749 orig_request->hier.peer_reply_status = newrep->sline.status;
750
2afaba07 751 ctx_exit(ctx);
752}
753
655daa06
AR
754/// ignore or start forwarding the 1xx response (a.k.a., control message)
755void
756HttpStateData::handle1xx(HttpReply *reply)
757{
758 HttpMsgPointerT<HttpReply> msg(reply); // will destroy reply if unused
759
760 // one 1xx at a time: we must not be called while waiting for previous 1xx
761 Must(!flags.handling1xx);
762 flags.handling1xx = true;
763
764 if (!orig_request->canHandle1xx()) {
765 debugs(11, 2, HERE << "ignoring client-unsupported 1xx");
766 proceedAfter1xx();
767 return;
768 }
769
770#if USE_HTTP_VIOLATIONS
771 // check whether the 1xx response forwarding is allowed by squid.conf
772 if (Config.accessList.reply) {
e11513e1 773 ACLFilledChecklist ch(Config.accessList.reply, originalRequest(), NULL);
655daa06
AR
774 ch.reply = HTTPMSGLOCK(reply);
775 if (!ch.fastCheck()) { // TODO: support slow lookups?
776 debugs(11, 3, HERE << "ignoring denied 1xx");
777 proceedAfter1xx();
778 return;
de48b288 779 }
655daa06
AR
780 }
781#endif // USE_HTTP_VIOLATIONS
782
783 debugs(11, 2, HERE << "forwarding 1xx to client");
784
785 // the Sink will use this to call us back after writing 1xx to the client
786 typedef NullaryMemFunT<HttpStateData> CbDialer;
787 const AsyncCall::Pointer cb = JobCallback(11, 3, CbDialer, this,
de48b288 788 HttpStateData::proceedAfter1xx);
b1cf2350 789 CallJobHere1(11, 4, orig_request->clientConnectionManager, ConnStateData,
655daa06
AR
790 ConnStateData::sendControlMsg, HttpControlMsg(msg, cb));
791 // If the call is not fired, then the Sink is gone, and HttpStateData
792 // will terminate due to an aborted store entry or another similar error.
793 // If we get stuck, it is not handle1xx fault if we could get stuck
794 // for similar reasons without a 1xx response.
795}
796
797/// restores state and resumes processing after 1xx is ignored or forwarded
798void
799HttpStateData::proceedAfter1xx()
800{
801 Must(flags.handling1xx);
802
803 debugs(11, 2, HERE << "consuming " << header_bytes_read <<
de48b288 804 " header and " << reply_bytes_read << " body bytes read after 1xx");
655daa06
AR
805 header_bytes_read = 0;
806 reply_bytes_read = 0;
807
808 CallJobHere(11, 3, this, HttpStateData, HttpStateData::processReply);
809}
810
811
d67acb4e
AJ
812/**
813 * returns true if the peer can support connection pinning
814*/
815bool HttpStateData::peerSupportsConnectionPinning() const
816{
817 const HttpReply *rep = entry->mem_obj->getReply();
818 const HttpHeader *hdr = &rep->header;
819 bool rc;
820 String header;
821
822 if (!_peer)
9e008dda
AJ
823 return true;
824
825 /*If this peer does not support connection pinning (authenticated
d67acb4e
AJ
826 connections) return false
827 */
828 if (!_peer->connection_auth)
9e008dda 829 return false;
d67acb4e 830
9e008dda 831 /*The peer supports connection pinning and the http reply status
d67acb4e
AJ
832 is not unauthorized, so the related connection can be pinned
833 */
834 if (rep->sline.status != HTTP_UNAUTHORIZED)
9e008dda
AJ
835 return true;
836
837 /*The server respond with HTTP_UNAUTHORIZED and the peer configured
838 with "connection-auth=on" we know that the peer supports pinned
d67acb4e
AJ
839 connections
840 */
841 if (_peer->connection_auth == 1)
9e008dda 842 return true;
d67acb4e 843
9e008dda
AJ
844 /*At this point peer has configured with "connection-auth=auto"
845 parameter so we need some extra checks to decide if we are going
d67acb4e
AJ
846 to allow pinned connections or not
847 */
848
9e008dda 849 /*if the peer configured with originserver just allow connection
d67acb4e
AJ
850 pinning (squid 2.6 behaviour)
851 */
852 if (_peer->options.originserver)
9e008dda 853 return true;
d67acb4e
AJ
854
855 /*if the connections it is already pinned it is OK*/
856 if (request->flags.pinned)
9e008dda
AJ
857 return true;
858
859 /*Allow pinned connections only if the Proxy-support header exists in
860 reply and has in its list the "Session-Based-Authentication"
d67acb4e
AJ
861 which means that the peer supports connection pinning.
862 */
863 if (!hdr->has(HDR_PROXY_SUPPORT))
9e008dda 864 return false;
d67acb4e
AJ
865
866 header = hdr->getStrOrList(HDR_PROXY_SUPPORT);
867 /* XXX This ought to be done in a case-insensitive manner */
d53b3f6d 868 rc = (strstr(header.termedBuf(), "Session-Based-Authentication") != NULL);
d67acb4e
AJ
869
870 return rc;
871}
872
5f8252d2 873// Called when we parsed (and possibly adapted) the headers but
874// had not starting storing (a.k.a., sending) the body yet.
2afaba07 875void
876HttpStateData::haveParsedReplyHeaders()
877{
c1520b67
AJ
878 ServerStateData::haveParsedReplyHeaders();
879
2afaba07 880 Ctx ctx = ctx_enter(entry->mem_obj->url);
585ab260 881 HttpReply *rep = finalReply();
2afaba07 882
585ab260 883 if (rep->sline.status == HTTP_PARTIAL_CONTENT &&
884 rep->content_range)
885 currentOffset = rep->content_range->spec.offset;
62e76326 886
3900307b 887 entry->timestampsSet();
62e76326 888
9bc73deb 889 /* Check if object is cacheable or not based on reply code */
585ab260 890 debugs(11, 3, "haveParsedReplyHeaders: HTTP CODE: " << rep->sline.status);
62e76326 891
9bc73deb 892 if (neighbors_do_private_keys)
585ab260 893 httpMaybeRemovePublic(entry, rep->sline.status);
e6ccf245 894
585ab260 895 if (rep->header.has(HDR_VARY)
f66a9ef4 896#if X_ACCELERATOR_VARY
585ab260 897 || rep->header.has(HDR_X_ACCELERATOR_VARY)
f66a9ef4 898#endif
4b44c907 899 ) {
585ab260 900 const char *vary = httpMakeVaryMark(orig_request, rep);
4b44c907 901
902 if (!vary) {
5ed72359 903 entry->makePrivate();
d7d3253b
AJ
904 if (!fwd->reforwardableStatus(rep->sline.status))
905 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
4b44c907 906 goto no_cache;
62e76326 907 }
908
4b44c907 909 entry->mem_obj->vary_headers = xstrdup(vary);
910 }
911
2afaba07 912 /*
913 * If its not a reply that we will re-forward, then
914 * allow the client to get it.
915 */
585ab260 916 if (!fwd->reforwardableStatus(rep->sline.status))
2afaba07 917 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
918
4b44c907 919 switch (cacheableReply()) {
920
921 case 1:
5ed72359 922 entry->makePublic();
62e76326 923 break;
924
9bc73deb 925 case 0:
5ed72359 926 entry->makePrivate();
62e76326 927 break;
928
9bc73deb 929 case -1:
4b44c907 930
626096be 931#if USE_HTTP_VIOLATIONS
4b44c907 932 if (Config.negativeTtl > 0)
5ed72359 933 entry->cacheNegatively();
4b44c907 934 else
ac9cc053 935#endif
5ed72359 936 entry->makePrivate();
4b44c907 937
62e76326 938 break;
939
9bc73deb 940 default:
62e76326 941 assert(0);
4b44c907 942
62e76326 943 break;
9bc73deb 944 }
62e76326 945
4b44c907 946no_cache:
947
585ab260 948 if (!ignoreCacheControl && rep->cache_control) {
7948b784 949 if (EBIT_TEST(rep->cache_control->mask, CC_PROXY_REVALIDATE) ||
477438e1
A
950 EBIT_TEST(rep->cache_control->mask, CC_MUST_REVALIDATE) ||
951 EBIT_TEST(rep->cache_control->mask, CC_S_MAXAGE))
62e76326 952 EBIT_SET(entry->flags, ENTRY_REVALIDATE);
9bc73deb 953 }
62e76326 954
c3609322 955#if HEADERS_LOG
585ab260 956 headersLog(1, 0, request->method, rep);
fc68f6b1 957
c3609322 958#endif
5f8252d2 959
960 ctx_exit(ctx);
f5558c95 961}
962
528b2c61 963HttpStateData::ConnectionStatus
964HttpStateData::statusIfComplete() const
603a02fd 965{
585ab260 966 const HttpReply *rep = virginReply();
073ba374
AJ
967 /** \par
968 * If the reply wants to close the connection, it takes precedence */
62e76326 969
2afaba07 970 if (httpHeaderHasConnDir(&rep->header, "close"))
62e76326 971 return COMPLETE_NONPERSISTENT_MSG;
972
073ba374
AJ
973 /** \par
974 * If we didn't send a keep-alive request header, then this
978e455f 975 * can not be a persistent connection.
976 */
528b2c61 977 if (!flags.keepalive)
62e76326 978 return COMPLETE_NONPERSISTENT_MSG;
979
073ba374 980 /** \par
72b63f06 981 * If we haven't sent the whole request then this can not be a persistent
982 * connection.
983 */
984 if (!flags.request_sent) {
f4762666 985 debugs(11, 2, "statusIfComplete: Request not yet fully sent \"" << RequestMethodStr(orig_request->method) << " " << entry->url() << "\"" );
72b63f06 986 return COMPLETE_NONPERSISTENT_MSG;
987 }
988
073ba374 989 /** \par
9f5a2895 990 * What does the reply have to say about keep-alive?
991 */
073ba374
AJ
992 /**
993 \bug XXX BUG?
b6a2f15e 994 * If the origin server (HTTP/1.0) does not send a keep-alive
995 * header, but keeps the connection open anyway, what happens?
996 * We'll return here and http.c waits for an EOF before changing
997 * store_status to STORE_OK. Combine this with ENTRY_FWD_HDR_WAIT
998 * and an error status code, and we might have to wait until
999 * the server times out the socket.
1000 */
2afaba07 1001 if (!rep->keep_alive)
528b2c61 1002 return COMPLETE_NONPERSISTENT_MSG;
62e76326 1003
528b2c61 1004 return COMPLETE_PERSISTENT_MSG;
1005}
1006
1007HttpStateData::ConnectionStatus
1008HttpStateData::persistentConnStatus() const
1009{
ba82c452 1010 debugs(11, 3, "persistentConnStatus: FD " << fd << " eof=" << eof);
839291ac
AJ
1011 if (eof) // already reached EOF
1012 return COMPLETE_NONPERSISTENT_MSG;
1013
505c2f28
AR
1014 /* If server fd is closing (but we have not been notified yet), stop Comm
1015 I/O to avoid assertions. TODO: Change Comm API to handle callers that
1016 want more I/O after async closing (usually initiated by others). */
1017 // XXX: add canReceive or s/canSend/canTalkToServer/
1018 if (!canSend(fd))
1019 return COMPLETE_NONPERSISTENT_MSG;
1020
9035d1d5
AJ
1021 /** \par
1022 * In chunked response we do not know the content length but we are absolutely
af0bb8e5 1023 * sure about the end of response, so we are calling the statusIfComplete to
9e008dda 1024 * decide if we can be persistant
af0bb8e5 1025 */
839291ac 1026 if (lastChunk && flags.chunked)
9e008dda 1027 return statusIfComplete();
af0bb8e5 1028
718d84bf
AR
1029 const HttpReply *vrep = virginReply();
1030 debugs(11, 5, "persistentConnStatus: content_length=" << vrep->content_length);
1031
47f6e231 1032 const int64_t clen = vrep->bodySize(request->method);
fc68f6b1 1033
bf8fe701 1034 debugs(11, 5, "persistentConnStatus: clen=" << clen);
2afaba07 1035
35282fbf 1036 /* If the body size is unknown we must wait for EOF */
1037 if (clen < 0)
62e76326 1038 return INCOMPLETE_MSG;
1039
9035d1d5
AJ
1040 /** \par
1041 * If the body size is known, we must wait until we've gotten all of it. */
5f8252d2 1042 if (clen > 0) {
1043 // old technique:
585ab260 1044 // if (entry->mem_obj->endOffset() < vrep->content_length + vrep->hdr_sz)
47f6e231 1045 const int64_t body_bytes_read = reply_bytes_read - header_bytes_read;
5f8252d2 1046 debugs(11,5, "persistentConnStatus: body_bytes_read=" <<
585ab260 1047 body_bytes_read << " content_length=" << vrep->content_length);
2afaba07 1048
585ab260 1049 if (body_bytes_read < vrep->content_length)
5f8252d2 1050 return INCOMPLETE_MSG;
821beb5e
AR
1051
1052 if (body_bytes_truncated > 0) // already read more than needed
1053 return COMPLETE_NONPERSISTENT_MSG; // disable pconns
5f8252d2 1054 }
62e76326 1055
9035d1d5
AJ
1056 /** \par
1057 * If there is no message body or we got it all, we can be persistent */
5f8252d2 1058 return statusIfComplete();
603a02fd 1059}
090089c4 1060
2afaba07 1061/*
1062 * This is the callback after some data has been read from the network
1063 */
dc56a9b1 1064/*
e5ee81f0 1065void
d53b3f6d 1066HttpStateData::ReadReplyWrapper(int fd, char *buf, size_t len, comm_err_t flag, int xerrno, void *data)
c4b7a5a9 1067{
1068 HttpStateData *httpState = static_cast<HttpStateData *>(data);
7194987f 1069 assert (fd == httpState->fd);
d53b3f6d 1070 // assert(buf == readBuf->content());
1d5161bd 1071 PROF_start(HttpStateData_readReply);
e6edd8df 1072 httpState->readReply(len, flag, xerrno);
1d5161bd 1073 PROF_stop(HttpStateData_readReply);
c4b7a5a9 1074}
dc56a9b1 1075*/
073ba374 1076
2afdbf48 1077/* XXX this function is too long! */
c4b7a5a9 1078void
e6edd8df 1079HttpStateData::readReply(const CommIoCbParams &io)
090089c4 1080{
30a4f2a8 1081 int bin;
090089c4 1082 int clen;
dc56a9b1 1083 int len = io.size;
c4b7a5a9 1084
dc56a9b1 1085 assert(fd == io.fd);
1086
1087 flags.do_next_read = 0;
9e008dda 1088
7a7cc03f 1089 debugs(11, 5, "httpReadReply: FD " << fd << ": len " << len << ".");
62e76326 1090
7a7cc03f 1091 // Bail out early on COMM_ERR_CLOSING - close handlers will tidy up for us
dc56a9b1 1092 if (io.flag == COMM_ERR_CLOSING) {
bf8fe701 1093 debugs(11, 3, "http socket closing");
c4b7a5a9 1094 return;
1095 }
1096
e92e4e44 1097 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
5f8252d2 1098 maybeReadVirginBody();
62e76326 1099 return;
e92e4e44 1100 }
c4b7a5a9 1101
fdf55365 1102 // handle I/O errors
dc56a9b1 1103 if (io.flag != COMM_OK || len < 0) {
7a7cc03f 1104 debugs(11, 2, "httpReadReply: FD " << fd << ": read failure: " << xstrerror() << ".");
fdf55365 1105
dc56a9b1 1106 if (ignoreErrno(io.xerrno)) {
fdf55365 1107 flags.do_next_read = 1;
1108 } else {
1109 ErrorState *err;
1110 err = errorCon(ERR_READ_ERROR, HTTP_BAD_GATEWAY, fwd->request);
dc56a9b1 1111 err->xerrno = io.xerrno;
fdf55365 1112 fwd->fail(err);
1113 flags.do_next_read = 0;
1114 comm_close(fd);
1115 }
1116
1117 return;
1118 }
1119
7a7cc03f 1120 // update I/O stats
fdf55365 1121 if (len > 0) {
2afaba07 1122 readBuf->appended(len);
5f8252d2 1123 reply_bytes_read += len;
9a0a18de 1124#if USE_DELAY_POOLS
2afaba07 1125 DelayId delayId = entry->mem_obj->mostBytesAllowed();
62e76326 1126 delayId.bytesIn(len);
447e176b 1127#endif
62e76326 1128
1129 kb_incr(&statCounter.server.all.kbytes_in, len);
1130 kb_incr(&statCounter.server.http.kbytes_in, len);
62e76326 1131 IOStats.Http.reads++;
1132
1133 for (clen = len - 1, bin = 0; clen; bin++)
1134 clen >>= 1;
1135
1136 IOStats.Http.read_hist[bin]++;
3ff65596
AR
1137
1138 // update peer response time stats (%<pt)
1139 const timeval &sent = orig_request->hier.peer_http_request_sent;
1140 orig_request->hier.peer_response_time =
1141 sent.tv_sec ? tvSubMsec(sent, current_time) : -1;
30a4f2a8 1142 }
62e76326 1143
073ba374
AJ
1144 /** \par
1145 * Here the RFC says we should ignore whitespace between replies, but we can't as
5fa061b8 1146 * doing so breaks HTTP/0.9 replies beginning with witespace, and in addition
1147 * the response splitting countermeasures is extremely likely to trigger on this,
1148 * not allowing connection reuse in the first place.
1149 */
1150#if DONT_DO_THIS
fdf55365 1151 if (!flags.headers_parsed && len > 0 && fd_table[fd].uses > 1) {
5fa061b8 1152 /* Skip whitespace between replies */
62e76326 1153
d53b3f6d 1154 while (len > 0 && xisspace(*buf))
41d00cd3 1155 memmove(buf, buf + 1, len--);
62e76326 1156
1157 if (len == 0) {
1158 /* Continue to read... */
21b92762 1159 /* Timeout NOT increased. This whitespace was from previous reply */
f61f0107 1160 flags.do_next_read = 1;
5f8252d2 1161 maybeReadVirginBody();
62e76326 1162 return;
1163 }
5ede6c8f 1164 }
62e76326 1165
5fa061b8 1166#endif
1167
ba82c452 1168 if (len == 0) { // reached EOF?
62e76326 1169 eof = 1;
f61f0107 1170 flags.do_next_read = 0;
da6c8415 1171
b73a07d6 1172 /* Bug 2879: Replies may terminate with \r\n then EOF instead of \r\n\r\n
da6c8415 1173 * Ensure here that we have at minimum two \r\n when EOF is seen.
b73a07d6 1174 * TODO: Add eof parameter to headersEnd() and move this hack there.
da6c8415 1175 */
b73a07d6 1176 if (readBuf->contentSize() && !flags.headers_parsed) {
da6c8415
AJ
1177 /*
1178 * Yes Henrik, there is a point to doing this. When we
1179 * called httpProcessReplyHeader() before, we didn't find
1180 * the end of headers, but now we are definately at EOF, so
1181 * we want to process the reply headers.
1182 */
1183 /* Fake an "end-of-headers" to work around such broken servers */
1184 readBuf->append("\r\n", 2);
da6c8415 1185 }
ba82c452 1186 }
62e76326 1187
655daa06
AR
1188 processReply();
1189}
1190
1191/// processes the already read and buffered response data, possibly after
1192/// waiting for asynchronous 1xx control message processing
1193void
de48b288
A
1194HttpStateData::processReply()
1195{
655daa06
AR
1196
1197 if (flags.handling1xx) { // we came back after handling a 1xx response
1198 debugs(11, 5, HERE << "done with 1xx handling");
1199 flags.handling1xx = false;
1200 Must(!flags.headers_parsed);
1201 }
1202
ba82c452 1203 if (!flags.headers_parsed) { // have not parsed headers yet?
1204 PROF_start(HttpStateData_processReplyHeader);
1205 processReplyHeader();
1206 PROF_stop(HttpStateData_processReplyHeader);
1207
1208 if (!continueAfterParsingHeader()) // parsing error or need more data
1209 return; // TODO: send errors to ICAP
1210
585ab260 1211 adaptOrFinalizeReply();
c3169a09
DK
1212 // adaptOrFinalizeReply() may abort or otherwise "close" the entry
1213 if (!entry->isAccepting())
1214 return;
ba82c452 1215 }
1216
1217 // kick more reads if needed and/or process the response body, if any
1218 PROF_start(HttpStateData_processReplyBody);
1219 processReplyBody(); // may call serverComplete()
1220 PROF_stop(HttpStateData_processReplyBody);
1221}
1222
073ba374
AJ
1223/**
1224 \retval true if we can continue with processing the body or doing ICAP.
1225 */
ba82c452 1226bool
1227HttpStateData::continueAfterParsingHeader()
1228{
655daa06
AR
1229 if (flags.handling1xx) {
1230 debugs(11, 5, HERE << "wait for 1xx handling");
1231 Must(!flags.headers_parsed);
1232 return false;
1233 }
1234
073ba374 1235 if (!flags.headers_parsed && !eof) {
ba82c452 1236 debugs(11, 9, HERE << "needs more at " << readBuf->contentSize());
1237 flags.do_next_read = 1;
073ba374
AJ
1238 /** \retval false If we have not finished parsing the headers and may get more data.
1239 * Schedules more reads to retrieve the missing data.
1240 */
ba82c452 1241 maybeReadVirginBody(); // schedules all kinds of reads; TODO: rename
073ba374 1242 return false;
ba82c452 1243 }
1244
073ba374 1245 /** If we are done with parsing, check for errors */
ba82c452 1246
1247 err_type error = ERR_NONE;
1248
1249 if (flags.headers_parsed) { // parsed headers, possibly with errors
1250 // check for header parsing errors
585ab260 1251 if (HttpReply *vrep = virginReply()) {
1252 const http_status s = vrep->sline.status;
1253 const HttpVersion &v = vrep->sline.version;
ba82c452 1254 if (s == HTTP_INVALID_HEADER && v != HttpVersion(0,9)) {
9121eba6 1255 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Bad header encountered from " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
ba82c452 1256 error = ERR_INVALID_RESP;
e1381638
AJ
1257 } else if (s == HTTP_HEADER_TOO_LARGE) {
1258 fwd->dontRetry(true);
1259 error = ERR_TOO_BIG;
1260 } else {
1261 return true; // done parsing, got reply, and no error
1262 }
ba82c452 1263 } else {
1264 // parsed headers but got no reply
9121eba6 1265 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: No reply at all for " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
ba82c452 1266 error = ERR_INVALID_RESP;
62e76326 1267 }
090089c4 1268 } else {
ba82c452 1269 assert(eof);
9121eba6
AJ
1270 if (readBuf->hasContent()) {
1271 error = ERR_INVALID_RESP;
1272 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Headers did not parse at all for " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1273 } else {
1274 error = ERR_ZERO_SIZE_OBJECT;
94a1d715
AJ
1275 debugs(11, (orig_request->flags.accelerated?DBG_IMPORTANT:2), "WARNING: HTTP: Invalid Response: No object data received for " <<
1276 entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
9121eba6 1277 }
2afaba07 1278 }
ba82c452 1279
1280 assert(error != ERR_NONE);
1281 entry->reset();
1282 fwd->fail(errorCon(error, HTTP_BAD_GATEWAY, fwd->request));
1283 flags.do_next_read = 0;
1284 comm_close(fd);
1285 return false; // quit on error
2afaba07 1286}
1287
821beb5e
AR
1288/** truncate what we read if we read too much so that writeReplyBody()
1289 writes no more than what we should have read */
1290void
1291HttpStateData::truncateVirginBody()
1292{
1293 assert(flags.headers_parsed);
1294
1295 HttpReply *vrep = virginReply();
1296 int64_t clen = -1;
1297 if (!vrep->expectingBody(request->method, clen) || clen < 0)
1298 return; // no body or a body of unknown size, including chunked
1299
1300 const int64_t body_bytes_read = reply_bytes_read - header_bytes_read;
e1381638 1301 if (body_bytes_read - body_bytes_truncated <= clen)
821beb5e
AR
1302 return; // we did not read too much or already took care of the extras
1303
1304 if (const int64_t extras = body_bytes_read - body_bytes_truncated - clen) {
1305 // server sent more that the advertised content length
e1381638
AJ
1306 debugs(11,5, HERE << "body_bytes_read=" << body_bytes_read <<
1307 " clen=" << clen << '/' << vrep->content_length <<
1308 " body_bytes_truncated=" << body_bytes_truncated << '+' << extras);
821beb5e
AR
1309
1310 readBuf->truncate(extras);
1311 body_bytes_truncated += extras;
1312 }
1313}
1314
073ba374 1315/**
2afaba07 1316 * Call this when there is data from the origin server
1317 * which should be sent to either StoreEntry, or to ICAP...
1318 */
1319void
5f8252d2 1320HttpStateData::writeReplyBody()
2afaba07 1321{
821beb5e 1322 truncateVirginBody(); // if needed
5f8252d2 1323 const char *data = readBuf->content();
1324 int len = readBuf->contentSize();
bc81cb2b 1325 addVirginReplyBody(data, len);
5f8252d2 1326 readBuf->consume(len);
af0bb8e5 1327}
fc68f6b1 1328
af0bb8e5 1329bool
1330HttpStateData::decodeAndWriteReplyBody()
1331{
1332 const char *data = NULL;
1333 int len;
e053c141 1334 bool wasThereAnException = false;
af0bb8e5 1335 assert(flags.chunked);
1336 assert(httpChunkDecoder);
1337 SQUID_ENTER_THROWING_CODE();
1338 MemBuf decodedData;
1339 decodedData.init();
e053c141 1340 const bool doneParsing = httpChunkDecoder->parse(readBuf,&decodedData);
af0bb8e5 1341 len = decodedData.contentSize();
1342 data=decodedData.content();
1343 addVirginReplyBody(data, len);
e053c141 1344 if (doneParsing) {
839291ac
AJ
1345 lastChunk = 1;
1346 flags.do_next_read = 0;
af0bb8e5 1347 }
e053c141
FC
1348 SQUID_EXIT_THROWING_CODE(wasThereAnException);
1349 return wasThereAnException;
e6ccf245 1350}
1351
073ba374 1352/**
2afaba07 1353 * processReplyBody has two purposes:
1354 * 1 - take the reply body data, if any, and put it into either
1355 * the StoreEntry, or give it over to ICAP.
1356 * 2 - see if we made it to the end of the response (persistent
1357 * connections and such)
1358 */
e6ccf245 1359void
2afaba07 1360HttpStateData::processReplyBody()
e6ccf245 1361{
dc56a9b1 1362 AsyncCall::Pointer call;
b7ac5457 1363 Ip::Address client_addr;
d67acb4e 1364 bool ispinned = false;
fc68f6b1 1365
1a98175f 1366 if (!flags.headers_parsed) {
f61f0107 1367 flags.do_next_read = 1;
5f8252d2 1368 maybeReadVirginBody();
62e76326 1369 return;
528b2c61 1370 }
62e76326 1371
a83c6ed6 1372#if USE_ADAPTATION
c30ac6ea 1373 debugs(11,5, HERE << "adaptationAccessCheckPending=" << adaptationAccessCheckPending);
a83c6ed6 1374 if (adaptationAccessCheckPending)
2afaba07 1375 return;
fc68f6b1 1376
2afaba07 1377#endif
62e76326 1378
2afaba07 1379 /*
1380 * At this point the reply headers have been parsed and consumed.
1381 * That means header content has been removed from readBuf and
1382 * it contains only body data.
1383 */
9e008dda
AJ
1384 if (flags.chunked) {
1385 if (!decodeAndWriteReplyBody()) {
1386 flags.do_next_read = 0;
1387 serverComplete();
1388 return;
1389 }
1390 } else
1391 writeReplyBody();
528b2c61 1392
e6ccf245 1393 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
62e76326 1394 /*
073ba374 1395 * The above writeReplyBody() call could ABORT this entry,
62e76326 1396 * in that case, the server FD should already be closed.
1397 * there's nothing for us to do.
1398 */
1399 (void) 0;
1400 } else
1401 switch (persistentConnStatus()) {
62e76326 1402 case INCOMPLETE_MSG:
bf8fe701 1403 debugs(11, 5, "processReplyBody: INCOMPLETE_MSG");
21b92762 1404 /* Wait for more data or EOF condition */
21b92762 1405 if (flags.keepalive_broken) {
9e008dda 1406 call = NULL;
dc56a9b1 1407 commSetTimeout(fd, 10, call);
21b92762 1408 } else {
9e008dda 1409 call = NULL;
dc56a9b1 1410 commSetTimeout(fd, Config.Timeout.read, call);
21b92762 1411 }
1412
f61f0107 1413 flags.do_next_read = 1;
62e76326 1414 break;
1415
1416 case COMPLETE_PERSISTENT_MSG:
bf8fe701 1417 debugs(11, 5, "processReplyBody: COMPLETE_PERSISTENT_MSG");
62e76326 1418 /* yes we have to clear all these! */
9e008dda 1419 call = NULL;
dc56a9b1 1420 commSetTimeout(fd, -1, call);
f61f0107 1421 flags.do_next_read = 0;
62e76326 1422
9e008dda 1423 comm_remove_close_handler(fd, closeHandler);
dc56a9b1 1424 closeHandler = NULL;
b6b6f466 1425 fwd->unregister(fd);
fc68f6b1 1426
f165d2fb 1427 if (orig_request->flags.spoof_client_ip)
cc192b50 1428 client_addr = orig_request->client_addr;
fc68f6b1 1429
d67acb4e 1430
9e008dda
AJ
1431 if (request->flags.pinned) {
1432 ispinned = true;
1433 } else if (request->flags.connection_auth && request->flags.auth_sent) {
1434 ispinned = true;
1435 }
1436
1437 if (orig_request->pinnedConnection() && ispinned) {
1438 orig_request->pinnedConnection()->pinConnection(fd, orig_request, _peer,
1439 (request->flags.connection_auth != 0));
bd0723ad 1440 } else {
06093389 1441 fwd->pconnPush(fd, _peer, request, orig_request->GetHost(), client_addr);
bd0723ad 1442 }
1443
62e76326 1444 fd = -1;
2afaba07 1445
5f8252d2 1446 serverComplete();
62e76326 1447 return;
1448
1449 case COMPLETE_NONPERSISTENT_MSG:
bf8fe701 1450 debugs(11, 5, "processReplyBody: COMPLETE_NONPERSISTENT_MSG");
5f8252d2 1451 serverComplete();
62e76326 1452 return;
1453 }
1454
5f8252d2 1455 maybeReadVirginBody();
c4b7a5a9 1456}
1457
1458void
5f8252d2 1459HttpStateData::maybeReadVirginBody()
c4b7a5a9 1460{
52edecde 1461 // we may need to grow the buffer if headers do not fit
1c9605c5 1462 const int minRead = flags.headers_parsed ? 0 :1024;
d5f8d05f 1463 const int read_size = replyBodySpace(*readBuf, minRead);
2afaba07 1464
5f8252d2 1465 debugs(11,9, HERE << (flags.do_next_read ? "may" : "wont") <<
d5f8d05f 1466 " read up to " << read_size << " bytes from FD " << fd);
2afaba07 1467
1468 /*
1469 * why <2? Because delayAwareRead() won't actually read if
1470 * you ask it to read 1 byte. The delayed read request
1471 * just gets re-queued until the client side drains, then
1472 * the I/O thread hangs. Better to not register any read
1473 * handler until we get a notification from someone that
1474 * its okay to read again.
1475 */
d5f8d05f 1476 if (read_size < 2)
52edecde 1477 return;
2afaba07 1478
f61f0107 1479 if (flags.do_next_read) {
dc56a9b1 1480 flags.do_next_read = 0;
1481 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
d5f8d05f 1482 entry->delayAwareRead(fd, readBuf->space(read_size), read_size,
4cb2536f 1483 JobCallback(11, 5, Dialer, this, HttpStateData::readReply));
528b2c61 1484 }
090089c4 1485}
1486
39cb8c41 1487/// called after writing the very last request byte (body, last-chunk, etc)
d576a6a6 1488void
39cb8c41 1489HttpStateData::wroteLast(const CommIoCbParams &io)
090089c4 1490{
39cb8c41 1491 debugs(11, 5, HERE << "FD " << fd << ": size " << io.size << ": errflag " << io.flag << ".");
bc87dc25 1492#if URL_CHECKSUM_DEBUG
62e76326 1493
528b2c61 1494 entry->mem_obj->checkUrlChecksum();
bc87dc25 1495#endif
62e76326 1496
dc56a9b1 1497 if (io.size > 0) {
1498 fd_bytes(fd, io.size, FD_WRITE);
1499 kb_incr(&statCounter.server.all.kbytes_out, io.size);
1500 kb_incr(&statCounter.server.http.kbytes_out, io.size);
ee1679df 1501 }
62e76326 1502
dc56a9b1 1503 if (io.flag == COMM_ERR_CLOSING)
62e76326 1504 return;
1505
dc56a9b1 1506 if (io.flag) {
6cae5db1 1507 ErrorState *err;
dc56a9b1 1508 err = errorCon(ERR_WRITE_ERROR, HTTP_BAD_GATEWAY, fwd->request);
1509 err->xerrno = io.xerrno;
1510 fwd->fail(err);
62e76326 1511 comm_close(fd);
1512 return;
090089c4 1513 }
72b63f06 1514
39cb8c41
AR
1515 sendComplete();
1516}
1517
1518/// successfully wrote the entire request (including body, last-chunk, etc.)
1519void
1520HttpStateData::sendComplete()
1521{
2afaba07 1522 /*
1523 * Set the read timeout here because it hasn't been set yet.
1524 * We only set the read timeout after the request has been
1525 * fully written to the server-side. If we start the timeout
1526 * after connection establishment, then we are likely to hit
1527 * the timeout for POST/PUT requests that have very large
1528 * request bodies.
1529 */
dc56a9b1 1530 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
4299f876 1531 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
4cb2536f 1532 TimeoutDialer, this, HttpStateData::httpTimeout);
2afaba07 1533
dc56a9b1 1534 commSetTimeout(fd, Config.Timeout.read, timeoutCall);
1535
1536 flags.request_sent = 1;
e1381638 1537
3ff65596 1538 orig_request->hier.peer_http_request_sent = current_time;
090089c4 1539}
1540
5f8252d2 1541// Close the HTTP server connection. Used by serverComplete().
2afaba07 1542void
5f8252d2 1543HttpStateData::closeServer()
2afaba07 1544{
5f8252d2 1545 debugs(11,5, HERE << "closing HTTP server FD " << fd << " this " << this);
fc68f6b1 1546
2afaba07 1547 if (fd >= 0) {
b6b6f466 1548 fwd->unregister(fd);
9e008dda 1549 comm_remove_close_handler(fd, closeHandler);
dc56a9b1 1550 closeHandler = NULL;
2afaba07 1551 comm_close(fd);
1552 fd = -1;
1553 }
5f8252d2 1554}
2afaba07 1555
5f8252d2 1556bool
1557HttpStateData::doneWithServer() const
1558{
1559 return fd < 0;
2afaba07 1560}
1561
ee0b94f4
HN
1562
1563/*
1564 * Fixup authentication request headers for special cases
1565 */
1566static void
1567httpFixupAuthentication(HttpRequest * request, HttpRequest * orig_request, const HttpHeader * hdr_in, HttpHeader * hdr_out, http_state_flags flags)
1568{
1569 http_hdr_type header = flags.originpeer ? HDR_AUTHORIZATION : HDR_PROXY_AUTHORIZATION;
1570
1571 /* Nothing to do unless we are forwarding to a peer */
1572 if (!request->flags.proxying)
f54f527e 1573 return;
ee0b94f4
HN
1574
1575 /* Needs to be explicitly enabled */
dcde39a7 1576 if (!orig_request->peer_login)
f54f527e 1577 return;
ee0b94f4
HN
1578
1579 /* Maybe already dealt with? */
1580 if (hdr_out->has(header))
f54f527e 1581 return;
ee0b94f4
HN
1582
1583 /* Nothing to do here for PASSTHRU */
1584 if (strcmp(orig_request->peer_login, "PASSTHRU") == 0)
f54f527e 1585 return;
ee0b94f4
HN
1586
1587 /* PROXYPASS is a special case, single-signon to servers with the proxy password (basic only) */
1588 if (flags.originpeer && strcmp(orig_request->peer_login, "PROXYPASS") == 0 && hdr_in->has(HDR_PROXY_AUTHORIZATION)) {
f54f527e 1589 const char *auth = hdr_in->getStr(HDR_PROXY_AUTHORIZATION);
ee0b94f4 1590
f54f527e
AJ
1591 if (auth && strncasecmp(auth, "basic ", 6) == 0) {
1592 hdr_out->putStr(header, auth);
1593 return;
1594 }
ee0b94f4
HN
1595 }
1596
1597 /* Special mode to pass the username to the upstream cache */
1598 if (*orig_request->peer_login == '*') {
f54f527e
AJ
1599 char loginbuf[256];
1600 const char *username = "-";
ee0b94f4 1601
f54f527e
AJ
1602 if (orig_request->extacl_user.size())
1603 username = orig_request->extacl_user.termedBuf();
2f1431ea 1604#if USE_AUTH
a33a428a 1605 else if (orig_request->auth_user_request != NULL)
f54f527e 1606 username = orig_request->auth_user_request->username();
2f1431ea 1607#endif
ee0b94f4 1608
f54f527e 1609 snprintf(loginbuf, sizeof(loginbuf), "%s%s", username, orig_request->peer_login + 1);
ee0b94f4 1610
f54f527e 1611 httpHeaderPutStrf(hdr_out, header, "Basic %s",
8bdd0cec 1612 old_base64_encode(loginbuf));
f54f527e 1613 return;
ee0b94f4
HN
1614 }
1615
1616 /* external_acl provided credentials */
1617 if (orig_request->extacl_user.size() && orig_request->extacl_passwd.size() &&
f54f527e
AJ
1618 (strcmp(orig_request->peer_login, "PASS") == 0 ||
1619 strcmp(orig_request->peer_login, "PROXYPASS") == 0)) {
1620 char loginbuf[256];
1621 snprintf(loginbuf, sizeof(loginbuf), SQUIDSTRINGPH ":" SQUIDSTRINGPH,
1622 SQUIDSTRINGPRINT(orig_request->extacl_user),
1623 SQUIDSTRINGPRINT(orig_request->extacl_passwd));
1624 httpHeaderPutStrf(hdr_out, header, "Basic %s",
8bdd0cec 1625 old_base64_encode(loginbuf));
f54f527e 1626 return;
ee0b94f4
HN
1627 }
1628
9ca29d23 1629 /* Kerberos login to peer */
2f1431ea 1630#if HAVE_AUTH_MODULE_NEGOTIATE && HAVE_KRB5 && HAVE_GSSAPI
9ca29d23
AJ
1631 if (strncmp(orig_request->peer_login, "NEGOTIATE",strlen("NEGOTIATE")) == 0) {
1632 char *Token=NULL;
1633 char *PrincipalName=NULL,*p;
1634 if ((p=strchr(orig_request->peer_login,':')) != NULL ) {
1635 PrincipalName=++p;
1636 }
1637 Token = peer_proxy_negotiate_auth(PrincipalName,request->peer_host);
1638 if (Token) {
1639 httpHeaderPutStrf(hdr_out, HDR_PROXY_AUTHORIZATION, "Negotiate %s",Token);
1640 }
1641 return;
1642 }
1643#endif /* HAVE_KRB5 && HAVE_GSSAPI */
1644
0606266f 1645 httpHeaderPutStrf(hdr_out, header, "Basic %s",
8bdd0cec 1646 old_base64_encode(orig_request->peer_login));
ee0b94f4
HN
1647 return;
1648}
1649
99edd1c3 1650/*
9e008dda 1651 * build request headers and append them to a given MemBuf
e5ee81f0 1652 * used by buildRequestPrefix()
818c6c9e 1653 * note: initialised the HttpHeader, the caller is responsible for Clean()-ing
99edd1c3 1654 */
e1e72f06 1655void
e5ee81f0 1656HttpStateData::httpBuildRequestHeader(HttpRequest * request,
1657 HttpRequest * orig_request,
1658 StoreEntry * entry,
1659 HttpHeader * hdr_out,
386c7842 1660 const http_state_flags flags)
6bf8443a 1661{
99edd1c3 1662 /* building buffer for complex strings */
5999b776 1663#define BBUF_SZ (MAX_URL+32)
99edd1c3 1664 LOCAL_ARRAY(char, bbuf, BBUF_SZ);
67c06f0d 1665 LOCAL_ARRAY(char, ntoabuf, MAX_IPSTRLEN);
99edd1c3 1666 const HttpHeader *hdr_in = &orig_request->header;
67c06f0d 1667 const HttpHeaderEntry *e = NULL;
99edd1c3 1668 HttpHeaderPos pos = HttpHeaderInitPos;
75faaa7a 1669 assert (hdr_out->owner == hoRequest);
62e76326 1670
262a0e14 1671 /* append our IMS header */
fa3e249f 1672 if (request->lastmod > -1)
a9925b40 1673 hdr_out->putTime(HDR_IF_MODIFIED_SINCE, request->lastmod);
99edd1c3 1674
528b2c61 1675 bool we_do_ranges = decideIfWeDoRanges (orig_request);
1676
30abd221 1677 String strConnection (hdr_in->getList(HDR_CONNECTION));
62e76326 1678
a9925b40 1679 while ((e = hdr_in->getEntry(&pos)))
62e76326 1680 copyOneHeaderFromClientsideRequestToUpstreamRequest(e, strConnection, request, orig_request, hdr_out, we_do_ranges, flags);
528b2c61 1681
43ae1d95 1682 /* Abstraction break: We should interpret multipart/byterange responses
528b2c61 1683 * into offset-length data, and this works around our inability to do so.
1684 */
62e76326 1685 if (!we_do_ranges && orig_request->multipartRangeRequest()) {
1686 /* don't cache the result */
1687 orig_request->flags.cachable = 0;
1688 /* pretend it's not a range request */
00d77d6b 1689 delete orig_request->range;
62e76326 1690 orig_request->range = NULL;
1691 orig_request->flags.range = 0;
1692 }
528b2c61 1693
99edd1c3 1694 /* append Via */
736cb6aa 1695 if (Config.onoff.via) {
30abd221 1696 String strVia;
a9925b40 1697 strVia = hdr_in->getList(HDR_VIA);
62e76326 1698 snprintf(bbuf, BBUF_SZ, "%d.%d %s",
1699 orig_request->http_ver.major,
1700 orig_request->http_ver.minor, ThisCache);
1701 strListAdd(&strVia, bbuf, ',');
d53b3f6d 1702 hdr_out->putStr(HDR_VIA, strVia.termedBuf());
30abd221 1703 strVia.clean();
736cb6aa 1704 }
62e76326 1705
432bc83c 1706 if (orig_request->flags.accelerated) {
43ae1d95 1707 /* Append Surrogate-Capabilities */
45cca89d
AJ
1708 String strSurrogate(hdr_in->getList(HDR_SURROGATE_CAPABILITY));
1709#if USE_SQUID_ESI
1710 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0 ESI/1.0\"", Config.Accel.surrogate_id);
1711#else
1712 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0\"", Config.Accel.surrogate_id);
1713#endif
43ae1d95 1714 strListAdd(&strSurrogate, bbuf, ',');
d53b3f6d 1715 hdr_out->putStr(HDR_SURROGATE_CAPABILITY, strSurrogate.termedBuf());
43ae1d95 1716 }
43ae1d95 1717
67c06f0d 1718 /** \pre Handle X-Forwarded-For */
9e008dda 1719 if (strcmp(opt_forwarded_for, "delete") != 0) {
c4f30223
AR
1720
1721 String strFwd = hdr_in->getList(HDR_X_FORWARDED_FOR);
1722
1723 if (strFwd.size() > 65536/2) {
1724 // There is probably a forwarding loop with Via detection disabled.
1725 // If we do nothing, String will assert on overflow soon.
1726 // TODO: Terminate all transactions with huge XFF?
1727 strFwd = "error";
1728
1729 static int warnedCount = 0;
1730 if (warnedCount++ < 100) {
1731 const char *url = entry ? entry->url() : urlCanonical(orig_request);
1732 debugs(11, 1, "Warning: likely forwarding loop with " << url);
1733 }
1734 }
1735
9e008dda 1736 if (strcmp(opt_forwarded_for, "on") == 0) {
67c06f0d 1737 /** If set to ON - append client IP or 'unknown'. */
9e008dda 1738 if ( orig_request->client_addr.IsNoAddr() )
67c06f0d
AJ
1739 strListAdd(&strFwd, "unknown", ',');
1740 else
1741 strListAdd(&strFwd, orig_request->client_addr.NtoA(ntoabuf, MAX_IPSTRLEN), ',');
9e008dda 1742 } else if (strcmp(opt_forwarded_for, "off") == 0) {
67c06f0d 1743 /** If set to OFF - append 'unknown'. */
67c06f0d 1744 strListAdd(&strFwd, "unknown", ',');
9e008dda 1745 } else if (strcmp(opt_forwarded_for, "transparent") == 0) {
67c06f0d 1746 /** If set to TRANSPARENT - pass through unchanged. */
9e008dda 1747 } else if (strcmp(opt_forwarded_for, "truncate") == 0) {
67c06f0d 1748 /** If set to TRUNCATE - drop existing list and replace with client IP or 'unknown'. */
9e008dda 1749 if ( orig_request->client_addr.IsNoAddr() )
67c06f0d
AJ
1750 strFwd = "unknown";
1751 else
1752 strFwd = orig_request->client_addr.NtoA(ntoabuf, MAX_IPSTRLEN);
1753 }
9e008dda 1754 if (strFwd.size() > 0)
d53b3f6d 1755 hdr_out->putStr(HDR_X_FORWARDED_FOR, strFwd.termedBuf());
cc192b50 1756 }
67c06f0d 1757 /** If set to DELETE - do not copy through. */
6bccf575 1758
99edd1c3 1759 /* append Host if not there already */
a9925b40 1760 if (!hdr_out->has(HDR_HOST)) {
62e76326 1761 if (orig_request->peer_domain) {
a9925b40 1762 hdr_out->putStr(HDR_HOST, orig_request->peer_domain);
62e76326 1763 } else if (orig_request->port == urlDefaultPort(orig_request->protocol)) {
1764 /* use port# only if not default */
cc192b50 1765 hdr_out->putStr(HDR_HOST, orig_request->GetHost());
62e76326 1766 } else {
1767 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
cc192b50 1768 orig_request->GetHost(),
1769 (int) orig_request->port);
62e76326 1770 }
6bf8443a 1771 }
62e76326 1772
c68e9c6b 1773 /* append Authorization if known in URL, not in header and going direct */
a9925b40 1774 if (!hdr_out->has(HDR_AUTHORIZATION)) {
62e76326 1775 if (!request->flags.proxying && *request->login) {
1776 httpHeaderPutStrf(hdr_out, HDR_AUTHORIZATION, "Basic %s",
8bdd0cec 1777 old_base64_encode(request->login));
62e76326 1778 }
c68e9c6b 1779 }
62e76326 1780
ee0b94f4
HN
1781 /* Fixup (Proxy-)Authorization special cases. Plain relaying dealt with above */
1782 httpFixupAuthentication(request, orig_request, hdr_in, hdr_out, flags);
62e76326 1783
ee0b94f4
HN
1784 /* append Cache-Control, add max-age if not there already */
1785 {
a9925b40 1786 HttpHdrCc *cc = hdr_in->getCc();
62e76326 1787
1788 if (!cc)
1789 cc = httpHdrCcCreate();
1790
7dc5c309
AJ
1791#if 0 /* see bug 2330 */
1792 /* Set no-cache if determined needed but not found */
1793 if (orig_request->flags.nocache)
1794 EBIT_SET(cc->mask, CC_NO_CACHE);
1795#endif
1796
af6a12ee
AJ
1797 /* Add max-age only without no-cache */
1798 if (!EBIT_TEST(cc->mask, CC_MAX_AGE) && !EBIT_TEST(cc->mask, CC_NO_CACHE)) {
43ae1d95 1799 const char *url =
3900307b 1800 entry ? entry->url() : urlCanonical(orig_request);
62e76326 1801 httpHdrCcSetMaxAge(cc, getMaxAge(url));
1802
1803 if (request->urlpath.size())
e8466ea9 1804 assert(strstr(url, request->urlpath.termedBuf()));
62e76326 1805 }
1806
ce2d6441 1807 /* Enforce sibling relations */
62e76326 1808 if (flags.only_if_cached)
1809 EBIT_SET(cc->mask, CC_ONLY_IF_CACHED);
1810
a9925b40 1811 hdr_out->putCc(cc);
62e76326 1812
1813 httpHdrCcDestroy(cc);
6bf8443a 1814 }
62e76326 1815
99edd1c3 1816 /* maybe append Connection: keep-alive */
b515fc11 1817 if (flags.keepalive) {
95e78500 1818 hdr_out->putStr(HDR_CONNECTION, "keep-alive");
603a02fd 1819 }
62e76326 1820
a7ad6e4e 1821 /* append Front-End-Https */
1822 if (flags.front_end_https) {
0c3d3f65 1823 if (flags.front_end_https == 1 || request->protocol == AnyP::PROTO_HTTPS)
a9925b40 1824 hdr_out->putStr(HDR_FRONT_END_HTTPS, "On");
a7ad6e4e 1825 }
1826
e31a1e67
AR
1827 if (flags.chunked_request) {
1828 // Do not just copy the original value so that if the client-side
1829 // starts decode other encodings, this code may remain valid.
39cb8c41
AR
1830 hdr_out->putStr(HDR_TRANSFER_ENCODING, "chunked");
1831 }
1832
6bccf575 1833 /* Now mangle the headers. */
4f56514c 1834 if (Config2.onoff.mangle_request_headers)
5967c0bf 1835 httpHdrMangleList(hdr_out, request, ROR_REQUEST);
62e76326 1836
30abd221 1837 strConnection.clean();
99edd1c3 1838}
1839
9e498bfb
AJ
1840/**
1841 * Decides whether a particular header may be cloned from the received Clients request
1842 * to our outgoing fetch request.
1843 */
528b2c61 1844void
9e498bfb 1845copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, HttpRequest * request, const HttpRequest * orig_request, HttpHeader * hdr_out, const int we_do_ranges, const http_state_flags flags)
528b2c61 1846{
e8466ea9 1847 debugs(11, 5, "httpBuildRequestHeader: " << e->name << ": " << e->value );
62e76326 1848
528b2c61 1849 switch (e->id) {
62e76326 1850
af6a12ee 1851 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid should not pass on. */
9e498bfb 1852
be753325 1853 case HDR_PROXY_AUTHORIZATION:
9e498bfb
AJ
1854 /** \par Proxy-Authorization:
1855 * Only pass on proxy authentication to peers for which
62e76326 1856 * authentication forwarding is explicitly enabled
1857 */
ee0b94f4 1858 if (!flags.originpeer && flags.proxying && orig_request->peer_login &&
f54f527e
AJ
1859 (strcmp(orig_request->peer_login, "PASS") == 0 ||
1860 strcmp(orig_request->peer_login, "PROXYPASS") == 0 ||
1861 strcmp(orig_request->peer_login, "PASSTHRU") == 0)) {
eede25e7 1862 hdr_out->addEntry(e->clone());
62e76326 1863 }
62e76326 1864 break;
1865
af6a12ee 1866 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid does not pass on. */
9e498bfb
AJ
1867
1868 case HDR_CONNECTION: /** \par Connection: */
1869 case HDR_TE: /** \par TE: */
1870 case HDR_KEEP_ALIVE: /** \par Keep-Alive: */
1871 case HDR_PROXY_AUTHENTICATE: /** \par Proxy-Authenticate: */
a1651bad 1872 case HDR_TRAILER: /** \par Trailer: */
9e498bfb
AJ
1873 case HDR_UPGRADE: /** \par Upgrade: */
1874 case HDR_TRANSFER_ENCODING: /** \par Transfer-Encoding: */
1875 break;
1876
1877
af6a12ee 1878 /** \par OTHER headers I haven't bothered to track down yet. */
9e498bfb 1879
be753325 1880 case HDR_AUTHORIZATION:
9e498bfb
AJ
1881 /** \par WWW-Authorization:
1882 * Pass on WWW authentication */
62e76326 1883
1884 if (!flags.originpeer) {
eede25e7 1885 hdr_out->addEntry(e->clone());
62e76326 1886 } else {
9e498bfb 1887 /** \note In accelerators, only forward authentication if enabled
ee0b94f4 1888 * (see also httpFixupAuthentication for special cases)
62e76326 1889 */
abb929f0 1890 if (orig_request->peer_login &&
1891 (strcmp(orig_request->peer_login, "PASS") == 0 ||
11e4c5e5 1892 strcmp(orig_request->peer_login, "PASSTHRU") == 0 ||
abb929f0 1893 strcmp(orig_request->peer_login, "PROXYPASS") == 0)) {
eede25e7 1894 hdr_out->addEntry(e->clone());
62e76326 1895 }
1896 }
1897
1898 break;
1899
be753325 1900 case HDR_HOST:
9e498bfb 1901 /** \par Host:
b883b594 1902 * Normally Squid rewrites the Host: header.
1903 * However, there is one case when we don't: If the URL
62e76326 1904 * went through our redirector and the admin configured
1905 * 'redir_rewrites_host' to be off.
1906 */
9e008dda 1907 if (orig_request->peer_domain)
488b27c5
HN
1908 hdr_out->putStr(HDR_HOST, orig_request->peer_domain);
1909 else if (request->flags.redirected && !Config.onoff.redir_rewrites_host)
eede25e7 1910 hdr_out->addEntry(e->clone());
b883b594 1911 else {
1912 /* use port# only if not default */
1913
1914 if (orig_request->port == urlDefaultPort(orig_request->protocol)) {
cc192b50 1915 hdr_out->putStr(HDR_HOST, orig_request->GetHost());
b883b594 1916 } else {
1917 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
cc192b50 1918 orig_request->GetHost(),
1919 (int) orig_request->port);
b883b594 1920 }
1921 }
62e76326 1922
1923 break;
1924
be753325 1925 case HDR_IF_MODIFIED_SINCE:
9e498bfb 1926 /** \par If-Modified-Since:
af6a12ee 1927 * append unless we added our own;
9e498bfb 1928 * \note at most one client's ims header can pass through */
b883b594 1929
a9925b40 1930 if (!hdr_out->has(HDR_IF_MODIFIED_SINCE))
eede25e7 1931 hdr_out->addEntry(e->clone());
62e76326 1932
1933 break;
1934
be753325 1935 case HDR_MAX_FORWARDS:
9e498bfb 1936 /** \par Max-Forwards:
fc90edc3
AJ
1937 * pass only on TRACE or OPTIONS requests */
1938 if (orig_request->method == METHOD_TRACE || orig_request->method == METHOD_OPTIONS) {
1939 const int64_t hops = e->getInt64();
62e76326 1940
1941 if (hops > 0)
fc90edc3 1942 hdr_out->putInt64(HDR_MAX_FORWARDS, hops - 1);
62e76326 1943 }
1944
1945 break;
1946
be753325 1947 case HDR_VIA:
9e498bfb
AJ
1948 /** \par Via:
1949 * If Via is disabled then forward any received header as-is.
1950 * Otherwise leave for explicit updated addition later. */
62e76326 1951
1952 if (!Config.onoff.via)
eede25e7 1953 hdr_out->addEntry(e->clone());
62e76326 1954
1955 break;
1956
be753325 1957 case HDR_RANGE:
62e76326 1958
be753325 1959 case HDR_IF_RANGE:
62e76326 1960
be753325 1961 case HDR_REQUEST_RANGE:
9e498bfb
AJ
1962 /** \par Range:, If-Range:, Request-Range:
1963 * Only pass if we accept ranges */
62e76326 1964 if (!we_do_ranges)
eede25e7 1965 hdr_out->addEntry(e->clone());
62e76326 1966
1967 break;
1968
95e78500
AJ
1969 case HDR_PROXY_CONNECTION: // SHOULD ignore. But doing so breaks things.
1970 break;
62e76326 1971
f228d6f6
AR
1972 case HDR_CONTENT_LENGTH:
1973 // pass through unless we chunk; also, keeping this away from default
1974 // prevents request smuggling via Connection: Content-Length tricks
1975 if (!flags.chunked_request)
1976 hdr_out->addEntry(e->clone());
1977 break;
1978
be753325 1979 case HDR_X_FORWARDED_FOR:
62e76326 1980
be753325 1981 case HDR_CACHE_CONTROL:
95e78500 1982 /** \par X-Forwarded-For:, Cache-Control:
9e498bfb
AJ
1983 * handled specially by Squid, so leave off for now.
1984 * append these after the loop if needed */
62e76326 1985 break;
1986
be753325 1987 case HDR_FRONT_END_HTTPS:
9e498bfb
AJ
1988 /** \par Front-End-Https:
1989 * Pass thru only if peer is configured with front-end-https */
62e76326 1990 if (!flags.front_end_https)
eede25e7 1991 hdr_out->addEntry(e->clone());
62e76326 1992
1993 break;
1994
be753325 1995 default:
9e498bfb
AJ
1996 /** \par default.
1997 * pass on all other header fields
1998 * which are NOT listed by the special Connection: header. */
1999
a7a42b14 2000 if (strConnection.size()>0 && strListIsMember(&strConnection, e->name.termedBuf(), ',')) {
e1ea7456 2001 debugs(11, 2, "'" << e->name << "' header cropped by Connection: definition");
9e498bfb
AJ
2002 return;
2003 }
2004
eede25e7 2005 hdr_out->addEntry(e->clone());
528b2c61 2006 }
2007}
2008
e5ee81f0 2009bool
2010HttpStateData::decideIfWeDoRanges (HttpRequest * orig_request)
528b2c61 2011{
e5ee81f0 2012 bool result = true;
62e76326 2013 /* decide if we want to do Ranges ourselves
2014 * and fetch the whole object now)
2015 * We want to handle Ranges ourselves iff
2016 * - we can actually parse client Range specs
2017 * - the specs are expected to be simple enough (e.g. no out-of-order ranges)
2018 * - reply will be cachable
2019 * (If the reply will be uncachable we have to throw it away after
2020 * serving this request, so it is better to forward ranges to
2021 * the server and fetch only the requested content)
2022 */
2023
11e3fa1c
AJ
2024 int64_t roffLimit = orig_request->getRangeOffsetLimit();
2025
62e76326 2026 if (NULL == orig_request->range || !orig_request->flags.cachable
11e3fa1c 2027 || orig_request->range->offsetLimitExceeded(roffLimit) || orig_request->flags.connection_auth)
e5ee81f0 2028 result = false;
62e76326 2029
9e008dda
AJ
2030 debugs(11, 8, "decideIfWeDoRanges: range specs: " <<
2031 orig_request->range << ", cachable: " <<
2032 orig_request->flags.cachable << "; we_do_ranges: " << result);
62e76326 2033
2034 return result;
528b2c61 2035}
2036
62e76326 2037/* build request prefix and append it to a given MemBuf;
99edd1c3 2038 * return the length of the prefix */
9bc73deb 2039mb_size_t
e053c141
FC
2040HttpStateData::buildRequestPrefix(HttpRequest * aRequest,
2041 HttpRequest * original_request,
2042 StoreEntry * sentry,
386c7842 2043 MemBuf * mb)
99edd1c3 2044{
2045 const int offset = mb->size;
3872be7c 2046 HttpVersion httpver(1,1);
2fe7eff9 2047 mb->Printf("%s %s HTTP/%d.%d\r\n",
e053c141
FC
2048 RequestMethodStr(aRequest->method),
2049 aRequest->urlpath.size() ? aRequest->urlpath.termedBuf() : "/",
2fe7eff9 2050 httpver.major,httpver.minor);
99edd1c3 2051 /* build and pack headers */
2052 {
75faaa7a 2053 HttpHeader hdr(hoRequest);
62e76326 2054 Packer p;
386c7842 2055 httpBuildRequestHeader(aRequest, original_request, sentry, &hdr, flags);
9e008dda 2056
e053c141
FC
2057 if (aRequest->flags.pinned && aRequest->flags.connection_auth)
2058 aRequest->flags.auth_sent = 1;
d67acb4e 2059 else if (hdr.has(HDR_AUTHORIZATION))
e053c141 2060 aRequest->flags.auth_sent = 1;
d67acb4e 2061
62e76326 2062 packerToMemInit(&p, mb);
a9925b40 2063 hdr.packInto(&p);
519e0948 2064 hdr.clean();
62e76326 2065 packerClean(&p);
9d9d144b 2066 }
99edd1c3 2067 /* append header terminator */
2fe7eff9 2068 mb->append(crlf, 2);
99edd1c3 2069 return mb->size - offset;
6bf8443a 2070}
62e76326 2071
090089c4 2072/* This will be called when connect completes. Write request. */
5f8252d2 2073bool
2bb867b5 2074HttpStateData::sendRequest()
090089c4 2075{
99edd1c3 2076 MemBuf mb;
090089c4 2077
bf8fe701 2078 debugs(11, 5, "httpSendRequest: FD " << fd << ", request " << request << ", this " << this << ".");
a0297974
AR
2079
2080 if (!canSend(fd)) {
2081 debugs(11,3, HERE << "cannot send request to closing FD " << fd);
2082 assert(closeHandler != NULL);
2083 return false;
2084 }
2085
dc56a9b1 2086 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
4299f876 2087 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
4cb2536f 2088 TimeoutDialer, this, HttpStateData::httpTimeout);
dc56a9b1 2089 commSetTimeout(fd, Config.Timeout.lifetime, timeoutCall);
2bb867b5 2090 flags.do_next_read = 1;
5f8252d2 2091 maybeReadVirginBody();
2092
2093 if (orig_request->body_pipe != NULL) {
123ec4de 2094 if (!startRequestBodyFlow()) // register to receive body data
5f8252d2 2095 return false;
9e008dda 2096 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
4299f876 2097 requestSender = JobCallback(11,5,
4cb2536f 2098 Dialer, this, HttpStateData::sentRequestBody);
e31a1e67
AR
2099
2100 Must(!flags.chunked_request);
f228d6f6
AR
2101 // use chunked encoding if we do not know the length
2102 if (orig_request->content_length < 0)
e31a1e67 2103 flags.chunked_request = 1;
5f8252d2 2104 } else {
2105 assert(!requestBodySource);
9e008dda 2106 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
4299f876 2107 requestSender = JobCallback(11,5,
39cb8c41 2108 Dialer, this, HttpStateData::wroteLast);
5f8252d2 2109 }
54220df8 2110
2bb867b5 2111 if (_peer != NULL) {
2112 if (_peer->options.originserver) {
2113 flags.proxying = 0;
2114 flags.originpeer = 1;
62e76326 2115 } else {
2bb867b5 2116 flags.proxying = 1;
2117 flags.originpeer = 0;
62e76326 2118 }
be753325 2119 } else {
2bb867b5 2120 flags.proxying = 0;
2121 flags.originpeer = 0;
be753325 2122 }
62e76326 2123
efb9218c 2124 /*
99edd1c3 2125 * Is keep-alive okay for all request methods?
efb9218c 2126 */
d67acb4e 2127 if (orig_request->flags.must_keepalive)
9e008dda 2128 flags.keepalive = 1;
d67acb4e 2129 else if (!Config.onoff.server_pconns)
2bb867b5 2130 flags.keepalive = 0;
2131 else if (_peer == NULL)
2132 flags.keepalive = 1;
2133 else if (_peer->stats.n_keepalives_sent < 10)
2134 flags.keepalive = 1;
2135 else if ((double) _peer->stats.n_keepalives_recv /
2136 (double) _peer->stats.n_keepalives_sent > 0.50)
2137 flags.keepalive = 1;
2138
2139 if (_peer) {
2140 if (neighborType(_peer, request) == PEER_SIBLING &&
2141 !_peer->options.allow_miss)
2142 flags.only_if_cached = 1;
2143
2144 flags.front_end_https = _peer->front_end_https;
a7ad6e4e 2145 }
62e76326 2146
2fe7eff9 2147 mb.init();
9ca29d23 2148 request->peer_host=_peer?_peer->host:NULL;
386c7842 2149 buildRequestPrefix(request, orig_request, entry, &mb);
bf8fe701 2150 debugs(11, 6, "httpSendRequest: FD " << fd << ":\n" << mb.buf);
ec41b64c 2151 Comm::Write(fd, &mb, requestSender);
5f8252d2 2152
2153 return true;
090089c4 2154}
b6a2f15e 2155
39cb8c41
AR
2156bool
2157HttpStateData::getMoreRequestBody(MemBuf &buf)
2158{
2159 // parent's implementation can handle the no-encoding case
e31a1e67 2160 if (!flags.chunked_request)
39cb8c41
AR
2161 return ServerStateData::getMoreRequestBody(buf);
2162
2163 MemBuf raw;
2164
2165 Must(requestBodySource != NULL);
2166 if (!requestBodySource->getMoreData(raw))
2167 return false; // no request body bytes to chunk yet
2168
2169 // optimization: pre-allocate buffer size that should be enough
2170 const mb_size_t rawDataSize = raw.contentSize();
2171 // we may need to send: hex-chunk-size CRLF raw-data CRLF last-chunk
2172 buf.init(16 + 2 + rawDataSize + 2 + 5, raw.max_capacity);
2173
d958d14f 2174 buf.Printf("%x\r\n", static_cast<unsigned int>(rawDataSize));
39cb8c41
AR
2175 buf.append(raw.content(), rawDataSize);
2176 buf.Printf("\r\n");
2177
2178 Must(rawDataSize > 0); // we did not accidently created last-chunk above
2179
2180 // Do not send last-chunk unless we successfully received everything
2181 if (receivedWholeRequestBody) {
2182 Must(!flags.sentLastChunk);
2183 flags.sentLastChunk = true;
de48b288 2184 buf.append("0\r\n\r\n", 5);
39cb8c41
AR
2185 }
2186
2187 return true;
2188}
2189
910169e5 2190void
b6b6f466 2191httpStart(FwdState *fwd)
603a02fd 2192{
60745f24 2193 debugs(11, 3, "httpStart: \"" << RequestMethodStr(fwd->request->method) << " " << fwd->entry->url() << "\"" );
a3d50c30 2194 HttpStateData *httpState = new HttpStateData(fwd);
62e76326 2195
5f8252d2 2196 if (!httpState->sendRequest()) {
bf8fe701 2197 debugs(11, 3, "httpStart: aborted");
5f8252d2 2198 delete httpState;
2199 return;
2200 }
62e76326 2201
5f8252d2 2202 statCounter.server.all.requests++;
83704487 2203 statCounter.server.http.requests++;
62e76326 2204
b6a2f15e 2205 /*
2206 * We used to set the read timeout here, but not any more.
2207 * Now its set in httpSendComplete() after the full request,
2208 * including request body, has been written to the server.
2209 */
090089c4 2210}
2211
39cb8c41
AR
2212/// if broken posts are enabled for the request, try to fix and return true
2213bool
2214HttpStateData::finishingBrokenPost()
2bb867b5 2215{
626096be 2216#if USE_HTTP_VIOLATIONS
39cb8c41
AR
2217 if (!Config.accessList.brokenPosts) {
2218 debugs(11, 5, HERE << "No brokenPosts list");
2219 return false;
2220 }
a0297974 2221
e11513e1 2222 ACLFilledChecklist ch(Config.accessList.brokenPosts, originalRequest(), NULL);
39cb8c41
AR
2223 if (!ch.fastCheck()) {
2224 debugs(11, 5, HERE << "didn't match brokenPosts");
2225 return false;
2226 }
a0297974 2227
39cb8c41
AR
2228 if (!canSend(fd)) {
2229 debugs(11,2, HERE << "ignoring broken POST for closing FD " << fd);
2230 assert(closeHandler != NULL);
2231 return true; // prevent caller from proceeding as if nothing happened
54220df8 2232 }
39cb8c41
AR
2233
2234 debugs(11, 2, "finishingBrokenPost: fixing broken POST");
2235 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2236 requestSender = JobCallback(11,5,
2237 Dialer, this, HttpStateData::wroteLast);
ec41b64c 2238 Comm::Write(fd, "\r\n", 2, requestSender, NULL);
39cb8c41
AR
2239 return true;
2240#else
2241 return false;
626096be 2242#endif /* USE_HTTP_VIOLATIONS */
39cb8c41
AR
2243}
2244
2245/// if needed, write last-chunk to end the request body and return true
2246bool
2247HttpStateData::finishingChunkedRequest()
2248{
2249 if (flags.sentLastChunk) {
2250 debugs(11, 5, HERE << "already sent last-chunk");
2251 return false;
2252 }
2253
2254 Must(receivedWholeRequestBody); // or we should not be sending last-chunk
2255 flags.sentLastChunk = true;
2256
2257 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2258 requestSender = JobCallback(11,5,
2259 Dialer, this, HttpStateData::wroteLast);
ec41b64c 2260 Comm::Write(fd, "0\r\n\r\n", 5, requestSender, NULL);
39cb8c41
AR
2261 return true;
2262}
2263
2264void
2265HttpStateData::doneSendingRequestBody()
2266{
2267 ServerStateData::doneSendingRequestBody();
2268 debugs(11,5, HERE << "doneSendingRequestBody: FD " << fd);
2269
2270 // do we need to write something after the last body byte?
e31a1e67 2271 if (flags.chunked_request && finishingChunkedRequest())
39cb8c41 2272 return;
e31a1e67 2273 if (!flags.chunked_request && finishingBrokenPost())
39cb8c41 2274 return;
aa49962c 2275
39cb8c41 2276 sendComplete();
94439e4e 2277}
2278
5f8252d2 2279// more origin request body data is available
2bb867b5 2280void
5f8252d2 2281HttpStateData::handleMoreRequestBodyAvailable()
2bb867b5 2282{
2bb867b5 2283 if (eof || fd < 0) {
5f8252d2 2284 // XXX: we should check this condition in other callbacks then!
2285 // TODO: Check whether this can actually happen: We should unsubscribe
2286 // as a body consumer when the above condition(s) are detected.
2bb867b5 2287 debugs(11, 1, HERE << "Transaction aborted while reading HTTP body");
2bb867b5 2288 return;
2289 }
62e76326 2290
5f8252d2 2291 assert(requestBodySource != NULL);
fc68f6b1 2292
5f8252d2 2293 if (requestBodySource->buf().hasContent()) {
2294 // XXX: why does not this trigger a debug message on every request?
fc68f6b1 2295
2bb867b5 2296 if (flags.headers_parsed && !flags.abuse_detected) {
2297 flags.abuse_detected = 1;
cc192b50 2298 debugs(11, 1, "http handleMoreRequestBodyAvailable: Likely proxy abuse detected '" << orig_request->client_addr << "' -> '" << entry->url() << "'" );
21b92762 2299
585ab260 2300 if (virginReply()->sline.status == HTTP_INVALID_HEADER) {
2bb867b5 2301 comm_close(fd);
21b92762 2302 return;
2303 }
2304 }
b6a2f15e 2305 }
5f8252d2 2306
2307 HttpStateData::handleMoreRequestBodyAvailable();
376bb137 2308}
2309
5f8252d2 2310// premature end of the request body
2bb867b5 2311void
5f8252d2 2312HttpStateData::handleRequestBodyProducerAborted()
376bb137 2313{
5f8252d2 2314 ServerStateData::handleRequestBodyProducerAborted();
64b66b76
CT
2315 if (entry->isEmpty()) {
2316 debugs(11, 3, "request body aborted: FD " << fd);
2317 ErrorState *err;
8b997339
AR
2318 // We usually get here when ICAP REQMOD aborts during body processing.
2319 // We might also get here if client-side aborts, but then our response
2320 // should not matter because either client-side will provide its own or
2321 // there will be no response at all (e.g., if the the client has left).
2322 err = errorCon(ERR_ICAP_FAILURE, HTTP_INTERNAL_SERVER_ERROR, fwd->request);
2323 err->xerrno = ERR_DETAIL_SRV_REQMOD_REQ_BODY;
64b66b76
CT
2324 fwd->fail(err);
2325 }
2326
39cb8c41 2327 abortTransaction("request body producer aborted");
2bb867b5 2328}
2329
5f8252d2 2330// called when we wrote request headers(!) or a part of the body
2bb867b5 2331void
dc56a9b1 2332HttpStateData::sentRequestBody(const CommIoCbParams &io)
2bb867b5 2333{
dc56a9b1 2334 if (io.size > 0)
2335 kb_incr(&statCounter.server.http.kbytes_out, io.size);
fc68f6b1 2336
dc56a9b1 2337 ServerStateData::sentRequestBody(io);
5f8252d2 2338}
3b299123 2339
5f8252d2 2340// Quickly abort the transaction
2341// TODO: destruction should be sufficient as the destructor should cleanup,
2342// including canceling close handlers
2343void
2344HttpStateData::abortTransaction(const char *reason)
2345{
2346 debugs(11,5, HERE << "aborting transaction for " << reason <<
2347 "; FD " << fd << ", this " << this);
fc68f6b1 2348
3e8c047e 2349 if (fd >= 0) {
62e76326 2350 comm_close(fd);
3e8c047e 2351 return;
c23f0c74 2352 }
3e8c047e 2353
2354 fwd->handleUnregisteredServerEnd();
dc56a9b1 2355 deleteThis("HttpStateData::abortTransaction");
54220df8 2356}
ccf44862 2357
7c4e4e7f 2358HttpRequest *
2359HttpStateData::originalRequest()
2afaba07 2360{
7c4e4e7f 2361 return orig_request;
2afaba07 2362}