src/http.cc

   1
   2 /*
   3  * $Id$
   4  *
   5  * DEBUG: section 11    Hypertext Transfer Protocol (HTTP)
   6  * AUTHOR: Harvest Derived
   7  *
   8  * SQUID Web Proxy Cache          http://www.squid-cache.org/
   9  * ----------------------------------------------------------
  10  *
  11  *  Squid is the result of efforts by numerous individuals from
  12  *  the Internet community; see the CONTRIBUTORS file for full
  13  *  details.   Many organizations have provided support for Squid's
  14  *  development; see the SPONSORS file for full details.  Squid is
  15  *  Copyrighted (C) 2001 by the Regents of the University of
  16  *  California; see the COPYRIGHT file for full details.  Squid
  17  *  incorporates software developed and/or copyrighted by other
  18  *  sources; see the CREDITS file for full details.
  19  *
  20  *  This program is free software; you can redistribute it and/or modify
  21  *  it under the terms of the GNU General Public License as published by
  22  *  the Free Software Foundation; either version 2 of the License, or
  23  *  (at your option) any later version.
  24  *
  25  *  This program is distributed in the hope that it will be useful,
  26  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
  27  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  28  *  GNU General Public License for more details.
  29  *
  30  *  You should have received a copy of the GNU General Public License
  31  *  along with this program; if not, write to the Free Software
  32  *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
  33  *
  34  */
  35
  36 /*
  37  * Anonymizing patch by lutz@as-node.jena.thur.de
   38  * See http-anon.c for more information.
  39  */
  40
  41 #include "squid.h"
  42
  43 #include "acl/FilledChecklist.h"
  44 #if USE_AUTH
  45 #include "auth/UserRequest.h"
  46 #endif
  47 #include "base/AsyncJobCalls.h"
  48 #include "base/TextException.h"
  49 #include "base64.h"
  50 #include "comm/Write.h"
  51 #if USE_DELAY_POOLS
  52 #include "DelayPools.h"
  53 #endif
  54 #include "err_detail_type.h"
  55 #include "errorpage.h"
  56 #include "http.h"
  57 #include "HttpControlMsg.h"
  58 #include "HttpHdrContRange.h"
  59 #include "HttpHdrSc.h"
  60 #include "HttpHdrScTarget.h"
  61 #include "HttpReply.h"
  62 #include "HttpRequest.h"
  63 #include "MemBuf.h"
  64 #include "MemObject.h"
  65 #include "protos.h"
  66 #include "rfc1738.h"
  67 #include "SquidTime.h"
  68 #include "Store.h"
  69
  70
  71 #define SQUID_ENTER_THROWING_CODE() try {
  72 #define SQUID_EXIT_THROWING_CODE(status) \
  73         status = true; \
  74     } \
  75     catch (const std::exception &e) { \
  76         debugs (11, 1, "Exception error:" << e.what()); \
  77         status = false; \
  78     }
  79
   80 CBDATA_CLASS_INIT(HttpStateData); // NOTE(review): presumably emits the cbdata type glue for HttpStateData -- confirm against the macro definition
   81
      /// Carriage-return/line-feed pair as a C string.
   82 static const char *const crlf = "\r\n";
   83
      // Forward declarations of file-local helpers.
      // httpMaybeRemovePublic() is defined further down in this file.
   84 static void httpMaybeRemovePublic(StoreEntry *, http_status);
      // The definition of this helper is not visible in this part of the file.
   85 static void copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, HttpRequest * request, const HttpRequest * orig_request,
   86         HttpHeader * hdr_out, const int we_do_ranges, const http_state_flags);
  87
  88 HttpStateData::HttpStateData(FwdState *theFwdState) : AsyncJob("HttpStateData"), ServerStateData(theFwdState),
  89         lastChunk(0), header_bytes_read(0), reply_bytes_read(0),
  90         body_bytes_truncated(0), httpChunkDecoder(NULL)
  91 {
  92     debugs(11,5,HERE << "HttpStateData " << this << " created");
  93     ignoreCacheControl = false;
  94     surrogateNoStore = false;
  95     fd = fwd->server_fd;
  96     readBuf = new MemBuf;
  97     readBuf->init(16*1024, 256*1024);
  98     orig_request = HTTPMSGLOCK(fwd->request);
  99
 100     // reset peer response time stats for %<pt
 101     orig_request->hier.peer_http_request_sent.tv_sec = 0;
 102     orig_request->hier.peer_http_request_sent.tv_usec = 0;
 103
 104     if (fwd->servers)
 105         _peer = fwd->servers->_peer;         /* might be NULL */
 106
 107     if (_peer) {
 108         const char *url;
 109
 110         if (_peer->options.originserver)
 111             url = orig_request->urlpath.termedBuf();
 112         else
 113             url = entry->url();
 114
 115         HttpRequest * proxy_req = new HttpRequest(orig_request->method,
 116                 orig_request->protocol, url);
 117
 118         proxy_req->SetHost(_peer->host);
 119
 120         proxy_req->port = _peer->http_port;
 121
 122         proxy_req->flags = orig_request->flags;
 123
 124         proxy_req->lastmod = orig_request->lastmod;
 125
 126         proxy_req->flags.proxying = 1;
 127
 128         HTTPMSGUNLOCK(request);
 129
 130         request = HTTPMSGLOCK(proxy_req);
 131
 132         /*
 133          * This NEIGHBOR_PROXY_ONLY check probably shouldn't be here.
 134          * We might end up getting the object from somewhere else if,
 135          * for example, the request to this neighbor fails.
 136          */
 137         if (_peer->options.proxy_only)
 138             entry->releaseRequest();
 139
 140 #if USE_DELAY_POOLS
 141         entry->setNoDelay(_peer->options.no_delay);
 142 #endif
 143     }
 144
 145     /*
 146      * register the handler to free HTTP state data when the FD closes
 147      */
 148     typedef CommCbMemFunT<HttpStateData, CommCloseCbParams> Dialer;
 149     closeHandler = JobCallback(9, 5,
 150                                Dialer, this, HttpStateData::httpStateConnClosed);
 151     comm_add_close_handler(fd, closeHandler);
 152 }
 153
 154 HttpStateData::~HttpStateData()
 155 {
 156     /*
 157      * don't forget that ~ServerStateData() gets called automatically
 158      */
 159
 160     if (!readBuf->isNull())
 161         readBuf->clean();
 162
 163     delete readBuf;
 164
 165     if (httpChunkDecoder)
 166         delete httpChunkDecoder;
 167
 168     HTTPMSGUNLOCK(orig_request);
 169
 170     debugs(11,5, HERE << "HttpStateData " << this << " destroyed; FD " << fd);
 171 }
 172
 173 int
 174 HttpStateData::dataDescriptor() const
 175 {
 176     return fd;
 177 }
 178 /*
 179 static void
 180 httpStateFree(int fd, void *data)
 181 {
 182     HttpStateData *httpState = static_cast<HttpStateData *>(data);
 183     debugs(11, 5, "httpStateFree: FD " << fd << ", httpState=" << data);
 184     delete httpState;
 185 }*/
 186
 187 void
 188 HttpStateData::httpStateConnClosed(const CommCloseCbParams &params)
 189 {
 190     debugs(11, 5, "httpStateFree: FD " << params.fd << ", httpState=" << params.data);
 191     deleteThis("HttpStateData::httpStateConnClosed");
 192 }
 193
 194 int
 195 httpCachable(const HttpRequestMethod& method)
 196 {
 197     /* GET and HEAD are cachable. Others are not. */
 198
 199     // TODO: replase to HttpRequestMethod::isCachable() ?
 200     if (method != METHOD_GET && method != METHOD_HEAD)
 201         return 0;
 202
 203     /* else cachable */
 204     return 1;
 205 }
 206
 207 void
 208 HttpStateData::httpTimeout(const CommTimeoutCbParams &params)
 209 {
 210     debugs(11, 4, "httpTimeout: FD " << fd << ": '" << entry->url() << "'" );
 211
 212     if (entry->store_status == STORE_PENDING) {
 213         fwd->fail(errorCon(ERR_READ_TIMEOUT, HTTP_GATEWAY_TIMEOUT, fwd->request));
 214     }
 215
 216     comm_close(fd);
 217 }
 218
 219 static void
 220 httpMaybeRemovePublic(StoreEntry * e, http_status status)
 221 {
 222     int remove = 0;
 223     int forbidden = 0;
 224     StoreEntry *pe;
 225
 226     if (!EBIT_TEST(e->flags, KEY_PRIVATE))
 227         return;
 228
 229     switch (status) {
 230
 231     case HTTP_OK:
 232
 233     case HTTP_NON_AUTHORITATIVE_INFORMATION:
 234
 235     case HTTP_MULTIPLE_CHOICES:
 236
 237     case HTTP_MOVED_PERMANENTLY:
 238
 239     case HTTP_MOVED_TEMPORARILY:
 240
 241     case HTTP_GONE:
 242
 243     case HTTP_NOT_FOUND:
 244         remove = 1;
 245
 246         break;
 247
 248     case HTTP_FORBIDDEN:
 249
 250     case HTTP_METHOD_NOT_ALLOWED:
 251         forbidden = 1;
 252
 253         break;
 254
 255 #if WORK_IN_PROGRESS
 256
 257     case HTTP_UNAUTHORIZED:
 258         forbidden = 1;
 259
 260         break;
 261
 262 #endif
 263
 264     default:
 265 #if QUESTIONABLE
 266         /*
 267          * Any 2xx response should eject previously cached entities...
 268          */
 269
 270         if (status >= 200 && status < 300)
 271             remove = 1;
 272
 273 #endif
 274
 275         break;
 276     }
 277
 278     if (!remove && !forbidden)
 279         return;
 280
 281     assert(e->mem_obj);
 282
 283     if (e->mem_obj->request)
 284         pe = storeGetPublicByRequest(e->mem_obj->request);
 285     else
 286         pe = storeGetPublic(e->mem_obj->url, e->mem_obj->method);
 287
 288     if (pe != NULL) {
 289         assert(e != pe);
 290 #if USE_HTCP
 291         neighborsHtcpClear(e, NULL, e->mem_obj->request, e->mem_obj->method, HTCP_CLR_INVALIDATION);
 292 #endif
 293         pe->release();
 294     }
 295
 296     /** \par
 297      * Also remove any cached HEAD response in case the object has
 298      * changed.
 299      */
 300     if (e->mem_obj->request)
 301         pe = storeGetPublicByRequestMethod(e->mem_obj->request, METHOD_HEAD);
 302     else
 303         pe = storeGetPublic(e->mem_obj->url, METHOD_HEAD);
 304
 305     if (pe != NULL) {
 306         assert(e != pe);
 307 #if USE_HTCP
 308         neighborsHtcpClear(e, NULL, e->mem_obj->request, HttpRequestMethod(METHOD_HEAD), HTCP_CLR_INVALIDATION);
 309 #endif
 310         pe->release();
 311     }
 312 }
 313
 314 void
 315 HttpStateData::processSurrogateControl(HttpReply *reply)
 316 {
 317     if (request->flags.accelerated && reply->surrogate_control) {
 318         HttpHdrScTarget *sctusable = httpHdrScGetMergedTarget(reply->surrogate_control, Config.Accel.surrogate_id);
 319
 320         if (sctusable) {
 321             if (EBIT_TEST(sctusable->mask, SC_NO_STORE) ||
 322                     (Config.onoff.surrogate_is_remote
 323                      && EBIT_TEST(sctusable->mask, SC_NO_STORE_REMOTE))) {
 324                 surrogateNoStore = true;
 325                 entry->makePrivate();
 326             }
 327
 328             /* The HttpHeader logic cannot tell if the header it's parsing is a reply to an
 329              * accelerated request or not...
 330              * Still, this is an abstraction breach. - RC
 331              */
 332             if (sctusable->max_age != -1) {
 333                 if (sctusable->max_age < sctusable->max_stale)
 334                     reply->expires = reply->date + sctusable->max_age;
 335                 else
 336                     reply->expires = reply->date + sctusable->max_stale;
 337
 338                 /* And update the timestamps */
 339                 entry->timestampsSet();
 340             }
 341
 342             /* We ignore cache-control directives as per the Surrogate specification */
 343             ignoreCacheControl = true;
 344
 345             httpHdrScTargetDestroy(sctusable);
 346         }
 347     }
 348 }
 349
 350 int
 351 HttpStateData::cacheableReply()
 352 {
 353     HttpReply const *rep = finalReply();
 354     HttpHeader const *hdr = &rep->header;
 355     const int cc_mask = (rep->cache_control) ? rep->cache_control->mask : 0;
 356     const char *v;
 357 #if USE_HTTP_VIOLATIONS
 358
 359     const refresh_t *R = NULL;
 360
 361     /* This strange looking define first looks up the refresh pattern
 362      * and then checks if the specified flag is set. The main purpose
 363      * of this is to simplify the refresh pattern lookup and USE_HTTP_VIOLATIONS
 364      * condition
 365      */
 366 #define REFRESH_OVERRIDE(flag) \
 367     ((R = (R ? R : refreshLimits(entry->mem_obj->url))) , \
 368     (R && R->flags.flag))
 369 #else
 370 #define REFRESH_OVERRIDE(flag) 0
 371 #endif
 372
 373     if (surrogateNoStore)
 374         return 0;
 375
 376     // RFC 2616: do not cache replies to responses with no-store CC directive
 377     if (request && request->cache_control &&
 378             EBIT_TEST(request->cache_control->mask, CC_NO_STORE) &&
 379             !REFRESH_OVERRIDE(ignore_no_store))
 380         return 0;
 381
 382     if (!ignoreCacheControl) {
 383         if (EBIT_TEST(cc_mask, CC_PRIVATE)) {
 384             if (!REFRESH_OVERRIDE(ignore_private))
 385                 return 0;
 386         }
 387
 388         if (EBIT_TEST(cc_mask, CC_NO_CACHE)) {
 389             if (!REFRESH_OVERRIDE(ignore_no_cache))
 390                 return 0;
 391         }
 392
 393         if (EBIT_TEST(cc_mask, CC_NO_STORE)) {
 394             if (!REFRESH_OVERRIDE(ignore_no_store))
 395                 return 0;
 396         }
 397     }
 398
 399     if (request->flags.auth || request->flags.auth_sent) {
 400         /*
 401          * Responses to requests with authorization may be cached
 402          * only if a Cache-Control: public reply header is present.
 403          * RFC 2068, sec 14.9.4
 404          */
 405
 406         if (!EBIT_TEST(cc_mask, CC_PUBLIC)) {
 407             if (!REFRESH_OVERRIDE(ignore_auth))
 408                 return 0;
 409         }
 410     }
 411
 412     /* Pragma: no-cache in _replies_ is not documented in HTTP,
 413      * but servers like "Active Imaging Webcast/2.0" sure do use it */
 414     if (hdr->has(HDR_PRAGMA)) {
 415         String s = hdr->getList(HDR_PRAGMA);
 416         const int no_cache = strListIsMember(&s, "no-cache", ',');
 417         s.clean();
 418
 419         if (no_cache) {
 420             if (!REFRESH_OVERRIDE(ignore_no_cache))
 421                 return 0;
 422         }
 423     }
 424
 425     /*
 426      * The "multipart/x-mixed-replace" content type is used for
 427      * continuous push replies.  These are generally dynamic and
 428      * probably should not be cachable
 429      */
 430     if ((v = hdr->getStr(HDR_CONTENT_TYPE)))
 431         if (!strncasecmp(v, "multipart/x-mixed-replace", 25))
 432             return 0;
 433
 434     switch (rep->sline.status) {
 435         /* Responses that are cacheable */
 436
 437     case HTTP_OK:
 438
 439     case HTTP_NON_AUTHORITATIVE_INFORMATION:
 440
 441     case HTTP_MULTIPLE_CHOICES:
 442
 443     case HTTP_MOVED_PERMANENTLY:
 444
 445     case HTTP_GONE:
 446         /*
 447          * Don't cache objects that need to be refreshed on next request,
 448          * unless we know how to refresh it.
 449          */
 450
 451         if (!refreshIsCachable(entry) && !REFRESH_OVERRIDE(store_stale)) {
 452             debugs(22, 3, "refreshIsCachable() returned non-cacheable..");
 453             return 0;
 454         } else
 455             return 1;
 456
 457         /* NOTREACHED */
 458         break;
 459
 460         /* Responses that only are cacheable if the server says so */
 461
 462     case HTTP_MOVED_TEMPORARILY:
 463     case HTTP_TEMPORARY_REDIRECT:
 464         if (rep->expires > rep->date && rep->date > 0)
 465             return 1;
 466         else
 467             return 0;
 468
 469         /* NOTREACHED */
 470         break;
 471
 472         /* Errors can be negatively cached */
 473
 474     case HTTP_NO_CONTENT:
 475
 476     case HTTP_USE_PROXY:
 477
 478     case HTTP_BAD_REQUEST:
 479
 480     case HTTP_FORBIDDEN:
 481
 482     case HTTP_NOT_FOUND:
 483
 484     case HTTP_METHOD_NOT_ALLOWED:
 485
 486     case HTTP_REQUEST_URI_TOO_LARGE:
 487
 488     case HTTP_INTERNAL_SERVER_ERROR:
 489
 490     case HTTP_NOT_IMPLEMENTED:
 491
 492     case HTTP_BAD_GATEWAY:
 493
 494     case HTTP_SERVICE_UNAVAILABLE:
 495
 496     case HTTP_GATEWAY_TIMEOUT:
 497         return -1;
 498
 499         /* NOTREACHED */
 500         break;
 501
 502         /* Some responses can never be cached */
 503
 504     case HTTP_PARTIAL_CONTENT:  /* Not yet supported */
 505
 506     case HTTP_SEE_OTHER:
 507
 508     case HTTP_NOT_MODIFIED:
 509
 510     case HTTP_UNAUTHORIZED:
 511
 512     case HTTP_PROXY_AUTHENTICATION_REQUIRED:
 513
 514     case HTTP_INVALID_HEADER:   /* Squid header parsing error */
 515
 516     case HTTP_HEADER_TOO_LARGE:
 517
 518     case HTTP_PAYMENT_REQUIRED:
 519     case HTTP_NOT_ACCEPTABLE:
 520     case HTTP_REQUEST_TIMEOUT:
 521     case HTTP_CONFLICT:
 522     case HTTP_LENGTH_REQUIRED:
 523     case HTTP_PRECONDITION_FAILED:
 524     case HTTP_REQUEST_ENTITY_TOO_LARGE:
 525     case HTTP_UNSUPPORTED_MEDIA_TYPE:
 526     case HTTP_UNPROCESSABLE_ENTITY:
 527     case HTTP_LOCKED:
 528     case HTTP_FAILED_DEPENDENCY:
 529     case HTTP_INSUFFICIENT_STORAGE:
 530     case HTTP_REQUESTED_RANGE_NOT_SATISFIABLE:
 531     case HTTP_EXPECTATION_FAILED:
 532
 533         return 0;
 534
 535     default:
 536         /* RFC 2616 section 6.1.1: an unrecognized response MUST NOT be cached. */
 537         debugs (11, 3, HERE << "Unknown HTTP status code " << rep->sline.status << ". Not cacheable.");
 538
 539         return 0;
 540
 541         /* NOTREACHED */
 542         break;
 543     }
 544
 545     /* NOTREACHED */
 546 }
 547
 548 /*
 549  * For Vary, store the relevant request headers as
 550  * virtual headers in the reply
 551  * Returns false if the variance cannot be stored
 552  */
 553 const char *
 554 httpMakeVaryMark(HttpRequest * request, HttpReply const * reply)
 555 {
 556     String vary, hdr;
 557     const char *pos = NULL;
 558     const char *item;
 559     const char *value;
 560     int ilen;
 561     static String vstr;
 562
 563     vstr.clean();
 564     vary = reply->header.getList(HDR_VARY);
 565
 566     while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
 567         char *name = (char *)xmalloc(ilen + 1);
 568         xstrncpy(name, item, ilen + 1);
 569         Tolower(name);
 570
 571         if (strcmp(name, "*") == 0) {
 572             /* Can not handle "Vary: *" withtout ETag support */
 573             safe_free(name);
 574             vstr.clean();
 575             break;
 576         }
 577
 578         strListAdd(&vstr, name, ',');
 579         hdr = request->header.getByName(name);
 580         safe_free(name);
 581         value = hdr.termedBuf();
 582
 583         if (value) {
 584             value = rfc1738_escape_part(value);
 585             vstr.append("=\"", 2);
 586             vstr.append(value);
 587             vstr.append("\"", 1);
 588         }
 589
 590         hdr.clean();
 591     }
 592
 593     vary.clean();
 594 #if X_ACCELERATOR_VARY
 595
 596     pos = NULL;
 597     vary = reply->header.getList(HDR_X_ACCELERATOR_VARY);
 598
 599     while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
 600         char *name = (char *)xmalloc(ilen + 1);
 601         xstrncpy(name, item, ilen + 1);
 602         Tolower(name);
 603         strListAdd(&vstr, name, ',');
 604         hdr = request->header.getByName(name);
 605         safe_free(name);
 606         value = hdr.termedBuf();
 607
 608         if (value) {
 609             value = rfc1738_escape_part(value);
 610             vstr.append("=\"", 2);
 611             vstr.append(value);
 612             vstr.append("\"", 1);
 613         }
 614
 615         hdr.clean();
 616     }
 617
 618     vary.clean();
 619 #endif
 620
 621     debugs(11, 3, "httpMakeVaryMark: " << vstr);
 622     return vstr.termedBuf();
 623 }
 624
 625 void
 626 HttpStateData::keepaliveAccounting(HttpReply *reply)
 627 {
 628     if (flags.keepalive)
 629         if (_peer)
 630             _peer->stats.n_keepalives_sent++;
 631
 632     if (reply->keep_alive) {
 633         if (_peer)
 634             _peer->stats.n_keepalives_recv++;
 635
 636         if (Config.onoff.detect_broken_server_pconns
 637                 && reply->bodySize(request->method) == -1 && !flags.chunked) {
 638             debugs(11, 1, "keepaliveAccounting: Impossible keep-alive header from '" << entry->url() << "'" );
 639             // debugs(11, 2, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------" );
 640             flags.keepalive_broken = 1;
 641         }
 642     }
 643 }
 644
 645 void
 646 HttpStateData::checkDateSkew(HttpReply *reply)
 647 {
 648     if (reply->date > -1 && !_peer) {
 649         int skew = abs((int)(reply->date - squid_curtime));
 650
 651         if (skew > 86400)
 652             debugs(11, 3, "" << request->GetHost() << "'s clock is skewed by " << skew << " seconds!");
 653     }
 654 }
 655
 656 /**
 657  * This creates the error page itself.. its likely
 658  * that the forward ported reply header max size patch
 659  * generates non http conformant error pages - in which
 660  * case the errors where should be 'BAD_GATEWAY' etc
 661  */
 662 void
 663 HttpStateData::processReplyHeader()
 664 {
 665     /** Creates a blank header. If this routine is made incremental, this will not do */
 666
 667     /* NP: all exit points to this function MUST call ctx_exit(ctx) */
 668     Ctx ctx = ctx_enter(entry->mem_obj->url);
 669
 670     debugs(11, 3, "processReplyHeader: key '" << entry->getMD5Text() << "'");
 671
 672     assert(!flags.headers_parsed);
 673
 674     if (!readBuf->hasContent()) {
 675         ctx_exit(ctx);
 676         return;
 677     }
 678
 679     http_status error = HTTP_STATUS_NONE;
 680
 681     HttpReply *newrep = new HttpReply;
 682     const bool parsed = newrep->parse(readBuf, eof, &error);
 683
 684     if (!parsed && readBuf->contentSize() > 5 && strncmp(readBuf->content(), "HTTP/", 5) != 0 && strncmp(readBuf->content(), "ICY", 3) != 0) {
 685         MemBuf *mb;
 686         HttpReply *tmprep = new HttpReply;
 687         tmprep->setHeaders(HTTP_OK, "Gatewaying", NULL, -1, -1, -1);
 688         tmprep->header.putExt("X-Transformed-From", "HTTP/0.9");
 689         mb = tmprep->pack();
 690         newrep->parse(mb, eof, &error);
 691         delete mb;
 692         delete tmprep;
 693     } else {
 694         if (!parsed && error > 0) { // unrecoverable parsing error
 695             debugs(11, 3, "processReplyHeader: Non-HTTP-compliant header: '" <<  readBuf->content() << "'");
 696             flags.headers_parsed = 1;
 697             newrep->sline.version = HttpVersion(1,1);
 698             newrep->sline.status = error;
 699             HttpReply *vrep = setVirginReply(newrep);
 700             entry->replaceHttpReply(vrep);
 701             ctx_exit(ctx);
 702             return;
 703         }
 704
 705         if (!parsed) { // need more data
 706             assert(!error);
 707             assert(!eof);
 708             delete newrep;
 709             ctx_exit(ctx);
 710             return;
 711         }
 712
 713         debugs(11, 9, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------");
 714
 715         header_bytes_read = headersEnd(readBuf->content(), readBuf->contentSize());
 716         readBuf->consume(header_bytes_read);
 717     }
 718
 719     newrep->removeStaleWarnings();
 720
 721     if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->sline.status >= 100 && newrep->sline.status < 200) {
 722         handle1xx(newrep);
 723         ctx_exit(ctx);
 724         return;
 725     }
 726
 727     flags.chunked = 0;
 728     if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->header.chunked()) {
 729         flags.chunked = 1;
 730         httpChunkDecoder = new ChunkedCodingParser;
 731     }
 732
 733     if (!peerSupportsConnectionPinning())
 734         orig_request->flags.connection_auth_disabled = 1;
 735
 736     HttpReply *vrep = setVirginReply(newrep);
 737     flags.headers_parsed = 1;
 738
 739     keepaliveAccounting(vrep);
 740
 741     checkDateSkew(vrep);
 742
 743     processSurrogateControl (vrep);
 744
 745     /** \todo IF the reply is a 1.0 reply, AND it has a Connection: Header
 746      * Parse the header and remove all referenced headers
 747      */
 748
 749     orig_request->hier.peer_reply_status = newrep->sline.status;
 750
 751     ctx_exit(ctx);
 752 }
 753
 754 /// ignore or start forwarding the 1xx response (a.k.a., control message)
 755 void
 756 HttpStateData::handle1xx(HttpReply *reply)
 757 {
 758     HttpMsgPointerT<HttpReply> msg(reply); // will destroy reply if unused
 759
 760     // one 1xx at a time: we must not be called while waiting for previous 1xx
 761     Must(!flags.handling1xx);
 762     flags.handling1xx = true;
 763
 764     if (!orig_request->canHandle1xx()) {
 765         debugs(11, 2, HERE << "ignoring client-unsupported 1xx");
 766         proceedAfter1xx();
 767         return;
 768     }
 769
 770 #if USE_HTTP_VIOLATIONS
 771     // check whether the 1xx response forwarding is allowed by squid.conf
 772     if (Config.accessList.reply) {
 773         ACLFilledChecklist ch(Config.accessList.reply, originalRequest(), NULL);
 774         ch.reply = HTTPMSGLOCK(reply);
 775         if (!ch.fastCheck()) { // TODO: support slow lookups?
 776             debugs(11, 3, HERE << "ignoring denied 1xx");
 777             proceedAfter1xx();
 778             return;
 779         }
 780     }
 781 #endif // USE_HTTP_VIOLATIONS
 782
 783     debugs(11, 2, HERE << "forwarding 1xx to client");
 784
 785     // the Sink will use this to call us back after writing 1xx to the client
 786     typedef NullaryMemFunT<HttpStateData> CbDialer;
 787     const AsyncCall::Pointer cb = JobCallback(11, 3, CbDialer, this,
 788                                   HttpStateData::proceedAfter1xx);
 789     CallJobHere1(11, 4, orig_request->clientConnection, ConnStateData,
 790                  ConnStateData::sendControlMsg, HttpControlMsg(msg, cb));
 791     // If the call is not fired, then the Sink is gone, and HttpStateData
 792     // will terminate due to an aborted store entry or another similar error.
 793     // If we get stuck, it is not handle1xx fault if we could get stuck
 794     // for similar reasons without a 1xx response.
 795 }
 796
 797 /// restores state and resumes processing after 1xx is ignored or forwarded
 798 void
 799 HttpStateData::proceedAfter1xx()
 800 {
 801     Must(flags.handling1xx);
 802
 803     debugs(11, 2, HERE << "consuming " << header_bytes_read <<
 804            " header and " << reply_bytes_read << " body bytes read after 1xx");
 805     header_bytes_read = 0;
 806     reply_bytes_read = 0;
 807
 808     CallJobHere(11, 3, this, HttpStateData, HttpStateData::processReply);
 809 }
 810
 811
 812 /**
 813  * returns true if the peer can support connection pinning
 814 */
 815 bool HttpStateData::peerSupportsConnectionPinning() const
 816 {
 817     const HttpReply *rep = entry->mem_obj->getReply();
 818     const HttpHeader *hdr = &rep->header;
 819     bool rc;
 820     String header;
 821
 822     if (!_peer)
 823         return true;
 824
 825     /*If this peer does not support connection pinning (authenticated
 826       connections) return false
 827      */
 828     if (!_peer->connection_auth)
 829         return false;
 830
 831     /*The peer supports connection pinning and the http reply status
 832       is not unauthorized, so the related connection can be pinned
 833      */
 834     if (rep->sline.status != HTTP_UNAUTHORIZED)
 835         return true;
 836
 837     /*The server respond with HTTP_UNAUTHORIZED and the peer configured
 838       with "connection-auth=on" we know that the peer supports pinned
 839       connections
 840     */
 841     if (_peer->connection_auth == 1)
 842         return true;
 843
 844     /*At this point peer has configured with "connection-auth=auto"
 845       parameter so we need some extra checks to decide if we are going
 846       to allow pinned connections or not
 847     */
 848
 849     /*if the peer configured with originserver just allow connection
 850         pinning (squid 2.6 behaviour)
 851      */
 852     if (_peer->options.originserver)
 853         return true;
 854
 855     /*if the connections it is already pinned it is OK*/
 856     if (request->flags.pinned)
 857         return true;
 858
 859     /*Allow pinned connections only if the Proxy-support header exists in
 860       reply and has in its list the "Session-Based-Authentication"
 861       which means that the peer supports connection pinning.
 862      */
 863     if (!hdr->has(HDR_PROXY_SUPPORT))
 864         return false;
 865
 866     header = hdr->getStrOrList(HDR_PROXY_SUPPORT);
 867     /* XXX This ought to be done in a case-insensitive manner */
 868     rc = (strstr(header.termedBuf(), "Session-Based-Authentication") != NULL);
 869
 870     return rc;
 871 }
 872
 873 // Called when we parsed (and possibly adapted) the headers but
 874 // had not starting storing (a.k.a., sending) the body yet.
 875 void
 876 HttpStateData::haveParsedReplyHeaders()
 877 {
 878     ServerStateData::haveParsedReplyHeaders();
 879
 880     Ctx ctx = ctx_enter(entry->mem_obj->url);
 881     HttpReply *rep = finalReply();
 882
 883     if (rep->sline.status == HTTP_PARTIAL_CONTENT &&
 884             rep->content_range)
 885         currentOffset = rep->content_range->spec.offset;
 886
 887     entry->timestampsSet();
 888
 889     /* Check if object is cacheable or not based on reply code */
 890     debugs(11, 3, "haveParsedReplyHeaders: HTTP CODE: " << rep->sline.status);
 891
 892     if (neighbors_do_private_keys)
 893         httpMaybeRemovePublic(entry, rep->sline.status);
 894
 895     if (rep->header.has(HDR_VARY)
 896 #if X_ACCELERATOR_VARY
 897             || rep->header.has(HDR_X_ACCELERATOR_VARY)
 898 #endif
 899        ) {
 900         const char *vary = httpMakeVaryMark(orig_request, rep);
 901
 902         if (!vary) {
 903             entry->makePrivate();
 904             if (!fwd->reforwardableStatus(rep->sline.status))
 905                 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
 906             goto no_cache;
 907         }
 908
 909         entry->mem_obj->vary_headers = xstrdup(vary);
 910     }
 911
 912     /*
 913      * If its not a reply that we will re-forward, then
 914      * allow the client to get it.
 915      */
 916     if (!fwd->reforwardableStatus(rep->sline.status))
 917         EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
 918
 919     switch (cacheableReply()) {
 920
 921     case 1:
 922         entry->makePublic();
 923         break;
 924
 925     case 0:
 926         entry->makePrivate();
 927         break;
 928
 929     case -1:
 930
 931 #if USE_HTTP_VIOLATIONS
 932         if (Config.negativeTtl > 0)
 933             entry->cacheNegatively();
 934         else
 935 #endif
 936             entry->makePrivate();
 937
 938         break;
 939
 940     default:
 941         assert(0);
 942
 943         break;
 944     }
 945
 946 no_cache:
 947
 948     if (!ignoreCacheControl && rep->cache_control) {
 949         if (EBIT_TEST(rep->cache_control->mask, CC_PROXY_REVALIDATE) ||
 950                 EBIT_TEST(rep->cache_control->mask, CC_MUST_REVALIDATE) ||
 951                 EBIT_TEST(rep->cache_control->mask, CC_S_MAXAGE))
 952             EBIT_SET(entry->flags, ENTRY_REVALIDATE);
 953     }
 954
 955 #if HEADERS_LOG
 956     headersLog(1, 0, request->method, rep);
 957
 958 #endif
 959
 960     ctx_exit(ctx);
 961 }
 962
 963 HttpStateData::ConnectionStatus
 964 HttpStateData::statusIfComplete() const
 965 {
 966     const HttpReply *rep = virginReply();
 967     /** \par
 968      * If the reply wants to close the connection, it takes precedence */
 969
 970     if (httpHeaderHasConnDir(&rep->header, "close"))
 971         return COMPLETE_NONPERSISTENT_MSG;
 972
 973     /** \par
 974      * If we didn't send a keep-alive request header, then this
 975      * can not be a persistent connection.
 976      */
 977     if (!flags.keepalive)
 978         return COMPLETE_NONPERSISTENT_MSG;
 979
 980     /** \par
 981      * If we haven't sent the whole request then this can not be a persistent
 982      * connection.
 983      */
 984     if (!flags.request_sent) {
 985         debugs(11, 2, "statusIfComplete: Request not yet fully sent \"" << RequestMethodStr(orig_request->method) << " " << entry->url() << "\"" );
 986         return COMPLETE_NONPERSISTENT_MSG;
 987     }
 988
 989     /** \par
 990      * What does the reply have to say about keep-alive?
 991      */
 992     /**
 993      \bug XXX BUG?
 994      * If the origin server (HTTP/1.0) does not send a keep-alive
 995      * header, but keeps the connection open anyway, what happens?
 996      * We'll return here and http.c waits for an EOF before changing
 997      * store_status to STORE_OK.   Combine this with ENTRY_FWD_HDR_WAIT
 998      * and an error status code, and we might have to wait until
 999      * the server times out the socket.
1000      */
1001     if (!rep->keep_alive)
1002         return COMPLETE_NONPERSISTENT_MSG;
1003
1004     return COMPLETE_PERSISTENT_MSG;
1005 }
1006
1007 HttpStateData::ConnectionStatus
1008 HttpStateData::persistentConnStatus() const
1009 {
1010     debugs(11, 3, "persistentConnStatus: FD " << fd << " eof=" << eof);
1011     if (eof) // already reached EOF
1012         return COMPLETE_NONPERSISTENT_MSG;
1013
1014     /* If server fd is closing (but we have not been notified yet), stop Comm
1015        I/O to avoid assertions. TODO: Change Comm API to handle callers that
1016        want more I/O after async closing (usually initiated by others). */
1017     // XXX: add canReceive or s/canSend/canTalkToServer/
1018     if (!canSend(fd))
1019         return COMPLETE_NONPERSISTENT_MSG;
1020
1021     /** \par
1022      * In chunked response we do not know the content length but we are absolutely
1023      * sure about the end of response, so we are calling the statusIfComplete to
1024      * decide if we can be persistant
1025      */
1026     if (lastChunk && flags.chunked)
1027         return statusIfComplete();
1028
1029     const HttpReply *vrep = virginReply();
1030     debugs(11, 5, "persistentConnStatus: content_length=" << vrep->content_length);
1031
1032     const int64_t clen = vrep->bodySize(request->method);
1033
1034     debugs(11, 5, "persistentConnStatus: clen=" << clen);
1035
1036     /* If the body size is unknown we must wait for EOF */
1037     if (clen < 0)
1038         return INCOMPLETE_MSG;
1039
1040     /** \par
1041      * If the body size is known, we must wait until we've gotten all of it. */
1042     if (clen > 0) {
1043         // old technique:
1044         // if (entry->mem_obj->endOffset() < vrep->content_length + vrep->hdr_sz)
1045         const int64_t body_bytes_read = reply_bytes_read - header_bytes_read;
1046         debugs(11,5, "persistentConnStatus: body_bytes_read=" <<
1047                body_bytes_read << " content_length=" << vrep->content_length);
1048
1049         if (body_bytes_read < vrep->content_length)
1050             return INCOMPLETE_MSG;
1051
1052         if (body_bytes_truncated > 0) // already read more than needed
1053             return COMPLETE_NONPERSISTENT_MSG; // disable pconns
1054     }
1055
1056     /** \par
1057      * If there is no message body or we got it all, we can be persistent */
1058     return statusIfComplete();
1059 }
1060
1061 /*
1062  * This is the callback after some data has been read from the network
1063  */
1064 /*
1065 void
1066 HttpStateData::ReadReplyWrapper(int fd, char *buf, size_t len, comm_err_t flag, int xerrno, void *data)
1067 {
1068     HttpStateData *httpState = static_cast<HttpStateData *>(data);
1069     assert (fd == httpState->fd);
1070     // assert(buf == readBuf->content());
1071     PROF_start(HttpStateData_readReply);
1072     httpState->readReply(len, flag, xerrno);
1073     PROF_stop(HttpStateData_readReply);
1074 }
1075 */
1076
1077 /* XXX this function is too long! */
1078 void
1079 HttpStateData::readReply(const CommIoCbParams &io)
1080 {
1081     int bin;
1082     int clen;
1083     int len = io.size;
1084
1085     assert(fd == io.fd);
1086
1087     flags.do_next_read = 0;
1088
1089     debugs(11, 5, "httpReadReply: FD " << fd << ": len " << len << ".");
1090
1091     // Bail out early on COMM_ERR_CLOSING - close handlers will tidy up for us
1092     if (io.flag == COMM_ERR_CLOSING) {
1093         debugs(11, 3, "http socket closing");
1094         return;
1095     }
1096
1097     if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1098         maybeReadVirginBody();
1099         return;
1100     }
1101
1102     // handle I/O errors
1103     if (io.flag != COMM_OK || len < 0) {
1104         debugs(11, 2, "httpReadReply: FD " << fd << ": read failure: " << xstrerror() << ".");
1105
1106         if (ignoreErrno(io.xerrno)) {
1107             flags.do_next_read = 1;
1108         } else {
1109             ErrorState *err;
1110             err = errorCon(ERR_READ_ERROR, HTTP_BAD_GATEWAY, fwd->request);
1111             err->xerrno = io.xerrno;
1112             fwd->fail(err);
1113             flags.do_next_read = 0;
1114             comm_close(fd);
1115         }
1116
1117         return;
1118     }
1119
1120     // update I/O stats
1121     if (len > 0) {
1122         readBuf->appended(len);
1123         reply_bytes_read += len;
1124 #if USE_DELAY_POOLS
1125         DelayId delayId = entry->mem_obj->mostBytesAllowed();
1126         delayId.bytesIn(len);
1127 #endif
1128
1129         kb_incr(&statCounter.server.all.kbytes_in, len);
1130         kb_incr(&statCounter.server.http.kbytes_in, len);
1131         IOStats.Http.reads++;
1132
1133         for (clen = len - 1, bin = 0; clen; bin++)
1134             clen >>= 1;
1135
1136         IOStats.Http.read_hist[bin]++;
1137
1138         // update peer response time stats (%<pt)
1139         const timeval &sent = orig_request->hier.peer_http_request_sent;
1140         orig_request->hier.peer_response_time =
1141             sent.tv_sec ? tvSubMsec(sent, current_time) : -1;
1142     }
1143
1144     /** \par
1145      * Here the RFC says we should ignore whitespace between replies, but we can't as
1146      * doing so breaks HTTP/0.9 replies beginning with witespace, and in addition
1147      * the response splitting countermeasures is extremely likely to trigger on this,
1148      * not allowing connection reuse in the first place.
1149      */
1150 #if DONT_DO_THIS
1151     if (!flags.headers_parsed && len > 0 && fd_table[fd].uses > 1) {
1152         /* Skip whitespace between replies */
1153
1154         while (len > 0 && xisspace(*buf))
1155             memmove(buf, buf + 1, len--);
1156
1157         if (len == 0) {
1158             /* Continue to read... */
1159             /* Timeout NOT increased. This whitespace was from previous reply */
1160             flags.do_next_read = 1;
1161             maybeReadVirginBody();
1162             return;
1163         }
1164     }
1165
1166 #endif
1167
1168     if (len == 0) { // reached EOF?
1169         eof = 1;
1170         flags.do_next_read = 0;
1171
1172         /* Bug 2879: Replies may terminate with \r\n then EOF instead of \r\n\r\n
1173          * Ensure here that we have at minimum two \r\n when EOF is seen.
1174          * TODO: Add eof parameter to headersEnd() and move this hack there.
1175          */
1176         if (readBuf->contentSize() && !flags.headers_parsed) {
1177             /*
1178              * Yes Henrik, there is a point to doing this.  When we
1179              * called httpProcessReplyHeader() before, we didn't find
1180              * the end of headers, but now we are definately at EOF, so
1181              * we want to process the reply headers.
1182              */
1183             /* Fake an "end-of-headers" to work around such broken servers */
1184             readBuf->append("\r\n", 2);
1185         }
1186     }
1187
1188     processReply();
1189 }
1190
1191 /// processes the already read and buffered response data, possibly after
1192 /// waiting for asynchronous 1xx control message processing
1193 void
1194 HttpStateData::processReply()
1195 {
1196
1197     if (flags.handling1xx) { // we came back after handling a 1xx response
1198         debugs(11, 5, HERE << "done with 1xx handling");
1199         flags.handling1xx = false;
1200         Must(!flags.headers_parsed);
1201     }
1202
1203     if (!flags.headers_parsed) { // have not parsed headers yet?
1204         PROF_start(HttpStateData_processReplyHeader);
1205         processReplyHeader();
1206         PROF_stop(HttpStateData_processReplyHeader);
1207
1208         if (!continueAfterParsingHeader()) // parsing error or need more data
1209             return; // TODO: send errors to ICAP
1210
1211         adaptOrFinalizeReply();
1212     }
1213
1214     // kick more reads if needed and/or process the response body, if any
1215     PROF_start(HttpStateData_processReplyBody);
1216     processReplyBody(); // may call serverComplete()
1217     PROF_stop(HttpStateData_processReplyBody);
1218 }
1219
1220 /**
1221  \retval true    if we can continue with processing the body or doing ICAP.
1222  */
1223 bool
1224 HttpStateData::continueAfterParsingHeader()
1225 {
1226     if (flags.handling1xx) {
1227         debugs(11, 5, HERE << "wait for 1xx handling");
1228         Must(!flags.headers_parsed);
1229         return false;
1230     }
1231
1232     if (!flags.headers_parsed && !eof) {
1233         debugs(11, 9, HERE << "needs more at " << readBuf->contentSize());
1234         flags.do_next_read = 1;
1235         /** \retval false If we have not finished parsing the headers and may get more data.
1236          *                Schedules more reads to retrieve the missing data.
1237          */
1238         maybeReadVirginBody(); // schedules all kinds of reads; TODO: rename
1239         return false;
1240     }
1241
1242     /** If we are done with parsing, check for errors */
1243
1244     err_type error = ERR_NONE;
1245
1246     if (flags.headers_parsed) { // parsed headers, possibly with errors
1247         // check for header parsing errors
1248         if (HttpReply *vrep = virginReply()) {
1249             const http_status s = vrep->sline.status;
1250             const HttpVersion &v = vrep->sline.version;
1251             if (s == HTTP_INVALID_HEADER && v != HttpVersion(0,9)) {
1252                 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Bad header encountered from " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1253                 error = ERR_INVALID_RESP;
1254             } else if (s == HTTP_HEADER_TOO_LARGE) {
1255                 fwd->dontRetry(true);
1256                 error = ERR_TOO_BIG;
1257             } else {
1258                 return true; // done parsing, got reply, and no error
1259             }
1260         } else {
1261             // parsed headers but got no reply
1262             debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: No reply at all for " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1263             error = ERR_INVALID_RESP;
1264         }
1265     } else {
1266         assert(eof);
1267         if (readBuf->hasContent()) {
1268             error = ERR_INVALID_RESP;
1269             debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Headers did not parse at all for " << entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1270         } else {
1271             error = ERR_ZERO_SIZE_OBJECT;
1272             debugs(11, (orig_request->flags.accelerated?DBG_IMPORTANT:2), "WARNING: HTTP: Invalid Response: No object data received for " <<
1273                    entry->url() << " AKA " << orig_request->GetHost() << orig_request->urlpath.termedBuf() );
1274         }
1275     }
1276
1277     assert(error != ERR_NONE);
1278     entry->reset();
1279     fwd->fail(errorCon(error, HTTP_BAD_GATEWAY, fwd->request));
1280     flags.do_next_read = 0;
1281     comm_close(fd);
1282     return false; // quit on error
1283 }
1284
1285 /** truncate what we read if we read too much so that writeReplyBody()
1286     writes no more than what we should have read */
1287 void
1288 HttpStateData::truncateVirginBody()
1289 {
1290     assert(flags.headers_parsed);
1291
1292     HttpReply *vrep = virginReply();
1293     int64_t clen = -1;
1294     if (!vrep->expectingBody(request->method, clen) || clen < 0)
1295         return; // no body or a body of unknown size, including chunked
1296
1297     const int64_t body_bytes_read = reply_bytes_read - header_bytes_read;
1298     if (body_bytes_read - body_bytes_truncated <= clen)
1299         return; // we did not read too much or already took care of the extras
1300
1301     if (const int64_t extras = body_bytes_read - body_bytes_truncated - clen) {
1302         // server sent more that the advertised content length
1303         debugs(11,5, HERE << "body_bytes_read=" << body_bytes_read <<
1304                " clen=" << clen << '/' << vrep->content_length <<
1305                " body_bytes_truncated=" << body_bytes_truncated << '+' << extras);
1306
1307         readBuf->truncate(extras);
1308         body_bytes_truncated += extras;
1309     }
1310 }
1311
1312 /**
1313  * Call this when there is data from the origin server
1314  * which should be sent to either StoreEntry, or to ICAP...
1315  */
1316 void
1317 HttpStateData::writeReplyBody()
1318 {
1319     truncateVirginBody(); // if needed
1320     const char *data = readBuf->content();
1321     int len = readBuf->contentSize();
1322     addVirginReplyBody(data, len);
1323     readBuf->consume(len);
1324 }
1325
1326 bool
1327 HttpStateData::decodeAndWriteReplyBody()
1328 {
1329     const char *data = NULL;
1330     int len;
1331     bool wasThereAnException = false;
1332     assert(flags.chunked);
1333     assert(httpChunkDecoder);
1334     SQUID_ENTER_THROWING_CODE();
1335     MemBuf decodedData;
1336     decodedData.init();
1337     const bool doneParsing = httpChunkDecoder->parse(readBuf,&decodedData);
1338     len = decodedData.contentSize();
1339     data=decodedData.content();
1340     addVirginReplyBody(data, len);
1341     if (doneParsing) {
1342         lastChunk = 1;
1343         flags.do_next_read = 0;
1344     }
1345     SQUID_EXIT_THROWING_CODE(wasThereAnException);
1346     return wasThereAnException;
1347 }
1348
1349 /**
1350  * processReplyBody has two purposes:
1351  *  1 - take the reply body data, if any, and put it into either
1352  *      the StoreEntry, or give it over to ICAP.
1353  *  2 - see if we made it to the end of the response (persistent
1354  *      connections and such)
1355  */
1356 void
1357 HttpStateData::processReplyBody()
1358 {
1359     AsyncCall::Pointer call;
1360     Ip::Address client_addr;
1361     bool ispinned = false;
1362
1363     if (!flags.headers_parsed) {
1364         flags.do_next_read = 1;
1365         maybeReadVirginBody();
1366         return;
1367     }
1368
1369 #if USE_ADAPTATION
1370     debugs(11,5, HERE << "adaptationAccessCheckPending=" << adaptationAccessCheckPending);
1371     if (adaptationAccessCheckPending)
1372         return;
1373
1374 #endif
1375
1376     /*
1377      * At this point the reply headers have been parsed and consumed.
1378      * That means header content has been removed from readBuf and
1379      * it contains only body data.
1380      */
1381     if (flags.chunked) {
1382         if (!decodeAndWriteReplyBody()) {
1383             flags.do_next_read = 0;
1384             serverComplete();
1385             return;
1386         }
1387     } else
1388         writeReplyBody();
1389
1390     if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1391         /*
1392          * The above writeReplyBody() call could ABORT this entry,
1393          * in that case, the server FD should already be closed.
1394          * there's nothing for us to do.
1395          */
1396         (void) 0;
1397     } else
1398         switch (persistentConnStatus()) {
1399         case INCOMPLETE_MSG:
1400             debugs(11, 5, "processReplyBody: INCOMPLETE_MSG");
1401             /* Wait for more data or EOF condition */
1402             if (flags.keepalive_broken) {
1403                 call = NULL;
1404                 commSetTimeout(fd, 10, call);
1405             } else {
1406                 call = NULL;
1407                 commSetTimeout(fd, Config.Timeout.read, call);
1408             }
1409
1410             flags.do_next_read = 1;
1411             break;
1412
1413         case COMPLETE_PERSISTENT_MSG:
1414             debugs(11, 5, "processReplyBody: COMPLETE_PERSISTENT_MSG");
1415             /* yes we have to clear all these! */
1416             call = NULL;
1417             commSetTimeout(fd, -1, call);
1418             flags.do_next_read = 0;
1419
1420             comm_remove_close_handler(fd, closeHandler);
1421             closeHandler = NULL;
1422             fwd->unregister(fd);
1423
1424             if (orig_request->flags.spoof_client_ip)
1425                 client_addr = orig_request->client_addr;
1426
1427
1428             if (request->flags.pinned) {
1429                 ispinned = true;
1430             } else if (request->flags.connection_auth && request->flags.auth_sent) {
1431                 ispinned = true;
1432             }
1433
1434             if (orig_request->pinnedConnection() && ispinned) {
1435                 orig_request->pinnedConnection()->pinConnection(fd, orig_request, _peer,
1436                         (request->flags.connection_auth != 0));
1437             } else {
1438                 fwd->pconnPush(fd, _peer, request, orig_request->GetHost(), client_addr);
1439             }
1440
1441             fd = -1;
1442
1443             serverComplete();
1444             return;
1445
1446         case COMPLETE_NONPERSISTENT_MSG:
1447             debugs(11, 5, "processReplyBody: COMPLETE_NONPERSISTENT_MSG");
1448             serverComplete();
1449             return;
1450         }
1451
1452     maybeReadVirginBody();
1453 }
1454
1455 void
1456 HttpStateData::maybeReadVirginBody()
1457 {
1458     // we may need to grow the buffer if headers do not fit
1459     const int minRead = flags.headers_parsed ? 0 :1024;
1460     const int read_size = replyBodySpace(*readBuf, minRead);
1461
1462     debugs(11,9, HERE << (flags.do_next_read ? "may" : "wont") <<
1463            " read up to " << read_size << " bytes from FD " << fd);
1464
1465     /*
1466      * why <2? Because delayAwareRead() won't actually read if
1467      * you ask it to read 1 byte.  The delayed read request
1468      * just gets re-queued until the client side drains, then
1469      * the I/O thread hangs.  Better to not register any read
1470      * handler until we get a notification from someone that
1471      * its okay to read again.
1472      */
1473     if (read_size < 2)
1474         return;
1475
1476     if (flags.do_next_read) {
1477         flags.do_next_read = 0;
1478         typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
1479         entry->delayAwareRead(fd, readBuf->space(read_size), read_size,
1480                               JobCallback(11, 5, Dialer, this,  HttpStateData::readReply));
1481     }
1482 }
1483
1484 /// called after writing the very last request byte (body, last-chunk, etc)
1485 void
1486 HttpStateData::wroteLast(const CommIoCbParams &io)
1487 {
1488     debugs(11, 5, HERE << "FD " << fd << ": size " << io.size << ": errflag " << io.flag << ".");
1489 #if URL_CHECKSUM_DEBUG
1490
1491     entry->mem_obj->checkUrlChecksum();
1492 #endif
1493
1494     if (io.size > 0) {
1495         fd_bytes(fd, io.size, FD_WRITE);
1496         kb_incr(&statCounter.server.all.kbytes_out, io.size);
1497         kb_incr(&statCounter.server.http.kbytes_out, io.size);
1498     }
1499
1500     if (io.flag == COMM_ERR_CLOSING)
1501         return;
1502
1503     if (io.flag) {
1504         ErrorState *err;
1505         err = errorCon(ERR_WRITE_ERROR, HTTP_BAD_GATEWAY, fwd->request);
1506         err->xerrno = io.xerrno;
1507         fwd->fail(err);
1508         comm_close(fd);
1509         return;
1510     }
1511
1512     sendComplete();
1513 }
1514
1515 /// successfully wrote the entire request (including body, last-chunk, etc.)
1516 void
1517 HttpStateData::sendComplete()
1518 {
1519     /*
1520      * Set the read timeout here because it hasn't been set yet.
1521      * We only set the read timeout after the request has been
1522      * fully written to the server-side.  If we start the timeout
1523      * after connection establishment, then we are likely to hit
1524      * the timeout for POST/PUT requests that have very large
1525      * request bodies.
1526      */
1527     typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
1528     AsyncCall::Pointer timeoutCall =  JobCallback(11, 5,
1529                                       TimeoutDialer, this, HttpStateData::httpTimeout);
1530
1531     commSetTimeout(fd, Config.Timeout.read, timeoutCall);
1532
1533     flags.request_sent = 1;
1534
1535     orig_request->hier.peer_http_request_sent = current_time;
1536 }
1537
1538 // Close the HTTP server connection. Used by serverComplete().
1539 void
1540 HttpStateData::closeServer()
1541 {
1542     debugs(11,5, HERE << "closing HTTP server FD " << fd << " this " << this);
1543
1544     if (fd >= 0) {
1545         fwd->unregister(fd);
1546         comm_remove_close_handler(fd, closeHandler);
1547         closeHandler = NULL;
1548         comm_close(fd);
1549         fd = -1;
1550     }
1551 }
1552
1553 bool
1554 HttpStateData::doneWithServer() const
1555 {
1556     return fd < 0;
1557 }
1558
1559
1560 /*
1561  * Fixup authentication request headers for special cases
1562  */
1563 static void
1564 httpFixupAuthentication(HttpRequest * request, HttpRequest * orig_request, const HttpHeader * hdr_in, HttpHeader * hdr_out, http_state_flags flags)
1565 {
1566     http_hdr_type header = flags.originpeer ? HDR_AUTHORIZATION : HDR_PROXY_AUTHORIZATION;
1567
1568     /* Nothing to do unless we are forwarding to a peer */
1569     if (!request->flags.proxying)
1570         return;
1571
1572     /* Needs to be explicitly enabled */
1573     if (!orig_request->peer_login)
1574         return;
1575
1576     /* Maybe already dealt with? */
1577     if (hdr_out->has(header))
1578         return;
1579
1580     /* Nothing to do here for PASSTHRU */
1581     if (strcmp(orig_request->peer_login, "PASSTHRU") == 0)
1582         return;
1583
1584     /* PROXYPASS is a special case, single-signon to servers with the proxy password (basic only) */
1585     if (flags.originpeer && strcmp(orig_request->peer_login, "PROXYPASS") == 0 && hdr_in->has(HDR_PROXY_AUTHORIZATION)) {
1586         const char *auth = hdr_in->getStr(HDR_PROXY_AUTHORIZATION);
1587
1588         if (auth && strncasecmp(auth, "basic ", 6) == 0) {
1589             hdr_out->putStr(header, auth);
1590             return;
1591         }
1592     }
1593
1594     /* Special mode to pass the username to the upstream cache */
1595     if (*orig_request->peer_login == '*') {
1596         char loginbuf[256];
1597         const char *username = "-";
1598
1599         if (orig_request->extacl_user.size())
1600             username = orig_request->extacl_user.termedBuf();
1601 #if USE_AUTH
1602         else if (orig_request->auth_user_request != NULL)
1603             username = orig_request->auth_user_request->username();
1604 #endif
1605
1606         snprintf(loginbuf, sizeof(loginbuf), "%s%s", username, orig_request->peer_login + 1);
1607
1608         httpHeaderPutStrf(hdr_out, header, "Basic %s",
1609                           old_base64_encode(loginbuf));
1610         return;
1611     }
1612
1613     /* external_acl provided credentials */
1614     if (orig_request->extacl_user.size() && orig_request->extacl_passwd.size() &&
1615             (strcmp(orig_request->peer_login, "PASS") == 0 ||
1616              strcmp(orig_request->peer_login, "PROXYPASS") == 0)) {
1617         char loginbuf[256];
1618         snprintf(loginbuf, sizeof(loginbuf), SQUIDSTRINGPH ":" SQUIDSTRINGPH,
1619                  SQUIDSTRINGPRINT(orig_request->extacl_user),
1620                  SQUIDSTRINGPRINT(orig_request->extacl_passwd));
1621         httpHeaderPutStrf(hdr_out, header, "Basic %s",
1622                           old_base64_encode(loginbuf));
1623         return;
1624     }
1625
1626     /* Kerberos login to peer */
1627 #if HAVE_AUTH_MODULE_NEGOTIATE && HAVE_KRB5 && HAVE_GSSAPI
1628     if (strncmp(orig_request->peer_login, "NEGOTIATE",strlen("NEGOTIATE")) == 0) {
1629         char *Token=NULL;
1630         char *PrincipalName=NULL,*p;
1631         if ((p=strchr(orig_request->peer_login,':')) != NULL ) {
1632             PrincipalName=++p;
1633         }
1634         Token = peer_proxy_negotiate_auth(PrincipalName,request->peer_host);
1635         if (Token) {
1636             httpHeaderPutStrf(hdr_out, HDR_PROXY_AUTHORIZATION, "Negotiate %s",Token);
1637         }
1638         return;
1639     }
1640 #endif /* HAVE_KRB5 && HAVE_GSSAPI */
1641
1642     httpHeaderPutStrf(hdr_out, header, "Basic %s",
1643                       old_base64_encode(orig_request->peer_login));
1644     return;
1645 }
1646
1647 /*
1648  * build request headers and append them to a given MemBuf
1649  * used by buildRequestPrefix()
1650  * note: initialised the HttpHeader, the caller is responsible for Clean()-ing
1651  */
1652 void
1653 HttpStateData::httpBuildRequestHeader(HttpRequest * request,
1654                                       HttpRequest * orig_request,
1655                                       StoreEntry * entry,
1656                                       HttpHeader * hdr_out,
1657                                       const http_state_flags flags)
1658 {
1659     /* building buffer for complex strings */
1660 #define BBUF_SZ (MAX_URL+32)
1661     LOCAL_ARRAY(char, bbuf, BBUF_SZ);
1662     LOCAL_ARRAY(char, ntoabuf, MAX_IPSTRLEN);
1663     const HttpHeader *hdr_in = &orig_request->header;
1664     const HttpHeaderEntry *e = NULL;
1665     HttpHeaderPos pos = HttpHeaderInitPos;
1666     assert (hdr_out->owner == hoRequest);
1667
1668     /* append our IMS header */
1669     if (request->lastmod > -1)
1670         hdr_out->putTime(HDR_IF_MODIFIED_SINCE, request->lastmod);
1671
1672     bool we_do_ranges = decideIfWeDoRanges (orig_request);
1673
1674     String strConnection (hdr_in->getList(HDR_CONNECTION));
1675
1676     while ((e = hdr_in->getEntry(&pos)))
1677         copyOneHeaderFromClientsideRequestToUpstreamRequest(e, strConnection, request, orig_request, hdr_out, we_do_ranges, flags);
1678
1679     /* Abstraction break: We should interpret multipart/byterange responses
1680      * into offset-length data, and this works around our inability to do so.
1681      */
1682     if (!we_do_ranges && orig_request->multipartRangeRequest()) {
1683         /* don't cache the result */
1684         orig_request->flags.cachable = 0;
1685         /* pretend it's not a range request */
1686         delete orig_request->range;
1687         orig_request->range = NULL;
1688         orig_request->flags.range = 0;
1689     }
1690
1691     /* append Via */
1692     if (Config.onoff.via) {
1693         String strVia;
1694         strVia = hdr_in->getList(HDR_VIA);
1695         snprintf(bbuf, BBUF_SZ, "%d.%d %s",
1696                  orig_request->http_ver.major,
1697                  orig_request->http_ver.minor, ThisCache);
1698         strListAdd(&strVia, bbuf, ',');
1699         hdr_out->putStr(HDR_VIA, strVia.termedBuf());
1700         strVia.clean();
1701     }
1702
1703     if (orig_request->flags.accelerated) {
1704         /* Append Surrogate-Capabilities */
1705         String strSurrogate(hdr_in->getList(HDR_SURROGATE_CAPABILITY));
1706 #if USE_SQUID_ESI
1707         snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0 ESI/1.0\"", Config.Accel.surrogate_id);
1708 #else
1709         snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0\"", Config.Accel.surrogate_id);
1710 #endif
1711         strListAdd(&strSurrogate, bbuf, ',');
1712         hdr_out->putStr(HDR_SURROGATE_CAPABILITY, strSurrogate.termedBuf());
1713     }
1714
1715     /** \pre Handle X-Forwarded-For */
1716     if (strcmp(opt_forwarded_for, "delete") != 0) {
1717
1718         String strFwd = hdr_in->getList(HDR_X_FORWARDED_FOR);
1719
1720         if (strFwd.size() > 65536/2) {
1721             // There is probably a forwarding loop with Via detection disabled.
1722             // If we do nothing, String will assert on overflow soon.
1723             // TODO: Terminate all transactions with huge XFF?
1724             strFwd = "error";
1725
1726             static int warnedCount = 0;
1727             if (warnedCount++ < 100) {
1728                 const char *url = entry ? entry->url() : urlCanonical(orig_request);
1729                 debugs(11, 1, "Warning: likely forwarding loop with " << url);
1730             }
1731         }
1732
1733         if (strcmp(opt_forwarded_for, "on") == 0) {
1734             /** If set to ON - append client IP or 'unknown'. */
1735             if ( orig_request->client_addr.IsNoAddr() )
1736                 strListAdd(&strFwd, "unknown", ',');
1737             else
1738                 strListAdd(&strFwd, orig_request->client_addr.NtoA(ntoabuf, MAX_IPSTRLEN), ',');
1739         } else if (strcmp(opt_forwarded_for, "off") == 0) {
1740             /** If set to OFF - append 'unknown'. */
1741             strListAdd(&strFwd, "unknown", ',');
1742         } else if (strcmp(opt_forwarded_for, "transparent") == 0) {
1743             /** If set to TRANSPARENT - pass through unchanged. */
1744         } else if (strcmp(opt_forwarded_for, "truncate") == 0) {
1745             /** If set to TRUNCATE - drop existing list and replace with client IP or 'unknown'. */
1746             if ( orig_request->client_addr.IsNoAddr() )
1747                 strFwd = "unknown";
1748             else
1749                 strFwd = orig_request->client_addr.NtoA(ntoabuf, MAX_IPSTRLEN);
1750         }
1751         if (strFwd.size() > 0)
1752             hdr_out->putStr(HDR_X_FORWARDED_FOR, strFwd.termedBuf());
1753     }
1754     /** If set to DELETE - do not copy through. */
1755
1756     /* append Host if not there already */
1757     if (!hdr_out->has(HDR_HOST)) {
1758         if (orig_request->peer_domain) {
1759             hdr_out->putStr(HDR_HOST, orig_request->peer_domain);
1760         } else if (orig_request->port == urlDefaultPort(orig_request->protocol)) {
1761             /* use port# only if not default */
1762             hdr_out->putStr(HDR_HOST, orig_request->GetHost());
1763         } else {
1764             httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
1765                               orig_request->GetHost(),
1766                               (int) orig_request->port);
1767         }
1768     }
1769
1770     /* append Authorization if known in URL, not in header and going direct */
1771     if (!hdr_out->has(HDR_AUTHORIZATION)) {
1772         if (!request->flags.proxying && *request->login) {
1773             httpHeaderPutStrf(hdr_out, HDR_AUTHORIZATION, "Basic %s",
1774                               old_base64_encode(request->login));
1775         }
1776     }
1777
1778     /* Fixup (Proxy-)Authorization special cases. Plain relaying dealt with above */
1779     httpFixupAuthentication(request, orig_request, hdr_in, hdr_out, flags);
1780
1781     /* append Cache-Control, add max-age if not there already */
1782     {
1783         HttpHdrCc *cc = hdr_in->getCc();
1784
1785         if (!cc)
1786             cc = httpHdrCcCreate();
1787
1788 #if 0 /* see bug 2330 */
1789         /* Set no-cache if determined needed but not found */
1790         if (orig_request->flags.nocache)
1791             EBIT_SET(cc->mask, CC_NO_CACHE);
1792 #endif
1793
1794         /* Add max-age only without no-cache */
1795         if (!EBIT_TEST(cc->mask, CC_MAX_AGE) && !EBIT_TEST(cc->mask, CC_NO_CACHE)) {
1796             const char *url =
1797                 entry ? entry->url() : urlCanonical(orig_request);
1798             httpHdrCcSetMaxAge(cc, getMaxAge(url));
1799
1800             if (request->urlpath.size())
1801                 assert(strstr(url, request->urlpath.termedBuf()));
1802         }
1803
1804         /* Enforce sibling relations */
1805         if (flags.only_if_cached)
1806             EBIT_SET(cc->mask, CC_ONLY_IF_CACHED);
1807
1808         hdr_out->putCc(cc);
1809
1810         httpHdrCcDestroy(cc);
1811     }
1812
1813     /* maybe append Connection: keep-alive */
1814     if (flags.keepalive) {
1815         hdr_out->putStr(HDR_CONNECTION, "keep-alive");
1816     }
1817
1818     /* append Front-End-Https */
1819     if (flags.front_end_https) {
1820         if (flags.front_end_https == 1 || request->protocol == AnyP::PROTO_HTTPS)
1821             hdr_out->putStr(HDR_FRONT_END_HTTPS, "On");
1822     }
1823
1824     if (flags.chunked_request) {
1825         // Do not just copy the original value so that if the client-side
1826         // starts decode other encodings, this code may remain valid.
1827         hdr_out->putStr(HDR_TRANSFER_ENCODING, "chunked");
1828     }
1829
1830     /* Now mangle the headers. */
1831     if (Config2.onoff.mangle_request_headers)
1832         httpHdrMangleList(hdr_out, request, ROR_REQUEST);
1833
1834     strConnection.clean();
1835 }
1836
1837 /**
1838  * Decides whether a particular header may be cloned from the received Clients request
1839  * to our outgoing fetch request.
1840  */
1841 void
1842 copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, HttpRequest * request, const HttpRequest * orig_request, HttpHeader * hdr_out, const int we_do_ranges, const http_state_flags flags)
1843 {
1844     debugs(11, 5, "httpBuildRequestHeader: " << e->name << ": " << e->value );
1845
1846     switch (e->id) {
1847
1848         /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid should not pass on. */
1849
1850     case HDR_PROXY_AUTHORIZATION:
1851         /** \par Proxy-Authorization:
1852          * Only pass on proxy authentication to peers for which
1853          * authentication forwarding is explicitly enabled
1854          */
1855         if (!flags.originpeer && flags.proxying && orig_request->peer_login &&
1856                 (strcmp(orig_request->peer_login, "PASS") == 0 ||
1857                  strcmp(orig_request->peer_login, "PROXYPASS") == 0 ||
1858                  strcmp(orig_request->peer_login, "PASSTHRU") == 0)) {
1859             hdr_out->addEntry(e->clone());
1860         }
1861         break;
1862
1863         /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid does not pass on. */
1864
1865     case HDR_CONNECTION:          /** \par Connection: */
1866     case HDR_TE:                  /** \par TE: */
1867     case HDR_KEEP_ALIVE:          /** \par Keep-Alive: */
1868     case HDR_PROXY_AUTHENTICATE:  /** \par Proxy-Authenticate: */
1869     case HDR_TRAILER:             /** \par Trailer: */
1870     case HDR_UPGRADE:             /** \par Upgrade: */
1871     case HDR_TRANSFER_ENCODING:   /** \par Transfer-Encoding: */
1872         break;
1873
1874
1875         /** \par OTHER headers I haven't bothered to track down yet. */
1876
1877     case HDR_AUTHORIZATION:
1878         /** \par WWW-Authorization:
1879          * Pass on WWW authentication */
1880
1881         if (!flags.originpeer) {
1882             hdr_out->addEntry(e->clone());
1883         } else {
1884             /** \note In accelerators, only forward authentication if enabled
1885              * (see also httpFixupAuthentication for special cases)
1886              */
1887             if (orig_request->peer_login &&
1888                     (strcmp(orig_request->peer_login, "PASS") == 0 ||
1889                      strcmp(orig_request->peer_login, "PASSTHRU") == 0 ||
1890                      strcmp(orig_request->peer_login, "PROXYPASS") == 0)) {
1891                 hdr_out->addEntry(e->clone());
1892             }
1893         }
1894
1895         break;
1896
1897     case HDR_HOST:
1898         /** \par Host:
1899          * Normally Squid rewrites the Host: header.
1900          * However, there is one case when we don't: If the URL
1901          * went through our redirector and the admin configured
1902          * 'redir_rewrites_host' to be off.
1903          */
1904         if (orig_request->peer_domain)
1905             hdr_out->putStr(HDR_HOST, orig_request->peer_domain);
1906         else if (request->flags.redirected && !Config.onoff.redir_rewrites_host)
1907             hdr_out->addEntry(e->clone());
1908         else {
1909             /* use port# only if not default */
1910
1911             if (orig_request->port == urlDefaultPort(orig_request->protocol)) {
1912                 hdr_out->putStr(HDR_HOST, orig_request->GetHost());
1913             } else {
1914                 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
1915                                   orig_request->GetHost(),
1916                                   (int) orig_request->port);
1917             }
1918         }
1919
1920         break;
1921
1922     case HDR_IF_MODIFIED_SINCE:
1923         /** \par If-Modified-Since:
1924         * append unless we added our own;
1925          * \note at most one client's ims header can pass through */
1926
1927         if (!hdr_out->has(HDR_IF_MODIFIED_SINCE))
1928             hdr_out->addEntry(e->clone());
1929
1930         break;
1931
1932     case HDR_MAX_FORWARDS:
1933         /** \par Max-Forwards:
1934          * pass only on TRACE or OPTIONS requests */
1935         if (orig_request->method == METHOD_TRACE || orig_request->method == METHOD_OPTIONS) {
1936             const int64_t hops = e->getInt64();
1937
1938             if (hops > 0)
1939                 hdr_out->putInt64(HDR_MAX_FORWARDS, hops - 1);
1940         }
1941
1942         break;
1943
1944     case HDR_VIA:
1945         /** \par Via:
1946          * If Via is disabled then forward any received header as-is.
1947          * Otherwise leave for explicit updated addition later. */
1948
1949         if (!Config.onoff.via)
1950             hdr_out->addEntry(e->clone());
1951
1952         break;
1953
1954     case HDR_RANGE:
1955
1956     case HDR_IF_RANGE:
1957
1958     case HDR_REQUEST_RANGE:
1959         /** \par Range:, If-Range:, Request-Range:
1960          * Only pass if we accept ranges */
1961         if (!we_do_ranges)
1962             hdr_out->addEntry(e->clone());
1963
1964         break;
1965
1966     case HDR_PROXY_CONNECTION: // SHOULD ignore. But doing so breaks things.
1967         break;
1968
1969     case HDR_CONTENT_LENGTH:
1970         // pass through unless we chunk; also, keeping this away from default
1971         // prevents request smuggling via Connection: Content-Length tricks
1972         if (!flags.chunked_request)
1973             hdr_out->addEntry(e->clone());
1974         break;
1975
1976     case HDR_X_FORWARDED_FOR:
1977
1978     case HDR_CACHE_CONTROL:
1979         /** \par X-Forwarded-For:, Cache-Control:
1980          * handled specially by Squid, so leave off for now.
1981          * append these after the loop if needed */
1982         break;
1983
1984     case HDR_FRONT_END_HTTPS:
1985         /** \par Front-End-Https:
1986          * Pass thru only if peer is configured with front-end-https */
1987         if (!flags.front_end_https)
1988             hdr_out->addEntry(e->clone());
1989
1990         break;
1991
1992     default:
1993         /** \par default.
1994          * pass on all other header fields
1995          * which are NOT listed by the special Connection: header. */
1996
1997         if (strConnection.size()>0 && strListIsMember(&strConnection, e->name.termedBuf(), ',')) {
1998             debugs(11, 2, "'" << e->name << "' header cropped by Connection: definition");
1999             return;
2000         }
2001
2002         hdr_out->addEntry(e->clone());
2003     }
2004 }
2005
2006 bool
2007 HttpStateData::decideIfWeDoRanges (HttpRequest * orig_request)
2008 {
2009     bool result = true;
2010     /* decide if we want to do Ranges ourselves
2011      * and fetch the whole object now)
2012      * We want to handle Ranges ourselves iff
2013      *    - we can actually parse client Range specs
2014      *    - the specs are expected to be simple enough (e.g. no out-of-order ranges)
2015      *    - reply will be cachable
2016      * (If the reply will be uncachable we have to throw it away after
2017      *  serving this request, so it is better to forward ranges to
2018      *  the server and fetch only the requested content)
2019      */
2020
2021     int64_t roffLimit = orig_request->getRangeOffsetLimit();
2022
2023     if (NULL == orig_request->range || !orig_request->flags.cachable
2024             || orig_request->range->offsetLimitExceeded(roffLimit) || orig_request->flags.connection_auth)
2025         result = false;
2026
2027     debugs(11, 8, "decideIfWeDoRanges: range specs: " <<
2028            orig_request->range << ", cachable: " <<
2029            orig_request->flags.cachable << "; we_do_ranges: " << result);
2030
2031     return result;
2032 }
2033
2034 /* build request prefix and append it to a given MemBuf;
2035  * return the length of the prefix */
2036 mb_size_t
2037 HttpStateData::buildRequestPrefix(HttpRequest * aRequest,
2038                                   HttpRequest * original_request,
2039                                   StoreEntry * sentry,
2040                                   MemBuf * mb)
2041 {
2042     const int offset = mb->size;
2043     HttpVersion httpver(1,1);
2044     mb->Printf("%s %s HTTP/%d.%d\r\n",
2045                RequestMethodStr(aRequest->method),
2046                aRequest->urlpath.size() ? aRequest->urlpath.termedBuf() : "/",
2047                httpver.major,httpver.minor);
2048     /* build and pack headers */
2049     {
2050         HttpHeader hdr(hoRequest);
2051         Packer p;
2052         httpBuildRequestHeader(aRequest, original_request, sentry, &hdr, flags);
2053
2054         if (aRequest->flags.pinned && aRequest->flags.connection_auth)
2055             aRequest->flags.auth_sent = 1;
2056         else if (hdr.has(HDR_AUTHORIZATION))
2057             aRequest->flags.auth_sent = 1;
2058
2059         packerToMemInit(&p, mb);
2060         hdr.packInto(&p);
2061         hdr.clean();
2062         packerClean(&p);
2063     }
2064     /* append header terminator */
2065     mb->append(crlf, 2);
2066     return mb->size - offset;
2067 }
2068
2069 /* This will be called when connect completes. Write request. */
2070 bool
2071 HttpStateData::sendRequest()
2072 {
2073     MemBuf mb;
2074
2075     debugs(11, 5, "httpSendRequest: FD " << fd << ", request " << request << ", this " << this << ".");
2076
2077     if (!canSend(fd)) {
2078         debugs(11,3, HERE << "cannot send request to closing FD " << fd);
2079         assert(closeHandler != NULL);
2080         return false;
2081     }
2082
2083     typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
2084     AsyncCall::Pointer timeoutCall =  JobCallback(11, 5,
2085                                       TimeoutDialer, this, HttpStateData::httpTimeout);
2086     commSetTimeout(fd, Config.Timeout.lifetime, timeoutCall);
2087     flags.do_next_read = 1;
2088     maybeReadVirginBody();
2089
2090     if (orig_request->body_pipe != NULL) {
2091         if (!startRequestBodyFlow()) // register to receive body data
2092             return false;
2093         typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2094         requestSender = JobCallback(11,5,
2095                                     Dialer, this, HttpStateData::sentRequestBody);
2096
2097         Must(!flags.chunked_request);
2098         // use chunked encoding if we do not know the length
2099         if (orig_request->content_length < 0)
2100             flags.chunked_request = 1;
2101     } else {
2102         assert(!requestBodySource);
2103         typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2104         requestSender = JobCallback(11,5,
2105                                     Dialer, this,  HttpStateData::wroteLast);
2106     }
2107
2108     if (_peer != NULL) {
2109         if (_peer->options.originserver) {
2110             flags.proxying = 0;
2111             flags.originpeer = 1;
2112         } else {
2113             flags.proxying = 1;
2114             flags.originpeer = 0;
2115         }
2116     } else {
2117         flags.proxying = 0;
2118         flags.originpeer = 0;
2119     }
2120
2121     /*
2122      * Is keep-alive okay for all request methods?
2123      */
2124     if (orig_request->flags.must_keepalive)
2125         flags.keepalive = 1;
2126     else if (!Config.onoff.server_pconns)
2127         flags.keepalive = 0;
2128     else if (_peer == NULL)
2129         flags.keepalive = 1;
2130     else if (_peer->stats.n_keepalives_sent < 10)
2131         flags.keepalive = 1;
2132     else if ((double) _peer->stats.n_keepalives_recv /
2133              (double) _peer->stats.n_keepalives_sent > 0.50)
2134         flags.keepalive = 1;
2135
2136     if (_peer) {
2137         if (neighborType(_peer, request) == PEER_SIBLING &&
2138                 !_peer->options.allow_miss)
2139             flags.only_if_cached = 1;
2140
2141         flags.front_end_https = _peer->front_end_https;
2142     }
2143
2144     mb.init();
2145     request->peer_host=_peer?_peer->host:NULL;
2146     buildRequestPrefix(request, orig_request, entry, &mb);
2147     debugs(11, 6, "httpSendRequest: FD " << fd << ":\n" << mb.buf);
2148     Comm::Write(fd, &mb, requestSender);
2149
2150     return true;
2151 }
2152
2153 bool
2154 HttpStateData::getMoreRequestBody(MemBuf &buf)
2155 {
2156     // parent's implementation can handle the no-encoding case
2157     if (!flags.chunked_request)
2158         return ServerStateData::getMoreRequestBody(buf);
2159
2160     MemBuf raw;
2161
2162     Must(requestBodySource != NULL);
2163     if (!requestBodySource->getMoreData(raw))
2164         return false; // no request body bytes to chunk yet
2165
2166     // optimization: pre-allocate buffer size that should be enough
2167     const mb_size_t rawDataSize = raw.contentSize();
2168     // we may need to send: hex-chunk-size CRLF raw-data CRLF last-chunk
2169     buf.init(16 + 2 + rawDataSize + 2 + 5, raw.max_capacity);
2170
2171     buf.Printf("%x\r\n", static_cast<unsigned int>(rawDataSize));
2172     buf.append(raw.content(), rawDataSize);
2173     buf.Printf("\r\n");
2174
2175     Must(rawDataSize > 0); // we did not accidently created last-chunk above
2176
2177     // Do not send last-chunk unless we successfully received everything
2178     if (receivedWholeRequestBody) {
2179         Must(!flags.sentLastChunk);
2180         flags.sentLastChunk = true;
2181         buf.append("0\r\n\r\n", 5);
2182     }
2183
2184     return true;
2185 }
2186
2187 void
2188 httpStart(FwdState *fwd)
2189 {
2190     debugs(11, 3, "httpStart: \"" << RequestMethodStr(fwd->request->method) << " " << fwd->entry->url() << "\"" );
2191     HttpStateData *httpState = new HttpStateData(fwd);
2192
2193     if (!httpState->sendRequest()) {
2194         debugs(11, 3, "httpStart: aborted");
2195         delete httpState;
2196         return;
2197     }
2198
2199     statCounter.server.all.requests++;
2200     statCounter.server.http.requests++;
2201
2202     /*
2203      * We used to set the read timeout here, but not any more.
2204      * Now its set in httpSendComplete() after the full request,
2205      * including request body, has been written to the server.
2206      */
2207 }
2208
2209 /// if broken posts are enabled for the request, try to fix and return true
2210 bool
2211 HttpStateData::finishingBrokenPost()
2212 {
2213 #if USE_HTTP_VIOLATIONS
2214     if (!Config.accessList.brokenPosts) {
2215         debugs(11, 5, HERE << "No brokenPosts list");
2216         return false;
2217     }
2218
2219     ACLFilledChecklist ch(Config.accessList.brokenPosts, originalRequest(), NULL);
2220     if (!ch.fastCheck()) {
2221         debugs(11, 5, HERE << "didn't match brokenPosts");
2222         return false;
2223     }
2224
2225     if (!canSend(fd)) {
2226         debugs(11,2, HERE << "ignoring broken POST for closing FD " << fd);
2227         assert(closeHandler != NULL);
2228         return true; // prevent caller from proceeding as if nothing happened
2229     }
2230
2231     debugs(11, 2, "finishingBrokenPost: fixing broken POST");
2232     typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2233     requestSender = JobCallback(11,5,
2234                                 Dialer, this, HttpStateData::wroteLast);
2235     Comm::Write(fd, "\r\n", 2, requestSender, NULL);
2236     return true;
2237 #else
2238     return false;
2239 #endif /* USE_HTTP_VIOLATIONS */
2240 }
2241
2242 /// if needed, write last-chunk to end the request body and return true
2243 bool
2244 HttpStateData::finishingChunkedRequest()
2245 {
2246     if (flags.sentLastChunk) {
2247         debugs(11, 5, HERE << "already sent last-chunk");
2248         return false;
2249     }
2250
2251     Must(receivedWholeRequestBody); // or we should not be sending last-chunk
2252     flags.sentLastChunk = true;
2253
2254     typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2255     requestSender = JobCallback(11,5,
2256                                 Dialer, this, HttpStateData::wroteLast);
2257     Comm::Write(fd, "0\r\n\r\n", 5, requestSender, NULL);
2258     return true;
2259 }
2260
2261 void
2262 HttpStateData::doneSendingRequestBody()
2263 {
2264     ServerStateData::doneSendingRequestBody();
2265     debugs(11,5, HERE << "doneSendingRequestBody: FD " << fd);
2266
2267     // do we need to write something after the last body byte?
2268     if (flags.chunked_request && finishingChunkedRequest())
2269         return;
2270     if (!flags.chunked_request && finishingBrokenPost())
2271         return;
2272
2273     sendComplete();
2274 }
2275
2276 // more origin request body data is available
2277 void
2278 HttpStateData::handleMoreRequestBodyAvailable()
2279 {
2280     if (eof || fd < 0) {
2281         // XXX: we should check this condition in other callbacks then!
2282         // TODO: Check whether this can actually happen: We should unsubscribe
2283         // as a body consumer when the above condition(s) are detected.
2284         debugs(11, 1, HERE << "Transaction aborted while reading HTTP body");
2285         return;
2286     }
2287
2288     assert(requestBodySource != NULL);
2289
2290     if (requestBodySource->buf().hasContent()) {
2291         // XXX: why does not this trigger a debug message on every request?
2292
2293         if (flags.headers_parsed && !flags.abuse_detected) {
2294             flags.abuse_detected = 1;
2295             debugs(11, 1, "http handleMoreRequestBodyAvailable: Likely proxy abuse detected '" << orig_request->client_addr << "' -> '" << entry->url() << "'" );
2296
2297             if (virginReply()->sline.status == HTTP_INVALID_HEADER) {
2298                 comm_close(fd);
2299                 return;
2300             }
2301         }
2302     }
2303
2304     HttpStateData::handleMoreRequestBodyAvailable();
2305 }
2306
2307 // premature end of the request body
2308 void
2309 HttpStateData::handleRequestBodyProducerAborted()
2310 {
2311     ServerStateData::handleRequestBodyProducerAborted();
2312     if (entry->isEmpty()) {
2313         debugs(11, 3, "request body aborted: FD " << fd);
2314         ErrorState *err;
2315         // We usually get here when ICAP REQMOD aborts during body processing.
2316         // We might also get here if client-side aborts, but then our response
2317         // should not matter because either client-side will provide its own or
2318         // there will be no response at all (e.g., if the the client has left).
2319         err = errorCon(ERR_ICAP_FAILURE, HTTP_INTERNAL_SERVER_ERROR, fwd->request);
2320         err->xerrno = ERR_DETAIL_SRV_REQMOD_REQ_BODY;
2321         fwd->fail(err);
2322     }
2323
2324     abortTransaction("request body producer aborted");
2325 }
2326
2327 // called when we wrote request headers(!) or a part of the body
2328 void
2329 HttpStateData::sentRequestBody(const CommIoCbParams &io)
2330 {
2331     if (io.size > 0)
2332         kb_incr(&statCounter.server.http.kbytes_out, io.size);
2333
2334     ServerStateData::sentRequestBody(io);
2335 }
2336
2337 // Quickly abort the transaction
2338 // TODO: destruction should be sufficient as the destructor should cleanup,
2339 // including canceling close handlers
2340 void
2341 HttpStateData::abortTransaction(const char *reason)
2342 {
2343     debugs(11,5, HERE << "aborting transaction for " << reason <<
2344            "; FD " << fd << ", this " << this);
2345
2346     if (fd >= 0) {
2347         comm_close(fd);
2348         return;
2349     }
2350
2351     fwd->handleUnregisteredServerEnd();
2352     deleteThis("HttpStateData::abortTransaction");
2353 }
2354
2355 HttpRequest *
2356 HttpStateData::originalRequest()
2357 {
2358     return orig_request;
2359 }