1 /*
2 * Copyright (C) 1996-2015 The Squid Software Foundation and contributors
3 *
4 * Squid software is distributed under GPLv2+ license and includes
5 * contributions from numerous individuals and organizations.
6 * Please see the COPYING and CONTRIBUTORS files for details.
7 */
8
9 /* DEBUG: section 11 Hypertext Transfer Protocol (HTTP) */
10
11 /*
12 * Anonymizing patch by lutz@as-node.jena.thur.de
13 * have a look into http-anon.c to get more information.
14 */
15
16 #include "squid.h"
17 #include "acl/FilledChecklist.h"
18 #include "base/AsyncJobCalls.h"
19 #include "base/TextException.h"
20 #include "base64.h"
21 #include "CachePeer.h"
22 #include "ChunkedCodingParser.h"
23 #include "client_side.h"
24 #include "comm/Connection.h"
25 #include "comm/Read.h"
26 #include "comm/Write.h"
27 #include "CommRead.h"
28 #include "err_detail_type.h"
29 #include "errorpage.h"
30 #include "fd.h"
31 #include "fde.h"
32 #include "globals.h"
33 #include "http.h"
34 #include "http/one/ResponseParser.h"
35 #include "HttpControlMsg.h"
36 #include "HttpHdrCc.h"
37 #include "HttpHdrContRange.h"
38 #include "HttpHdrSc.h"
39 #include "HttpHdrScTarget.h"
40 #include "HttpHeaderTools.h"
41 #include "HttpReply.h"
42 #include "HttpRequest.h"
43 #include "HttpStateFlags.h"
44 #include "log/access_log.h"
45 #include "MemBuf.h"
46 #include "MemObject.h"
47 #include "neighbors.h"
48 #include "peer_proxy_negotiate_auth.h"
49 #include "profiler/Profiler.h"
50 #include "refresh.h"
51 #include "RefreshPattern.h"
52 #include "rfc1738.h"
53 #include "SquidConfig.h"
54 #include "SquidTime.h"
55 #include "StatCounters.h"
56 #include "Store.h"
57 #include "StrList.h"
58 #include "tools.h"
59 #include "URL.h"
60 #include "util.h"
61
62 #if USE_AUTH
63 #include "auth/UserRequest.h"
64 #endif
65 #if USE_DELAY_POOLS
66 #include "DelayPools.h"
67 #endif
68
69 #define SQUID_ENTER_THROWING_CODE() try {
70 #define SQUID_EXIT_THROWING_CODE(status) \
71 status = true; \
72 } \
73 catch (const std::exception &e) { \
74 debugs (11, 1, "Exception error:" << e.what()); \
75 status = false; \
76 }
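/* Illustrative usage sketch (this is how decodeAndWriteReplyBody() below uses the pair):
 *
 *   bool ok = false;
 *   SQUID_ENTER_THROWING_CODE();
 *   ... statements that may throw std::exception ...
 *   SQUID_EXIT_THROWING_CODE(ok);
 *   return ok; // true unless an exception was caught (and logged by the macro)
 */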
77
78 CBDATA_CLASS_INIT(HttpStateData);
79
80 static const char *const crlf = "\r\n";
81
82 static void httpMaybeRemovePublic(StoreEntry *, Http::StatusCode);
83 static void copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, const HttpRequest * request,
84 HttpHeader * hdr_out, const int we_do_ranges, const HttpStateFlags &);
85 //Declared in HttpHeaderTools.cc
86 void httpHdrAdd(HttpHeader *heads, HttpRequest *request, const AccessLogEntryPointer &al, HeaderWithAclList &headers_add);
87
88 HttpStateData::HttpStateData(FwdState *theFwdState) :
89 AsyncJob("HttpStateData"),
90 Client(theFwdState),
91 lastChunk(0),
92 httpChunkDecoder(NULL),
93 payloadSeen(0),
94 payloadTruncated(0)
95 {
96 debugs(11,5,HERE << "HttpStateData " << this << " created");
97 ignoreCacheControl = false;
98 surrogateNoStore = false;
99 serverConnection = fwd->serverConnection();
100
101 // reset peer response time stats for %<pt
102 request->hier.peer_http_request_sent.tv_sec = 0;
103 request->hier.peer_http_request_sent.tv_usec = 0;
104
105 if (fwd->serverConnection() != NULL)
106 _peer = cbdataReference(fwd->serverConnection()->getPeer()); /* might be NULL */
107
108 if (_peer) {
109 request->flags.proxying = true;
110 /*
111 * This NEIGHBOR_PROXY_ONLY check probably shouldn't be here.
112 * We might end up getting the object from somewhere else if,
113 * for example, the request to this neighbor fails.
114 */
115 if (_peer->options.proxy_only)
116 entry->releaseRequest();
117
118 #if USE_DELAY_POOLS
119 entry->setNoDelay(_peer->options.no_delay);
120 #endif
121 }
122
123 /*
124 * register the handler to free HTTP state data when the FD closes
125 */
126 typedef CommCbMemFunT<HttpStateData, CommCloseCbParams> Dialer;
127 closeHandler = JobCallback(9, 5, Dialer, this, HttpStateData::httpStateConnClosed);
128 comm_add_close_handler(serverConnection->fd, closeHandler);
129 }
130
131 HttpStateData::~HttpStateData()
132 {
133 /*
134 * don't forget that ~Client() gets called automatically
135 */
136
137 if (httpChunkDecoder)
138 delete httpChunkDecoder;
139
140 cbdataReferenceDone(_peer);
141
142 debugs(11,5, HERE << "HttpStateData " << this << " destroyed; " << serverConnection);
143 }
144
145 const Comm::ConnectionPointer &
146 HttpStateData::dataConnection() const
147 {
148 return serverConnection;
149 }
150
151 void
152 HttpStateData::httpStateConnClosed(const CommCloseCbParams &params)
153 {
154 debugs(11, 5, "httpStateFree: FD " << params.fd << ", httpState=" << params.data);
155 mustStop("HttpStateData::httpStateConnClosed");
156 }
157
158 void
159 HttpStateData::httpTimeout(const CommTimeoutCbParams &)
160 {
161 debugs(11, 4, serverConnection << ": '" << entry->url() << "'");
162
163 if (entry->store_status == STORE_PENDING) {
164 fwd->fail(new ErrorState(ERR_READ_TIMEOUT, Http::scGatewayTimeout, fwd->request));
165 }
166
167 serverConnection->close();
168 }
169
170 /// Remove an existing public store entry if the incoming response (to be
171 /// stored in a currently private entry) is going to invalidate it.
172 static void
173 httpMaybeRemovePublic(StoreEntry * e, Http::StatusCode status)
174 {
175 int remove = 0;
176 int forbidden = 0;
177 StoreEntry *pe;
178
179 // If the incoming response already goes into a public entry, then there is
180 // nothing to remove. This protects ready-for-collapsing entries as well.
181 if (!EBIT_TEST(e->flags, KEY_PRIVATE))
182 return;
183
184 switch (status) {
185
186 case Http::scOkay:
187
188 case Http::scNonAuthoritativeInformation:
189
190 case Http::scMultipleChoices:
191
192 case Http::scMovedPermanently:
193
194 case Http::scFound:
195
196 case Http::scGone:
197
198 case Http::scNotFound:
199 remove = 1;
200
201 break;
202
203 case Http::scForbidden:
204
205 case Http::scMethodNotAllowed:
206 forbidden = 1;
207
208 break;
209
210 #if WORK_IN_PROGRESS
211
212 case Http::scUnauthorized:
213 forbidden = 1;
214
215 break;
216
217 #endif
218
219 default:
220 #if QUESTIONABLE
221 /*
222 * Any 2xx response should eject previously cached entities...
223 */
224
225 if (status >= 200 && status < 300)
226 remove = 1;
227
228 #endif
229
230 break;
231 }
232
233 if (!remove && !forbidden)
234 return;
235
236 assert(e->mem_obj);
237
238 if (e->mem_obj->request)
239 pe = storeGetPublicByRequest(e->mem_obj->request);
240 else
241 pe = storeGetPublic(e->mem_obj->storeId(), e->mem_obj->method);
242
243 if (pe != NULL) {
244 assert(e != pe);
245 #if USE_HTCP
246 neighborsHtcpClear(e, NULL, e->mem_obj->request, e->mem_obj->method, HTCP_CLR_INVALIDATION);
247 #endif
248 pe->release();
249 }
250
251 /** \par
252 * Also remove any cached HEAD response in case the object has
253 * changed.
254 */
255 if (e->mem_obj->request)
256 pe = storeGetPublicByRequestMethod(e->mem_obj->request, Http::METHOD_HEAD);
257 else
258 pe = storeGetPublic(e->mem_obj->storeId(), Http::METHOD_HEAD);
259
260 if (pe != NULL) {
261 assert(e != pe);
262 #if USE_HTCP
263 neighborsHtcpClear(e, NULL, e->mem_obj->request, HttpRequestMethod(Http::METHOD_HEAD), HTCP_CLR_INVALIDATION);
264 #endif
265 pe->release();
266 }
267 }
268
269 void
270 HttpStateData::processSurrogateControl(HttpReply *reply)
271 {
272 if (request->flags.accelerated && reply->surrogate_control) {
273 HttpHdrScTarget *sctusable = reply->surrogate_control->getMergedTarget(Config.Accel.surrogate_id);
274
275 if (sctusable) {
276 if (sctusable->noStore() ||
277 (Config.onoff.surrogate_is_remote
278 && sctusable->noStoreRemote())) {
279 surrogateNoStore = true;
280 entry->makePrivate();
281 }
282
283 /* The HttpHeader logic cannot tell if the header it's parsing is a reply to an
284 * accelerated request or not...
285 * Still, this is an abstraction breach. - RC
286 */
287 if (sctusable->hasMaxAge()) {
288 if (sctusable->maxAge() < sctusable->maxStale())
289 reply->expires = reply->date + sctusable->maxAge();
290 else
291 reply->expires = reply->date + sctusable->maxStale();
292
293 /* And update the timestamps */
294 entry->timestampsSet();
295 }
296
297 /* We ignore cache-control directives as per the Surrogate specification */
298 ignoreCacheControl = true;
299
300 delete sctusable;
301 }
302 }
303 }
304
305 int
306 HttpStateData::cacheableReply()
307 {
308 HttpReply const *rep = finalReply();
309 HttpHeader const *hdr = &rep->header;
310 const char *v;
311 #if USE_HTTP_VIOLATIONS
312
313 const RefreshPattern *R = NULL;
314
315 /* This strange-looking define first looks up the refresh pattern
316 * and then checks if the specified flag is set. Its main purpose
317 * is to simplify the refresh pattern lookup and the
318 * USE_HTTP_VIOLATIONS condition.
319 */
320 #define REFRESH_OVERRIDE(flag) \
321 ((R = (R ? R : refreshLimits(entry->mem_obj->storeId()))) , \
322 (R && R->flags.flag))
323 #else
324 #define REFRESH_OVERRIDE(flag) 0
325 #endif
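/* Usage sketch (mirrors the checks below): the first REFRESH_OVERRIDE() call in this
 * function performs the refreshLimits() lookup and caches the result in R;
 * subsequent calls only test the requested flag, e.g.
 *
 *   if (rep->cache_control->noStore() && !REFRESH_OVERRIDE(ignore_no_store))
 *       return 0; // not cacheable
 */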
326
327 if (EBIT_TEST(entry->flags, RELEASE_REQUEST)) {
328 debugs(22, 3, "NO because " << *entry << " has been released.");
329 return 0;
330 }
331
332 // Check for Surrogate/1.0 protocol conditions
333 // NP: reverse-proxy traffic our parent server has instructed us never to cache
334 if (surrogateNoStore) {
335 debugs(22, 3, HERE << "NO because Surrogate-Control:no-store");
336 return 0;
337 }
338
339 // RFC 2616: HTTP/1.1 Cache-Control conditions
340 if (!ignoreCacheControl) {
341 // XXX: check to see if the request headers alone were enough to prevent caching earlier
342 // (ie no-store request header) no need to check those all again here if so.
343 // for now we are not reliably doing that so we waste CPU re-checking request CC
344
345 // RFC 2616 section 14.9.2 - MUST NOT cache any response with request CC:no-store
346 if (request && request->cache_control && request->cache_control->noStore() &&
347 !REFRESH_OVERRIDE(ignore_no_store)) {
348 debugs(22, 3, HERE << "NO because client request Cache-Control:no-store");
349 return 0;
350 }
351
352 // NP: request CC:no-cache only means cache READ is forbidden. STORE is permitted.
353 if (rep->cache_control && rep->cache_control->hasNoCache() && rep->cache_control->noCache().size() > 0) {
354 /* TODO: we are allowed to cache when no-cache= has parameters.
355 * Provided we strip away any of the listed headers unless they are revalidated
356 * successfully (ie, must revalidate AND these headers are prohibited on stale replies).
357 * That is a bit tricky for squid right now so we avoid caching entirely.
358 */
359 debugs(22, 3, HERE << "NO because server reply Cache-Control:no-cache has parameters");
360 return 0;
361 }
362
363 // NP: request CC:private is undefined. We ignore.
364 // NP: other request CC flags are limiters on HIT/MISS. We don't care about here.
365
366 // RFC 2616 section 14.9.2 - MUST NOT cache any response with CC:no-store
367 if (rep->cache_control && rep->cache_control->noStore() &&
368 !REFRESH_OVERRIDE(ignore_no_store)) {
369 debugs(22, 3, HERE << "NO because server reply Cache-Control:no-store");
370 return 0;
371 }
372
373 // RFC 2616 section 14.9.1 - MUST NOT cache any response with CC:private in a shared cache like Squid.
374 // CC:private overrides CC:public when both are present in a response.
375 // TODO: add a shared/private cache configuration possibility.
376 if (rep->cache_control &&
377 rep->cache_control->hasPrivate() &&
378 !REFRESH_OVERRIDE(ignore_private)) {
379 /* TODO: we are allowed to cache when private= has parameters.
380 * Provided we strip away any of the listed headers unless they are revalidated
381 * successfully (ie, must revalidate AND these headers are prohibited on stale replies).
382 * That is a bit tricky for squid right now so we avoid caching entirely.
383 */
384 debugs(22, 3, HERE << "NO because server reply Cache-Control:private");
385 return 0;
386 }
387 }
388
389 // RFC 2068, sec 14.9.4 - MUST NOT cache any response with Authentication UNLESS certain CC controls are present
390 // allow HTTP violations to IGNORE those controls (ie re-block caching Auth)
391 if (request && (request->flags.auth || request->flags.authSent)) {
392 if (!rep->cache_control) {
393 debugs(22, 3, HERE << "NO because Authenticated and server reply missing Cache-Control");
394 return 0;
395 }
396
397 if (ignoreCacheControl) {
398 debugs(22, 3, HERE << "NO because Authenticated and ignoring Cache-Control");
399 return 0;
400 }
401
402 bool mayStore = false;
403 // HTTPbis pt6 section 3.2: a response CC:public is present
404 if (rep->cache_control->Public()) {
405 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:public");
406 mayStore = true;
407
408 // HTTPbis pt6 section 3.2: a response CC:must-revalidate is present
409 } else if (rep->cache_control->mustRevalidate() && !REFRESH_OVERRIDE(ignore_must_revalidate)) {
410 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:must-revalidate");
411 mayStore = true;
412
413 #if USE_HTTP_VIOLATIONS
414 // NP: given the must-revalidate exception we should also be able to exempt no-cache.
415 // HTTPbis WG verdict on this is that it is omitted from the spec due to being 'unexpected' by
416 // some. The caching+revalidate is not exactly unsafe though with Squid's interpretation of no-cache
417 // (without parameters) as equivalent to must-revalidate in the reply.
418 } else if (rep->cache_control->hasNoCache() && rep->cache_control->noCache().size() == 0 && !REFRESH_OVERRIDE(ignore_must_revalidate)) {
419 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:no-cache (equivalent to must-revalidate)");
420 mayStore = true;
421 #endif
422
423 // HTTPbis pt6 section 3.2: a response CC:s-maxage is present
424 } else if (rep->cache_control->sMaxAge()) {
425 debugs(22, 3, HERE << "Authenticated but server reply Cache-Control:s-maxage");
426 mayStore = true;
427 }
428
429 if (!mayStore) {
430 debugs(22, 3, HERE << "NO because Authenticated transaction");
431 return 0;
432 }
433
434 // NP: response CC:no-cache is equivalent to CC:must-revalidate,max-age=0. We MAY cache, and do so.
435 // NP: other request CC flags are limiters on HIT/MISS/REFRESH. We don't care about here.
436 }
437
438 /* HACK: The "multipart/x-mixed-replace" content type is used for
439 * continuous push replies. These are generally dynamic and
440 * probably should not be cachable
441 */
442 if ((v = hdr->getStr(HDR_CONTENT_TYPE)))
443 if (!strncasecmp(v, "multipart/x-mixed-replace", 25)) {
444 debugs(22, 3, HERE << "NO because Content-Type:multipart/x-mixed-replace");
445 return 0;
446 }
447
448 switch (rep->sline.status()) {
449 /* Responses that are cacheable */
450
451 case Http::scOkay:
452
453 case Http::scNonAuthoritativeInformation:
454
455 case Http::scMultipleChoices:
456
457 case Http::scMovedPermanently:
458 case Http::scPermanentRedirect:
459
460 case Http::scGone:
461 /*
462 * Don't cache objects that need to be refreshed on next request,
463 * unless we know how to refresh them.
464 */
465
466 if (!refreshIsCachable(entry) && !REFRESH_OVERRIDE(store_stale)) {
467 debugs(22, 3, "NO because refreshIsCachable() returned non-cacheable..");
468 return 0;
469 } else {
470 debugs(22, 3, HERE << "YES because HTTP status " << rep->sline.status());
471 return 1;
472 }
473 /* NOTREACHED */
474 break;
475
476 /* Responses that only are cacheable if the server says so */
477
478 case Http::scFound:
479 case Http::scTemporaryRedirect:
480 if (rep->date <= 0) {
481 debugs(22, 3, HERE << "NO because HTTP status " << rep->sline.status() << " and Date missing/invalid");
482 return 0;
483 }
484 if (rep->expires > rep->date) {
485 debugs(22, 3, HERE << "YES because HTTP status " << rep->sline.status() << " and Expires > Date");
486 return 1;
487 } else {
488 debugs(22, 3, HERE << "NO because HTTP status " << rep->sline.status() << " and Expires <= Date");
489 return 0;
490 }
491 /* NOTREACHED */
492 break;
493
494 /* Errors can be negatively cached */
495
496 case Http::scNoContent:
497
498 case Http::scUseProxy:
499
500 case Http::scBadRequest:
501
502 case Http::scForbidden:
503
504 case Http::scNotFound:
505
506 case Http::scMethodNotAllowed:
507
508 case Http::scUriTooLong:
509
510 case Http::scInternalServerError:
511
512 case Http::scNotImplemented:
513
514 case Http::scBadGateway:
515
516 case Http::scServiceUnavailable:
517
518 case Http::scGatewayTimeout:
519 case Http::scMisdirectedRequest:
520
521 debugs(22, 3, "MAYBE because HTTP status " << rep->sline.status());
522 return -1;
523
524 /* NOTREACHED */
525 break;
526
527 /* Some responses can never be cached */
528
529 case Http::scPartialContent: /* Not yet supported */
530
531 case Http::scSeeOther:
532
533 case Http::scNotModified:
534
535 case Http::scUnauthorized:
536
537 case Http::scProxyAuthenticationRequired:
538
539 case Http::scInvalidHeader: /* Squid header parsing error */
540
541 case Http::scHeaderTooLarge:
542
543 case Http::scPaymentRequired:
544 case Http::scNotAcceptable:
545 case Http::scRequestTimeout:
546 case Http::scConflict:
547 case Http::scLengthRequired:
548 case Http::scPreconditionFailed:
549 case Http::scPayloadTooLarge:
550 case Http::scUnsupportedMediaType:
551 case Http::scUnprocessableEntity:
552 case Http::scLocked:
553 case Http::scFailedDependency:
554 case Http::scInsufficientStorage:
555 case Http::scRequestedRangeNotSatisfied:
556 case Http::scExpectationFailed:
557
558 debugs(22, 3, HERE << "NO because HTTP status " << rep->sline.status());
559 return 0;
560
561 default:
562 /* RFC 2616 section 6.1.1: an unrecognized response MUST NOT be cached. */
563 debugs (11, 3, HERE << "NO because unknown HTTP status code " << rep->sline.status());
564 return 0;
565
566 /* NOTREACHED */
567 break;
568 }
569
570 /* NOTREACHED */
571 }
572
573 /*
574 * For Vary, store the relevant request headers as
575 * virtual headers in the reply
576 * Returns NULL if the variance cannot be stored
577 */
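/* Example (illustrative values): a reply carrying "Vary: Accept-Encoding" and a
 * client request carrying "Accept-Encoding: gzip" produce roughly the mark
 *   accept-encoding="gzip"
 * i.e. lower-cased header names, each followed by the rfc1738-escaped request value.
 */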
578 const char *
579 httpMakeVaryMark(HttpRequest * request, HttpReply const * reply)
580 {
581 String vary, hdr;
582 const char *pos = NULL;
583 const char *item;
584 const char *value;
585 int ilen;
586 static String vstr;
587
588 vstr.clean();
589 vary = reply->header.getList(HDR_VARY);
590
591 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
592 char *name = (char *)xmalloc(ilen + 1);
593 xstrncpy(name, item, ilen + 1);
594 Tolower(name);
595
596 if (strcmp(name, "*") == 0) {
597 /* Can not handle "Vary: *" without ETag support */
598 safe_free(name);
599 vstr.clean();
600 break;
601 }
602
603 strListAdd(&vstr, name, ',');
604 hdr = request->header.getByName(name);
605 safe_free(name);
606 value = hdr.termedBuf();
607
608 if (value) {
609 value = rfc1738_escape_part(value);
610 vstr.append("=\"", 2);
611 vstr.append(value);
612 vstr.append("\"", 1);
613 }
614
615 hdr.clean();
616 }
617
618 vary.clean();
619 #if X_ACCELERATOR_VARY
620
621 pos = NULL;
622 vary = reply->header.getList(HDR_X_ACCELERATOR_VARY);
623
624 while (strListGetItem(&vary, ',', &item, &ilen, &pos)) {
625 char *name = (char *)xmalloc(ilen + 1);
626 xstrncpy(name, item, ilen + 1);
627 Tolower(name);
628 strListAdd(&vstr, name, ',');
629 hdr = request->header.getByName(name);
630 safe_free(name);
631 value = hdr.termedBuf();
632
633 if (value) {
634 value = rfc1738_escape_part(value);
635 vstr.append("=\"", 2);
636 vstr.append(value);
637 vstr.append("\"", 1);
638 }
639
640 hdr.clean();
641 }
642
643 vary.clean();
644 #endif
645
646 debugs(11, 3, "httpMakeVaryMark: " << vstr);
647 return vstr.termedBuf();
648 }
649
650 void
651 HttpStateData::keepaliveAccounting(HttpReply *reply)
652 {
653 if (flags.keepalive)
654 if (_peer)
655 ++ _peer->stats.n_keepalives_sent;
656
657 if (reply->keep_alive) {
658 if (_peer)
659 ++ _peer->stats.n_keepalives_recv;
660
661 if (Config.onoff.detect_broken_server_pconns
662 && reply->bodySize(request->method) == -1 && !flags.chunked) {
663 debugs(11, DBG_IMPORTANT, "keepaliveAccounting: Impossible keep-alive header from '" << entry->url() << "'" );
664 // debugs(11, 2, "GOT HTTP REPLY HDR:\n---------\n" << readBuf->content() << "\n----------" );
665 flags.keepalive_broken = true;
666 }
667 }
668 }
669
670 void
671 HttpStateData::checkDateSkew(HttpReply *reply)
672 {
673 if (reply->date > -1 && !_peer) {
674 int skew = abs((int)(reply->date - squid_curtime));
675
676 if (skew > 86400)
677 debugs(11, 3, "" << request->GetHost() << "'s clock is skewed by " << skew << " seconds!");
678 }
679 }
680
681 /**
682 * This creates the error page itself. It is likely
683 * that the forward-ported reply header max size patch
684 * generates non-HTTP-conformant error pages - in which
685 * case the errors here should be 'BAD_GATEWAY' etc.
686 */
687 void
688 HttpStateData::processReplyHeader()
689 {
690 /** Creates a blank header. If this routine is made incremental, this will not do */
691
692 /* NP: all exit points to this function MUST call ctx_exit(ctx) */
693 Ctx ctx = ctx_enter(entry->mem_obj->urlXXX());
694
695 debugs(11, 3, "processReplyHeader: key '" << entry->getMD5Text() << "'");
696
697 assert(!flags.headers_parsed);
698
699 if (!inBuf.length()) {
700 ctx_exit(ctx);
701 return;
702 }
703
704 /* Attempt to parse the first line; this will define where the protocol, status, reason-phrase and header begin */
705 {
706 if (hp == NULL)
707 hp = new Http1::ResponseParser;
708
709 bool parsedOk = hp->parse(inBuf);
710
711 // sync the buffers after parsing.
712 inBuf = hp->remaining();
713
714 if (hp->needsMoreData()) {
715 if (eof) { // no more data coming
716 /* Bug 2879: Replies may terminate with \r\n then EOF instead of \r\n\r\n.
717 * We also may receive truncated responses.
718 * Ensure here that we have at minimum two \r\n when EOF is seen.
719 */
720 inBuf.append("\r\n\r\n", 4);
721 // retry the parse
722 parsedOk = hp->parse(inBuf);
723 // sync the buffers after parsing.
724 inBuf = hp->remaining();
725 } else {
726 debugs(33, 5, "Incomplete response, waiting for end of response headers");
727 ctx_exit(ctx);
728 return;
729 }
730 }
731
732 flags.headers_parsed = true;
733
734 if (!parsedOk) {
735 // unrecoverable parsing error
736 debugs(11, 3, "Non-HTTP-compliant header:\n---------\n" << inBuf << "\n----------");
737 HttpReply *newrep = new HttpReply;
738 newrep->sline.set(Http::ProtocolVersion(), hp->messageStatus());
739 HttpReply *vrep = setVirginReply(newrep);
740 entry->replaceHttpReply(vrep);
741 // XXX: close the server connection ?
742 ctx_exit(ctx);
743 return;
744 }
745 }
746
747 /* We know the whole response is in parser now */
748 debugs(11, 2, "HTTP Server " << serverConnection);
749 debugs(11, 2, "HTTP Server RESPONSE:\n---------\n" <<
750 hp->messageProtocol() << " " << hp->messageStatus() << " " << hp->reasonPhrase() << "\n" <<
751 hp->mimeHeader() <<
752 "----------");
753
754 // reset payload tracking to begin after message headers
755 payloadSeen = inBuf.length();
756
757 HttpReply *newrep = new HttpReply;
758 // XXX: RFC 7230 indicates we MAY ignore the reason phrase,
759 // and use an empty string on unknown status.
760 // We do that now to avoid performance regression from using SBuf::c_str()
761 newrep->sline.set(Http::ProtocolVersion(1,1), hp->messageStatus() /* , hp->reasonPhrase() */);
762 newrep->sline.protocol = newrep->sline.version.protocol = hp->messageProtocol().protocol;
763 newrep->sline.version.major = hp->messageProtocol().major;
764 newrep->sline.version.minor = hp->messageProtocol().minor;
765
766 // parse headers
767 newrep->pstate = psReadyToParseHeaders;
768 if (newrep->httpMsgParseStep(hp->mimeHeader().rawContent(), hp->mimeHeader().length(), true) < 0) {
769 // XXX: when Http::ProtocolVersion is a function, remove this hack. just set with messageProtocol()
770 newrep->sline.set(Http::ProtocolVersion(), Http::scInvalidHeader);
771 newrep->sline.version.protocol = hp->messageProtocol().protocol;
772 newrep->sline.version.major = hp->messageProtocol().major;
773 newrep->sline.version.minor = hp->messageProtocol().minor;
774 debugs(11, 2, "error parsing response headers mime block");
775 }
776
777 // done with Parser, now process using the HttpReply
778 hp = NULL;
779
780 newrep->removeStaleWarnings();
781
782 if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->sline.status() >= 100 && newrep->sline.status() < 200) {
783 handle1xx(newrep);
784 ctx_exit(ctx);
785 return;
786 }
787
788 flags.chunked = false;
789 if (newrep->sline.protocol == AnyP::PROTO_HTTP && newrep->header.chunked()) {
790 flags.chunked = true;
791 httpChunkDecoder = new ChunkedCodingParser;
792 }
793
794 if (!peerSupportsConnectionPinning())
795 request->flags.connectionAuthDisabled = true;
796
797 HttpReply *vrep = setVirginReply(newrep);
798 flags.headers_parsed = true;
799
800 keepaliveAccounting(vrep);
801
802 checkDateSkew(vrep);
803
804 processSurrogateControl (vrep);
805
806 request->hier.peer_reply_status = newrep->sline.status();
807
808 ctx_exit(ctx);
809 }
810
811 /// ignore or start forwarding the 1xx response (a.k.a., control message)
812 void
813 HttpStateData::handle1xx(HttpReply *reply)
814 {
815 HttpReply::Pointer msg(reply); // will destroy reply if unused
816
817 // one 1xx at a time: we must not be called while waiting for previous 1xx
818 Must(!flags.handling1xx);
819 flags.handling1xx = true;
820
821 if (!request->canHandle1xx() || request->forcedBodyContinuation) {
822 debugs(11, 2, "ignoring 1xx because it is " << (request->forcedBodyContinuation ? "already sent" : "not supported by client"));
823 proceedAfter1xx();
824 return;
825 }
826
827 #if USE_HTTP_VIOLATIONS
828 // check whether the 1xx response forwarding is allowed by squid.conf
829 if (Config.accessList.reply) {
830 ACLFilledChecklist ch(Config.accessList.reply, originalRequest(), NULL);
831 ch.reply = reply;
832 HTTPMSGLOCK(ch.reply);
833 if (ch.fastCheck() != ACCESS_ALLOWED) { // TODO: support slow lookups?
834 debugs(11, 3, HERE << "ignoring denied 1xx");
835 proceedAfter1xx();
836 return;
837 }
838 }
839 #endif // USE_HTTP_VIOLATIONS
840
841 debugs(11, 2, HERE << "forwarding 1xx to client");
842
843 // the Sink will use this to call us back after writing 1xx to the client
844 typedef NullaryMemFunT<HttpStateData> CbDialer;
845 const AsyncCall::Pointer cb = JobCallback(11, 3, CbDialer, this,
846 HttpStateData::proceedAfter1xx);
847 CallJobHere1(11, 4, request->clientConnectionManager, ConnStateData,
848 ConnStateData::sendControlMsg, HttpControlMsg(msg, cb));
849 // If the call is not fired, then the Sink is gone, and HttpStateData
850 // will terminate due to an aborted store entry or another similar error.
851 // If we get stuck, it is not handle1xx's fault, because we could get stuck
852 // for similar reasons without a 1xx response.
853 }
854
855 /// restores state and resumes processing after 1xx is ignored or forwarded
856 void
857 HttpStateData::proceedAfter1xx()
858 {
859 Must(flags.handling1xx);
860 debugs(11, 2, "continuing with " << payloadSeen << " bytes in buffer after 1xx");
861 CallJobHere(11, 3, this, HttpStateData, HttpStateData::processReply);
862 }
863
864 /**
865 * returns true if the peer can support connection pinning
866 */
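/* Decision sketch (summarising the checks implemented below):
 *   no cache_peer (_peer is NULL)              -> true
 *   peer without connection_auth support       -> false
 *   reply status is not 401 Unauthorized       -> true
 *   peer uses connection-auth=on               -> true
 *   peer uses connection-auth=auto             -> true only for originserver peers,
 *       already-pinned requests, or replies whose Proxy-support header lists
 *       "Session-Based-Authentication"; otherwise false
 */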
867 bool HttpStateData::peerSupportsConnectionPinning() const
868 {
869 const HttpReply *rep = entry->mem_obj->getReply();
870 const HttpHeader *hdr = &rep->header;
871 bool rc;
872 String header;
873
874 if (!_peer)
875 return true;
876
877 /*If this peer does not support connection pinning (authenticated
878 connections) return false
879 */
880 if (!_peer->connection_auth)
881 return false;
882
883 /*The peer supports connection pinning and the http reply status
884 is not unauthorized, so the related connection can be pinned
885 */
886 if (rep->sline.status() != Http::scUnauthorized)
887 return true;
888
889 /* The server responded with Http::scUnauthorized and the peer is configured
890 with "connection-auth=on", so we know that the peer supports pinned
891 connections
892 */
893 if (_peer->connection_auth == 1)
894 return true;
895
896 /* At this point the peer is configured with the "connection-auth=auto"
897 parameter, so we need some extra checks to decide if we are going
898 to allow pinned connections or not
899 */
900
901 /* if the peer is configured with originserver, just allow connection
902 pinning (squid 2.6 behaviour)
903 */
904 if (_peer->options.originserver)
905 return true;
906
907 /* if the connection is already pinned it is OK */
908 if (request->flags.pinned)
909 return true;
910
911 /* Allow pinned connections only if the Proxy-support header exists in the
912 reply and its list contains "Session-Based-Authentication",
913 which means that the peer supports connection pinning.
914 */
915 if (!hdr->has(HDR_PROXY_SUPPORT))
916 return false;
917
918 header = hdr->getStrOrList(HDR_PROXY_SUPPORT);
919 /* XXX This ought to be done in a case-insensitive manner */
920 rc = (strstr(header.termedBuf(), "Session-Based-Authentication") != NULL);
921
922 return rc;
923 }
924
925 // Called when we parsed (and possibly adapted) the headers but
926 // had not started storing (a.k.a., sending) the body yet.
927 void
928 HttpStateData::haveParsedReplyHeaders()
929 {
930 Client::haveParsedReplyHeaders();
931
932 Ctx ctx = ctx_enter(entry->mem_obj->urlXXX());
933 HttpReply *rep = finalReply();
934
935 entry->timestampsSet();
936
937 /* Check if object is cacheable or not based on reply code */
938 debugs(11, 3, "HTTP CODE: " << rep->sline.status());
939
940 if (neighbors_do_private_keys)
941 httpMaybeRemovePublic(entry, rep->sline.status());
942
943 bool varyFailure = false;
944 if (rep->header.has(HDR_VARY)
945 #if X_ACCELERATOR_VARY
946 || rep->header.has(HDR_X_ACCELERATOR_VARY)
947 #endif
948 ) {
949 const char *vary = httpMakeVaryMark(request, rep);
950
951 if (!vary) {
952 entry->makePrivate();
953 if (!fwd->reforwardableStatus(rep->sline.status()))
954 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
955 varyFailure = true;
956 } else {
957 entry->mem_obj->vary_headers = xstrdup(vary);
958 }
959 }
960
961 if (!varyFailure) {
962 /*
963 * If it's not a reply that we will re-forward, then
964 * allow the client to get it.
965 */
966 if (!fwd->reforwardableStatus(rep->sline.status()))
967 EBIT_CLR(entry->flags, ENTRY_FWD_HDR_WAIT);
968
969 switch (cacheableReply()) {
970
971 case 1:
972 entry->makePublic();
973 break;
974
975 case 0:
976 entry->makePrivate();
977 break;
978
979 case -1:
980
981 #if USE_HTTP_VIOLATIONS
982 if (Config.negativeTtl > 0)
983 entry->cacheNegatively();
984 else
985 #endif
986 entry->makePrivate();
987 break;
988
989 default:
990 assert(0);
991 break;
992 }
993 }
994
995 if (!ignoreCacheControl) {
996 if (rep->cache_control) {
997 // We are required to revalidate on many conditions.
998 // For security reasons we do so even if storage was caused by refresh_pattern ignore-* option
999
1000 // CC:must-revalidate or CC:proxy-revalidate
1001 const bool ccMustRevalidate = (rep->cache_control->proxyRevalidate() || rep->cache_control->mustRevalidate());
1002
1003 // CC:no-cache (only if there are no parameters)
1004 const bool ccNoCacheNoParams = (rep->cache_control->hasNoCache() && rep->cache_control->noCache().size()==0);
1005
1006 // CC:s-maxage=N
1007 const bool ccSMaxAge = rep->cache_control->hasSMaxAge();
1008
1009 // CC:private (yes, these can sometimes be stored)
1010 const bool ccPrivate = rep->cache_control->hasPrivate();
1011
1012 if (ccMustRevalidate || ccNoCacheNoParams || ccSMaxAge || ccPrivate)
1013 EBIT_SET(entry->flags, ENTRY_REVALIDATE);
1014 }
1015 #if USE_HTTP_VIOLATIONS // response header Pragma::no-cache is undefined in HTTP
1016 else {
1017 // Expensive calculation. So only do it IF the CC: header is not present.
1018
1019 /* HACK: Pragma: no-cache in _replies_ is not documented in HTTP,
1020 * but servers like "Active Imaging Webcast/2.0" sure do use it */
1021 if (rep->header.has(HDR_PRAGMA) &&
1022 rep->header.hasListMember(HDR_PRAGMA,"no-cache",','))
1023 EBIT_SET(entry->flags, ENTRY_REVALIDATE);
1024 }
1025 #endif
1026 }
1027
1028 #if HEADERS_LOG
1029 headersLog(1, 0, request->method, rep);
1030
1031 #endif
1032
1033 ctx_exit(ctx);
1034 }
1035
1036 HttpStateData::ConnectionStatus
1037 HttpStateData::statusIfComplete() const
1038 {
1039 const HttpReply *rep = virginReply();
1040 /** \par
1041 * If the reply wants to close the connection, it takes precedence */
1042
1043 if (httpHeaderHasConnDir(&rep->header, "close"))
1044 return COMPLETE_NONPERSISTENT_MSG;
1045
1046 /** \par
1047 * If we didn't send a keep-alive request header, then this
1048 * can not be a persistent connection.
1049 */
1050 if (!flags.keepalive)
1051 return COMPLETE_NONPERSISTENT_MSG;
1052
1053 /** \par
1054 * If we haven't sent the whole request then this can not be a persistent
1055 * connection.
1056 */
1057 if (!flags.request_sent) {
1058 debugs(11, 2, "Request not yet fully sent " << request->method << ' ' << entry->url());
1059 return COMPLETE_NONPERSISTENT_MSG;
1060 }
1061
1062 /** \par
1063 * What does the reply have to say about keep-alive?
1064 */
1065 /**
1066 \bug XXX BUG?
1067 * If the origin server (HTTP/1.0) does not send a keep-alive
1068 * header, but keeps the connection open anyway, what happens?
1069 * We'll return here and http.c waits for an EOF before changing
1070 * store_status to STORE_OK. Combine this with ENTRY_FWD_HDR_WAIT
1071 * and an error status code, and we might have to wait until
1072 * the server times out the socket.
1073 */
1074 if (!rep->keep_alive)
1075 return COMPLETE_NONPERSISTENT_MSG;
1076
1077 return COMPLETE_PERSISTENT_MSG;
1078 }
1079
1080 HttpStateData::ConnectionStatus
1081 HttpStateData::persistentConnStatus() const
1082 {
1083 debugs(11, 3, HERE << serverConnection << " eof=" << eof);
1084 if (eof) // already reached EOF
1085 return COMPLETE_NONPERSISTENT_MSG;
1086
1087 /* If server fd is closing (but we have not been notified yet), stop Comm
1088 I/O to avoid assertions. TODO: Change Comm API to handle callers that
1089 want more I/O after async closing (usually initiated by others). */
1090 // XXX: add canReceive or s/canSend/canTalkToServer/
1091 if (!Comm::IsConnOpen(serverConnection))
1092 return COMPLETE_NONPERSISTENT_MSG;
1093
1094 /** \par
1095 * In a chunked response we do not know the content length, but we are absolutely
1096 * sure about the end of the response, so we call statusIfComplete() to
1097 * decide if we can be persistent
1098 */
1099 if (lastChunk && flags.chunked)
1100 return statusIfComplete();
1101
1102 const HttpReply *vrep = virginReply();
1103 debugs(11, 5, "persistentConnStatus: content_length=" << vrep->content_length);
1104
1105 const int64_t clen = vrep->bodySize(request->method);
1106
1107 debugs(11, 5, "persistentConnStatus: clen=" << clen);
1108
1109 /* If the body size is unknown we must wait for EOF */
1110 if (clen < 0)
1111 return INCOMPLETE_MSG;
1112
1113 /** \par
1114 * If the body size is known, we must wait until we've gotten all of it. */
1115 if (clen > 0) {
1116 debugs(11,5, "payloadSeen=" << payloadSeen << " content_length=" << vrep->content_length);
1117
1118 if (payloadSeen < vrep->content_length)
1119 return INCOMPLETE_MSG;
1120
1121 if (payloadTruncated > 0) // already read more than needed
1122 return COMPLETE_NONPERSISTENT_MSG; // disable pconns
1123 }
1124
1125 /** \par
1126 * If there is no message body or we got it all, we can be persistent */
1127 return statusIfComplete();
1128 }
1129
1130 #if USE_DELAY_POOLS
1131 static void
1132 readDelayed(void *context, CommRead const &)
1133 {
1134 HttpStateData *state = static_cast<HttpStateData*>(context);
1135 state->flags.do_next_read = true;
1136 state->maybeReadVirginBody();
1137 }
1138 #endif
1139
1140 void
1141 HttpStateData::readReply(const CommIoCbParams &io)
1142 {
1143 Must(!flags.do_next_read); // XXX: should have been set false by maybeReadVirginBody()
1144 flags.do_next_read = false;
1145
1146 debugs(11, 5, io.conn);
1147
1148 // Bail out early on Comm::ERR_CLOSING - close handlers will tidy up for us
1149 if (io.flag == Comm::ERR_CLOSING) {
1150 debugs(11, 3, "http socket closing");
1151 return;
1152 }
1153
1154 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1155 abortTransaction("store entry aborted while reading reply");
1156 return;
1157 }
1158
1159 Must(Comm::IsConnOpen(serverConnection));
1160 Must(io.conn->fd == serverConnection->fd);
1161
1162 /*
1163 * Don't reset the timeout value here. The value should be
1164 * counting Config.Timeout.request and applies to the request
1165 * as a whole, not individual read() calls.
1166 * Plus, it breaks our lame *HalfClosed() detection
1167 */
1168
1169 Must(maybeMakeSpaceAvailable(true));
1170 CommIoCbParams rd(this); // will be expanded with ReadNow results
1171 rd.conn = io.conn;
1172 rd.size = entry->bytesWanted(Range<size_t>(0, inBuf.spaceSize()));
1173 #if USE_DELAY_POOLS
1174 if (rd.size < 1) {
1175 assert(entry->mem_obj);
1176
1177 /* read ahead limit */
1178 /* Perhaps these two calls should both live in MemObject */
1179 AsyncCall::Pointer nilCall;
1180 if (!entry->mem_obj->readAheadPolicyCanRead()) {
1181 entry->mem_obj->delayRead(DeferredRead(readDelayed, this, CommRead(io.conn, NULL, 0, nilCall)));
1182 return;
1183 }
1184
1185 /* delay id limit */
1186 entry->mem_obj->mostBytesAllowed().delayRead(DeferredRead(readDelayed, this, CommRead(io.conn, NULL, 0, nilCall)));
1187 return;
1188 }
1189 #endif
1190
1191 switch (Comm::ReadNow(rd, inBuf)) {
1192 case Comm::INPROGRESS:
1193 if (inBuf.isEmpty())
1194 debugs(33, 2, io.conn << ": no data to process, " << xstrerr(rd.xerrno));
1195 flags.do_next_read = true;
1196 maybeReadVirginBody();
1197 return;
1198
1199 case Comm::OK:
1200 {
1201 payloadSeen += rd.size;
1202 #if USE_DELAY_POOLS
1203 DelayId delayId = entry->mem_obj->mostBytesAllowed();
1204 delayId.bytesIn(rd.size);
1205 #endif
1206
1207 kb_incr(&(statCounter.server.all.kbytes_in), rd.size);
1208 kb_incr(&(statCounter.server.http.kbytes_in), rd.size);
1209 ++ IOStats.Http.reads;
1210
1211 int bin = 0;
1212 for (int clen = rd.size - 1; clen; ++bin)
1213 clen >>= 1;
1214
1215 ++ IOStats.Http.read_hist[bin];
1216
1217 // update peer response time stats (%<pt)
1218 const timeval &sent = request->hier.peer_http_request_sent;
1219 if (sent.tv_sec)
1220 tvSub(request->hier.peer_response_time, sent, current_time);
1221 else
1222 request->hier.peer_response_time.tv_sec = -1;
1223 }
1224
1225 /* Continue to process previously read data */
1226 break;
1227
1228 case Comm::ENDFILE: // close detected by 0-byte read
1229 eof = 1;
1230 flags.do_next_read = false;
1231
1232 /* Continue to process previously read data */
1233 break;
1234
1235 // case Comm::COMM_ERROR:
1236 default: // no other flags should ever occur
1237 debugs(11, 2, io.conn << ": read failure: " << xstrerr(rd.xerrno));
1238 ErrorState *err = new ErrorState(ERR_READ_ERROR, Http::scBadGateway, fwd->request);
1239 err->xerrno = rd.xerrno;
1240 fwd->fail(err);
1241 flags.do_next_read = false;
1242 io.conn->close();
1243
1244 return;
1245 }
1246
1247 /* Process next response from buffer */
1248 processReply();
1249 }
1250
1251 /// processes the already read and buffered response data, possibly after
1252 /// waiting for asynchronous 1xx control message processing
1253 void
1254 HttpStateData::processReply()
1255 {
1256
1257 if (flags.handling1xx) { // we came back after handling a 1xx response
1258 debugs(11, 5, HERE << "done with 1xx handling");
1259 flags.handling1xx = false;
1260 Must(!flags.headers_parsed);
1261 }
1262
1263 if (!flags.headers_parsed) { // have not parsed headers yet?
1264 PROF_start(HttpStateData_processReplyHeader);
1265 processReplyHeader();
1266 PROF_stop(HttpStateData_processReplyHeader);
1267
1268 if (!continueAfterParsingHeader()) // parsing error or need more data
1269 return; // TODO: send errors to ICAP
1270
1271 adaptOrFinalizeReply(); // may write to, abort, or "close" the entry
1272 }
1273
1274 // kick more reads if needed and/or process the response body, if any
1275 PROF_start(HttpStateData_processReplyBody);
1276 processReplyBody(); // may call serverComplete()
1277 PROF_stop(HttpStateData_processReplyBody);
1278 }
1279
1280 /**
1281 \retval true if we can continue with processing the body or doing ICAP.
1282 */
1283 bool
1284 HttpStateData::continueAfterParsingHeader()
1285 {
1286 if (flags.handling1xx) {
1287 debugs(11, 5, HERE << "wait for 1xx handling");
1288 Must(!flags.headers_parsed);
1289 return false;
1290 }
1291
1292 if (!flags.headers_parsed && !eof) {
1293 debugs(11, 9, "needs more at " << inBuf.length());
1294 flags.do_next_read = true;
1295 /** \retval false If we have not finished parsing the headers and may get more data.
1296 * Schedules more reads to retrieve the missing data.
1297 */
1298 maybeReadVirginBody(); // schedules all kinds of reads; TODO: rename
1299 return false;
1300 }
1301
1302 /** If we are done with parsing, check for errors */
1303
1304 err_type error = ERR_NONE;
1305
1306 if (flags.headers_parsed) { // parsed headers, possibly with errors
1307 // check for header parsing errors
1308 if (HttpReply *vrep = virginReply()) {
1309 const Http::StatusCode s = vrep->sline.status();
1310 const AnyP::ProtocolVersion &v = vrep->sline.version;
1311 if (s == Http::scInvalidHeader && v != Http::ProtocolVersion(0,9)) {
1312 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Bad header encountered from " << entry->url() << " AKA " << request->GetHost() << request->urlpath.termedBuf() );
1313 error = ERR_INVALID_RESP;
1314 } else if (s == Http::scHeaderTooLarge) {
1315 fwd->dontRetry(true);
1316 error = ERR_TOO_BIG;
1317 } else {
1318 return true; // done parsing, got reply, and no error
1319 }
1320 } else {
1321 // parsed headers but got no reply
1322 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: No reply at all for " << entry->url() << " AKA " << request->GetHost() << request->urlpath.termedBuf() );
1323 error = ERR_INVALID_RESP;
1324 }
1325 } else {
1326 assert(eof);
1327 if (inBuf.length()) {
1328 error = ERR_INVALID_RESP;
1329 debugs(11, DBG_IMPORTANT, "WARNING: HTTP: Invalid Response: Headers did not parse at all for " << entry->url() << " AKA " << request->GetHost() << request->urlpath.termedBuf() );
1330 } else {
1331 error = ERR_ZERO_SIZE_OBJECT;
1332 debugs(11, (request->flags.accelerated?DBG_IMPORTANT:2), "WARNING: HTTP: Invalid Response: No object data received for " <<
1333 entry->url() << " AKA " << request->GetHost() << request->urlpath.termedBuf() );
1334 }
1335 }
1336
1337 assert(error != ERR_NONE);
1338 entry->reset();
1339 fwd->fail(new ErrorState(error, Http::scBadGateway, fwd->request));
1340 flags.do_next_read = false;
1341 serverConnection->close();
1342 return false; // quit on error
1343 }
1344
1345 /** truncate what we read if we read too much so that writeReplyBody()
1346 writes no more than what we should have read */
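/* Worked example (illustrative numbers): with clen == 100, payloadSeen == 120 and
 * payloadTruncated == 0, extras == 20, so the last 20 bytes are chopped off inBuf
 * and payloadTruncated becomes 20.
 */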
1347 void
1348 HttpStateData::truncateVirginBody()
1349 {
1350 assert(flags.headers_parsed);
1351
1352 HttpReply *vrep = virginReply();
1353 int64_t clen = -1;
1354 if (!vrep->expectingBody(request->method, clen) || clen < 0)
1355 return; // no body or a body of unknown size, including chunked
1356
1357 if (payloadSeen - payloadTruncated <= clen)
1358 return; // we did not read too much or already took care of the extras
1359
1360 if (const int64_t extras = payloadSeen - payloadTruncated - clen) {
1361 // server sent more than the advertised content length
1362 debugs(11, 5, "payloadSeen=" << payloadSeen <<
1363 " clen=" << clen << '/' << vrep->content_length <<
1364 " truncated=" << payloadTruncated << '+' << extras);
1365
1366 inBuf.chop(0, inBuf.length() - extras);
1367 payloadTruncated += extras;
1368 }
1369 }
1370
1371 /**
1372 * Call this when there is data from the origin server
1373 * which should be sent to either StoreEntry, or to ICAP...
1374 */
1375 void
1376 HttpStateData::writeReplyBody()
1377 {
1378 truncateVirginBody(); // if needed
1379 const char *data = inBuf.rawContent();
1380 int len = inBuf.length();
1381 addVirginReplyBody(data, len);
1382 inBuf.consume(len);
1383 }
1384
1385 bool
1386 HttpStateData::decodeAndWriteReplyBody()
1387 {
1388 const char *data = NULL;
1389 int len;
1390 bool wasThereAnException = false;
1391 assert(flags.chunked);
1392 assert(httpChunkDecoder);
1393 SQUID_ENTER_THROWING_CODE();
1394 MemBuf decodedData;
1395 decodedData.init();
1396 // XXX: performance regression. SBuf-convert (or Parser-convert?) the chunked decoder.
1397 MemBuf encodedData;
1398 encodedData.init();
1399 // NP: we must do this instead of pointing encodedData at the SBuf::rawContent
1400 // because chunked decoder uses MemBuf::consume, which shuffles buffer bytes around.
1401 encodedData.append(inBuf.rawContent(), inBuf.length());
1402 const bool doneParsing = httpChunkDecoder->parse(&encodedData,&decodedData);
1403 // XXX: httpChunkDecoder has consumed from MemBuf.
1404 inBuf.consume(inBuf.length() - encodedData.contentSize());
1405 len = decodedData.contentSize();
1406 data=decodedData.content();
1407 addVirginReplyBody(data, len);
1408 if (doneParsing) {
1409 lastChunk = 1;
1410 flags.do_next_read = false;
1411 }
1412 SQUID_EXIT_THROWING_CODE(wasThereAnException);
1413 return wasThereAnException;
1414 }
1415
1416 /**
1417 * processReplyBody has two purposes:
1418 * 1 - take the reply body data, if any, and put it into either
1419 * the StoreEntry, or give it over to ICAP.
1420 * 2 - see if we made it to the end of the response (persistent
1421 * connections and such)
1422 */
1423 void
1424 HttpStateData::processReplyBody()
1425 {
1426 Ip::Address client_addr;
1427 bool ispinned = false;
1428
1429 if (!flags.headers_parsed) {
1430 flags.do_next_read = true;
1431 maybeReadVirginBody();
1432 return;
1433 }
1434
1435 #if USE_ADAPTATION
1436 debugs(11,5, HERE << "adaptationAccessCheckPending=" << adaptationAccessCheckPending);
1437 if (adaptationAccessCheckPending)
1438 return;
1439
1440 #endif
1441
1442 /*
1443 * At this point the reply headers have been parsed and consumed.
1444 * That means header content has been removed from readBuf and
1445 * it contains only body data.
1446 */
1447 if (entry->isAccepting()) {
1448 if (flags.chunked) {
1449 if (!decodeAndWriteReplyBody()) {
1450 flags.do_next_read = false;
1451 serverComplete();
1452 return;
1453 }
1454 } else
1455 writeReplyBody();
1456 }
1457
1458 if (EBIT_TEST(entry->flags, ENTRY_ABORTED)) {
1459 // The above writeReplyBody() call may have aborted the store entry.
1460 abortTransaction("store entry aborted while storing reply");
1461 return;
1462 } else
1463 switch (persistentConnStatus()) {
1464 case INCOMPLETE_MSG: {
1465 debugs(11, 5, "processReplyBody: INCOMPLETE_MSG from " << serverConnection);
1466 /* Wait for more data or EOF condition */
1467 AsyncCall::Pointer nil;
1468 if (flags.keepalive_broken) {
1469 commSetConnTimeout(serverConnection, 10, nil);
1470 } else {
1471 commSetConnTimeout(serverConnection, Config.Timeout.read, nil);
1472 }
1473
1474 flags.do_next_read = true;
1475 }
1476 break;
1477
1478 case COMPLETE_PERSISTENT_MSG:
1479 debugs(11, 5, "processReplyBody: COMPLETE_PERSISTENT_MSG from " << serverConnection);
1480 /* yes we have to clear all these! */
1481 commUnsetConnTimeout(serverConnection);
1482 flags.do_next_read = false;
1483
1484 comm_remove_close_handler(serverConnection->fd, closeHandler);
1485 closeHandler = NULL;
1486 fwd->unregister(serverConnection);
1487
1488 if (request->flags.spoofClientIp)
1489 client_addr = request->client_addr;
1490
1491 if (request->flags.pinned) {
1492 ispinned = true;
1493 } else if (request->flags.connectionAuth && request->flags.authSent) {
1494 ispinned = true;
1495 }
1496
1497 if (ispinned && request->clientConnectionManager.valid()) {
1498 request->clientConnectionManager->pinConnection(serverConnection, request, _peer,
1499 (request->flags.connectionAuth));
1500 } else {
1501 fwd->pconnPush(serverConnection, request->GetHost());
1502 }
1503
1504 serverConnection = NULL;
1505 serverComplete();
1506 return;
1507
1508 case COMPLETE_NONPERSISTENT_MSG:
1509 debugs(11, 5, "processReplyBody: COMPLETE_NONPERSISTENT_MSG from " << serverConnection);
1510 serverComplete();
1511 return;
1512 }
1513
1514 maybeReadVirginBody();
1515 }
1516
1517 bool
1518 HttpStateData::mayReadVirginReplyBody() const
1519 {
1520 // TODO: Be more precise here. For example, if/when reading trailer, we may
1521 // not be doneWithServer() yet, but we should return false. Similarly, we
1522 // could still be writing the request body after receiving the whole reply.
1523 return !doneWithServer();
1524 }
1525
1526 void
1527 HttpStateData::maybeReadVirginBody()
1528 {
1529 // too late to read
1530 if (!Comm::IsConnOpen(serverConnection) || fd_table[serverConnection->fd].closing())
1531 return;
1532
1533 if (!maybeMakeSpaceAvailable(false))
1534 return;
1535
1536 // XXX: get rid of the do_next_read flag
1537 // check for the proper reasons preventing read(2)
1538 if (!flags.do_next_read)
1539 return;
1540
1541 flags.do_next_read = false;
1542
1543 // must not already be waiting for read(2) ...
1544 assert(!Comm::MonitorsRead(serverConnection->fd));
1545
1546 // wait for read(2) to be possible.
1547 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
1548 AsyncCall::Pointer call = JobCallback(11, 5, Dialer, this, HttpStateData::readReply);
1549 Comm::Read(serverConnection, call);
1550 }
1551
1552 bool
1553 HttpStateData::maybeMakeSpaceAvailable(bool doGrow)
1554 {
1555 // how much we are allowed to buffer
1556 const int limitBuffer = (flags.headers_parsed ? Config.readAheadGap : Config.maxReplyHeaderSize);
1557
1558 if (limitBuffer < 0 || inBuf.length() >= (SBuf::size_type)limitBuffer) {
1559 // when buffer is at or over limit already
1560 debugs(11, 7, "wont read up to " << limitBuffer << ". buffer has (" << inBuf.length() << "/" << inBuf.spaceSize() << ") from " << serverConnection);
1561 debugs(11, DBG_DATA, "buffer has {" << inBuf << "}");
1562 // Process next response from buffer
1563 processReply();
1564 return false;
1565 }
1566
1567 // how much we want to read
1568 const size_t read_size = calcBufferSpaceToReserve(inBuf.spaceSize(), (limitBuffer - inBuf.length()));
1569
1570 if (!read_size) {
1571 debugs(11, 7, "wont read up to " << read_size << " into buffer (" << inBuf.length() << "/" << inBuf.spaceSize() << ") from " << serverConnection);
1572 return false;
1573 }
1574
1575 // just report whether we could grow or not, don't actually do it
1576 if (doGrow)
1577 return (read_size >= 2);
1578
1579 // we may need to grow the buffer
1580 inBuf.reserveSpace(read_size);
1581 debugs(11, 8, (!flags.do_next_read ? "wont" : "may") <<
1582 " read up to " << read_size << " bytes into buf(" << inBuf.length() << "/" << inBuf.spaceSize() <<
1583 ") from " << serverConnection);
1584
1585 return (inBuf.spaceSize() >= 2); // only read if there is 1+ bytes of space available
1586 }
1587
1588 /// called after writing the very last request byte (body, last-chunk, etc)
1589 void
1590 HttpStateData::wroteLast(const CommIoCbParams &io)
1591 {
1592 debugs(11, 5, HERE << serverConnection << ": size " << io.size << ": errflag " << io.flag << ".");
1593 #if URL_CHECKSUM_DEBUG
1594
1595 entry->mem_obj->checkUrlChecksum();
1596 #endif
1597
1598 if (io.size > 0) {
1599 fd_bytes(io.fd, io.size, FD_WRITE);
1600 kb_incr(&(statCounter.server.all.kbytes_out), io.size);
1601 kb_incr(&(statCounter.server.http.kbytes_out), io.size);
1602 }
1603
1604 if (io.flag == Comm::ERR_CLOSING)
1605 return;
1606
1607 if (io.flag) {
1608 ErrorState *err = new ErrorState(ERR_WRITE_ERROR, Http::scBadGateway, fwd->request);
1609 err->xerrno = io.xerrno;
1610 fwd->fail(err);
1611 serverConnection->close();
1612 return;
1613 }
1614
1615 sendComplete();
1616 }
1617
1618 /// successfully wrote the entire request (including body, last-chunk, etc.)
1619 void
1620 HttpStateData::sendComplete()
1621 {
1622 /*
1623 * Set the read timeout here because it hasn't been set yet.
1624 * We only set the read timeout after the request has been
1625 * fully written to the peer. If we start the timeout
1626 * after connection establishment, then we are likely to hit
1627 * the timeout for POST/PUT requests that have very large
1628 * request bodies.
1629 */
1630 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
1631 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
1632 TimeoutDialer, this, HttpStateData::httpTimeout);
1633
1634 commSetConnTimeout(serverConnection, Config.Timeout.read, timeoutCall);
1635 flags.request_sent = true;
1636 request->hier.peer_http_request_sent = current_time;
1637 }
1638
1639 // Close the HTTP server connection. Used by serverComplete().
1640 void
1641 HttpStateData::closeServer()
1642 {
1643 debugs(11,5, HERE << "closing HTTP server " << serverConnection << " this " << this);
1644
1645 if (Comm::IsConnOpen(serverConnection)) {
1646 fwd->unregister(serverConnection);
1647 comm_remove_close_handler(serverConnection->fd, closeHandler);
1648 closeHandler = NULL;
1649 serverConnection->close();
1650 }
1651 }
1652
1653 bool
1654 HttpStateData::doneWithServer() const
1655 {
1656 return !Comm::IsConnOpen(serverConnection);
1657 }
1658
1659 /*
1660 * Fixup authentication request headers for special cases
1661 */
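/* Illustrative outcome (assuming a cache_peer configured with login=user:password):
 * requests forwarded to that peer gain roughly
 *   Proxy-Authorization: Basic dXNlcjpwYXNzd29yZA==
 * (or Authorization: for originserver/originpeer setups), i.e. the base64 encoding
 * of the configured credentials. The PASS/PASSTHRU/PROXYPASS/NEGOTIATE/'*' login
 * modes handled below modify or replace this default behaviour.
 */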
1662 static void
1663 httpFixupAuthentication(HttpRequest * request, const HttpHeader * hdr_in, HttpHeader * hdr_out, const HttpStateFlags &flags)
1664 {
1665 http_hdr_type header = flags.originpeer ? HDR_AUTHORIZATION : HDR_PROXY_AUTHORIZATION;
1666
1667 /* Nothing to do unless we are forwarding to a peer */
1668 if (!request->flags.proxying)
1669 return;
1670
1671 /* Needs to be explicitly enabled */
1672 if (!request->peer_login)
1673 return;
1674
1675 /* Maybe already dealt with? */
1676 if (hdr_out->has(header))
1677 return;
1678
1679 /* Nothing to do here for PASSTHRU */
1680 if (strcmp(request->peer_login, "PASSTHRU") == 0)
1681 return;
1682
1683 /* PROXYPASS is a special case, single-signon to servers with the proxy password (basic only) */
1684 if (flags.originpeer && strcmp(request->peer_login, "PROXYPASS") == 0 && hdr_in->has(HDR_PROXY_AUTHORIZATION)) {
1685 const char *auth = hdr_in->getStr(HDR_PROXY_AUTHORIZATION);
1686
1687 if (auth && strncasecmp(auth, "basic ", 6) == 0) {
1688 hdr_out->putStr(header, auth);
1689 return;
1690 }
1691 }
1692
1693 uint8_t loginbuf[base64_encode_len(MAX_LOGIN_SZ)];
1694 size_t blen;
1695 struct base64_encode_ctx ctx;
1696 base64_encode_init(&ctx);
1697
1698 /* Special mode to pass the username to the upstream cache */
1699 if (*request->peer_login == '*') {
1700 const char *username = "-";
1701
1702 if (request->extacl_user.size())
1703 username = request->extacl_user.termedBuf();
1704 #if USE_AUTH
1705 else if (request->auth_user_request != NULL)
1706 username = request->auth_user_request->username();
1707 #endif
1708
1709 blen = base64_encode_update(&ctx, loginbuf, strlen(username), reinterpret_cast<const uint8_t*>(username));
1710 blen += base64_encode_update(&ctx, loginbuf+blen, strlen(request->peer_login +1), reinterpret_cast<const uint8_t*>(request->peer_login +1));
1711 blen += base64_encode_final(&ctx, loginbuf+blen);
1712 httpHeaderPutStrf(hdr_out, header, "Basic %.*s", (int)blen, loginbuf);
1713 return;
1714 }
1715
1716 /* external_acl provided credentials */
1717 if (request->extacl_user.size() && request->extacl_passwd.size() &&
1718 (strcmp(request->peer_login, "PASS") == 0 ||
1719 strcmp(request->peer_login, "PROXYPASS") == 0)) {
1720
1721 blen = base64_encode_update(&ctx, loginbuf, request->extacl_user.size(), reinterpret_cast<const uint8_t*>(request->extacl_user.rawBuf()));
1722 blen += base64_encode_update(&ctx, loginbuf+blen, 1, reinterpret_cast<const uint8_t*>(":"));
1723 blen += base64_encode_update(&ctx, loginbuf+blen, request->extacl_passwd.size(), reinterpret_cast<const uint8_t*>(request->extacl_passwd.rawBuf()));
1724 blen += base64_encode_final(&ctx, loginbuf+blen);
1725 httpHeaderPutStrf(hdr_out, header, "Basic %.*s", (int)blen, loginbuf);
1726 return;
1727 }
1728 // if no external user credentials are available to fake authentication with, PASS acts like PASSTHRU
1729 if (strcmp(request->peer_login, "PASS") == 0)
1730 return;
1731
1732 /* Kerberos login to peer */
1733 #if HAVE_AUTH_MODULE_NEGOTIATE && HAVE_KRB5 && HAVE_GSSAPI
1734 if (strncmp(request->peer_login, "NEGOTIATE",strlen("NEGOTIATE")) == 0) {
1735 char *Token=NULL;
1736 char *PrincipalName=NULL,*p;
1737 if ((p=strchr(request->peer_login,':')) != NULL ) {
1738 PrincipalName=++p;
1739 }
1740 Token = peer_proxy_negotiate_auth(PrincipalName, request->peer_host);
1741 if (Token) {
1742 httpHeaderPutStrf(hdr_out, header, "Negotiate %s",Token);
1743 }
1744 return;
1745 }
1746 #endif /* HAVE_KRB5 && HAVE_GSSAPI */
1747
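/* default: forward the configured peer_login string itself as Basic credentials */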
1748 blen = base64_encode_update(&ctx, loginbuf, strlen(request->peer_login), reinterpret_cast<const uint8_t*>(request->peer_login));
1749 blen += base64_encode_final(&ctx, loginbuf+blen);
1750 httpHeaderPutStrf(hdr_out, header, "Basic %.*s", (int)blen, loginbuf);
1751 return;
1752 }
1753
1754 /*
1755 * build request headers and append them to a given MemBuf
1756 * used by buildRequestPrefix()
1757 * note: initialises the HttpHeader; the caller is responsible for Clean()-ing it
1758 */
1759 void
1760 HttpStateData::httpBuildRequestHeader(HttpRequest * request,
1761 StoreEntry * entry,
1762 const AccessLogEntryPointer &al,
1763 HttpHeader * hdr_out,
1764 const HttpStateFlags &flags)
1765 {
1766 /* building buffer for complex strings */
1767 #define BBUF_SZ (MAX_URL+32)
1768 LOCAL_ARRAY(char, bbuf, BBUF_SZ);
1769 LOCAL_ARRAY(char, ntoabuf, MAX_IPSTRLEN);
1770 const HttpHeader *hdr_in = &request->header;
1771 const HttpHeaderEntry *e = NULL;
1772 HttpHeaderPos pos = HttpHeaderInitPos;
1773 assert (hdr_out->owner == hoRequest);
1774
1775 /* use our IMS header if the cached entry has Last-Modified time */
1776 if (request->lastmod > -1)
1777 hdr_out->putTime(HDR_IF_MODIFIED_SINCE, request->lastmod);
1778
1779 // Add our own If-None-Match field if the cached entry has a strong ETag.
1780 // copyOneHeaderFromClientsideRequestToUpstreamRequest() adds client ones.
1781 if (request->etag.size() > 0) {
1782 hdr_out->addEntry(new HttpHeaderEntry(HDR_IF_NONE_MATCH, NULL,
1783 request->etag.termedBuf()));
1784 }
1785
1786 bool we_do_ranges = decideIfWeDoRanges (request);
1787
1788 String strConnection (hdr_in->getList(HDR_CONNECTION));
1789
1790 while ((e = hdr_in->getEntry(&pos)))
1791 copyOneHeaderFromClientsideRequestToUpstreamRequest(e, strConnection, request, hdr_out, we_do_ranges, flags);
1792
1793 /* Abstraction break: We should interpret multipart/byterange responses
1794 * into offset-length data, and this works around our inability to do so.
1795 */
1796 if (!we_do_ranges && request->multipartRangeRequest()) {
1797 /* don't cache the result */
1798 request->flags.cachable = false;
1799 /* pretend it's not a range request */
1800 request->ignoreRange("want to request the whole object");
1801 request->flags.isRanged = false;
1802 }
1803
1804 /* append Via */
1805 if (Config.onoff.via) {
1806 String strVia;
1807 strVia = hdr_in->getList(HDR_VIA);
1808 snprintf(bbuf, BBUF_SZ, "%d.%d %s",
1809 request->http_ver.major,
1810 request->http_ver.minor, ThisCache);
1811 strListAdd(&strVia, bbuf, ',');
1812 hdr_out->putStr(HDR_VIA, strVia.termedBuf());
1813 strVia.clean();
1814 }
1815
1816 if (request->flags.accelerated) {
1817 /* Append Surrogate-Capabilities */
1818 String strSurrogate(hdr_in->getList(HDR_SURROGATE_CAPABILITY));
1819 #if USE_SQUID_ESI
1820 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0 ESI/1.0\"", Config.Accel.surrogate_id);
1821 #else
1822 snprintf(bbuf, BBUF_SZ, "%s=\"Surrogate/1.0\"", Config.Accel.surrogate_id);
1823 #endif
1824 strListAdd(&strSurrogate, bbuf, ',');
1825 hdr_out->putStr(HDR_SURROGATE_CAPABILITY, strSurrogate.termedBuf());
1826 }
1827
1828 /** \pre Handle X-Forwarded-For */
1829 if (strcmp(opt_forwarded_for, "delete") != 0) {
1830
1831 String strFwd = hdr_in->getList(HDR_X_FORWARDED_FOR);
1832
1833 if (strFwd.size() > 65536/2) {
1834 // There is probably a forwarding loop with Via detection disabled.
1835 // If we do nothing, String will assert on overflow soon.
1836 // TODO: Terminate all transactions with huge XFF?
1837 strFwd = "error";
1838
1839 static int warnedCount = 0;
1840 if (warnedCount++ < 100) {
1841 const char *url = entry ? entry->url() : urlCanonical(request);
1842 debugs(11, DBG_IMPORTANT, "Warning: likely forwarding loop with " << url);
1843 }
1844 }
1845
1846 if (strcmp(opt_forwarded_for, "on") == 0) {
1847 /** If set to ON - append client IP or 'unknown'. */
1848 if ( request->client_addr.isNoAddr() )
1849 strListAdd(&strFwd, "unknown", ',');
1850 else
1851 strListAdd(&strFwd, request->client_addr.toStr(ntoabuf, MAX_IPSTRLEN), ',');
1852 } else if (strcmp(opt_forwarded_for, "off") == 0) {
1853 /** If set to OFF - append 'unknown'. */
1854 strListAdd(&strFwd, "unknown", ',');
1855 } else if (strcmp(opt_forwarded_for, "transparent") == 0) {
1856 /** If set to TRANSPARENT - pass through unchanged. */
1857 } else if (strcmp(opt_forwarded_for, "truncate") == 0) {
1858 /** If set to TRUNCATE - drop existing list and replace with client IP or 'unknown'. */
1859 if ( request->client_addr.isNoAddr() )
1860 strFwd = "unknown";
1861 else
1862 strFwd = request->client_addr.toStr(ntoabuf, MAX_IPSTRLEN);
1863 }
1864 if (strFwd.size() > 0)
1865 hdr_out->putStr(HDR_X_FORWARDED_FOR, strFwd.termedBuf());
1866 }
1867 /** If set to DELETE - do not copy through. */
1868
1869 /* append Host if not there already */
1870 if (!hdr_out->has(HDR_HOST)) {
1871 if (request->peer_domain) {
1872 hdr_out->putStr(HDR_HOST, request->peer_domain);
1873 } else if (request->port == urlDefaultPort(request->url.getScheme())) {
1874 /* use port# only if not default */
1875 hdr_out->putStr(HDR_HOST, request->GetHost());
1876 } else {
1877 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
1878 request->GetHost(),
1879 (int) request->port);
1880 }
1881 }
1882
1883 /* append Authorization if credentials are in the URL, not already in the header, and we are going direct */
1884 if (!hdr_out->has(HDR_AUTHORIZATION)) {
1885 if (!request->flags.proxying && !request->url.userInfo().isEmpty()) {
1886 static uint8_t result[base64_encode_len(MAX_URL*2)]; // should be big enough for a single URI segment
1887 struct base64_encode_ctx ctx;
1888 base64_encode_init(&ctx);
1889 size_t blen = base64_encode_update(&ctx, result, request->url.userInfo().length(), reinterpret_cast<const uint8_t*>(request->url.userInfo().rawContent()));
1890 blen += base64_encode_final(&ctx, result+blen);
1891 result[blen] = '\0';
1892 if (blen)
1893 httpHeaderPutStrf(hdr_out, HDR_AUTHORIZATION, "Basic %.*s", (int)blen, result);
1894 }
1895 }
1896
1897 /* Fixup (Proxy-)Authorization special cases. Plain relaying dealt with above */
1898 httpFixupAuthentication(request, hdr_in, hdr_out, flags);
1899
1900 /* append Cache-Control, add max-age if not there already */
1901 {
1902 HttpHdrCc *cc = hdr_in->getCc();
1903
1904 if (!cc)
1905 cc = new HttpHdrCc();
1906
1907 #if 0 /* see bug 2330 */
1908 /* Set no-cache if determined needed but not found */
1909 if (request->flags.nocache)
1910 EBIT_SET(cc->mask, CC_NO_CACHE);
1911 #endif
1912
1913 /* Add max-age only if neither max-age nor no-cache is already present */
1914 if (!cc->hasMaxAge() && !cc->hasNoCache()) {
1915 const char *url =
1916 entry ? entry->url() : urlCanonical(request);
1917 cc->maxAge(getMaxAge(url));
1918
1919 }
1920
1921 /* Enforce sibling relations */
1922 if (flags.only_if_cached)
1923 cc->onlyIfCached(true);
1924
1925 hdr_out->putCc(cc);
1926
1927 delete cc;
1928 }
1929
1930 /* maybe append Connection: keep-alive */
1931 if (flags.keepalive) {
1932 hdr_out->putStr(HDR_CONNECTION, "keep-alive");
1933 }
1934
1935 /* append Front-End-Https */
1936 if (flags.front_end_https) {
1937 if (flags.front_end_https == 1 || request->url.getScheme() == AnyP::PROTO_HTTPS)
1938 hdr_out->putStr(HDR_FRONT_END_HTTPS, "On");
1939 }
1940
1941 if (flags.chunked_request) {
1942 // Do not just copy the original value, so that this code remains
1943 // valid if the client side starts decoding other encodings.
1944 hdr_out->putStr(HDR_TRANSFER_ENCODING, "chunked");
1945 }
1946
1947 /* Now mangle the headers. */
1948 if (Config2.onoff.mangle_request_headers)
1949 httpHdrMangleList(hdr_out, request, ROR_REQUEST);
1950
1951 if (Config.request_header_add && !Config.request_header_add->empty())
1952 httpHdrAdd(hdr_out, request, al, *Config.request_header_add);
1953
1954 strConnection.clean();
1955 }
1956
1957 /**
1958 * Decides whether a particular header may be cloned from the received client's request
1959 * to our outgoing fetch request.
1960 */
1961 void
1962 copyOneHeaderFromClientsideRequestToUpstreamRequest(const HttpHeaderEntry *e, const String strConnection, const HttpRequest * request, HttpHeader * hdr_out, const int we_do_ranges, const HttpStateFlags &flags)
1963 {
1964 debugs(11, 5, "httpBuildRequestHeader: " << e->name << ": " << e->value );
1965
1966 switch (e->id) {
1967
1968 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid should not pass on. */
1969
1970 case HDR_PROXY_AUTHORIZATION:
1971 /** \par Proxy-Authorization:
1972 * Only pass on proxy authentication to peers for which
1973 * authentication forwarding is explicitly enabled
1974 */
1975 if (!flags.originpeer && flags.proxying && request->peer_login &&
1976 (strcmp(request->peer_login, "PASS") == 0 ||
1977 strcmp(request->peer_login, "PROXYPASS") == 0 ||
1978 strcmp(request->peer_login, "PASSTHRU") == 0)) {
1979 hdr_out->addEntry(e->clone());
1980 }
1981 break;
1982
1983 /** \par RFC 2616 sect 13.5.1 - Hop-by-Hop headers which Squid does not pass on. */
1984
1985 case HDR_CONNECTION: /** \par Connection: */
1986 case HDR_TE: /** \par TE: */
1987 case HDR_KEEP_ALIVE: /** \par Keep-Alive: */
1988 case HDR_PROXY_AUTHENTICATE: /** \par Proxy-Authenticate: */
1989 case HDR_TRAILER: /** \par Trailer: */
1990 case HDR_UPGRADE: /** \par Upgrade: */
1991 case HDR_TRANSFER_ENCODING: /** \par Transfer-Encoding: */
1992 break;
1993
1994 /** \par OTHER headers I haven't bothered to track down yet. */
1995
1996 case HDR_AUTHORIZATION:
1997 /** \par Authorization:
1998 * Pass on WWW authentication */
1999
2000 if (!flags.originpeer) {
2001 hdr_out->addEntry(e->clone());
2002 } else {
2003 /** \note In accelerators, only forward authentication if enabled
2004 * (see also httpFixupAuthentication for special cases)
2005 */
2006 if (request->peer_login &&
2007 (strcmp(request->peer_login, "PASS") == 0 ||
2008 strcmp(request->peer_login, "PASSTHRU") == 0 ||
2009 strcmp(request->peer_login, "PROXYPASS") == 0)) {
2010 hdr_out->addEntry(e->clone());
2011 }
2012 }
2013
2014 break;
2015
2016 case HDR_HOST:
2017 /** \par Host:
2018 * Normally Squid rewrites the Host: header.
2019 * However, there is one case when we don't: If the URL
2020 * went through our redirector and the admin configured
2021 * 'redir_rewrites_host' to be off.
2022 */
2023 if (request->peer_domain)
2024 hdr_out->putStr(HDR_HOST, request->peer_domain);
2025 else if (request->flags.redirected && !Config.onoff.redir_rewrites_host)
2026 hdr_out->addEntry(e->clone());
2027 else {
2028 /* use port# only if not default */
2029
2030 if (request->port == urlDefaultPort(request->url.getScheme())) {
2031 hdr_out->putStr(HDR_HOST, request->GetHost());
2032 } else {
2033 httpHeaderPutStrf(hdr_out, HDR_HOST, "%s:%d",
2034 request->GetHost(),
2035 (int) request->port);
2036 }
2037 }
2038
2039 break;
2040
2041 case HDR_IF_MODIFIED_SINCE:
2042 /** \par If-Modified-Since:
2043 * append unless we added our own,
2044 * but only if cache_miss_revalidate is enabled, or
2045 * the request is not cacheable, or
2046 * the request contains authentication credentials.
2047 * \note at most one client's If-Modified-Since header can pass through
2048 */
2049 // XXX: need to check and cleanup the auth case so cacheable auth requests get cached.
2050 if (hdr_out->has(HDR_IF_MODIFIED_SINCE))
2051 break;
2052 else if (Config.onoff.cache_miss_revalidate || !request->flags.cachable || request->flags.auth)
2053 hdr_out->addEntry(e->clone());
2054 break;
2055
2056 case HDR_IF_NONE_MATCH:
2057 /** \par If-None-Match:
2058 * append if the wildcard '*' special case value is present, or
2059 * cache_miss_revalidate is disabled, or
2060 * the request is not cacheable in this proxy, or
2061 * the request contains authentication credentials.
2062 * \note this header lists a set of responses for the server to elide sending. Squid added values are extending that set.
2063 */
2064 // XXX: need to check and cleanup the auth case so cacheable auth requests get cached.
2065 if (hdr_out->hasListMember(HDR_IF_MATCH, "*", ',') || Config.onoff.cache_miss_revalidate || !request->flags.cachable || request->flags.auth)
2066 hdr_out->addEntry(e->clone());
2067 break;
2068
2069 case HDR_MAX_FORWARDS:
2070 /** \par Max-Forwards:
2071 * pass only on TRACE or OPTIONS requests */
2072 if (request->method == Http::METHOD_TRACE || request->method == Http::METHOD_OPTIONS) {
2073 const int64_t hops = e->getInt64();
2074
2075 if (hops > 0)
2076 hdr_out->putInt64(HDR_MAX_FORWARDS, hops - 1);
2077 }
2078
2079 break;
2080
2081 case HDR_VIA:
2082 /** \par Via:
2083 * If Via is disabled then forward any received header as-is.
2084 * Otherwise leave it out here; an updated Via is appended explicitly later. */
2085
2086 if (!Config.onoff.via)
2087 hdr_out->addEntry(e->clone());
2088
2089 break;
2090
2091 case HDR_RANGE:
2092
2093 case HDR_IF_RANGE:
2094
2095 case HDR_REQUEST_RANGE:
2096 /** \par Range:, If-Range:, Request-Range:
2097 * Only pass through when we are not handling the ranges ourselves */
2098 if (!we_do_ranges)
2099 hdr_out->addEntry(e->clone());
2100
2101 break;
2102
2103 case HDR_PROXY_CONNECTION: // SHOULD ignore. But doing so breaks things.
2104 break;
2105
2106 case HDR_CONTENT_LENGTH:
2107 // pass through unless we chunk; also, keeping this away from default
2108 // prevents request smuggling via Connection: Content-Length tricks
2109 if (!flags.chunked_request)
2110 hdr_out->addEntry(e->clone());
2111 break;
2112
2113 case HDR_X_FORWARDED_FOR:
2114
2115 case HDR_CACHE_CONTROL:
2116 /** \par X-Forwarded-For:, Cache-Control:
2117 * handled specially by Squid, so leave off for now.
2118 * append these after the loop if needed */
2119 break;
2120
2121 case HDR_FRONT_END_HTTPS:
2122 /** \par Front-End-Https:
2123 * Pass thru only if peer is configured with front-end-https */
2124 if (!flags.front_end_https)
2125 hdr_out->addEntry(e->clone());
2126
2127 break;
2128
2129 default:
2130 /** \par default.
2131 * pass on all other header fields
2132 * which are NOT listed by the special Connection: header. */
2133
2134 if (strConnection.size()>0 && strListIsMember(&strConnection, e->name.termedBuf(), ',')) {
2135 debugs(11, 2, "'" << e->name << "' header cropped by Connection: definition");
2136 return;
2137 }
2138
2139 hdr_out->addEntry(e->clone());
2140 }
2141 }
2142
2143 bool
2144 HttpStateData::decideIfWeDoRanges (HttpRequest * request)
2145 {
2146 bool result = true;
2147 /* decide if we want to do Ranges ourselves
2148 * (and fetch the whole object now)
2149 * We want to handle Ranges ourselves iff
2150 * - we can actually parse client Range specs
2151 * - the specs are expected to be simple enough (e.g. no out-of-order ranges)
2152 * - reply will be cachable
2153 * (If the reply will be uncachable we have to throw it away after
2154 * serving this request, so it is better to forward ranges to
2155 * the server and fetch only the requested content)
2156 */
2157
2158 int64_t roffLimit = request->getRangeOffsetLimit();
2159
2160 if (NULL == request->range || !request->flags.cachable
2161 || request->range->offsetLimitExceeded(roffLimit) || request->flags.connectionAuth)
2162 result = false;
2163
2164 debugs(11, 8, "decideIfWeDoRanges: range specs: " <<
2165 request->range << ", cachable: " <<
2166 request->flags.cachable << "; we_do_ranges: " << result);
2167
2168 return result;
2169 }
2170
2171 /* build request prefix and append it to a given MemBuf;
2172 * return the length of the prefix */
2173 mb_size_t
2174 HttpStateData::buildRequestPrefix(MemBuf * mb)
2175 {
2176 const int offset = mb->size;
2177 /* Uses a local httpver variable to print the HTTP label
2178 * since the HttpRequest may have an older version label.
2179 * XXX: This could create protocol bugs as the headers sent and
2180 * flow control should all be based on the HttpRequest version
2181 * not the one we are sending. Needs checking.
2182 */
2183 const AnyP::ProtocolVersion httpver = Http::ProtocolVersion();
2184 const char * url;
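/* send the absolute URL when relaying through a (non-originserver) peer; otherwise send only the URL path */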
2185 if (_peer && !_peer->options.originserver)
2186 url = urlCanonical(request);
2187 else
2188 url = request->urlpath.termedBuf();
2189 mb->Printf(SQUIDSBUFPH " %s %s/%d.%d\r\n",
2190 SQUIDSBUFPRINT(request->method.image()),
2191 url && *url ? url : "/",
2192 AnyP::ProtocolType_str[httpver.protocol],
2193 httpver.major,httpver.minor);
2194 /* build and pack headers */
2195 {
2196 HttpHeader hdr(hoRequest);
2197 Packer p;
2198 httpBuildRequestHeader(request, entry, fwd->al, &hdr, flags);
2199
2200 if (request->flags.pinned && request->flags.connectionAuth)
2201 request->flags.authSent = true;
2202 else if (hdr.has(HDR_AUTHORIZATION))
2203 request->flags.authSent = true;
2204
2205 packerToMemInit(&p, mb);
2206 hdr.packInto(&p);
2207 hdr.clean();
2208 }
2209 /* append header terminator */
2210 mb->append(crlf, 2);
2211 return mb->size - offset;
2212 }
2213
2214 /* This will be called when connect completes. Write request. */
2215 bool
2216 HttpStateData::sendRequest()
2217 {
2218 MemBuf mb;
2219
2220 debugs(11, 5, HERE << serverConnection << ", request " << request << ", this " << this << ".");
2221
2222 if (!Comm::IsConnOpen(serverConnection)) {
2223 debugs(11,3, HERE << "cannot send request to closing " << serverConnection);
2224 assert(closeHandler != NULL);
2225 return false;
2226 }
2227
2228 typedef CommCbMemFunT<HttpStateData, CommTimeoutCbParams> TimeoutDialer;
2229 AsyncCall::Pointer timeoutCall = JobCallback(11, 5,
2230 TimeoutDialer, this, HttpStateData::httpTimeout);
2231 commSetConnTimeout(serverConnection, Config.Timeout.lifetime, timeoutCall);
2232 flags.do_next_read = true;
2233 maybeReadVirginBody();
2234
2235 if (request->body_pipe != NULL) {
2236 if (!startRequestBodyFlow()) // register to receive body data
2237 return false;
2238 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2239 requestSender = JobCallback(11,5,
2240 Dialer, this, HttpStateData::sentRequestBody);
2241
2242 Must(!flags.chunked_request);
2243 // use chunked encoding if we do not know the length
2244 if (request->content_length < 0)
2245 flags.chunked_request = true;
2246 } else {
2247 assert(!requestBodySource);
2248 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2249 requestSender = JobCallback(11,5,
2250 Dialer, this, HttpStateData::wroteLast);
2251 }
2252
2253 flags.originpeer = (_peer != NULL && _peer->options.originserver);
2254 flags.proxying = (_peer != NULL && !flags.originpeer);
2255
2256 /*
2257 * Is keep-alive okay for all request methods?
2258 */
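// Heuristic: once a peer has been sent at least 10 keep-alive requests,
// keep using persistent connections only if it honoured more than half of them.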
2259 if (request->flags.mustKeepalive)
2260 flags.keepalive = true;
2261 else if (request->flags.pinned)
2262 flags.keepalive = request->persistent();
2263 else if (!Config.onoff.server_pconns)
2264 flags.keepalive = false;
2265 else if (_peer == NULL)
2266 flags.keepalive = true;
2267 else if (_peer->stats.n_keepalives_sent < 10)
2268 flags.keepalive = true;
2269 else if ((double) _peer->stats.n_keepalives_recv /
2270 (double) _peer->stats.n_keepalives_sent > 0.50)
2271 flags.keepalive = true;
2272
2273 if (_peer) {
2274 /* The old code here was
2275 if (neighborType(_peer, request) == PEER_SIBLING && ...
2276 which is equivalent to:
2277 if (neighborType(_peer, NULL) == PEER_SIBLING && ...
2278 or better:
2279 if (((_peer->type == PEER_MULTICAST && p->options.mcast_siblings) ||
2280 _peer->type == PEER_SIBLINGS ) && _peer->options.allow_miss)
2281 flags.only_if_cached = 1;
2282
2283 But I suppose it was a bug
2284 */
2285 if (neighborType(_peer, request) == PEER_SIBLING &&
2286 !_peer->options.allow_miss)
2287 flags.only_if_cached = true;
2288
2289 flags.front_end_https = _peer->front_end_https;
2290 }
2291
2292 mb.init();
2293 request->peer_host=_peer?_peer->host:NULL;
2294 buildRequestPrefix(&mb);
2295
2296 debugs(11, 2, "HTTP Server " << serverConnection);
2297 debugs(11, 2, "HTTP Server REQUEST:\n---------\n" << mb.buf << "\n----------");
2298
2299 Comm::Write(serverConnection, &mb, requestSender);
2300 return true;
2301 }
2302
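/// overrides Client::getMoreRequestBody(): when chunked_request is set, wraps the
/// available body bytes in an HTTP/1.1 chunk and appends the last-chunk once the
/// whole request body has been received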
2303 bool
2304 HttpStateData::getMoreRequestBody(MemBuf &buf)
2305 {
2306 // parent's implementation can handle the no-encoding case
2307 if (!flags.chunked_request)
2308 return Client::getMoreRequestBody(buf);
2309
2310 MemBuf raw;
2311
2312 Must(requestBodySource != NULL);
2313 if (!requestBodySource->getMoreData(raw))
2314 return false; // no request body bytes to chunk yet
2315
2316 // optimization: pre-allocate buffer size that should be enough
2317 const mb_size_t rawDataSize = raw.contentSize();
2318 // we may need to send: hex-chunk-size CRLF raw-data CRLF last-chunk
2319 buf.init(16 + 2 + rawDataSize + 2 + 5, raw.max_capacity);
2320
2321 buf.Printf("%x\r\n", static_cast<unsigned int>(rawDataSize));
2322 buf.append(raw.content(), rawDataSize);
2323 buf.Printf("\r\n");
2324
2325 Must(rawDataSize > 0); // we did not accidentally create a last-chunk above
2326
2327 // Do not send last-chunk unless we successfully received everything
2328 if (receivedWholeRequestBody) {
2329 Must(!flags.sentLastChunk);
2330 flags.sentLastChunk = true;
2331 buf.append("0\r\n\r\n", 5);
2332 }
2333
2334 return true;
2335 }
2336
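/// starts the HTTP forwarding job for the request described by the given FwdState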
2337 void
2338 httpStart(FwdState *fwd)
2339 {
2340 debugs(11, 3, fwd->request->method << ' ' << fwd->entry->url());
2341 AsyncJob::Start(new HttpStateData(fwd));
2342 }
2343
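/// AsyncJob API: write the request (or give up) and count the server-side transaction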
2344 void
2345 HttpStateData::start()
2346 {
2347 if (!sendRequest()) {
2348 debugs(11, 3, "httpStart: aborted");
2349 mustStop("HttpStateData::start failed");
2350 return;
2351 }
2352
2353 ++ statCounter.server.all.requests;
2354 ++ statCounter.server.http.requests;
2355
2356 /*
2357 * We used to set the read timeout here, but not any more.
2358 * Now it's set in httpSendComplete() after the full request,
2359 * including request body, has been written to the server.
2360 */
2361 }
2362
2363 /// if broken posts are enabled for the request, try to fix and return true
2364 bool
2365 HttpStateData::finishingBrokenPost()
2366 {
2367 #if USE_HTTP_VIOLATIONS
2368 if (!Config.accessList.brokenPosts) {
2369 debugs(11, 5, HERE << "No brokenPosts list");
2370 return false;
2371 }
2372
2373 ACLFilledChecklist ch(Config.accessList.brokenPosts, originalRequest(), NULL);
2374 if (ch.fastCheck() != ACCESS_ALLOWED) {
2375 debugs(11, 5, HERE << "didn't match brokenPosts");
2376 return false;
2377 }
2378
2379 if (!Comm::IsConnOpen(serverConnection)) {
2380 debugs(11, 3, HERE << "ignoring broken POST for closed " << serverConnection);
2381 assert(closeHandler != NULL);
2382 return true; // prevent caller from proceeding as if nothing happened
2383 }
2384
2385 debugs(11, 3, "finishingBrokenPost: fixing broken POST");
2386 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2387 requestSender = JobCallback(11,5,
2388 Dialer, this, HttpStateData::wroteLast);
2389 Comm::Write(serverConnection, "\r\n", 2, requestSender, NULL);
2390 return true;
2391 #else
2392 return false;
2393 #endif /* USE_HTTP_VIOLATIONS */
2394 }
2395
2396 /// if needed, write last-chunk to end the request body and return true
2397 bool
2398 HttpStateData::finishingChunkedRequest()
2399 {
2400 if (flags.sentLastChunk) {
2401 debugs(11, 5, HERE << "already sent last-chunk");
2402 return false;
2403 }
2404
2405 Must(receivedWholeRequestBody); // or we should not be sending last-chunk
2406 flags.sentLastChunk = true;
2407
2408 typedef CommCbMemFunT<HttpStateData, CommIoCbParams> Dialer;
2409 requestSender = JobCallback(11,5, Dialer, this, HttpStateData::wroteLast);
2410 Comm::Write(serverConnection, "0\r\n\r\n", 5, requestSender, NULL);
2411 return true;
2412 }
2413
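/// finishes the request after the last body byte has been sent: writes a trailing
/// last-chunk or broken-POST CRLF if needed, then signals completion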
2414 void
2415 HttpStateData::doneSendingRequestBody()
2416 {
2417 Client::doneSendingRequestBody();
2418 debugs(11,5, HERE << serverConnection);
2419
2420 // do we need to write something after the last body byte?
2421 if (flags.chunked_request && finishingChunkedRequest())
2422 return;
2423 if (!flags.chunked_request && finishingBrokenPost())
2424 return;
2425
2426 sendComplete();
2427 }
2428
2429 // more origin request body data is available
2430 void
2431 HttpStateData::handleMoreRequestBodyAvailable()
2432 {
2433 if (eof || !Comm::IsConnOpen(serverConnection)) {
2434 // XXX: we should check this condition in other callbacks then!
2435 // TODO: Check whether this can actually happen: We should unsubscribe
2436 // as a body consumer when the above condition(s) are detected.
2437 debugs(11, DBG_IMPORTANT, HERE << "Transaction aborted while reading HTTP body");
2438 return;
2439 }
2440
2441 assert(requestBodySource != NULL);
2442
2443 if (requestBodySource->buf().hasContent()) {
2444 // XXX: why doesn't this trigger a debug message on every request?
2445
2446 if (flags.headers_parsed && !flags.abuse_detected) {
2447 flags.abuse_detected = true;
2448 debugs(11, DBG_IMPORTANT, "http handleMoreRequestBodyAvailable: Likely proxy abuse detected '" << request->client_addr << "' -> '" << entry->url() << "'" );
2449
2450 if (virginReply()->sline.status() == Http::scInvalidHeader) {
2451 serverConnection->close();
2452 return;
2453 }
2454 }
2455 }
2456
2457 Client::handleMoreRequestBodyAvailable(); // delegate to the parent implementation
2458 }
2459
2460 // premature end of the request body
2461 void
2462 HttpStateData::handleRequestBodyProducerAborted()
2463 {
2464 Client::handleRequestBodyProducerAborted();
2465 if (entry->isEmpty()) {
2466 debugs(11, 3, "request body aborted: " << serverConnection);
2467 // We usually get here when ICAP REQMOD aborts during body processing.
2468 // We might also get here if client-side aborts, but then our response
2469 // should not matter because either client-side will provide its own or
2470 // there will be no response at all (e.g., if the client has left).
2471 ErrorState *err = new ErrorState(ERR_ICAP_FAILURE, Http::scInternalServerError, fwd->request);
2472 err->detailError(ERR_DETAIL_SRV_REQMOD_REQ_BODY);
2473 fwd->fail(err);
2474 }
2475
2476 abortTransaction("request body producer aborted");
2477 }
2478
2479 // called when we wrote request headers(!) or a part of the body
2480 void
2481 HttpStateData::sentRequestBody(const CommIoCbParams &io)
2482 {
2483 if (io.size > 0)
2484 kb_incr(&statCounter.server.http.kbytes_out, io.size);
2485
2486 Client::sentRequestBody(io);
2487 }
2488
2489 // Quickly abort the transaction
2490 // TODO: destruction should be sufficient as the destructor should clean up,
2491 // including canceling close handlers
2492 void
2493 HttpStateData::abortTransaction(const char *reason)
2494 {
2495 debugs(11,5, HERE << "aborting transaction for " << reason <<
2496 "; " << serverConnection << ", this " << this);
2497
2498 if (Comm::IsConnOpen(serverConnection)) {
2499 serverConnection->close();
2500 return;
2501 }
2502
2503 fwd->handleUnregisteredServerEnd();
2504 mustStop("HttpStateData::abortTransaction");
2505 }
2506