]> git.ipfire.org Git - thirdparty/squid.git/blob - src/HttpHdrRange.cc
Add string API layer for better string handling.
[thirdparty/squid.git] / src / HttpHdrRange.cc
1
2 /*
3 * $Id: HttpHdrRange.cc,v 1.43 2007/05/18 06:41:22 amosjeffries Exp $
4 *
5 * DEBUG: section 64 HTTP Range Header
6 * AUTHOR: Alex Rousskov
7 *
8 * SQUID Web Proxy Cache http://www.squid-cache.org/
9 * ----------------------------------------------------------
10 *
11 * Squid is the result of efforts by numerous individuals from
12 * the Internet community; see the CONTRIBUTORS file for full
13 * details. Many organizations have provided support for Squid's
14 * development; see the SPONSORS file for full details. Squid is
15 * Copyrighted (C) 2001 by the Regents of the University of
16 * California; see the COPYRIGHT file for full details. Squid
17 * incorporates software developed and/or copyrighted by other
18 * sources; see the CREDITS file for full details.
19 *
20 * This program is free software; you can redistribute it and/or modify
21 * it under the terms of the GNU General Public License as published by
22 * the Free Software Foundation; either version 2 of the License, or
23 * (at your option) any later version.
24 *
25 * This program is distributed in the hope that it will be useful,
26 * but WITHOUT ANY WARRANTY; without even the implied warranty of
27 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
28 * GNU General Public License for more details.
29 *
30 * You should have received a copy of the GNU General Public License
31 * along with this program; if not, write to the Free Software
32 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111, USA.
33 *
34 */
35
36 #include "squid.h"
37 #include "Store.h"
38 #include "HttpHeaderRange.h"
39 #include "client_side_request.h"
40 #include "HttpReply.h"
41
42 /*
43 * Currently only byte ranges are supported
44 *
45 * Essentially, there are three types of byte ranges:
46 *
47 * 1) first-byte-pos "-" last-byte-pos // range
48 * 2) first-byte-pos "-" // trailer
49 * 3) "-" suffix-length // suffix (last length bytes)
50 *
51 *
52 * When Range field is parsed, we have no clue about the content
53 * length of the document. Thus, we simply code an "absent" part
54 * using HttpHdrRangeSpec::UnknownPosition constant.
55 *
56 * Note: when response length becomes known, we convert any range
57 * spec into type one above. (Canonization process).
58 */
59
60
/* local routines */

/* true when the position or length value s has been set, i.e. when it is
 * greater than the HttpHdrRangeSpec::UnknownPosition sentinel */
#define known_spec(s) ((s) > HttpHdrRangeSpec::UnknownPosition)

/* globals */

/* incremented once per HttpHdrRange::parseInit() call */
size_t HttpHdrRange::ParsedCount = 0;
/* sentinel stored in offset/length for a part that is absent from the spec */
ssize_t const HttpHdrRangeSpec::UnknownPosition = -1;
67
68 /*
69 * Range-Spec
70 */
71
72 HttpHdrRangeSpec::HttpHdrRangeSpec() : offset(UnknownPosition), length(UnknownPosition){}
73
74 /* parses range-spec and returns new object on success */
75 HttpHdrRangeSpec *
76 HttpHdrRangeSpec::Create(const char *field, int flen)
77 {
78 HttpHdrRangeSpec spec;
79
80 if (!spec.parseInit(field, flen))
81 return NULL;
82
83 return new HttpHdrRangeSpec(spec);
84 }
85
86 bool
87 HttpHdrRangeSpec::parseInit(const char *field, int flen)
88 {
89 const char *p;
90
91 if (flen < 2)
92 return false;
93
94 /* is it a suffix-byte-range-spec ? */
95 if (*field == '-') {
96 if (!httpHeaderParseSize(field + 1, &length))
97 return false;
98 } else
99 /* must have a '-' somewhere in _this_ field */
100 if (!((p = strchr(field, '-')) || (p - field >= flen))) {
101 debugs(64, 2, "ignoring invalid (missing '-') range-spec near: '" << field << "'");
102 return false;
103 } else {
104 if (!httpHeaderParseSize(field, &offset))
105 return false;
106
107 p++;
108
109 /* do we have last-pos ? */
110 if (p - field < flen) {
111 ssize_t last_pos;
112
113 if (!httpHeaderParseSize(p, &last_pos))
114 return false;
115
116 HttpHdrRangeSpec::HttpRange aSpec (offset, last_pos + 1);
117
118 length = aSpec.size();
119 }
120 }
121
122 /* we managed to parse, check if the result makes sence */
123 if (length == 0) {
124 debugs(64, 2, "ignoring invalid (zero length) range-spec near: '" << field << "'");
125 return false;
126 }
127
128 return true;
129 }
130
131 void
132 HttpHdrRangeSpec::packInto(Packer * packer) const
133 {
134 if (!known_spec(offset)) /* suffix */
135 packerPrintf(packer, "-%ld", (long int) length);
136 else if (!known_spec(length)) /* trailer */
137 packerPrintf(packer, "%ld-", (long int) offset);
138 else /* range */
139 packerPrintf(packer, "%ld-%ld",
140 (long int) offset, (long int) offset + length - 1);
141 }
142
143 void
144 HttpHdrRangeSpec::outputInfo( char const *note) const
145 {
146 debugs(64, 5, "HttpHdrRangeSpec::canonize: " << note << ": [" <<
147 (long int) offset << ", " << (long int) offset + length <<
148 ") len: " << (long int) length);
149 }
150
151 /* fills "absent" positions in range specification based on response body size
152 * returns true if the range is still valid
153 * range is valid if its intersection with [0,length-1] is not empty
154 */
155 int
156 HttpHdrRangeSpec::canonize(size_t clen)
157 {
158 outputInfo ("have");
159 HttpRange object(0, clen);
160
161 if (!known_spec(offset)) /* suffix */
162 {
163 assert(known_spec(length));
164 offset = object.intersection(HttpRange (clen - length, clen)).start;
165 } else if (!known_spec(length)) /* trailer */
166 {
167 assert(known_spec(offset));
168 HttpRange newRange = object.intersection(HttpRange (offset, clen));
169 length = newRange.size();
170 }
171 /* we have a "range" now, adjust length if needed */
172 assert(known_spec(length));
173
174 assert(known_spec(offset));
175
176 HttpRange newRange = object.intersection (HttpRange (offset, offset + length));
177
178 length = newRange.size();
179
180 outputInfo ("done");
181
182 return length > 0;
183 }
184
185 /* merges recepient with donor if possible; returns true on success
186 * both specs must be canonized prior to merger, of course */
187 bool
188 HttpHdrRangeSpec::mergeWith(const HttpHdrRangeSpec * donor)
189 {
190 bool merged (false);
191 #if MERGING_BREAKS_NOTHING
192 /* Note: this code works, but some clients may not like its effects */
193 size_t rhs = offset + length; /* no -1 ! */
194 const size_t donor_rhs = donor->offset + donor->length; /* no -1 ! */
195 assert(known_spec(offset));
196 assert(known_spec(donor->offset));
197 assert(length > 0);
198 assert(donor->length > 0);
199 /* do we have a left hand side overlap? */
200
201 if (donor->offset < offset && offset <= donor_rhs) {
202 offset = donor->offset; /* decrease left offset */
203 merged = 1;
204 }
205
206 /* do we have a right hand side overlap? */
207 if (donor->offset <= rhs && rhs < donor_rhs) {
208 rhs = donor_rhs; /* increase right offset */
209 merged = 1;
210 }
211
212 /* adjust length if offsets have been changed */
213 if (merged) {
214 assert(rhs > offset);
215 length = rhs - offset;
216 } else {
217 /* does recepient contain donor? */
218 merged =
219 offset <= donor->offset && donor->offset < rhs;
220 }
221
222 #endif
223 return merged;
224 }
225
226 /*
227 * Range
228 */
229
230 HttpHdrRange::HttpHdrRange () : clen (HttpHdrRangeSpec::UnknownPosition)
231 {}
232
233 HttpHdrRange *
234 HttpHdrRange::ParseCreate(const string * range_spec)
235 {
236 HttpHdrRange *r = new HttpHdrRange;
237
238 if (!r->parseInit(range_spec)) {
239 delete r;
240 r = NULL;
241 }
242
243 return r;
244 }
245
246 /* returns true if ranges are valid; inits HttpHdrRange */
247 bool
248 HttpHdrRange::parseInit(const string * range_spec)
249 {
250 const char *item;
251 const char *pos = NULL;
252 int ilen;
253 int count = 0;
254 assert(this && range_spec);
255 ++ParsedCount;
256 debugs(64, 8, "parsing range field: '" << *range_spec << "'");
257 /* check range type */
258
259 if (strncasecmp(*range_spec,"bytes=", 6))
260 return 0;
261
262 /* skip "bytes="; hack! */
263 pos = range_spec->c_str() + 5;
264
265 /* iterate through comma separated list */
266 while (strListGetItem(range_spec, ',', &item, &ilen, &pos)) {
267 HttpHdrRangeSpec *spec = HttpHdrRangeSpec::Create(item, ilen);
268 /*
269 * HTTP/1.1 draft says we must ignore the whole header field if one spec
270 * is invalid. However, RFC 2068 just says that we must ignore that spec.
271 */
272
273 if (spec)
274 specs.push_back(spec);
275
276 ++count;
277 }
278
279 debugs(64, 8, "parsed range range count: " << count << ", kept " << specs.size());
280 return specs.count != 0;
281 }
282
283 HttpHdrRange::~HttpHdrRange()
284 {
285 while (specs.size())
286 delete specs.pop_back();
287 }
288
289 HttpHdrRange::HttpHdrRange(HttpHdrRange const &old) : specs()
290 {
291 specs.reserve(old.specs.size());
292
293 for (const_iterator i = old.begin(); i != old.end(); ++i)
294 specs.push_back(new HttpHdrRangeSpec ( **i));
295
296 assert(old.specs.size() == specs.size());
297 }
298
/* iterator to the first stored range spec */
HttpHdrRange::iterator
HttpHdrRange::begin()
{
    return specs.begin();
}

/* iterator one past the last stored range spec */
HttpHdrRange::iterator
HttpHdrRange::end()
{
    return specs.end();
}

/* read-only iterator to the first stored range spec */
HttpHdrRange::const_iterator
HttpHdrRange::begin() const
{
    return specs.begin();
}

/* read-only iterator one past the last stored range spec */
HttpHdrRange::const_iterator
HttpHdrRange::end() const
{
    return specs.end();
}
322
323 void
324 HttpHdrRange::packInto(Packer * packer) const
325 {
326 const_iterator pos = begin();
327 assert(this);
328
329 while (pos != end()) {
330 if (pos != begin())
331 packerAppend(packer, ",", 1);
332
333 (*pos)->packInto(packer);
334
335 ++pos;
336 }
337 }
338
339 void
340 HttpHdrRange::merge (Vector<HttpHdrRangeSpec *> &basis)
341 {
342 /* reset old array */
343 specs.clean();
344 /* merge specs:
345 * take one spec from "goods" and merge it with specs from
346 * "specs" (if any) until there is no overlap */
347 iterator i = basis.begin();
348
349 while (i != basis.end()) {
350 if (specs.size() && (*i)->mergeWith(specs.back())) {
351 /* merged with current so get rid of the prev one */
352 delete specs.pop_back();
353 continue; /* re-iterate */
354 }
355
356 specs.push_back (*i);
357 ++i; /* progress */
358 }
359
360 debugs(64, 3, "HttpHdrRange::merge: had " << basis.size() <<
361 " specs, merged " << basis.size() - specs.size() << " specs");
362 }
363
364
365 void
366 HttpHdrRange::getCanonizedSpecs (Vector<HttpHdrRangeSpec *> &copy)
367 {
368 /* canonize each entry and destroy bad ones if any */
369
370 for (iterator pos (begin()); pos != end(); ++pos) {
371 if ((*pos)->canonize(clen))
372 copy.push_back (*pos);
373 else
374 delete (*pos);
375 }
376
377 debugs(64, 3, "HttpHdrRange::getCanonizedSpecs: found " <<
378 specs.size() - copy.size() << " bad specs");
379 }
380
381 #include "HttpHdrContRange.h"
382
383 /*
384 * canonizes all range specs within a set preserving the order
385 * returns true if the set is valid after canonization;
386 * the set is valid if
387 * - all range specs are valid and
388 * - there is at least one range spec
389 */
390 int
391 HttpHdrRange::canonize(HttpReply *rep)
392 {
393 assert(this && rep);
394
395 if (rep->content_range)
396 clen = rep->content_range->elength;
397 else
398 clen = rep->content_length;
399
400 return canonize (clen);
401 }
402
403 int
404 HttpHdrRange::canonize (size_t newClen)
405 {
406 clen = newClen;
407 debugs(64, 3, "HttpHdrRange::canonize: started with " << specs.count <<
408 " specs, clen: " << clen);
409 Vector<HttpHdrRangeSpec*> goods;
410 getCanonizedSpecs(goods);
411 merge (goods);
412 debugs(64, 3, "HttpHdrRange::canonize: finished with " << specs.count <<
413 " specs");
414 return specs.count > 0;
415 }
416
417 /* hack: returns true if range specs are too "complex" for Squid to handle */
418 /* requires that specs are "canonized" first! */
419 bool
420 HttpHdrRange::isComplex() const
421 {
422 size_t offset = 0;
423 assert(this);
424 /* check that all rangers are in "strong" order */
425 const_iterator pos (begin());
426
427 while (pos != end()) {
428 /* Ensure typecasts is safe */
429 assert ((*pos)->offset >= 0);
430
431 if ((unsigned int)(*pos)->offset < offset)
432 return 1;
433
434 offset = (*pos)->offset + (*pos)->length;
435
436 ++pos;
437 }
438
439 return 0;
440 }
441
442 /*
443 * hack: returns true if range specs may be too "complex" when "canonized".
444 * see also: HttpHdrRange::isComplex.
445 */
446 bool
447 HttpHdrRange::willBeComplex() const
448 {
449 assert(this);
450 /* check that all rangers are in "strong" order, */
451 /* as far as we can tell without the content length */
452 size_t offset = 0;
453
454 for (const_iterator pos (begin()); pos != end(); ++pos) {
455 if (!known_spec((*pos)->offset)) /* ignore unknowns */
456 continue;
457
458 /* Ensure typecasts is safe */
459 assert ((*pos)->offset >= 0);
460
461 if ((size_t) (*pos)->offset < offset)
462 return true;
463
464 offset = (*pos)->offset;
465
466 if (known_spec((*pos)->length)) /* avoid unknowns */
467 offset += (*pos)->length;
468 }
469
470 return false;
471 }
472
473 /*
474 * Returns lowest known offset in range spec(s),
475 * or HttpHdrRangeSpec::UnknownPosition
476 * this is used for size limiting
477 */
478 ssize_t
479 HttpHdrRange::firstOffset() const
480 {
481 ssize_t offset = HttpHdrRangeSpec::UnknownPosition;
482 assert(this);
483 const_iterator pos = begin();
484
485 while (pos != end()) {
486 if ((*pos)->offset < offset || !known_spec(offset))
487 offset = (*pos)->offset;
488
489 ++pos;
490 }
491
492 return offset;
493 }
494
495 /*
496 * Returns lowest offset in range spec(s), 0 if unknown.
497 * This is used for finding out where we need to start if all
498 * ranges are combined into one, for example FTP REST.
499 * Use 0 for size if unknown
500 */
501 ssize_t
502 HttpHdrRange::lowestOffset(ssize_t size) const
503 {
504 ssize_t offset = HttpHdrRangeSpec::UnknownPosition;
505 const_iterator pos = begin();
506 assert(this);
507
508 while (pos != end()) {
509 ssize_t current = (*pos)->offset;
510
511 if (!known_spec(current)) {
512 if ((*pos)->length > size || !known_spec((*pos)->length))
513 return 0; /* Unknown. Assume start of file */
514
515 current = size - (*pos)->length;
516 }
517
518 if (current < offset || !known_spec(offset))
519 offset = current;
520
521 ++pos;
522 }
523
524 return known_spec(offset) ? offset : 0;
525 }
526
527 /*
528 * Return true if the first range offset is larger than the configured
529 * limit.
530 * Note that exceeding the limit (returning true) results in only
531 * grabbing the needed range elements from the origin.
532 */
533 bool
534 HttpHdrRange::offsetLimitExceeded() const
535 {
536 if (NULL == this)
537 /* not a range request */
538 return false;
539
540 if (-1 == (ssize_t)Config.rangeOffsetLimit)
541 /* disabled */
542 return false;
543
544 if (firstOffset() == -1)
545 /* tail request */
546 return true;
547
548 if ((ssize_t)Config.rangeOffsetLimit >= firstOffset())
549 /* below the limit */
550 return false;
551
552 return true;
553 }
554
555 bool
556 HttpHdrRange::contains(HttpHdrRangeSpec& r) const
557 {
558 assert(r.length >= 0);
559 HttpHdrRangeSpec::HttpRange rrange(r.offset, r.offset + r.length);
560
561 for (const_iterator i = begin(); i != end(); ++i) {
562 HttpHdrRangeSpec::HttpRange irange((*i)->offset, (*i)->offset + (*i)->length);
563 HttpHdrRangeSpec::HttpRange intersection = rrange.intersection(irange);
564
565 if (intersection.start == irange.start && intersection.size() == irange.size())
566 return true;
567 }
568
569 return false;
570 }
571
572 const HttpHdrRangeSpec *
573 HttpHdrRangeIter::currentSpec() const
574 {
575 if (pos.incrementable())
576 return *pos;
577
578 return NULL;
579 }
580
581 void
582 HttpHdrRangeIter::updateSpec()
583 {
584 assert (debt_size == 0);
585 assert (valid);
586
587 if (pos.incrementable()) {
588 debt(currentSpec()->length);
589 }
590 }
591
/* returns the current debt_size, logging it at debug section 64, level 3 */
ssize_t
HttpHdrRangeIter::debt() const
{
    debugs(64, 3, "HttpHdrRangeIter::debt: debt is " << debt_size);
    return debt_size;
}

/* replaces debt_size with newDebt, logging the old and the new value */
void HttpHdrRangeIter::debt(ssize_t newDebt)
{
    debugs(64, 3, "HttpHdrRangeIter::debt: was " << debt_size << " now " << newDebt);
    debt_size = newDebt;
}