]>
Commit | Line | Data |
---|---|---|
64413630 | 1 | #include "builtin.h" |
bad50dc8 | 2 | #include "cache.h" |
74536958 | 3 | #include "object.h" |
8ee378a0 | 4 | #include "delta.h" |
a733cb60 | 5 | #include "pack.h" |
8e440259 PE |
6 | #include "blob.h" |
7 | #include "commit.h" | |
8 | #include "tag.h" | |
9 | #include "tree.h" | |
96a02f8f | 10 | #include "progress.h" |
bad50dc8 | 11 | |
3b67d291 JH |
12 | static int dry_run, quiet, recover, has_errors; |
13 | static const char unpack_usage[] = "git-unpack-objects [-n] [-q] [-r] < pack-file"; | |
bad50dc8 | 14 | |
67e5a5ec LT |
15 | /* We always read in 4kB chunks. */ |
16 | static unsigned char buffer[4096]; | |
d7dd0223 NP |
17 | static unsigned int offset, len; |
18 | static off_t consumed_bytes; | |
67e5a5ec | 19 | static SHA_CTX ctx; |
bad50dc8 | 20 | |
67e5a5ec LT |
21 | /* |
22 | * Make sure at least "min" bytes are available in the buffer, and | |
23 | * return the pointer to the buffer. | |
24 | */ | |
79a65697 | 25 | static void *fill(int min) |
67e5a5ec LT |
26 | { |
27 | if (min <= len) | |
28 | return buffer + offset; | |
67e5a5ec LT |
29 | if (min > sizeof(buffer)) |
30 | die("cannot fill %d bytes", min); | |
31 | if (offset) { | |
32 | SHA1_Update(&ctx, buffer, offset); | |
79a65697 | 33 | memmove(buffer, buffer + offset, len); |
67e5a5ec LT |
34 | offset = 0; |
35 | } | |
36 | do { | |
8a912bcb | 37 | ssize_t ret = xread(0, buffer + len, sizeof(buffer) - len); |
67e5a5ec LT |
38 | if (ret <= 0) { |
39 | if (!ret) | |
40 | die("early EOF"); | |
67e5a5ec LT |
41 | die("read error on input: %s", strerror(errno)); |
42 | } | |
43 | len += ret; | |
44 | } while (len < min); | |
45 | return buffer; | |
46 | } | |
74536958 | 47 | |
67e5a5ec LT |
48 | static void use(int bytes) |
49 | { | |
50 | if (bytes > len) | |
51 | die("used more bytes than were available"); | |
52 | len -= bytes; | |
53 | offset += bytes; | |
d7dd0223 NP |
54 | |
55 | /* make sure off_t is sufficiently large not to wrap */ | |
56 | if (consumed_bytes > consumed_bytes + bytes) | |
57 | die("pack too large for current definition of off_t"); | |
209c554a | 58 | consumed_bytes += bytes; |
67e5a5ec | 59 | } |
bad50dc8 | 60 | |
67e5a5ec | 61 | static void *get_data(unsigned long size) |
bad50dc8 | 62 | { |
67e5a5ec LT |
63 | z_stream stream; |
64 | void *buf = xmalloc(size); | |
65 | ||
67e5a5ec LT |
66 | memset(&stream, 0, sizeof(stream)); |
67 | ||
68 | stream.next_out = buf; | |
69 | stream.avail_out = size; | |
70 | stream.next_in = fill(1); | |
71 | stream.avail_in = len; | |
72 | inflateInit(&stream); | |
73 | ||
74 | for (;;) { | |
75 | int ret = inflate(&stream, 0); | |
76 | use(len - stream.avail_in); | |
77 | if (stream.total_out == size && ret == Z_STREAM_END) | |
78 | break; | |
f986f2c8 JH |
79 | if (ret != Z_OK) { |
80 | error("inflate returned %d\n", ret); | |
81 | free(buf); | |
82 | buf = NULL; | |
3b67d291 | 83 | if (!recover) |
f986f2c8 JH |
84 | exit(1); |
85 | has_errors = 1; | |
86 | break; | |
87 | } | |
67e5a5ec LT |
88 | stream.next_in = fill(1); |
89 | stream.avail_in = len; | |
90 | } | |
ee639140 | 91 | inflateEnd(&stream); |
67e5a5ec | 92 | return buf; |
bad50dc8 LT |
93 | } |
94 | ||
67e5a5ec LT |
/*
 * A delta whose base was not available when the delta was read.
 * Records wait on delta_list until added_object() sees their base.
 */
struct delta_info {
	unsigned char base_sha1[20];	/* base hash; null_sha1 for offset deltas */
	unsigned nr;			/* index of the delta's own object in obj_list */
	off_t base_offset;		/* pack offset of the base; 0 for hash deltas */
	unsigned long size;		/* length of the delta data in bytes */
	void *delta;			/* inflated delta data; freed by resolve_delta() */
	struct delta_info *next;
};

/* Head of the singly linked list of pending deltas. */
static struct delta_info *delta_list;
105 | ||
209c554a | 106 | static void add_delta_to_list(unsigned nr, unsigned const char *base_sha1, |
d7dd0223 | 107 | off_t base_offset, |
209c554a | 108 | void *delta, unsigned long size) |
bad50dc8 | 109 | { |
67e5a5ec | 110 | struct delta_info *info = xmalloc(sizeof(*info)); |
bad50dc8 | 111 | |
e702496e | 112 | hashcpy(info->base_sha1, base_sha1); |
209c554a | 113 | info->base_offset = base_offset; |
67e5a5ec LT |
114 | info->size = size; |
115 | info->delta = delta; | |
209c554a | 116 | info->nr = nr; |
67e5a5ec LT |
117 | info->next = delta_list; |
118 | delta_list = info; | |
bad50dc8 LT |
119 | } |
120 | ||
/* Per-object bookkeeping, indexed by the object's position in the pack. */
struct obj_info {
	/* value of consumed_bytes when unpack_one() started on the entry */
	off_t offset;
	/* filled in by write_object(); null_sha1 while the object is a pending delta */
	unsigned char sha1[20];
};

/* One entry per object announced in the pack header; allocated in unpack_all(). */
static struct obj_info *obj_list;
67e5a5ec | 127 | |
21666f1a NP |
128 | static void added_object(unsigned nr, enum object_type type, |
129 | void *data, unsigned long size); | |
209c554a | 130 | |
21666f1a NP |
131 | static void write_object(unsigned nr, enum object_type type, |
132 | void *buf, unsigned long size) | |
cca7081a | 133 | { |
21666f1a | 134 | if (write_sha1_file(buf, size, typename(type), obj_list[nr].sha1) < 0) |
cca7081a | 135 | die("failed to write object"); |
209c554a | 136 | added_object(nr, type, buf, size); |
cca7081a LT |
137 | } |
138 | ||
21666f1a | 139 | static void resolve_delta(unsigned nr, enum object_type type, |
f986f2c8 JH |
140 | void *base, unsigned long base_size, |
141 | void *delta, unsigned long delta_size) | |
bad50dc8 | 142 | { |
67e5a5ec LT |
143 | void *result; |
144 | unsigned long result_size; | |
bad50dc8 | 145 | |
67e5a5ec LT |
146 | result = patch_delta(base, base_size, |
147 | delta, delta_size, | |
148 | &result_size); | |
149 | if (!result) | |
150 | die("failed to apply delta"); | |
151 | free(delta); | |
21666f1a | 152 | write_object(nr, type, result, result_size); |
67e5a5ec | 153 | free(result); |
bad50dc8 LT |
154 | } |
155 | ||
21666f1a NP |
156 | static void added_object(unsigned nr, enum object_type type, |
157 | void *data, unsigned long size) | |
74536958 | 158 | { |
67e5a5ec LT |
159 | struct delta_info **p = &delta_list; |
160 | struct delta_info *info; | |
161 | ||
162 | while ((info = *p) != NULL) { | |
209c554a NP |
163 | if (!hashcmp(info->base_sha1, obj_list[nr].sha1) || |
164 | info->base_offset == obj_list[nr].offset) { | |
67e5a5ec LT |
165 | *p = info->next; |
166 | p = &delta_list; | |
209c554a NP |
167 | resolve_delta(info->nr, type, data, size, |
168 | info->delta, info->size); | |
67e5a5ec LT |
169 | free(info); |
170 | continue; | |
171 | } | |
172 | p = &info->next; | |
173 | } | |
174 | } | |
175 | ||
21666f1a | 176 | static void unpack_non_delta_entry(enum object_type type, unsigned long size, |
209c554a | 177 | unsigned nr) |
67e5a5ec LT |
178 | { |
179 | void *buf = get_data(size); | |
8ee378a0 | 180 | |
f986f2c8 | 181 | if (!dry_run && buf) |
21666f1a | 182 | write_object(nr, type, buf, size); |
67e5a5ec | 183 | free(buf); |
8ee378a0 JH |
184 | } |
185 | ||
21666f1a | 186 | static void unpack_delta_entry(enum object_type type, unsigned long delta_size, |
209c554a | 187 | unsigned nr) |
8ee378a0 | 188 | { |
67e5a5ec LT |
189 | void *delta_data, *base; |
190 | unsigned long base_size; | |
67e5a5ec | 191 | unsigned char base_sha1[20]; |
8ee378a0 | 192 | |
21666f1a | 193 | if (type == OBJ_REF_DELTA) { |
209c554a NP |
194 | hashcpy(base_sha1, fill(20)); |
195 | use(20); | |
196 | delta_data = get_data(delta_size); | |
197 | if (dry_run || !delta_data) { | |
198 | free(delta_data); | |
199 | return; | |
200 | } | |
201 | if (!has_sha1_file(base_sha1)) { | |
202 | hashcpy(obj_list[nr].sha1, null_sha1); | |
203 | add_delta_to_list(nr, base_sha1, 0, delta_data, delta_size); | |
204 | return; | |
205 | } | |
206 | } else { | |
207 | unsigned base_found = 0; | |
208 | unsigned char *pack, c; | |
d7dd0223 | 209 | off_t base_offset; |
209c554a | 210 | unsigned lo, mid, hi; |
c4fb06c0 | 211 | |
209c554a NP |
212 | pack = fill(1); |
213 | c = *pack; | |
214 | use(1); | |
215 | base_offset = c & 127; | |
216 | while (c & 128) { | |
217 | base_offset += 1; | |
8723f216 | 218 | if (!base_offset || MSB(base_offset, 7)) |
209c554a NP |
219 | die("offset value overflow for delta base object"); |
220 | pack = fill(1); | |
221 | c = *pack; | |
222 | use(1); | |
223 | base_offset = (base_offset << 7) + (c & 127); | |
224 | } | |
225 | base_offset = obj_list[nr].offset - base_offset; | |
8ee378a0 | 226 | |
209c554a NP |
227 | delta_data = get_data(delta_size); |
228 | if (dry_run || !delta_data) { | |
229 | free(delta_data); | |
230 | return; | |
231 | } | |
232 | lo = 0; | |
233 | hi = nr; | |
234 | while (lo < hi) { | |
235 | mid = (lo + hi)/2; | |
236 | if (base_offset < obj_list[mid].offset) { | |
237 | hi = mid; | |
238 | } else if (base_offset > obj_list[mid].offset) { | |
239 | lo = mid + 1; | |
240 | } else { | |
241 | hashcpy(base_sha1, obj_list[mid].sha1); | |
242 | base_found = !is_null_sha1(base_sha1); | |
243 | break; | |
244 | } | |
245 | } | |
246 | if (!base_found) { | |
247 | /* The delta base object is itself a delta that | |
248 | has not been resolved yet. */ | |
249 | hashcpy(obj_list[nr].sha1, null_sha1); | |
250 | add_delta_to_list(nr, null_sha1, base_offset, delta_data, delta_size); | |
251 | return; | |
252 | } | |
8ee378a0 | 253 | } |
209c554a | 254 | |
21666f1a | 255 | base = read_sha1_file(base_sha1, &type, &base_size); |
f986f2c8 JH |
256 | if (!base) { |
257 | error("failed to read delta-pack base object %s", | |
258 | sha1_to_hex(base_sha1)); | |
3b67d291 | 259 | if (!recover) |
f986f2c8 JH |
260 | exit(1); |
261 | has_errors = 1; | |
262 | return; | |
263 | } | |
209c554a | 264 | resolve_delta(nr, type, base, base_size, delta_data, delta_size); |
ee639140 | 265 | free(base); |
8ee378a0 JH |
266 | } |
267 | ||
96a02f8f | 268 | static void unpack_one(unsigned nr) |
8ee378a0 | 269 | { |
01247d87 | 270 | unsigned shift; |
a733cb60 | 271 | unsigned char *pack, c; |
67e5a5ec LT |
272 | unsigned long size; |
273 | enum object_type type; | |
74536958 | 274 | |
209c554a NP |
275 | obj_list[nr].offset = consumed_bytes; |
276 | ||
67e5a5ec LT |
277 | pack = fill(1); |
278 | c = *pack; | |
279 | use(1); | |
a733cb60 LT |
280 | type = (c >> 4) & 7; |
281 | size = (c & 15); | |
01247d87 | 282 | shift = 4; |
a733cb60 | 283 | while (c & 0x80) { |
67e5a5ec | 284 | pack = fill(1); |
209c554a | 285 | c = *pack; |
67e5a5ec | 286 | use(1); |
01247d87 LT |
287 | size += (c & 0x7f) << shift; |
288 | shift += 7; | |
a733cb60 | 289 | } |
96a02f8f | 290 | |
a733cb60 LT |
291 | switch (type) { |
292 | case OBJ_COMMIT: | |
293 | case OBJ_TREE: | |
294 | case OBJ_BLOB: | |
295 | case OBJ_TAG: | |
209c554a | 296 | unpack_non_delta_entry(type, size, nr); |
a733cb60 | 297 | return; |
eb32d236 | 298 | case OBJ_REF_DELTA: |
209c554a NP |
299 | case OBJ_OFS_DELTA: |
300 | unpack_delta_entry(type, size, nr); | |
a733cb60 | 301 | return; |
67e5a5ec | 302 | default: |
f986f2c8 JH |
303 | error("bad object type %d", type); |
304 | has_errors = 1; | |
3b67d291 | 305 | if (recover) |
f986f2c8 JH |
306 | return; |
307 | exit(1); | |
74536958 LT |
308 | } |
309 | } | |
310 | ||
74536958 LT |
311 | static void unpack_all(void) |
312 | { | |
67e5a5ec | 313 | int i; |
96a02f8f | 314 | struct progress progress; |
67e5a5ec | 315 | struct pack_header *hdr = fill(sizeof(struct pack_header)); |
67e5a5ec LT |
316 | unsigned nr_objects = ntohl(hdr->hdr_entries); |
317 | ||
318 | if (ntohl(hdr->hdr_signature) != PACK_SIGNATURE) | |
319 | die("bad pack file"); | |
d60fc1c8 NP |
320 | if (!pack_version_ok(hdr->hdr_version)) |
321 | die("unknown pack file version %d", ntohl(hdr->hdr_version)); | |
96a02f8f | 322 | use(sizeof(struct pack_header)); |
67e5a5ec | 323 | |
13aaf148 NP |
324 | if (!quiet) |
325 | start_progress(&progress, "Unpacking %u objects...", "", nr_objects); | |
209c554a | 326 | obj_list = xmalloc(nr_objects * sizeof(*obj_list)); |
96a02f8f NP |
327 | for (i = 0; i < nr_objects; i++) { |
328 | unpack_one(i); | |
329 | if (!quiet) | |
330 | display_progress(&progress, i + 1); | |
331 | } | |
332 | if (!quiet) | |
333 | stop_progress(&progress); | |
334 | ||
67e5a5ec LT |
335 | if (delta_list) |
336 | die("unresolved deltas left after unpacking"); | |
74536958 LT |
337 | } |
338 | ||
64413630 | 339 | int cmd_unpack_objects(int argc, const char **argv, const char *prefix) |
bad50dc8 LT |
340 | { |
341 | int i; | |
67e5a5ec | 342 | unsigned char sha1[20]; |
bad50dc8 | 343 | |
8e273641 | 344 | git_config(git_default_config); |
53228a5f | 345 | |
476e8011 JH |
346 | quiet = !isatty(2); |
347 | ||
bad50dc8 LT |
348 | for (i = 1 ; i < argc; i++) { |
349 | const char *arg = argv[i]; | |
350 | ||
351 | if (*arg == '-') { | |
74536958 LT |
352 | if (!strcmp(arg, "-n")) { |
353 | dry_run = 1; | |
354 | continue; | |
355 | } | |
d36f7b80 LT |
356 | if (!strcmp(arg, "-q")) { |
357 | quiet = 1; | |
358 | continue; | |
359 | } | |
f986f2c8 | 360 | if (!strcmp(arg, "-r")) { |
3b67d291 | 361 | recover = 1; |
f986f2c8 JH |
362 | continue; |
363 | } | |
cc44c765 | 364 | if (!prefixcmp(arg, "--pack_header=")) { |
bed006fb NP |
365 | struct pack_header *hdr; |
366 | char *c; | |
367 | ||
368 | hdr = (struct pack_header *)buffer; | |
369 | hdr->hdr_signature = htonl(PACK_SIGNATURE); | |
370 | hdr->hdr_version = htonl(strtoul(arg + 14, &c, 10)); | |
371 | if (*c != ',') | |
372 | die("bad %s", arg); | |
373 | hdr->hdr_entries = htonl(strtoul(c + 1, &c, 10)); | |
374 | if (*c) | |
375 | die("bad %s", arg); | |
376 | len = sizeof(*hdr); | |
377 | continue; | |
378 | } | |
bad50dc8 LT |
379 | usage(unpack_usage); |
380 | } | |
67e5a5ec LT |
381 | |
382 | /* We don't take any non-flag arguments now.. Maybe some day */ | |
bad50dc8 | 383 | usage(unpack_usage); |
67e5a5ec LT |
384 | } |
385 | SHA1_Init(&ctx); | |
74536958 | 386 | unpack_all(); |
67e5a5ec LT |
387 | SHA1_Update(&ctx, buffer, offset); |
388 | SHA1_Final(sha1, &ctx); | |
a89fccd2 | 389 | if (hashcmp(fill(20), sha1)) |
67e5a5ec LT |
390 | die("final sha1 did not match"); |
391 | use(20); | |
392 | ||
393 | /* Write the last part of the buffer to stdout */ | |
394 | while (len) { | |
1c15afb9 JH |
395 | int ret = xwrite(1, buffer + offset, len); |
396 | if (ret <= 0) | |
67e5a5ec | 397 | break; |
67e5a5ec LT |
398 | len -= ret; |
399 | offset += ret; | |
400 | } | |
401 | ||
402 | /* All done */ | |
f986f2c8 | 403 | return has_errors; |
bad50dc8 | 404 | } |