]>
Commit | Line | Data |
---|---|---|
0fcfd160 LT |
1 | /* |
2 | * GIT - The information manager from hell | |
3 | * | |
4 | * Copyright (C) Linus Torvalds, 2005 | |
5 | * | |
6 | * This handles basic git sha1 object files - packing, unpacking, | |
7 | * creation etc. | |
8 | */ | |
1f688557 JH |
9 | #include <sys/types.h> |
10 | #include <dirent.h> | |
0fcfd160 | 11 | #include "cache.h" |
1f688557 | 12 | #include "delta.h" |
a733cb60 | 13 | #include "pack.h" |
0fcfd160 | 14 | |
144bde78 LT |
/*
 * Fallback definition for systems whose headers do not provide
 * O_NOATIME: Linux on i386/PPC gets the octal value 01000000, every
 * other platform gets 0 so that OR-ing the flag into open() flags is
 * a no-op.
 */
15 | #ifndef O_NOATIME |
16 | #if defined(__linux__) && (defined(__i386__) || defined(__PPC__)) | |
17 | #define O_NOATIME 01000000 | |
18 | #else | |
19 | #define O_NOATIME 0 | |
20 | #endif | |
21 | #endif | |
22 | ||
88cd621d JH |
/* Twenty zero bytes: the all-zero SHA1. */
23 | const unsigned char null_sha1[20] = { 0, }; |
24 | ||
144bde78 LT |
/*
 * Extra flag OR-ed into O_RDONLY when opening loose object files.
 * map_sha1_file_internal() resets it to 0 once an open() with the
 * flag fails but a plain open() succeeds.
 */
25 | static unsigned int sha1_file_open_flag = O_NOATIME; |
26 | ||
0fcfd160 LT |
/*
 * Convert one hexadecimal digit to its numeric value (0-15).
 * Lower- and upper-case letters are both accepted.  Any other
 * character yields ~0 (all bits set), which get_sha1_hex() detects
 * as an invalid digit.
 */
static unsigned hexval(char c)
{
	unsigned digit = ~0;

	if ('0' <= c && c <= '9')
		digit = c - '0';
	else if ('a' <= c && c <= 'f')
		digit = 10 + (c - 'a');
	else if ('A' <= c && c <= 'F')
		digit = 10 + (c - 'A');
	return digit;
}
37 | ||
/*
 * Parse 40 hexadecimal characters starting at "hex" into the 20-byte
 * binary buffer "sha1".
 *
 * Returns 0 on success and -1 as soon as an invalid digit (including
 * a premature end of string) is seen.  On failure the bytes converted
 * so far have already been stored in "sha1".
 */
int get_sha1_hex(const char *hex, unsigned char *sha1)
{
	int i;
	for (i = 0; i < 20; i++) {
		unsigned int val;

		/*
		 * A NUL in hex[1] is rejected by the range check below,
		 * but a NUL in hex[0] has to be caught first so that we
		 * never read hex[1] beyond the end of a short string.
		 */
		if (!hex[0])
			return -1;
		val = (hexval(hex[0]) << 4) | hexval(hex[1]);
		if (val & ~0xff)
			return -1;
		*sha1++ = val;
		hex += 2;
	}
	return 0;
}
50 | ||
b2cb9425 JH |
/*
 * Create every directory that leads up to the last component of
 * "path" (the last component itself is not created).
 *
 * Each '/' after an optional leading one is temporarily replaced by
 * NUL so that the prefix can be handed to mkdir(); the slash is
 * always put back, so "path" is unchanged on return.  A prefix that
 * already exists (EEXIST) is not an error.
 *
 * Returns 0 on success, -1 when mkdir() fails for any other reason.
 */
int safe_create_leading_directories(char *path)
{
	char *scan = (*path == '/') ? path + 1 : path;
	char *slash;

	for (slash = strchr(scan, '/'); slash; slash = strchr(slash + 1, '/')) {
		int failed;

		*slash = '\0';
		failed = mkdir(path, 0777) < 0 && errno != EEXIST;
		*slash = '/';
		if (failed)
			return -1;
	}
	return 0;
}
723c31fe | 71 | |
0fcfd160 LT |
/*
 * Format a 20-byte SHA1 as 40 lower-case hexadecimal characters.
 *
 * The result is written into a function-local static buffer that is
 * overwritten by the next call.  Only the first 40 bytes are ever
 * written, so the zero-initialized remainder of the buffer provides
 * the terminating NUL.
 */
char * sha1_to_hex(const unsigned char *sha1)
{
	static const char digits[] = "0123456789abcdef";
	static char buffer[50];
	int n;

	for (n = 0; n < 20; n++) {
		unsigned int byte = sha1[n];

		buffer[2 * n] = digits[byte >> 4];
		buffer[2 * n + 1] = digits[byte & 0xf];
	}
	return buffer;
}
86 | ||
ace1534d JH |
/*
 * Write the hex form of "sha1" into "pathbuf" using the layout
 * "xx?yyyy..." : two digits for the first byte, one position that is
 * skipped (callers keep a '/' there), then 38 digits for the other
 * 19 bytes.  No NUL terminator is written.
 */
static void fill_sha1_path(char *pathbuf, const unsigned char *sha1)
{
	static char hex[] = "0123456789abcdef";
	char *out = pathbuf;
	int i;

	for (i = 0; i < 20; i++) {
		unsigned int val = sha1[i];

		if (i == 1)
			out++;	/* step over the separator slot */
		*out++ = hex[val >> 4];
		*out++ = hex[val & 0xf];
	}
}
98 | ||
0fcfd160 LT |
/*
 * Return the path of the loose object file for "sha1" inside the
 * primary object directory: "<objdir>/xx/<38 more hex digits>".
 *
 * NOTE! The result lives in one buffer that is allocated on the first
 * call and reused by every later call, so do a "strdup()" if you need
 * to keep the filename.
 *
 * Also note that this is the location used for creating objects.
 * Reading may find the object in an alternate object directory
 * instead when it is missing from the primary one (see
 * find_sha1_file()).
 */
char *sha1_file_name(const unsigned char *sha1)
{
	static char *base, *name;

	if (!base) {
		const char *objdir = get_object_directory();
		int dirlen = strlen(objdir);

		/* room for "/xx/" + 38 hex digits + NUL, with slack */
		base = xmalloc(dirlen + 60);
		memset(base + dirlen, 0, 60);
		memcpy(base, objdir, dirlen);
		base[dirlen] = '/';
		base[dirlen + 3] = '/';
		name = base + dirlen + 1;
	}
	fill_sha1_path(name, sha1);
	return base;
}
126 | ||
bf592c50 DB |
/*
 * Return "<objdir>/pack/pack-<40 hex digits of sha1>.pack".
 *
 * The buffer is allocated once from a template with placeholder
 * digits; each call overwrites only the 40 digits and returns the
 * same buffer, so the result is valid until the next call.
 */
char *sha1_pack_name(const unsigned char *sha1)
{
	static const char hex[] = "0123456789abcdef";
	static char *name, *base;
	int i;

	if (!base) {
		const char *objdir = get_object_directory();
		int dirlen = strlen(objdir);

		base = xmalloc(dirlen + 60);
		sprintf(base, "%s/pack/pack-1234567890123456789012345678901234567890.pack", objdir);
		/* 11 == strlen("/pack/pack-") */
		name = base + dirlen + 11;
	}

	for (i = 0; i < 20; i++) {
		unsigned int val = sha1[i];

		name[2 * i] = hex[val >> 4];
		name[2 * i + 1] = hex[val & 0xf];
	}

	return base;
}
151 | ||
/*
 * Return "<objdir>/pack/pack-<40 hex digits of sha1>.idx".
 *
 * The buffer is allocated once from a template with placeholder
 * digits; each call overwrites only the 40 digits and returns the
 * same buffer, so the result is valid until the next call.
 */
char *sha1_pack_index_name(const unsigned char *sha1)
{
	static const char hex[] = "0123456789abcdef";
	static char *name, *base;
	int i;

	if (!base) {
		const char *objdir = get_object_directory();
		int dirlen = strlen(objdir);

		base = xmalloc(dirlen + 60);
		sprintf(base, "%s/pack/pack-1234567890123456789012345678901234567890.idx", objdir);
		/* 11 == strlen("/pack/pack-") */
		name = base + dirlen + 11;
	}

	for (i = 0; i < 20; i++) {
		unsigned int val = sha1[i];

		name[2 * i] = hex[val >> 4];
		name[2 * i + 1] = hex[val & 0xf];
	}

	return base;
}
176 | ||
d5a63b99 JH |
/* Head of the singly linked list of alternate object databases. */
177 | struct alternate_object_database *alt_odb_list; |
/*
 * Where the next list entry gets linked in.  It is NULL until
 * prepare_alt_odb() has run, which is how that function detects
 * that it has already been called.
 */
178 | static struct alternate_object_database **alt_odb_tail; | |
ace1534d | 179 | |
ddd5d056 JH |
180 | /* |
181 | * Prepare alternate object database registry. | |
d5a63b99 JH |
182 | * |
183 | * The variable alt_odb_list points at the list of struct | |
184 | * alternate_object_database. The elements on this list come from | |
185 | * non-empty elements from colon separated ALTERNATE_DB_ENVIRONMENT | |
186 | * environment variable, and $GIT_OBJECT_DIRECTORY/info/alternates, | |
187 | * whose contents is exactly in the same format as that environment | |
188 | * variable. Its base points at a statically allocated buffer that | |
189 | * contains "/the/directory/corresponding/to/.git/objects/...", while | |
190 | * its name points just after the slash at the end of ".git/objects/" | |
191 | * in the example above, and has enough space to hold 40-byte hex | |
192 | * SHA1, an extra slash for the first level indirection, and the | |
193 | * terminating NUL. | |
ddd5d056 | 194 | */ |
ccfd3e99 JH |
195 | static void link_alt_odb_entries(const char *alt, const char *ep, int sep, |
196 | const char *relative_base) | |
ace1534d | 197 | { |
ace1534d | 198 | const char *cp, *last; |
d5a63b99 | 199 | struct alternate_object_database *ent; |
ccfd3e99 | 200 | int base_len = -1; |
d5a63b99 JH |
201 | |
202 | last = alt; | |
9577e7e3 JH |
203 | while (last < ep) { |
204 | cp = last; | |
205 | if (cp < ep && *cp == '#') { | |
206 | while (cp < ep && *cp != sep) | |
207 | cp++; | |
208 | last = cp + 1; | |
209 | continue; | |
210 | } | |
211 | for ( ; cp < ep && *cp != sep; cp++) | |
d5a63b99 JH |
212 | ; |
213 | if (last != cp) { | |
214 | /* 43 = 40-byte + 2 '/' + terminating NUL */ | |
215 | int pfxlen = cp - last; | |
216 | int entlen = pfxlen + 43; | |
217 | ||
ccfd3e99 JH |
218 | if (*last != '/' && relative_base) { |
219 | /* Relative alt-odb */ | |
220 | if (base_len < 0) | |
221 | base_len = strlen(relative_base) + 1; | |
222 | entlen += base_len; | |
223 | pfxlen += base_len; | |
224 | } | |
d5a63b99 JH |
225 | ent = xmalloc(sizeof(*ent) + entlen); |
226 | *alt_odb_tail = ent; | |
227 | alt_odb_tail = &(ent->next); | |
228 | ent->next = NULL; | |
ccfd3e99 JH |
229 | if (*last != '/' && relative_base) { |
230 | memcpy(ent->base, relative_base, base_len - 1); | |
231 | ent->base[base_len - 1] = '/'; | |
232 | memcpy(ent->base + base_len, | |
233 | last, cp - last); | |
234 | } | |
235 | else | |
236 | memcpy(ent->base, last, pfxlen); | |
d5a63b99 JH |
237 | ent->name = ent->base + pfxlen + 1; |
238 | ent->base[pfxlen] = ent->base[pfxlen + 3] = '/'; | |
239 | ent->base[entlen-1] = 0; | |
240 | } | |
9577e7e3 | 241 | while (cp < ep && *cp == sep) |
d5a63b99 JH |
242 | cp++; |
243 | last = cp; | |
9577e7e3 | 244 | } |
d5a63b99 JH |
245 | } |
246 | ||
247 | void prepare_alt_odb(void) | |
248 | { | |
249 | char path[PATH_MAX]; | |
9577e7e3 | 250 | char *map; |
d5a63b99 JH |
251 | int fd; |
252 | struct stat st; | |
c7c81b3a JR |
253 | char *alt; |
254 | ||
a9ab586a | 255 | alt = getenv(ALTERNATE_DB_ENVIRONMENT); |
c7c81b3a | 256 | if (!alt) alt = ""; |
ace1534d | 257 | |
d5a63b99 JH |
258 | if (alt_odb_tail) |
259 | return; | |
260 | alt_odb_tail = &alt_odb_list; | |
ccfd3e99 | 261 | link_alt_odb_entries(alt, alt + strlen(alt), ':', NULL); |
d5a63b99 | 262 | |
ccfd3e99 | 263 | sprintf(path, "%s/info/alternates", get_object_directory()); |
d5a63b99 JH |
264 | fd = open(path, O_RDONLY); |
265 | if (fd < 0) | |
266 | return; | |
267 | if (fstat(fd, &st) || (st.st_size == 0)) { | |
268 | close(fd); | |
9a217f2a | 269 | return; |
ace1534d | 270 | } |
d5a63b99 JH |
271 | map = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fd, 0); |
272 | close(fd); | |
273 | if (map == MAP_FAILED) | |
274 | return; | |
275 | ||
ccfd3e99 JH |
276 | link_alt_odb_entries(map, map + st.st_size, '\n', |
277 | get_object_directory()); | |
d5a63b99 | 278 | munmap(map, st.st_size); |
ace1534d JH |
279 | } |
280 | ||
281 | static char *find_sha1_file(const unsigned char *sha1, struct stat *st) | |
282 | { | |
ace1534d | 283 | char *name = sha1_file_name(sha1); |
d5a63b99 | 284 | struct alternate_object_database *alt; |
ace1534d JH |
285 | |
286 | if (!stat(name, st)) | |
287 | return name; | |
9a217f2a | 288 | prepare_alt_odb(); |
d5a63b99 JH |
289 | for (alt = alt_odb_list; alt; alt = alt->next) { |
290 | name = alt->name; | |
ace1534d | 291 | fill_sha1_path(name, sha1); |
d5a63b99 JH |
292 | if (!stat(alt->base, st)) |
293 | return alt->base; | |
ace1534d JH |
294 | } |
295 | return NULL; | |
296 | } | |
297 | ||
1f688557 JH |
/*
 * Threshold for pack_mapped: while it is exceeded, use_packed_git()
 * asks unuse_one_packed_git() to unmap idle packs.
 */
298 | #define PACK_MAX_SZ (1<<26) |
/* Counter copied into pack_last_used on every use_packed_git() call. */
299 | static int pack_used_ctr; | |
/* Grows by the pack size each time use_packed_git() maps a pack. */
300 | static unsigned long pack_mapped; | |
/* Head of the list of known packs; new packs are pushed at the front. */
9a217f2a | 301 | struct packed_git *packed_git; |
1f688557 | 302 | |
1f688557 JH |
/*
 * Map the pack index file at "path" read-only and sanity check it.
 *
 * Checks performed: the file is large enough to hold the 256-entry
 * fan-out table plus the two trailing SHA1s, the fan-out table is
 * monotonically non-decreasing, and the total size matches the object
 * count found in the last fan-out entry.
 *
 * On success returns 0 and hands the mapping and its size back via
 * idx_map_ / idx_size_; the caller owns the mapping.  On failure a
 * non-zero value is returned, the outputs are left untouched and any
 * mapping made here has been released again.
 */
static int check_packed_git_idx(const char *path, unsigned long *idx_size_,
				void **idx_map_)
{
	void *idx_map;
	unsigned int *index;
	unsigned long idx_size, payload;
	unsigned long nr;
	int i;
	int fd = open(path, O_RDONLY);
	struct stat st;

	if (fd < 0)
		return -1;
	if (fstat(fd, &st)) {
		close(fd);
		return -1;
	}
	idx_size = st.st_size;
	idx_map = mmap(NULL, idx_size, PROT_READ, MAP_PRIVATE, fd, 0);
	close(fd);
	if (idx_map == MAP_FAILED)
		return -1;

	index = idx_map;

	/* check index map */
	if (idx_size < 4*256 + 20 + 20) {
		munmap(idx_map, idx_size);
		return error("index file too small");
	}
	nr = 0;
	for (i = 0; i < 256; i++) {
		unsigned int n = ntohl(index[i]);
		if (n < nr) {
			munmap(idx_map, idx_size);
			return error("non-monotonic index");
		}
		nr = n;
	}

	/*
	 * Total size:
	 *  - 256 index entries 4 bytes each
	 *  - 24-byte entries * nr (20-byte sha1 + 4-byte offset)
	 *  - 20-byte SHA1 of the packfile
	 *  - 20-byte SHA1 file checksum
	 *
	 * Compare by dividing the payload instead of multiplying nr,
	 * so that a huge nr cannot wrap around and slip through.
	 */
	payload = idx_size - (4*256 + 20 + 20);
	if (payload % 24 || payload / 24 != nr) {
		munmap(idx_map, idx_size);
		return error("wrong index file size");
	}

	*idx_map_ = idx_map;
	*idx_size_ = idx_size;
	return 0;
}
351 | ||
f9253394 | 352 | static int unuse_one_packed_git(void) |
1f688557 | 353 | { |
f9253394 JH |
354 | struct packed_git *p, *lru = NULL; |
355 | ||
356 | for (p = packed_git; p; p = p->next) { | |
357 | if (p->pack_use_cnt || !p->pack_base) | |
358 | continue; | |
359 | if (!lru || p->pack_last_used < lru->pack_last_used) | |
360 | lru = p; | |
361 | } | |
362 | if (!lru) | |
363 | return 0; | |
364 | munmap(lru->pack_base, lru->pack_size); | |
365 | lru->pack_base = NULL; | |
366 | return 1; | |
367 | } | |
368 | ||
369 | void unuse_packed_git(struct packed_git *p) | |
370 | { | |
371 | p->pack_use_cnt--; | |
1f688557 JH |
372 | } |
373 | ||
f9253394 | 374 | int use_packed_git(struct packed_git *p) |
1f688557 | 375 | { |
bf592c50 DB |
376 | if (!p->pack_size) { |
377 | struct stat st; | |
378 | // We created the struct before we had the pack | |
379 | stat(p->pack_name, &st); | |
380 | if (!S_ISREG(st.st_mode)) | |
381 | die("packfile %s not a regular file", p->pack_name); | |
382 | p->pack_size = st.st_size; | |
383 | } | |
1f688557 JH |
384 | if (!p->pack_base) { |
385 | int fd; | |
386 | struct stat st; | |
387 | void *map; | |
388 | ||
389 | pack_mapped += p->pack_size; | |
f9253394 JH |
390 | while (PACK_MAX_SZ < pack_mapped && unuse_one_packed_git()) |
391 | ; /* nothing */ | |
1f688557 JH |
392 | fd = open(p->pack_name, O_RDONLY); |
393 | if (fd < 0) | |
f9253394 | 394 | die("packfile %s cannot be opened", p->pack_name); |
1f688557 JH |
395 | if (fstat(fd, &st)) { |
396 | close(fd); | |
f9253394 | 397 | die("packfile %s cannot be opened", p->pack_name); |
1f688557 JH |
398 | } |
399 | if (st.st_size != p->pack_size) | |
f9253394 | 400 | die("packfile %s size mismatch.", p->pack_name); |
1f688557 JH |
401 | map = mmap(NULL, p->pack_size, PROT_READ, MAP_PRIVATE, fd, 0); |
402 | close(fd); | |
403 | if (map == MAP_FAILED) | |
f9253394 | 404 | die("packfile %s cannot be mapped.", p->pack_name); |
1f688557 | 405 | p->pack_base = map; |
f9253394 JH |
406 | |
407 | /* Check if the pack file matches with the index file. | |
408 | * this is cheap. | |
409 | */ | |
410 | if (memcmp((char*)(p->index_base) + p->index_size - 40, | |
bf592c50 DB |
411 | p->pack_base + p->pack_size - 20, 20)) { |
412 | ||
f9253394 | 413 | die("packfile %s does not match index.", p->pack_name); |
bf592c50 | 414 | } |
1f688557 JH |
415 | } |
416 | p->pack_last_used = pack_used_ctr++; | |
f9253394 | 417 | p->pack_use_cnt++; |
1f688557 JH |
418 | return 0; |
419 | } | |
420 | ||
9d835df2 | 421 | struct packed_git *add_packed_git(char *path, int path_len, int local) |
1f688557 JH |
422 | { |
423 | struct stat st; | |
424 | struct packed_git *p; | |
425 | unsigned long idx_size; | |
426 | void *idx_map; | |
27dedf0c | 427 | unsigned char sha1[20]; |
1f688557 JH |
428 | |
429 | if (check_packed_git_idx(path, &idx_size, &idx_map)) | |
430 | return NULL; | |
431 | ||
432 | /* do we have a corresponding .pack file? */ | |
433 | strcpy(path + path_len - 4, ".pack"); | |
434 | if (stat(path, &st) || !S_ISREG(st.st_mode)) { | |
435 | munmap(idx_map, idx_size); | |
436 | return NULL; | |
437 | } | |
438 | /* ok, it looks sane as far as we can check without | |
439 | * actually mapping the pack file. | |
440 | */ | |
441 | p = xmalloc(sizeof(*p) + path_len + 2); | |
442 | strcpy(p->pack_name, path); | |
443 | p->index_size = idx_size; | |
444 | p->pack_size = st.st_size; | |
445 | p->index_base = idx_map; | |
446 | p->next = NULL; | |
d85a4fee | 447 | p->pack_base = NULL; |
1f688557 | 448 | p->pack_last_used = 0; |
f9253394 | 449 | p->pack_use_cnt = 0; |
9d835df2 | 450 | p->pack_local = local; |
c283ab21 LS |
451 | if (!get_sha1_hex(path + path_len - 40 - 4, sha1)) |
452 | memcpy(p->sha1, sha1, 20); | |
1f688557 JH |
453 | return p; |
454 | } | |
455 | ||
/*
 * Load the index of the pack named by "sha1" from its standard
 * location (see sha1_pack_index_name()).  Returns what
 * parse_pack_index_file() returns.
 */
struct packed_git *parse_pack_index(unsigned char *sha1)
{
	return parse_pack_index_file(sha1, sha1_pack_index_name(sha1));
}
461 | ||
2ab141a2 | 462 | struct packed_git *parse_pack_index_file(const unsigned char *sha1, char *idx_path) |
bf592c50 DB |
463 | { |
464 | struct packed_git *p; | |
465 | unsigned long idx_size; | |
466 | void *idx_map; | |
c508df5e | 467 | char *path; |
bf592c50 | 468 | |
c508df5e | 469 | if (check_packed_git_idx(idx_path, &idx_size, &idx_map)) |
bf592c50 DB |
470 | return NULL; |
471 | ||
472 | path = sha1_pack_name(sha1); | |
473 | ||
474 | p = xmalloc(sizeof(*p) + strlen(path) + 2); | |
475 | strcpy(p->pack_name, path); | |
476 | p->index_size = idx_size; | |
477 | p->pack_size = 0; | |
478 | p->index_base = idx_map; | |
479 | p->next = NULL; | |
480 | p->pack_base = NULL; | |
481 | p->pack_last_used = 0; | |
482 | p->pack_use_cnt = 0; | |
483 | memcpy(p->sha1, sha1, 20); | |
484 | return p; | |
485 | } | |
486 | ||
487 | void install_packed_git(struct packed_git *pack) | |
488 | { | |
489 | pack->next = packed_git; | |
490 | packed_git = pack; | |
491 | } | |
492 | ||
9d835df2 | 493 | static void prepare_packed_git_one(char *objdir, int local) |
1f688557 JH |
494 | { |
495 | char path[PATH_MAX]; | |
496 | int len; | |
497 | DIR *dir; | |
498 | struct dirent *de; | |
499 | ||
500 | sprintf(path, "%s/pack", objdir); | |
501 | len = strlen(path); | |
502 | dir = opendir(path); | |
503 | if (!dir) | |
504 | return; | |
505 | path[len++] = '/'; | |
506 | while ((de = readdir(dir)) != NULL) { | |
507 | int namelen = strlen(de->d_name); | |
508 | struct packed_git *p; | |
509 | ||
510 | if (strcmp(de->d_name + namelen - 4, ".idx")) | |
511 | continue; | |
512 | ||
513 | /* we have .idx. Is it a file we can map? */ | |
514 | strcpy(path + len, de->d_name); | |
9d835df2 | 515 | p = add_packed_git(path, len + namelen, local); |
1f688557 JH |
516 | if (!p) |
517 | continue; | |
518 | p->next = packed_git; | |
519 | packed_git = p; | |
520 | } | |
5b35bcd5 | 521 | closedir(dir); |
1f688557 JH |
522 | } |
523 | ||
9a217f2a | 524 | void prepare_packed_git(void) |
1f688557 | 525 | { |
1f688557 | 526 | static int run_once = 0; |
d5a63b99 | 527 | struct alternate_object_database *alt; |
1f688557 | 528 | |
d5a63b99 | 529 | if (run_once) |
1f688557 | 530 | return; |
9d835df2 | 531 | prepare_packed_git_one(get_object_directory(), 1); |
9a217f2a | 532 | prepare_alt_odb(); |
d5a63b99 JH |
533 | for (alt = alt_odb_list; alt; alt = alt->next) { |
534 | alt->name[0] = 0; | |
9d835df2 | 535 | prepare_packed_git_one(alt->base, 0); |
1f688557 | 536 | } |
d5a63b99 | 537 | run_once = 1; |
1f688557 JH |
538 | } |
539 | ||
5d6ccf5c | 540 | int check_sha1_signature(const unsigned char *sha1, void *map, unsigned long size, const char *type) |
0fcfd160 | 541 | { |
d98b46f8 | 542 | char header[100]; |
0fcfd160 LT |
543 | unsigned char real_sha1[20]; |
544 | SHA_CTX c; | |
545 | ||
546 | SHA1_Init(&c); | |
d98b46f8 | 547 | SHA1_Update(&c, header, 1+sprintf(header, "%s %lu", type, size)); |
0fcfd160 LT |
548 | SHA1_Update(&c, map, size); |
549 | SHA1_Final(real_sha1, &c); | |
550 | return memcmp(sha1, real_sha1, 20) ? -1 : 0; | |
551 | } | |
552 | ||
1f688557 | 553 | static void *map_sha1_file_internal(const unsigned char *sha1, |
d5f1befc | 554 | unsigned long *size) |
0fcfd160 | 555 | { |
0fcfd160 LT |
556 | struct stat st; |
557 | void *map; | |
144bde78 | 558 | int fd; |
ace1534d JH |
559 | char *filename = find_sha1_file(sha1, &st); |
560 | ||
561 | if (!filename) { | |
ace1534d JH |
562 | return NULL; |
563 | } | |
0fcfd160 | 564 | |
144bde78 | 565 | fd = open(filename, O_RDONLY | sha1_file_open_flag); |
0fcfd160 | 566 | if (fd < 0) { |
144bde78 LT |
567 | /* See if it works without O_NOATIME */ |
568 | switch (sha1_file_open_flag) { | |
569 | default: | |
570 | fd = open(filename, O_RDONLY); | |
571 | if (fd >= 0) | |
572 | break; | |
573 | /* Fallthrough */ | |
574 | case 0: | |
144bde78 LT |
575 | return NULL; |
576 | } | |
577 | ||
1f688557 JH |
578 | /* If it failed once, it will probably fail again. |
579 | * Stop using O_NOATIME | |
580 | */ | |
144bde78 | 581 | sha1_file_open_flag = 0; |
0fcfd160 | 582 | } |
0fcfd160 LT |
583 | map = mmap(NULL, st.st_size, PROT_READ, MAP_PRIVATE, fd, 0); |
584 | close(fd); | |
e35f9824 | 585 | if (map == MAP_FAILED) |
0fcfd160 LT |
586 | return NULL; |
587 | *size = st.st_size; | |
588 | return map; | |
589 | } | |
590 | ||
c4483576 LT |
591 | int unpack_sha1_header(z_stream *stream, void *map, unsigned long mapsize, void *buffer, unsigned long size) |
592 | { | |
593 | /* Get the data stream */ | |
594 | memset(stream, 0, sizeof(*stream)); | |
595 | stream->next_in = map; | |
596 | stream->avail_in = mapsize; | |
597 | stream->next_out = buffer; | |
598 | stream->avail_out = size; | |
599 | ||
600 | inflateInit(stream); | |
601 | return inflate(stream, 0); | |
602 | } | |
603 | ||
6da4016a | 604 | static void *unpack_sha1_rest(z_stream *stream, void *buffer, unsigned long size) |
5180cacc LT |
605 | { |
606 | int bytes = strlen(buffer) + 1; | |
d565b341 | 607 | unsigned char *buf = xmalloc(1+size); |
5180cacc LT |
608 | |
609 | memcpy(buf, buffer + bytes, stream->total_out - bytes); | |
610 | bytes = stream->total_out - bytes; | |
611 | if (bytes < size) { | |
612 | stream->next_out = buf + bytes; | |
613 | stream->avail_out = size - bytes; | |
614 | while (inflate(stream, Z_FINISH) == Z_OK) | |
615 | /* nothing */; | |
616 | } | |
617 | buf[size] = 0; | |
618 | inflateEnd(stream); | |
619 | return buf; | |
620 | } | |
621 | ||
/*
 * We used to just use "sscanf()", but that's actually way
 * too permissive for what we want to check. So parse the
 * object header strictly by hand.
 *
 * "hdr" must look like "<type> <size>" followed by a NUL.  The type
 * is copied into "type" (NUL-terminated) and the size is stored in
 * "sizep".  Returns 0 on success and -1 on a malformed header.
 */
int parse_sha1_header(char *hdr, char *type, unsigned long *sizep)
{
	int i;
	unsigned long size;

	/*
	 * The type can be at most ten bytes (including the
	 * terminating '\0' that we add), and is followed by
	 * a space.
	 */
	i = 10;
	for (;;) {
		char c = *hdr++;
		if (c == ' ')
			break;
		/* the header ended before the space: do not read on */
		if (!c)
			return -1;
		if (!--i)
			return -1;
		*type++ = c;
	}
	*type = 0;

	/*
	 * The length must follow immediately, and be in canonical
	 * decimal format (ie "010" is not valid).
	 */
	size = *hdr++ - '0';
	if (size > 9)
		return -1;
	if (size) {
		for (;;) {
			unsigned long c = *hdr - '0';
			if (c > 9)
				break;
			hdr++;
			size = size * 10 + c;
		}
	}
	*sizep = size;

	/*
	 * The length must be followed by a zero byte
	 */
	return *hdr ? -1 : 0;
}
671 | ||
0fcfd160 LT |
672 | void * unpack_sha1_file(void *map, unsigned long mapsize, char *type, unsigned long *size) |
673 | { | |
5180cacc | 674 | int ret; |
0fcfd160 | 675 | z_stream stream; |
5180cacc | 676 | char hdr[8192]; |
0fcfd160 | 677 | |
5180cacc LT |
678 | ret = unpack_sha1_header(&stream, map, mapsize, hdr, sizeof(hdr)); |
679 | if (ret < Z_OK || parse_sha1_header(hdr, type, size) < 0) | |
0fcfd160 LT |
680 | return NULL; |
681 | ||
5180cacc | 682 | return unpack_sha1_rest(&stream, hdr, *size); |
0fcfd160 LT |
683 | } |
684 | ||
f3bf9224 JH |
685 | /* forward declaration for a mutually recursive function */ |
686 | static int packed_object_info(struct pack_entry *entry, | |
687 | char *type, unsigned long *sizep); | |
688 | ||
5db47c2b JH |
689 | static int packed_delta_info(unsigned char *base_sha1, |
690 | unsigned long delta_size, | |
691 | unsigned long left, | |
692 | char *type, | |
f3bf9224 JH |
693 | unsigned long *sizep, |
694 | struct packed_git *p) | |
5db47c2b | 695 | { |
f3bf9224 JH |
696 | struct pack_entry base_ent; |
697 | ||
5db47c2b JH |
698 | if (left < 20) |
699 | die("truncated pack file"); | |
5db47c2b | 700 | |
f3bf9224 JH |
701 | /* The base entry _must_ be in the same pack */ |
702 | if (!find_pack_entry_one(base_sha1, &base_ent, p)) | |
703 | die("failed to find delta-pack base object %s", | |
704 | sha1_to_hex(base_sha1)); | |
705 | ||
c62266f3 JH |
706 | /* We choose to only get the type of the base object and |
707 | * ignore potentially corrupt pack file that expects the delta | |
708 | * based on a base with a wrong size. This saves tons of | |
709 | * inflate() calls. | |
710 | */ | |
5db47c2b | 711 | |
f3bf9224 | 712 | if (packed_object_info(&base_ent, type, NULL)) |
c62266f3 | 713 | die("cannot get info for delta-pack base"); |
5db47c2b | 714 | |
c62266f3 JH |
715 | if (sizep) { |
716 | const unsigned char *data; | |
717 | unsigned char delta_head[64]; | |
718 | unsigned long result_size; | |
719 | z_stream stream; | |
720 | int st; | |
721 | ||
722 | memset(&stream, 0, sizeof(stream)); | |
723 | ||
724 | data = stream.next_in = base_sha1 + 20; | |
725 | stream.avail_in = left - 20; | |
726 | stream.next_out = delta_head; | |
727 | stream.avail_out = sizeof(delta_head); | |
728 | ||
729 | inflateInit(&stream); | |
730 | st = inflate(&stream, Z_FINISH); | |
731 | inflateEnd(&stream); | |
732 | if ((st != Z_STREAM_END) && | |
733 | stream.total_out != sizeof(delta_head)) | |
734 | die("delta data unpack-initial failed"); | |
735 | ||
736 | /* Examine the initial part of the delta to figure out | |
737 | * the result size. | |
738 | */ | |
739 | data = delta_head; | |
740 | get_delta_hdr_size(&data); /* ignore base size */ | |
5db47c2b | 741 | |
c62266f3 JH |
742 | /* Read the result size */ |
743 | result_size = get_delta_hdr_size(&data); | |
744 | *sizep = result_size; | |
745 | } | |
5db47c2b JH |
746 | return 0; |
747 | } | |
748 | ||
a733cb60 LT |
749 | static unsigned long unpack_object_header(struct packed_git *p, unsigned long offset, |
750 | enum object_type *type, unsigned long *sizep) | |
751 | { | |
01247d87 | 752 | unsigned shift; |
a733cb60 LT |
753 | unsigned char *pack, c; |
754 | unsigned long size; | |
755 | ||
756 | if (offset >= p->pack_size) | |
757 | die("object offset outside of pack file"); | |
758 | ||
759 | pack = p->pack_base + offset; | |
760 | c = *pack++; | |
761 | offset++; | |
762 | *type = (c >> 4) & 7; | |
763 | size = c & 15; | |
01247d87 | 764 | shift = 4; |
a733cb60 LT |
765 | while (c & 0x80) { |
766 | if (offset >= p->pack_size) | |
767 | die("object offset outside of pack file"); | |
768 | c = *pack++; | |
769 | offset++; | |
01247d87 LT |
770 | size += (c & 0x7f) << shift; |
771 | shift += 7; | |
a733cb60 LT |
772 | } |
773 | *sizep = size; | |
774 | return offset; | |
775 | } | |
776 | ||
ad8c80a5 JH |
777 | void packed_object_info_detail(struct pack_entry *e, |
778 | char *type, | |
779 | unsigned long *size, | |
780 | unsigned long *store_size, | |
781 | int *delta_chain_length, | |
782 | unsigned char *base_sha1) | |
783 | { | |
784 | struct packed_git *p = e->p; | |
785 | unsigned long offset, left; | |
786 | unsigned char *pack; | |
787 | enum object_type kind; | |
788 | ||
789 | offset = unpack_object_header(p, e->offset, &kind, size); | |
790 | pack = p->pack_base + offset; | |
791 | left = p->pack_size - offset; | |
792 | if (kind != OBJ_DELTA) | |
793 | *delta_chain_length = 0; | |
794 | else { | |
795 | int chain_length = 0; | |
796 | memcpy(base_sha1, pack, 20); | |
797 | do { | |
798 | struct pack_entry base_ent; | |
799 | unsigned long junk; | |
800 | ||
801 | find_pack_entry_one(pack, &base_ent, p); | |
802 | offset = unpack_object_header(p, base_ent.offset, | |
803 | &kind, &junk); | |
804 | pack = p->pack_base + offset; | |
805 | chain_length++; | |
806 | } while (kind == OBJ_DELTA); | |
807 | *delta_chain_length = chain_length; | |
808 | } | |
809 | switch (kind) { | |
810 | case OBJ_COMMIT: | |
811 | strcpy(type, "commit"); | |
812 | break; | |
813 | case OBJ_TREE: | |
814 | strcpy(type, "tree"); | |
815 | break; | |
816 | case OBJ_BLOB: | |
817 | strcpy(type, "blob"); | |
818 | break; | |
819 | case OBJ_TAG: | |
820 | strcpy(type, "tag"); | |
821 | break; | |
822 | default: | |
264b16b6 JH |
823 | die("corrupted pack file %s containing object of kind %d", |
824 | p->pack_name, kind); | |
ad8c80a5 JH |
825 | } |
826 | *store_size = 0; /* notyet */ | |
827 | } | |
828 | ||
1f688557 JH |
829 | static int packed_object_info(struct pack_entry *entry, |
830 | char *type, unsigned long *sizep) | |
831 | { | |
832 | struct packed_git *p = entry->p; | |
833 | unsigned long offset, size, left; | |
834 | unsigned char *pack; | |
a733cb60 | 835 | enum object_type kind; |
f9253394 | 836 | int retval; |
5db47c2b JH |
837 | |
838 | if (use_packed_git(p)) | |
839 | die("cannot map packed file"); | |
840 | ||
a733cb60 | 841 | offset = unpack_object_header(p, entry->offset, &kind, &size); |
1f688557 | 842 | pack = p->pack_base + offset; |
a733cb60 LT |
843 | left = p->pack_size - offset; |
844 | ||
845 | switch (kind) { | |
846 | case OBJ_DELTA: | |
f3bf9224 | 847 | retval = packed_delta_info(pack, size, left, type, sizep, p); |
f9253394 JH |
848 | unuse_packed_git(p); |
849 | return retval; | |
a733cb60 | 850 | case OBJ_COMMIT: |
1f688557 JH |
851 | strcpy(type, "commit"); |
852 | break; | |
a733cb60 | 853 | case OBJ_TREE: |
1f688557 JH |
854 | strcpy(type, "tree"); |
855 | break; | |
a733cb60 | 856 | case OBJ_BLOB: |
1f688557 JH |
857 | strcpy(type, "blob"); |
858 | break; | |
a733cb60 | 859 | case OBJ_TAG: |
a69d0943 LT |
860 | strcpy(type, "tag"); |
861 | break; | |
1f688557 | 862 | default: |
264b16b6 JH |
863 | die("corrupted pack file %s containing object of kind %d", |
864 | p->pack_name, kind); | |
1f688557 | 865 | } |
c62266f3 JH |
866 | if (sizep) |
867 | *sizep = size; | |
f9253394 | 868 | unuse_packed_git(p); |
1f688557 JH |
869 | return 0; |
870 | } | |
871 | ||
872 | /* forward declaration for a mutually recursive function */ | |
873 | static void *unpack_entry(struct pack_entry *, char *, unsigned long *); | |
874 | ||
875 | static void *unpack_delta_entry(unsigned char *base_sha1, | |
876 | unsigned long delta_size, | |
877 | unsigned long left, | |
878 | char *type, | |
f3bf9224 JH |
879 | unsigned long *sizep, |
880 | struct packed_git *p) | |
1f688557 | 881 | { |
f3bf9224 | 882 | struct pack_entry base_ent; |
1f688557 JH |
883 | void *data, *delta_data, *result, *base; |
884 | unsigned long data_size, result_size, base_size; | |
885 | z_stream stream; | |
886 | int st; | |
887 | ||
888 | if (left < 20) | |
889 | die("truncated pack file"); | |
890 | data = base_sha1 + 20; | |
891 | data_size = left - 20; | |
892 | delta_data = xmalloc(delta_size); | |
893 | ||
894 | memset(&stream, 0, sizeof(stream)); | |
895 | ||
896 | stream.next_in = data; | |
897 | stream.avail_in = data_size; | |
898 | stream.next_out = delta_data; | |
899 | stream.avail_out = delta_size; | |
900 | ||
901 | inflateInit(&stream); | |
902 | st = inflate(&stream, Z_FINISH); | |
903 | inflateEnd(&stream); | |
904 | if ((st != Z_STREAM_END) || stream.total_out != delta_size) | |
905 | die("delta data unpack failed"); | |
906 | ||
f3bf9224 JH |
907 | /* The base entry _must_ be in the same pack */ |
908 | if (!find_pack_entry_one(base_sha1, &base_ent, p)) | |
909 | die("failed to find delta-pack base object %s", | |
910 | sha1_to_hex(base_sha1)); | |
911 | base = unpack_entry_gently(&base_ent, type, &base_size); | |
1f688557 JH |
912 | if (!base) |
913 | die("failed to read delta-pack base object %s", | |
914 | sha1_to_hex(base_sha1)); | |
915 | result = patch_delta(base, base_size, | |
916 | delta_data, delta_size, | |
917 | &result_size); | |
918 | if (!result) | |
919 | die("failed to apply delta"); | |
920 | free(delta_data); | |
921 | free(base); | |
922 | *sizep = result_size; | |
923 | return result; | |
924 | } | |
925 | ||
926 | static void *unpack_non_delta_entry(unsigned char *data, | |
927 | unsigned long size, | |
928 | unsigned long left) | |
929 | { | |
930 | int st; | |
931 | z_stream stream; | |
4d235c80 | 932 | unsigned char *buffer; |
1f688557 JH |
933 | |
934 | buffer = xmalloc(size + 1); | |
935 | buffer[size] = 0; | |
936 | memset(&stream, 0, sizeof(stream)); | |
937 | stream.next_in = data; | |
938 | stream.avail_in = left; | |
939 | stream.next_out = buffer; | |
940 | stream.avail_out = size; | |
941 | ||
942 | inflateInit(&stream); | |
943 | st = inflate(&stream, Z_FINISH); | |
944 | inflateEnd(&stream); | |
945 | if ((st != Z_STREAM_END) || stream.total_out != size) { | |
946 | free(buffer); | |
947 | return NULL; | |
948 | } | |
949 | ||
950 | return buffer; | |
951 | } | |
952 | ||
953 | static void *unpack_entry(struct pack_entry *entry, | |
954 | char *type, unsigned long *sizep) | |
955 | { | |
956 | struct packed_git *p = entry->p; | |
f9253394 | 957 | void *retval; |
1f688557 JH |
958 | |
959 | if (use_packed_git(p)) | |
960 | die("cannot map packed file"); | |
f3bf9224 JH |
961 | retval = unpack_entry_gently(entry, type, sizep); |
962 | unuse_packed_git(p); | |
963 | if (!retval) | |
264b16b6 | 964 | die("corrupted pack file %s", p->pack_name); |
f3bf9224 JH |
965 | return retval; |
966 | } | |
967 | ||
968 | /* The caller is responsible for use_packed_git()/unuse_packed_git() pair */ | |
969 | void *unpack_entry_gently(struct pack_entry *entry, | |
970 | char *type, unsigned long *sizep) | |
971 | { | |
972 | struct packed_git *p = entry->p; | |
973 | unsigned long offset, size, left; | |
974 | unsigned char *pack; | |
975 | enum object_type kind; | |
976 | void *retval; | |
1f688557 | 977 | |
a733cb60 | 978 | offset = unpack_object_header(p, entry->offset, &kind, &size); |
1f688557 | 979 | pack = p->pack_base + offset; |
a733cb60 LT |
980 | left = p->pack_size - offset; |
981 | switch (kind) { | |
982 | case OBJ_DELTA: | |
f3bf9224 | 983 | retval = unpack_delta_entry(pack, size, left, type, sizep, p); |
f9253394 | 984 | return retval; |
a733cb60 | 985 | case OBJ_COMMIT: |
1f688557 JH |
986 | strcpy(type, "commit"); |
987 | break; | |
a733cb60 | 988 | case OBJ_TREE: |
1f688557 JH |
989 | strcpy(type, "tree"); |
990 | break; | |
a733cb60 | 991 | case OBJ_BLOB: |
1f688557 JH |
992 | strcpy(type, "blob"); |
993 | break; | |
a733cb60 | 994 | case OBJ_TAG: |
a69d0943 LT |
995 | strcpy(type, "tag"); |
996 | break; | |
1f688557 | 997 | default: |
f3bf9224 | 998 | return NULL; |
1f688557 JH |
999 | } |
1000 | *sizep = size; | |
f9253394 | 1001 | retval = unpack_non_delta_entry(pack, size, left); |
f9253394 | 1002 | return retval; |
1f688557 JH |
1003 | } |
1004 | ||
9a217f2a JH |
1005 | int num_packed_objects(const struct packed_git *p) |
1006 | { | |
f9253394 | 1007 | /* See check_packed_git_idx() */ |
9a217f2a JH |
1008 | return (p->index_size - 20 - 20 - 4*256) / 24; |
1009 | } | |
1010 | ||
1011 | int nth_packed_object_sha1(const struct packed_git *p, int n, | |
1012 | unsigned char* sha1) | |
1013 | { | |
1014 | void *index = p->index_base + 256; | |
1015 | if (n < 0 || num_packed_objects(p) <= n) | |
1016 | return -1; | |
1017 | memcpy(sha1, (index + 24 * n + 4), 20); | |
1018 | return 0; | |
1019 | } | |
1020 | ||
f3bf9224 JH |
1021 | int find_pack_entry_one(const unsigned char *sha1, |
1022 | struct pack_entry *e, struct packed_git *p) | |
1f688557 | 1023 | { |
4d235c80 | 1024 | unsigned int *level1_ofs = p->index_base; |
1f688557 JH |
1025 | int hi = ntohl(level1_ofs[*sha1]); |
1026 | int lo = ((*sha1 == 0x0) ? 0 : ntohl(level1_ofs[*sha1 - 1])); | |
1027 | void *index = p->index_base + 256; | |
1028 | ||
1029 | do { | |
1030 | int mi = (lo + hi) / 2; | |
1031 | int cmp = memcmp(index + 24 * mi + 4, sha1, 20); | |
1032 | if (!cmp) { | |
1033 | e->offset = ntohl(*((int*)(index + 24 * mi))); | |
1034 | memcpy(e->sha1, sha1, 20); | |
1035 | e->p = p; | |
1036 | return 1; | |
1037 | } | |
1038 | if (cmp > 0) | |
1039 | hi = mi; | |
1040 | else | |
1041 | lo = mi+1; | |
1042 | } while (lo < hi); | |
1043 | return 0; | |
1044 | } | |
1045 | ||
1046 | static int find_pack_entry(const unsigned char *sha1, struct pack_entry *e) | |
1047 | { | |
1048 | struct packed_git *p; | |
1049 | prepare_packed_git(); | |
1050 | ||
1051 | for (p = packed_git; p; p = p->next) { | |
f3bf9224 | 1052 | if (find_pack_entry_one(sha1, e, p)) |
1f688557 JH |
1053 | return 1; |
1054 | } | |
1055 | return 0; | |
1056 | } | |
1057 | ||
bf592c50 DB |
1058 | struct packed_git *find_sha1_pack(const unsigned char *sha1, |
1059 | struct packed_git *packs) | |
1060 | { | |
1061 | struct packed_git *p; | |
1062 | struct pack_entry e; | |
1063 | ||
1064 | for (p = packs; p; p = p->next) { | |
1065 | if (find_pack_entry_one(sha1, &e, p)) | |
1066 | return p; | |
1067 | } | |
1068 | return NULL; | |
1069 | ||
1070 | } | |
1071 | ||
36e4d74a | 1072 | int sha1_object_info(const unsigned char *sha1, char *type, unsigned long *sizep) |
65c2e0c3 | 1073 | { |
36e4d74a | 1074 | int status; |
65c2e0c3 JH |
1075 | unsigned long mapsize, size; |
1076 | void *map; | |
1077 | z_stream stream; | |
36e4d74a | 1078 | char hdr[128]; |
65c2e0c3 | 1079 | |
d5f1befc | 1080 | map = map_sha1_file_internal(sha1, &mapsize); |
1f688557 JH |
1081 | if (!map) { |
1082 | struct pack_entry e; | |
1083 | ||
1084 | if (!find_pack_entry(sha1, &e)) | |
1085 | return error("unable to find %s", sha1_to_hex(sha1)); | |
c62266f3 | 1086 | return packed_object_info(&e, type, sizep); |
1f688557 | 1087 | } |
36e4d74a JH |
1088 | if (unpack_sha1_header(&stream, map, mapsize, hdr, sizeof(hdr)) < 0) |
1089 | status = error("unable to unpack %s header", | |
1090 | sha1_to_hex(sha1)); | |
1091 | if (parse_sha1_header(hdr, type, &size) < 0) | |
1092 | status = error("unable to parse %s header", sha1_to_hex(sha1)); | |
c4584ae3 | 1093 | else { |
65c2e0c3 | 1094 | status = 0; |
c62266f3 JH |
1095 | if (sizep) |
1096 | *sizep = size; | |
65c2e0c3 | 1097 | } |
65c2e0c3 JH |
1098 | inflateEnd(&stream); |
1099 | munmap(map, mapsize); | |
1100 | return status; | |
1101 | } | |
1102 | ||
1f688557 JH |
1103 | static void *read_packed_sha1(const unsigned char *sha1, char *type, unsigned long *size) |
1104 | { | |
1105 | struct pack_entry e; | |
1106 | ||
1107 | if (!find_pack_entry(sha1, &e)) { | |
1108 | error("cannot read sha1_file for %s", sha1_to_hex(sha1)); | |
1109 | return NULL; | |
1110 | } | |
1111 | return unpack_entry(&e, type, size); | |
1112 | } | |
1113 | ||
0fcfd160 LT |
1114 | void * read_sha1_file(const unsigned char *sha1, char *type, unsigned long *size) |
1115 | { | |
1116 | unsigned long mapsize; | |
1117 | void *map, *buf; | |
ab90ea5d | 1118 | struct pack_entry e; |
0fcfd160 | 1119 | |
ab90ea5d JH |
1120 | if (find_pack_entry(sha1, &e)) |
1121 | return read_packed_sha1(sha1, type, size); | |
d5f1befc | 1122 | map = map_sha1_file_internal(sha1, &mapsize); |
0fcfd160 LT |
1123 | if (map) { |
1124 | buf = unpack_sha1_file(map, mapsize, type, size); | |
1125 | munmap(map, mapsize); | |
1126 | return buf; | |
1127 | } | |
ab90ea5d | 1128 | return NULL; |
0fcfd160 LT |
1129 | } |
1130 | ||
/*
 * Read object "sha1", following references until an object of
 * "required_type" is reached: a commit is followed through its
 * leading "tree " line and a tag through its leading "object " line.
 *
 * On success returns the object data, stores its size in *size and,
 * when actual_sha1_return is non-NULL, the SHA-1 of the object that
 * was finally read.  Returns NULL when an object cannot be read, has
 * a type that cannot be followed, or does not start with the expected
 * reference line.
 */
void *read_object_with_reference(const unsigned char *sha1,
				 const char *required_type,
				 unsigned long *size,
				 unsigned char *actual_sha1_return)
{
	char type[20];
	void *buffer;
	unsigned long isize;
	unsigned char actual_sha1[20];

	memcpy(actual_sha1, sha1, 20);
	while (1) {
		unsigned long ref_length;
		const char *ref_type;

		buffer = read_sha1_file(actual_sha1, type, &isize);
		if (!buffer)
			return NULL;
		if (!strcmp(type, required_type)) {
			*size = isize;
			if (actual_sha1_return)
				memcpy(actual_sha1_return, actual_sha1, 20);
			return buffer;
		}
		/* Handle references */
		else if (!strcmp(type, "commit"))
			ref_type = "tree ";
		else if (!strcmp(type, "tag"))
			ref_type = "object ";
		else {
			free(buffer);
			return NULL;
		}
		ref_length = strlen(ref_type);

		/*
		 * The object must be long enough to hold the prefix and
		 * 40 hex digits before either is examined.
		 */
		if (isize < ref_length + 40 ||
		    memcmp(buffer, ref_type, ref_length) ||
		    get_sha1_hex((char *)buffer + ref_length, actual_sha1)) {
			free(buffer);
			return NULL;
		}
		free(buffer);
		/* Now we have the ID of the referred-to object in
		 * actual_sha1.  Check again. */
	}
}
1176 | ||
7672db20 BL |
1177 | char *write_sha1_file_prepare(void *buf, |
1178 | unsigned long len, | |
1179 | const char *type, | |
1180 | unsigned char *sha1, | |
1181 | unsigned char *hdr, | |
1182 | int *hdrlen) | |
d410c0f5 JH |
1183 | { |
1184 | SHA_CTX c; | |
1185 | ||
1186 | /* Generate the header */ | |
1187 | *hdrlen = sprintf((char *)hdr, "%s %lu", type, len)+1; | |
1188 | ||
1189 | /* Sha1.. */ | |
1190 | SHA1_Init(&c); | |
1191 | SHA1_Update(&c, hdr, *hdrlen); | |
1192 | SHA1_Update(&c, buf, len); | |
1193 | SHA1_Final(sha1, &c); | |
1194 | ||
1195 | return sha1_file_name(sha1); | |
1196 | } | |
1197 | ||
/*
 * Hard-link "tmpfile" to "filename".  If the first attempt fails with
 * ENOENT, try to create the last directory level of "filename" and
 * link once more.
 *
 * "filename" is modified temporarily while the directory is created
 * and restored before returning.
 *
 * Returns 0 on success, the errno of the failing link() otherwise.
 */
static int link_temp_to_file(const char *tmpfile, char *filename)
{
	int err;
	char *slash;

	if (link(tmpfile, filename) == 0)
		return 0;

	err = errno;
	if (err != ENOENT)
		return err;

	slash = strrchr(filename, '/');
	if (!slash)
		return err;

	/*
	 * The result of mkdir() is deliberately ignored: link() is
	 * retried regardless, since a race might mean that somebody
	 * else created the directory.
	 */
	*slash = 0;
	mkdir(filename, 0777);
	*slash = '/';

	if (link(tmpfile, filename) == 0)
		return 0;
	return errno;
}
1233 | ||
/*
 * Move the just written object into its final resting place.
 *
 * Returns 0 when the object is in place (including when "filename"
 * already existed), -1 after printing a message otherwise.
 */
int move_temp_to_file(const char *tmpfile, char *filename)
{
	int err = link_temp_to_file(tmpfile, filename);

	/*
	 * Coda hack - coda doesn't like cross-directory links,
	 * so we fall back to a rename, which will mean that it
	 * won't be able to check collisions, but that's not a
	 * big deal.
	 *
	 * The same holds for FAT formatted media.
	 *
	 * When this succeeds, we just return 0. We have nothing
	 * left to unlink.
	 */
	if (err != 0 && err != EEXIST) {
		if (rename(tmpfile, filename) == 0)
			return 0;
		err = errno;
	}
	unlink(tmpfile);

	if (err == 0)
		return 0;
	if (err == EEXIST) {
		/* FIXME!!! Collision check here ? */
		return 0;
	}

	fprintf(stderr, "unable to write sha1 filename %s: %s", filename, strerror(err));
	return -1;
}
1268 | ||
bf0f910d | 1269 | int write_sha1_file(void *buf, unsigned long len, const char *type, unsigned char *returnsha1) |
0fcfd160 LT |
1270 | { |
1271 | int size; | |
bf0f910d | 1272 | unsigned char *compressed; |
0fcfd160 LT |
1273 | z_stream stream; |
1274 | unsigned char sha1[20]; | |
706bc531 | 1275 | char *filename; |
aac17941 | 1276 | static char tmpfile[PATH_MAX]; |
bf0f910d | 1277 | unsigned char hdr[50]; |
230f1322 | 1278 | int fd, hdrlen; |
a44c9a5e | 1279 | |
d410c0f5 JH |
1280 | /* Normally if we have it in the pack then we do not bother writing |
1281 | * it out into .git/objects/??/?{38} file. | |
1282 | */ | |
1283 | filename = write_sha1_file_prepare(buf, len, type, sha1, hdr, &hdrlen); | |
706bc531 LT |
1284 | if (returnsha1) |
1285 | memcpy(returnsha1, sha1, 20); | |
d410c0f5 JH |
1286 | if (has_sha1_file(sha1)) |
1287 | return 0; | |
aac17941 LT |
1288 | fd = open(filename, O_RDONLY); |
1289 | if (fd >= 0) { | |
706bc531 | 1290 | /* |
aac17941 LT |
1291 | * FIXME!!! We might do collision checking here, but we'd |
1292 | * need to uncompress the old file and check it. Later. | |
706bc531 | 1293 | */ |
aac17941 | 1294 | close(fd); |
706bc531 LT |
1295 | return 0; |
1296 | } | |
1297 | ||
aac17941 LT |
1298 | if (errno != ENOENT) { |
1299 | fprintf(stderr, "sha1 file %s: %s", filename, strerror(errno)); | |
1300 | return -1; | |
1301 | } | |
1302 | ||
1303 | snprintf(tmpfile, sizeof(tmpfile), "%s/obj_XXXXXX", get_object_directory()); | |
ace1534d | 1304 | |
aac17941 LT |
1305 | fd = mkstemp(tmpfile); |
1306 | if (fd < 0) { | |
1307 | fprintf(stderr, "unable to create temporary sha1 filename %s: %s", tmpfile, strerror(errno)); | |
1308 | return -1; | |
1309 | } | |
1310 | ||
0fcfd160 LT |
1311 | /* Set it up */ |
1312 | memset(&stream, 0, sizeof(stream)); | |
1313 | deflateInit(&stream, Z_BEST_COMPRESSION); | |
a44c9a5e | 1314 | size = deflateBound(&stream, len+hdrlen); |
812666c8 | 1315 | compressed = xmalloc(size); |
0fcfd160 LT |
1316 | |
1317 | /* Compress it */ | |
0fcfd160 LT |
1318 | stream.next_out = compressed; |
1319 | stream.avail_out = size; | |
a44c9a5e LT |
1320 | |
1321 | /* First header.. */ | |
1322 | stream.next_in = hdr; | |
1323 | stream.avail_in = hdrlen; | |
1324 | while (deflate(&stream, 0) == Z_OK) | |
6ffcee88 | 1325 | /* nothing */; |
a44c9a5e LT |
1326 | |
1327 | /* Then the data itself.. */ | |
1328 | stream.next_in = buf; | |
1329 | stream.avail_in = len; | |
0fcfd160 LT |
1330 | while (deflate(&stream, Z_FINISH) == Z_OK) |
1331 | /* nothing */; | |
1332 | deflateEnd(&stream); | |
1333 | size = stream.total_out; | |
1334 | ||
706bc531 LT |
1335 | if (write(fd, compressed, size) != size) |
1336 | die("unable to write file"); | |
aac17941 | 1337 | fchmod(fd, 0444); |
706bc531 | 1338 | close(fd); |
383f85b7 | 1339 | free(compressed); |
0fcfd160 | 1340 | |
230f1322 | 1341 | return move_temp_to_file(tmpfile, filename); |
0fcfd160 | 1342 | } |
8237b185 | 1343 | |
a5eda52b DB |
1344 | int write_sha1_to_fd(int fd, const unsigned char *sha1) |
1345 | { | |
1346 | ssize_t size; | |
1347 | unsigned long objsize; | |
1348 | int posn = 0; | |
bfc66daf SV |
1349 | void *map = map_sha1_file_internal(sha1, &objsize); |
1350 | void *buf = map; | |
1351 | void *temp_obj = NULL; | |
a5eda52b | 1352 | z_stream stream; |
bfc66daf | 1353 | |
a5eda52b DB |
1354 | if (!buf) { |
1355 | unsigned char *unpacked; | |
1356 | unsigned long len; | |
1357 | char type[20]; | |
1358 | char hdr[50]; | |
1359 | int hdrlen; | |
1360 | // need to unpack and recompress it by itself | |
1361 | unpacked = read_packed_sha1(sha1, type, &len); | |
1362 | ||
1363 | hdrlen = sprintf(hdr, "%s %lu", type, len) + 1; | |
1364 | ||
1365 | /* Set it up */ | |
1366 | memset(&stream, 0, sizeof(stream)); | |
1367 | deflateInit(&stream, Z_BEST_COMPRESSION); | |
1368 | size = deflateBound(&stream, len + hdrlen); | |
bfc66daf | 1369 | temp_obj = buf = xmalloc(size); |
a5eda52b DB |
1370 | |
1371 | /* Compress it */ | |
1372 | stream.next_out = buf; | |
1373 | stream.avail_out = size; | |
1374 | ||
1375 | /* First header.. */ | |
0ee19dce | 1376 | stream.next_in = (void *)hdr; |
a5eda52b DB |
1377 | stream.avail_in = hdrlen; |
1378 | while (deflate(&stream, 0) == Z_OK) | |
1379 | /* nothing */; | |
1380 | ||
1381 | /* Then the data itself.. */ | |
1382 | stream.next_in = unpacked; | |
1383 | stream.avail_in = len; | |
1384 | while (deflate(&stream, Z_FINISH) == Z_OK) | |
1385 | /* nothing */; | |
1386 | deflateEnd(&stream); | |
bfc66daf | 1387 | free(unpacked); |
a5eda52b DB |
1388 | |
1389 | objsize = stream.total_out; | |
1390 | } | |
1391 | ||
1392 | do { | |
1393 | size = write(fd, buf + posn, objsize - posn); | |
1394 | if (size <= 0) { | |
1395 | if (!size) { | |
1396 | fprintf(stderr, "write closed"); | |
1397 | } else { | |
1398 | perror("write "); | |
1399 | } | |
1400 | return -1; | |
1401 | } | |
1402 | posn += size; | |
1403 | } while (posn < objsize); | |
bfc66daf SV |
1404 | |
1405 | if (map) | |
1406 | munmap(map, objsize); | |
1407 | if (temp_obj) | |
1408 | free(temp_obj); | |
1409 | ||
a5eda52b DB |
1410 | return 0; |
1411 | } | |
1412 | ||
70b9829e DB |
1413 | int write_sha1_from_fd(const unsigned char *sha1, int fd, char *buffer, |
1414 | size_t bufsize, size_t *bufposn) | |
8237b185 | 1415 | { |
230f1322 | 1416 | char tmpfile[PATH_MAX]; |
8237b185 DB |
1417 | int local; |
1418 | z_stream stream; | |
1419 | unsigned char real_sha1[20]; | |
bf0f910d | 1420 | unsigned char discard[4096]; |
8237b185 DB |
1421 | int ret; |
1422 | SHA_CTX c; | |
1423 | ||
230f1322 | 1424 | snprintf(tmpfile, sizeof(tmpfile), "%s/obj_XXXXXX", get_object_directory()); |
8237b185 | 1425 | |
230f1322 | 1426 | local = mkstemp(tmpfile); |
8237b185 | 1427 | if (local < 0) |
230f1322 | 1428 | return error("Couldn't open %s for %s\n", tmpfile, sha1_to_hex(sha1)); |
8237b185 DB |
1429 | |
1430 | memset(&stream, 0, sizeof(stream)); | |
1431 | ||
1432 | inflateInit(&stream); | |
1433 | ||
1434 | SHA1_Init(&c); | |
1435 | ||
1436 | do { | |
1437 | ssize_t size; | |
70b9829e DB |
1438 | if (*bufposn) { |
1439 | stream.avail_in = *bufposn; | |
96ad15ae | 1440 | stream.next_in = (unsigned char *) buffer; |
70b9829e DB |
1441 | do { |
1442 | stream.next_out = discard; | |
1443 | stream.avail_out = sizeof(discard); | |
1444 | ret = inflate(&stream, Z_SYNC_FLUSH); | |
1445 | SHA1_Update(&c, discard, sizeof(discard) - | |
1446 | stream.avail_out); | |
1447 | } while (stream.avail_in && ret == Z_OK); | |
1448 | write(local, buffer, *bufposn - stream.avail_in); | |
1449 | memmove(buffer, buffer + *bufposn - stream.avail_in, | |
1450 | stream.avail_in); | |
1451 | *bufposn = stream.avail_in; | |
1452 | if (ret != Z_OK) | |
1453 | break; | |
1454 | } | |
1455 | size = read(fd, buffer + *bufposn, bufsize - *bufposn); | |
8237b185 DB |
1456 | if (size <= 0) { |
1457 | close(local); | |
230f1322 | 1458 | unlink(tmpfile); |
8237b185 DB |
1459 | if (!size) |
1460 | return error("Connection closed?"); | |
1461 | perror("Reading from connection"); | |
1462 | return -1; | |
1463 | } | |
70b9829e DB |
1464 | *bufposn += size; |
1465 | } while (1); | |
8237b185 DB |
1466 | inflateEnd(&stream); |
1467 | ||
1468 | close(local); | |
1469 | SHA1_Final(real_sha1, &c); | |
1470 | if (ret != Z_STREAM_END) { | |
230f1322 | 1471 | unlink(tmpfile); |
8237b185 DB |
1472 | return error("File %s corrupted", sha1_to_hex(sha1)); |
1473 | } | |
1474 | if (memcmp(sha1, real_sha1, 20)) { | |
230f1322 | 1475 | unlink(tmpfile); |
8237b185 DB |
1476 | return error("File %s has bad hash\n", sha1_to_hex(sha1)); |
1477 | } | |
230f1322 LT |
1478 | |
1479 | return move_temp_to_file(tmpfile, sha1_file_name(sha1)); | |
8237b185 DB |
1480 | } |
1481 | ||
/*
 * Returns 1 when stat() succeeds on the path given by
 * sha1_pack_index_name(sha1), 0 otherwise.
 */
int has_pack_index(const unsigned char *sha1)
{
	struct stat sb;

	return stat(sha1_pack_index_name(sha1), &sb) == 0;
}
1489 | ||
/*
 * Returns 1 when stat() succeeds on the path given by
 * sha1_pack_name(sha1), 0 otherwise.
 */
int has_pack_file(const unsigned char *sha1)
{
	struct stat sb;

	return stat(sha1_pack_name(sha1), &sb) == 0;
}
1497 | ||
dade09c2 LT |
1498 | int has_sha1_pack(const unsigned char *sha1) |
1499 | { | |
1500 | struct pack_entry e; | |
1501 | return find_pack_entry(sha1, &e); | |
1502 | } | |
1503 | ||
8237b185 DB |
1504 | int has_sha1_file(const unsigned char *sha1) |
1505 | { | |
8237b185 | 1506 | struct stat st; |
1f688557 JH |
1507 | struct pack_entry e; |
1508 | ||
ab90ea5d | 1509 | if (find_pack_entry(sha1, &e)) |
1f688557 | 1510 | return 1; |
ab90ea5d | 1511 | return find_sha1_file(sha1, &st) ? 1 : 0; |
8237b185 | 1512 | } |
74400e71 | 1513 | |
/*
 * Compute the SHA-1 of the contents of "fd" as an object of the given
 * type ("blob" when type is NULL) and, when write_object is set, also
 * store the object.  The size is taken from st->st_size.
 *
 * "fd" is always closed.  Returns -1 when the file cannot be mapped,
 * the result of write_sha1_file() when writing, and 0 otherwise.
 */
int index_fd(unsigned char *sha1, int fd, struct stat *st, int write_object, const char *type)
{
	unsigned long size = st->st_size;
	void *buf = "";	/* stands in for the contents of an empty file */
	unsigned char hdr[50];
	int hdrlen;
	int ret = 0;

	if (size)
		buf = mmap(NULL, size, PROT_READ, MAP_PRIVATE, fd, 0);
	close(fd);
	if (buf == MAP_FAILED)
		return -1;

	if (!type)
		type = "blob";

	if (!write_object)
		write_sha1_file_prepare(buf, size, type, sha1, hdr, &hdrlen);
	else
		ret = write_sha1_file(buf, size, type, sha1);

	if (size)
		munmap(buf, size);
	return ret;
}
ec1fcc16 JH |
1541 | |
1542 | int index_path(unsigned char *sha1, const char *path, struct stat *st, int write_object) | |
1543 | { | |
1544 | int fd; | |
1545 | char *target; | |
1546 | ||
1547 | switch (st->st_mode & S_IFMT) { | |
1548 | case S_IFREG: | |
1549 | fd = open(path, O_RDONLY); | |
1550 | if (fd < 0) | |
1551 | return error("open(\"%s\"): %s", path, | |
1552 | strerror(errno)); | |
1553 | if (index_fd(sha1, fd, st, write_object, NULL) < 0) | |
1554 | return error("%s: failed to insert into database", | |
1555 | path); | |
1556 | break; | |
1557 | case S_IFLNK: | |
1558 | target = xmalloc(st->st_size+1); | |
1559 | if (readlink(path, target, st->st_size+1) != st->st_size) { | |
1560 | char *errstr = strerror(errno); | |
1561 | free(target); | |
1562 | return error("readlink(\"%s\"): %s", path, | |
1563 | errstr); | |
1564 | } | |
1565 | if (!write_object) { | |
1566 | unsigned char hdr[50]; | |
1567 | int hdrlen; | |
1568 | write_sha1_file_prepare(target, st->st_size, "blob", | |
1569 | sha1, hdr, &hdrlen); | |
1570 | } else if (write_sha1_file(target, st->st_size, "blob", sha1)) | |
1571 | return error("%s: failed to insert into database", | |
1572 | path); | |
1573 | free(target); | |
1574 | break; | |
1575 | default: | |
1576 | return error("%s: unsupported file type", path); | |
1577 | } | |
1578 | return 0; | |
1579 | } |