/*
 * Copyright (c) 2018 Stefan Sperling <stsp@openbsd.org>
 *
 * Permission to use, copy, modify, and distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
 */
17 #include <sys/types.h>
19 #include <sys/queue.h>
32 #include "got_error.h"
33 #include "got_object.h"
34 #include "got_repository.h"
/*
 * Pack files and their indexes share a common name stem: the prefix below
 * followed by the hexadecimal SHA1 of the pack, then a type-specific suffix.
 */
#define GOT_PACK_PREFIX		"pack-"
#define GOT_PACKFILE_SUFFIX	".pack"
#define GOT_PACKIDX_SUFFIX	".idx"

/*
 * Expected length of a pack file / pack index file name, not counting the
 * terminating NUL. sizeof on a string literal counts the NUL byte, hence the
 * "- 1"; SHA1_DIGEST_STRING_LENGTH is reduced by one for what is presumably
 * the same reason. Using sizeof keeps these compile-time constants.
 */
#define GOT_PACKFILE_NAMELEN	((sizeof(GOT_PACK_PREFIX) - 1) + \
				SHA1_DIGEST_STRING_LENGTH - 1 + \
				(sizeof(GOT_PACKFILE_SUFFIX) - 1))
#define GOT_PACKIDX_NAMELEN	((sizeof(GOT_PACK_PREFIX) - 1) + \
				SHA1_DIGEST_STRING_LENGTH - 1 + \
				(sizeof(GOT_PACKIDX_SUFFIX) - 1))

/*
 * Smaller of two values. Both arguments are evaluated twice, so do not pass
 * expressions with side effects. Guarded because system headers may already
 * provide MIN.
 */
#ifndef MIN
#define MIN(_a,_b) ((_a) < (_b) ? (_a) : (_b))
#endif
53 static const struct got_error *
54 verify_fanout_table(uint32_t *fanout_table)
58 for (i = 0; i < 0xff - 1; i++) {
59 if (be32toh(fanout_table[i]) > be32toh(fanout_table[i + 1]))
60 return got_error(GOT_ERR_BAD_PACKIDX);
66 static const struct got_error *
67 get_packfile_size(size_t *size, const char *path_idx)
71 char base_path[PATH_MAX];
74 if (strlcpy(base_path, path_idx, PATH_MAX) > PATH_MAX)
75 return got_error(GOT_ERR_NO_SPACE);
77 dot = strrchr(base_path, '.');
79 return got_error(GOT_ERR_BAD_PATH);
81 if (asprintf(&path_pack, "%s.pack", base_path) == -1)
82 return got_error(GOT_ERR_NO_MEM);
84 if (stat(path_pack, &sb) != 0) {
86 return got_error(GOT_ERR_IO);
95 const struct got_error *
96 got_packidx_open(struct got_packidx_v2_hdr **packidx, const char *path)
98 struct got_packidx_v2_hdr *p;
100 const struct got_error *err = NULL;
101 size_t n, nobj, packfile_size;
103 uint8_t sha1[SHA1_DIGEST_LENGTH];
107 f = fopen(path, "rb");
109 return got_error(GOT_ERR_BAD_PATH);
111 err = get_packfile_size(&packfile_size, path);
115 p = calloc(1, sizeof(*p));
117 err = got_error(GOT_ERR_NO_MEM);
121 n = fread(&p->magic, sizeof(p->magic), 1, f);
123 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
127 if (betoh32(p->magic) != GOT_PACKIDX_V2_MAGIC) {
128 err = got_error(GOT_ERR_BAD_PACKIDX);
132 SHA1Update(&ctx, (uint8_t *)&p->magic, sizeof(p->magic));
134 n = fread(&p->version, sizeof(p->version), 1, f);
136 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
140 if (betoh32(p->version) != GOT_PACKIDX_VERSION) {
141 err = got_error(GOT_ERR_BAD_PACKIDX);
145 SHA1Update(&ctx, (uint8_t *)&p->version, sizeof(p->version));
147 n = fread(&p->fanout_table, sizeof(p->fanout_table), 1, f);
149 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
153 err = verify_fanout_table(p->fanout_table);
157 SHA1Update(&ctx, (uint8_t *)p->fanout_table, sizeof(p->fanout_table));
159 nobj = betoh32(p->fanout_table[0xff]);
161 p->sorted_ids = calloc(nobj, sizeof(*p->sorted_ids));
162 if (p->sorted_ids == NULL) {
163 err = got_error(GOT_ERR_NO_MEM);
167 n = fread(p->sorted_ids, sizeof(*p->sorted_ids), nobj, f);
169 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
173 SHA1Update(&ctx, (uint8_t *)p->sorted_ids,
174 nobj * sizeof(*p->sorted_ids));
176 p->crc32 = calloc(nobj, sizeof(*p->crc32));
177 if (p->crc32 == NULL) {
178 err = got_error(GOT_ERR_NO_MEM);
182 n = fread(p->crc32, sizeof(*p->crc32), nobj, f);
184 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
188 SHA1Update(&ctx, (uint8_t *)p->crc32, nobj * sizeof(*p->crc32));
190 p->offsets = calloc(nobj, sizeof(*p->offsets));
191 if (p->offsets == NULL) {
192 err = got_error(GOT_ERR_NO_MEM);
196 n = fread(p->offsets, sizeof(*p->offsets), nobj, f);
198 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
202 SHA1Update(&ctx, (uint8_t *)p->offsets, nobj * sizeof(*p->offsets));
204 /* Large file offsets are contained only in files > 2GB. */
205 if (packfile_size <= 0x80000000)
208 p->large_offsets = calloc(nobj, sizeof(*p->large_offsets));
209 if (p->large_offsets == NULL) {
210 err = got_error(GOT_ERR_NO_MEM);
214 n = fread(p->large_offsets, sizeof(*p->large_offsets), nobj, f);
216 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
220 SHA1Update(&ctx, (uint8_t*)p->large_offsets,
221 nobj * sizeof(*p->large_offsets));
224 n = fread(&p->trailer, sizeof(p->trailer), 1, f);
226 err = got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKIDX);
230 SHA1Update(&ctx, p->trailer.packfile_sha1, SHA1_DIGEST_LENGTH);
231 SHA1Final(sha1, &ctx);
232 if (memcmp(p->trailer.packidx_sha1, sha1, SHA1_DIGEST_LENGTH) != 0)
233 err = got_error(GOT_ERR_PACKIDX_CSUM);
237 got_packidx_close(p);
244 got_packidx_close(struct got_packidx_v2_hdr *packidx)
246 free(packidx->sorted_ids);
247 free(packidx->offsets);
248 free(packidx->crc32);
249 free(packidx->large_offsets);
254 is_packidx_filename(const char *name, size_t len)
256 if (len != GOT_PACKIDX_NAMELEN)
259 if (strncmp(name, GOT_PACK_PREFIX, strlen(GOT_PACK_PREFIX)) != 0)
262 if (strcmp(name + strlen(GOT_PACK_PREFIX) +
263 SHA1_DIGEST_STRING_LENGTH - 1, GOT_PACKIDX_SUFFIX) != 0)
270 get_object_offset(struct got_packidx_v2_hdr *packidx, int idx)
272 uint32_t totobj = betoh32(packidx->fanout_table[0xff]);
273 uint32_t offset = betoh32(packidx->offsets[idx]);
274 if (offset & GOT_PACKIDX_OFFSET_VAL_IS_LARGE_IDX) {
276 idx = offset & GOT_PACKIDX_OFFSET_VAL_MASK;
277 if (idx < 0 || idx > totobj || packidx->large_offsets == NULL)
279 loffset = betoh64(packidx->large_offsets[idx]);
280 return (loffset > INT64_MAX ? -1 : (off_t)loffset);
282 return (off_t)(offset & GOT_PACKIDX_OFFSET_VAL_MASK);
286 get_object_idx(struct got_packidx_v2_hdr *packidx, struct got_object_id *id)
288 u_int8_t id0 = id->sha1[0];
289 uint32_t totobj = betoh32(packidx->fanout_table[0xff]);
293 i = betoh32(packidx->fanout_table[id0 - 1]);
296 struct got_object_id *oid = &packidx->sorted_ids[i++];
299 if (got_object_id_cmp(id, oid) < 0)
301 if (got_object_id_cmp(id, oid) > 0)
310 const struct got_error *
311 read_packfile_hdr(FILE *f, struct got_packidx_v2_hdr *packidx)
313 const struct got_error *err = NULL;
314 uint32_t totobj = betoh32(packidx->fanout_table[0xff]);
315 struct got_packfile_hdr hdr;
318 n = fread(&hdr, sizeof(hdr), 1, f);
320 return got_error(ferror(f) ? GOT_ERR_IO : GOT_ERR_BAD_PACKFILE);
322 if (betoh32(hdr.signature) != GOT_PACKFILE_SIGNATURE ||
323 betoh32(hdr.version) != GOT_PACKFILE_VERSION ||
324 betoh32(hdr.nobjects) != totobj)
325 err = got_error(GOT_ERR_BAD_PACKFILE);
/*
 * Copy the packed object found at 'offset' in 'packfile' to the stream *f.
 *
 * The object starts with a variable-length header which is decoded one byte
 * at a time: the first byte yields the object type and the low bits of the
 * size, every following byte contributes further size bits, and decoding
 * stops at the first byte without GOT_PACK_OBJ_SIZE_MORE set. A line of the
 * form "<type tag> <size>" is then written to *f and 'size' bytes are copied
 * from the pack file in chunks.
 *
 * Errors visible in this view: GOT_ERR_FILE_OPEN, GOT_ERR_IO or
 * GOT_ERR_BAD_PATH for a failed seek, GOT_ERR_NO_SPACE for an oversized
 * size field, GOT_ERR_IO or GOT_ERR_BAD_PACKFILE for failed reads and
 * writes, and GOT_ERR_BAD_OBJ_HDR for a type without a tag.
 *
 * NOTE(review): the payload is copied as-is; no decompression step is
 * visible here - TODO confirm whether that happens elsewhere.
 */
330 static const struct got_error *
331 dump_packed_object(FILE **f, FILE *packfile, off_t offset)
333 const struct got_error *err = NULL;
/* NOTE(review): hard-coded /tmp path; no use of 'template' is visible here. */
334 const char *template = "/tmp/got.XXXXXXXXXX";
340 const char *type_tag;
344 err = got_error(GOT_ERR_FILE_OPEN);
/* Position the pack file at the first byte of the object header. */
348 if (fseeko(packfile, offset, SEEK_SET) != 0) {
349 err = got_error(errno == EIO ? GOT_ERR_IO : GOT_ERR_BAD_PATH);
355 /* We do not support size values which don't fit in 64 bit. */
357 err = got_error(GOT_ERR_NO_SPACE);
/* Fetch the next header byte. */
361 n = fread(&sizeN, sizeof(sizeN), 1, packfile);
363 err = got_error(ferror(packfile) ?
364 GOT_ERR_IO : GOT_ERR_BAD_PACKFILE);
/* First header byte: object type plus the lowest size bits. */
368 type = (sizeN & GOT_PACK_OBJ_SIZE0_TYPE_MASK) >>
369 GOT_PACK_OBJ_SIZE0_TYPE_MASK_SHIFT;
370 size = (sizeN & GOT_PACK_OBJ_SIZE0_VAL_MASK);
/*
 * Later header bytes: the size bits of byte i are placed at bit position
 * 4 + 7 * (i - 1).
 * NOTE(review): the declaration of sizeN is not visible; if it is narrower
 * than 64 bits the shift below is evaluated at int width and high size bits
 * are lost - consider casting the masked value to uint64_t first.
 */
372 size_t shift = 4 + 7 * (i - 1);
373 size |= ((sizeN & GOT_PACK_OBJ_SIZE_VAL_MASK) << shift);
376 } while (sizeN & GOT_PACK_OBJ_SIZE_MORE);
/*
 * Delta and tag objects only produce a message on stdout here.
 * NOTE(review): no early exit is visible for these types - confirm that
 * continuing with the type tag lookup below is intended.
 */
378 if (type == GOT_OBJ_TYPE_OFFSET_DELTA)
379 printf("object type OFFSET_DELTA not yet implemented\n");
380 else if (type == GOT_OBJ_TYPE_REF_DELTA)
381 printf("object type REF_DELTA not yet implemented\n");
382 else if (type == GOT_OBJ_TYPE_TAG)
383 printf("object type TAG not yet implemented\n");
/* Translate the numeric type into its textual tag; NULL means unknown. */
385 type_tag = got_object_get_type_tag(type);
386 if (type_tag == NULL) {
387 err = got_error(GOT_ERR_BAD_OBJ_HDR);
/*
 * Write the "<type tag> <size>" header.
 * NOTE(review): %llu expects unsigned long long; the declaration of 'size'
 * is not visible - confirm the type or add a cast.
 */
391 fprintf(*f, "%s %llu", type_tag, size);
/* Copy the payload, at most sizeof(data) bytes per round. */
396 size_t len = MIN(size, sizeof(data));
398 n = fread(data, len, 1, packfile);
400 err = got_error(ferror(packfile) ?
401 GOT_ERR_IO : GOT_ERR_BAD_PACKFILE);
405 n = fwrite(data, len, 1, *f);
407 err = got_error(ferror(*f) ?
408 GOT_ERR_IO : GOT_ERR_BAD_PACKFILE);
/* NOTE(review): debugging output on stdout. */
415 printf("object type is %d\n", type);
/*
 * Try to extract the object 'id' from the pack file described by 'packidx'.
 *
 * The object is looked up in the index first. If it is present, the pack
 * file "<path_packdir>/" GOT_PACK_PREFIX "<sha1>" GOT_PACKFILE_SUFFIX is
 * opened, where <sha1> is the string form of the pack file checksum stored
 * in the index trailer. The pack file header is checked against the index
 * and the object at the recorded offset is passed to dump_packed_object().
 *
 * Errors visible in this view: GOT_ERR_BAD_PACKIDX for an unusable offset,
 * GOT_ERR_PACKIDX_CSUM, GOT_ERR_NO_MEM, GOT_ERR_IO or GOT_ERR_BAD_PATH when
 * the pack file cannot be opened, plus anything reported by
 * read_packfile_hdr() and dump_packed_object().
 */
422 static const struct got_error *
423 extract_object(FILE **f, const char *path_packdir,
424 struct got_packidx_v2_hdr *packidx, struct got_object_id *id)
426 const struct got_error *err = NULL;
427 int idx = get_object_idx(packidx, id);
/* Receives the hexadecimal form of the pack file checksum. */
431 char hex[SHA1_DIGEST_STRING_LENGTH];
435 if (idx == -1) /* object not found in pack index */
/*
 * get_object_offset() signals failure with -1.
 * NOTE(review): the comparison below is made against (uint64_t)-1 and thus
 * relies on integer conversion of 'offset'; comparing with -1 in the
 * offset's own type would be clearer - confirm the declared type.
 */
438 offset = get_object_offset(packidx, idx);
439 if (offset == (uint64_t)-1)
440 return got_error(GOT_ERR_BAD_PACKIDX);
/* The pack file is named after the checksum recorded in the index trailer. */
442 sha1str = got_sha1_digest_to_str(packidx->trailer.packfile_sha1,
445 return got_error(GOT_ERR_PACKIDX_CSUM);
447 if (asprintf(&path_packfile, "%s/%s%s%s", path_packdir,
448 GOT_PACK_PREFIX, sha1str, GOT_PACKFILE_SUFFIX) == -1)
449 return got_error(GOT_ERR_NO_MEM);
451 packfile = fopen(path_packfile, "rb");
452 if (packfile == NULL) {
453 err = got_error(errno == EIO ? GOT_ERR_IO : GOT_ERR_BAD_PATH);
/* Make sure the pack file and the index agree before reading objects. */
457 err = read_packfile_hdr(packfile, packidx);
/*
 * NOTE(review): debugging output on stdout; %llu expects unsigned long long
 * while get_object_offset() returns off_t - confirm the type or add a cast.
 */
461 printf("Dumping object at offset %llu\n", offset);
462 err = dump_packed_object(f, packfile, offset);
/*
 * A failing fclose() is reported only for EIO and only if no earlier error
 * is pending.
 */
468 if (packfile && fclose(packfile) == -1 && errno == EIO && err == 0)
469 err = got_error(GOT_ERR_IO);
/*
 * Search the pack files of 'repo' for the object 'id'.
 *
 * The repository's pack directory is scanned for pack index files. Each
 * index found is opened with got_packidx_open() and handed to
 * extract_object() together with the output stream pointer 'f'.
 *
 * Errors visible in this view: GOT_ERR_NO_MEM, GOT_ERR_IO or
 * GOT_ERR_BAD_PATH when the directory cannot be opened, plus anything
 * reported by got_packidx_open() and extract_object().
 */
473 const struct got_error *
474 got_packfile_extract_object(FILE **f, struct got_object_id *id,
475 struct got_repository *repo)
477 const struct got_error *err = NULL;
/* NOTE(review): presumably a heap-allocated string owned by this function - confirm. */
480 char *path_packdir = got_repo_get_path_objects_pack(repo);
482 if (path_packdir == NULL) {
483 err = got_error(GOT_ERR_NO_MEM);
487 packdir = opendir(path_packdir);
488 if (packdir == NULL) {
489 err = got_error(errno == EIO ? GOT_ERR_IO : GOT_ERR_BAD_PATH);
493 while ((dent = readdir(packdir)) != NULL) {
494 struct got_packidx_v2_hdr *packidx;
/* NOTE(review): no use of path_object is visible in this view. */
495 char *path_packidx, *path_object;
/*
 * Skip directory entries which are not named like a pack index.
 * NOTE(review): d_namlen is not provided by every platform's struct dirent.
 */
497 if (!is_packidx_filename(dent->d_name, dent->d_namlen))
500 if (asprintf(&path_packidx, "%s/%s", path_packdir,
501 dent->d_name) == -1) {
502 err = got_error(GOT_ERR_NO_MEM);
/*
 * NOTE(review): no got_packidx_close() call is visible after this open, so
 * the index loaded for each directory entry appears to be leaked - confirm.
 */
506 err = got_packidx_open(&packidx, path_packidx);
511 err = extract_object(f, path_packdir, packidx, id);
/*
 * A failing closedir() is reported only for EIO and only if no earlier
 * error is pending.
 */
520 if (packdir && closedir(packdir) != 0 && errno == EIO && err == 0)
521 err = got_error(GOT_ERR_IO);