Blame


1 7f8fc4ec 2017-12-03 stsp /*
2 0a0a3048 2018-01-10 stsp * Copyright (c) 2018 Stefan Sperling <stsp@openbsd.org>
3 7f8fc4ec 2017-12-03 stsp *
4 7f8fc4ec 2017-12-03 stsp * Permission to use, copy, modify, and distribute this software for any
5 7f8fc4ec 2017-12-03 stsp * purpose with or without fee is hereby granted, provided that the above
6 7f8fc4ec 2017-12-03 stsp * copyright notice and this permission notice appear in all copies.
7 7f8fc4ec 2017-12-03 stsp *
8 7f8fc4ec 2017-12-03 stsp * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 7f8fc4ec 2017-12-03 stsp * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 7f8fc4ec 2017-12-03 stsp * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 7f8fc4ec 2017-12-03 stsp * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 7f8fc4ec 2017-12-03 stsp * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 7f8fc4ec 2017-12-03 stsp * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 7f8fc4ec 2017-12-03 stsp * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
15 7f8fc4ec 2017-12-03 stsp */
16 7f8fc4ec 2017-12-03 stsp
17 7f8fc4ec 2017-12-03 stsp /* See Documentation/technical/pack-format.txt in Git. */
18 7f8fc4ec 2017-12-03 stsp
19 0a0a3048 2018-01-10 stsp struct got_packidx_trailer {
20 a1fd68d8 2018-01-12 stsp u_int8_t packfile_sha1[SHA1_DIGEST_LENGTH];
21 a1fd68d8 2018-01-12 stsp u_int8_t packidx_sha1[SHA1_DIGEST_LENGTH];
22 7f8fc4ec 2017-12-03 stsp } __attribute__((__packed__));
23 7f8fc4ec 2017-12-03 stsp
24 7f8fc4ec 2017-12-03 stsp /* Ignore pack index version 1 which is no longer written by Git. */
25 7f8fc4ec 2017-12-03 stsp #define GOT_PACKIDX_VERSION 2
26 7f8fc4ec 2017-12-03 stsp
27 7f8fc4ec 2017-12-03 stsp struct got_packidx_v2_hdr {
28 7f8fc4ec 2017-12-03 stsp uint32_t magic; /* big endian */
29 7f8fc4ec 2017-12-03 stsp #define GOT_PACKIDX_V2_MAGIC 0xff744f63 /* "\377t0c" */
30 7f8fc4ec 2017-12-03 stsp uint32_t version;
31 7f8fc4ec 2017-12-03 stsp
32 7f8fc4ec 2017-12-03 stsp /*
33 7f8fc4ec 2017-12-03 stsp * Each entry N in the fanout table contains the number of objects in
34 7f8fc4ec 2017-12-03 stsp * the packfile whose SHA1 begins with a byte less than or equal to N.
35 7f8fc4ec 2017-12-03 stsp * The last entry (index 255) contains the number of objects in the
36 7f8fc4ec 2017-12-03 stsp * pack file whose first SHA1 byte is <= 0xff, and thus records the
37 7f8fc4ec 2017-12-03 stsp * total number of objects in the pack file. All pointer variables
38 7f8fc4ec 2017-12-03 stsp * below point to tables with a corresponding number of entries.
39 7f8fc4ec 2017-12-03 stsp */
40 0a0a3048 2018-01-10 stsp uint32_t fanout_table[0xff + 1]; /* values are big endian */
41 7f8fc4ec 2017-12-03 stsp
42 7f8fc4ec 2017-12-03 stsp /* Sorted SHA1 checksums for each object in the pack file. */
43 a1fd68d8 2018-01-12 stsp struct got_object_id *sorted_ids;
44 7f8fc4ec 2017-12-03 stsp
45 a1fd68d8 2018-01-12 stsp /* CRC32 of the packed representation of each object. */
46 a1fd68d8 2018-01-12 stsp uint32_t *crc32;
47 a1fd68d8 2018-01-12 stsp
48 7f8fc4ec 2017-12-03 stsp /* Offset into the pack file for each object. */
49 7f8fc4ec 2017-12-03 stsp uint32_t *offsets; /* values are big endian */
50 7f8fc4ec 2017-12-03 stsp #define GOT_PACKIDX_OFFSET_VAL_MASK 0x7fffffff
51 7f8fc4ec 2017-12-03 stsp #define GOT_PACKIDX_OFFSET_VAL_IS_LARGE_IDX 0x80000000
52 7f8fc4ec 2017-12-03 stsp
53 7f8fc4ec 2017-12-03 stsp /* Large offsets table is empty for pack files < 2 GB. */
54 7f8fc4ec 2017-12-03 stsp uint64_t *large_offsets; /* values are big endian */
55 7f8fc4ec 2017-12-03 stsp
56 0a0a3048 2018-01-10 stsp struct got_packidx_trailer trailer;
57 7f8fc4ec 2017-12-03 stsp };
58 7f8fc4ec 2017-12-03 stsp
59 7f8fc4ec 2017-12-03 stsp struct got_packfile_hdr {
60 7f8fc4ec 2017-12-03 stsp uint32_t signature;
61 82708eb3 2017-12-03 stsp #define GOT_PACKFILE_SIGNATURE 0x5041434b /* 'P' 'A' 'C' 'K' */
62 7f8fc4ec 2017-12-03 stsp uint32_t version; /* big endian */
63 7f8fc4ec 2017-12-03 stsp #define GOT_PACKFILE_VERSION 2
64 7f8fc4ec 2017-12-03 stsp uint32_t nobjects; /* big endian */
65 7f8fc4ec 2017-12-03 stsp };
66 7f8fc4ec 2017-12-03 stsp
67 7f8fc4ec 2017-12-03 stsp struct got_packfile_obj_hdr {
68 7f8fc4ec 2017-12-03 stsp /*
69 7f8fc4ec 2017-12-03 stsp * The object size field uses a variable length encoding:
70 7f8fc4ec 2017-12-03 stsp * size0...sizeN form a 4+7+7+...+7 bit integer, where size0 is the
71 7f8fc4ec 2017-12-03 stsp * least significant part and sizeN is the most significant part.
72 7f8fc4ec 2017-12-03 stsp * If the MSB of a size byte is set, an additional size byte follows.
73 7f8fc4ec 2017-12-03 stsp * Of the 7 remaining bits of size0, the first 3 bits indicate the
74 7f8fc4ec 2017-12-03 stsp * object's type, and the remaining 4 bits contribute to the size.
75 7f8fc4ec 2017-12-03 stsp */
76 7f8fc4ec 2017-12-03 stsp uint8_t *size; /* variable length */
77 7f8fc4ec 2017-12-03 stsp #define GOT_PACK_OBJ_SIZE_MORE 0x80
78 7f8fc4ec 2017-12-03 stsp #define GOT_PACK_OBJ_SIZE0_TYPE_MASK 0x70 /* See struct got_object->type */
79 a1fd68d8 2018-01-12 stsp #define GOT_PACK_OBJ_SIZE0_TYPE_MASK_SHIFT 4
80 7f8fc4ec 2017-12-03 stsp #define GOT_PACK_OBJ_SIZE0_VAL_MASK 0x0f
81 a1fd68d8 2018-01-12 stsp #define GOT_PACK_OBJ_SIZE_VAL_MASK 0x7f
82 7f8fc4ec 2017-12-03 stsp };
83 7f8fc4ec 2017-12-03 stsp
84 7f8fc4ec 2017-12-03 stsp /* If object is not a DELTA type. */
85 7f8fc4ec 2017-12-03 stsp struct got_packfile_object_data {
86 7f8fc4ec 2017-12-03 stsp uint8_t *data; /* compressed */
87 7f8fc4ec 2017-12-03 stsp };
88 7f8fc4ec 2017-12-03 stsp
89 7f8fc4ec 2017-12-03 stsp /* If object is of type GOT_OBJ_TYPE_REF_DELTA. */
90 7f8fc4ec 2017-12-03 stsp struct got_packfile_object_data_ref_delta {
91 a1fd68d8 2018-01-12 stsp struct got_object_id id;
92 7f8fc4ec 2017-12-03 stsp uint8_t *delta_data; /* compressed */
93 7f8fc4ec 2017-12-03 stsp };
94 7f8fc4ec 2017-12-03 stsp
95 7f8fc4ec 2017-12-03 stsp /* If object is of type GOT_OBJ_TYPE_OFFSET_DELTA. */
96 7f8fc4ec 2017-12-03 stsp struct got_packfile_object_data_offset_delta {
97 7f8fc4ec 2017-12-03 stsp /*
98 7f8fc4ec 2017-12-03 stsp * This offset is interpreted as a negative offset from
99 7f8fc4ec 2017-12-03 stsp * the got_packfile_obj_hdr corresponding to this object.
100 7f8fc4ec 2017-12-03 stsp * The size provided in the header specifies the amount
101 7f8fc4ec 2017-12-03 stsp * of compressed delta data that follows.
102 7f8fc4ec 2017-12-03 stsp *
103 7f8fc4ec 2017-12-03 stsp * This field uses a variable length encoding of N bytes,
104 7f8fc4ec 2017-12-03 stsp * where the MSB is always set except for the last byte.
105 7f8fc4ec 2017-12-03 stsp * The value is encoded as a series of N 7 bit integers,
106 7f8fc4ec 2017-12-03 stsp * which are concatenated, and if N > 1 the value 2^7 +
107 7f8fc4ec 2017-12-03 stsp * 2^14 + ... + 2^(7 * (n-1)) is added to the result.
108 7f8fc4ec 2017-12-03 stsp */
109 7f8fc4ec 2017-12-03 stsp uint8_t *offset; /* variable length */
110 b107e67f 2018-01-19 stsp #define GOT_PACK_OBJ_DELTA_OFF_MORE 0x80
111 b107e67f 2018-01-19 stsp #define GOT_PACK_OBJ_DELTA_OFF_VAL_MASK 0x7f
112 b107e67f 2018-01-19 stsp uint8_t *delta_data; /* compressed */
113 7f8fc4ec 2017-12-03 stsp };
114 7f8fc4ec 2017-12-03 stsp
115 7f8fc4ec 2017-12-03 stsp struct got_packfile_obj_data {
116 7f8fc4ec 2017-12-03 stsp union {
117 0a0a3048 2018-01-10 stsp struct got_packfile_object_data data;
118 0a0a3048 2018-01-10 stsp struct got_packfile_object_data_ref_delta ref_delta;
119 0a0a3048 2018-01-10 stsp struct got_packfile_object_data_offset_delta offset_delta;
120 7f8fc4ec 2017-12-03 stsp } __attribute__((__packed__));
121 7f8fc4ec 2017-12-03 stsp } __attribute__((__packed__));
122 0a0a3048 2018-01-10 stsp
123 0a0a3048 2018-01-10 stsp const struct got_error *got_packidx_open(struct got_packidx_v2_hdr **,
124 0a0a3048 2018-01-10 stsp const char *);
125 0a0a3048 2018-01-10 stsp void got_packidx_close(struct got_packidx_v2_hdr *);
126 a1fd68d8 2018-01-12 stsp
127 6c00b545 2018-01-17 stsp const struct got_error *got_packfile_open_object(struct got_object **,
128 a1fd68d8 2018-01-12 stsp struct got_object_id *, struct got_repository *);
129 3ee5fc21 2018-01-17 stsp const struct got_error *got_packfile_extract_object(FILE **,
130 3ee5fc21 2018-01-17 stsp struct got_object *, struct got_repository *);