2 5aa81393 2020-01-06 stsp * Copyright (c) 2018, 2019, 2020 Stefan Sperling <stsp@openbsd.org>
4 a440fac0 2018-09-06 stsp * Permission to use, copy, modify, and distribute this software for any
5 a440fac0 2018-09-06 stsp * purpose with or without fee is hereby granted, provided that the above
6 a440fac0 2018-09-06 stsp * copyright notice and this permission notice appear in all copies.
8 a440fac0 2018-09-06 stsp * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
9 a440fac0 2018-09-06 stsp * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
10 a440fac0 2018-09-06 stsp * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
11 a440fac0 2018-09-06 stsp * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
12 a440fac0 2018-09-06 stsp * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
13 a440fac0 2018-09-06 stsp * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
14 a440fac0 2018-09-06 stsp * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
17 a440fac0 2018-09-06 stsp #include <sys/types.h>
18 a440fac0 2018-09-06 stsp #include <sys/stat.h>
19 a440fac0 2018-09-06 stsp #include <sys/queue.h>
20 f8b19efd 2021-10-13 stsp #include <sys/tree.h>
21 a440fac0 2018-09-06 stsp #include <sys/uio.h>
22 a440fac0 2018-09-06 stsp #include <sys/socket.h>
23 a440fac0 2018-09-06 stsp #include <sys/wait.h>
24 64a8571e 2022-01-07 stsp #include <sys/mman.h>
26 a440fac0 2018-09-06 stsp #include <errno.h>
27 a440fac0 2018-09-06 stsp #include <stdio.h>
28 a440fac0 2018-09-06 stsp #include <stdlib.h>
29 a440fac0 2018-09-06 stsp #include <string.h>
30 a440fac0 2018-09-06 stsp #include <stdint.h>
31 a440fac0 2018-09-06 stsp #include <sha1.h>
32 69c6accf 2023-02-04 op #include <sha2.h>
33 a440fac0 2018-09-06 stsp #include <zlib.h>
34 a440fac0 2018-09-06 stsp #include <ctype.h>
35 a440fac0 2018-09-06 stsp #include <limits.h>
36 a440fac0 2018-09-06 stsp #include <imsg.h>
37 a440fac0 2018-09-06 stsp #include <time.h>
38 ad242220 2018-09-08 stsp #include <unistd.h>
40 a440fac0 2018-09-06 stsp #include "got_error.h"
41 a440fac0 2018-09-06 stsp #include "got_object.h"
42 a440fac0 2018-09-06 stsp #include "got_repository.h"
43 a440fac0 2018-09-06 stsp #include "got_opentemp.h"
44 324d37e7 2019-05-11 stsp #include "got_path.h"
46 1362b0e3 2023-02-04 op #include "got_lib_hash.h"
47 a440fac0 2018-09-06 stsp #include "got_lib_delta.h"
48 41fa1437 2018-11-05 stsp #include "got_lib_inflate.h"
49 41fa1437 2018-11-05 stsp #include "got_lib_object.h"
50 3022d272 2019-11-14 stsp #include "got_lib_object_parse.h"
51 6bef87be 2018-09-11 stsp #include "got_lib_object_cache.h"
52 15a94983 2018-12-23 stsp #include "got_lib_pack.h"
53 ad242220 2018-09-08 stsp #include "got_lib_repository.h"
#ifndef nitems
/* Number of elements in the array _a; _a must be a real array, not a pointer. */
#define nitems(_a) (sizeof(_a) / sizeof(*(_a)))
#endif
59 ca6e02ac 2020-01-07 stsp struct got_object_id *
60 ca6e02ac 2020-01-07 stsp got_object_id_dup(struct got_object_id *id1)
62 ca6e02ac 2020-01-07 stsp struct got_object_id *id2;
64 ca6e02ac 2020-01-07 stsp id2 = malloc(sizeof(*id2));
65 ca6e02ac 2020-01-07 stsp if (id2 == NULL)
66 ca6e02ac 2020-01-07 stsp return NULL;
67 ca6e02ac 2020-01-07 stsp memcpy(id2, id1, sizeof(*id2));
72 f054b67a 2018-11-05 stsp got_object_id_cmp(const struct got_object_id *id1,
73 f054b67a 2018-11-05 stsp const struct got_object_id *id2)
75 b94703ce 2023-02-04 op if (id1->algo != id2->algo)
78 b94703ce 2023-02-04 op if (id1->algo == GOT_HASH_SHA256)
79 b94703ce 2023-02-04 op return memcmp(id1->hash, id2->hash, SHA256_DIGEST_LENGTH);
80 b94703ce 2023-02-04 op if (id1->algo == GOT_HASH_SHA1)
81 b94703ce 2023-02-04 op return memcmp(id1->hash, id2->hash, SHA1_DIGEST_LENGTH);
85 2ff12563 2018-09-15 stsp const struct got_error *
86 5df4932d 2018-11-05 stsp got_object_qid_alloc_partial(struct got_object_qid **qid)
88 5df4932d 2018-11-05 stsp *qid = malloc(sizeof(**qid));
89 5df4932d 2018-11-05 stsp if (*qid == NULL)
90 638f9024 2019-05-13 stsp return got_error_from_errno("malloc");
92 74a2356f 2021-06-18 stsp (*qid)->data = NULL;
93 5df4932d 2018-11-05 stsp return NULL;
96 5df4932d 2018-11-05 stsp const struct got_error *
97 2ff12563 2018-09-15 stsp got_object_id_str(char **outbuf, struct got_object_id *id)
99 bbc740ac 2023-02-04 op static const size_t len = GOT_OBJECT_ID_HEX_MAXLEN;
101 2ff12563 2018-09-15 stsp *outbuf = malloc(len);
102 2ff12563 2018-09-15 stsp if (*outbuf == NULL)
103 638f9024 2019-05-13 stsp return got_error_from_errno("malloc");
105 bbc740ac 2023-02-04 op if (got_object_id_hex(id, *outbuf, len) == NULL) {
106 2ff12563 2018-09-15 stsp free(*outbuf);
107 2ff12563 2018-09-15 stsp *outbuf = NULL;
108 2ff12563 2018-09-15 stsp return got_error(GOT_ERR_BAD_OBJ_ID_STR);
111 2ff12563 2018-09-15 stsp return NULL;
115 bbc740ac 2023-02-04 op got_object_id_hex(struct got_object_id *id, char *buf, size_t len)
117 bbc740ac 2023-02-04 op return got_sha1_digest_to_str(id->sha1, buf, len);
121 03fa71c8 2018-09-06 stsp got_object_close(struct got_object *obj)
123 03fa71c8 2018-09-06 stsp if (obj->refcnt > 0) {
124 03fa71c8 2018-09-06 stsp obj->refcnt--;
125 03fa71c8 2018-09-06 stsp if (obj->refcnt > 0)
129 03fa71c8 2018-09-06 stsp if (obj->flags & GOT_OBJ_FLAG_DELTIFIED) {
130 03fa71c8 2018-09-06 stsp struct got_delta *delta;
131 dbdddfee 2021-06-23 naddy while (!STAILQ_EMPTY(&obj->deltas.entries)) {
132 dbdddfee 2021-06-23 naddy delta = STAILQ_FIRST(&obj->deltas.entries);
133 dbdddfee 2021-06-23 naddy STAILQ_REMOVE_HEAD(&obj->deltas.entries, entry);
134 2256993b 2019-07-15 stsp free(delta);
140 d3c116bf 2021-10-15 stsp const struct got_error *
141 d3c116bf 2021-10-15 stsp got_object_raw_close(struct got_raw_object *obj)
143 d3c116bf 2021-10-15 stsp const struct got_error *err = NULL;
145 d3c116bf 2021-10-15 stsp if (obj->refcnt > 0) {
146 d3c116bf 2021-10-15 stsp obj->refcnt--;
147 d3c116bf 2021-10-15 stsp if (obj->refcnt > 0)
148 d3c116bf 2021-10-15 stsp return NULL;
151 13b2bc37 2022-10-23 stsp if (obj->close_cb)
152 13b2bc37 2022-10-23 stsp obj->close_cb(obj);
154 64a8571e 2022-01-07 stsp if (obj->f == NULL) {
155 64a8571e 2022-01-07 stsp if (obj->fd != -1) {
156 64a8571e 2022-01-07 stsp if (munmap(obj->data, obj->hdrlen + obj->size) == -1)
157 64a8571e 2022-01-07 stsp err = got_error_from_errno("munmap");
158 64a8571e 2022-01-07 stsp if (close(obj->fd) == -1 && err == NULL)
159 64a8571e 2022-01-07 stsp err = got_error_from_errno("close");
161 64a8571e 2022-01-07 stsp free(obj->data);
163 64a8571e 2022-01-07 stsp if (fclose(obj->f) == EOF && err == NULL)
164 64a8571e 2022-01-07 stsp err = got_error_from_errno("fclose");
167 d3c116bf 2021-10-15 stsp return err;
/* Free a queue entry obtained from got_object_qid_alloc_partial(). */
void
got_object_qid_free(struct got_object_qid *qid)
{
	free(qid);
}
177 dd88155e 2019-06-29 stsp got_object_id_queue_free(struct got_object_id_queue *ids)
179 dd88155e 2019-06-29 stsp struct got_object_qid *qid;
181 dbdddfee 2021-06-23 naddy while (!STAILQ_EMPTY(ids)) {
182 dbdddfee 2021-06-23 naddy qid = STAILQ_FIRST(ids);
183 dbdddfee 2021-06-23 naddy STAILQ_REMOVE_HEAD(ids, entry);
184 dd88155e 2019-06-29 stsp got_object_qid_free(qid);
188 1785f84a 2018-12-23 stsp const struct got_error *
189 1785f84a 2018-12-23 stsp got_object_parse_header(struct got_object **obj, char *buf, size_t len)
191 ff2a4428 2019-03-19 stsp const char *obj_labels[] = {
192 ff2a4428 2019-03-19 stsp GOT_OBJ_LABEL_COMMIT,
193 ff2a4428 2019-03-19 stsp GOT_OBJ_LABEL_TREE,
194 ff2a4428 2019-03-19 stsp GOT_OBJ_LABEL_BLOB,
195 ff2a4428 2019-03-19 stsp GOT_OBJ_LABEL_TAG,
197 1785f84a 2018-12-23 stsp const int obj_types[] = {
198 1785f84a 2018-12-23 stsp GOT_OBJ_TYPE_COMMIT,
199 1785f84a 2018-12-23 stsp GOT_OBJ_TYPE_TREE,
200 1785f84a 2018-12-23 stsp GOT_OBJ_TYPE_BLOB,
201 1785f84a 2018-12-23 stsp GOT_OBJ_TYPE_TAG,
203 1785f84a 2018-12-23 stsp int type = 0;
204 c7b17232 2022-01-28 stsp size_t size = 0;
208 1785f84a 2018-12-23 stsp *obj = NULL;
210 c7b17232 2022-01-28 stsp end = memchr(buf, '\0', len);
211 c7b17232 2022-01-28 stsp if (end == NULL)
212 9ef4ac16 2019-04-13 stsp return got_error(GOT_ERR_BAD_OBJ_HDR);
214 ff2a4428 2019-03-19 stsp for (i = 0; i < nitems(obj_labels); i++) {
215 ff2a4428 2019-03-19 stsp const char *label = obj_labels[i];
216 ff2a4428 2019-03-19 stsp size_t label_len = strlen(label);
217 1785f84a 2018-12-23 stsp const char *errstr;
219 c7b17232 2022-01-28 stsp if (len <= label_len || buf + label_len >= end ||
220 c7b17232 2022-01-28 stsp strncmp(buf, label, label_len) != 0)
223 1785f84a 2018-12-23 stsp type = obj_types[i];
224 ff2a4428 2019-03-19 stsp size = strtonum(buf + label_len, 0, LONG_MAX, &errstr);
225 1785f84a 2018-12-23 stsp if (errstr != NULL)
226 1785f84a 2018-12-23 stsp return got_error(GOT_ERR_BAD_OBJ_HDR);
230 1785f84a 2018-12-23 stsp if (type == 0)
231 1785f84a 2018-12-23 stsp return got_error(GOT_ERR_BAD_OBJ_HDR);
233 1785f84a 2018-12-23 stsp *obj = calloc(1, sizeof(**obj));
234 1785f84a 2018-12-23 stsp if (*obj == NULL)
235 638f9024 2019-05-13 stsp return got_error_from_errno("calloc");
236 1785f84a 2018-12-23 stsp (*obj)->type = type;
237 c7b17232 2022-01-28 stsp (*obj)->hdrlen = end - buf + 1;
238 1785f84a 2018-12-23 stsp (*obj)->size = size;
239 1785f84a 2018-12-23 stsp return NULL;
242 1785f84a 2018-12-23 stsp const struct got_error *
243 1785f84a 2018-12-23 stsp got_object_read_header(struct got_object **obj, int fd)
245 1785f84a 2018-12-23 stsp const struct got_error *err;
246 23bc48a9 2019-03-19 stsp struct got_inflate_buf zb;
247 31e61ec1 2021-09-28 naddy uint8_t *buf;
248 1785f84a 2018-12-23 stsp const size_t zbsize = 64;
249 1785f84a 2018-12-23 stsp size_t outlen, totlen;
250 1785f84a 2018-12-23 stsp int nbuf = 1;
252 1785f84a 2018-12-23 stsp *obj = NULL;
254 1785f84a 2018-12-23 stsp buf = malloc(zbsize);
255 1785f84a 2018-12-23 stsp if (buf == NULL)
256 638f9024 2019-05-13 stsp return got_error_from_errno("malloc");
257 c7b17232 2022-01-28 stsp buf[0] = '\0';
259 1e87a3c3 2020-03-18 stsp err = got_inflate_init(&zb, buf, zbsize, NULL);
261 1785f84a 2018-12-23 stsp return err;
263 1785f84a 2018-12-23 stsp totlen = 0;
265 3ab5e33c 2020-03-18 stsp err = got_inflate_read_fd(&zb, fd, &outlen, NULL);
268 1785f84a 2018-12-23 stsp if (outlen == 0)
270 1785f84a 2018-12-23 stsp totlen += outlen;
271 dedbbd9d 2019-04-13 stsp if (memchr(zb.outbuf, '\0', outlen) == NULL) {
272 31e61ec1 2021-09-28 naddy uint8_t *newbuf;
274 1785f84a 2018-12-23 stsp newbuf = recallocarray(buf, nbuf - 1, nbuf, zbsize);
275 1785f84a 2018-12-23 stsp if (newbuf == NULL) {
276 638f9024 2019-05-13 stsp err = got_error_from_errno("recallocarray");
279 1785f84a 2018-12-23 stsp buf = newbuf;
280 1785f84a 2018-12-23 stsp zb.outbuf = newbuf + totlen;
281 1785f84a 2018-12-23 stsp zb.outlen = (nbuf * zbsize) - totlen;
283 dedbbd9d 2019-04-13 stsp } while (memchr(zb.outbuf, '\0', outlen) == NULL);
285 1785f84a 2018-12-23 stsp err = got_object_parse_header(obj, buf, totlen);
288 1785f84a 2018-12-23 stsp got_inflate_end(&zb);
289 1785f84a 2018-12-23 stsp return err;
292 13b2bc37 2022-10-23 stsp const struct got_error *
293 13b2bc37 2022-10-23 stsp got_object_read_raw(uint8_t **outbuf, off_t *size, size_t *hdrlen,
294 13b2bc37 2022-10-23 stsp size_t max_in_mem_size, int outfd, struct got_object_id *expected_id,
297 13b2bc37 2022-10-23 stsp const struct got_error *err = NULL;
298 13b2bc37 2022-10-23 stsp struct got_object *obj;
299 13b2bc37 2022-10-23 stsp struct got_inflate_checksum csum;
300 a1f06df2 2023-02-04 op uint8_t sha256[SHA256_DIGEST_LENGTH];
301 a1f06df2 2023-02-04 op SHA2_CTX sha256_ctx;
302 13b2bc37 2022-10-23 stsp uint8_t sha1[SHA1_DIGEST_LENGTH];
303 13b2bc37 2022-10-23 stsp SHA1_CTX sha1_ctx;
304 13b2bc37 2022-10-23 stsp size_t len, consumed;
305 13b2bc37 2022-10-23 stsp FILE *f = NULL;
308 13b2bc37 2022-10-23 stsp *outbuf = NULL;
310 13b2bc37 2022-10-23 stsp *hdrlen = 0;
312 a1f06df2 2023-02-04 op memset(&csum, 0, sizeof(csum));
313 a1f06df2 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256) {
314 a1f06df2 2023-02-04 op SHA256Init(&sha256_ctx);
315 a1f06df2 2023-02-04 op csum.output_sha256 = &sha256_ctx;
317 a1f06df2 2023-02-04 op SHA1Init(&sha1_ctx);
318 a1f06df2 2023-02-04 op csum.output_sha1 = &sha1_ctx;
321 13b2bc37 2022-10-23 stsp if (lseek(infd, SEEK_SET, 0) == -1)
322 13b2bc37 2022-10-23 stsp return got_error_from_errno("lseek");
324 13b2bc37 2022-10-23 stsp err = got_object_read_header(&obj, infd);
326 13b2bc37 2022-10-23 stsp return err;
328 13b2bc37 2022-10-23 stsp if (lseek(infd, SEEK_SET, 0) == -1)
329 13b2bc37 2022-10-23 stsp return got_error_from_errno("lseek");
331 13b2bc37 2022-10-23 stsp if (obj->size + obj->hdrlen <= max_in_mem_size) {
332 13b2bc37 2022-10-23 stsp err = got_inflate_to_mem_fd(outbuf, &len, &consumed, &csum,
333 13b2bc37 2022-10-23 stsp obj->size + obj->hdrlen, infd);
337 13b2bc37 2022-10-23 stsp * XXX This uses an extra file descriptor for no good reason.
338 13b2bc37 2022-10-23 stsp * We should have got_inflate_fd_to_fd().
340 13b2bc37 2022-10-23 stsp fd = dup(infd);
341 13b2bc37 2022-10-23 stsp if (fd == -1)
342 13b2bc37 2022-10-23 stsp return got_error_from_errno("dup");
343 13b2bc37 2022-10-23 stsp f = fdopen(fd, "r");
344 13b2bc37 2022-10-23 stsp if (f == NULL) {
345 13b2bc37 2022-10-23 stsp err = got_error_from_errno("fdopen");
350 13b2bc37 2022-10-23 stsp err = got_inflate_to_fd(&len, f, &csum, outfd);
355 13b2bc37 2022-10-23 stsp if (len < obj->hdrlen || len != obj->hdrlen + obj->size) {
356 13b2bc37 2022-10-23 stsp err = got_error(GOT_ERR_BAD_OBJ_HDR);
360 a1f06df2 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256) {
361 a1f06df2 2023-02-04 op SHA256Final(sha256, &sha256_ctx);
362 a1f06df2 2023-02-04 op r = memcmp(expected_id->hash, sha256, sizeof(sha256));
364 a1f06df2 2023-02-04 op SHA1Final(sha1, &sha1_ctx);
365 a1f06df2 2023-02-04 op r = memcmp(expected_id->hash, sha1, sizeof(sha1));
368 a1f06df2 2023-02-04 op if (r != 0) {
369 3c23f6cd 2023-02-04 op err = got_error_checksum(expected_id);
373 13b2bc37 2022-10-23 stsp *size = obj->size;
374 13b2bc37 2022-10-23 stsp *hdrlen = obj->hdrlen;
376 13b2bc37 2022-10-23 stsp got_object_close(obj);
377 13b2bc37 2022-10-23 stsp if (f && fclose(f) == EOF && err == NULL)
378 13b2bc37 2022-10-23 stsp err = got_error_from_errno("fclose");
379 13b2bc37 2022-10-23 stsp return err;
382 a440fac0 2018-09-06 stsp struct got_commit_object *
383 a440fac0 2018-09-06 stsp got_object_commit_alloc_partial(void)
385 a440fac0 2018-09-06 stsp struct got_commit_object *commit;
387 a440fac0 2018-09-06 stsp commit = calloc(1, sizeof(*commit));
388 a440fac0 2018-09-06 stsp if (commit == NULL)
389 a440fac0 2018-09-06 stsp return NULL;
390 acf0c7c6 2018-11-05 stsp commit->tree_id = malloc(sizeof(*commit->tree_id));
391 a440fac0 2018-09-06 stsp if (commit->tree_id == NULL) {
392 a440fac0 2018-09-06 stsp free(commit);
393 a440fac0 2018-09-06 stsp return NULL;
396 dbdddfee 2021-06-23 naddy STAILQ_INIT(&commit->parent_ids);
398 a440fac0 2018-09-06 stsp return commit;
401 a440fac0 2018-09-06 stsp const struct got_error *
402 a440fac0 2018-09-06 stsp got_object_commit_add_parent(struct got_commit_object *commit,
403 cf67c0d9 2023-02-04 op const char *id_str, int algo)
405 a440fac0 2018-09-06 stsp const struct got_error *err = NULL;
406 a440fac0 2018-09-06 stsp struct got_object_qid *qid;
408 5df4932d 2018-11-05 stsp err = got_object_qid_alloc_partial(&qid);
410 7762fe12 2018-11-05 stsp return err;
412 cf67c0d9 2023-02-04 op if (!got_parse_hash_digest(qid->id.hash, id_str, algo, NULL)) {
413 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
414 00eb6a1f 2019-07-15 stsp got_object_qid_free(qid);
415 a440fac0 2018-09-06 stsp return err;
417 cf67c0d9 2023-02-04 op qid->id.algo = algo;
419 dbdddfee 2021-06-23 naddy STAILQ_INSERT_TAIL(&commit->parent_ids, qid, entry);
420 a440fac0 2018-09-06 stsp commit->nparents++;
422 a440fac0 2018-09-06 stsp return NULL;
425 a440fac0 2018-09-06 stsp static const struct got_error *
426 a440fac0 2018-09-06 stsp parse_gmtoff(time_t *gmtoff, const char *tzstr)
428 a440fac0 2018-09-06 stsp int sign = 1;
429 a440fac0 2018-09-06 stsp const char *p = tzstr;
430 a440fac0 2018-09-06 stsp time_t h, m;
432 a440fac0 2018-09-06 stsp *gmtoff = 0;
434 a440fac0 2018-09-06 stsp if (*p == '-')
436 a440fac0 2018-09-06 stsp else if (*p != '+')
437 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
439 99fd9ff4 2022-11-17 op if (!isdigit((unsigned char)*p) &&
440 99fd9ff4 2022-11-17 op !isdigit((unsigned char)*(p + 1)))
441 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
442 a440fac0 2018-09-06 stsp h = (((*p - '0') * 10) + (*(p + 1) - '0'));
445 99fd9ff4 2022-11-17 op if (!isdigit((unsigned char)*p) &&
446 99fd9ff4 2022-11-17 op !isdigit((unsigned char)*(p + 1)))
447 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
448 a440fac0 2018-09-06 stsp m = ((*p - '0') * 10) + (*(p + 1) - '0');
450 a440fac0 2018-09-06 stsp *gmtoff = (h * 60 * 60 + m * 60) * sign;
451 a440fac0 2018-09-06 stsp return NULL;
454 a440fac0 2018-09-06 stsp static const struct got_error *
455 ccb26ccd 2018-11-05 stsp parse_commit_time(time_t *time, time_t *gmtoff, char *committer)
457 a440fac0 2018-09-06 stsp const struct got_error *err = NULL;
458 a440fac0 2018-09-06 stsp const char *errstr;
459 a440fac0 2018-09-06 stsp char *space, *tzstr;
461 a440fac0 2018-09-06 stsp /* Parse and strip off trailing timezone indicator string. */
462 a440fac0 2018-09-06 stsp space = strrchr(committer, ' ');
463 a440fac0 2018-09-06 stsp if (space == NULL)
464 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
465 a440fac0 2018-09-06 stsp tzstr = strdup(space + 1);
466 a440fac0 2018-09-06 stsp if (tzstr == NULL)
467 638f9024 2019-05-13 stsp return got_error_from_errno("strdup");
468 ccb26ccd 2018-11-05 stsp err = parse_gmtoff(gmtoff, tzstr);
469 a440fac0 2018-09-06 stsp free(tzstr);
471 9dbd8627 2021-02-04 stsp if (err->code != GOT_ERR_BAD_OBJ_DATA)
472 9dbd8627 2021-02-04 stsp return err;
473 9dbd8627 2021-02-04 stsp /* Old versions of Git omitted the timestamp. */
475 9dbd8627 2021-02-04 stsp *gmtoff = 0;
476 9dbd8627 2021-02-04 stsp return NULL;
478 a440fac0 2018-09-06 stsp *space = '\0';
480 a440fac0 2018-09-06 stsp /* Timestamp is separated from committer name + email by space. */
481 a440fac0 2018-09-06 stsp space = strrchr(committer, ' ');
482 a440fac0 2018-09-06 stsp if (space == NULL)
483 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
485 09867e48 2019-08-13 stsp /* Timestamp parsed here is expressed as UNIX timestamp (UTC). */
486 ccb26ccd 2018-11-05 stsp *time = strtonum(space + 1, 0, INT64_MAX, &errstr);
487 a440fac0 2018-09-06 stsp if (errstr)
488 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
490 a440fac0 2018-09-06 stsp /* Strip off parsed time information, leaving just author and email. */
491 a440fac0 2018-09-06 stsp *space = '\0';
493 a440fac0 2018-09-06 stsp return NULL;
497 03fa71c8 2018-09-06 stsp got_object_commit_close(struct got_commit_object *commit)
499 03fa71c8 2018-09-06 stsp if (commit->refcnt > 0) {
500 03fa71c8 2018-09-06 stsp commit->refcnt--;
501 03fa71c8 2018-09-06 stsp if (commit->refcnt > 0)
505 dd88155e 2019-06-29 stsp got_object_id_queue_free(&commit->parent_ids);
506 03fa71c8 2018-09-06 stsp free(commit->tree_id);
507 03fa71c8 2018-09-06 stsp free(commit->author);
508 03fa71c8 2018-09-06 stsp free(commit->committer);
509 03fa71c8 2018-09-06 stsp free(commit->logmsg);
510 03fa71c8 2018-09-06 stsp free(commit);
513 45d799e2 2018-12-23 stsp struct got_object_id *
514 45d799e2 2018-12-23 stsp got_object_commit_get_tree_id(struct got_commit_object *commit)
516 45d799e2 2018-12-23 stsp return commit->tree_id;
520 45d799e2 2018-12-23 stsp got_object_commit_get_nparents(struct got_commit_object *commit)
522 45d799e2 2018-12-23 stsp return commit->nparents;
525 45d799e2 2018-12-23 stsp const struct got_object_id_queue *
526 45d799e2 2018-12-23 stsp got_object_commit_get_parent_ids(struct got_commit_object *commit)
528 45d799e2 2018-12-23 stsp return &commit->parent_ids;
531 45d799e2 2018-12-23 stsp const char *
532 45d799e2 2018-12-23 stsp got_object_commit_get_author(struct got_commit_object *commit)
534 45d799e2 2018-12-23 stsp return commit->author;
538 45d799e2 2018-12-23 stsp got_object_commit_get_author_time(struct got_commit_object *commit)
540 45d799e2 2018-12-23 stsp return commit->author_time;
543 45d799e2 2018-12-23 stsp time_t got_object_commit_get_author_gmtoff(struct got_commit_object *commit)
545 45d799e2 2018-12-23 stsp return commit->author_gmtoff;
548 45d799e2 2018-12-23 stsp const char *
549 45d799e2 2018-12-23 stsp got_object_commit_get_committer(struct got_commit_object *commit)
551 45d799e2 2018-12-23 stsp return commit->committer;
555 45d799e2 2018-12-23 stsp got_object_commit_get_committer_time(struct got_commit_object *commit)
557 45d799e2 2018-12-23 stsp return commit->committer_time;
561 45d799e2 2018-12-23 stsp got_object_commit_get_committer_gmtoff(struct got_commit_object *commit)
563 45d799e2 2018-12-23 stsp return commit->committer_gmtoff;
566 5943eee2 2019-08-13 stsp const struct got_error *
567 5943eee2 2019-08-13 stsp got_object_commit_get_logmsg(char **logmsg, struct got_commit_object *commit)
569 5943eee2 2019-08-13 stsp const struct got_error *err = NULL;
570 b9c41b54 2021-08-03 stsp const char *src;
572 5943eee2 2019-08-13 stsp size_t len;
574 b9c41b54 2021-08-03 stsp len = strlen(commit->logmsg);
575 b9c41b54 2021-08-03 stsp *logmsg = malloc(len + 2); /* leave room for a trailing \n and \0 */
576 b9c41b54 2021-08-03 stsp if (*logmsg == NULL)
577 b9c41b54 2021-08-03 stsp return got_error_from_errno("malloc");
580 b9c41b54 2021-08-03 stsp * Strip out unusual headers. Headers are separated from the commit
581 b9c41b54 2021-08-03 stsp * message body by a single empty line.
583 b9c41b54 2021-08-03 stsp src = commit->logmsg;
584 b9c41b54 2021-08-03 stsp dst = *logmsg;
585 b9c41b54 2021-08-03 stsp while (*src != '\0' && *src != '\n') {
586 b9c41b54 2021-08-03 stsp int copy_header = 1, eol = 0;
587 b9c41b54 2021-08-03 stsp if (strncmp(src, GOT_COMMIT_LABEL_TREE,
588 b9c41b54 2021-08-03 stsp strlen(GOT_COMMIT_LABEL_TREE)) != 0 &&
589 b9c41b54 2021-08-03 stsp strncmp(src, GOT_COMMIT_LABEL_AUTHOR,
590 b9c41b54 2021-08-03 stsp strlen(GOT_COMMIT_LABEL_AUTHOR)) != 0 &&
591 b9c41b54 2021-08-03 stsp strncmp(src, GOT_COMMIT_LABEL_PARENT,
592 b9c41b54 2021-08-03 stsp strlen(GOT_COMMIT_LABEL_PARENT)) != 0 &&
593 b9c41b54 2021-08-03 stsp strncmp(src, GOT_COMMIT_LABEL_COMMITTER,
594 b9c41b54 2021-08-03 stsp strlen(GOT_COMMIT_LABEL_COMMITTER)) != 0)
595 b9c41b54 2021-08-03 stsp copy_header = 0;
597 b9c41b54 2021-08-03 stsp while (*src != '\0' && !eol) {
598 b9c41b54 2021-08-03 stsp if (copy_header) {
599 b9c41b54 2021-08-03 stsp *dst = *src;
602 b9c41b54 2021-08-03 stsp if (*src == '\n')
607 b9c41b54 2021-08-03 stsp *dst = '\0';
609 b9c41b54 2021-08-03 stsp if (strlcat(*logmsg, src, len + 1) >= len + 1) {
610 b9c41b54 2021-08-03 stsp err = got_error(GOT_ERR_NO_SPACE);
614 5943eee2 2019-08-13 stsp /* Trim redundant trailing whitespace. */
615 5943eee2 2019-08-13 stsp len = strlen(*logmsg);
616 5943eee2 2019-08-13 stsp while (len > 1 && isspace((unsigned char)(*logmsg)[len - 2]) &&
617 5943eee2 2019-08-13 stsp isspace((unsigned char)(*logmsg)[len - 1])) {
618 5943eee2 2019-08-13 stsp (*logmsg)[len - 1] = '\0';
622 b9c41b54 2021-08-03 stsp /* Append a trailing newline if missing. */
623 b9c41b54 2021-08-03 stsp if (len > 0 && (*logmsg)[len - 1] != '\n') {
624 b9c41b54 2021-08-03 stsp (*logmsg)[len] = '\n';
625 b9c41b54 2021-08-03 stsp (*logmsg)[len + 1] = '\0';
629 5943eee2 2019-08-13 stsp free(*logmsg);
630 5943eee2 2019-08-13 stsp *logmsg = NULL;
632 5943eee2 2019-08-13 stsp return err;
635 24ea5512 2019-08-22 stsp const char *
636 24ea5512 2019-08-22 stsp got_object_commit_get_logmsg_raw(struct got_commit_object *commit)
638 24ea5512 2019-08-22 stsp return commit->logmsg;
641 a440fac0 2018-09-06 stsp const struct got_error *
642 5e0b25c4 2018-12-24 stsp got_object_parse_commit(struct got_commit_object **commit, char *buf,
643 cf67c0d9 2023-02-04 op size_t len, int algo)
645 a440fac0 2018-09-06 stsp const struct got_error *err = NULL;
646 a440fac0 2018-09-06 stsp char *s = buf;
647 ff2a4428 2019-03-19 stsp size_t label_len;
648 cf67c0d9 2023-02-04 op size_t digest_strlen;
649 a440fac0 2018-09-06 stsp ssize_t remain = (ssize_t)len;
651 cf67c0d9 2023-02-04 op if (algo == GOT_HASH_SHA256)
652 cf67c0d9 2023-02-04 op digest_strlen = SHA256_DIGEST_STRING_LENGTH;
654 cf67c0d9 2023-02-04 op digest_strlen = SHA1_DIGEST_STRING_LENGTH;
656 4793d91b 2019-09-22 stsp if (remain == 0)
657 4793d91b 2019-09-22 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
659 a440fac0 2018-09-06 stsp *commit = got_object_commit_alloc_partial();
660 a440fac0 2018-09-06 stsp if (*commit == NULL)
661 638f9024 2019-05-13 stsp return got_error_from_errno("got_object_commit_alloc_partial");
663 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_COMMIT_LABEL_TREE);
664 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_COMMIT_LABEL_TREE, label_len) == 0) {
665 ff2a4428 2019-03-19 stsp remain -= label_len;
666 cf67c0d9 2023-02-04 op if (remain < digest_strlen) {
667 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
670 ff2a4428 2019-03-19 stsp s += label_len;
671 cf67c0d9 2023-02-04 op if (!got_parse_hash_digest((*commit)->tree_id->hash, s,
672 cf67c0d9 2023-02-04 op algo, NULL)) {
673 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
676 a1f06df2 2023-02-04 op (*commit)->tree_id->algo = algo;
677 cf67c0d9 2023-02-04 op remain -= digest_strlen;
678 cf67c0d9 2023-02-04 op s += digest_strlen;
680 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
684 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_COMMIT_LABEL_PARENT);
685 ff2a4428 2019-03-19 stsp while (strncmp(s, GOT_COMMIT_LABEL_PARENT, label_len) == 0) {
686 ff2a4428 2019-03-19 stsp remain -= label_len;
687 cf67c0d9 2023-02-04 op if (remain < digest_strlen) {
688 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
691 ff2a4428 2019-03-19 stsp s += label_len;
692 cf67c0d9 2023-02-04 op err = got_object_commit_add_parent(*commit, s, algo);
696 cf67c0d9 2023-02-04 op remain -= digest_strlen;
697 cf67c0d9 2023-02-04 op s += digest_strlen;
700 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_COMMIT_LABEL_AUTHOR);
701 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_COMMIT_LABEL_AUTHOR, label_len) == 0) {
703 a440fac0 2018-09-06 stsp size_t slen;
705 ff2a4428 2019-03-19 stsp remain -= label_len;
706 a440fac0 2018-09-06 stsp if (remain <= 0) {
707 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
710 ff2a4428 2019-03-19 stsp s += label_len;
711 dedbbd9d 2019-04-13 stsp p = memchr(s, '\n', remain);
712 a440fac0 2018-09-06 stsp if (p == NULL) {
713 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
717 a440fac0 2018-09-06 stsp slen = strlen(s);
718 ccb26ccd 2018-11-05 stsp err = parse_commit_time(&(*commit)->author_time,
719 ccb26ccd 2018-11-05 stsp &(*commit)->author_gmtoff, s);
722 a440fac0 2018-09-06 stsp (*commit)->author = strdup(s);
723 a440fac0 2018-09-06 stsp if ((*commit)->author == NULL) {
724 638f9024 2019-05-13 stsp err = got_error_from_errno("strdup");
727 a440fac0 2018-09-06 stsp s += slen + 1;
728 a440fac0 2018-09-06 stsp remain -= slen + 1;
731 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_COMMIT_LABEL_COMMITTER);
732 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_COMMIT_LABEL_COMMITTER, label_len) == 0) {
734 a440fac0 2018-09-06 stsp size_t slen;
736 ff2a4428 2019-03-19 stsp remain -= label_len;
737 a440fac0 2018-09-06 stsp if (remain <= 0) {
738 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
741 ff2a4428 2019-03-19 stsp s += label_len;
742 dedbbd9d 2019-04-13 stsp p = memchr(s, '\n', remain);
743 a440fac0 2018-09-06 stsp if (p == NULL) {
744 a440fac0 2018-09-06 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
748 a440fac0 2018-09-06 stsp slen = strlen(s);
749 ccb26ccd 2018-11-05 stsp err = parse_commit_time(&(*commit)->committer_time,
750 ccb26ccd 2018-11-05 stsp &(*commit)->committer_gmtoff, s);
753 a440fac0 2018-09-06 stsp (*commit)->committer = strdup(s);
754 a440fac0 2018-09-06 stsp if ((*commit)->committer == NULL) {
755 638f9024 2019-05-13 stsp err = got_error_from_errno("strdup");
758 a440fac0 2018-09-06 stsp s += slen + 1;
759 a440fac0 2018-09-06 stsp remain -= slen + 1;
762 a440fac0 2018-09-06 stsp (*commit)->logmsg = strndup(s, remain);
763 a440fac0 2018-09-06 stsp if ((*commit)->logmsg == NULL) {
764 638f9024 2019-05-13 stsp err = got_error_from_errno("strndup");
769 a440fac0 2018-09-06 stsp got_object_commit_close(*commit);
770 a440fac0 2018-09-06 stsp *commit = NULL;
772 a440fac0 2018-09-06 stsp return err;
775 13b2bc37 2022-10-23 stsp const struct got_error *
776 13b2bc37 2022-10-23 stsp got_object_read_commit(struct got_commit_object **commit, int fd,
777 13b2bc37 2022-10-23 stsp struct got_object_id *expected_id, size_t expected_size)
779 13b2bc37 2022-10-23 stsp struct got_object *obj = NULL;
780 13b2bc37 2022-10-23 stsp const struct got_error *err = NULL;
781 13b2bc37 2022-10-23 stsp size_t len;
782 13b2bc37 2022-10-23 stsp uint8_t *p;
783 13b2bc37 2022-10-23 stsp struct got_inflate_checksum csum;
784 13b2bc37 2022-10-23 stsp SHA1_CTX sha1_ctx;
785 cf67c0d9 2023-02-04 op SHA2_CTX sha256_ctx;
786 13b2bc37 2022-10-23 stsp struct got_object_id id;
788 13b2bc37 2022-10-23 stsp memset(&csum, 0, sizeof(csum));
789 cf67c0d9 2023-02-04 op id.algo = expected_id->algo;
790 cf67c0d9 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256) {
791 cf67c0d9 2023-02-04 op SHA256Init(&sha256_ctx);
792 cf67c0d9 2023-02-04 op csum.output_sha256 = &sha256_ctx;
794 cf67c0d9 2023-02-04 op SHA1Init(&sha1_ctx);
795 cf67c0d9 2023-02-04 op csum.output_sha1 = &sha1_ctx;
798 13b2bc37 2022-10-23 stsp err = got_inflate_to_mem_fd(&p, &len, NULL, &csum, expected_size, fd);
800 13b2bc37 2022-10-23 stsp return err;
802 cf67c0d9 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256)
803 cf67c0d9 2023-02-04 op SHA256Final(id.hash, &sha256_ctx);
805 cf67c0d9 2023-02-04 op SHA1Final(id.hash, &sha1_ctx);
807 7f959095 2023-02-02 op if (got_object_id_cmp(expected_id, &id) != 0) {
808 3c23f6cd 2023-02-04 op err = got_error_checksum(expected_id);
812 13b2bc37 2022-10-23 stsp err = got_object_parse_header(&obj, p, len);
816 13b2bc37 2022-10-23 stsp if (len < obj->hdrlen + obj->size) {
817 13b2bc37 2022-10-23 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
821 13b2bc37 2022-10-23 stsp if (obj->type != GOT_OBJ_TYPE_COMMIT) {
822 13b2bc37 2022-10-23 stsp err = got_error(GOT_ERR_OBJ_TYPE);
826 13b2bc37 2022-10-23 stsp /* Skip object header. */
827 13b2bc37 2022-10-23 stsp len -= obj->hdrlen;
828 cf67c0d9 2023-02-04 op err = got_object_parse_commit(commit, p + obj->hdrlen, len,
829 cf67c0d9 2023-02-04 op expected_id->algo);
833 13b2bc37 2022-10-23 stsp got_object_close(obj);
834 13b2bc37 2022-10-23 stsp return err;
838 ed175427 2019-05-09 stsp got_object_tree_close(struct got_tree_object *tree)
840 03fa71c8 2018-09-06 stsp if (tree->refcnt > 0) {
841 03fa71c8 2018-09-06 stsp tree->refcnt--;
842 03fa71c8 2018-09-06 stsp if (tree->refcnt > 0)
846 56e0773d 2019-11-28 stsp free(tree->entries);
847 03fa71c8 2018-09-06 stsp free(tree);
850 a440fac0 2018-09-06 stsp static const struct got_error *
851 9985f404 2022-05-19 stsp parse_tree_entry(struct got_parsed_tree_entry *pte, size_t *elen, char *buf,
852 a1f06df2 2023-02-04 op size_t maxlen, size_t idlen)
854 8914529d 2019-04-13 stsp char *p, *space;
858 9ef4ac16 2019-04-13 stsp *elen = strnlen(buf, maxlen) + 1;
859 9985f404 2022-05-19 stsp if (*elen > maxlen)
860 a440fac0 2018-09-06 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
862 dedbbd9d 2019-04-13 stsp space = memchr(buf, ' ', *elen);
863 9985f404 2022-05-19 stsp if (space == NULL || space <= buf)
864 9985f404 2022-05-19 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
866 9985f404 2022-05-19 stsp pte->mode = 0;
868 8914529d 2019-04-13 stsp while (p < space) {
869 00d10bca 2023-01-19 mark if (*p < '0' || *p > '7')
870 9985f404 2022-05-19 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
871 9985f404 2022-05-19 stsp pte->mode <<= 3;
872 9985f404 2022-05-19 stsp pte->mode |= *p - '0';
876 a1f06df2 2023-02-04 op if (*elen > maxlen || maxlen - *elen < idlen)
877 9985f404 2022-05-19 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
879 9985f404 2022-05-19 stsp pte->name = space + 1;
880 9985f404 2022-05-19 stsp pte->namelen = strlen(pte->name);
881 68bf1b1e 2018-11-07 stsp buf += *elen;
882 9985f404 2022-05-19 stsp pte->id = buf;
883 a1f06df2 2023-02-04 op pte->idlen = idlen;
884 a1f06df2 2023-02-04 op *elen += idlen;
885 9985f404 2022-05-19 stsp return NULL;
889 9985f404 2022-05-19 stsp pte_cmp(const void *pa, const void *pb)
891 9985f404 2022-05-19 stsp const struct got_parsed_tree_entry *a = pa, *b = pb;
893 9985f404 2022-05-19 stsp return got_path_cmp(a->name, b->name, a->namelen, b->namelen);
896 a440fac0 2018-09-06 stsp const struct got_error *
897 d294b1dc 2022-10-18 stsp got_object_parse_tree(struct got_parsed_tree_entry **entries, size_t *nentries,
898 a1f06df2 2023-02-04 op size_t *nentries_alloc, uint8_t *buf, size_t len, int algo)
900 3022d272 2019-11-14 stsp const struct got_error *err = NULL;
901 d294b1dc 2022-10-18 stsp size_t remain = len;
902 9985f404 2022-05-19 stsp const size_t nalloc = 16;
903 9985f404 2022-05-19 stsp struct got_parsed_tree_entry *pte;
904 a1f06df2 2023-02-04 op size_t idlen = SHA256_DIGEST_LENGTH;
907 a1f06df2 2023-02-04 op if (algo != GOT_HASH_SHA256)
908 a1f06df2 2023-02-04 op idlen = SHA1_DIGEST_LENGTH;
910 3022d272 2019-11-14 stsp *nentries = 0;
911 db1d3576 2019-10-04 stsp if (remain == 0)
912 db1d3576 2019-10-04 stsp return NULL; /* tree is empty */
914 a440fac0 2018-09-06 stsp while (remain > 0) {
915 a440fac0 2018-09-06 stsp size_t elen;
917 d294b1dc 2022-10-18 stsp if (*nentries >= *nentries_alloc) {
918 d294b1dc 2022-10-18 stsp pte = recallocarray(*entries, *nentries_alloc,
919 d294b1dc 2022-10-18 stsp *nentries_alloc + nalloc, sizeof(**entries));
920 9985f404 2022-05-19 stsp if (pte == NULL) {
921 9985f404 2022-05-19 stsp err = got_error_from_errno("recallocarray");
924 9985f404 2022-05-19 stsp *entries = pte;
925 d294b1dc 2022-10-18 stsp *nentries_alloc += nalloc;
928 9985f404 2022-05-19 stsp pte = &(*entries)[*nentries];
929 a1f06df2 2023-02-04 op err = parse_tree_entry(pte, &elen, buf, remain, idlen);
932 a440fac0 2018-09-06 stsp buf += elen;
933 a440fac0 2018-09-06 stsp remain -= elen;
934 3022d272 2019-11-14 stsp (*nentries)++;
937 a440fac0 2018-09-06 stsp if (remain != 0) {
938 f5d3d7af 2019-02-05 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
942 9985f404 2022-05-19 stsp if (*nentries > 1) {
943 9985f404 2022-05-19 stsp mergesort(*entries, *nentries, sizeof(**entries), pte_cmp);
945 9985f404 2022-05-19 stsp for (i = 0; i < *nentries - 1; i++) {
946 9985f404 2022-05-19 stsp struct got_parsed_tree_entry *prev = &(*entries)[i];
947 9985f404 2022-05-19 stsp pte = &(*entries)[i + 1];
948 9985f404 2022-05-19 stsp if (got_path_cmp(prev->name, pte->name,
949 9985f404 2022-05-19 stsp prev->namelen, pte->namelen) == 0) {
950 9985f404 2022-05-19 stsp err = got_error(GOT_ERR_TREE_DUP_ENTRY);
957 3022d272 2019-11-14 stsp *nentries = 0;
958 f5d3d7af 2019-02-05 stsp return err;
961 13b2bc37 2022-10-23 stsp const struct got_error *
962 13b2bc37 2022-10-23 stsp got_object_read_tree(struct got_parsed_tree_entry **entries, size_t *nentries,
963 13b2bc37 2022-10-23 stsp size_t *nentries_alloc, uint8_t **p, int fd,
964 13b2bc37 2022-10-23 stsp struct got_object_id *expected_id)
966 13b2bc37 2022-10-23 stsp const struct got_error *err = NULL;
967 13b2bc37 2022-10-23 stsp struct got_object *obj = NULL;
968 13b2bc37 2022-10-23 stsp size_t len;
969 13b2bc37 2022-10-23 stsp struct got_inflate_checksum csum;
970 a1f06df2 2023-02-04 op SHA2_CTX sha256_ctx;
971 13b2bc37 2022-10-23 stsp SHA1_CTX sha1_ctx;
972 13b2bc37 2022-10-23 stsp struct got_object_id id;
974 13b2bc37 2022-10-23 stsp memset(&csum, 0, sizeof(csum));
975 a1f06df2 2023-02-04 op id.algo = expected_id->algo;
976 a1f06df2 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256) {
977 a1f06df2 2023-02-04 op SHA256Init(&sha256_ctx);
978 a1f06df2 2023-02-04 op csum.output_sha256 = &sha256_ctx;
980 a1f06df2 2023-02-04 op SHA1Init(&sha1_ctx);
981 a1f06df2 2023-02-04 op csum.output_sha1 = &sha1_ctx;
984 13b2bc37 2022-10-23 stsp err = got_inflate_to_mem_fd(p, &len, NULL, &csum, 0, fd);
986 13b2bc37 2022-10-23 stsp return err;
988 a1f06df2 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256)
989 a1f06df2 2023-02-04 op SHA256Final(id.hash, &sha256_ctx);
991 a1f06df2 2023-02-04 op SHA1Final(id.hash, &sha1_ctx);
992 7f959095 2023-02-02 op if (got_object_id_cmp(expected_id, &id) != 0) {
993 3c23f6cd 2023-02-04 op err = got_error_checksum(expected_id);
997 13b2bc37 2022-10-23 stsp err = got_object_parse_header(&obj, *p, len);
1001 13b2bc37 2022-10-23 stsp if (len < obj->hdrlen + obj->size) {
1002 13b2bc37 2022-10-23 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1003 13b2bc37 2022-10-23 stsp goto done;
1006 13b2bc37 2022-10-23 stsp /* Skip object header. */
1007 13b2bc37 2022-10-23 stsp len -= obj->hdrlen;
1008 13b2bc37 2022-10-23 stsp err = got_object_parse_tree(entries, nentries, nentries_alloc,
1009 a1f06df2 2023-02-04 op *p + obj->hdrlen, len, expected_id->algo);
1012 13b2bc37 2022-10-23 stsp got_object_close(obj);
1013 13b2bc37 2022-10-23 stsp return err;
1017 f4a881ce 2018-11-17 stsp got_object_tag_close(struct got_tag_object *tag)
1019 ca0d469c 2019-08-13 stsp if (tag->refcnt > 0) {
1020 ca0d469c 2019-08-13 stsp tag->refcnt--;
1021 ca0d469c 2019-08-13 stsp if (tag->refcnt > 0)
1025 f4a881ce 2018-11-17 stsp free(tag->tag);
1026 f4a881ce 2018-11-17 stsp free(tag->tagger);
1027 f4a881ce 2018-11-17 stsp free(tag->tagmsg);
1028 f4a881ce 2018-11-17 stsp free(tag);
1031 ad242220 2018-09-08 stsp const struct got_error *
1032 a1f06df2 2023-02-04 op got_object_parse_tag(struct got_tag_object **tag, uint8_t *buf, size_t len,
1035 f4a881ce 2018-11-17 stsp const struct got_error *err = NULL;
1036 f4a881ce 2018-11-17 stsp size_t remain = len;
1037 f4a881ce 2018-11-17 stsp char *s = buf;
1038 a1f06df2 2023-02-04 op size_t label_len, digest_strlen = SHA256_DIGEST_STRING_LENGTH;
1040 a1f06df2 2023-02-04 op if (algo != GOT_HASH_SHA256)
1041 a1f06df2 2023-02-04 op digest_strlen = SHA1_DIGEST_STRING_LENGTH;
1043 4793d91b 2019-09-22 stsp if (remain == 0)
1044 4793d91b 2019-09-22 stsp return got_error(GOT_ERR_BAD_OBJ_DATA);
1046 f4a881ce 2018-11-17 stsp *tag = calloc(1, sizeof(**tag));
1047 f4a881ce 2018-11-17 stsp if (*tag == NULL)
1048 638f9024 2019-05-13 stsp return got_error_from_errno("calloc");
1050 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_TAG_LABEL_OBJECT);
1051 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_TAG_LABEL_OBJECT, label_len) == 0) {
1052 ff2a4428 2019-03-19 stsp remain -= label_len;
1053 a1f06df2 2023-02-04 op if (remain < digest_strlen) {
1054 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1055 f4a881ce 2018-11-17 stsp goto done;
1057 ff2a4428 2019-03-19 stsp s += label_len;
1058 a1f06df2 2023-02-04 op if (!got_parse_hash_digest((*tag)->id.hash, s, algo, NULL)) {
1059 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1060 f4a881ce 2018-11-17 stsp goto done;
1062 a1f06df2 2023-02-04 op (*tag)->id.algo = algo;
1063 a1f06df2 2023-02-04 op remain -= digest_strlen;
1064 a1f06df2 2023-02-04 op s += digest_strlen;
1066 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1067 f4a881ce 2018-11-17 stsp goto done;
1070 f4a881ce 2018-11-17 stsp if (remain <= 0) {
1071 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1072 f4a881ce 2018-11-17 stsp goto done;
1075 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_TAG_LABEL_TYPE);
1076 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_TAG_LABEL_TYPE, label_len) == 0) {
1077 ff2a4428 2019-03-19 stsp remain -= label_len;
1078 f4a881ce 2018-11-17 stsp if (remain <= 0) {
1079 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1080 f4a881ce 2018-11-17 stsp goto done;
1082 ff2a4428 2019-03-19 stsp s += label_len;
1083 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_OBJ_LABEL_COMMIT,
1084 ff2a4428 2019-03-19 stsp strlen(GOT_OBJ_LABEL_COMMIT)) == 0) {
1085 f4a881ce 2018-11-17 stsp (*tag)->obj_type = GOT_OBJ_TYPE_COMMIT;
1086 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_OBJ_LABEL_COMMIT);
1087 ff2a4428 2019-03-19 stsp s += label_len;
1088 ff2a4428 2019-03-19 stsp remain -= label_len;
1089 ff2a4428 2019-03-19 stsp } else if (strncmp(s, GOT_OBJ_LABEL_TREE,
1090 ff2a4428 2019-03-19 stsp strlen(GOT_OBJ_LABEL_TREE)) == 0) {
1091 f4a881ce 2018-11-17 stsp (*tag)->obj_type = GOT_OBJ_TYPE_TREE;
1092 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_OBJ_LABEL_TREE);
1093 ff2a4428 2019-03-19 stsp s += label_len;
1094 ff2a4428 2019-03-19 stsp remain -= label_len;
1095 ff2a4428 2019-03-19 stsp } else if (strncmp(s, GOT_OBJ_LABEL_BLOB,
1096 ff2a4428 2019-03-19 stsp strlen(GOT_OBJ_LABEL_BLOB)) == 0) {
1097 f4a881ce 2018-11-17 stsp (*tag)->obj_type = GOT_OBJ_TYPE_BLOB;
1098 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_OBJ_LABEL_BLOB);
1099 ff2a4428 2019-03-19 stsp s += label_len;
1100 ff2a4428 2019-03-19 stsp remain -= label_len;
1101 ff2a4428 2019-03-19 stsp } else if (strncmp(s, GOT_OBJ_LABEL_TAG,
1102 ff2a4428 2019-03-19 stsp strlen(GOT_OBJ_LABEL_TAG)) == 0) {
1103 f4a881ce 2018-11-17 stsp (*tag)->obj_type = GOT_OBJ_TYPE_TAG;
1104 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_OBJ_LABEL_TAG);
1105 ff2a4428 2019-03-19 stsp s += label_len;
1106 ff2a4428 2019-03-19 stsp remain -= label_len;
1108 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1109 f4a881ce 2018-11-17 stsp goto done;
1112 f4a881ce 2018-11-17 stsp if (remain <= 0 || *s != '\n') {
1113 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1114 f4a881ce 2018-11-17 stsp goto done;
1118 f4a881ce 2018-11-17 stsp if (remain <= 0) {
1119 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1120 f4a881ce 2018-11-17 stsp goto done;
1123 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1124 f4a881ce 2018-11-17 stsp goto done;
1127 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_TAG_LABEL_TAG);
1128 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_TAG_LABEL_TAG, label_len) == 0) {
1130 f4a881ce 2018-11-17 stsp size_t slen;
1131 ff2a4428 2019-03-19 stsp remain -= label_len;
1132 f4a881ce 2018-11-17 stsp if (remain <= 0) {
1133 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1134 f4a881ce 2018-11-17 stsp goto done;
1136 ff2a4428 2019-03-19 stsp s += label_len;
1137 dedbbd9d 2019-04-13 stsp p = memchr(s, '\n', remain);
1138 f4a881ce 2018-11-17 stsp if (p == NULL) {
1139 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1140 f4a881ce 2018-11-17 stsp goto done;
1142 f4a881ce 2018-11-17 stsp *p = '\0';
1143 f4a881ce 2018-11-17 stsp slen = strlen(s);
1144 f4a881ce 2018-11-17 stsp (*tag)->tag = strndup(s, slen);
1145 f4a881ce 2018-11-17 stsp if ((*tag)->tag == NULL) {
1146 638f9024 2019-05-13 stsp err = got_error_from_errno("strndup");
1147 f4a881ce 2018-11-17 stsp goto done;
1149 f4a881ce 2018-11-17 stsp s += slen + 1;
1150 f4a881ce 2018-11-17 stsp remain -= slen + 1;
1151 f4a881ce 2018-11-17 stsp if (remain <= 0) {
1152 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1153 f4a881ce 2018-11-17 stsp goto done;
1156 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1157 f4a881ce 2018-11-17 stsp goto done;
1160 ff2a4428 2019-03-19 stsp label_len = strlen(GOT_TAG_LABEL_TAGGER);
1161 ff2a4428 2019-03-19 stsp if (strncmp(s, GOT_TAG_LABEL_TAGGER, label_len) == 0) {
1163 f4a881ce 2018-11-17 stsp size_t slen;
1165 ff2a4428 2019-03-19 stsp remain -= label_len;
1166 f4a881ce 2018-11-17 stsp if (remain <= 0) {
1167 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1168 f4a881ce 2018-11-17 stsp goto done;
1170 ff2a4428 2019-03-19 stsp s += label_len;
1171 dedbbd9d 2019-04-13 stsp p = memchr(s, '\n', remain);
1172 f4a881ce 2018-11-17 stsp if (p == NULL) {
1173 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1174 f4a881ce 2018-11-17 stsp goto done;
1176 f4a881ce 2018-11-17 stsp *p = '\0';
1177 f4a881ce 2018-11-17 stsp slen = strlen(s);
1178 f4a881ce 2018-11-17 stsp err = parse_commit_time(&(*tag)->tagger_time,
1179 f4a881ce 2018-11-17 stsp &(*tag)->tagger_gmtoff, s);
1181 f4a881ce 2018-11-17 stsp goto done;
1182 f4a881ce 2018-11-17 stsp (*tag)->tagger = strdup(s);
1183 f4a881ce 2018-11-17 stsp if ((*tag)->tagger == NULL) {
1184 638f9024 2019-05-13 stsp err = got_error_from_errno("strdup");
1185 f4a881ce 2018-11-17 stsp goto done;
1187 f4a881ce 2018-11-17 stsp s += slen + 1;
1188 f4a881ce 2018-11-17 stsp remain -= slen + 1;
1189 5a8b373c 2020-12-18 stsp if (remain < 0) {
1190 f4a881ce 2018-11-17 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1191 f4a881ce 2018-11-17 stsp goto done;
1194 e0e55b50 2019-02-01 stsp /* Some old tags in the Linux git repo have no tagger. */
1195 e0e55b50 2019-02-01 stsp (*tag)->tagger = strdup("");
1196 e0e55b50 2019-02-01 stsp if ((*tag)->tagger == NULL) {
1197 638f9024 2019-05-13 stsp err = got_error_from_errno("strdup");
1198 e0e55b50 2019-02-01 stsp goto done;
1202 f4a881ce 2018-11-17 stsp (*tag)->tagmsg = strndup(s, remain);
1203 f4a881ce 2018-11-17 stsp if ((*tag)->tagmsg == NULL) {
1204 638f9024 2019-05-13 stsp err = got_error_from_errno("strndup");
1205 f4a881ce 2018-11-17 stsp goto done;
1208 f4a881ce 2018-11-17 stsp if (err) {
1209 f4a881ce 2018-11-17 stsp got_object_tag_close(*tag);
1210 f4a881ce 2018-11-17 stsp *tag = NULL;
1212 13b2bc37 2022-10-23 stsp return err;
1215 13b2bc37 2022-10-23 stsp const struct got_error *
1216 758dc042 2022-11-06 stsp got_object_read_tag(struct got_tag_object **tag, int fd,
1217 13b2bc37 2022-10-23 stsp struct got_object_id *expected_id, size_t expected_size)
1219 13b2bc37 2022-10-23 stsp const struct got_error *err = NULL;
1220 13b2bc37 2022-10-23 stsp struct got_object *obj = NULL;
1221 13b2bc37 2022-10-23 stsp size_t len;
1222 13b2bc37 2022-10-23 stsp uint8_t *p;
1223 13b2bc37 2022-10-23 stsp struct got_inflate_checksum csum;
1224 a1f06df2 2023-02-04 op SHA2_CTX sha256_ctx;
1225 13b2bc37 2022-10-23 stsp SHA1_CTX sha1_ctx;
1226 13b2bc37 2022-10-23 stsp struct got_object_id id;
1228 13b2bc37 2022-10-23 stsp memset(&csum, 0, sizeof(csum));
1229 a1f06df2 2023-02-04 op id.algo = expected_id->algo;
1230 a1f06df2 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256) {
1231 a1f06df2 2023-02-04 op SHA256Init(&sha256_ctx);
1232 a1f06df2 2023-02-04 op csum.output_sha256 = &sha256_ctx;
1234 a1f06df2 2023-02-04 op SHA1Init(&sha1_ctx);
1235 a1f06df2 2023-02-04 op csum.output_sha1 = &sha1_ctx;
1238 13b2bc37 2022-10-23 stsp err = got_inflate_to_mem_fd(&p, &len, NULL, &csum,
1239 13b2bc37 2022-10-23 stsp expected_size, fd);
1241 13b2bc37 2022-10-23 stsp return err;
1243 a1f06df2 2023-02-04 op if (expected_id->algo == GOT_HASH_SHA256)
1244 a1f06df2 2023-02-04 op SHA256Final(id.hash, &sha256_ctx);
1246 a1f06df2 2023-02-04 op SHA1Final(id.hash, &sha1_ctx);
1247 7f959095 2023-02-02 op if (got_object_id_cmp(expected_id, &id) != 0) {
1248 3c23f6cd 2023-02-04 op err = got_error_checksum(expected_id);
1249 13b2bc37 2022-10-23 stsp goto done;
1252 13b2bc37 2022-10-23 stsp err = got_object_parse_header(&obj, p, len);
1254 13b2bc37 2022-10-23 stsp goto done;
1256 13b2bc37 2022-10-23 stsp if (len < obj->hdrlen + obj->size) {
1257 13b2bc37 2022-10-23 stsp err = got_error(GOT_ERR_BAD_OBJ_DATA);
1258 13b2bc37 2022-10-23 stsp goto done;
1261 13b2bc37 2022-10-23 stsp /* Skip object header. */
1262 13b2bc37 2022-10-23 stsp len -= obj->hdrlen;
1263 a1f06df2 2023-02-04 op err = got_object_parse_tag(tag, p + obj->hdrlen, len, expected_id->algo);
1267 13b2bc37 2022-10-23 stsp got_object_close(obj);
1268 f4a881ce 2018-11-17 stsp return err;
1271 f4a881ce 2018-11-17 stsp const struct got_error *
1272 ad242220 2018-09-08 stsp got_read_file_to_mem(uint8_t **outbuf, size_t *outlen, FILE *f)
1274 a440fac0 2018-09-06 stsp const struct got_error *err = NULL;
1275 a440fac0 2018-09-06 stsp static const size_t blocksize = 512;
1276 a440fac0 2018-09-06 stsp size_t n, total, remain;
1277 a440fac0 2018-09-06 stsp uint8_t *buf;
1279 a440fac0 2018-09-06 stsp *outbuf = NULL;
1280 a440fac0 2018-09-06 stsp *outlen = 0;
1282 a440fac0 2018-09-06 stsp buf = malloc(blocksize);
1283 a440fac0 2018-09-06 stsp if (buf == NULL)
1284 638f9024 2019-05-13 stsp return got_error_from_errno("malloc");
1286 a440fac0 2018-09-06 stsp remain = blocksize;
1287 a440fac0 2018-09-06 stsp total = 0;
1289 a440fac0 2018-09-06 stsp if (remain == 0) {
1290 a440fac0 2018-09-06 stsp uint8_t *newbuf;
1291 a440fac0 2018-09-06 stsp newbuf = reallocarray(buf, 1, total + blocksize);
1292 a440fac0 2018-09-06 stsp if (newbuf == NULL) {
1293 638f9024 2019-05-13 stsp err = got_error_from_errno("reallocarray");
1294 a440fac0 2018-09-06 stsp goto done;
1296 a440fac0 2018-09-06 stsp buf = newbuf;
1297 a440fac0 2018-09-06 stsp remain += blocksize;
1299 a440fac0 2018-09-06 stsp n = fread(buf + total, 1, remain, f);
1300 a440fac0 2018-09-06 stsp if (n == 0) {
1301 a440fac0 2018-09-06 stsp if (ferror(f)) {
1302 a440fac0 2018-09-06 stsp err = got_ferror(f, GOT_ERR_IO);
1303 a440fac0 2018-09-06 stsp goto done;
1305 a440fac0 2018-09-06 stsp break; /* EOF */
1307 a440fac0 2018-09-06 stsp remain -= n;
1308 a440fac0 2018-09-06 stsp total += n;
1312 a440fac0 2018-09-06 stsp if (err == NULL) {
1313 a440fac0 2018-09-06 stsp *outbuf = buf;
1314 a440fac0 2018-09-06 stsp *outlen = total;
1316 a440fac0 2018-09-06 stsp free(buf);
1317 ad242220 2018-09-08 stsp return err;