Commit Diff


commit - e1e77cc43b61294facdf656a456a4108c13eb638
commit + 93658fb90d8fedd9c447896835e7c76f35e04ed2
blob - 709948a09b358cf01d39d50454f4f9c08fad9c28
blob + 27b8780c69c81f08f6abd29001c803e5e4e2f601
--- got/Makefile
+++ got/Makefile
@@ -8,7 +8,7 @@ SRCS=		got.c blame.c commit_graph.c delta.c diff.c \
 		object_idset.c object_parse.c opentemp.c path.c pack.c \
 		privsep.c reference.c repository.c sha1.c worktree.c \
 		inflate.c buf.c rcsutil.c diff3.c lockfile.c \
-		deflate.c object_create.c delta_cache.c
+		deflate.c object_create.c delta_cache.c fetch.c
 MAN =		${PROG}.1 got-worktree.5 git-repository.5
 
 CPPFLAGS = -I${.CURDIR}/../include -I${.CURDIR}/../lib
blob - 16acb2621cdd21bffe0bafda2a0d4139eb8c1a0f
blob + fa392ce43029ddbfe734698a174ff138dd4b4966
--- got/got.c
+++ got/got.c
@@ -1,6 +1,7 @@
 /*
  * Copyright (c) 2017 Martin Pieuchot <mpi@openbsd.org>
  * Copyright (c) 2018, 2019, 2020 Stefan Sperling <stsp@openbsd.org>
+ * Copyright (c) 2020 Ori Bernstein <ori@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -48,6 +49,7 @@
 #include "got_worktree.h"
 #include "got_diff.h"
 #include "got_commit_graph.h"
+#include "got_lib_fetch.h"
 #include "got_blame.h"
 #include "got_privsep.h"
 #include "got_opentemp.h"
@@ -83,6 +85,7 @@ __dead static void	usage(int);
 __dead static void	usage_init(void);
 __dead static void	usage_import(void);
 __dead static void	usage_checkout(void);
+__dead static void	usage_clone(void);
 __dead static void	usage_update(void);
 __dead static void	usage_log(void);
 __dead static void	usage_diff(void);
@@ -107,6 +110,7 @@ __dead static void	usage_cat(void);
 
 static const struct got_error*		cmd_init(int, char *[]);
 static const struct got_error*		cmd_import(int, char *[]);
+static const struct got_error*		cmd_clone(int, char *[]);
 static const struct got_error*		cmd_checkout(int, char *[]);
 static const struct got_error*		cmd_update(int, char *[]);
 static const struct got_error*		cmd_log(int, char *[]);
@@ -134,6 +138,7 @@ static struct got_cmd got_commands[] = {
 	{ "init",	cmd_init,	usage_init,	"in" },
 	{ "import",	cmd_import,	usage_import,	"im" },
 	{ "checkout",	cmd_checkout,	usage_checkout,	"co" },
+	{ "clone",	cmd_clone,	usage_clone,	"cl" },
 	{ "update",	cmd_update,	usage_update,	"up" },
 	{ "log",	cmd_log,	usage_log,	"" },
 	{ "diff",	cmd_diff,	usage_diff,	"di" },
@@ -797,6 +802,13 @@ done:
 	if (head_ref)
 		got_ref_close(head_ref);
 	return error;
+}
+
+__dead static void
+usage_clone(void)
+{
+	fprintf(stderr, "usage: %s clone repo-url\n", getprogname());
+	exit(1);
 }
 
 __dead static void
@@ -954,6 +966,34 @@ done:
 	if (!err && !is_same_branch)
 		err = got_error(GOT_ERR_ANCESTRY);
 	return err;
+}
+
+static const struct got_error *
+cmd_clone(int argc, char *argv[])
+{
+	char *uri, *branch_filter, *dirname;
+	int ch;
+
+	while ((ch = getopt(argc, argv, "b:")) != -1) {
+		switch (ch) {
+		case 'b':
+			branch_filter = optarg;
+			break;
+		default:
+			usage_clone();
+			break;
+		}
+	}
+	argc -= optind;
+	argv += optind;
+	uri = argv[0];
+	if(argc == 1)
+		dirname = NULL;
+	else if(argc == 2)
+		dirname = argv[1];
+	else
+		usage_clone();
+	return got_clone(argv[0], branch_filter, dirname);
 }
 
 static const struct got_error *
blob - 80f9b0ed32b5cf77045b2016ae220f3802661f48
blob + 71d643171b205c69e05d0a68dd5cec264b1d8ecc
--- include/got_error.h
+++ include/got_error.h
@@ -1,5 +1,6 @@
 /*
  * Copyright (c) 2018, 2019, 2020 Stefan Sperling <stsp@openbsd.org>
+ * Copyright (c) 2020 Ori Bernstein <ori@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -128,9 +129,12 @@
 #define GOT_ERR_REGEX		112
 #define GOT_ERR_REF_NAME_MINUS	113
 #define GOT_ERR_GITCONFIG_SYNTAX 114
-#define GOT_ERR_REBASE_OUT_OF_DATE 115
-#define GOT_ERR_CACHE_DUP_ENTRY	116
-#define GOT_ERR_QUERYSTRING	117
+#define GOT_ERR_FETCH_FAILED	115
+#define GOT_ERR_PARSE_URI	116
+#define GOT_ERR_BAD_PROTO	117
+#define GOT_ERR_REBASE_OUT_OF_DATE 118
+#define GOT_ERR_CACHE_DUP_ENTRY	119
+#define GOT_ERR_QUERYSTRING	120
 
 static const struct got_error {
 	int code;
@@ -269,6 +273,9 @@ static const struct got_error {
 	    "can be used to rebase a branch" },
 	{ GOT_ERR_CACHE_DUP_ENTRY, "duplicate cache entry" },
 	{ GOT_ERR_QUERYSTRING, "bad querystring" },
+	{ GOT_ERR_FETCH_FAILED, "fetch failed" },
+	{ GOT_ERR_PARSE_URI, "failed to parse uri" },
+	{ GOT_ERR_BAD_PROTO, "unknown protocol" },
 };
 
 /*
blob - /dev/null
blob + be04a7dc049d95312f53007d313519f18f5699f5 (mode 644)
--- /dev/null
+++ lib/fetch.c
@@ -0,0 +1,360 @@
+/*
+ * Copyright (c) 2018, 2019 Ori Bernstein <ori@openbsd.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <sys/queue.h>
+#include <sys/uio.h>
+#include <sys/socket.h>
+#include <sys/wait.h>
+#include <sys/syslimits.h>
+#include <sys/resource.h>
+#include <sys/socket.h>
+
+#include <errno.h>
+#include <fcntl.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdint.h>
+#include <sha1.h>
+#include <zlib.h>
+#include <ctype.h>
+#include <limits.h>
+#include <imsg.h>
+#include <time.h>
+#include <uuid.h>
+#include <netdb.h>
+#include <netinet/in.h>
+
+#include "got_error.h"
+#include "got_reference.h"
+#include "got_repository.h"
+#include "got_path.h"
+#include "got_cancel.h"
+#include "got_worktree.h"
+#include "got_object.h"
+
+#include "got_lib_delta.h"
+#include "got_lib_inflate.h"
+#include "got_lib_object.h"
+#include "got_lib_object_parse.h"
+#include "got_lib_object_create.h"
+#include "got_lib_pack.h"
+#include "got_lib_sha1.h"
+#include "got_lib_privsep.h"
+#include "got_lib_object_cache.h"
+#include "got_lib_repository.h"
+
+#define GOT_PROTOMAX	64
+#define GOT_HOSTMAX	256
+#define GOT_PATHMAX	512
+#define GOT_REPOMAX	256
+#define GOT_PORTMAX	16
+#define GOT_URIMAX	1024
+
+static int
+mkpath(char *path)
+{
+	char *p, namebuf[PATH_MAX];
+	struct stat sb;
+	int done;
+
+	while (*path == '/')
+		path++;
+	if (strlcpy(namebuf, path, sizeof(namebuf)) >= sizeof(namebuf)) {
+		errno = ENAMETOOLONG;
+		return -1;
+	}
+
+	p = namebuf;
+	for (;;) {
+		p += strspn(p, "/");
+		p += strcspn(p, "/");
+		done = (*p == '\0');
+		*p = '\0';
+
+		if (mkdir(namebuf, 0755) != 0) {
+			int mkdir_errno = errno;
+			if (stat(path, &sb) == -1) {
+				/* Not there; use mkdir()s errno */
+				errno = mkdir_errno;
+				return -1;
+			}
+			if (!S_ISDIR(sb.st_mode)) {
+				/* Is there, but isn't a directory */
+				errno = ENOTDIR;
+				return -1;
+			}
+		}
+
+		if (done)
+			break;
+		*p = '/';
+	}
+
+	return 0;
+}
+
+static int
+hassuffix(char *base, char *suf)
+{
+	int nb, ns;
+
+	nb = strlen(base);
+	ns = strlen(suf);
+	if (ns <= nb && strcmp(base + (nb - ns), suf) == 0)
+		return 1;
+	return 0;
+}
+
+static int
+grab(char *dst, int n, char *p, char *e)
+{
+	int l;
+
+	l = e - p;
+	if (l >= n) {
+		errno = ENAMETOOLONG;
+		return -1;
+	}
+	return strlcpy(dst, p, l + 1);
+}
+
+static int
+got_dial_ssh(char *host, char *port, char *path, char *direction)
+{
+	int pid, pfd[2];
+	char cmd[64];
+
+	if (pipe(pfd) == -1)
+		return -1;
+	pid = fork();
+	if (pid == -1)
+		return -1;
+	if (pid == 0) {
+		close(pfd[1]);
+		dup2(pfd[0], 0);
+		dup2(pfd[0], 1);
+		snprintf(cmd, sizeof(cmd), "git-%s-pack", direction);
+		execlp("ssh", "ssh", host, cmd, path, NULL);
+		abort();
+	}else{
+		close(pfd[0]);
+		return pfd[1];
+	}
+}
+
+static int
+got_dial_git(char *host, char *port, char *path, char *direction)
+{
+	struct addrinfo hints, *servinfo, *p;
+	char *cmd, *pkt;
+	int fd, l, r;
+
+	memset(&hints, 0, sizeof hints);
+	hints.ai_family = AF_UNSPEC;
+	hints.ai_socktype = SOCK_STREAM;
+	if (getaddrinfo(host, port, &hints, &servinfo) != 0)
+		return -1;
+
+	for (p = servinfo; p != NULL; p = p->ai_next) {
+		if ((fd = socket(p->ai_family, p->ai_socktype,
+		    p->ai_protocol)) == -1)
+			continue;
+		if (connect(fd, p->ai_addr, p->ai_addrlen) == 0)
+			break;
+		close(fd);
+	}
+	if (p == NULL)
+		return -1;
+
+	if ((l = asprintf(&cmd, "git-%s-pack %s\n", direction, path)) == -1)
+		return -1;
+	if ((l = asprintf(&pkt, "%04x%s", l+4, cmd)) == -1)
+		return -1;
+	r = write(fd, pkt, l);
+	free(cmd);
+	free(pkt);
+	if (r == -1) {
+		close(fd);
+		return -1;
+	}
+	return fd;
+}
+
+int
+got_parse_uri(char *uri, char *proto, char *host, char *port, char *path, char *repo)
+{
+	char *s, *p, *q;
+	int n, hasport;
+
+	p = strstr(uri, "://");
+	if (!p) {
+		//werrstr("missing protocol");
+		return -1;
+	}
+	if (grab(proto, GOT_PROTOMAX, uri, p) == -1)
+		return -1;
+	hasport = (strcmp(proto, "git") == 0 || strstr(proto, "http") == proto);
+	s = p + 3;
+	p = NULL;
+	if (!hasport) {
+		p = strstr(s, ":");
+		if (p != NULL)
+			p++;
+	}
+	if (p == NULL)
+		p = strstr(s, "/");
+	if (p == NULL || strlen(p) == 1) {
+		//werrstr("missing path");
+		return -1;
+	}
+
+	q = memchr(s, ':', p - s);
+	if (q) {
+		grab(host, GOT_HOSTMAX, s, q);
+		grab(port, GOT_PORTMAX, q + 1, p);
+	}else{
+		grab(host, GOT_HOSTMAX, s, p);
+		snprintf(port, GOT_PORTMAX, "9418");
+	}
+
+	snprintf(path, GOT_PATHMAX, "%s", p);
+	p = strrchr(p, '/') + 1;
+	if (!p || strlen(p) == 0) {
+		//werrstr("missing repository in uri");
+		return -1;
+	}
+	n = strlen(p);
+	if (hassuffix(p, ".git"))
+		n -= 4;
+	grab(repo, GOT_REPOMAX, p, p + n);
+	return 0;
+}
+
+const struct got_error*
+got_clone(char *uri, char *branch_filter, char *dirname)
+{
+	char proto[GOT_PROTOMAX], host[GOT_HOSTMAX], port[GOT_PORTMAX];
+	char repo[GOT_REPOMAX], path[GOT_PATHMAX];
+	int imsg_fetchfds[2], imsg_idxfds[2], fetchfd;
+	int packfd, npackfd, idxfd, nidxfd, status;
+	struct got_object_id packhash;
+	const struct got_error *err;
+	struct imsgbuf ibuf;
+	pid_t pid;
+
+	fetchfd = -1;
+	if (got_parse_uri(uri, proto, host, port, path, repo) == -1)
+		return got_error(GOT_ERR_PARSE_URI);
+	if (dirname == NULL)
+		dirname = repo;
+	err = got_repo_init(dirname);
+	if (err != NULL)
+		return err;
+	if (chdir(dirname))
+		return got_error_from_errno("enter new repo");
+	if (mkpath(".git/objects/pack") == -1)
+		return got_error_from_errno("mkpath");
+	packfd = open(".git/objects/pack/fetching.pack", O_CREAT|O_RDWR, 0644);
+	if (packfd == -1)
+		return got_error_from_errno("open pack");
+	npackfd = dup(packfd);
+	if (npackfd == -1)
+		return got_error_from_errno("dup");
+	idxfd = open(".git/objects/pack/fetching.idx", O_CREAT|O_RDWR, 0644);
+	if (idxfd == -1)
+		return got_error_from_errno("open pack");
+	nidxfd = dup(idxfd);
+	if (nidxfd == -1)
+		return got_error_from_errno("dup");
+
+	if (strcmp(proto, "ssh") == 0 || strcmp(proto, "git+ssh") == 0)
+		fetchfd = got_dial_ssh(host, port, path, "upload");
+	else if (strcmp(proto, "git") == 0)
+		fetchfd = got_dial_git(host, port, path, "upload");
+	else if (strcmp(proto, "http") == 0 || strcmp(proto, "git+http") == 0)
+		err = got_error(GOT_ERR_BAD_PROTO);
+	else
+		err = got_error(GOT_ERR_BAD_PROTO);
+
+	if (fetchfd == -1)
+		err = got_error_from_errno("dial uri");
+	if (socketpair(AF_UNIX, SOCK_STREAM, PF_UNSPEC, imsg_fetchfds) == -1)
+		return got_error_from_errno("socketpair");
+
+	pid = fork();
+	if (pid == -1)
+		return got_error_from_errno("fork");
+	else if (pid == 0){
+		got_privsep_exec_child(imsg_fetchfds, GOT_PATH_PROG_FETCH_PACK, ".");
+	}
+
+	if (close(imsg_fetchfds[1]) != 0)
+		return got_error_from_errno("close");
+	imsg_init(&ibuf, imsg_fetchfds[0]);
+	err = got_privsep_send_fetch_req(&ibuf, fetchfd);
+	if (err != NULL)
+		return err;
+	err = got_privsep_wait_ack(&ibuf);
+	if (err != NULL)
+		return err;
+	err = got_privsep_send_tmpfd(&ibuf, npackfd);
+	if (err != NULL)
+		return err;
+	npackfd = dup(packfd);
+	if (npackfd == -1)
+		return got_error_from_errno("dup");
+	err = got_privsep_wait_fetch_done(&ibuf, &packhash);
+	if (err != NULL)
+		return err;
+	if (waitpid(pid, &status, 0) == -1)
+		return got_error_from_errno("child exit");
+
+	if (socketpair(AF_UNIX, SOCK_STREAM, PF_UNSPEC, imsg_idxfds) == -1)
+		return got_error_from_errno("socketpair");
+	pid = fork();
+	if (pid == -1)
+		return got_error_from_errno("fork");
+	else if (pid == 0)
+		got_privsep_exec_child(imsg_idxfds, GOT_PATH_PROG_INDEX_PACK, ".");
+	if (close(imsg_idxfds[1]) != 0)
+		return got_error_from_errno("close");
+	imsg_init(&ibuf, imsg_idxfds[0]);
+
+	err = got_privsep_send_index_pack_req(&ibuf, npackfd, packhash);
+	if (err != NULL)
+		return err;
+	err = got_privsep_wait_ack(&ibuf);
+	if (err != NULL)
+		return err;
+	err = got_privsep_send_tmpfd(&ibuf, nidxfd);
+	if (err != NULL)
+		return err;
+	err = got_privsep_wait_index_pack_done(&ibuf);
+	if (err != NULL)
+		return err;
+	imsg_clear(&ibuf);
+	if (close(imsg_idxfds[0]) == -1)
+		return got_error_from_errno("close child");
+	if (waitpid(pid, &status, 0) == -1)
+		return got_error_from_errno("child exit");
+
+
+	return NULL;
+
+}
blob - /dev/null
blob + 6ffe7e529b3664b6119e0d4ab2ef31d41644d718 (mode 644)
--- /dev/null
+++ lib/got_lib_fetch.h
@@ -0,0 +1,17 @@
+/*
+ * Copyright (c) 2018, 2019 Ori Bernstein <ori@openbsd.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+const struct got_error* got_clone(char *, char *, char *);
blob - 6ae68d96bfa9ec1cf42dbe4e49500d0ea2c61a89
blob + af18cee80cb335a5dc991b1aeae0c924ccf4016a
--- lib/got_lib_object_idset.h
+++ lib/got_lib_object_idset.h
@@ -1,5 +1,6 @@
 /*
  * Copyright (c) 2018 Stefan Sperling <stsp@openbsd.org>
+ * Copyright (c) 2019 Ori Bernstein <stsp@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -26,6 +27,8 @@ const struct got_error *got_object_idset_remove(void *
     struct got_object_idset *, struct got_object_id *);
 int got_object_idset_contains(struct got_object_idset *,
     struct got_object_id *);
+void *got_object_idset_lookup_data(struct got_object_idset *,
+    struct got_object_id *);
 const struct got_error *got_object_idset_for_each(struct got_object_idset *,
     const struct got_error *(*cb)(struct got_object_id *, void *, void *),
     void *);
blob - f73c2bf8b3f3e83d497b150a9723302b20ff6408
blob + 0c4a043a653118f69c831430705349acaca9bd80
--- lib/got_lib_privsep.h
+++ lib/got_lib_privsep.h
@@ -1,5 +1,6 @@
 /*
  * Copyright (c) 2018, 2019 Stefan Sperling <stsp@openbsd.org>
+ * Copyright (c) 2019, Ori Bernstein <ori@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -42,6 +43,9 @@
 #define GOT_PROG_READ_TAG	got-read-tag
 #define GOT_PROG_READ_PACK	got-read-pack
 #define GOT_PROG_READ_GITCONFIG	got-read-gitconfig
+#define GOT_PROG_FETCH_PACK	got-fetch-pack
+#define GOT_PROG_INDEX_PACK	got-index-pack
+#define GOT_PROG_SEND_PACK	got-send-pack
 
 #define GOT_STRINGIFY(x) #x
 #define GOT_STRINGVAL(x) GOT_STRINGIFY(x)
@@ -61,6 +65,12 @@
 	GOT_STRINGVAL(GOT_LIBEXECDIR) "/" GOT_STRINGVAL(GOT_PROG_READ_PACK)
 #define GOT_PATH_PROG_READ_GITCONFIG \
 	GOT_STRINGVAL(GOT_LIBEXECDIR) "/" GOT_STRINGVAL(GOT_PROG_READ_GITCONFIG)
+#define GOT_PATH_PROG_FETCH_PACK \
+	GOT_STRINGVAL(GOT_LIBEXECDIR) "/" GOT_STRINGVAL(GOT_PROG_FETCH_PACK)
+#define GOT_PATH_PROG_SEND_PACK \
+	GOT_STRINGVAL(GOT_LIBEXECDIR) "/" GOT_STRINGVAL(GOT_PROG_SEND_PACK)
+#define GOT_PATH_PROG_INDEX_PACK \
+	GOT_STRINGVAL(GOT_LIBEXECDIR) "/" GOT_STRINGVAL(GOT_PROG_INDEX_PACK)
 
 struct got_privsep_child {
 	int imsg_fd;
@@ -75,6 +85,9 @@ enum got_imsg_type {
 	/* Stop the child process. */
 	GOT_IMSG_STOP,
 
+	/* We got a message as part of a sequence */
+	GOT_IMSG_ACK,
+
 	/*
 	 * Messages concerned with read access to objects in a repository.
 	 * Object and pack files are opened by the main process, where
@@ -98,6 +111,12 @@ enum got_imsg_type {
 	GOT_IMSG_TAG,
 	GOT_IMSG_TAG_TAGMSG,
 
+	/* Messages related to networking. */
+	GOT_IMSG_FETCH_REQUEST,
+	GOT_IMSG_FETCH_DONE,
+	GOT_IMSG_IDXPACK_REQUEST,
+	GOT_IMSG_IDXPACK_DONE,
+
 	/* Messages related to pack files. */
 	GOT_IMSG_PACKIDX,
 	GOT_IMSG_PACK,
@@ -273,11 +292,14 @@ struct got_pack;
 struct got_packidx;
 struct got_pathlist_head;
 
+const struct got_error *got_send_ack(pid_t);
 const struct got_error *got_privsep_wait_for_child(pid_t);
 const struct got_error *got_privsep_send_stop(int);
 const struct got_error *got_privsep_recv_imsg(struct imsg *, struct imsgbuf *,
     size_t);
 void got_privsep_send_error(struct imsgbuf *, const struct got_error *);
+const struct got_error *got_privsep_send_ack(struct imsgbuf *);
+const struct got_error *got_privsep_wait_ack(struct imsgbuf *);
 const struct got_error *got_privsep_send_obj_req(struct imsgbuf *, int);
 const struct got_error *got_privsep_send_commit_req(struct imsgbuf *, int,
     struct got_object_id *, int);
@@ -291,6 +313,15 @@ const struct got_error *got_privsep_send_blob_outfd(st
 const struct got_error *got_privsep_send_tmpfd(struct imsgbuf *, int);
 const struct got_error *got_privsep_send_obj(struct imsgbuf *,
     struct got_object *);
+const struct got_error *got_privsep_send_index_pack_req(struct imsgbuf *, int,
+    struct got_object_id);
+const struct got_error *got_privsep_send_index_pack_done(struct imsgbuf *);
+const struct got_error *got_privsep_wait_index_pack_done(struct imsgbuf *);
+const struct got_error *got_privsep_send_fetch_req(struct imsgbuf *, int);
+const struct got_error *got_privsep_send_fetch_done(struct imsgbuf *,
+    struct got_object_id);
+const struct got_error *got_privsep_wait_fetch_done(struct imsgbuf *,
+    struct got_object_id*);
 const struct got_error *got_privsep_get_imsg_obj(struct got_object **,
     struct imsg *, struct imsgbuf *);
 const struct got_error *got_privsep_recv_obj(struct got_object **,
blob - 472aaa11edacfa2b14007043174136b80ff00ba9
blob + b72db6aaa7fa5c47899a453ee52a55222314cd79
--- lib/inflate.c
+++ lib/inflate.c
@@ -86,12 +86,16 @@ got_inflate_read(struct got_inflate_buf *zb, FILE *f, 
 	size_t last_total_out = zb->z.total_out;
 	z_stream *z = &zb->z;
 	int ret = Z_ERRNO;
+	off_t off, consumed;
 
 	z->next_out = zb->outbuf;
 	z->avail_out = zb->outlen;
 
 	*outlenp = 0;
+	off = ftello(f);
+	consumed = 0;
 	do {
+		size_t last_total_in = zb->z.total_in;
 		if (z->avail_in == 0) {
 			size_t n = fread(zb->inbuf, 1, zb->inlen, f);
 			if (n == 0) {
@@ -105,6 +109,7 @@ got_inflate_read(struct got_inflate_buf *zb, FILE *f, 
 			z->avail_in = n;
 		}
 		ret = inflate(z, Z_SYNC_FLUSH);
+		consumed += z->total_in - last_total_in;
 	} while (ret == Z_OK && z->avail_out > 0);
 
 	if (ret == Z_OK || ret == Z_BUF_ERROR) {
@@ -116,6 +121,7 @@ got_inflate_read(struct got_inflate_buf *zb, FILE *f, 
 	}
 
 	*outlenp = z->total_out - last_total_out;
+	fseek(f, off + consumed, SEEK_SET);
 	return NULL;
 }
 
blob - ea5232abfd828a7f52894757aaa990fca8c07c9b
blob + 7d2de740418dca59c54252352e0955b9f4d9bd9a
--- lib/object.c
+++ lib/object.c
@@ -51,6 +51,7 @@
 #include "got_lib_object_cache.h"
 #include "got_lib_object_parse.h"
 #include "got_lib_pack.h"
+#include "got_lib_fetch.h"
 #include "got_lib_repository.h"
 
 #ifndef MIN
blob - /dev/null
blob + 4de1da9f601aaf70c7674ea5b42dc2a10ff4f650 (mode 644)
--- /dev/null
+++ lib/index.c
@@ -0,0 +1,108 @@
+/*
+ * Copyright (c) 2018, 2019 Ori Bernstein <ori@eigenstate.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/types.h>
+#include <sys/stat.h>
+#include <sys/queue.h>
+#include <sys/uio.h>
+#include <sys/socket.h>
+#include <sys/wait.h>
+#include <sys/syslimits.h>
+#include <sys/resource.h>
+
+#include <errno.h>
+#include <fcntl.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <stdint.h>
+#include <sha1.h>
+#include <zlib.h>
+#include <ctype.h>
+#include <limits.h>
+#include <imsg.h>
+#include <time.h>
+#include <uuid.h>
+
+#include "got_error.h"
+#include "got_reference.h"
+#include "got_repository.h"
+#include "got_path.h"
+#include "got_cancel.h"
+#include "got_worktree.h"
+#include "got_object.h"
+
+#include "got_lib_delta.h"
+#include "got_lib_inflate.h"
+#include "got_lib_object.h"
+#include "got_lib_object_parse.h"
+#include "got_lib_object_create.h"
+#include "got_lib_pack.h"
+#include "got_lib_sha1.h"
+#include "got_lib_privsep.h"
+#include "got_lib_object_cache.h"
+#include "got_lib_repository.h"
+
+static int
+hassuffix(char *base, char *suf)
+{
+	int nb, ns;
+
+	nb = strlen(base);
+	ns = strlen(suf);
+	if(ns <= nb && strcmp(base + (nb - ns), suf) == 0)
+		return 1;
+	return 0;
+}
+
+static int
+got_make_index_path(char *idxpath, size_t idxpathsz, char *path)
+{
+	size_t len;
+
+	len = strlen(path);
+	if(hassuffix(path, ".pack"))
+		len -= strlen(".pack");
+	if (strlcpy(idxpath, path, idxpathsz) >= idxpathsz)
+		return -1;
+	if (strlcpy(idxpath + len, ".idx", idxpathsz - len) >= idxpathsz - len)
+		return -1;
+	return 0;
+}
+
+const struct got_error*
+got_index_pack(char *path)
+{
+	int packfd, idxfd;
+	char idxpath[PATH_MAX];
+
+	got_make_index_path(idxpath, sizeof(idxpath), path);
+	printf("index path %s\n", idxpath);
+	if ((fd = open(path)) == -1)
+		return got_error_from_errno("open pack");
+
+	pid = fork();
+	if (pid == -1)
+		return got_error_from_errno("fork");
+	else if (pid == 0)
+		got_privsep_exec_child(imsg_fds, GOT_PATH_PROG_INDEX_PACK, ".");
+
+	if (close(imsg_fds[1]) != 0)
+		return got_error_from_errno("close");
+	err = got_privsep_send_index_pack_req(&ibuf, fetchfd);
+	if (err != NULL)
+		return err;
+}
blob - 527383c259fb8d8e90ecf8f6b8efd21fd94a4327
blob + 510b59e911ac900872569b89923df71d5eb9eecf
--- lib/object_idset.c
+++ lib/object_idset.c
@@ -168,6 +168,14 @@ got_object_idset_contains(struct got_object_idset *set
 	return entry ? 1 : 0;
 }
 
+void *
+got_object_idset_lookup_data(struct got_object_idset *set,
+    struct got_object_id *id)
+{
+	struct got_object_idset_element *entry = find_element(set, id);
+	return entry ? entry->data : NULL;
+}
+
 const struct got_error *
 got_object_idset_for_each(struct got_object_idset *set,
     const struct got_error *(*cb)(struct got_object_id *, void *, void *),
blob - 5528473fc4fe3a28a7c2e409b1a9285ce6f4e716
blob + b5ea8d20c9397777b036e28835ffe9f983563ddd
--- lib/privsep.c
+++ lib/privsep.c
@@ -1,5 +1,6 @@
 /*
  * Copyright (c) 2018, 2019, 2020 Stefan Sperling <stsp@openbsd.org>
+ * Copyright (c) 2020 Ori Bernstein <ori@openbsd.org>
  *
  * Permission to use, copy, modify, and distribute this software for any
  * purpose with or without fee is hereby granted, provided that the above
@@ -228,6 +229,31 @@ got_privsep_send_stop(int fd)
 	imsg_clear(&ibuf);
 	return err;
 }
+
+const struct got_error *
+got_privsep_send_ack(struct imsgbuf *ibuf)
+{
+	if (imsg_compose(ibuf, GOT_IMSG_ACK, 0, 0, -1, NULL, 0) == -1)
+		return got_error_from_errno("imsg_compose ACK");
+	return flush_imsg(ibuf);
+}
+
+const struct got_error *
+got_privsep_wait_ack(struct imsgbuf *ibuf)
+{
+	const struct got_error *err = NULL;
+	struct imsg imsg;
+
+	err = got_privsep_recv_imsg(&imsg, ibuf, 0);
+	if (err)
+		return err;
+	if (imsg.hdr.type == GOT_IMSG_ACK && imsg.hdr.len - IMSG_HEADER_SIZE == 0)
+		return NULL;
+	else
+		return got_error(GOT_ERR_PRIVSEP_MSG);
+	imsg_free(&imsg);
+}
+
 
 const struct got_error *
 got_privsep_send_obj_req(struct imsgbuf *ibuf, int fd)
@@ -404,6 +430,85 @@ got_privsep_send_obj(struct imsgbuf *ibuf, struct got_
 }
 
 const struct got_error *
+got_privsep_send_fetch_req(struct imsgbuf *ibuf, int fd)
+{
+	const struct got_error *err = NULL;
+
+	if (imsg_compose(ibuf, GOT_IMSG_FETCH_REQUEST, 0, 0, fd,
+	    NULL, 0) == -1) {
+		err = got_error_from_errno("imsg_compose FETCH_REQUEST");
+		close(fd);
+		return err;
+	}
+	return flush_imsg(ibuf);
+}
+
+const struct got_error *
+got_privsep_send_fetch_done(struct imsgbuf *ibuf, struct got_object_id hash)
+{
+	if (imsg_compose(ibuf, GOT_IMSG_FETCH_DONE, 0, 0, -1,
+	    hash.sha1, SHA1_DIGEST_LENGTH) == -1)
+		return got_error_from_errno("imsg_compose FETCH");
+	return flush_imsg(ibuf);
+}
+
+const struct got_error *
+got_privsep_wait_fetch_done(struct imsgbuf *ibuf, struct got_object_id *hash)
+{
+	const struct got_error *err = NULL;
+	struct imsg imsg;
+
+	err = got_privsep_recv_imsg(&imsg, ibuf, 0);
+	if (err)
+		return err;
+	if (imsg.hdr.type == GOT_IMSG_FETCH_DONE &&
+	    imsg.hdr.len - sizeof(imsg.hdr) == SHA1_DIGEST_LENGTH)
+		return NULL;
+	else
+		return got_error(GOT_ERR_PRIVSEP_MSG);
+	imsg_free(&imsg);
+}
+
+
+const struct got_error *
+got_privsep_send_index_pack_req(struct imsgbuf *ibuf, int fd, struct got_object_id hash)
+{
+	const struct got_error *err = NULL;
+
+	if (imsg_compose(ibuf, GOT_IMSG_IDXPACK_REQUEST, 0, 0, fd,
+	    hash.sha1, SHA1_DIGEST_LENGTH) == -1) {
+		err = got_error_from_errno("imsg_compose INDEX_REQUEST");
+		close(fd);
+		return err;
+	}
+	return flush_imsg(ibuf);
+}
+
+const struct got_error *
+got_privsep_send_index_pack_done(struct imsgbuf *ibuf)
+{
+	if (imsg_compose(ibuf, GOT_IMSG_IDXPACK_DONE, 0, 0, -1, NULL, 0) == -1)
+		return got_error_from_errno("imsg_compose FETCH");
+	return flush_imsg(ibuf);
+}
+
+const struct got_error *
+got_privsep_wait_index_pack_done(struct imsgbuf *ibuf)
+{
+	const struct got_error *err = NULL;
+	struct imsg imsg;
+
+	err = got_privsep_recv_imsg(&imsg, ibuf, 0);
+	if (err)
+		return err;
+	if (imsg.hdr.type == GOT_IMSG_IDXPACK_DONE)
+		return NULL;
+	else
+		return got_error(GOT_ERR_PRIVSEP_MSG);
+	imsg_free(&imsg);
+}
+
+const struct got_error *
 got_privsep_get_imsg_obj(struct got_object **obj, struct imsg *imsg,
     struct imsgbuf *ibuf)
 {
blob - a4c900b7f50d8d643524becc373f46951d405243
blob + 41c5a86903979f5cc3495303157b082ea384ee7f
--- libexec/Makefile
+++ libexec/Makefile
@@ -1,4 +1,5 @@
 SUBDIR = got-read-blob got-read-commit got-read-object got-read-tree \
-	got-read-tag got-read-pack got-read-gitconfig
+	got-read-tag got-fetch-pack got-index-pack got-read-pack \
+	got-read-gitconfig
 
 .include <bsd.subdir.mk>
blob - /dev/null
blob + 7823de67fa57fb34bafd9fa68b43a821a157c101 (mode 644)
--- /dev/null
+++ libexec/got-fetch-pack/Makefile
@@ -0,0 +1,13 @@
+.PATH:${.CURDIR}/../../lib
+
+.include "../../got-version.mk"
+
+PROG=		got-fetch-pack
+SRCS=		got-fetch-pack.c error.c inflate.c object_parse.c \
+		path.c privsep.c sha1.c
+
+CPPFLAGS = -I${.CURDIR}/../../include -I${.CURDIR}/../../lib
+LDADD = -lutil -lz
+DPADD = ${LIBZ} ${LIBUTIL}
+
+.include <bsd.prog.mk>
blob - /dev/null
blob + 8d9608005fc74a2d524f92b5d221a03d4f1992d9 (mode 644)
--- /dev/null
+++ libexec/got-fetch-pack/got-fetch-pack.c
@@ -0,0 +1,466 @@
+/*
+ * Copyright (c) 2019 Ori Bernstein <ori@openbsd.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/types.h>
+#include <sys/queue.h>
+#include <sys/uio.h>
+#include <sys/time.h>
+#include <sys/stat.h>
+#include <sys/syslimits.h>
+
+#include <stdint.h>
+#include <errno.h>
+#include <imsg.h>
+#include <limits.h>
+#include <signal.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <ctype.h>
+#include <sha1.h>
+#include <fcntl.h>
+#include <zlib.h>
+#include <err.h>
+
+#include "got_error.h"
+#include "got_object.h"
+
+#include "got_lib_sha1.h"
+#include "got_lib_delta.h"
+#include "got_lib_inflate.h"
+#include "got_lib_object.h"
+#include "got_lib_object_parse.h"
+#include "got_lib_privsep.h"
+
+#define GOT_PKTMAX	65536
+
+struct got_object *indexed;
+static int chattygit;
+static char *fetchbranch;
+static char *upstream = "origin";
+static char *packtmp = ".git/objects/pack/fetch.tmp";
+static struct got_object_id zhash = {.sha1={0}};
+
+static char*
+strip(char *ref)
+{
+	return ref;
+}
+
+int
+readn(int fd, void *buf, size_t n)
+{
+	ssize_t r, off;
+
+	off = 0;
+	while (off != n) {
+		r = read(fd, buf + off, n - off);
+		if (r < 0)
+			return -1;
+		if (r == 0)
+			return off;
+		off += r;
+	}
+	return off;
+}
+
+int
+flushpkt(int fd)
+{
+	if(chattygit)
+		fprintf(stderr, "writepkt: 0000\n");
+	return write(fd, "0000", 4);
+}
+
+
+int
+readpkt(int fd, char *buf, int nbuf)
+{
+	char len[5];
+	char *e;
+	int n, r;
+
+	if(readn(fd, len, 4) == -1){
+		return -1;
+	}
+	len[4] = 0;
+	n = strtol(len, &e, 16);
+	if(n == 0){
+		if(chattygit)
+			fprintf(stderr, "readpkt: 0000\n");
+		return 0;
+	}
+	if(e != len + 4 || n <= 4)
+		err(1, "invalid packet line length");
+	n  -= 4;
+	if(n >= nbuf)
+		err(1, "buffer too small");
+	if((r = readn(fd, buf, n)) != n)
+		return -1;
+	buf[n] = 0;
+	if(chattygit)
+		fprintf(stderr, "readpkt: %s:\t%.*s\n", len, nbuf, buf);
+	return n;
+}
+
+int
+writepkt(int fd, char *buf, int nbuf)
+{
+	char len[5];
+	int i;
+
+	if (snprintf(len, sizeof(len), "%04x", nbuf + 4) >= sizeof(len))
+		return -1;
+	if(write(fd, len, 4) != 4)
+		return -1;
+	if(write(fd, buf, nbuf) != nbuf)
+		return -1;
+	if(chattygit){
+		fprintf(stderr, "writepkt: %s:\t", len);
+		fwrite(buf, 1, nbuf, stderr);
+		for(i = 0; i < nbuf; i++){
+			if(isprint(buf[i]))
+				fputc(buf[i], stderr);
+		}
+	}
+	return 0;
+}
+
+
+int
+got_resolve_remote_ref(struct got_object_id *id, char *ref)
+{
+	char buf[128], *s;
+	int r, f;
+
+	ref = strip(ref);
+	if(!got_parse_sha1_digest(id->sha1, ref))
+		return 0;
+
+	/* Slightly special handling: translate remote refs to local ones. */
+	if (strcmp(ref, "HEAD") == 0) {
+		if(snprintf(buf, sizeof(buf), ".git/HEAD") >= sizeof(buf))
+			return -1;
+	} else if(strstr(ref, "refs/heads") == ref) {
+		ref += strlen("refs/heads");
+		if(snprintf(buf, sizeof(buf),
+		    ".git/refs/remotes/%s/%s", upstream, ref) >= sizeof(buf))
+			return -1;
+	} else if(strstr(ref, "refs/tags") == ref) {
+		ref += strlen("refs/tags");
+		if(snprintf(buf, sizeof(buf),
+		    ".git/refs/tags/%s/%s", upstream, ref) >= sizeof(buf))
+			return -1;
+	} else {
+		return -1;
+	}
+
+	r = -1;
+	s = strip(buf);
+	if((f = open(s, O_RDONLY)) == -1)
+		goto err;
+	if(readn(f, buf, sizeof(buf)) < 40)
+		goto err;
+	if(!got_parse_sha1_digest(id->sha1, buf))
+		goto err;
+err:
+	close(f);
+	if(r == -1 && strstr(buf, "ref:") == buf)
+		return got_resolve_remote_ref(id, buf + strlen("ref:"));
+	return r;
+}
+
+static int
+got_check_pack_hash(int fd, size_t sz, uint8_t *hcomp)
+{
+	SHA1_CTX ctx;
+	uint8_t hexpect[SHA1_DIGEST_LENGTH];
+	char s1[SHA1_DIGEST_STRING_LENGTH + 1];
+	char s2[SHA1_DIGEST_STRING_LENGTH + 1];
+	uint8_t buf[32*1024];
+	ssize_t n, r, nr;
+
+	if(sz < 28)
+		return -1;
+
+	n = 0;
+	SHA1Init(&ctx);
+	while(n < sz - 20){
+		nr = sizeof(buf);
+		if(sz - n - 20 < sizeof(buf))
+			nr = sz - n - 20;
+		r = readn(fd, buf, nr);
+		if(r != nr)
+			return -1;
+		SHA1Update(&ctx, buf, nr);
+		n += r;
+	}
+	SHA1Final(hcomp, &ctx);
+
+	if(readn(fd, hexpect, sizeof(hexpect)) != sizeof(hexpect))
+		errx(1, "truncated packfile");
+	if(memcmp(hcomp, hexpect, SHA1_DIGEST_LENGTH) != 0){
+		got_sha1_digest_to_str(hcomp, s1, sizeof(s1));
+		got_sha1_digest_to_str(hexpect, s2, sizeof(s2));
+		printf("hash mismatch %s != %s\n", s1, s2);
+		return -1;
+	}
+	return 0;
+}
+
+int
+got_has_object(struct got_object_id *obj)
+{
+	return 0;
+}
+
+/*static */int
+got_make_pack_dir(char *path)
+{
+	char s[128];
+	char *p;
+
+	if(snprintf(s, sizeof(s), "%s", path) >= sizeof(s))
+		return -1;
+	for(p=strchr(s+1, '/'); p; p=strchr(p+1, '/')){
+		*p = 0;
+		if (mkdir(s, 0755) == -1)
+			if(errno != EEXIST)
+				return -1;
+		*p = '/';
+	}
+	return 0;
+}
+
+static int
+got_match_branch(char *br, char *pat)
+{
+	char name[128];
+
+	if(strstr(pat, "refs/heads") == pat) {
+		if (snprintf(name, sizeof(name), "%s", pat) >= sizeof(name))
+			return -1;
+	} else if(strstr(pat, "heads")) {
+		if (snprintf(name, sizeof(name), "refs/%s", pat) >= sizeof(name))
+			return -1;
+	} else {
+		if (snprintf(name, sizeof(name), "refs/heads/%s", pat) >= sizeof(name))
+			return -1;
+	}
+	return strcmp(br, name) == 0;
+}
+
+static int
+got_tokenize_refline(char *line, char **sp, size_t nsp)
+{
+	char *p;
+	size_t i, j;
+
+	for (i = 0; i < nsp; i++) {
+		while (isspace(*line))
+			line++;
+		p = line;
+		while (*line != '\0' && (!isspace(*line) || i == nsp - 1))
+			line++;
+		sp[i] = strndup(p, line - p);
+	}
+	for (j = i; j < nsp; j++)
+		sp[j] = NULL;
+	return i;
+}
+
+static int
+got_fetch_pack(int fd, int packfd, char *packtmp, struct got_object_id *packid)
+{
+	char buf[GOT_PKTMAX], idxtmp[256], *sp[3];
+	char hashstr[SHA1_DIGEST_STRING_LENGTH];
+	struct got_object_id *have, *want;
+	int nref, refsz;
+	int i, n, req;
+	off_t packsz;
+
+	nref = 0;
+	refsz = 16;
+	have = malloc(refsz * sizeof(have[0]));
+	if(have == NULL)
+		err(1, "malloc packs");
+	want = malloc(refsz * sizeof(want[0]));
+	if(want == NULL)
+		err(1, "malloc packs");
+	if(chattygit)
+		fprintf(stderr, "starting fetch\n");
+	while(1){
+		n = readpkt(fd, buf, sizeof(buf));
+		if(n == -1){
+			err(1, "readpkt:");
+			return -1;
+		}
+		if(n == 0)
+			break;
+		if(strncmp(buf, "ERR ", 4) == 0)
+			err(1, "%s", buf + 4);
+		if(got_tokenize_refline(buf, sp, 3) <= 2)
+			err(1, "malformed ref line");
+		if(strstr(sp[1], "^{}"))
+			continue;
+		if(fetchbranch && !got_match_branch(sp[1], fetchbranch))
+			continue;
+		if(refsz == nref + 1){
+			refsz *= 2;
+			have = realloc(have, refsz * sizeof(have[0]));
+			if (have == NULL)
+				err(1, "realloc have");
+			want = realloc(want, refsz * sizeof(want[0]));
+			if (want == NULL)
+				err(1, "realloc want");
+		}
+		if(!got_parse_sha1_digest(want[nref].sha1, sp[0]))
+			errx(1, "invalid hash %s", sp[0]);
+		if (got_resolve_remote_ref(&have[nref], sp[1]) == -1)
+			memset(&have[nref], 0, sizeof(have[nref]));
+		// TODO: send IMSG with progress.
+		if (chattygit)
+			fprintf(stderr, "remote %s\n", sp[1]);
+		nref++;
+	}
+
+	req = 0;
+	for(i = 0; i < nref; i++){
+		if (got_object_id_cmp(&have[i], &want[i]) == 0)
+			continue;
+		if (got_has_object(&want[i]))
+			continue;
+		got_sha1_digest_to_str(want[i].sha1, hashstr, sizeof(hashstr));
+		n = snprintf(buf, sizeof(buf), "want %s\n", hashstr);
+		if (n >= sizeof(buf))
+			errx(1, "undersized buffer");
+		if(writepkt(fd, buf, n) == -1)
+			errx(1, "could not send want");
+		req = 1;
+	}
+	flushpkt(fd);
+	for(i = 0; i < nref; i++){
+		if (got_object_id_cmp(&have[i], &zhash) == 0)
+			continue;
+		got_sha1_digest_to_str(want[i].sha1, hashstr, sizeof(hashstr));
+		n = snprintf(buf, sizeof(buf), "have %s\n", hashstr);
+		if (n >= sizeof(buf))
+			errx(1, "undersized buffer");
+		if (writepkt(fd, buf, n + 1) == -1)
+			errx(1, "could not send have");
+	}
+	if(!req){
+		fprintf(stderr, "up to date\n");
+		flushpkt(fd);
+	}
+	n = snprintf(buf, sizeof(buf), "done\n");
+	if(writepkt(fd, buf, n) == -1)
+		errx(1, "lost connection write");
+	if(!req)
+		return 0;
+
+	if((n = readpkt(fd, buf, sizeof(buf))) == -1)
+		errx(1, "lost connection read");
+	buf[n] = 0;
+
+	fprintf(stderr, "fetching...\n");
+	packsz = 0;
+	while(1){
+		n = readn(fd, buf, sizeof buf);
+		if(n == 0)
+			break;
+		if(n == -1 || write(packfd, buf, n) != n)
+			err(1, "could not fetch packfile:");
+		packsz += n;
+	}
+	if(lseek(packfd, 0, SEEK_SET) == -1)
+		err(1, "packfile seek:");
+	if(got_check_pack_hash(packfd, packsz, packid->sha1) == -1)
+		errx(1, "corrupt packfile");
+	close(packfd);
+	n = strlen(packtmp) - strlen(".tmp");
+	memcpy(idxtmp, packtmp, n);
+	memcpy(idxtmp + n, ".idx", strlen(".idx") + 1);
+	return 0;
+}
+
+
+int
+main(int argc, char **argv)
+{
+	const struct got_error *err = NULL;
+	int fetchfd, packfd;
+	struct got_object_id packid;
+	struct imsgbuf ibuf;
+	struct imsg imsg;
+
+	if(getenv("GOT_DEBUG") != NULL){
+		fprintf(stderr, "fetch-pack being chatty!\n");
+		chattygit = 1;
+	}
+
+	imsg_init(&ibuf, GOT_IMSG_FD_CHILD);
+	if((err = got_privsep_recv_imsg(&imsg, &ibuf, 0)) != 0) {
+		if (err->code == GOT_ERR_PRIVSEP_PIPE)
+			err = NULL;
+		goto done;
+	}
+	if (imsg.hdr.type == GOT_IMSG_STOP)
+		goto done;
+	if (imsg.hdr.type != GOT_IMSG_FETCH_REQUEST) {
+		err = got_error(GOT_ERR_PRIVSEP_MSG);
+		goto done;
+	}
+	if (imsg.hdr.len - IMSG_HEADER_SIZE != 0) {
+		err = got_error(GOT_ERR_PRIVSEP_LEN);
+		goto done;
+	}
+	fetchfd = imsg.fd;
+	got_privsep_send_ack(&ibuf);
+
+	if((err = got_privsep_recv_imsg(&imsg, &ibuf, 0)) != 0) {
+		if (err->code == GOT_ERR_PRIVSEP_PIPE)
+			err = NULL;
+		goto done;
+	}
+	if (imsg.hdr.type == GOT_IMSG_STOP)
+		goto done;
+	if (imsg.hdr.type != GOT_IMSG_TMPFD) {
+		err = got_error(GOT_ERR_PRIVSEP_MSG);
+		goto done;
+	}
+	if (imsg.hdr.len - IMSG_HEADER_SIZE != 0) {
+		err = got_error(GOT_ERR_PRIVSEP_LEN);
+		goto done;
+	}
+	packfd = imsg.fd;
+
+	if(got_fetch_pack(fetchfd, packfd, packtmp, &packid) == -1) {
+		err = got_error(GOT_ERR_FETCH_FAILED);
+		goto done;
+	}
+done:
+	if(err != NULL)
+		got_privsep_send_error(&ibuf, err);
+	else
+		err = got_privsep_send_fetch_done(&ibuf, packid);
+	if(err != NULL) {
+		fprintf(stderr, "%s: %s\n", getprogname(), err->msg);
+		got_privsep_send_error(&ibuf, err);
+	}
+
+	exit(0);
+}
blob - /dev/null
blob + fcaafeb345feccfcee8a0a7445de7b1a800b1e47 (mode 644)
--- /dev/null
+++ libexec/got-index-pack/Makefile
@@ -0,0 +1,13 @@
+.PATH:${.CURDIR}/../../lib
+
+.include "../../got-version.mk"
+
+PROG=		got-index-pack
+SRCS=		got-index-pack.c error.c inflate.c object_parse.c object_idset.c \
+		path.c privsep.c sha1.c
+
+CPPFLAGS = -I${.CURDIR}/../../include -I${.CURDIR}/../../lib
+LDADD = -lutil -lz
+DPADD = ${LIBZ} ${LIBUTIL}
+
+.include <bsd.prog.mk>
blob - /dev/null
blob + c000f2cb994a50009b3495de8cf361532742b517 (mode 644)
--- /dev/null
+++ libexec/got-index-pack/got-index-pack.c
@@ -0,0 +1,1270 @@
+/*
+ * Copyright (c) 2019 Ori Bernstein <ori@openbsd.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/queue.h>
+#include <sys/stat.h>
+#include <sys/syslimits.h>
+#include <sys/time.h>
+#include <sys/types.h>
+#include <sys/uio.h>
+
+#include <stdint.h>
+#include <errno.h>
+#include <imsg.h>
+#include <limits.h>
+#include <signal.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <ctype.h>
+#include <sha1.h>
+#include <fcntl.h>
+#include <zlib.h>
+#include <err.h>
+#include <assert.h>
+#include <dirent.h>
+
+#include "got_error.h"
+#include "got_object.h"
+
+#include "got_lib_sha1.h"
+#include "got_lib_delta.h"
+#include "got_lib_inflate.h"
+#include "got_lib_object.h"
+#include "got_lib_object_parse.h"
+#include "got_lib_object_idset.h"
+#include "got_lib_privsep.h"
+
+typedef struct Cinfo	Cinfo;
+typedef struct Tinfo	Tinfo;
+typedef struct Object	Object;
+typedef struct Pack	Pack;
+typedef struct Buf	Buf;
+typedef struct Dirent	Dirent;
+typedef struct Idxent	Idxent;
+typedef struct Ols	Ols;
+
+enum {
+	/* 5k objects should be enough */
+	Cachemax	= 5*1024,
+	Pathmax		= 512,
+	Hashsz		= 20,
+	Pktmax		= 65536,
+
+	Nproto	= 16,
+	Nport	= 16,
+	Nhost	= 256,
+	Npath	= 128,
+	Nrepo	= 64,
+	Nbranch	= 32,
+};
+
+typedef enum Type {
+	GNone	= 0,
+	GCommit	= 1,
+	GTree	= 2,
+	GBlob	= 3,
+	GTag	= 4,
+	GOdelta	= 6,
+	GRdelta	= 7,
+} Type;
+
+enum {
+	Cloaded	= 1 << 0,
+	Cidx	= 1 << 1,
+	Ccache	= 1 << 2,
+	Cexist	= 1 << 3,
+	Cparsed	= 1 << 5,
+};
+
+struct Dirent {
+	char *name;
+	int modref;
+	int mode;
+	struct got_object_id h;
+};
+
+struct Object {
+	/* Git data */
+	struct got_object_id	hash;
+	Type	type;
+
+	/* Cache */
+	int	id;
+	int	flag;
+	int	refs;
+	Object	*next;
+	Object	*prev;
+
+	/* For indexing */
+	off_t	off;
+	off_t	len;
+	uint32_t	crc;
+
+	/* Everything below here gets cleared */
+	char	*all;
+	char	*data;
+	/* size excludes header */
+	off_t	size;
+
+	union {
+		Cinfo *commit;
+		Tinfo *tree;
+	};
+};
+
+struct Tinfo {
+	/* Tree */
+	Dirent	*ent;
+	int	nent;
+};
+
+struct Cinfo {
+	/* Commit */
+	struct got_object_id	*parent;
+	int	nparent;
+	struct got_object_id	tree;
+	char	*author;
+	char	*committer;
+	char	*msg;
+	int	nmsg;
+	off_t	ctime;
+	off_t	mtime;
+};
+
+typedef struct Buf Buf;
+
+struct Buf {
+	int len;
+	int sz;
+	char *data;
+};
+
+static int	readpacked(FILE *, Object *, int);
+static Object	*readidxobject(FILE *, struct got_object_id, int);
+
+struct got_object_idset *objcache;
+int	next_object_id;
+Object *lruhead;
+Object *lrutail;
+int	ncache;
+
+#define GETBE16(b)\
+		((((b)[0] & 0xFFul) <<  8) | \
+		 (((b)[1] & 0xFFul) <<  0))
+
+#define GETBE32(b)\
+		((((b)[0] & 0xFFul) << 24) | \
+		 (((b)[1] & 0xFFul) << 16) | \
+		 (((b)[2] & 0xFFul) <<  8) | \
+		 (((b)[3] & 0xFFul) <<  0))
+#define GETBE64(b)\
+		((((b)[0] & 0xFFull) << 56) | \
+		 (((b)[1] & 0xFFull) << 48) | \
+		 (((b)[2] & 0xFFull) << 40) | \
+		 (((b)[3] & 0xFFull) << 32) | \
+		 (((b)[4] & 0xFFull) << 24) | \
+		 (((b)[5] & 0xFFull) << 16) | \
+		 (((b)[6] & 0xFFull) <<  8) | \
+		 (((b)[7] & 0xFFull) <<  0))
+
+#define PUTBE16(b, n)\
+	do{ \
+		(b)[0] = (n) >> 8; \
+		(b)[1] = (n) >> 0; \
+	} while(0)
+
+#define PUTBE32(b, n)\
+	do{ \
+		(b)[0] = (n) >> 24; \
+		(b)[1] = (n) >> 16; \
+		(b)[2] = (n) >> 8; \
+		(b)[3] = (n) >> 0; \
+	} while(0)
+
+#define PUTBE64(b, n)\
+	do{ \
+		(b)[0] = (n) >> 56; \
+		(b)[1] = (n) >> 48; \
+		(b)[2] = (n) >> 40; \
+		(b)[3] = (n) >> 32; \
+		(b)[4] = (n) >> 24; \
+		(b)[5] = (n) >> 16; \
+		(b)[6] = (n) >> 8; \
+		(b)[7] = (n) >> 0; \
+	} while(0)
+
+static int
+charval(int c, int *err)
+{
+	if(c >= '0' && c <= '9')
+		return c - '0';
+	if(c >= 'a' && c <= 'f')
+		return c - 'a' + 10;
+	if(c >= 'A' && c <= 'F')
+		return c - 'A' + 10;
+	*err = 1;
+	return -1;
+}
+
+static int
+hparse(struct got_object_id *h, char *b)
+{
+	int i, err;
+
+	err = 0;
+	for(i = 0; i < sizeof(h->sha1); i++){
+		err = 0;
+		h->sha1[i] = 0;
+		h->sha1[i] |= ((charval(b[2*i], &err) & 0xf) << 4);
+		h->sha1[i] |= ((charval(b[2*i+1], &err)& 0xf) << 0);
+		if(err)
+			return -1;
+	}
+	return 0;
+}
+
+static void *
+emalloc(size_t n)
+{
+	void *v;
+
+	v = calloc(n, 1);
+	if(v == NULL)
+		err(1, "malloc:");
+	return v;
+}
+
+static void *
+erealloc(void *p, ulong n)
+{
+	void *v;
+
+	v = realloc(p, n);
+	if(v == NULL)
+		err(1, "realloc:");
+	memset(v, 0, n);
+	return v;
+}
+
+static int
+hasheq(struct got_object_id *a, struct got_object_id *b)
+{
+	return memcmp(a->sha1, b->sha1, sizeof(a->sha1)) == 0;
+}
+
+static char *
+typestr(int t)
+{
+	char *types[] = {
+		"???",
+		"commit",
+		"tree",
+		"blob",
+		"tag",
+		"odelta",
+		"rdelta",
+	};
+	if (t < 0 || t >= sizeof(types)/sizeof(types[0]))
+		abort();
+	return types[t];
+}
+
+static char *
+hashfmt(char *out, size_t nout, struct got_object_id *h)
+{
+	int i, n, c0, c1;
+	char *p;
+
+	if (nout < 2*sizeof(h->sha1) + 1)
+		return NULL;
+	p = out;
+	for(i = 0; i < sizeof(h->sha1); i++){
+		n = (h->sha1[i] >> 4) & 0xf;
+		c0 = (n >= 10) ? n-10 + 'a' : n + '0';
+		n = h->sha1[i] & 0xf;
+		c1 = (n >= 10) ? n-10 + 'a' : n + '0';
+		*p++ = c0;
+		*p++ = c1;
+	}
+	*p++ = 0;
+	return out;
+}
+
+static void
+clear(Object *o)
+{
+	if(!o)
+		return;
+
+	assert(o->refs == 0);
+	assert((o->flag & Ccache) == 0);
+	assert(o->flag & Cloaded);
+	switch(o->type){
+	case GCommit:
+		if(!o->commit)
+			break;
+		free(o->commit->parent);
+		free(o->commit->author);
+		free(o->commit->committer);
+		free(o->commit);
+		o->commit = NULL;
+		break;
+	case GTree:
+		if(!o->tree)
+			break;
+		free(o->tree->ent);
+		free(o->tree);
+		o->tree = NULL;
+		break;
+	default:
+		break;
+	}
+
+	free(o->all);
+	o->all = NULL;
+	o->data = NULL;
+	o->flag &= ~Cloaded;
+}
+
+static void
+unref(Object *o)
+{
+	if(!o)
+		return;
+	o->refs--;
+	if(!o->refs)
+		clear(o);
+}
+
+static Object*
+ref(Object *o)
+{
+	o->refs++;
+	return o;
+}
+
+static void
+cache(Object *o)
+{
+	char buf[41];
+	Object *p;
+
+	hashfmt(buf, sizeof(buf), &o->hash);
+	if(o == lruhead)
+		return;
+	if(o == lrutail)
+		lrutail = lrutail->prev;
+	if(!(o->flag & Cexist)){
+		got_object_idset_add(objcache, &o->hash, o);
+		o->id = next_object_id++;
+		o->flag |= Cexist;
+	}
+	if(o->prev)
+		o->prev->next = o->next;
+	if(o->next)
+		o->next->prev = o->prev;
+	if(lrutail == o){
+		lrutail = o->prev;
+		lrutail->next = NULL;
+	}else if(!lrutail)
+		lrutail = o;
+	if(lruhead)
+		lruhead->prev = o;
+	o->next = lruhead;
+	o->prev = NULL;
+	lruhead = o;
+
+	if(!(o->flag & Ccache)){
+		o->flag |= Ccache;
+		ref(o);
+		ncache++;
+	}
+	while(ncache > Cachemax){
+		p = lrutail;
+		lrutail = p->prev;
+		lrutail->next = NULL;
+		p->flag &= ~Ccache;
+		p->prev = NULL;
+		p->next = NULL;
+		unref(p);
+		ncache--;
+	}
+}
+
+static int
+preadbe32(FILE *b, int *v, off_t off)
+{
+	char buf[4];
+
+	if(fseek(b, off, 0) == -1)
+		return -1;
+	if(fread(buf, 1, sizeof(buf), b) == -1)
+		return -1;
+	*v = GETBE32(buf);
+
+	return 0;
+}
+static int
+preadbe64(FILE *b, off_t *v, off_t off)
+{
+	char buf[8];
+
+	if(fseek(b, off, 0) == -1)
+		return -1;
+	if(fread(buf, 1, sizeof(buf), b) == -1)
+		return -1;
+	*v = GETBE64(buf);
+	return 0;
+}
+
+static int
+readvint(char *p, char **pp)
+{
+	int i, n, c;
+
+	i = 0;
+	n = 0;
+	do {
+		c = *p++;
+		n |= (c & 0x7f) << i;
+		i += 7;
+	} while (c & 0x80);
+	*pp = p;
+
+	return n;
+}
+
+static int
+applydelta(Object *dst, Object *base, char *d, int nd)
+{
+	char *r, *b, *ed, *er;
+	int n, nr, c;
+	off_t o, l;
+
+	ed = d + nd;
+	b = base->data;
+	n = readvint(d, &d);
+	if(n != base->size){
+		fprintf(stderr, "mismatched source size");
+		return -1;
+	}
+
+	nr = readvint(d, &d);
+	r = emalloc(nr + 64);
+	n = snprintf(r, 64, "%s %d", typestr(base->type), nr) + 1;
+	dst->all = r;
+	dst->type = base->type;
+	dst->data = r + n;
+	dst->size = nr;
+	er = dst->data + nr;
+	r = dst->data;
+
+	while(1){
+		if(d == ed)
+			break;
+		c = *d++;
+		if(!c){
+			fprintf(stderr, "bad delta encoding");
+			return -1;
+		}
+		/* copy from base */
+		if(c & 0x80){
+			o = 0;
+			l = 0;
+			/* Offset in base */
+			if(c & 0x01 && d != ed) o |= (*d++ <<  0) & 0x000000ff;
+			if(c & 0x02 && d != ed) o |= (*d++ <<  8) & 0x0000ff00;
+			if(c & 0x04 && d != ed) o |= (*d++ << 16) & 0x00ff0000;
+			if(c & 0x08 && d != ed) o |= (*d++ << 24) & 0xff000000;
+
+			/* Length to copy */
+			if(c & 0x10 && d != ed) l |= (*d++ <<  0) & 0x0000ff;
+			if(c & 0x20 && d != ed) l |= (*d++ <<  8) & 0x00ff00;
+			if(c & 0x40 && d != ed) l |= (*d++ << 16) & 0xff0000;
+			if(l == 0) l = 0x10000;
+
+			assert(o + l <= base->size);
+			memmove(r, b + o, l);
+			r += l;
+		/* inline data */
+		}else{
+			memmove(r, d, c);
+			d += c;
+			r += c;
+		}
+
+	}
+	if(r != er){
+		fprintf(stderr, "truncated delta (%zd)", er - r);
+		return -1;
+	}
+
+	return nr;
+}
+
+static int
+readrdelta(FILE *f, Object *o, int nd, int flag)
+{
+	const struct got_error *e;
+	struct got_object_id h;
+	Object *b;
+	uint8_t *d;
+	size_t n;
+
+	d = NULL;
+	if(fread(h.sha1, 1, sizeof(h.sha1), f) != sizeof(h.sha1))
+		goto error;
+	if(hasheq(&o->hash, &h))
+		goto error;
+	if ((e = got_inflate_to_mem(&d, &n, f)) != NULL)
+		goto error;
+	o->len = ftello(f) - o->off;
+	if(d == NULL || n != nd)
+		goto error;
+	if((b = readidxobject(f, h, flag)) == NULL)
+		goto error;
+	if(applydelta(o, b, d, n) == -1)
+		goto error;
+	free(d);
+	return 0;
+error:
+	free(d);
+	return -1;
+}
+
+static int
+readodelta(FILE *f, Object *o, off_t nd, off_t p, int flag)
+{
+	Object b;
+	uint8_t *d;
+	off_t r;
+	size_t n;
+	int c;
+
+	r = 0;
+	d = NULL;
+	while(1){
+		if((c = fgetc(f)) == -1)
+			goto error;
+		r |= c & 0x7f;
+		if (!(c & 0x80))
+			break;
+		r++;
+		r <<= 7;
+	}while(c & 0x80);
+
+	if(r > p){
+		fprintf(stderr, "junk offset -%lld (from %lld)", r, p);
+		goto error;
+	}
+
+	if (got_inflate_to_mem(&d, &n, f) == NULL)
+		goto error;
+	o->len = ftello(f) - o->off;
+	if(d == NULL || n != nd)
+		goto error;
+	if(fseek(f, p - r, 0) == -1)
+		goto error;
+	if(readpacked(f, &b, flag) == -1)
+		goto error;
+	if(applydelta(o, &b, d, nd) == -1)
+		goto error;
+	free(d);
+	return 0;
+error:
+	free(d);
+	return -1;
+}
+
+static int
+readpacked(FILE *f, Object *o, int flag)
+{
+	const struct got_error *e;
+	int c, s, n;
+	off_t l, p;
+	size_t ndata;
+	uint8_t *data;
+	Type t;
+	Buf b;
+
+	p = ftello(f);
+	c = fgetc(f);
+	if(c == -1)
+		return -1;
+	l = c & 0xf;
+	s = 4;
+	t = (c >> 4) & 0x7;
+	if(!t){
+		fprintf(stderr, "unknown type for byte %x", c);
+		return -1;
+	}
+	while(c & 0x80){
+		if((c = fgetc(f)) == -1)
+			return -1;
+		l |= (c & 0x7f) << s;
+		s += 7;
+	}
+
+	switch(t){
+	default:
+		fprintf(stderr, "invalid object at %lld", ftello(f));
+		return -1;
+	case GCommit:
+	case GTree:
+	case GTag:
+	case GBlob:
+		b.sz = 64 + l;
+
+		b.data = emalloc(b.sz);
+		n = snprintf(b.data, 64, "%s %lld", typestr(t), l) + 1;
+		b.len = n;
+		e = got_inflate_to_mem(&data, &ndata, f);
+		if (e != NULL || n + ndata >= b.sz) {
+			free(b.data);
+			return -1;
+		}
+		memcpy(b.data + n, data, ndata);
+		o->len = ftello(f) - o->off;
+		o->type = t;
+		o->all = b.data;
+		o->data = b.data + n;
+		o->size = ndata;
+		free(data);
+		break;
+	case GOdelta:
+		if(readodelta(f, o, l, p, flag) == -1)
+			return -1;
+		break;
+	case GRdelta:
+		if(readrdelta(f, o, l, flag) == -1)
+			return -1;
+		break;
+	}
+	o->flag |= Cloaded|flag;
+	return 0;
+}
+
+static int
+readloose(FILE *f, Object *o, int flag)
+{
+	struct { char *tag; int type; } *p, types[] = {
+		{"blob", GBlob},
+		{"tree", GTree},
+		{"commit", GCommit},
+		{"tag", GTag},
+		{NULL},
+	};
+	char *s, *e;
+	uint8_t *d;
+	off_t sz;
+	size_t n;
+	int l;
+
+	if (got_inflate_to_mem(&d, &n, f) != NULL)
+		return -1;
+
+	s = (char *)d;
+	o->type = GNone;
+	for(p = types; p->tag; p++){
+		l = strlen(p->tag);
+		if(strncmp(s, p->tag, l) == 0){
+			s += l;
+			o->type = p->type;
+			while(!isspace(*s))
+				s++;
+			break;
+		}
+	}
+	if(o->type == GNone){
+		free(o->data);
+		return -1;
+	}
+	sz = strtol(s, &e, 0);
+	if(e == s || *e++ != 0){
+		fprintf(stderr, "malformed object header");
+		goto error;
+	}
+	if(sz != n - (e - (char *)d)){
+		fprintf(stderr, "mismatched sizes");
+		goto error;
+	}
+	o->size = sz;
+	o->data = e;
+	o->all = d;
+	o->flag |= Cloaded|flag;
+	return 0;
+
+error:
+	free(d);
+	return -1;
+}
+
+static off_t
+searchindex(FILE *f, struct got_object_id h)
+{
+	int lo, hi, idx, i, nent;
+	off_t o, oo;
+	struct got_object_id hh;
+
+	o = 8;
+	/*
+	 * Read the fanout table. The fanout table
+	 * contains 256 entries, corresponsding to
+	 * the first byte of the hash. Each entry
+	 * is a 4 byte big endian integer, containing
+	 * the total number of entries with a leading
+	 * byte <= the table index, allowing us to
+	 * rapidly do a binary search on them.
+	 */
+	if (h.sha1[0] == 0){
+		lo = 0;
+		if(preadbe32(f, &hi, o) == -1)
+			goto err;
+	} else {
+		o += h.sha1[0]*4 - 4;
+		if(preadbe32(f, &lo, o + 0) == -1)
+			goto err;
+		if(preadbe32(f, &hi, o + 4) == -1)
+			goto err;
+	}
+	if(hi == lo)
+		goto notfound;
+	if(preadbe32(f, &nent, 8 + 255*4) == -1)
+		goto err;
+
+	/*
+	 * Now that we know the range of hashes that the
+	 * entry may exist in, read them in so we can do
+	 * a bsearch.
+	 */
+	idx = -1;
+	fseek(f, Hashsz*lo + 8 + 256*4, 0);
+	for(i = 0; i < hi - lo; i++){
+		if(fread(hh.sha1, 1, sizeof(hh.sha1), f) == -1)
+			goto err;
+		if(hasheq(&hh, &h))
+			idx = lo + i;
+	}
+	if(idx == -1)
+		goto notfound;
+
+
+	/*
+	 * We found the entry. If it's 32 bits, then we
+	 * can just return the oset, otherwise the 32
+	 * bit entry contains the oset to the 64 bit
+	 * entry.
+	 */
+	oo = 8;			/* Header */
+	oo += 256*4;		/* Fanout table */
+	oo += Hashsz*nent;	/* Hashes */
+	oo += 4*nent;		/* Checksums */
+	oo += 4*idx;		/* Offset offset */
+	if(preadbe32(f, &i, oo) == -1)
+		goto err;
+	o = i & 0xffffffff;
+	if(o & (1ull << 31)){
+		o &= 0x7fffffff;
+		if(preadbe64(f, &o, o) == -1)
+			goto err;
+	}
+	return o;
+
+err:
+	fprintf(stderr, "unable to read packfile\n");
+	return -1;
+notfound:
+	{
+		char hstr[41];
+		hashfmt(hstr, sizeof(hstr), &h);
+		fprintf(stdout, "could not find object %s\n", hstr);
+	}
+	return -1;
+}
+
+/*
+ * Scans for non-empty word, copying it into buf.
+ * Strips off word, leading, and trailing space
+ * from input.
+ *
+ * Returns -1 on empty string or error, leaving
+ * input unmodified.
+ */
+static int
+scanword(char **str, int *nstr, char *buf, int nbuf)
+{
+	char *p;
+	int n, r;
+
+	r = -1;
+	p = *str;
+	n = *nstr;
+	while(n && isblank(*p)){
+		n--;
+		p++;
+	}
+
+	for(; n && *p && !isspace(*p); p++, n--){
+		r = 0;
+		*buf++ = *p;
+		nbuf--;
+		if(nbuf == 0)
+			return -1;
+	}
+	while(n && isblank(*p)){
+		n--;
+		p++;
+	}
+	*buf = 0;
+	*str = p;
+	*nstr = n;
+	return r;
+}
+
+static void
+nextline(char **str, int *nstr)
+{
+	char *s;
+
+	if((s = strchr(*str, '\n')) != NULL){
+		*nstr -= s - *str + 1;
+		*str = s + 1;
+	}
+}
+
+static int
+parseauthor(char **str, int *nstr, char **name, off_t *time)
+{
+	return 0;
+}
+
+static void
+parsecommit(Object *o)
+{
+	char *p, *t, buf[128];
+	int np;
+
+	p = o->data;
+	np = o->size;
+	o->commit = emalloc(sizeof(Cinfo));
+	while(1){
+		if(scanword(&p, &np, buf, sizeof(buf)) == -1)
+			break;
+		if(strcmp(buf, "tree") == 0){
+			if(scanword(&p, &np, buf, sizeof(buf)) == -1)
+				errx(1, "invalid commit: tree missing");
+			if(hparse(&o->commit->tree, buf) == -1)
+				errx(1, "invalid commit: garbled tree");
+		}else if(strcmp(buf, "parent") == 0){
+			if(scanword(&p, &np, buf, sizeof(buf)) == -1)
+				errx(1, "invalid commit: missing parent");
+			o->commit->parent = realloc(o->commit->parent, ++o->commit->nparent * sizeof(struct got_object_id));
+			if(!o->commit->parent)
+				err(1, "unable to malloc: ");
+			if(hparse(&o->commit->parent[o->commit->nparent - 1], buf) == -1)
+				errx(1, "invalid commit: garbled parent");
+		}else if(strcmp(buf, "author") == 0){
+			parseauthor(&p, &np, &o->commit->author, &o->commit->mtime);
+		}else if(strcmp(buf, "committer") == 0){
+			parseauthor(&p, &np, &o->commit->committer, &o->commit->ctime);
+		}else if(strcmp(buf, "gpgsig") == 0){
+			/* just drop it */
+			if((t = strstr(p, "-----END PGP SIGNATURE-----")) == NULL)
+				errx(1, "malformed gpg signature");
+			np -= t - p;
+			p = t;
+		}
+		nextline(&p, &np);
+	}
+	while (np && isspace(*p)) {
+		p++;
+		np--;
+	}
+	o->commit->msg = p;
+	o->commit->nmsg = np;
+}
+
+static void
+parsetree(Object *o)
+{
+	char *p, buf[256];
+	int np, nn, m;
+	Dirent *t;
+
+	p = o->data;
+	np = o->size;
+	o->tree = emalloc(sizeof(Tinfo));
+	while(np > 0){
+		if(scanword(&p, &np, buf, sizeof(buf)) == -1)
+			break;
+		o->tree->ent = erealloc(o->tree->ent, ++o->tree->nent * sizeof(Dirent));
+		t = &o->tree->ent[o->tree->nent - 1];
+		memset(t, 0, sizeof(Dirent));
+		m = strtol(buf, NULL, 8);
+		/* FIXME: symlinks and other BS */
+		if(m == 0160000){
+			t->mode |= S_IFDIR;
+			t->modref = 1;
+		}
+		t->mode = m & 0777;
+		if(m & 0040000)
+			t->mode |= S_IFDIR;
+		t->name = p;
+		nn = strlen(p) + 1;
+		p += nn;
+		np -= nn;
+		if(np < sizeof(t->h.sha1))
+			errx(1, "malformed tree, remaining %d (%s)", np, p);
+		memcpy(t->h.sha1, p, sizeof(t->h.sha1));
+		p += sizeof(t->h.sha1);
+		np -= sizeof(t->h.sha1);
+	}
+}
+
+void
+parseobject(Object *o)
+{
+	if(o->flag & Cparsed)
+		return;
+	switch(o->type){
+	case GTree:	parsetree(o);	break;
+	case GCommit:	parsecommit(o);	break;
+	//case GTag:	parsetag(o);	break;
+	default:	break;
+	}
+	o->flag |= Cparsed;
+}
+
+static Object*
+readidxobject(FILE *idx, struct got_object_id h, int flag)
+{
+	char path[Pathmax];
+	char hbuf[41];
+	FILE *f;
+	Object *obj;
+	int l, n;
+	off_t o;
+	struct dirent *ent;
+	DIR *d;
+
+
+	if ((obj = got_object_idset_lookup_data(objcache, &h))) {
+		if(obj->flag & Cloaded)
+			return obj;
+		if(obj->flag & Cidx){
+			assert(idx != NULL);
+			o = ftello(idx);
+			if(fseek(idx, obj->off, 0) == -1)
+				errx(1, "could not seek to object offset");
+			if(readpacked(idx, obj, flag) == -1)
+				errx(1, "could not reload object");
+			if(fseek(idx, o, 0) == -1)
+				errx(1, "could not restore offset");
+			cache(obj);
+			return obj;
+		}
+	}
+
+	d = NULL;
+	/* We're not putting it in the cache yet... */
+	obj = emalloc(sizeof(Object));
+	obj->id = next_object_id + 1;
+	obj->hash = h;
+
+	hashfmt(hbuf, sizeof(hbuf), &h);
+	snprintf(path, sizeof(path), ".git/objects/%c%c/%s", hbuf[0], hbuf[1], hbuf + 2);
+	if((f = fopen(path, "r")) != NULL){
+		if(readloose(f, obj, flag) == -1)
+			goto error;
+		fclose(f);
+		parseobject(obj);
+		hashfmt(hbuf, sizeof(hbuf), &obj->hash);
+		fprintf(stderr, "object %s cached", hbuf);
+		cache(obj);
+		return obj;
+	}
+
+	o = -1;
+	if ((d = opendir(".git/objects/pack")) == NULL)
+		err(1, "open pack dir");
+	while ((ent = readdir(d)) != NULL) {
+		l = strlen(ent->d_name);
+		if(l > 4 && strcmp(ent->d_name + l - 4, ".idx") != 0)
+			continue;
+		snprintf(path, sizeof(path), ".git/objects/pack/%s", ent->d_name);
+		if((f = fopen(path, "r")) == NULL)
+			continue;
+		o = searchindex(f, h);
+		fclose(f);
+		if(o == -1)
+			continue;
+		break;
+	}
+	closedir(d);
+
+	if (o == -1)
+		goto error;
+
+	if((n = snprintf(path, sizeof(path), "%s", path)) >= sizeof(path) - 4)
+		goto error;
+	memcpy(path + n - 4, ".pack", 6);
+	if((f = fopen(path, "r")) == NULL)
+		goto error;
+	if(fseek(f, o, 0) == -1)
+		goto error;
+	if(readpacked(f, obj, flag) == -1)
+		goto error;
+	fclose(f);
+	parseobject(obj);
+	cache(obj);
+	return obj;
+error:
+	free(obj);
+	return NULL;
+}
+
+Object*
+readobject(struct got_object_id h)
+{
+	Object *o;
+
+	o = readidxobject(NULL, h, 0);
+	if(o)
+		ref(o);
+	return o;
+}
+
+int
+objcmp(const void *pa, const void *pb)
+{
+	Object *a, *b;
+
+	a = *(Object**)pa;
+	b = *(Object**)pb;
+	return memcmp(a->hash.sha1, b->hash.sha1, sizeof(a->hash.sha1));
+}
+
+static int
+hwrite(FILE *b, void *buf, int len, SHA1_CTX *ctx)
+{
+	SHA1Update(ctx, buf, len);
+	return fwrite(buf, 1, len, b);
+}
+
+static uint32_t
+objectcrc(FILE *f, Object *o)
+{
+	char buf[8096];
+	int n, r;
+
+	o->crc = 0;
+	fseek(f, o->off, 0);
+	for(n = o->len; n > 0; n -= r){
+		r = fread(buf, 1, n > sizeof(buf) ? sizeof(buf) : n, f);
+		if(r == -1)
+			return -1;
+		if(r == 0)
+			return 0;
+		o->crc = crc32(o->crc, buf, r);
+	}
+	return 0;
+}
+
+int
+indexpack(int packfd, int idxfd, struct got_object_id packhash)
+{
+	char hdr[4*3], buf[8];
+	int nobj, nvalid, nbig, n, i, step;
+	Object *o, **objects;
+	char *valid;
+	SHA1_CTX ctx, objctx;
+	FILE *f;
+	struct got_object_id h;
+	int c;
+
+	if ((f = fdopen(packfd, "r")) == NULL)
+		return -1;
+	if (fseek(f, 0, SEEK_SET) == -1)
+		return -1;
+	if (fread(hdr, 1, sizeof(hdr), f) != sizeof(hdr)) {
+		fprintf(stderr, "short read on header");
+		return -1;
+	}
+	if (memcmp(hdr, "PACK\0\0\0\2", 8) != 0) {
+		fprintf(stderr, "invalid header");
+		return -1;
+	}
+
+	nvalid = 0;
+	nobj = GETBE32(hdr + 8);
+	objects = calloc(nobj, sizeof(Object*));
+	valid = calloc(nobj, sizeof(char));
+	step = nobj/100;
+	if(!step)
+		step++;
+	while (nvalid != nobj) {
+		fprintf(stderr, "indexing (%d/%d):", nvalid, nobj);
+		n = 0;
+		for (i = 0; i < nobj; i++) {
+			if (valid[i]) {
+				n++;
+				continue;
+			}
+			if (i % step == 0)
+				fprintf(stderr, ".");
+			if (!objects[i]) {
+				o = emalloc(sizeof(Object));
+				o->off = ftello(f);
+				objects[i] = o;
+			}
+			o = objects[i];
+			fseek(f, o->off, 0);
+			if (readpacked(f, o, Cidx) == 0){
+				SHA1Init(&objctx);
+				SHA1Update(&objctx, (uint8_t*)o->all, o->size + strlen(o->all) + 1);
+				SHA1Final(o->hash.sha1, &objctx);
+				cache(o);
+				valid[i] = 1;
+				n++;
+			}
+			if(objectcrc(f, o) == -1)
+				return -1;
+		}
+		fprintf(stderr, "\n");
+		if (n == nvalid) {
+			errx(1, "fix point reached too early: %d/%d", nvalid, nobj);
+			goto error;
+		}
+		nvalid = n;
+	}
+	fclose(f);
+
+	SHA1Init(&ctx);
+	qsort(objects, nobj, sizeof(Object*), objcmp);
+	if((f = fdopen(idxfd, "w")) == NULL)
+		return -1;
+	if(hwrite(f, "\xfftOc\x00\x00\x00\x02", 8, &ctx) != 8)
+		goto error;
+	/* fanout table */
+	c = 0;
+	for(i = 0; i < 256; i++){
+		while(c < nobj && (objects[c]->hash.sha1[0] & 0xff) <= i)
+			c++;
+		PUTBE32(buf, c);
+		hwrite(f, buf, 4, &ctx);
+	}
+	for(i = 0; i < nobj; i++){
+		o = objects[i];
+		hwrite(f, o->hash.sha1, sizeof(o->hash.sha1), &ctx);
+	}
+
+	/* pointless, nothing uses this */
+	for(i = 0; i < nobj; i++){
+		PUTBE32(buf, objects[i]->crc);
+		hwrite(f, buf, 4, &ctx);
+	}
+
+	nbig = 0;
+	for(i = 0; i < nobj; i++){
+		if(objects[i]->off <= (1ull<<31))
+			PUTBE32(buf, objects[i]->off);
+		else
+			PUTBE32(buf, (1ull << 31) | nbig++);
+		hwrite(f, buf, 4, &ctx);
+	}
+	for(i = 0; i < nobj; i++){
+		if(objects[i]->off > (1ull<<31)){
+			PUTBE64(buf, objects[i]->off);
+			hwrite(f, buf, 8, &ctx);
+		}
+	}
+	hwrite(f, packhash.sha1, sizeof(packhash.sha1), &ctx);
+	SHA1Final(h.sha1, &ctx);
+	fwrite(h.sha1, 1, sizeof(h.sha1), f);
+
+	free(objects);
+	free(valid);
+	fclose(f);
+	return 0;
+
+error:
+	free(objects);
+	free(valid);
+	fclose(f);
+	return -1;
+}
+
+int
+main(int argc, char **argv)
+{
+	const struct got_error *err = NULL;
+	struct got_object_id packhash;
+	struct imsgbuf ibuf;
+	struct imsg imsg;
+	int packfd, idxfd;
+
+	objcache = got_object_idset_alloc();
+	imsg_init(&ibuf, GOT_IMSG_FD_CHILD);
+	if((err = got_privsep_recv_imsg(&imsg, &ibuf, 0)) != 0) {
+		if (err->code == GOT_ERR_PRIVSEP_PIPE)
+			err = NULL;
+		goto done;
+	}
+	if (imsg.hdr.type == GOT_IMSG_STOP)
+		goto done;
+	if (imsg.hdr.type != GOT_IMSG_IDXPACK_REQUEST) {
+		err = got_error(GOT_ERR_PRIVSEP_MSG);
+		goto done;
+	}
+	if (imsg.hdr.len - IMSG_HEADER_SIZE != SHA1_DIGEST_LENGTH) {
+		err = got_error(GOT_ERR_PRIVSEP_LEN);
+		goto done;
+	}
+	packfd = imsg.fd;
+	memcpy(packhash.sha1, imsg.data, SHA1_DIGEST_LENGTH);
+	got_privsep_send_ack(&ibuf);
+
+	if((err = got_privsep_recv_imsg(&imsg, &ibuf, 0)) != 0) {
+		if (err->code == GOT_ERR_PRIVSEP_PIPE)
+			err = NULL;
+		goto done;
+	}
+	if (imsg.hdr.type == GOT_IMSG_STOP)
+		goto done;
+	if (imsg.hdr.type != GOT_IMSG_TMPFD) {
+		err = got_error(GOT_ERR_PRIVSEP_MSG);
+		goto done;
+	}
+	if (imsg.hdr.len - IMSG_HEADER_SIZE != 0) {
+		err = got_error(GOT_ERR_PRIVSEP_LEN);
+		goto done;
+	}
+	idxfd = imsg.fd;
+
+	indexpack(packfd, idxfd, packhash);
+done:
+	if(err != NULL)
+		got_privsep_send_error(&ibuf, err);
+	else
+		err = got_privsep_send_index_pack_done(&ibuf);
+	if(err != NULL) {
+		fprintf(stderr, "%s: %s\n", getprogname(), err->msg);
+		got_privsep_send_error(&ibuf, err);
+	}
+
+	exit(0);
+}