"GOT", but the "O" is a cute, smiling pufferfish. Index | Thread | Search

From:
Stefan Sperling <stsp@stsp.name>
Subject:
Re: fix got_opentemp() overhead of got-read-pack
To:
gameoftrees@openbsd.org
Date:
Mon, 3 Jan 2022 15:00:14 +0100

Download raw body.

Thread
On Fri, Dec 31, 2021 at 07:02:31PM +0100, Stefan Sperling wrote:
> Turns out the problem where gotadmin pack spends about 30% of its time
> opening temporary files can be fixed independently from using mmap.
> 
> With this patch we open temporary files used during delta application
> just once, instead of opening new temporary files during every request
> for a blob object or a raw object.
> 
> This makes gotadmin pack significantly faster, and will likely also
> speed up other tasks which need to load a lot of blobs.
> 
> ok?

The previous patch triggered pledge violations for commands which
do not use the "cpath" promise, such as 'got branch -l'.

This is fixed in the new version below. We can wait with opening
temporary files until we are certain that they will be needed, i.e.
when a request for a blob or a raw object is sent to the child.

ok?


diff 46f5b76fad8d22e4cb7949ad4ce9462ede847a64 0f639468088c75c028b204d850ac5b1e5052dd1f
blob - dc97d615eecefa57ba072dfa818660e2362700e1
blob + 2a9c135628c6fed4aeef4fb17093f23e0b5df9ae
--- lib/got_lib_pack.h
+++ lib/got_lib_pack.h
@@ -21,6 +21,7 @@ struct got_pack {
 	uint8_t *map;
 	size_t filesize;
 	struct got_privsep_child *privsep_child;
+	int child_has_tempfiles;
 	struct got_delta_cache *delta_cache;
 };
 
blob - a4cf395476aee75f57a0281a2184b91a09e360e3
blob + fd5a9771d547a2696e75c7663d977c2e02cb367f
--- lib/object.c
+++ lib/object.c
@@ -166,58 +166,65 @@ request_packed_object(struct got_object **obj, struct 
 	return NULL;
 }
 
+/* Create temporary files used during delta application. */
 static const struct got_error *
+pack_child_send_tempfiles(struct imsgbuf *ibuf, struct got_pack *pack)
+{
+	const struct got_error *err;
+	int basefd, accumfd;
+
+	/* 
+	 * For performance reasons, the child will keep reusing the
+	 * same temporary files during every object request.
+	 * Opening and closing new files for every object request is
+	 * too expensive during operations such as 'gotadmin pack'.
+	 */
+	if (pack->child_has_tempfiles)
+		return NULL;
+
+	basefd = got_opentempfd();
+	if (basefd == -1)
+		return got_error_from_errno("got_opentempfd");
+
+	err = got_privsep_send_tmpfd(ibuf, basefd);
+	if (err)
+		return err;
+
+	accumfd = got_opentempfd();
+	if (accumfd == -1)
+		return got_error_from_errno("got_opentempfd");
+
+	err = got_privsep_send_tmpfd(ibuf, accumfd);
+	if (err)
+		return err;
+
+	pack->child_has_tempfiles = 1;
+	return NULL;
+}
+
+static const struct got_error *
 request_packed_object_raw(uint8_t **outbuf, off_t *size, size_t *hdrlen,
     int outfd, struct got_pack *pack, int idx, struct got_object_id *id)
 {
 	const struct got_error *err = NULL;
 	struct imsgbuf *ibuf = pack->privsep_child->ibuf;
 	int outfd_child;
-	int basefd, accumfd; /* temporary files for delta application */
 
-	basefd = got_opentempfd();
-	if (basefd == -1)
-		return got_error_from_errno("got_opentempfd");
-
-	accumfd = got_opentempfd();
-	if (accumfd == -1) {
-		close(basefd);
-		return got_error_from_errno("got_opentempfd");
-	}
-
-	outfd_child = dup(outfd);
-	if (outfd_child == -1) {
-		err = got_error_from_errno("dup");
-		close(basefd);
-		close(accumfd);
+	 err = pack_child_send_tempfiles(ibuf, pack);
+	 if (err)
 		return err;
-	}
 
+	outfd_child = dup(outfd);
+	if (outfd_child == -1)
+		return got_error_from_errno("dup");
+
 	err = got_privsep_send_packed_raw_obj_req(ibuf, idx, id);
 	if (err) {
-		close(basefd);
-		close(accumfd);
 		close(outfd_child);
 		return err;
 	}
 
 	err = got_privsep_send_raw_obj_outfd(ibuf, outfd_child);
-	if (err) {
-		close(basefd);
-		close(accumfd);
-		return err;
-	}
-
-
-	err = got_privsep_send_tmpfd(pack->privsep_child->ibuf,
-	    basefd);
-	if (err) {
-		close(accumfd);
-		return err;
-	}
-
-	err = got_privsep_send_tmpfd(pack->privsep_child->ibuf,
-	    accumfd);
 	if (err)
 		return err;
 
@@ -258,6 +265,7 @@ start_pack_privsep_child(struct got_pack *pack, struct
 		free(ibuf);
 		return err;
 	}
+	pack->child_has_tempfiles = 0;
 
 	if (socketpair(AF_UNIX, SOCK_STREAM, PF_UNSPEC, imsg_fds) == -1) {
 		err = got_error_from_errno("socketpair");
@@ -1191,15 +1199,12 @@ request_packed_blob(uint8_t **outbuf, size_t *size, si
     struct got_object_id *id)
 {
 	const struct got_error *err = NULL;
+	struct imsgbuf *ibuf = pack->privsep_child->ibuf;
 	int outfd_child;
-	int basefd, accumfd; /* temporary files for delta application */
 
-	basefd = got_opentempfd();
-	if (basefd == -1)
-		return got_error_from_errno("got_opentempfd");
-	accumfd = got_opentempfd();
-	if (accumfd == -1)
-		return got_error_from_errno("got_opentempfd");
+	 err = pack_child_send_tempfiles(ibuf, pack);
+	 if (err)
+		return err;
 
 	outfd_child = dup(outfd);
 	if (outfd_child == -1)
@@ -1212,23 +1217,9 @@ request_packed_blob(uint8_t **outbuf, size_t *size, si
 	err = got_privsep_send_blob_outfd(pack->privsep_child->ibuf,
 	    outfd_child);
 	if (err) {
-		close(basefd);
-		close(accumfd);
 		return err;
 	}
 
-	err = got_privsep_send_tmpfd(pack->privsep_child->ibuf,
-	    basefd);
-	if (err) {
-		close(accumfd);
-		return err;
-	}
-
-	err = got_privsep_send_tmpfd(pack->privsep_child->ibuf,
-	    accumfd);
-	if (err)
-		return err;
-
 	err = got_privsep_recv_blob(outbuf, size, hdrlen,
 	    pack->privsep_child->ibuf);
 	if (err)
blob - 8bbfe87a70dfd1f3c936dd572b1ab0dcf33aff61
blob + 1ea0d617c52732faf35724fe601e28a24b03992f
--- libexec/got-read-pack/got-read-pack.c
+++ libexec/got-read-pack/got-read-pack.c
@@ -289,13 +289,43 @@ done:
 }
 
 static const struct got_error *
+receive_tempfile(FILE **basefile, FILE **accumfile, struct imsg *imsg,
+    struct imsgbuf *ibuf)
+{
+	size_t datalen;
+	FILE **f;
+
+	datalen = imsg->hdr.len - IMSG_HEADER_SIZE;
+	if (datalen != 0)
+		return got_error(GOT_ERR_PRIVSEP_LEN);
+
+	if (imsg->fd == -1)
+		return got_error(GOT_ERR_PRIVSEP_NO_FD);
+
+	if (*basefile == NULL)
+		f = basefile;
+	else if (*accumfile == NULL)
+		f = accumfile;
+	else
+		return got_error(GOT_ERR_PRIVSEP_MSG);
+
+	*f = fdopen(imsg->fd, "w+");
+	if (*f == NULL)
+		return got_error_from_errno("fdopen");
+	imsg->fd = -1;
+
+	return NULL;
+}
+
+static const struct got_error *
 blob_request(struct imsg *imsg, struct imsgbuf *ibuf, struct got_pack *pack,
-    struct got_packidx *packidx, struct got_object_cache *objcache)
+    struct got_packidx *packidx, struct got_object_cache *objcache,
+    FILE *basefile, FILE *accumfile)
 {
 	const struct got_error *err = NULL;
 	struct got_imsg_packed_object iobj;
 	struct got_object *obj = NULL;
-	FILE *outfile = NULL, *basefile = NULL, *accumfile = NULL;
+	FILE *outfile = NULL;
 	struct got_object_id id;
 	size_t datalen;
 	uint64_t blob_size;
@@ -320,12 +350,6 @@ blob_request(struct imsg *imsg, struct imsgbuf *ibuf, 
 	err = receive_file(&outfile, ibuf, GOT_IMSG_BLOB_OUTFD);
 	if (err)
 		goto done;
-	err = receive_file(&basefile, ibuf, GOT_IMSG_TMPFD);
-	if (err)
-		goto done;
-	err = receive_file(&accumfile, ibuf, GOT_IMSG_TMPFD);
-	if (err)
-		goto done;
 
 	if (obj->flags & GOT_OBJ_FLAG_DELTIFIED) {
 		err = got_pack_get_max_delta_object_size(&blob_size, obj, pack);
@@ -348,10 +372,6 @@ done:
 	free(buf);
 	if (outfile && fclose(outfile) == EOF && err == NULL)
 		err = got_error_from_errno("fclose");
-	if (basefile && fclose(basefile) == EOF && err == NULL)
-		err = got_error_from_errno("fclose");
-	if (accumfile && fclose(accumfile) == EOF && err == NULL)
-		err = got_error_from_errno("fclose");
 	got_object_close(obj);
 	if (err && err->code != GOT_ERR_PRIVSEP_PIPE)
 		got_privsep_send_error(ibuf, err);
@@ -775,12 +795,12 @@ done:
 static const struct got_error *
 raw_object_request(struct imsg *imsg, struct imsgbuf *ibuf,
     struct got_pack *pack, struct got_packidx *packidx,
-    struct got_object_cache *objcache)
+    struct got_object_cache *objcache, FILE *basefile, FILE *accumfile)
 {
 	const struct got_error *err = NULL;
 	uint8_t *buf = NULL;
 	uint64_t size = 0;
-	FILE *outfile = NULL, *basefile = NULL, *accumfile = NULL;
+	FILE *outfile = NULL;
 	struct got_imsg_packed_object iobj;
 	struct got_object *obj;
 	struct got_object_id id;
@@ -805,12 +825,6 @@ raw_object_request(struct imsg *imsg, struct imsgbuf *
 	err = receive_file(&outfile, ibuf, GOT_IMSG_RAW_OBJECT_OUTFD);
 	if (err)
 		return err;
-	err = receive_file(&basefile, ibuf, GOT_IMSG_TMPFD);
-	if (err)
-		goto done;
-	err = receive_file(&accumfile, ibuf, GOT_IMSG_TMPFD);
-	if (err)
-		goto done;
 
 	if (obj->flags & GOT_OBJ_FLAG_DELTIFIED) {
 		err = got_pack_get_max_delta_object_size(&size, obj, pack);
@@ -833,10 +847,6 @@ done:
 	free(buf);
 	if (outfile && fclose(outfile) == EOF && err == NULL)
 		err = got_error_from_errno("fclose");
-	if (basefile && fclose(basefile) == EOF && err == NULL)
-		err = got_error_from_errno("fclose");
-	if (accumfile && fclose(accumfile) == EOF && err == NULL)
-		err = got_error_from_errno("fclose");
 	got_object_close(obj);
 	if (err && err->code != GOT_ERR_PRIVSEP_PIPE)
 		got_privsep_send_error(ibuf, err);
@@ -999,6 +1009,7 @@ main(int argc, char *argv[])
 	struct got_packidx *packidx = NULL;
 	struct got_pack *pack = NULL;
 	struct got_object_cache objcache;
+	FILE *basefile = NULL, *accumfile = NULL;
 
 	//static int attached;
 	//while (!attached) sleep(1);
@@ -1054,13 +1065,21 @@ main(int argc, char *argv[])
 			break;
 
 		switch (imsg.hdr.type) {
+		case GOT_IMSG_TMPFD:
+			err = receive_tempfile(&basefile, &accumfile,
+			    &imsg, &ibuf);
+			break;
 		case GOT_IMSG_PACKED_OBJECT_REQUEST:
 			err = object_request(&imsg, &ibuf, pack, packidx,
 			    &objcache);
 			break;
 		case GOT_IMSG_PACKED_RAW_OBJECT_REQUEST:
+			if (basefile == NULL || accumfile == NULL) {
+				err = got_error(GOT_ERR_PRIVSEP_MSG);
+				break;
+			}
 			err = raw_object_request(&imsg, &ibuf, pack, packidx,
-			    &objcache);
+			    &objcache, basefile, accumfile);
 			break;
 		case GOT_IMSG_COMMIT_REQUEST:
 			err = commit_request(&imsg, &ibuf, pack, packidx,
@@ -1071,8 +1090,12 @@ main(int argc, char *argv[])
 			    &objcache);
 			break;
 		case GOT_IMSG_BLOB_REQUEST:
+			if (basefile == NULL || accumfile == NULL) {
+				err = got_error(GOT_ERR_PRIVSEP_MSG);
+				break;
+			}
 			err = blob_request(&imsg, &ibuf, pack, packidx,
-			    &objcache);
+			    &objcache, basefile, accumfile);
 			break;
 		case GOT_IMSG_TAG_REQUEST:
 			err = tag_request(&imsg, &ibuf, pack, packidx,
@@ -1100,6 +1123,10 @@ main(int argc, char *argv[])
 		got_pack_close(pack);
 	got_object_cache_close(&objcache);
 	imsg_clear(&ibuf);
+	if (basefile && fclose(basefile) == EOF && err == NULL)
+		err = got_error_from_errno("fclose");
+	if (accumfile && fclose(accumfile) == EOF && err == NULL)
+		err = got_error_from_errno("fclose");
 	if (err) {
 		if (!sigint_received && err->code != GOT_ERR_PRIVSEP_PIPE) {
 			fprintf(stderr, "%s: %s\n", getprogname(), err->msg);