Download raw body.
rate-limiting of gotadmin progress output
Some time ago naddy pointed out that 'gotadmin cleanup' produces a
huge amount of progress output which easily overwhelms slow terminals.
The same is true for 'gotadmin pack'.
The patch below takes an approach similar to the one naddy suggested at
the time. (naddy's patch was never applied because naddy himself had
cosmetic concerns about it.)
Using a thin API layer on top of clock_gettime() and timespecs, progress
updates are rate-limited to at most one every 500 msec, which seems fine
to me. I would have no problem with tweaking this interval if needed.
In my test case the volume of progress output from 'gotadmin pack -a'
is reduced from 182Kb to 10Kb. The output volume of 'gotadmin cleanup'
goes down from 736Kb to 2Kb.
The run time of 'gotadmin cleanup' improves from 18 seconds to 12 seconds.
I am leaving other progress reports alone for now. We can easily
convert them to this new rate-limiting API over time.
ok?
diff 0f639468088c75c028b204d850ac5b1e5052dd1f 19f1646bd8e01a81d9c170af20efecd6c5a57ee7
blob - 7e44f914b454fcd320fd03610f840109df3f7539
blob + 8b431936ed43a5398c391d18637ae6dbc0f5348f
--- got/Makefile
+++ got/Makefile
@@ -13,7 +13,7 @@ SRCS= got.c blame.c commit_graph.c delta.c diff.c \
diff_myers.c diff_output.c diff_output_plain.c \
diff_output_unidiff.c diff_output_edscript.c \
diff_patience.c send.c deltify.c pack_create.c dial.c \
- bloom.c murmurhash2.c
+ bloom.c murmurhash2.c ratelimit.c
MAN = ${PROG}.1 got-worktree.5 git-repository.5 got.conf.5
blob - 47d9d105cc92076d9e33ac2abdf1adf89ab25dc9
blob + 781133bbc9837ad999231c521ae9da3239c0232b
--- gotadmin/Makefile
+++ gotadmin/Makefile
@@ -8,7 +8,7 @@ SRCS= gotadmin.c \
inflate.c lockfile.c object.c object_cache.c object_create.c \
object_idset.c object_parse.c opentemp.c pack.c pack_create.c \
path.c privsep.c reference.c repository.c repository_admin.c \
- worktree_open.c sha1.c bloom.c murmurhash2.c
+ worktree_open.c sha1.c bloom.c murmurhash2.c ratelimit.c
MAN = ${PROG}.1
CPPFLAGS = -I${.CURDIR}/../include -I${.CURDIR}/../lib
blob - /dev/null
blob + 9b95dcd8f24e8a9a1ad8900a16ece71c03e03a94 (mode 644)
--- /dev/null
+++ lib/got_lib_ratelimit.h
@@ -0,0 +1,23 @@
+/*
+ * Copyright (c) 2022 Stefan Sperling <stsp@openbsd.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+struct got_ratelimit {
+ struct timespec last;
+ struct timespec interval;
+};
+
+void got_ratelimit_init(struct got_ratelimit *, time_t, unsigned int);
+const struct got_error *got_ratelimit_check(int *, struct got_ratelimit *);
blob - 5e229ab44b13c2e63ed9807f70837898eeda1e43
blob + 2e421bd245bb3702600302716d83053e5785c51a
--- lib/pack_create.c
+++ lib/pack_create.c
@@ -20,6 +20,7 @@
#include <sys/tree.h>
#include <sys/uio.h>
#include <sys/stat.h>
+#include <sys/time.h>
#include <stdint.h>
#include <imsg.h>
@@ -27,6 +28,7 @@
#include <stdlib.h>
#include <string.h>
#include <sha1.h>
+#include <time.h>
#include <limits.h>
#include <zlib.h>
@@ -47,6 +49,7 @@
#include "got_lib_pack.h"
#include "got_lib_privsep.h"
#include "got_lib_repository.h"
+#include "got_lib_ratelimit.h"
#ifndef MIN
#define MIN(_a,_b) ((_a) < (_b) ? (_a) : (_b))
@@ -249,12 +252,30 @@ encode_delta(struct got_pack_meta *m, struct got_raw_o
return NULL;
}
+static const struct got_error *
+report_progress(got_pack_progress_cb progress_cb, void *progress_arg,
+ struct got_ratelimit *rl, off_t packfile_size, int ncommits,
+ int nobj_total, int obj_deltify, int nobj_written)
+{
+ const struct got_error *err;
+ int elapsed;
+ if (progress_cb == NULL)
+ return NULL;
+
+ err = got_ratelimit_check(&elapsed, rl);
+ if (err || !elapsed)
+ return err;
+
+ return progress_cb(progress_arg, packfile_size, ncommits,
+ nobj_total, obj_deltify, nobj_written);
+}
+
static const struct got_error *
pick_deltas(struct got_pack_meta **meta, int nmeta, int nours,
FILE *delta_cache, struct got_repository *repo,
got_pack_progress_cb progress_cb, void *progress_arg,
- got_cancel_cb cancel_cb, void *cancel_arg)
+ struct got_ratelimit *rl, got_cancel_cb cancel_cb, void *cancel_arg)
{
const struct got_error *err = NULL;
struct got_pack_meta *m = NULL, *base = NULL;
@@ -271,11 +292,10 @@ pick_deltas(struct got_pack_meta **meta, int nmeta, in
if (err)
break;
}
- if (progress_cb) {
- err = progress_cb(progress_arg, 0L, nours, nmeta, i, 0);
- if (err)
- goto done;
- }
+ err = report_progress(progress_cb, progress_arg, rl,
+ 0L, nours, nmeta, i, 0);
+ if (err)
+ goto done;
m = meta[i];
if (m->obj_type == GOT_OBJ_TYPE_COMMIT ||
@@ -923,7 +943,7 @@ read_meta(struct got_pack_meta ***meta, int *nmeta,
struct got_object_id **theirs, int ntheirs,
struct got_object_id **ours, int nours, struct got_repository *repo,
int loose_obj_only, got_pack_progress_cb progress_cb, void *progress_arg,
- got_cancel_cb cancel_cb, void *cancel_arg)
+ struct got_ratelimit *rl, got_cancel_cb cancel_cb, void *cancel_arg)
{
const struct got_error *err = NULL;
struct got_object_id **ids = NULL;
@@ -964,12 +984,10 @@ read_meta(struct got_pack_meta ***meta, int *nmeta,
loose_obj_only, cancel_cb, cancel_arg);
if (err)
goto done;
- if (progress_cb) {
- err = progress_cb(progress_arg, 0L, nours,
- v.nmeta, 0, 0);
- if (err)
- goto done;
- }
+ err = report_progress(progress_cb, progress_arg, rl,
+ 0L, nours, v.nmeta, 0, 0);
+ if (err)
+ goto done;
}
for (i = 0; i < ntheirs; i++) {
@@ -990,12 +1008,10 @@ read_meta(struct got_pack_meta ***meta, int *nmeta,
loose_obj_only, cancel_cb, cancel_arg);
if (err)
goto done;
- if (progress_cb) {
- err = progress_cb(progress_arg, 0L, nours,
- v.nmeta, 0, 0);
- if (err)
- goto done;
- }
+ err = report_progress(progress_cb, progress_arg, rl,
+ 0L, nours, v.nmeta, 0, 0);
+ if (err)
+ goto done;
}
for (i = 0; i < nobj; i++) {
@@ -1003,12 +1019,12 @@ read_meta(struct got_pack_meta ***meta, int *nmeta,
loose_obj_only, cancel_cb, cancel_arg);
if (err)
goto done;
- if (progress_cb) {
- err = progress_cb(progress_arg, 0L, nours,
- v.nmeta, 0, 0);
- if (err)
- goto done;
- }
+ if (err)
+ goto done;
+ err = report_progress(progress_cb, progress_arg, rl,
+ 0L, nours, v.nmeta, 0, 0);
+ if (err)
+ goto done;
}
for (i = 0; i < nours; i++) {
@@ -1029,14 +1045,17 @@ read_meta(struct got_pack_meta ***meta, int *nmeta,
loose_obj_only, cancel_cb, cancel_arg);
if (err)
goto done;
- if (progress_cb) {
- err = progress_cb(progress_arg, 0L, nours,
- v.nmeta, 0, 0);
- if (err)
- goto done;
- }
+ err = report_progress(progress_cb, progress_arg, rl,
+ 0L, nours, v.nmeta, 0, 0);
+ if (err)
+ goto done;
}
+ if (progress_cb) {
+ err = progress_cb(progress_arg, 0L, nours, v.nmeta, 0, 0);
+ if (err)
+ goto done;
+ }
done:
for (i = 0; i < nobj; i++) {
free(ids[i]);
@@ -1136,6 +1155,7 @@ genpack(uint8_t *pack_sha1, FILE *packfile, FILE *delt
struct got_pack_meta **meta, int nmeta, int nours,
int use_offset_deltas, struct got_repository *repo,
got_pack_progress_cb progress_cb, void *progress_arg,
+ struct got_ratelimit *rl,
got_cancel_cb cancel_cb, void *cancel_arg)
{
const struct got_error *err = NULL;
@@ -1167,12 +1187,10 @@ genpack(uint8_t *pack_sha1, FILE *packfile, FILE *delt
goto done;
qsort(meta, nmeta, sizeof(struct got_pack_meta *), write_order_cmp);
for (i = 0; i < nmeta; i++) {
- if (progress_cb) {
- err = progress_cb(progress_arg, packfile_size, nours,
- nmeta, nmeta, i);
- if (err)
- goto done;
- }
+ err = report_progress(progress_cb, progress_arg, rl,
+ packfile_size, nours, nmeta, nmeta, i);
+ if (err)
+ goto done;
m = meta[i];
m->off = ftello(packfile);
err = got_object_raw_open(&raw, &outfd, repo, &m->id);
@@ -1281,10 +1299,12 @@ genpack(uint8_t *pack_sha1, FILE *packfile, FILE *delt
err = got_ferror(packfile, GOT_ERR_IO);
packfile_size += SHA1_DIGEST_LENGTH;
packfile_size += sizeof(struct got_packfile_hdr);
- err = progress_cb(progress_arg, packfile_size, nours,
- nmeta, nmeta, nmeta);
- if (err)
- goto done;
+ if (progress_cb) {
+ err = progress_cb(progress_arg, packfile_size, nours,
+ nmeta, nmeta, nmeta);
+ if (err)
+ goto done;
+ }
done:
if (delta_file && fclose(delta_file) == EOF && err == NULL)
err = got_error_from_errno("fclose");
@@ -1307,9 +1327,13 @@ got_pack_create(uint8_t *packsha1, FILE *packfile,
struct got_pack_meta **meta;
int nmeta;
FILE *delta_cache = NULL;
+ struct got_ratelimit rl;
+ got_ratelimit_init(&rl, 0, 500);
+
err = read_meta(&meta, &nmeta, theirs, ntheirs, ours, nours, repo,
- loose_obj_only, progress_cb, progress_arg, cancel_cb, cancel_arg);
+ loose_obj_only, progress_cb, progress_arg, &rl,
+ cancel_cb, cancel_arg);
if (err)
return err;
@@ -1326,7 +1350,7 @@ got_pack_create(uint8_t *packsha1, FILE *packfile,
if (nmeta > 0) {
err = pick_deltas(meta, nmeta, nours, delta_cache, repo,
- progress_cb, progress_arg, cancel_cb, cancel_arg);
+ progress_cb, progress_arg, &rl, cancel_cb, cancel_arg);
if (err)
goto done;
if (fseeko(delta_cache, 0L, SEEK_SET) == -1) {
@@ -1336,7 +1360,7 @@ got_pack_create(uint8_t *packsha1, FILE *packfile,
}
err = genpack(packsha1, packfile, delta_cache, meta, nmeta, nours, 1,
- repo, progress_cb, progress_arg, cancel_cb, cancel_arg);
+ repo, progress_cb, progress_arg, &rl, cancel_cb, cancel_arg);
if (err)
goto done;
done:
blob - /dev/null
blob + 219e7905e4765ae964a3ab7a1e8145d1ce344c2f (mode 644)
--- /dev/null
+++ lib/ratelimit.c
@@ -0,0 +1,55 @@
+/*
+ * Copyright (c) 2022 Stefan Sperling <stsp@openbsd.org>
+ *
+ * Permission to use, copy, modify, and distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#include <sys/time.h>
+
+#include <stdio.h>
+#include <limits.h>
+#include <string.h>
+#include <time.h>
+
+#include "got_lib_ratelimit.h"
+
+#include "got_error.h"
+
+void
+got_ratelimit_init(struct got_ratelimit *rl, time_t interval_sec,
+ unsigned int interval_msec)
+{
+ memset(rl, 0, sizeof(*rl));
+ rl->interval.tv_sec = interval_sec;
+ rl->interval.tv_nsec = interval_msec * 1000000UL;
+}
+
+const struct got_error *
+got_ratelimit_check(int *elapsed, struct got_ratelimit *rl)
+{
+ struct timespec now, delta;
+
+ if (clock_gettime(CLOCK_MONOTONIC, &now) == -1)
+ return got_error_from_errno("clock_gettime");
+
+ if (timespecisset(&rl->last)) {
+ timespecsub(&now, &rl->last, &delta);
+ *elapsed = timespeccmp(&delta, &rl->interval, >=) ? 1 : 0;
+ } else
+ *elapsed = 1;
+
+ if (*elapsed)
+ rl->last = now;
+
+ return NULL;
+}
blob - 4e1253bcafe34044a40c52250b6a96a552b4b609
blob + 40af887d57530bc64cde9dbfdd26426592ae93c3
--- lib/repository_admin.c
+++ lib/repository_admin.c
@@ -54,6 +54,7 @@
#include "got_lib_pack_create.h"
#include "got_lib_sha1.h"
#include "got_lib_lockfile.h"
+#include "got_lib_ratelimit.h"
#ifndef nitems
#define nitems(_a) (sizeof((_a)) / sizeof((_a)[0]))
@@ -598,9 +599,27 @@ done:
}
static const struct got_error *
+report_cleanup_progress(got_cleanup_progress_cb progress_cb,
+ void *progress_arg, struct got_ratelimit *rl,
+ int nloose, int ncommits, int npurged)
+{
+ const struct got_error *err;
+ int elapsed;
+
+ if (progress_cb == NULL)
+ return NULL;
+
+ err = got_ratelimit_check(&elapsed, rl);
+ if (err || !elapsed)
+ return err;
+
+ return progress_cb(progress_arg, nloose, ncommits, npurged);
+}
+
+static const struct got_error *
get_loose_object_ids(struct got_object_idset **loose_ids, off_t *ondisk_size,
got_cleanup_progress_cb progress_cb, void *progress_arg,
- struct got_repository *repo)
+ struct got_ratelimit *rl, struct got_repository *repo)
{
const struct got_error *err = NULL;
char *path_objects = NULL, *path = NULL;
@@ -688,13 +707,11 @@ get_loose_object_ids(struct got_object_idset **loose_i
err = got_object_idset_add(*loose_ids, &id, NULL);
if (err)
goto done;
- if (progress_cb) {
- err = progress_cb(progress_arg,
- got_object_idset_num_elements(*loose_ids),
- -1, -1);
- if (err)
- goto done;
- }
+ err = report_cleanup_progress(progress_cb,
+ progress_arg, rl,
+ got_object_idset_num_elements(*loose_ids), -1, -1);
+ if (err)
+ goto done;
}
if (closedir(dir) != 0) {
@@ -878,7 +895,8 @@ static const struct got_error *
load_commit_or_tag(struct got_object_idset *loose_ids, int *ncommits,
int *npacked, struct got_object_idset *traversed_ids,
struct got_object_id *id, struct got_repository *repo,
- got_cleanup_progress_cb progress_cb, void *progress_arg, int nloose,
+ got_cleanup_progress_cb progress_cb, void *progress_arg,
+ struct got_ratelimit *rl, int nloose,
got_cancel_cb cancel_cb, void *cancel_arg)
{
const struct got_error *err;
@@ -986,11 +1004,10 @@ load_commit_or_tag(struct got_object_idset *loose_ids,
if (commit || tag)
(*ncommits)++; /* scanned tags are counted as commits */
- if (progress_cb) {
- err = progress_cb(progress_arg, nloose, *ncommits, -1);
- if (err)
- break;
- }
+ err = report_cleanup_progress(progress_cb, progress_arg, rl,
+ nloose, *ncommits, -1);
+ if (err)
+ break;
if (commit) {
/* Find parent commits to scan. */
@@ -1024,6 +1041,7 @@ struct purge_loose_object_arg {
struct got_repository *repo;
got_cleanup_progress_cb progress_cb;
void *progress_arg;
+ struct got_ratelimit *rl;
int nloose;
int ncommits;
int npurged;
@@ -1075,10 +1093,10 @@ purge_loose_object(struct got_object_id *id, void *dat
a->npurged++;
a->size_purged += sb.st_size;
- if (a->progress_cb) {
- err = a->progress_cb(a->progress_arg, a->nloose,
- a->ncommits, a->npurged);
- }
+ err = report_cleanup_progress(a->progress_cb, a->progress_arg,
+ a->rl, a->nloose, a->ncommits, a->npurged);
+ if (err)
+ goto done;
}
done:
if (fd != -1 && close(fd) == -1 && err == NULL)
@@ -1104,15 +1122,17 @@ got_repo_purge_unreferenced_loose_objects(struct got_r
struct got_reflist_entry *re;
struct purge_loose_object_arg arg;
time_t max_mtime = 0;
+ struct got_ratelimit rl;
TAILQ_INIT(&refs);
+ got_ratelimit_init(&rl, 0, 500);
*size_before = 0;
*size_after = 0;
*npacked = 0;
err = get_loose_object_ids(&loose_ids, size_before,
- progress_cb, progress_arg, repo);
+ progress_cb, progress_arg, &rl, repo);
if (err)
return err;
nloose = got_object_idset_num_elements(loose_ids);
@@ -1153,23 +1173,17 @@ got_repo_purge_unreferenced_loose_objects(struct got_r
for (i = 0; i < nreferenced; i++) {
struct got_object_id *id = referenced_ids[i];
err = load_commit_or_tag(loose_ids, &ncommits, npacked,
- traversed_ids, id, repo, progress_cb, progress_arg, nloose,
- cancel_cb, cancel_arg);
+ traversed_ids, id, repo, progress_cb, progress_arg, &rl,
+ nloose, cancel_cb, cancel_arg);
if (err)
goto done;
}
- /* Produce a final progress report in case no objects can be purged. */
- if (got_object_idset_num_elements(loose_ids) == 0 && progress_cb) {
- err = progress_cb(progress_arg, nloose, ncommits, 0);
- if (err)
- goto done;
- }
-
/* Any remaining loose objects are unreferenced and can be purged. */
arg.repo = repo;
arg.progress_arg = progress_arg;
arg.progress_cb = progress_cb;
+ arg.rl = &rl;
arg.nloose = nloose;
arg.npurged = 0;
arg.size_purged = 0;
@@ -1181,6 +1195,14 @@ got_repo_purge_unreferenced_loose_objects(struct got_r
if (err)
goto done;
*size_after = *size_before - arg.size_purged;
+
+ /* Produce a final progress report. */
+ if (progress_cb) {
+ err = progress_cb(progress_arg, nloose, ncommits,
+ got_object_idset_num_elements(loose_ids));
+ if (err)
+ goto done;
+ }
done:
got_object_idset_free(loose_ids);
got_object_idset_free(traversed_ids);
rate-limiting of gotadmin progress output