summaryrefslogtreecommitdiffstats
path: root/reachable.c
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-09 13:34:27 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-09 13:34:27 +0000
commit4dbdc42d9e7c3968ff7f690d00680419c9b8cb0f (patch)
tree47c1d492e9c956c1cd2b74dbd3b9d8b0db44dc4e /reachable.c
parentInitial commit. (diff)
downloadgit-4dbdc42d9e7c3968ff7f690d00680419c9b8cb0f.tar.xz
git-4dbdc42d9e7c3968ff7f690d00680419c9b8cb0f.zip
Adding upstream version 1:2.43.0.upstream/1%2.43.0
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'reachable.c')
-rw-r--r--reachable.c354
1 files changed, 354 insertions, 0 deletions
diff --git a/reachable.c b/reachable.c
new file mode 100644
index 0000000..0ce8f83
--- /dev/null
+++ b/reachable.c
@@ -0,0 +1,354 @@
+#include "git-compat-util.h"
+#include "gettext.h"
+#include "hex.h"
+#include "refs.h"
+#include "tag.h"
+#include "commit.h"
+#include "blob.h"
+#include "diff.h"
+#include "revision.h"
+#include "reachable.h"
+#include "cache-tree.h"
+#include "progress.h"
+#include "list-objects.h"
+#include "packfile.h"
+#include "worktree.h"
+#include "object-store-ll.h"
+#include "pack-bitmap.h"
+#include "pack-mtimes.h"
+#include "config.h"
+#include "run-command.h"
+
+struct connectivity_progress {
+ struct progress *progress;
+ unsigned long count;
+};
+
+static void update_progress(struct connectivity_progress *cp)
+{
+ cp->count++;
+ if ((cp->count & 1023) == 0)
+ display_progress(cp->progress, cp->count);
+}
+
+static int add_one_ref(const char *path, const struct object_id *oid,
+ int flag, void *cb_data)
+{
+ struct rev_info *revs = (struct rev_info *)cb_data;
+ struct object *object;
+
+ if ((flag & REF_ISSYMREF) && (flag & REF_ISBROKEN)) {
+ warning("symbolic ref is dangling: %s", path);
+ return 0;
+ }
+
+ object = parse_object_or_die(oid, path);
+ add_pending_object(revs, object, "");
+
+ return 0;
+}
+
+/*
+ * The traversal will have already marked us as SEEN, so we
+ * only need to handle any progress reporting here.
+ */
+static void mark_object(struct object *obj UNUSED,
+ const char *name UNUSED,
+ void *data)
+{
+ update_progress(data);
+}
+
+static void mark_commit(struct commit *c, void *data)
+{
+ mark_object(&c->object, NULL, data);
+}
+
+struct recent_data {
+ struct rev_info *revs;
+ timestamp_t timestamp;
+ report_recent_object_fn *cb;
+ int ignore_in_core_kept_packs;
+
+ struct oidset extra_recent_oids;
+ int extra_recent_oids_loaded;
+};
+
+static int run_one_gc_recent_objects_hook(struct oidset *set,
+ const char *args)
+{
+ struct child_process cmd = CHILD_PROCESS_INIT;
+ struct strbuf buf = STRBUF_INIT;
+ FILE *out;
+ int ret = 0;
+
+ cmd.use_shell = 1;
+ cmd.out = -1;
+
+ strvec_push(&cmd.args, args);
+
+ if (start_command(&cmd))
+ return -1;
+
+ out = xfdopen(cmd.out, "r");
+ while (strbuf_getline(&buf, out) != EOF) {
+ struct object_id oid;
+ const char *rest;
+
+ if (parse_oid_hex(buf.buf, &oid, &rest) || *rest) {
+ ret = error(_("invalid extra cruft tip: '%s'"), buf.buf);
+ break;
+ }
+
+ oidset_insert(set, &oid);
+ }
+
+ fclose(out);
+ ret |= finish_command(&cmd);
+
+ strbuf_release(&buf);
+ return ret;
+}
+
+static void load_gc_recent_objects(struct recent_data *data)
+{
+ const struct string_list *programs;
+ int ret = 0;
+ size_t i;
+
+ data->extra_recent_oids_loaded = 1;
+
+ if (git_config_get_string_multi("gc.recentobjectshook", &programs))
+ return;
+
+ for (i = 0; i < programs->nr; i++) {
+ ret = run_one_gc_recent_objects_hook(&data->extra_recent_oids,
+ programs->items[i].string);
+ if (ret)
+ die(_("unable to enumerate additional recent objects"));
+ }
+}
+
+static int obj_is_recent(const struct object_id *oid, timestamp_t mtime,
+ struct recent_data *data)
+{
+ if (mtime > data->timestamp)
+ return 1;
+
+ if (!data->extra_recent_oids_loaded)
+ load_gc_recent_objects(data);
+ return oidset_contains(&data->extra_recent_oids, oid);
+}
+
+static void add_recent_object(const struct object_id *oid,
+ struct packed_git *pack,
+ off_t offset,
+ timestamp_t mtime,
+ struct recent_data *data)
+{
+ struct object *obj;
+ enum object_type type;
+
+ if (!obj_is_recent(oid, mtime, data))
+ return;
+
+ /*
+ * We do not want to call parse_object here, because
+ * inflating blobs and trees could be very expensive.
+ * However, we do need to know the correct type for
+ * later processing, and the revision machinery expects
+ * commits and tags to have been parsed.
+ */
+ type = oid_object_info(the_repository, oid, NULL);
+ if (type < 0)
+ die("unable to get object info for %s", oid_to_hex(oid));
+
+ switch (type) {
+ case OBJ_TAG:
+ case OBJ_COMMIT:
+ obj = parse_object_or_die(oid, NULL);
+ break;
+ case OBJ_TREE:
+ obj = (struct object *)lookup_tree(the_repository, oid);
+ break;
+ case OBJ_BLOB:
+ obj = (struct object *)lookup_blob(the_repository, oid);
+ break;
+ default:
+ die("unknown object type for %s: %s",
+ oid_to_hex(oid), type_name(type));
+ }
+
+ if (!obj)
+ die("unable to lookup %s", oid_to_hex(oid));
+
+ add_pending_object(data->revs, obj, "");
+ if (data->cb)
+ data->cb(obj, pack, offset, mtime);
+}
+
+static int want_recent_object(struct recent_data *data,
+ const struct object_id *oid)
+{
+ if (data->ignore_in_core_kept_packs &&
+ has_object_kept_pack(oid, IN_CORE_KEEP_PACKS))
+ return 0;
+ return 1;
+}
+
+static int add_recent_loose(const struct object_id *oid,
+ const char *path, void *data)
+{
+ struct stat st;
+ struct object *obj;
+
+ if (!want_recent_object(data, oid))
+ return 0;
+
+ obj = lookup_object(the_repository, oid);
+
+ if (obj && obj->flags & SEEN)
+ return 0;
+
+ if (stat(path, &st) < 0) {
+ /*
+ * It's OK if an object went away during our iteration; this
+ * could be due to a simultaneous repack. But anything else
+ * we should abort, since we might then fail to mark objects
+ * which should not be pruned.
+ */
+ if (errno == ENOENT)
+ return 0;
+ return error_errno("unable to stat %s", oid_to_hex(oid));
+ }
+
+ add_recent_object(oid, NULL, 0, st.st_mtime, data);
+ return 0;
+}
+
+static int add_recent_packed(const struct object_id *oid,
+ struct packed_git *p,
+ uint32_t pos,
+ void *data)
+{
+ struct object *obj;
+ timestamp_t mtime = p->mtime;
+
+ if (!want_recent_object(data, oid))
+ return 0;
+
+ obj = lookup_object(the_repository, oid);
+
+ if (obj && obj->flags & SEEN)
+ return 0;
+ if (p->is_cruft) {
+ if (load_pack_mtimes(p) < 0)
+ die(_("could not load cruft pack .mtimes"));
+ mtime = nth_packed_mtime(p, pos);
+ }
+ add_recent_object(oid, p, nth_packed_object_offset(p, pos), mtime, data);
+ return 0;
+}
+
+int add_unseen_recent_objects_to_traversal(struct rev_info *revs,
+ timestamp_t timestamp,
+ report_recent_object_fn *cb,
+ int ignore_in_core_kept_packs)
+{
+ struct recent_data data;
+ enum for_each_object_flags flags;
+ int r;
+
+ data.revs = revs;
+ data.timestamp = timestamp;
+ data.cb = cb;
+ data.ignore_in_core_kept_packs = ignore_in_core_kept_packs;
+
+ oidset_init(&data.extra_recent_oids, 0);
+ data.extra_recent_oids_loaded = 0;
+
+ r = for_each_loose_object(add_recent_loose, &data,
+ FOR_EACH_OBJECT_LOCAL_ONLY);
+ if (r)
+ goto done;
+
+ flags = FOR_EACH_OBJECT_LOCAL_ONLY | FOR_EACH_OBJECT_PACK_ORDER;
+ if (ignore_in_core_kept_packs)
+ flags |= FOR_EACH_OBJECT_SKIP_IN_CORE_KEPT_PACKS;
+
+ r = for_each_packed_object(add_recent_packed, &data, flags);
+
+done:
+ oidset_clear(&data.extra_recent_oids);
+
+ return r;
+}
+
+static int mark_object_seen(const struct object_id *oid,
+ enum object_type type,
+ int exclude UNUSED,
+ uint32_t name_hash UNUSED,
+ struct packed_git *found_pack UNUSED,
+ off_t found_offset UNUSED)
+{
+ struct object *obj = lookup_object_by_type(the_repository, oid, type);
+ if (!obj)
+ die("unable to create object '%s'", oid_to_hex(oid));
+
+ obj->flags |= SEEN;
+ return 0;
+}
+
+void mark_reachable_objects(struct rev_info *revs, int mark_reflog,
+ timestamp_t mark_recent, struct progress *progress)
+{
+ struct connectivity_progress cp;
+ struct bitmap_index *bitmap_git;
+
+ /*
+ * Set up revision parsing, and mark us as being interested
+ * in all object types, not just commits.
+ */
+ revs->tag_objects = 1;
+ revs->blob_objects = 1;
+ revs->tree_objects = 1;
+
+ /* Add all refs from the index file */
+ add_index_objects_to_pending(revs, 0);
+
+ /* Add all external refs */
+ for_each_ref(add_one_ref, revs);
+
+ /* detached HEAD is not included in the list above */
+ head_ref(add_one_ref, revs);
+ other_head_refs(add_one_ref, revs);
+
+ /* Add all reflog info */
+ if (mark_reflog)
+ add_reflogs_to_pending(revs, 0);
+
+ cp.progress = progress;
+ cp.count = 0;
+
+ bitmap_git = prepare_bitmap_walk(revs, 0);
+ if (bitmap_git) {
+ traverse_bitmap_commit_list(bitmap_git, revs, mark_object_seen);
+ free_bitmap_index(bitmap_git);
+ } else {
+ if (prepare_revision_walk(revs))
+ die("revision walk setup failed");
+ traverse_commit_list(revs, mark_commit, mark_object, &cp);
+ }
+
+ if (mark_recent) {
+ revs->ignore_missing_links = 1;
+ if (add_unseen_recent_objects_to_traversal(revs, mark_recent,
+ NULL, 0))
+ die("unable to mark recent objects");
+ if (prepare_revision_walk(revs))
+ die("revision walk setup failed");
+ traverse_commit_list(revs, mark_commit, mark_object, &cp);
+ }
+
+ display_progress(cp.progress, cp.count);
+}