diff options
Diffstat (limited to '')
-rw-r--r-- | reachable.c | 354 |
1 files changed, 354 insertions, 0 deletions
diff --git a/reachable.c b/reachable.c new file mode 100644 index 0000000..0ce8f83 --- /dev/null +++ b/reachable.c @@ -0,0 +1,354 @@ +#include "git-compat-util.h" +#include "gettext.h" +#include "hex.h" +#include "refs.h" +#include "tag.h" +#include "commit.h" +#include "blob.h" +#include "diff.h" +#include "revision.h" +#include "reachable.h" +#include "cache-tree.h" +#include "progress.h" +#include "list-objects.h" +#include "packfile.h" +#include "worktree.h" +#include "object-store-ll.h" +#include "pack-bitmap.h" +#include "pack-mtimes.h" +#include "config.h" +#include "run-command.h" + +struct connectivity_progress { + struct progress *progress; + unsigned long count; +}; + +static void update_progress(struct connectivity_progress *cp) +{ + cp->count++; + if ((cp->count & 1023) == 0) + display_progress(cp->progress, cp->count); +} + +static int add_one_ref(const char *path, const struct object_id *oid, + int flag, void *cb_data) +{ + struct rev_info *revs = (struct rev_info *)cb_data; + struct object *object; + + if ((flag & REF_ISSYMREF) && (flag & REF_ISBROKEN)) { + warning("symbolic ref is dangling: %s", path); + return 0; + } + + object = parse_object_or_die(oid, path); + add_pending_object(revs, object, ""); + + return 0; +} + +/* + * The traversal will have already marked us as SEEN, so we + * only need to handle any progress reporting here. + */ +static void mark_object(struct object *obj UNUSED, + const char *name UNUSED, + void *data) +{ + update_progress(data); +} + +static void mark_commit(struct commit *c, void *data) +{ + mark_object(&c->object, NULL, data); +} + +struct recent_data { + struct rev_info *revs; + timestamp_t timestamp; + report_recent_object_fn *cb; + int ignore_in_core_kept_packs; + + struct oidset extra_recent_oids; + int extra_recent_oids_loaded; +}; + +static int run_one_gc_recent_objects_hook(struct oidset *set, + const char *args) +{ + struct child_process cmd = CHILD_PROCESS_INIT; + struct strbuf buf = STRBUF_INIT; + FILE *out; + int ret = 0; + + cmd.use_shell = 1; + cmd.out = -1; + + strvec_push(&cmd.args, args); + + if (start_command(&cmd)) + return -1; + + out = xfdopen(cmd.out, "r"); + while (strbuf_getline(&buf, out) != EOF) { + struct object_id oid; + const char *rest; + + if (parse_oid_hex(buf.buf, &oid, &rest) || *rest) { + ret = error(_("invalid extra cruft tip: '%s'"), buf.buf); + break; + } + + oidset_insert(set, &oid); + } + + fclose(out); + ret |= finish_command(&cmd); + + strbuf_release(&buf); + return ret; +} + +static void load_gc_recent_objects(struct recent_data *data) +{ + const struct string_list *programs; + int ret = 0; + size_t i; + + data->extra_recent_oids_loaded = 1; + + if (git_config_get_string_multi("gc.recentobjectshook", &programs)) + return; + + for (i = 0; i < programs->nr; i++) { + ret = run_one_gc_recent_objects_hook(&data->extra_recent_oids, + programs->items[i].string); + if (ret) + die(_("unable to enumerate additional recent objects")); + } +} + +static int obj_is_recent(const struct object_id *oid, timestamp_t mtime, + struct recent_data *data) +{ + if (mtime > data->timestamp) + return 1; + + if (!data->extra_recent_oids_loaded) + load_gc_recent_objects(data); + return oidset_contains(&data->extra_recent_oids, oid); +} + +static void add_recent_object(const struct object_id *oid, + struct packed_git *pack, + off_t offset, + timestamp_t mtime, + struct recent_data *data) +{ + struct object *obj; + enum object_type type; + + if (!obj_is_recent(oid, mtime, data)) + return; + + /* + * We do not want to call parse_object here, because + * inflating blobs and trees could be very expensive. + * However, we do need to know the correct type for + * later processing, and the revision machinery expects + * commits and tags to have been parsed. + */ + type = oid_object_info(the_repository, oid, NULL); + if (type < 0) + die("unable to get object info for %s", oid_to_hex(oid)); + + switch (type) { + case OBJ_TAG: + case OBJ_COMMIT: + obj = parse_object_or_die(oid, NULL); + break; + case OBJ_TREE: + obj = (struct object *)lookup_tree(the_repository, oid); + break; + case OBJ_BLOB: + obj = (struct object *)lookup_blob(the_repository, oid); + break; + default: + die("unknown object type for %s: %s", + oid_to_hex(oid), type_name(type)); + } + + if (!obj) + die("unable to lookup %s", oid_to_hex(oid)); + + add_pending_object(data->revs, obj, ""); + if (data->cb) + data->cb(obj, pack, offset, mtime); +} + +static int want_recent_object(struct recent_data *data, + const struct object_id *oid) +{ + if (data->ignore_in_core_kept_packs && + has_object_kept_pack(oid, IN_CORE_KEEP_PACKS)) + return 0; + return 1; +} + +static int add_recent_loose(const struct object_id *oid, + const char *path, void *data) +{ + struct stat st; + struct object *obj; + + if (!want_recent_object(data, oid)) + return 0; + + obj = lookup_object(the_repository, oid); + + if (obj && obj->flags & SEEN) + return 0; + + if (stat(path, &st) < 0) { + /* + * It's OK if an object went away during our iteration; this + * could be due to a simultaneous repack. But anything else + * we should abort, since we might then fail to mark objects + * which should not be pruned. + */ + if (errno == ENOENT) + return 0; + return error_errno("unable to stat %s", oid_to_hex(oid)); + } + + add_recent_object(oid, NULL, 0, st.st_mtime, data); + return 0; +} + +static int add_recent_packed(const struct object_id *oid, + struct packed_git *p, + uint32_t pos, + void *data) +{ + struct object *obj; + timestamp_t mtime = p->mtime; + + if (!want_recent_object(data, oid)) + return 0; + + obj = lookup_object(the_repository, oid); + + if (obj && obj->flags & SEEN) + return 0; + if (p->is_cruft) { + if (load_pack_mtimes(p) < 0) + die(_("could not load cruft pack .mtimes")); + mtime = nth_packed_mtime(p, pos); + } + add_recent_object(oid, p, nth_packed_object_offset(p, pos), mtime, data); + return 0; +} + +int add_unseen_recent_objects_to_traversal(struct rev_info *revs, + timestamp_t timestamp, + report_recent_object_fn *cb, + int ignore_in_core_kept_packs) +{ + struct recent_data data; + enum for_each_object_flags flags; + int r; + + data.revs = revs; + data.timestamp = timestamp; + data.cb = cb; + data.ignore_in_core_kept_packs = ignore_in_core_kept_packs; + + oidset_init(&data.extra_recent_oids, 0); + data.extra_recent_oids_loaded = 0; + + r = for_each_loose_object(add_recent_loose, &data, + FOR_EACH_OBJECT_LOCAL_ONLY); + if (r) + goto done; + + flags = FOR_EACH_OBJECT_LOCAL_ONLY | FOR_EACH_OBJECT_PACK_ORDER; + if (ignore_in_core_kept_packs) + flags |= FOR_EACH_OBJECT_SKIP_IN_CORE_KEPT_PACKS; + + r = for_each_packed_object(add_recent_packed, &data, flags); + +done: + oidset_clear(&data.extra_recent_oids); + + return r; +} + +static int mark_object_seen(const struct object_id *oid, + enum object_type type, + int exclude UNUSED, + uint32_t name_hash UNUSED, + struct packed_git *found_pack UNUSED, + off_t found_offset UNUSED) +{ + struct object *obj = lookup_object_by_type(the_repository, oid, type); + if (!obj) + die("unable to create object '%s'", oid_to_hex(oid)); + + obj->flags |= SEEN; + return 0; +} + +void mark_reachable_objects(struct rev_info *revs, int mark_reflog, + timestamp_t mark_recent, struct progress *progress) +{ + struct connectivity_progress cp; + struct bitmap_index *bitmap_git; + + /* + * Set up revision parsing, and mark us as being interested + * in all object types, not just commits. + */ + revs->tag_objects = 1; + revs->blob_objects = 1; + revs->tree_objects = 1; + + /* Add all refs from the index file */ + add_index_objects_to_pending(revs, 0); + + /* Add all external refs */ + for_each_ref(add_one_ref, revs); + + /* detached HEAD is not included in the list above */ + head_ref(add_one_ref, revs); + other_head_refs(add_one_ref, revs); + + /* Add all reflog info */ + if (mark_reflog) + add_reflogs_to_pending(revs, 0); + + cp.progress = progress; + cp.count = 0; + + bitmap_git = prepare_bitmap_walk(revs, 0); + if (bitmap_git) { + traverse_bitmap_commit_list(bitmap_git, revs, mark_object_seen); + free_bitmap_index(bitmap_git); + } else { + if (prepare_revision_walk(revs)) + die("revision walk setup failed"); + traverse_commit_list(revs, mark_commit, mark_object, &cp); + } + + if (mark_recent) { + revs->ignore_missing_links = 1; + if (add_unseen_recent_objects_to_traversal(revs, mark_recent, + NULL, 0)) + die("unable to mark recent objects"); + if (prepare_revision_walk(revs)) + die("revision walk setup failed"); + traverse_commit_list(revs, mark_commit, mark_object, &cp); + } + + display_progress(cp.progress, cp.count); +} |