|  | #define USE_THE_REPOSITORY_VARIABLE | 
|  |  | 
|  | #include "git-compat-util.h" | 
|  | #include "gettext.h" | 
|  | #include "hex.h" | 
|  | #include "refs.h" | 
|  | #include "commit.h" | 
|  | #include "blob.h" | 
|  | #include "diff.h" | 
|  | #include "revision.h" | 
|  | #include "reachable.h" | 
|  | #include "cache-tree.h" | 
|  | #include "progress.h" | 
|  | #include "list-objects.h" | 
|  | #include "packfile.h" | 
|  | #include "worktree.h" | 
|  | #include "object-file.h" | 
|  | #include "pack-bitmap.h" | 
|  | #include "pack-mtimes.h" | 
|  | #include "config.h" | 
|  | #include "run-command.h" | 
|  | #include "sequencer.h" | 
|  |  | 
|  | struct connectivity_progress { | 
|  | struct progress *progress; | 
|  | unsigned long count; | 
|  | }; | 
|  |  | 
|  | static void update_progress(struct connectivity_progress *cp) | 
|  | { | 
|  | cp->count++; | 
|  | if ((cp->count & 1023) == 0) | 
|  | display_progress(cp->progress, cp->count); | 
|  | } | 
|  |  | 
|  | static void add_one_file(const char *path, struct rev_info *revs) | 
|  | { | 
|  | struct strbuf buf = STRBUF_INIT; | 
|  | struct object_id oid; | 
|  | struct object *object; | 
|  |  | 
|  | if (!read_oneliner(&buf, path, READ_ONELINER_SKIP_IF_EMPTY)) { | 
|  | strbuf_release(&buf); | 
|  | return; | 
|  | } | 
|  | strbuf_trim(&buf); | 
|  | if (!get_oid_hex(buf.buf, &oid)) { | 
|  | object = parse_object_or_die(the_repository, &oid, buf.buf); | 
|  | add_pending_object(revs, object, ""); | 
|  | } | 
|  | strbuf_release(&buf); | 
|  | } | 
|  |  | 
|  | /* Mark objects recorded in rebase state files as reachable. */ | 
|  | static void add_rebase_files(struct rev_info *revs) | 
|  | { | 
|  | struct strbuf buf = STRBUF_INIT; | 
|  | size_t len; | 
|  | const char *path[] = { | 
|  | "rebase-apply/autostash", | 
|  | "rebase-apply/orig-head", | 
|  | "rebase-merge/autostash", | 
|  | "rebase-merge/orig-head", | 
|  | }; | 
|  | struct worktree **worktrees = get_worktrees(); | 
|  |  | 
|  | for (struct worktree **wt = worktrees; *wt; wt++) { | 
|  | char *wt_gitdir = get_worktree_git_dir(*wt); | 
|  |  | 
|  | strbuf_reset(&buf); | 
|  | strbuf_addstr(&buf, wt_gitdir); | 
|  | strbuf_complete(&buf, '/'); | 
|  | len = buf.len; | 
|  | for (size_t i = 0; i < ARRAY_SIZE(path); i++) { | 
|  | strbuf_setlen(&buf, len); | 
|  | strbuf_addstr(&buf, path[i]); | 
|  | add_one_file(buf.buf, revs); | 
|  | } | 
|  |  | 
|  | free(wt_gitdir); | 
|  | } | 
|  | strbuf_release(&buf); | 
|  | free_worktrees(worktrees); | 
|  | } | 
|  |  | 
|  | static int add_one_ref(const char *path, const char *referent UNUSED, const struct object_id *oid, | 
|  | int flag, void *cb_data) | 
|  | { | 
|  | struct rev_info *revs = (struct rev_info *)cb_data; | 
|  | struct object *object; | 
|  |  | 
|  | if ((flag & REF_ISSYMREF) && (flag & REF_ISBROKEN)) { | 
|  | warning("symbolic ref is dangling: %s", path); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | object = parse_object_or_die(the_repository, oid, path); | 
|  | add_pending_object(revs, object, ""); | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | /* | 
|  | * The traversal will have already marked us as SEEN, so we | 
|  | * only need to handle any progress reporting here. | 
|  | */ | 
|  | static void mark_object(struct object *obj UNUSED, | 
|  | const char *name UNUSED, | 
|  | void *data) | 
|  | { | 
|  | update_progress(data); | 
|  | } | 
|  |  | 
|  | static void mark_commit(struct commit *c, void *data) | 
|  | { | 
|  | mark_object(&c->object, NULL, data); | 
|  | } | 
|  |  | 
|  | struct recent_data { | 
|  | struct rev_info *revs; | 
|  | timestamp_t timestamp; | 
|  | report_recent_object_fn *cb; | 
|  | int ignore_in_core_kept_packs; | 
|  |  | 
|  | struct oidset extra_recent_oids; | 
|  | int extra_recent_oids_loaded; | 
|  | }; | 
|  |  | 
|  | static int run_one_gc_recent_objects_hook(struct oidset *set, | 
|  | const char *args) | 
|  | { | 
|  | struct child_process cmd = CHILD_PROCESS_INIT; | 
|  | struct strbuf buf = STRBUF_INIT; | 
|  | FILE *out; | 
|  | int ret = 0; | 
|  |  | 
|  | cmd.use_shell = 1; | 
|  | cmd.out = -1; | 
|  |  | 
|  | strvec_push(&cmd.args, args); | 
|  |  | 
|  | if (start_command(&cmd)) | 
|  | return -1; | 
|  |  | 
|  | out = xfdopen(cmd.out, "r"); | 
|  | while (strbuf_getline(&buf, out) != EOF) { | 
|  | struct object_id oid; | 
|  | const char *rest; | 
|  |  | 
|  | if (parse_oid_hex(buf.buf, &oid, &rest) || *rest) { | 
|  | ret = error(_("invalid extra cruft tip: '%s'"), buf.buf); | 
|  | break; | 
|  | } | 
|  |  | 
|  | oidset_insert(set, &oid); | 
|  | } | 
|  |  | 
|  | fclose(out); | 
|  | ret |= finish_command(&cmd); | 
|  |  | 
|  | strbuf_release(&buf); | 
|  | return ret; | 
|  | } | 
|  |  | 
|  | static void load_gc_recent_objects(struct recent_data *data) | 
|  | { | 
|  | const struct string_list *programs; | 
|  | int ret = 0; | 
|  | size_t i; | 
|  |  | 
|  | data->extra_recent_oids_loaded = 1; | 
|  |  | 
|  | if (repo_config_get_string_multi(the_repository, "gc.recentobjectshook", &programs)) | 
|  | return; | 
|  |  | 
|  | for (i = 0; i < programs->nr; i++) { | 
|  | ret = run_one_gc_recent_objects_hook(&data->extra_recent_oids, | 
|  | programs->items[i].string); | 
|  | if (ret) | 
|  | die(_("unable to enumerate additional recent objects")); | 
|  | } | 
|  | } | 
|  |  | 
|  | static int obj_is_recent(const struct object_id *oid, timestamp_t mtime, | 
|  | struct recent_data *data) | 
|  | { | 
|  | if (mtime > data->timestamp) | 
|  | return 1; | 
|  |  | 
|  | if (!data->extra_recent_oids_loaded) | 
|  | load_gc_recent_objects(data); | 
|  | return oidset_contains(&data->extra_recent_oids, oid); | 
|  | } | 
|  |  | 
|  | static void add_recent_object(const struct object_id *oid, | 
|  | struct packed_git *pack, | 
|  | off_t offset, | 
|  | timestamp_t mtime, | 
|  | struct recent_data *data) | 
|  | { | 
|  | struct object *obj; | 
|  | enum object_type type; | 
|  |  | 
|  | if (!obj_is_recent(oid, mtime, data)) | 
|  | return; | 
|  |  | 
|  | /* | 
|  | * We do not want to call parse_object here, because | 
|  | * inflating blobs and trees could be very expensive. | 
|  | * However, we do need to know the correct type for | 
|  | * later processing, and the revision machinery expects | 
|  | * commits and tags to have been parsed. | 
|  | */ | 
|  | type = odb_read_object_info(the_repository->objects, oid, NULL); | 
|  | if (type < 0) | 
|  | die("unable to get object info for %s", oid_to_hex(oid)); | 
|  |  | 
|  | switch (type) { | 
|  | case OBJ_TAG: | 
|  | case OBJ_COMMIT: | 
|  | obj = parse_object_or_die(the_repository, oid, NULL); | 
|  | break; | 
|  | case OBJ_TREE: | 
|  | obj = (struct object *)lookup_tree(the_repository, oid); | 
|  | break; | 
|  | case OBJ_BLOB: | 
|  | obj = (struct object *)lookup_blob(the_repository, oid); | 
|  | break; | 
|  | default: | 
|  | die("unknown object type for %s: %s", | 
|  | oid_to_hex(oid), type_name(type)); | 
|  | } | 
|  |  | 
|  | if (!obj) | 
|  | die("unable to lookup %s", oid_to_hex(oid)); | 
|  |  | 
|  | add_pending_object(data->revs, obj, ""); | 
|  | if (data->cb) | 
|  | data->cb(obj, pack, offset, mtime); | 
|  | } | 
|  |  | 
|  | static int want_recent_object(struct recent_data *data, | 
|  | const struct object_id *oid) | 
|  | { | 
|  | if (data->ignore_in_core_kept_packs && | 
|  | has_object_kept_pack(data->revs->repo, oid, IN_CORE_KEEP_PACKS)) | 
|  | return 0; | 
|  | return 1; | 
|  | } | 
|  |  | 
|  | static int add_recent_loose(const struct object_id *oid, | 
|  | const char *path, void *data) | 
|  | { | 
|  | struct stat st; | 
|  | struct object *obj; | 
|  |  | 
|  | if (!want_recent_object(data, oid)) | 
|  | return 0; | 
|  |  | 
|  | obj = lookup_object(the_repository, oid); | 
|  |  | 
|  | if (obj && obj->flags & SEEN) | 
|  | return 0; | 
|  |  | 
|  | if (stat(path, &st) < 0) { | 
|  | /* | 
|  | * It's OK if an object went away during our iteration; this | 
|  | * could be due to a simultaneous repack. But anything else | 
|  | * we should abort, since we might then fail to mark objects | 
|  | * which should not be pruned. | 
|  | */ | 
|  | if (errno == ENOENT) | 
|  | return 0; | 
|  | return error_errno("unable to stat %s", oid_to_hex(oid)); | 
|  | } | 
|  |  | 
|  | add_recent_object(oid, NULL, 0, st.st_mtime, data); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static int add_recent_packed(const struct object_id *oid, | 
|  | struct packed_git *p, | 
|  | uint32_t pos, | 
|  | void *data) | 
|  | { | 
|  | struct object *obj; | 
|  | timestamp_t mtime = p->mtime; | 
|  |  | 
|  | if (!want_recent_object(data, oid)) | 
|  | return 0; | 
|  |  | 
|  | obj = lookup_object(the_repository, oid); | 
|  |  | 
|  | if (obj && obj->flags & SEEN) | 
|  | return 0; | 
|  | if (p->is_cruft) { | 
|  | if (load_pack_mtimes(p) < 0) | 
|  | die(_("could not load cruft pack .mtimes")); | 
|  | mtime = nth_packed_mtime(p, pos); | 
|  | } | 
|  | add_recent_object(oid, p, nth_packed_object_offset(p, pos), mtime, data); | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | int add_unseen_recent_objects_to_traversal(struct rev_info *revs, | 
|  | timestamp_t timestamp, | 
|  | report_recent_object_fn *cb, | 
|  | int ignore_in_core_kept_packs) | 
|  | { | 
|  | struct recent_data data; | 
|  | enum for_each_object_flags flags; | 
|  | int r; | 
|  |  | 
|  | data.revs = revs; | 
|  | data.timestamp = timestamp; | 
|  | data.cb = cb; | 
|  | data.ignore_in_core_kept_packs = ignore_in_core_kept_packs; | 
|  |  | 
|  | oidset_init(&data.extra_recent_oids, 0); | 
|  | data.extra_recent_oids_loaded = 0; | 
|  |  | 
|  | r = for_each_loose_object(the_repository->objects, add_recent_loose, &data, | 
|  | FOR_EACH_OBJECT_LOCAL_ONLY); | 
|  | if (r) | 
|  | goto done; | 
|  |  | 
|  | flags = FOR_EACH_OBJECT_LOCAL_ONLY | FOR_EACH_OBJECT_PACK_ORDER; | 
|  | if (ignore_in_core_kept_packs) | 
|  | flags |= FOR_EACH_OBJECT_SKIP_IN_CORE_KEPT_PACKS; | 
|  |  | 
|  | r = for_each_packed_object(revs->repo, add_recent_packed, &data, flags); | 
|  |  | 
|  | done: | 
|  | oidset_clear(&data.extra_recent_oids); | 
|  |  | 
|  | return r; | 
|  | } | 
|  |  | 
|  | static int mark_object_seen(const struct object_id *oid, | 
|  | enum object_type type, | 
|  | int exclude UNUSED, | 
|  | uint32_t name_hash UNUSED, | 
|  | struct packed_git *found_pack UNUSED, | 
|  | off_t found_offset UNUSED, | 
|  | void *payload UNUSED) | 
|  | { | 
|  | struct object *obj = lookup_object_by_type(the_repository, oid, type); | 
|  | if (!obj) | 
|  | die("unable to create object '%s'", oid_to_hex(oid)); | 
|  |  | 
|  | obj->flags |= SEEN; | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | void mark_reachable_objects(struct rev_info *revs, int mark_reflog, | 
|  | timestamp_t mark_recent, struct progress *progress) | 
|  | { | 
|  | struct connectivity_progress cp; | 
|  | struct bitmap_index *bitmap_git; | 
|  |  | 
|  | /* | 
|  | * Set up revision parsing, and mark us as being interested | 
|  | * in all object types, not just commits. | 
|  | */ | 
|  | revs->tag_objects = 1; | 
|  | revs->blob_objects = 1; | 
|  | revs->tree_objects = 1; | 
|  |  | 
|  | /* Add all refs from the index file */ | 
|  | add_index_objects_to_pending(revs, 0); | 
|  |  | 
|  | /* Add all external refs */ | 
|  | refs_for_each_ref(get_main_ref_store(the_repository), add_one_ref, | 
|  | revs); | 
|  |  | 
|  | /* detached HEAD is not included in the list above */ | 
|  | refs_head_ref(get_main_ref_store(the_repository), add_one_ref, revs); | 
|  | other_head_refs(add_one_ref, revs); | 
|  |  | 
|  | /* rebase autostash and orig-head */ | 
|  | add_rebase_files(revs); | 
|  |  | 
|  | /* Add all reflog info */ | 
|  | if (mark_reflog) | 
|  | add_reflogs_to_pending(revs, 0); | 
|  |  | 
|  | cp.progress = progress; | 
|  | cp.count = 0; | 
|  |  | 
|  | bitmap_git = prepare_bitmap_walk(revs, 0); | 
|  | if (bitmap_git) { | 
|  | traverse_bitmap_commit_list(bitmap_git, revs, mark_object_seen); | 
|  | free_bitmap_index(bitmap_git); | 
|  | } else { | 
|  | if (prepare_revision_walk(revs)) | 
|  | die("revision walk setup failed"); | 
|  | traverse_commit_list(revs, mark_commit, mark_object, &cp); | 
|  | } | 
|  |  | 
|  | if (mark_recent) { | 
|  | revs->ignore_missing_links = 1; | 
|  | if (add_unseen_recent_objects_to_traversal(revs, mark_recent, | 
|  | NULL, 0)) | 
|  | die("unable to mark recent objects"); | 
|  | if (prepare_revision_walk(revs)) | 
|  | die("revision walk setup failed"); | 
|  | traverse_commit_list(revs, mark_commit, mark_object, &cp); | 
|  | } | 
|  |  | 
|  | display_progress(cp.progress, cp.count); | 
|  | } |