blob: 3b85add243ba79a4ccc90c9faacbb9fee2742303 [file] [log] [blame]
Elijah Newren98750582023-03-21 06:26:04 +00001#include "git-compat-util.h"
Elijah Newrenf394e092023-03-21 06:25:54 +00002#include "gettext.h"
Elijah Newren41771fa2023-02-24 00:09:27 +00003#include "hex.h"
Junio C Hamano94421472007-01-06 02:16:17 -08004#include "refs.h"
Junio C Hamano94421472007-01-06 02:16:17 -08005#include "commit.h"
6#include "blob.h"
7#include "diff.h"
8#include "revision.h"
9#include "reachable.h"
10#include "cache-tree.h"
Nguyễn Thái Ngọc Duydc347192011-11-05 19:00:08 +070011#include "progress.h"
Jeff King5f78a432014-10-15 18:37:28 -040012#include "list-objects.h"
Jonathan Tan7709f462017-08-18 15:20:38 -070013#include "packfile.h"
Nguyễn Thái Ngọc Duyd0c39a42017-08-23 19:36:59 +070014#include "worktree.h"
Elijah Newrena034e912023-05-16 06:34:06 +000015#include "object-store-ll.h"
Jeff Kingfde67d62019-02-13 23:37:43 -050016#include "pack-bitmap.h"
Taylor Blaufb546d62022-05-20 19:17:57 -040017#include "pack-mtimes.h"
Taylor Blau4dc16e22023-06-07 18:58:17 -040018#include "config.h"
19#include "run-command.h"
Phillip Woodbc7f5db2024-02-09 16:19:39 +000020#include "sequencer.h"
Junio C Hamano94421472007-01-06 02:16:17 -080021
Jeff King0b26abc2011-11-08 00:37:00 -050022struct connectivity_progress {
23 struct progress *progress;
24 unsigned long count;
25};
26
27static void update_progress(struct connectivity_progress *cp)
28{
29 cp->count++;
30 if ((cp->count & 1023) == 0)
31 display_progress(cp->progress, cp->count);
32}
33
Phillip Woodbc7f5db2024-02-09 16:19:39 +000034static void add_one_file(const char *path, struct rev_info *revs)
35{
36 struct strbuf buf = STRBUF_INIT;
37 struct object_id oid;
38 struct object *object;
39
40 if (!read_oneliner(&buf, path, READ_ONELINER_SKIP_IF_EMPTY)) {
41 strbuf_release(&buf);
42 return;
43 }
44 strbuf_trim(&buf);
45 if (!get_oid_hex(buf.buf, &oid)) {
46 object = parse_object_or_die(&oid, buf.buf);
47 add_pending_object(revs, object, "");
48 }
49 strbuf_release(&buf);
50}
51
52/* Mark objects recorded in rebase state files as reachable. */
53static void add_rebase_files(struct rev_info *revs)
54{
55 struct strbuf buf = STRBUF_INIT;
56 size_t len;
57 const char *path[] = {
58 "rebase-apply/autostash",
59 "rebase-apply/orig-head",
60 "rebase-merge/autostash",
61 "rebase-merge/orig-head",
62 };
63 struct worktree **worktrees = get_worktrees();
64
65 for (struct worktree **wt = worktrees; *wt; wt++) {
66 strbuf_reset(&buf);
67 strbuf_addstr(&buf, get_worktree_git_dir(*wt));
68 strbuf_complete(&buf, '/');
69 len = buf.len;
70 for (size_t i = 0; i < ARRAY_SIZE(path); i++) {
71 strbuf_setlen(&buf, len);
72 strbuf_addstr(&buf, path[i]);
73 add_one_file(buf.buf, revs);
74 }
75 }
76 strbuf_release(&buf);
77 free_worktrees(worktrees);
78}
79
Michael Haggerty635170f2015-05-25 18:39:00 +000080static int add_one_ref(const char *path, const struct object_id *oid,
81 int flag, void *cb_data)
Junio C Hamano94421472007-01-06 02:16:17 -080082{
Junio C Hamano94421472007-01-06 02:16:17 -080083 struct rev_info *revs = (struct rev_info *)cb_data;
Johannes Schindelin14886b42015-09-28 16:01:25 +020084 struct object *object;
Junio C Hamano94421472007-01-06 02:16:17 -080085
Johannes Schindelin14886b42015-09-28 16:01:25 +020086 if ((flag & REF_ISSYMREF) && (flag & REF_ISBROKEN)) {
87 warning("symbolic ref is dangling: %s", path);
88 return 0;
89 }
90
brian m. carlsonc251c832017-05-06 22:10:38 +000091 object = parse_object_or_die(oid, path);
Junio C Hamano94421472007-01-06 02:16:17 -080092 add_pending_object(revs, object, "");
93
94 return 0;
95}
96
Jeff King5f78a432014-10-15 18:37:28 -040097/*
98 * The traversal will have already marked us as SEEN, so we
99 * only need to handle any progress reporting here.
100 */
Jeff Kingc50dca22023-02-24 01:39:22 -0500101static void mark_object(struct object *obj UNUSED,
102 const char *name UNUSED,
103 void *data)
Jeff King5f78a432014-10-15 18:37:28 -0400104{
105 update_progress(data);
106}
107
108static void mark_commit(struct commit *c, void *data)
109{
Jeff Kingde1e67d2016-02-11 17:28:36 -0500110 mark_object(&c->object, NULL, data);
Jeff King5f78a432014-10-15 18:37:28 -0400111}
112
Jeff Kingd3038d22014-10-15 18:41:35 -0400113struct recent_data {
114 struct rev_info *revs;
Johannes Schindelindddbad72017-04-26 21:29:31 +0200115 timestamp_t timestamp;
Taylor Blau2fb90402022-05-20 19:17:54 -0400116 report_recent_object_fn *cb;
117 int ignore_in_core_kept_packs;
Taylor Blau4dc16e22023-06-07 18:58:17 -0400118
119 struct oidset extra_recent_oids;
120 int extra_recent_oids_loaded;
Jeff Kingd3038d22014-10-15 18:41:35 -0400121};
122
Taylor Blau4dc16e22023-06-07 18:58:17 -0400123static int run_one_gc_recent_objects_hook(struct oidset *set,
124 const char *args)
125{
126 struct child_process cmd = CHILD_PROCESS_INIT;
127 struct strbuf buf = STRBUF_INIT;
128 FILE *out;
129 int ret = 0;
130
131 cmd.use_shell = 1;
132 cmd.out = -1;
133
134 strvec_push(&cmd.args, args);
135
136 if (start_command(&cmd))
137 return -1;
138
139 out = xfdopen(cmd.out, "r");
140 while (strbuf_getline(&buf, out) != EOF) {
141 struct object_id oid;
142 const char *rest;
143
144 if (parse_oid_hex(buf.buf, &oid, &rest) || *rest) {
145 ret = error(_("invalid extra cruft tip: '%s'"), buf.buf);
146 break;
147 }
148
149 oidset_insert(set, &oid);
150 }
151
152 fclose(out);
153 ret |= finish_command(&cmd);
154
155 strbuf_release(&buf);
156 return ret;
157}
158
159static void load_gc_recent_objects(struct recent_data *data)
160{
161 const struct string_list *programs;
162 int ret = 0;
163 size_t i;
164
165 data->extra_recent_oids_loaded = 1;
166
167 if (git_config_get_string_multi("gc.recentobjectshook", &programs))
168 return;
169
170 for (i = 0; i < programs->nr; i++) {
171 ret = run_one_gc_recent_objects_hook(&data->extra_recent_oids,
172 programs->items[i].string);
173 if (ret)
174 die(_("unable to enumerate additional recent objects"));
175 }
176}
177
Taylor Blau01e9ca42023-06-07 18:58:12 -0400178static int obj_is_recent(const struct object_id *oid, timestamp_t mtime,
179 struct recent_data *data)
180{
Taylor Blau4dc16e22023-06-07 18:58:17 -0400181 if (mtime > data->timestamp)
182 return 1;
183
184 if (!data->extra_recent_oids_loaded)
185 load_gc_recent_objects(data);
186 return oidset_contains(&data->extra_recent_oids, oid);
Taylor Blau01e9ca42023-06-07 18:58:12 -0400187}
188
brian m. carlson76c1d9a2017-02-21 23:47:35 +0000189static void add_recent_object(const struct object_id *oid,
Taylor Blau2fb90402022-05-20 19:17:54 -0400190 struct packed_git *pack,
191 off_t offset,
Johannes Schindelindddbad72017-04-26 21:29:31 +0200192 timestamp_t mtime,
Jeff Kingd3038d22014-10-15 18:41:35 -0400193 struct recent_data *data)
194{
195 struct object *obj;
196 enum object_type type;
197
Taylor Blau01e9ca42023-06-07 18:58:12 -0400198 if (!obj_is_recent(oid, mtime, data))
Jeff Kingd3038d22014-10-15 18:41:35 -0400199 return;
200
201 /*
202 * We do not want to call parse_object here, because
203 * inflating blobs and trees could be very expensive.
204 * However, we do need to know the correct type for
205 * later processing, and the revision machinery expects
206 * commits and tags to have been parsed.
207 */
Stefan Beller0df8e962018-04-25 11:20:59 -0700208 type = oid_object_info(the_repository, oid, NULL);
Jeff Kingd3038d22014-10-15 18:41:35 -0400209 if (type < 0)
brian m. carlson76c1d9a2017-02-21 23:47:35 +0000210 die("unable to get object info for %s", oid_to_hex(oid));
Jeff Kingd3038d22014-10-15 18:41:35 -0400211
212 switch (type) {
213 case OBJ_TAG:
214 case OBJ_COMMIT:
brian m. carlsonc251c832017-05-06 22:10:38 +0000215 obj = parse_object_or_die(oid, NULL);
Jeff Kingd3038d22014-10-15 18:41:35 -0400216 break;
217 case OBJ_TREE:
Stefan Bellerf86bcc72018-06-28 18:21:56 -0700218 obj = (struct object *)lookup_tree(the_repository, oid);
Jeff Kingd3038d22014-10-15 18:41:35 -0400219 break;
220 case OBJ_BLOB:
Stefan Bellerda14a7f2018-06-28 18:21:55 -0700221 obj = (struct object *)lookup_blob(the_repository, oid);
Jeff Kingd3038d22014-10-15 18:41:35 -0400222 break;
223 default:
224 die("unknown object type for %s: %s",
Brandon Williamsdebca9d2018-02-14 10:59:24 -0800225 oid_to_hex(oid), type_name(type));
Jeff Kingd3038d22014-10-15 18:41:35 -0400226 }
227
228 if (!obj)
brian m. carlson76c1d9a2017-02-21 23:47:35 +0000229 die("unable to lookup %s", oid_to_hex(oid));
Jeff Kingd3038d22014-10-15 18:41:35 -0400230
231 add_pending_object(data->revs, obj, "");
Taylor Blau2fb90402022-05-20 19:17:54 -0400232 if (data->cb)
233 data->cb(obj, pack, offset, mtime);
234}
235
236static int want_recent_object(struct recent_data *data,
237 const struct object_id *oid)
238{
239 if (data->ignore_in_core_kept_packs &&
240 has_object_kept_pack(oid, IN_CORE_KEEP_PACKS))
241 return 0;
242 return 1;
Jeff Kingd3038d22014-10-15 18:41:35 -0400243}
244
brian m. carlson76c1d9a2017-02-21 23:47:35 +0000245static int add_recent_loose(const struct object_id *oid,
Jeff Kingd3038d22014-10-15 18:41:35 -0400246 const char *path, void *data)
247{
248 struct stat st;
Taylor Blau2fb90402022-05-20 19:17:54 -0400249 struct object *obj;
250
251 if (!want_recent_object(data, oid))
252 return 0;
253
254 obj = lookup_object(the_repository, oid);
Jeff Kingd3038d22014-10-15 18:41:35 -0400255
256 if (obj && obj->flags & SEEN)
257 return 0;
258
259 if (stat(path, &st) < 0) {
260 /*
261 * It's OK if an object went away during our iteration; this
262 * could be due to a simultaneous repack. But anything else
263 * we should abort, since we might then fail to mark objects
264 * which should not be pruned.
265 */
266 if (errno == ENOENT)
267 return 0;
brian m. carlson76c1d9a2017-02-21 23:47:35 +0000268 return error_errno("unable to stat %s", oid_to_hex(oid));
Jeff Kingd3038d22014-10-15 18:41:35 -0400269 }
270
Taylor Blau2fb90402022-05-20 19:17:54 -0400271 add_recent_object(oid, NULL, 0, st.st_mtime, data);
Jeff Kingd3038d22014-10-15 18:41:35 -0400272 return 0;
273}
274
brian m. carlson76c1d9a2017-02-21 23:47:35 +0000275static int add_recent_packed(const struct object_id *oid,
Jeff Kingbe252d32023-02-24 01:39:24 -0500276 struct packed_git *p,
277 uint32_t pos,
Jeff Kingd3038d22014-10-15 18:41:35 -0400278 void *data)
279{
Taylor Blau2fb90402022-05-20 19:17:54 -0400280 struct object *obj;
Taylor Blaufb546d62022-05-20 19:17:57 -0400281 timestamp_t mtime = p->mtime;
Taylor Blau2fb90402022-05-20 19:17:54 -0400282
283 if (!want_recent_object(data, oid))
284 return 0;
285
286 obj = lookup_object(the_repository, oid);
Jeff Kingd3038d22014-10-15 18:41:35 -0400287
288 if (obj && obj->flags & SEEN)
289 return 0;
Taylor Blaufb546d62022-05-20 19:17:57 -0400290 if (p->is_cruft) {
291 if (load_pack_mtimes(p) < 0)
292 die(_("could not load cruft pack .mtimes"));
293 mtime = nth_packed_mtime(p, pos);
294 }
295 add_recent_object(oid, p, nth_packed_object_offset(p, pos), mtime, data);
Jeff Kingd3038d22014-10-15 18:41:35 -0400296 return 0;
297}
298
Jeff Kingabcb8652014-10-15 18:42:09 -0400299int add_unseen_recent_objects_to_traversal(struct rev_info *revs,
Taylor Blau2fb90402022-05-20 19:17:54 -0400300 timestamp_t timestamp,
301 report_recent_object_fn *cb,
302 int ignore_in_core_kept_packs)
Jeff Kingd3038d22014-10-15 18:41:35 -0400303{
304 struct recent_data data;
Taylor Blau2fb90402022-05-20 19:17:54 -0400305 enum for_each_object_flags flags;
Jeff Kingd3038d22014-10-15 18:41:35 -0400306 int r;
307
308 data.revs = revs;
309 data.timestamp = timestamp;
Taylor Blau2fb90402022-05-20 19:17:54 -0400310 data.cb = cb;
311 data.ignore_in_core_kept_packs = ignore_in_core_kept_packs;
Jeff Kingd3038d22014-10-15 18:41:35 -0400312
Taylor Blau4dc16e22023-06-07 18:58:17 -0400313 oidset_init(&data.extra_recent_oids, 0);
314 data.extra_recent_oids_loaded = 0;
315
Jeff King1385bb72015-03-27 07:32:41 -0400316 r = for_each_loose_object(add_recent_loose, &data,
317 FOR_EACH_OBJECT_LOCAL_ONLY);
Jeff Kingd3038d22014-10-15 18:41:35 -0400318 if (r)
Taylor Blau4dc16e22023-06-07 18:58:17 -0400319 goto done;
Taylor Blau2fb90402022-05-20 19:17:54 -0400320
321 flags = FOR_EACH_OBJECT_LOCAL_ONLY | FOR_EACH_OBJECT_PACK_ORDER;
322 if (ignore_in_core_kept_packs)
323 flags |= FOR_EACH_OBJECT_SKIP_IN_CORE_KEPT_PACKS;
324
Taylor Blau4dc16e22023-06-07 18:58:17 -0400325 r = for_each_packed_object(add_recent_packed, &data, flags);
326
327done:
328 oidset_clear(&data.extra_recent_oids);
329
330 return r;
Jeff Kingd3038d22014-10-15 18:41:35 -0400331}
332
Jeff Kingfde67d62019-02-13 23:37:43 -0500333static int mark_object_seen(const struct object_id *oid,
334 enum object_type type,
Jeff Kingc50dca22023-02-24 01:39:22 -0500335 int exclude UNUSED,
336 uint32_t name_hash UNUSED,
337 struct packed_git *found_pack UNUSED,
338 off_t found_offset UNUSED)
Jeff Kingfde67d62019-02-13 23:37:43 -0500339{
340 struct object *obj = lookup_object_by_type(the_repository, oid, type);
341 if (!obj)
342 die("unable to create object '%s'", oid_to_hex(oid));
343
344 obj->flags |= SEEN;
345 return 0;
346}
347
Nguyễn Thái Ngọc Duydc347192011-11-05 19:00:08 +0700348void mark_reachable_objects(struct rev_info *revs, int mark_reflog,
Johannes Schindelindddbad72017-04-26 21:29:31 +0200349 timestamp_t mark_recent, struct progress *progress)
Junio C Hamano94421472007-01-06 02:16:17 -0800350{
Jeff King0b26abc2011-11-08 00:37:00 -0500351 struct connectivity_progress cp;
Jeff Kingfde67d62019-02-13 23:37:43 -0500352 struct bitmap_index *bitmap_git;
Jeff King0b26abc2011-11-08 00:37:00 -0500353
Junio C Hamano94421472007-01-06 02:16:17 -0800354 /*
355 * Set up revision parsing, and mark us as being interested
356 * in all object types, not just commits.
357 */
358 revs->tag_objects = 1;
359 revs->blob_objects = 1;
360 revs->tree_objects = 1;
361
362 /* Add all refs from the index file */
Jeff King1be111d2014-10-16 20:44:30 -0400363 add_index_objects_to_pending(revs, 0);
Junio C Hamano94421472007-01-06 02:16:17 -0800364
365 /* Add all external refs */
Michael Haggerty635170f2015-05-25 18:39:00 +0000366 for_each_ref(add_one_ref, revs);
Junio C Hamano94421472007-01-06 02:16:17 -0800367
Max Kirillovc40fdd02014-09-03 19:14:10 +0300368 /* detached HEAD is not included in the list above */
Michael Haggerty635170f2015-05-25 18:39:00 +0000369 head_ref(add_one_ref, revs);
Nguyễn Thái Ngọc Duyd0c39a42017-08-23 19:36:59 +0700370 other_head_refs(add_one_ref, revs);
Max Kirillovc40fdd02014-09-03 19:14:10 +0300371
Phillip Woodbc7f5db2024-02-09 16:19:39 +0000372 /* rebase autostash and orig-head */
373 add_rebase_files(revs);
374
Nicolas Pitreeb8381c2007-02-03 13:25:43 -0500375 /* Add all reflog info */
Junio C Hamano94421472007-01-06 02:16:17 -0800376 if (mark_reflog)
Jeff King718ccc92014-10-15 18:38:31 -0400377 add_reflogs_to_pending(revs, 0);
Junio C Hamano94421472007-01-06 02:16:17 -0800378
Jeff King0b26abc2011-11-08 00:37:00 -0500379 cp.progress = progress;
380 cp.count = 0;
381
Derrick Stolee09d4a792022-03-09 16:01:35 +0000382 bitmap_git = prepare_bitmap_walk(revs, 0);
Jeff Kingfde67d62019-02-13 23:37:43 -0500383 if (bitmap_git) {
Jeff King4eb707e2020-02-14 13:22:27 -0500384 traverse_bitmap_commit_list(bitmap_git, revs, mark_object_seen);
Jeff Kingfde67d62019-02-13 23:37:43 -0500385 free_bitmap_index(bitmap_git);
Jeff King2ba582b2021-04-28 11:42:43 -0400386 } else {
387 if (prepare_revision_walk(revs))
388 die("revision walk setup failed");
389 traverse_commit_list(revs, mark_commit, mark_object, &cp);
Jeff Kingfde67d62019-02-13 23:37:43 -0500390 }
391
Jeff Kingd3038d22014-10-15 18:41:35 -0400392 if (mark_recent) {
393 revs->ignore_missing_links = 1;
Taylor Blau2fb90402022-05-20 19:17:54 -0400394 if (add_unseen_recent_objects_to_traversal(revs, mark_recent,
395 NULL, 0))
Jeff Kingd3038d22014-10-15 18:41:35 -0400396 die("unable to mark recent objects");
397 if (prepare_revision_walk(revs))
398 die("revision walk setup failed");
399 traverse_commit_list(revs, mark_commit, mark_object, &cp);
400 }
401
Jeff King0b26abc2011-11-08 00:37:00 -0500402 display_progress(cp.progress, cp.count);
Junio C Hamano94421472007-01-06 02:16:17 -0800403}