blob: 5e534f0fcc8d131a6e759ed1658b0e0984123a6e [file] [log] [blame]
Derrick Stolee08fd81c2018-04-02 16:34:19 -04001#ifndef COMMIT_GRAPH_H
2#define COMMIT_GRAPH_H
3
Elijah Newrena034e912023-05-16 06:34:06 +00004#include "object-store-ll.h"
Taylor Blau6830c362020-04-13 22:04:25 -06005#include "oidset.h"
Derrick Stolee2a2e32b2018-04-10 08:56:02 -04006
/*
 * Names of environment variables consulted by the test suite to widen
 * coverage of the commit-graph feature. Each macro expands to the
 * variable's own name as a string literal.
 *
 * NOTE(review): GIT_TEST_COMMIT_GRAPH_DIE_ON_PARSE is presumably read the
 * same way as the other two; confirm at its point of use.
 */
#define GIT_TEST_COMMIT_GRAPH "GIT_TEST_COMMIT_GRAPH"
#define GIT_TEST_COMMIT_GRAPH_DIE_ON_PARSE "GIT_TEST_COMMIT_GRAPH_DIE_ON_PARSE"
#define GIT_TEST_COMMIT_GRAPH_CHANGED_PATHS "GIT_TEST_COMMIT_GRAPH_CHANGED_PATHS"

/*
 * This method is only used to enhance coverage of the commit-graph
 * feature in the test suite with the GIT_TEST_COMMIT_GRAPH and
 * GIT_TEST_COMMIT_GRAPH_CHANGED_PATHS environment variables. Do not
 * call this method outside of a builtin, and only if you know what
 * you are doing!
 */
void git_test_write_commit_graph_or_die(void);

/*
 * Forward declarations. This header only refers to these types through
 * pointers, so their full definitions are not required here.
 */
struct commit;
struct bloom_filter_settings;
struct repository;
struct raw_object_store;
struct string_list;

/*
 * NOTE(review): these two presumably build the path of the commit-graph
 * file (respectively, of the commit-graph chain file) belonging to `odb`.
 * Whether the caller owns the returned string is not visible from this
 * header; confirm in commit-graph.c.
 */
char *get_commit_graph_filename(struct object_directory *odb);
char *get_commit_graph_chain_filename(struct object_directory *odb);

/*
 * NOTE(review): presumably opens `graph_file` and reports the descriptor
 * and its stat data through `fd` and `st`. The meaning of the return
 * value is not visible from this header; confirm before relying on it.
 */
int open_commit_graph(const char *graph_file, int *fd, struct stat *st);

/*
 * Given a commit struct, try to fill the commit struct info, including:
 *  1. tree object
 *  2. date
 *  3. parents.
 *
 * Returns 1 if and only if the commit was found in the packed graph.
 *
 * See parse_commit_buffer() for the fallback after this call.
 */
int parse_commit_in_graph(struct repository *r, struct commit *item);

/*
 * Fills `*pos` with the graph position of `c`, and returns 1 if `c` is
 * found in the commit-graph belonging to `r`, or 0 otherwise.
 * Initializes the commit-graph belonging to `r` if it hasn't been
 * already.
 *
 * Note: this is a low-level helper that does not alter any slab data
 * associated with `c`. Useful in circumstances where the slab data is
 * already being modified (e.g., writing the commit-graph itself).
 *
 * In most cases, callers should use `parse_commit_in_graph()` instead.
 */
int repo_find_commit_pos_in_graph(struct repository *r, struct commit *c,
				  uint32_t *pos);

/*
 * Look up the given commit ID in the commit-graph. This will only return a
 * commit if the ID exists both in the graph and in the object database such
 * that we don't return commits whose object has been pruned. Otherwise, this
 * function returns `NULL`.
 */
struct commit *lookup_commit_in_graph(struct repository *repo, const struct object_id *id);

/*
 * It is possible that we loaded commit contents from the commit buffer,
 * but we also want to ensure the commit-graph content is correctly
 * checked and filled. Fill the graph_pos and generation members of
 * the given commit.
 */
void load_commit_graph_info(struct repository *r, struct commit *item);

/*
 * NOTE(review): presumably returns the tree of `c` as recorded in the
 * commit-graph of `r`. Behavior when `c` is not in the graph is not
 * visible from this header; confirm in commit-graph.c.
 */
struct tree *get_commit_tree_in_graph(struct repository *r,
				      const struct commit *c);

Derrick Stolee2a2e32b2018-04-10 08:56:02 -040076struct commit_graph {
Derrick Stolee2a2e32b2018-04-10 08:56:02 -040077 const unsigned char *data;
78 size_t data_len;
79
80 unsigned char hash_len;
81 unsigned char num_chunks;
82 uint32_t num_commits;
83 struct object_id oid;
Derrick Stolee6c622f92019-06-18 11:14:27 -070084 char *filename;
Taylor Blau13c24992020-02-03 13:18:00 -080085 struct object_directory *odb;
Derrick Stolee2a2e32b2018-04-10 08:56:02 -040086
Derrick Stoleed4f4d602019-06-18 11:14:24 -070087 uint32_t num_commits_in_base;
Abhishek Kumar1fdc3832021-01-16 18:11:16 +000088 unsigned int read_generation_data;
Derrick Stoleed4f4d602019-06-18 11:14:24 -070089 struct commit_graph *base_graph;
90
Derrick Stolee2a2e32b2018-04-10 08:56:02 -040091 const uint32_t *chunk_oid_fanout;
92 const unsigned char *chunk_oid_lookup;
93 const unsigned char *chunk_commit_data;
Abhishek Kumare8b63002021-01-16 18:11:15 +000094 const unsigned char *chunk_generation_data;
95 const unsigned char *chunk_generation_data_overflow;
SZEDER Gábor5af74172019-01-19 21:21:13 +010096 const unsigned char *chunk_extra_edges;
Derrick Stolee118bd572019-06-18 11:14:26 -070097 const unsigned char *chunk_base_graphs;
Garima Singh76ffbca2020-04-06 16:59:49 +000098 const unsigned char *chunk_bloom_indexes;
99 const unsigned char *chunk_bloom_data;
100
Abhishek Kumar72a2bfc2021-01-16 18:11:12 +0000101 struct topo_level_slab *topo_levels;
Garima Singh76ffbca2020-04-06 16:59:49 +0000102 struct bloom_filter_settings *bloom_filter_settings;
Derrick Stolee2a2e32b2018-04-10 08:56:02 -0400103};
104
/*
 * NOTE(review): both presumably load one commit-graph file for `odb`;
 * the first from an already-open descriptor `fd` with its stat data
 * `st`. Failure reporting and ownership of `fd` are not visible from
 * this header; confirm in commit-graph.c.
 */
struct commit_graph *load_commit_graph_one_fd_st(struct repository *r,
						 int fd, struct stat *st,
						 struct object_directory *odb);
struct commit_graph *read_commit_graph_one(struct repository *r,
					   struct object_directory *odb);

/*
 * Callers should initialize the repo_settings with prepare_repo_settings()
 * prior to calling parse_commit_graph().
 */
struct commit_graph *parse_commit_graph(struct repo_settings *s,
					void *graph_map, size_t graph_size);

/*
 * Return 1 if and only if the repository has a commit-graph
 * file and generation numbers are computed in that file.
 */
int generation_numbers_enabled(struct repository *r);

/*
 * Return 1 if and only if the repository has a commit-graph
 * file and generation data chunk has been written for the file.
 */
int corrected_commit_dates_enabled(struct repository *r);

/*
 * NOTE(review): presumably returns the Bloom filter settings associated
 * with the commit-graph of `r`. Whether NULL can be returned is not
 * visible from this header; confirm in commit-graph.c.
 */
struct bloom_filter_settings *get_bloom_filter_settings(struct repository *r);

/*
 * Flags accepted by the write_commit_graph*() functions. Every constant
 * occupies its own bit, so several of them can be combined with bitwise
 * OR.
 */
enum commit_graph_write_flags {
	COMMIT_GRAPH_WRITE_APPEND     = (1 << 0),
	COMMIT_GRAPH_WRITE_PROGRESS   = (1 << 1),
	COMMIT_GRAPH_WRITE_SPLIT      = (1 << 2),
	COMMIT_GRAPH_WRITE_BLOOM_FILTERS    = (1 << 3),
	COMMIT_GRAPH_NO_WRITE_BLOOM_FILTERS = (1 << 4),
};

/*
 * Value of the `split_flags` member of struct commit_graph_opts. The
 * constants are consecutive values rather than bits: exactly one of
 * them is stored at a time.
 */
enum commit_graph_split_flags {
	COMMIT_GRAPH_SPLIT_UNSPECIFIED      = 0,
	COMMIT_GRAPH_SPLIT_MERGE_PROHIBITED = 1,
	COMMIT_GRAPH_SPLIT_REPLACE          = 2
};

Taylor Blau98bb7962020-09-17 22:59:49 -0400146struct commit_graph_opts {
Derrick Stoleec2bc6e62019-06-18 11:14:32 -0700147 int size_multiple;
148 int max_commits;
149 timestamp_t expire_time;
Taylor Blau98bb7962020-09-17 22:59:49 -0400150 enum commit_graph_split_flags split_flags;
Taylor Blau809e0322020-09-18 09:27:27 -0400151 int max_new_filters;
Derrick Stoleec2bc6e62019-06-18 11:14:32 -0700152};
153
/*
 * The write_commit_graph* methods return zero on success
 * and a negative value on failure. Note that if the repository
 * is not compatible with the commit-graph feature, then the
 * methods will return 0 without writing a commit-graph.
 */
int write_commit_graph_reachable(struct object_directory *odb,
				 enum commit_graph_write_flags flags,
				 const struct commit_graph_opts *opts);
int write_commit_graph(struct object_directory *odb,
		       const struct string_list *pack_indexes,
		       struct oidset *commits,
		       enum commit_graph_write_flags flags,
		       const struct commit_graph_opts *opts);

/*
 * NOTE(review): presumably a bit for the `flags` argument of
 * verify_commit_graph(); its exact effect is not visible from this
 * header.
 */
#define COMMIT_GRAPH_VERIFY_SHALLOW	(1 << 0)

/*
 * NOTE(review): presumably checks the consistency of graph `g` of
 * repository `r`; the meaning of the return value is not visible from
 * this header -- confirm in commit-graph.c.
 */
int verify_commit_graph(struct repository *r, struct commit_graph *g, int flags);

/*
 * NOTE(review): presumably release the commit-graph attached to an
 * object store, respectively a single `struct commit_graph`; confirm
 * in commit-graph.c which resources each one frees.
 */
void close_commit_graph(struct raw_object_store *);
void free_commit_graph(struct commit_graph *);

/*
 * Disable further use of the commit graph in this process when parsing a
 * "struct commit".
 */
void disable_commit_graph(struct repository *r);

Abhishek Kumar48448122020-06-17 14:44:09 +0530182struct commit_graph_data {
183 uint32_t graph_pos;
Abhishek Kumard7f92782021-01-16 18:11:13 +0000184 timestamp_t generation;
Abhishek Kumar48448122020-06-17 14:44:09 +0530185};
186
187/*
188 * Commits should be parsed before accessing generation, graph positions.
189 */
Abhishek Kumard7f92782021-01-16 18:11:13 +0000190timestamp_t commit_graph_generation(const struct commit *);
Abhishek Kumar48448122020-06-17 14:44:09 +0530191uint32_t commit_graph_position(const struct commit *);
Taylor Blauc08645b2023-03-20 11:26:52 +0000192
/*
 * After this method, all commits reachable from those in the given
 * list will have non-zero, non-infinite generation numbers.
 *
 * `commits` points to an array of `nr` commit pointers.
 */
void ensure_generations_valid(struct repository *r,
			      struct commit **commits, size_t nr);

Derrick Stolee08fd81c2018-04-02 16:34:19 -0400200#endif