blob: a3f6723857bf120f611e4f506e85428132f7ccc3 [file] [log] [blame]
Jonathan Tan4f39cd82017-08-18 15:20:16 -07001#ifndef PACKFILE_H
2#define PACKFILE_H
3
Beat Bollib42f98a2018-07-25 23:56:07 +02004#include "cache.h"
Jonathan Tan498f1f62017-12-05 16:58:44 +00005#include "oidset.h"
6
Stefan Bellercbd53a22018-05-15 16:42:15 -07007/* in object-store.h */
8struct packed_git;
9struct object_info;
Stefan Bellercbd53a22018-05-15 16:42:15 -070010
/*
 * Build the filename of a pack file whose checksum is "sha1" and whose
 * extension is "ext". The name is written into the strbuf "buf", replacing
 * anything it held before. buf->buf is returned as a convenience.
 *
 * Example: odb_pack_name(out, sha1, "idx") => ".git/objects/pack/pack-1234..idx"
 */
char *odb_pack_name(struct strbuf *buf, const unsigned char *sha1, const char *ext);
Jonathan Tan4f39cd82017-08-18 15:20:16 -070019
/*
 * Return the name of the (local) packfile that has the given sha1 in
 * its name.
 *
 * The returned pointer refers to memory that is overwritten by every
 * call to this function, so copy the result if it must outlive the
 * next call.
 */
char *sha1_pack_name(const unsigned char *sha1);
Jonathan Tan4f39cd82017-08-18 15:20:16 -070026
/*
 * Return the name of the (local) pack index file that has the given
 * sha1 in its name.
 *
 * The returned pointer refers to memory that is overwritten by every
 * call to this function, so copy the result if it must outlive the
 * next call.
 */
char *sha1_pack_index_name(const unsigned char *sha1);
Jonathan Tan4f39cd82017-08-18 15:20:16 -070033
/*
 * Return the basename of the packfile "p", i.e. its name without any
 * containing directory (e.g., "pack-1234abcd[...].pack").
 */
const char *pack_basename(struct packed_git *p);
39
/*
 * NOTE(review): no contract is stated in this header. Judging by the name
 * and signature this builds a packed_git from the index file at idx_path
 * for the pack identified by sha1 -- confirm against the definition.
 */
struct packed_git *parse_pack_index(unsigned char *sha1, const char *idx_path);
Jonathan Tan0317f452017-08-18 15:20:19 -070041
/*
 * Callback type accepted by for_each_file_in_pack_dir(). It receives a
 * full path together with its length, a file path, and an opaque "data"
 * pointer.
 *
 * NOTE(review): presumably "data" is the pointer handed to
 * for_each_file_in_pack_dir() and "file_path" is the entry name relative
 * to the pack directory -- confirm against the definition.
 */
typedef void each_file_in_pack_dir_fn(const char *full_path, size_t full_path_len,
				      const char *file_path, void *data);
void for_each_file_in_pack_dir(const char *objdir,
			       each_file_in_pack_dir_fn fn,
			       void *data);
47
/*
 * A hook to report invalid files in pack directory.
 *
 * The PACKDIR_FILE_* constants are distinct single-bit values.
 * NOTE(review): presumably they are OR-ed together to form "seen_bits"
 * -- confirm against the callers.
 */
#define PACKDIR_FILE_PACK 1
#define PACKDIR_FILE_IDX 2
#define PACKDIR_FILE_GARBAGE 4
extern void (*report_garbage)(unsigned seen_bits, const char *path);
53
/*
 * Pack list maintenance for repository "r".
 *
 * NOTE(review): no contract is stated in this header. By name,
 * reprepare_packed_git() re-scans the repository's packs and
 * install_packed_git() registers "pack" with the repository -- confirm
 * against the definitions.
 */
void reprepare_packed_git(struct repository *r);
void install_packed_git(struct repository *r, struct packed_git *pack);
Jonathan Tane65f1862017-08-18 15:20:25 -070056
/*
 * Accessors for the pack-related state of repository "r".
 *
 * NOTE(review): the difference between get_packed_git() and
 * get_all_packs(), and between the two multi-pack-index getters, is not
 * visible from this header -- consult the definitions before choosing one.
 */
struct packed_git *get_packed_git(struct repository *r);
struct list_head *get_packed_git_mru(struct repository *r);
struct multi_pack_index *get_multi_pack_index(struct repository *r);
struct multi_pack_index *get_local_multi_pack_index(struct repository *r);
struct packed_git *get_all_packs(struct repository *r);
Stefan Bellera80d72d2018-03-23 18:20:59 +010062
/*
 * Return a rough count of the objects in repository "r". Accuracy is
 * traded for speed, so do not rely on the exact value.
 *
 * approximate_object_count() is shorthand for the same call on
 * the_repository.
 */
unsigned long repo_approximate_object_count(struct repository *r);
#define approximate_object_count() repo_approximate_object_count(the_repository)
Jonathan Tan0abe14f2017-08-18 15:20:26 -070069
/*
 * NOTE(review): no contract is stated in this header. Presumably searches
 * the list starting at "packs" for a pack containing the object "sha1"
 * and returns that pack -- confirm against the definition.
 */
struct packed_git *find_sha1_pack(const unsigned char *sha1,
				  struct packed_git *packs);
Jonathan Tand6fe0032017-08-18 15:20:34 -070072
/*
 * NOTE(review): no contract is stated in this header; what is reported
 * and where it is written must be checked in the definition.
 */
void pack_report(void);
Jonathan Tan8e211762017-08-18 15:20:18 -070074
/*
 * mmap the index file of packfile "p", unless it is already mmapped.
 * Returns 0 on success.
 */
int open_pack_index(struct packed_git *p);
Jonathan Tan0317f452017-08-18 15:20:19 -070080
/*
 * munmap the index file of packfile "p", if it is currently mmapped.
 */
void close_pack_index(struct packed_git *p);
Jonathan Tan3836d882017-08-18 15:20:21 -070086
/*
 * NOTE(review): neither function is documented in this header; the
 * meaning of close_pack_fd()'s return value and of the "value" argument
 * to get_pack_fanout() must be checked in the definitions.
 */
int close_pack_fd(struct packed_git *p);

uint32_t get_pack_fanout(struct packed_git *p, uint32_t value);
Derrick Stoleefe1ed562018-07-12 15:39:29 -040090
/*
 * Pack window and pack lifetime management.
 *
 * NOTE(review): none of these are documented in this header. In
 * particular the meaning of use_pack()'s off_t and "unsigned long *"
 * arguments, and the ownership of the returned pointer, must be checked
 * in the definitions.
 */
unsigned char *use_pack(struct packed_git *, struct pack_window **, off_t, unsigned long *);
void close_pack_windows(struct packed_git *);
void close_pack(struct packed_git *);
void close_object_store(struct raw_object_store *o);
void unuse_pack(struct pack_window **);
void clear_delta_base_cache(void);
struct packed_git *add_packed_git(const char *path, size_t path_len, int local);
Jonathan Tan3836d882017-08-18 15:20:21 -070098
/*
 * Unlink the .pack file "pack_name" and its associated extension files.
 *
 * If the pack-file is marked as ".keep", nothing is unlinked unless
 * 'force_delete' is true.
 */
void unlink_pack_path(const char *pack_name, int force_delete);
Derrick Stolee8434e852019-06-10 16:35:22 -0700105
/*
 * Make sure that a pointer access into the mmap'd index file of "p" is
 * within bounds, and can provide at least 8 bytes of data.
 *
 * This is only needed for the variable-length segments of the file (like
 * the 64-bit extended offset table); the fixed-length parts are compared
 * against the file size when the file is opened.
 */
void check_pack_index_ptr(const struct packed_git *p, const void *ptr);
Jonathan Tan9e0f45f2017-08-18 15:20:32 -0700115
/*
 * Binary-search the pack-index of "p" for the given oid. The packfile is
 * expected to have a valid pack-index.
 *
 * See 'bsearch_hash' for more information, including the meaning of the
 * return value and of "result".
 */
int bsearch_pack(const struct object_id *oid, const struct packed_git *p, uint32_t *result);
123
/*
 * Write the oid of the nth object within packfile "p" into "oid". The
 * index is opened if it is not already open.
 *
 * Returns 0 on success, negative otherwise.
 */
int nth_packed_object_id(struct object_id *oid, struct packed_git *p, uint32_t n);
Jonathan Tand5a16762017-08-18 15:20:31 -0700130
/*
 * Return the offset of the nth object within packfile "p".
 * The index must already be opened.
 */
off_t nth_packed_object_offset(const struct packed_git *p, uint32_t n);
Jonathan Tand5a16762017-08-18 15:20:31 -0700136
/*
 * Look up the object named sha1 in packfile "p". Returns the object's
 * offset within the packfile if it is present, and 0 otherwise.
 */
off_t find_pack_entry_one(const unsigned char *sha1, struct packed_git *p);
Jonathan Tana2551952017-08-18 15:20:33 -0700142
/*
 * Low-level entry points for validating a pack and reading object data
 * out of it.
 *
 * NOTE(review): none of these are documented in this header; argument
 * meaning, return conventions and ownership of the buffer returned by
 * unpack_entry() must be checked in the definitions.
 */
int is_pack_valid(struct packed_git *);
void *unpack_entry(struct repository *r, struct packed_git *, off_t, enum object_type *, unsigned long *);
unsigned long unpack_object_header_buffer(const unsigned char *buf, unsigned long len, enum object_type *type, unsigned long *sizep);
unsigned long get_size_from_delta(struct packed_git *, struct pack_window **, off_t);
int unpack_object_header(struct packed_git *, struct pack_window **, off_t *, unsigned long *);
off_t get_delta_base(struct packed_git *p, struct pack_window **w_curs,
		     off_t *curpos, enum object_type type,
		     off_t delta_obj_offset);
Jonathan Tan32b42e12017-08-18 15:20:27 -0700151
/*
 * NOTE(review): no contract is stated in this header. Presumably the
 * size_t argument is the amount of memory the caller wants released --
 * confirm against the definition.
 */
void release_pack_memory(size_t);
Jonathan Tanf0e17e82017-08-18 15:20:20 -0700153
/*
 * Global flag that enables extra checks when accessing packed objects.
 * Declared here; defined once elsewhere.
 */
extern int do_check_packed_object_crc;
156
/*
 * NOTE(review): no contract is stated in this header. Presumably fills
 * the object_info for the object stored at "offset" in "pack" --
 * confirm the return convention against the definition.
 */
int packed_object_info(struct repository *r,
		       struct packed_git *pack,
		       off_t offset, struct object_info *);
Jonathan Tanf1d81302017-08-18 15:20:30 -0700160
/*
 * Bookkeeping for packed objects found to be bad.
 *
 * NOTE(review): no contract is stated in this header. Presumably
 * has_packed_and_bad() returns the pack in which the object was marked
 * bad by mark_bad_packed_object(), or NULL -- confirm against the
 * definitions.
 */
void mark_bad_packed_object(struct packed_git *, const struct object_id *);
const struct packed_git *has_packed_and_bad(struct repository *, const struct object_id *);
Jonathan Tan9e0f45f2017-08-18 15:20:32 -0700163
/*
 * Distinct single-bit values.
 * NOTE(review): presumably these are the values accepted by the "flags"
 * argument of find_kept_pack_entry() and has_object_kept_pack() --
 * confirm against the definitions.
 */
#define ON_DISK_KEEP_PACKS 1
#define IN_CORE_KEEP_PACKS 2
166
/*
 * Iff a pack file in the given repository contains the object named by oid,
 * return true and store its location to e.
 *
 * NOTE(review): find_kept_pack_entry() is not documented in this header;
 * presumably it performs the same lookup restricted to the packs selected
 * by "flags" -- confirm against the definition.
 */
int find_pack_entry(struct repository *r, const struct object_id *oid, struct pack_entry *e);
int find_kept_pack_entry(struct repository *r, const struct object_id *oid, unsigned flags, struct pack_entry *e);
Jonathan Tan1a1e5d42017-08-18 15:20:35 -0700173
/*
 * NOTE(review): no contract is stated in this header. Presumably these
 * report whether any pack (respectively any pack selected by "flags")
 * contains the object "oid" -- confirm against the definitions.
 */
int has_object_pack(const struct object_id *oid);
int has_object_kept_pack(const struct object_id *oid, unsigned flags);
Jonathan Tan150e3002017-08-18 15:20:36 -0700176
/*
 * NOTE(review): no contract is stated in this header. Presumably reports
 * whether a pack index file exists for the pack named by sha1 -- confirm
 * against the definition.
 */
int has_pack_index(const unsigned char *sha1);
Jonathan Tanf9a86722017-08-18 15:20:37 -0700178
/*
 * Return 1 if the given object either is an object in a promisor packfile
 * or is referred to by one; return 0 otherwise.
 */
int is_promisor_object(const struct object_id *oid);
Jonathan Tan498f1f62017-12-05 16:58:44 +0000184
/*
 * Entry point exposed for fuzz testing.
 *
 * load_idx() parses the block of memory "idx_map" (of "idx_size" bytes) as
 * a packfile index and puts the results into the struct packed_git "p".
 *
 * Do not call this directly: it is declared here only to give fuzz tests a
 * convenient entry point. For real uses, you should probably use
 * open_pack_index() or parse_pack_index() instead.
 */
int load_idx(const char *path, const unsigned int hashsz, void *idx_map,
	     size_t idx_size, struct packed_git *p);
Josh Steadmon1127a982018-10-12 17:58:41 -0700197
Jonathan Tan4f39cd82017-08-18 15:20:16 -0700198#endif