Jeff King | 29c2bd5 | 2017-02-08 15:53:07 -0500 | [diff] [blame] | 1 | #ifndef OIDSET_H |
| 2 | #define OIDSET_H |
| 3 | |
René Scharfe | 8b2f8cb | 2018-10-04 17:13:06 +0200 | [diff] [blame] | 4 | #include "khash.h" |
Jonathan Tan | 9e6fabde | 2017-09-29 15:54:22 -0700 | [diff] [blame] | 5 | |
/**
 * This API is similar to oid-array, in that it maintains a set of object ids
 * in a memory-efficient way. The major differences are:
 *
 *   1. It uses a hash, so we can do online duplicate removal, rather than
 *      sort-and-uniq at the end. This can reduce memory footprint if you have
 *      a large list of oids with many duplicates.
 *
 *   2. The per-unique-oid memory footprint is slightly higher due to hash
 *      table overhead.
 */
| 17 | |
| 18 | /** |
| 19 | * A single oidset; should be zero-initialized (or use OIDSET_INIT). |
| 20 | */ |
| 21 | struct oidset { |
Jeff King | 8fbb558 | 2019-06-20 03:41:28 -0400 | [diff] [blame] | 22 | kh_oid_set_t set; |
Jeff King | 29c2bd5 | 2017-02-08 15:53:07 -0500 | [diff] [blame] | 23 | }; |
| 24 | |
/* Static initializer for `struct oidset`: zeroes the embedded hash table. */
#define OIDSET_INIT { { 0 } }
Jeff King | 29c2bd5 | 2017-02-08 15:53:07 -0500 | [diff] [blame] | 26 | |
Jeff Hostetler | c3a9ad3 | 2017-11-21 20:58:49 +0000 | [diff] [blame] | 27 | |
/**
 * Prepare the oidset structure `set` for use.
 *
 * A non-zero `initial_size` asks for up-front allocation, so that this many
 * elements can then be inserted without any further allocations.
 */
void oidset_init(struct oidset *set, size_t initial_size);
Jeff Hostetler | c3a9ad3 | 2017-11-21 20:58:49 +0000 | [diff] [blame] | 35 | |
/**
 * Membership test: returns true if and only if `oid` is present in `set`.
 */
int oidset_contains(const struct oidset *set, const struct object_id *oid);
| 40 | |
/**
 * Add `oid` to `set`. The set stores its own copy, so the caller's "oid"
 * need not remain valid once this function has returned.
 *
 * The return value is 1 when the oid was already a member and 0 when it was
 * not, which allows an efficient combined check-and-add.
 */
int oidset_insert(struct oidset *set, const struct object_id *oid);
| 49 | |
/**
 * Delete `oid` from `set`.
 *
 * The return value is 1 when the oid was a member of the set and 0 when it
 * was not.
 */
int oidset_remove(struct oidset *set, const struct object_id *oid);
| 56 | |
| 57 | /** |
Taylor Blau | f478106 | 2020-04-13 22:04:22 -0600 | [diff] [blame] | 58 | * Returns the number of oids in the set. |
| 59 | */ |
René Scharfe | 325006f | 2021-09-11 22:36:40 +0200 | [diff] [blame] | 60 | static inline int oidset_size(const struct oidset *set) |
| 61 | { |
| 62 | return kh_size(&set->set); |
| 63 | } |
Taylor Blau | f478106 | 2020-04-13 22:04:22 -0600 | [diff] [blame] | 64 | |
/**
 * Empty the oidset: every entry is removed and any resources associated
 * with the set are freed.
 */
void oidset_clear(struct oidset *set);
| 70 | |
/**
 * Read the file 'path' and add its contents to an already initialized
 * oidset. Every line holds one unabbreviated object name. A '#' starts a
 * comment, and a comment may trail an object name on the same line. Leading
 * whitespace is ignored, as are empty and whitespace-only lines.
 */
void oidset_parse_file(struct oidset *set, const char *path);
| 78 | |
/**
 * Like oidset_parse_file(), but takes a callback `fn` (handed `cbdata`)
 * which can
 *
 *   1. return non-zero to signal displeasure with the object, and
 *   2. replace the object ID with something else (meant to be used to
 *      "peel").
 */
typedef int (*oidset_parse_tweak_fn)(struct object_id *, void *);
void oidset_parse_file_carefully(struct oidset *set, const char *path,
				 oidset_parse_tweak_fn fn, void *cbdata);
| 87 | |
Jeff Hostetler | c3a9ad3 | 2017-11-21 20:58:49 +0000 | [diff] [blame] | 88 | struct oidset_iter { |
Jeff King | 8fbb558 | 2019-06-20 03:41:28 -0400 | [diff] [blame] | 89 | kh_oid_set_t *set; |
René Scharfe | 8b2f8cb | 2018-10-04 17:13:06 +0200 | [diff] [blame] | 90 | khiter_t iter; |
Jeff Hostetler | c3a9ad3 | 2017-11-21 20:58:49 +0000 | [diff] [blame] | 91 | }; |
| 92 | |
| 93 | static inline void oidset_iter_init(struct oidset *set, |
| 94 | struct oidset_iter *iter) |
| 95 | { |
René Scharfe | 8b2f8cb | 2018-10-04 17:13:06 +0200 | [diff] [blame] | 96 | iter->set = &set->set; |
| 97 | iter->iter = kh_begin(iter->set); |
Jeff Hostetler | c3a9ad3 | 2017-11-21 20:58:49 +0000 | [diff] [blame] | 98 | } |
| 99 | |
| 100 | static inline struct object_id *oidset_iter_next(struct oidset_iter *iter) |
| 101 | { |
René Scharfe | 8b2f8cb | 2018-10-04 17:13:06 +0200 | [diff] [blame] | 102 | for (; iter->iter != kh_end(iter->set); iter->iter++) { |
| 103 | if (kh_exist(iter->set, iter->iter)) |
| 104 | return &kh_key(iter->set, iter->iter++); |
| 105 | } |
| 106 | return NULL; |
Jeff Hostetler | c3a9ad3 | 2017-11-21 20:58:49 +0000 | [diff] [blame] | 107 | } |
| 108 | |
/**
 * Convenience wrapper: initialize `iter` over `set` with oidset_iter_init()
 * and return whatever the first oidset_iter_next() call yields.
 */
static inline struct object_id *oidset_iter_first(struct oidset *set,
						  struct oidset_iter *iter)
{
	struct object_id *first;

	oidset_iter_init(set, iter);
	first = oidset_iter_next(iter);
	return first;
}
| 115 | |
Jeff King | 29c2bd5 | 2017-02-08 15:53:07 -0500 | [diff] [blame] | 116 | #endif /* OIDSET_H */ |