7 #include "list-objects.h"
9 #include "pack-bitmap.h"
10 #include "pack-revindex.h"
11 #include "pack-objects.h"
13 #include "repository.h"
14 #include "object-store.h"
15 #include "list-objects-filter-options.h"
18 * An entry on the bitmap index, representing the bitmap for a given
21 struct stored_bitmap {
/* EWAH data of this entry; lookup_stored_bitmap() XORs it with the resolved `xor` entry */
23 struct ewah_bitmap *root;
/* entry this one is stored relative to; store_bitmap() fills it from its xor_with argument */
24 struct stored_bitmap *xor;
29 * The active bitmap index for a repository. By design, repositories only have
30 * a single bitmap index available (the index for the biggest packfile in
31 * the repository), since bitmap indexes need full closure.
33 * If there is more than one bitmap index available (e.g. because of alternates),
34 * the active bitmap index is the largest one.
37 /* Packfile to which this bitmap index belongs */
38 struct packed_git *pack;
41 * Mark the first `reuse_objects` in the packfile as reused:
42 * they will be sent as-is without using them for repacking
45 uint32_t reuse_objects;
47 /* mmapped buffer of the whole bitmap index */
49 size_t map_size; /* size of the mmaped buffer */
50 size_t map_pos; /* current position when loading the index */
55 * Each bitmap marks which objects in the packfile are of the given
56 * type. This provides type information when yielding the objects from
57 * the packfile during a walk, which allows for better delta bases.
59 struct ewah_bitmap *commits;
60 struct ewah_bitmap *trees;
61 struct ewah_bitmap *blobs;
62 struct ewah_bitmap *tags;
64 /* Map from object ID -> `stored_bitmap` for all the bitmapped commits */
65 kh_oid_map_t *bitmaps;
67 /* Number of bitmapped commits */
70 /* If not NULL, this is a name-hash cache pointing into map. */
76 * When trying to perform bitmap operations with objects that are not
77 * packed in `pack`, these objects are added to this "fake index" and
78 * are assumed to appear at the end of the packfile for all operations
81 struct object **objects;
83 uint32_t count, alloc;
84 kh_oid_pos_t *positions;
87 /* Bitmap result of the last performed walk */
88 struct bitmap *result;
90 /* "have" bitmap from the last performed walk */
93 /* Version of the bitmap index */
/*
 * Resolve the usable EWAH bitmap for the stored entry `st`.
 *
 * On the path visible here the entry's XOR base is resolved recursively
 * and XORed with `st->root` into a newly pooled bitmap, after which the
 * old `st->root` is handed back to the pool.
 */
97 static struct ewah_bitmap *lookup_stored_bitmap(struct stored_bitmap *st)
99 struct ewah_bitmap *parent;
100 struct ewah_bitmap *composed;
105 composed = ewah_pool_new();
106 parent = lookup_stored_bitmap(st->xor);
107 ewah_xor(st->root, parent, composed);
109 ewah_pool_free(st->root);
117 * Read a bitmap from the current read position on the mmapped
118 * index, and increase the read position accordingly
120 static struct ewah_bitmap *read_bitmap_1(struct bitmap_index *index)
122 struct ewah_bitmap *b = ewah_pool_new();
/* parse starting at map + map_pos, limited to the bytes left in the mapping */
124 ssize_t bitmap_size = ewah_read_mmap(b,
125 index->map + index->map_pos,
126 index->map_size - index->map_pos);
/* a negative size from ewah_read_mmap() is reported as a load failure */
128 if (bitmap_size < 0) {
129 error("Failed to load bitmap index (corrupted?)");
/* advance the read position past the bitmap that was just parsed */
134 index->map_pos += bitmap_size;
/*
 * Validate the on-disk header at the start of the mapped index and record
 * its version, its entry count and, when present, the location of the
 * name-hash cache.  Every failed check visible here returns the result of
 * error().
 */
138 static int load_bitmap_header(struct bitmap_index *index)
140 struct bitmap_disk_header *header = (void *)index->map;
/* the mapping must hold at least the header plus rawsz more bytes */
142 if (index->map_size < sizeof(*header) + the_hash_algo->rawsz)
143 return error("Corrupted bitmap index (missing header data)");
145 if (memcmp(header->magic, BITMAP_IDX_SIGNATURE, sizeof(BITMAP_IDX_SIGNATURE)) != 0)
146 return error("Corrupted bitmap index file (wrong header)");
/* only version 1 is accepted */
148 index->version = ntohs(header->version);
149 if (index->version != 1)
150 return error("Unsupported version for bitmap index file (%d)", index->version);
152 /* Parse known bitmap format options */
154 uint32_t flags = ntohs(header->options);
156 if ((flags & BITMAP_OPT_FULL_DAG) == 0)
157 return error("Unsupported options for bitmap index file "
158 "(Git requires BITMAP_OPT_FULL_DAG)");
/*
 * The hash cache is located by counting back from the end of the
 * mapping: rawsz bytes, then one 32-bit word per object in the pack.
 * NOTE(review): no visible check that this range lies inside the
 * mapping - confirm against the full function.
 */
160 if (flags & BITMAP_OPT_HASH_CACHE) {
161 unsigned char *end = index->map + index->map_size - the_hash_algo->rawsz;
162 index->hashes = ((uint32_t *)end) - index->pack->num_objects;
166 index->entry_count = ntohl(header->entry_count);
/* skip the header, with GIT_MAX_RAWSZ in sizeof(*header) replaced by the active hash size */
167 index->map_pos += sizeof(*header) - GIT_MAX_RAWSZ + the_hash_algo->rawsz;
/*
 * Wrap `root` in a newly allocated stored_bitmap, record its XOR base,
 * flags and object ID (read from `hash`), and register the entry in
 * index->bitmaps keyed by that object ID.  A key that already exists is
 * reported as a duplicate entry.
 */
171 static struct stored_bitmap *store_bitmap(struct bitmap_index *index,
172 struct ewah_bitmap *root,
173 const unsigned char *hash,
174 struct stored_bitmap *xor_with,
177 struct stored_bitmap *stored;
181 stored = xmalloc(sizeof(struct stored_bitmap));
183 stored->xor = xor_with;
184 stored->flags = flags;
185 oidread(&stored->oid, hash);
187 hash_pos = kh_put_oid_map(index->bitmaps, stored->oid, &ret);
189 /* a 0 return code means the insertion succeeded with no changes,
190 * because the SHA1 already existed on the map. this is bad, there
191 * shouldn't be duplicated commits in the index */
193 error("Duplicate entry in bitmap index: %s", hash_to_hex(hash));
197 kh_value(index->bitmaps, hash_pos) = stored;
/*
 * Decode a big-endian 32-bit value at buffer + *pos with get_be32() and
 * advance *pos by the size of that value.  No bounds check is visible
 * here; the caller has to guarantee the bytes are available.
 */
201 static inline uint32_t read_be32(const unsigned char *buffer, size_t *pos)
203 uint32_t result = get_be32(buffer + *pos);
204 (*pos) += sizeof(result);
/* Return the byte at buffer[*pos] and advance *pos by one. */
208 static inline uint8_t read_u8(const unsigned char *buffer, size_t *pos)
210 return buffer[(*pos)++];
/* Size of the recent_bitmaps window below; larger XOR offsets are rejected. */
213 #define MAX_XOR_OFFSET 160
/*
 * Read index->entry_count bitmap entries from the mapping.
 *
 * Each entry is a big-endian 32-bit commit position in the pack index,
 * a one-byte XOR offset and a one-byte flags field, followed by the EWAH
 * bitmap itself.  A non-zero XOR offset names the entry that many slots
 * back; recent_bitmaps keeps the most recently stored entries, indexed
 * modulo MAX_XOR_OFFSET, so that this base can be found.
 */
215 static int load_bitmap_entries_v1(struct bitmap_index *index)
218 struct stored_bitmap *recent_bitmaps[MAX_XOR_OFFSET] = { NULL };
220 for (i = 0; i < index->entry_count; ++i) {
221 int xor_offset, flags;
222 struct ewah_bitmap *bitmap = NULL;
223 struct stored_bitmap *xor_bitmap = NULL;
224 uint32_t commit_idx_pos;
225 const unsigned char *sha1;
227 commit_idx_pos = read_be32(index->map, &index->map_pos);
228 xor_offset = read_u8(index->map, &index->map_pos);
229 flags = read_u8(index->map, &index->map_pos);
/* object name of the commit, looked up by its position in the pack index */
231 sha1 = nth_packed_object_sha1(index->pack, commit_idx_pos);
233 bitmap = read_bitmap_1(index);
/* an offset may not reach outside the window or before the first entry */
237 if (xor_offset > MAX_XOR_OFFSET || xor_offset > i)
238 return error("Corrupted bitmap pack index");
240 if (xor_offset > 0) {
241 xor_bitmap = recent_bitmaps[(i - xor_offset) % MAX_XOR_OFFSET];
243 if (xor_bitmap == NULL)
244 return error("Invalid XOR offset in bitmap pack index");
/* remember this entry so that later entries can XOR against it */
247 recent_bitmaps[i % MAX_XOR_OFFSET] = store_bitmap(
248 index, bitmap, sha1, xor_bitmap, flags);
/*
 * Build the bitmap file name for pack `p`: the pack name with its ".pack"
 * suffix replaced by ".bitmap", formatted with xstrfmt().  A pack name
 * without the ".pack" suffix is treated as a BUG.
 */
254 static char *pack_bitmap_filename(struct packed_git *p)
258 if (!strip_suffix(p->pack_name, ".pack", &len))
259 BUG("pack_name does not end in .pack");
260 return xstrfmt("%.*s.bitmap", (int)len, p->pack_name);
/*
 * Try to open and map the bitmap file that belongs to `packfile` and
 * validate its header.
 *
 * The pack index is opened first, then the ".bitmap" file is opened and
 * its size obtained with fstat().  If bitmap_git already has a pack, the
 * additional bitmap is only warned about.  Otherwise the file is mapped
 * read-only and the header is parsed; a header failure unmaps the file
 * and clears the map fields again.  open_pack_bitmap() treats a return
 * value of 0 as success.
 */
263 static int open_pack_bitmap_1(struct bitmap_index *bitmap_git, struct packed_git *packfile)
269 if (open_pack_index(packfile))
272 idx_name = pack_bitmap_filename(packfile);
273 fd = git_open(idx_name);
279 if (fstat(fd, &st)) {
284 if (bitmap_git->pack) {
285 warning("ignoring extra bitmap file: %s", packfile->pack_name);
290 bitmap_git->pack = packfile;
291 bitmap_git->map_size = xsize_t(st.st_size);
292 bitmap_git->map = xmmap(NULL, bitmap_git->map_size, PROT_READ, MAP_PRIVATE, fd, 0);
293 bitmap_git->map_pos = 0;
296 if (load_bitmap_header(bitmap_git) < 0) {
297 munmap(bitmap_git->map, bitmap_git->map_size);
298 bitmap_git->map = NULL;
299 bitmap_git->map_size = 0;
/*
 * Parse the body of an already mapped bitmap index (the map must exist).
 *
 * Creates the commit->bitmap table and the extended-index position
 * table, loads the pack's reverse index, reads the four type bitmaps in
 * the order commits, trees, blobs, tags, and then reads the per-commit
 * entries.  The last three statements drop the mapping and clear the map
 * fields (presumably the failure path - the jump to it is not visible
 * here).
 */
306 static int load_pack_bitmap(struct bitmap_index *bitmap_git)
308 assert(bitmap_git->map);
310 bitmap_git->bitmaps = kh_init_oid_map();
311 bitmap_git->ext_index.positions = kh_init_oid_pos();
312 if (load_pack_revindex(bitmap_git->pack))
315 if (!(bitmap_git->commits = read_bitmap_1(bitmap_git)) ||
316 !(bitmap_git->trees = read_bitmap_1(bitmap_git)) ||
317 !(bitmap_git->blobs = read_bitmap_1(bitmap_git)) ||
318 !(bitmap_git->tags = read_bitmap_1(bitmap_git)))
321 if (load_bitmap_entries_v1(bitmap_git) < 0)
327 munmap(bitmap_git->map, bitmap_git->map_size);
328 bitmap_git->map = NULL;
329 bitmap_git->map_size = 0;
/*
 * Look for a bitmap among all packs of repository `r` by calling
 * open_pack_bitmap_1() on each pack in turn.  bitmap_git must not have a
 * mapping yet.  Callers in this file treat a zero return as "a bitmap
 * was opened" and a negative one as failure.
 */
333 static int open_pack_bitmap(struct repository *r,
334 struct bitmap_index *bitmap_git)
336 struct packed_git *p;
339 assert(!bitmap_git->map);
341 for (p = get_all_packs(r); p; p = p->next) {
342 if (open_pack_bitmap_1(bitmap_git, p) == 0)
/*
 * Allocate a zeroed bitmap index for repository `r`, then open and fully
 * load its bitmap.  The index is released with free_bitmap_index() on the
 * path where opening or loading did not both return zero (presumably;
 * the return statements are not visible here).  test_bitmap_walk() treats
 * a NULL result as failure.
 */
349 struct bitmap_index *prepare_bitmap_git(struct repository *r)
351 struct bitmap_index *bitmap_git = xcalloc(1, sizeof(*bitmap_git));
353 if (!open_pack_bitmap(r, bitmap_git) && !load_pack_bitmap(bitmap_git))
356 free_bitmap_index(bitmap_git);
/*
 * Context for should_include(); find_objects() installs a pointer to one
 * of these as revs->include_check_data.
 */
360 struct include_data {
361 struct bitmap_index *bitmap_git;
/*
 * Look `oid` up in the extended index (objects that are not in the
 * bitmapped pack).  When found, the bit position is the stored extended
 * position offset by the number of objects in the pack.
 */
366 static inline int bitmap_position_extended(struct bitmap_index *bitmap_git,
367 const struct object_id *oid)
369 kh_oid_pos_t *positions = bitmap_git->ext_index.positions;
370 khiter_t pos = kh_get_oid_pos(positions, *oid);
372 if (pos < kh_end(positions)) {
373 int bitmap_pos = kh_value(positions, pos);
374 return bitmap_pos + bitmap_git->pack->num_objects;
/*
 * Bit position of `oid` within the bitmapped pack: the object's pack
 * offset from find_pack_entry_one() is converted to its position in the
 * pack's reverse index.
 */
380 static inline int bitmap_position_packfile(struct bitmap_index *bitmap_git,
381 const struct object_id *oid)
383 off_t offset = find_pack_entry_one(oid->hash, bitmap_git->pack);
387 return find_revindex_position(bitmap_git->pack, offset);
/*
 * Bit position of `oid`: the position in the bitmapped pack when that
 * lookup yields a non-negative value, otherwise the result of the
 * extended-index lookup.
 */
390 static int bitmap_position(struct bitmap_index *bitmap_git,
391 const struct object_id *oid)
393 int pos = bitmap_position_packfile(bitmap_git, oid);
394 return (pos >= 0) ? pos : bitmap_position_extended(bitmap_git, oid);
/*
 * Make sure `object` has a slot in the extended index and return its bit
 * position (extended slot plus the number of objects in the pack).
 *
 * A new object is appended at index `count`, together with the name hash
 * computed from `name`; the parallel `objects` and `hashes` arrays are
 * grown together when full.  For an object that is already present the
 * previously recorded slot is used.
 */
397 static int ext_index_add_object(struct bitmap_index *bitmap_git,
398 struct object *object, const char *name)
400 struct eindex *eindex = &bitmap_git->ext_index;
406 hash_pos = kh_put_oid_pos(eindex->positions, object->oid, &hash_ret);
408 if (eindex->count >= eindex->alloc) {
409 eindex->alloc = (eindex->alloc + 16) * 3 / 2;
410 REALLOC_ARRAY(eindex->objects, eindex->alloc);
411 REALLOC_ARRAY(eindex->hashes, eindex->alloc);
414 bitmap_pos = eindex->count;
415 eindex->objects[eindex->count] = object;
416 eindex->hashes[eindex->count] = pack_name_hash(name);
417 kh_value(eindex->positions, hash_pos) = bitmap_pos;
420 bitmap_pos = kh_value(eindex->positions, hash_pos);
423 return bitmap_pos + bitmap_git->pack->num_objects;
/*
 * Context for show_object(); find_objects() fills one in before calling
 * traverse_commit_list().
 */
426 struct bitmap_show_data {
427 struct bitmap_index *bitmap_git;
/*
 * Object callback for the walk started in find_objects(): determine the
 * bit position of `object`, using ext_index_add_object() for objects that
 * need an extended-index slot, and set that bit in data->base.
 */
431 static void show_object(struct object *object, const char *name, void *data_)
433 struct bitmap_show_data *data = data_;
436 bitmap_pos = bitmap_position(data->bitmap_git, &object->oid);
439 bitmap_pos = ext_index_add_object(data->bitmap_git, object,
442 bitmap_set(data->base, bitmap_pos);
/* Commit callback that find_objects() passes to traverse_commit_list(). */
445 static void show_commit(struct commit *commit, void *data)
/*
 * Account for the commit `oid` at bit position bitmap_pos in data->base.
 *
 * The bit is first tested against data->seen (when set) and data->base.
 * If the commit has a stored bitmap, that whole bitmap is ORed into
 * data->base; otherwise only the commit's own bit is set.
 * should_include() marks the commit's parents SEEN when this function
 * returns zero.
 */
449 static int add_to_include_set(struct bitmap_index *bitmap_git,
450 struct include_data *data,
451 const struct object_id *oid,
456 if (data->seen && bitmap_get(data->seen, bitmap_pos))
459 if (bitmap_get(data->base, bitmap_pos))
462 hash_pos = kh_get_oid_map(bitmap_git->bitmaps, *oid);
463 if (hash_pos < kh_end(bitmap_git->bitmaps)) {
464 struct stored_bitmap *st = kh_value(bitmap_git->bitmaps, hash_pos);
465 bitmap_or_ewah(data->base, lookup_stored_bitmap(st));
469 bitmap_set(data->base, bitmap_pos);
/*
 * include_check callback installed by find_objects().
 *
 * Finds (or creates, through the extended index) the bit position of
 * `commit` and hands it to add_to_include_set().  When that returns zero,
 * every parent of the commit is flagged SEEN.
 */
473 static int should_include(struct commit *commit, void *_data)
475 struct include_data *data = _data;
478 bitmap_pos = bitmap_position(data->bitmap_git, &commit->object.oid);
480 bitmap_pos = ext_index_add_object(data->bitmap_git,
481 (struct object *)commit,
484 if (!add_to_include_set(data->bitmap_git, data, &commit->object.oid,
486 struct commit_list *parent = commit->parents;
489 parent->item->object.flags |= SEEN;
490 parent = parent->next;
/*
 * Compute the bitmap of objects reachable from `roots`.
 *
 * Roots that are commits with a stored bitmap are ORed together into
 * `base` and flagged SEEN; every other root is collected on the local
 * `not_mapped` list.  If nothing was left unmapped, the ORed bitmap is
 * already complete.  Otherwise each remaining root that is not already
 * covered by `base` is queued on `revs` as a pending object, and a real
 * revision walk is run with should_include() as the include check and
 * show_commit()/show_object() as callbacks, filling in the missing bits
 * of `base`.
 */
499 static struct bitmap *find_objects(struct bitmap_index *bitmap_git,
500 struct rev_info *revs,
501 struct object_list *roots,
504 struct bitmap *base = NULL;
507 struct object_list *not_mapped = NULL;
510 * Go through all the roots for the walk. The ones that have bitmaps
511 * on the bitmap index will be `or`ed together to form an initial
512 * global reachability analysis.
514 * The ones without bitmaps in the index will be stored in the
515 * `not_mapped_list` for further processing.
518 struct object *object = roots->item;
521 if (object->type == OBJ_COMMIT) {
522 khiter_t pos = kh_get_oid_map(bitmap_git->bitmaps, object->oid);
524 if (pos < kh_end(bitmap_git->bitmaps)) {
525 struct stored_bitmap *st = kh_value(bitmap_git->bitmaps, pos);
526 struct ewah_bitmap *or_with = lookup_stored_bitmap(st);
529 base = ewah_to_bitmap(or_with);
531 bitmap_or_ewah(base, or_with);
533 object->flags |= SEEN;
/* pass the address of the local list head so the insert can update it */
538 object_list_insert(object, &not_mapped);
542 * Best case scenario: We found bitmaps for all the roots,
543 * so the resulting `or` bitmap has the full reachability analysis
545 if (not_mapped == NULL)
551 * Let's iterate through all the roots that don't have bitmaps to
552 * check if we can determine them to be reachable from the existing
555 * If we cannot find them in the existing global bitmap, we'll need
556 * to push them to an actual walk and run it until we can confirm
560 struct object *object = roots->item;
564 pos = bitmap_position(bitmap_git, &object->oid);
566 if (pos < 0 || base == NULL || !bitmap_get(base, pos)) {
567 object->flags &= ~UNINTERESTING;
568 add_pending_object(revs, object, "");
571 object->flags |= SEEN;
576 struct include_data incdata;
577 struct bitmap_show_data show_data;
582 incdata.bitmap_git = bitmap_git;
586 revs->include_check = should_include;
587 revs->include_check_data = &incdata;
589 if (prepare_revision_walk(revs))
590 die("revision walk setup failed");
592 show_data.bitmap_git = bitmap_git;
593 show_data.base = base;
595 traverse_commit_list(revs, show_commit, show_object,
/*
 * Report the extended-index objects that are part of the walk result.
 *
 * Entry i of the extended index lives at bit num_objects + i of
 * bitmap_git->result.  Entries whose bit is not set are tested first;
 * blobs, trees and tags are additionally tested against the matching
 * revs->*_objects switch.  Reported objects get no pack and offset 0.
 */
602 static void show_extended_objects(struct bitmap_index *bitmap_git,
603 struct rev_info *revs,
604 show_reachable_fn show_reach)
606 struct bitmap *objects = bitmap_git->result;
607 struct eindex *eindex = &bitmap_git->ext_index;
610 for (i = 0; i < eindex->count; ++i) {
613 if (!bitmap_get(objects, bitmap_git->pack->num_objects + i))
616 obj = eindex->objects[i];
617 if ((obj->type == OBJ_BLOB && !revs->blob_objects) ||
618 (obj->type == OBJ_TREE && !revs->tree_objects) ||
619 (obj->type == OBJ_TAG && !revs->tag_objects))
622 show_reach(&obj->oid, obj->type, 0, eindex->hashes[i], NULL, 0);
/*
 * Point `it` at the start of one of the index's per-type bitmaps
 * (commits, trees, blobs or tags), chosen by `type`.  A type without a
 * type bitmap is a BUG.
 */
626 static void init_type_iterator(struct ewah_iterator *it,
627 struct bitmap_index *bitmap_git,
628 enum object_type type)
632 ewah_iterator_init(it, bitmap_git->commits);
636 ewah_iterator_init(it, bitmap_git->trees);
640 ewah_iterator_init(it, bitmap_git->blobs);
644 ewah_iterator_init(it, bitmap_git->tags);
648 BUG("object type %d not stored by bitmap type index", type);
/*
 * Report, through show_reach, the in-pack objects of `object_type` that
 * are set in bitmap_git->result.
 *
 * The result is ANDed word by word with the per-type bitmap.  For each
 * surviving bit, its position indexes the pack's reverse index, which
 * yields the object's position in the pack index (used to fetch its
 * object ID and, when the hash cache exists, its name hash) and its pack
 * offset.  The case where the whole pack is being reused, and positions
 * below reuse_objects, are tested separately before reporting.
 */
653 static void show_objects_for_type(
654 struct bitmap_index *bitmap_git,
655 enum object_type object_type,
656 show_reachable_fn show_reach)
658 size_t pos = 0, i = 0;
661 struct ewah_iterator it;
664 struct bitmap *objects = bitmap_git->result;
666 if (bitmap_git->reuse_objects == bitmap_git->pack->num_objects)
669 init_type_iterator(&it, bitmap_git, object_type);
671 while (i < objects->word_alloc && ewah_iterator_next(&filter, &it)) {
672 eword_t word = objects->words[i] & filter;
674 for (offset = 0; offset < BITS_IN_EWORD; ++offset) {
675 struct object_id oid;
676 struct revindex_entry *entry;
/* no bits left at or above `offset` in this word */
679 if ((word >> offset) == 0)
/* jump directly to the next set bit */
682 offset += ewah_bit_ctz64(word >> offset);
684 if (pos + offset < bitmap_git->reuse_objects)
687 entry = &bitmap_git->pack->revindex[pos + offset];
688 nth_packed_object_oid(&oid, bitmap_git->pack, entry->nr);
690 if (bitmap_git->hashes)
691 hash = get_be32(bitmap_git->hashes + entry->nr);
693 show_reach(&oid, object_type, 0, hash, bitmap_git->pack, entry->offset);
/* `pos` is the bit position of the first bit of the next word */
696 pos += BITS_IN_EWORD;
/*
 * Check the objects on `roots` against the bitmapped pack, using
 * find_pack_entry_one() to test whether an object is stored in it.
 * prepare_bitmap_walk() gives up on bitmaps when this returns zero for a
 * non-empty list of haves.
 */
701 static int in_bitmapped_pack(struct bitmap_index *bitmap_git,
702 struct object_list *roots)
705 struct object *object = roots->item;
708 if (find_pack_entry_one(object->oid.hash, bitmap_git->pack) > 0)
/*
 * Build a new bitmap that marks the blobs found directly on
 * `tip_objects`: every list item of type OBJ_BLOB is looked up with
 * bitmap_position() and its bit set in the result.
 */
715 static struct bitmap *find_tip_blobs(struct bitmap_index *bitmap_git,
716 struct object_list *tip_objects)
718 struct bitmap *result = bitmap_new();
719 struct object_list *p;
721 for (p = tip_objects; p; p = p->next) {
724 if (p->item->type != OBJ_BLOB)
727 pos = bitmap_position(bitmap_git, &p->item->oid);
731 bitmap_set(result, pos);
/*
 * Remove blobs from `to_filter`, except blobs that appear directly on
 * `tip_objects`.
 *
 * In-pack blobs are cleared a word at a time using the blob type bitmap
 * with the tip blobs masked out; blobs in the extended index are cleared
 * one bit at a time in the second loop.
 */
737 static void filter_bitmap_blob_none(struct bitmap_index *bitmap_git,
738 struct object_list *tip_objects,
739 struct bitmap *to_filter)
741 struct eindex *eindex = &bitmap_git->ext_index;
743 struct ewah_iterator it;
748 * The non-bitmap version of this filter never removes
749 * blobs which the other side specifically asked for,
750 * so we must match that behavior.
752 tips = find_tip_blobs(bitmap_git, tip_objects);
755 * We can use the blob type-bitmap to work in whole words
756 * for the objects that are actually in the bitmapped packfile.
758 for (i = 0, init_type_iterator(&it, bitmap_git, OBJ_BLOB);
759 i < to_filter->word_alloc && ewah_iterator_next(&mask, &it);
761 if (i < tips->word_alloc)
762 mask &= ~tips->words[i];
763 to_filter->words[i] &= ~mask;
767 * Clear any blobs that weren't in the packfile (and so would not have
768 * been caught by the loop above. We'll have to check them
771 for (i = 0; i < eindex->count; i++) {
772 uint32_t pos = i + bitmap_git->pack->num_objects;
773 if (eindex->objects[i]->type == OBJ_BLOB &&
774 bitmap_get(to_filter, pos) &&
775 !bitmap_get(tips, pos))
776 bitmap_unset(to_filter, pos);
/*
 * Apply object filter `filter` to the bitmap `to_filter`.
 *
 * A missing or disabled filter and LOFC_BLOB_NONE are the choices
 * recognised here; anything else is "not handled".  can_filter_bitmap()
 * calls this with NULL for everything but `filter` and treats a zero
 * return as "this filter is supported".
 */
782 static int filter_bitmap(struct bitmap_index *bitmap_git,
783 struct object_list *tip_objects,
784 struct bitmap *to_filter,
785 struct list_objects_filter_options *filter)
787 if (!filter || filter->choice == LOFC_DISABLED)
790 if (filter->choice == LOFC_BLOB_NONE) {
792 filter_bitmap_blob_none(bitmap_git, tip_objects,
797 /* filter choice not handled */
/*
 * Report whether `filter` can be applied to bitmaps: probes
 * filter_bitmap() without an index, tip list or bitmap and returns
 * non-zero when that call returns zero.
 */
801 static int can_filter_bitmap(struct list_objects_filter_options *filter)
803 return !filter_bitmap(NULL, NULL, NULL, filter);
/*
 * Prepare a bitmap-backed walk for `revs`, optionally restricted by
 * `filter`.
 *
 * Steps visible in this function:
 *  - refuse filters that can_filter_bitmap() does not accept;
 *  - open a bitmap index for revs->repo without loading its entries;
 *  - sort the pending objects into `haves` (flagged UNINTERESTING) and
 *    `wants`, following tags down to the tagged object and listing each
 *    tag on the way;
 *  - give up when there are haves but none is in the bitmapped pack;
 *  - load the bitmap entries, clear revs->pending, and compute the haves
 *    bitmap (with ignore_missing_links set for that walk) and then the
 *    wants bitmap with find_objects();
 *  - subtract haves from wants, apply the filter, and store both bitmaps
 *    on the index as `result` and `haves`.
 * Both object lists are freed on the way out; the final statements also
 * free the index itself (presumably the failure path - the label is not
 * visible here).
 */
806 struct bitmap_index *prepare_bitmap_walk(struct rev_info *revs,
807 struct list_objects_filter_options *filter)
811 struct object_list *wants = NULL;
812 struct object_list *haves = NULL;
814 struct bitmap *wants_bitmap = NULL;
815 struct bitmap *haves_bitmap = NULL;
817 struct bitmap_index *bitmap_git;
820 * We can't do pathspec limiting with bitmaps, because we don't know
821 * which commits are associated with which object changes (let alone
822 * even which objects are associated with which paths).
827 if (!can_filter_bitmap(filter))
830 /* try to open a bitmapped pack, but don't parse it yet
831 * because we may not need to use it */
832 bitmap_git = xcalloc(1, sizeof(*bitmap_git));
833 if (open_pack_bitmap(revs->repo, bitmap_git) < 0)
836 for (i = 0; i < revs->pending.nr; ++i) {
837 struct object *object = revs->pending.objects[i].item;
839 if (object->type == OBJ_NONE)
840 parse_object_or_die(&object->oid, NULL);
842 while (object->type == OBJ_TAG) {
843 struct tag *tag = (struct tag *) object;
845 if (object->flags & UNINTERESTING)
846 object_list_insert(object, &haves);
848 object_list_insert(object, &wants);
850 object = parse_object_or_die(get_tagged_oid(tag), NULL);
853 if (object->flags & UNINTERESTING)
854 object_list_insert(object, &haves);
856 object_list_insert(object, &wants);
860 * if we have a HAVES list, but none of those haves is contained
861 * in the packfile that has a bitmap, we don't have anything to
864 if (haves && !in_bitmapped_pack(bitmap_git, haves))
867 /* if we don't want anything, we're done here */
872 * now we're going to use bitmaps, so load the actual bitmap entries
873 * from disk. this is the point of no return; after this the rev_list
874 * becomes invalidated and we must perform the revwalk through bitmaps
876 if (load_pack_bitmap(bitmap_git) < 0)
879 object_array_clear(&revs->pending);
882 revs->ignore_missing_links = 1;
883 haves_bitmap = find_objects(bitmap_git, revs, haves, NULL);
884 reset_revision_walk();
885 revs->ignore_missing_links = 0;
887 if (haves_bitmap == NULL)
888 BUG("failed to perform bitmap walk");
891 wants_bitmap = find_objects(bitmap_git, revs, wants, haves_bitmap);
894 BUG("failed to perform bitmap walk");
897 bitmap_and_not(wants_bitmap, haves_bitmap);
899 filter_bitmap(bitmap_git, wants, wants_bitmap, filter);
901 bitmap_git->result = wants_bitmap;
902 bitmap_git->haves = haves_bitmap;
904 object_list_free(&wants);
905 object_list_free(&haves);
910 free_bitmap_index(bitmap_git);
911 object_list_free(&wants);
912 object_list_free(&haves);
/*
 * Decide how much of the start of the bitmapped pack can be reused as-is
 * for the current walk result.
 *
 * The leading run of set bits in bitmap_git->result is counted: a word
 * with all bits set adds BITS_IN_EWORD, and the first word that is not
 * full adds its number of trailing one bits.  If the run covers every
 * object in the pack, the whole pack is reused and *up_to is set to -1.
 * Otherwise the run must reach REUSE_PERCENT of the result's population
 * count; in that case *up_to is the pack offset of the first object that
 * is not reused.  On both reuse paths *entries and
 * bitmap_git->reuse_objects receive the number of reused objects and
 * *packfile the bitmapped pack.
 */
916 int reuse_partial_packfile_from_bitmap(struct bitmap_index *bitmap_git,
917 struct packed_git **packfile,
922 * Reuse the packfile content if we need more than
925 static const double REUSE_PERCENT = 0.9;
927 struct bitmap *result = bitmap_git->result;
928 uint32_t reuse_threshold;
929 uint32_t i, reuse_objects = 0;
933 for (i = 0; i < result->word_alloc; ++i) {
934 if (result->words[i] != (eword_t)~0) {
935 reuse_objects += ewah_bit_ctz64(~result->words[i]);
939 reuse_objects += BITS_IN_EWORD;
942 #ifdef GIT_BITMAP_DEBUG
944 const unsigned char *sha1;
945 struct revindex_entry *entry;
947 entry = &bitmap_git->reverse_index->revindex[reuse_objects];
948 sha1 = nth_packed_object_sha1(bitmap_git->pack, entry->nr);
950 fprintf(stderr, "Failed to reuse at %d (%016llx)\n",
951 reuse_objects, result->words[i]);
952 fprintf(stderr, " %s\n", hash_to_hex(sha1));
959 if (reuse_objects >= bitmap_git->pack->num_objects) {
960 bitmap_git->reuse_objects = *entries = bitmap_git->pack->num_objects;
961 *up_to = -1; /* reuse the full pack */
962 *packfile = bitmap_git->pack;
966 reuse_threshold = bitmap_popcount(bitmap_git->result) * REUSE_PERCENT;
968 if (reuse_objects < reuse_threshold)
971 bitmap_git->reuse_objects = *entries = reuse_objects;
972 *up_to = bitmap_git->pack->revindex[reuse_objects].offset;
973 *packfile = bitmap_git->pack;
/*
 * Report every object of the walk result through show_reachable.
 *
 * Commits are always reported; trees, blobs and tags only when the
 * matching revs->*_objects switch is set.  In-pack objects are reported
 * type by type, followed by the objects of the extended index.  Requires
 * a result bitmap on the index.
 */
978 void traverse_bitmap_commit_list(struct bitmap_index *bitmap_git,
979 struct rev_info *revs,
980 show_reachable_fn show_reachable)
982 assert(bitmap_git->result);
984 show_objects_for_type(bitmap_git, OBJ_COMMIT, show_reachable);
985 if (revs->tree_objects)
986 show_objects_for_type(bitmap_git, OBJ_TREE, show_reachable);
987 if (revs->blob_objects)
988 show_objects_for_type(bitmap_git, OBJ_BLOB, show_reachable);
989 if (revs->tag_objects)
990 show_objects_for_type(bitmap_git, OBJ_TAG, show_reachable);
992 show_extended_objects(bitmap_git, revs, show_reachable);
/*
 * Count the objects of `type` in the walk result.
 *
 * In-pack objects are counted by ANDing each result word with the
 * matching word of the per-type bitmap and adding its population count.
 * The second loop looks at extended-index objects of the same type whose
 * bit (num_objects + i) is set in the result.
 */
995 static uint32_t count_object_type(struct bitmap_index *bitmap_git,
996 enum object_type type)
998 struct bitmap *objects = bitmap_git->result;
999 struct eindex *eindex = &bitmap_git->ext_index;
1001 uint32_t i = 0, count = 0;
1002 struct ewah_iterator it;
1005 init_type_iterator(&it, bitmap_git, type);
1007 while (i < objects->word_alloc && ewah_iterator_next(&filter, &it)) {
1008 eword_t word = objects->words[i++] & filter;
1009 count += ewah_bit_popcount64(word);
1012 for (i = 0; i < eindex->count; ++i) {
1013 if (eindex->objects[i]->type == type &&
1014 bitmap_get(objects, bitmap_git->pack->num_objects + i))
/*
 * Store the number of commits, trees, blobs and tags in the walk result
 * through the corresponding output pointers, using count_object_type()
 * for each type.  Requires a result bitmap on the index.
 */
1021 void count_bitmap_commit_list(struct bitmap_index *bitmap_git,
1022 uint32_t *commits, uint32_t *trees,
1023 uint32_t *blobs, uint32_t *tags)
1025 assert(bitmap_git->result);
1028 *commits = count_object_type(bitmap_git, OBJ_COMMIT);
1031 *trees = count_object_type(bitmap_git, OBJ_TREE);
1034 *blobs = count_object_type(bitmap_git, OBJ_BLOB);
1037 *tags = count_object_type(bitmap_git, OBJ_TAG);
/* State shared by the test_show_commit()/test_show_object() callbacks of test_bitmap_walk(). */
1040 struct bitmap_test_data {
/* index under test */
1041 struct bitmap_index *bitmap_git;
/* bitmap filled in by the regular walk, compared against the stored one at the end */
1042 struct bitmap *base;
/* progress meter, advanced once per object or commit seen */
1043 struct progress *prg;
/*
 * Object callback of test_bitmap_walk(): look up the bit position of
 * `object`, die with "Object not in bitmap" on the failing path, then
 * set the bit in tdata->base and advance the progress meter.
 */
1047 static void test_show_object(struct object *object, const char *name,
1050 struct bitmap_test_data *tdata = data;
1053 bitmap_pos = bitmap_position(tdata->bitmap_git, &object->oid);
1055 die("Object not in bitmap: %s\n", oid_to_hex(&object->oid));
1057 bitmap_set(tdata->base, bitmap_pos);
1058 display_progress(tdata->prg, ++tdata->seen);
/*
 * Commit callback of test_bitmap_walk(): look up the bit position of
 * `commit`, die with "Object not in bitmap" on the failing path, then
 * set the bit in tdata->base and advance the progress meter.
 */
1061 static void test_show_commit(struct commit *commit, void *data)
1063 struct bitmap_test_data *tdata = data;
1066 bitmap_pos = bitmap_position(tdata->bitmap_git,
1067 &commit->object.oid);
1069 die("Object not in bitmap: %s\n", oid_to_hex(&commit->object.oid));
1071 bitmap_set(tdata->base, bitmap_pos);
1072 display_progress(tdata->prg, ++tdata->seen);
/*
 * Self-test: compare the stored bitmap of a single commit with the
 * result of a regular revision walk from that commit.
 *
 * Loads the bitmap index for revs->repo, requires exactly one pending
 * object and a stored bitmap for it, and expands that bitmap into
 * `result`.  A full walk (tags, trees and blobs enabled) then sets one
 * bit per visited object in tdata.base.  "OK!" or "Mismatch!" is printed
 * to stderr depending on whether the two bitmaps are equal.
 */
1075 void test_bitmap_walk(struct rev_info *revs)
1077 struct object *root;
1078 struct bitmap *result = NULL;
1080 size_t result_popcnt;
1081 struct bitmap_test_data tdata;
1082 struct bitmap_index *bitmap_git;
1084 if (!(bitmap_git = prepare_bitmap_git(revs->repo)))
1085 die("failed to load bitmap indexes");
1087 if (revs->pending.nr != 1)
1088 die("you must specify exactly one commit to test");
1090 fprintf(stderr, "Bitmap v%d test (%d entries loaded)\n",
1091 bitmap_git->version, bitmap_git->entry_count);
1093 root = revs->pending.objects[0].item;
1094 pos = kh_get_oid_map(bitmap_git->bitmaps, root->oid);
1096 if (pos < kh_end(bitmap_git->bitmaps)) {
1097 struct stored_bitmap *st = kh_value(bitmap_git->bitmaps, pos);
1098 struct ewah_bitmap *bm = lookup_stored_bitmap(st);
1100 fprintf(stderr, "Found bitmap for %s. %d bits / %08x checksum\n",
1101 oid_to_hex(&root->oid), (int)bm->bit_size, ewah_checksum(bm));
1103 result = ewah_to_bitmap(bm);
1107 die("Commit %s doesn't have an indexed bitmap", oid_to_hex(&root->oid));
/* walk every object type so the walk covers what the bitmap covers */
1109 revs->tag_objects = 1;
1110 revs->tree_objects = 1;
1111 revs->blob_objects = 1;
/* the number of set bits is the expected total for the progress meter */
1113 result_popcnt = bitmap_popcount(result);
1115 if (prepare_revision_walk(revs))
1116 die("revision walk setup failed");
1118 tdata.bitmap_git = bitmap_git;
1119 tdata.base = bitmap_new();
1120 tdata.prg = start_progress("Verifying bitmap entries", result_popcnt);
1123 traverse_commit_list(revs, &test_show_commit, &test_show_object, &tdata);
1125 stop_progress(&tdata.prg);
1127 if (bitmap_equals(result, tdata.base))
1128 fprintf(stderr, "OK!\n");
1130 fprintf(stderr, "Mismatch!\n");
1132 free_bitmap_index(bitmap_git);
/*
 * Translate the set bits of `source` into `dest` using `reposition`.
 *
 * reposition[old_pos] holds the new bit position plus one (see
 * rebuild_existing_bitmaps(), which fills a zero-initialised table that
 * way), so the value is decremented before the bit is set.  The other
 * branch handles an object that is missing from the new packing; in
 * that case the bitmap cannot be reused.  rebuild_existing_bitmaps()
 * treats a zero return as success.
 */
1135 static int rebuild_bitmap(uint32_t *reposition,
1136 struct ewah_bitmap *source,
1137 struct bitmap *dest)
1140 struct ewah_iterator it;
1143 ewah_iterator_init(&it, source);
1145 while (ewah_iterator_next(&word, &it)) {
1146 uint32_t offset, bit_pos;
1148 for (offset = 0; offset < BITS_IN_EWORD; ++offset) {
/* no bits left at or above `offset` in this word */
1149 if ((word >> offset) == 0)
/* jump directly to the next set bit */
1152 offset += ewah_bit_ctz64(word >> offset);
1154 bit_pos = reposition[pos + offset];
1156 bitmap_set(dest, bit_pos - 1);
1157 else /* can't reuse, we don't have the object */
1161 pos += BITS_IN_EWORD;
/*
 * Re-express the reusable stored bitmaps in the object order of a new
 * packing (`mapping`) and store them in `reused_bitmaps`.
 *
 * First a table is built that maps each bit position of the existing
 * pack to "position in the new packing + 1"; the table starts out
 * zeroed.  Then every stored bitmap flagged BITMAP_FLAG_REUSE is rebuilt
 * through that table into a scratch bitmap; when rebuild_bitmap()
 * returns zero, the scratch bitmap is compressed with bitmap_to_ewah()
 * and inserted into `reused_bitmaps`.  The scratch bitmap is reset
 * between entries and freed at the end.
 */
1166 int rebuild_existing_bitmaps(struct bitmap_index *bitmap_git,
1167 struct packing_data *mapping,
1168 kh_oid_map_t *reused_bitmaps,
1171 uint32_t i, num_objects;
1172 uint32_t *reposition;
1173 struct bitmap *rebuild;
1174 struct stored_bitmap *stored;
1175 struct progress *progress = NULL;
1180 num_objects = bitmap_git->pack->num_objects;
1181 reposition = xcalloc(num_objects, sizeof(uint32_t));
1183 for (i = 0; i < num_objects; ++i) {
1184 struct object_id oid;
1185 struct revindex_entry *entry;
1186 struct object_entry *oe;
1188 entry = &bitmap_git->pack->revindex[i];
1189 nth_packed_object_oid(&oid, bitmap_git->pack, entry->nr);
1190 oe = packlist_find(mapping, &oid);
/* stored with +1 so that a zero entry can mean "object not found" */
1193 reposition[i] = oe_in_pack_pos(mapping, oe) + 1;
1196 rebuild = bitmap_new();
1200 progress = start_progress("Reusing bitmaps", 0);
1202 kh_foreach_value(bitmap_git->bitmaps, stored, {
1203 if (stored->flags & BITMAP_FLAG_REUSE) {
1204 if (!rebuild_bitmap(reposition,
1205 lookup_stored_bitmap(stored),
1207 hash_pos = kh_put_oid_map(reused_bitmaps,
1210 kh_value(reused_bitmaps, hash_pos) =
1211 bitmap_to_ewah(rebuild);
1213 bitmap_reset(rebuild);
1214 display_progress(progress, ++i);
1218 stop_progress(&progress);
1221 bitmap_free(rebuild);
/*
 * Release the resources held by bitmap index `b`: the file mapping, the
 * four type bitmaps, the commit->bitmap table, the extended index's
 * object and hash arrays, and the result/haves bitmaps of the last walk.
 *
 * NOTE(review): no release of ext_index.positions or of the individual
 * stored_bitmap values held in `bitmaps` is visible here - confirm
 * whether they are freed elsewhere or leaked.
 */
1225 void free_bitmap_index(struct bitmap_index *b)
1231 munmap(b->map, b->map_size);
1232 ewah_pool_free(b->commits);
1233 ewah_pool_free(b->trees);
1234 ewah_pool_free(b->blobs);
1235 ewah_pool_free(b->tags);
1236 kh_destroy_oid_map(b->bitmaps);
1237 free(b->ext_index.objects);
1238 free(b->ext_index.hashes);
1239 bitmap_free(b->result);
1240 bitmap_free(b->haves);
/*
 * Tell whether `oid` is set in the "haves" bitmap of the last walk.
 *
 * Returns 0 when no bitmap is loaded or the walk had no haves.  Only the
 * bitmapped pack is consulted for the bit position; the extended index
 * is not searched.
 */
1244 int bitmap_has_oid_in_uninteresting(struct bitmap_index *bitmap_git,
1245 const struct object_id *oid)
1250 return 0; /* no bitmap loaded */
1251 if (!bitmap_git->haves)
1252 return 0; /* walk had no "haves" */
1254 pos = bitmap_position_packfile(bitmap_git, oid);
1258 return bitmap_get(bitmap_git->haves, pos);