2013-11-14 13:43:51 +01:00
|
|
|
/**
|
|
|
|
* Copyright 2013, GitHub, Inc
|
|
|
|
* Copyright 2009-2013, Daniel Lemire, Cliff Moon,
|
|
|
|
* David McIntosh, Robert Becho, Google Inc. and Veronika Zenz
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License
|
|
|
|
* as published by the Free Software Foundation; either version 2
|
|
|
|
* of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License
|
2017-11-07 06:39:33 +01:00
|
|
|
* along with this program; if not, see <http://www.gnu.org/licenses/>.
|
2013-11-14 13:43:51 +01:00
|
|
|
*/
|
2016-02-22 23:45:15 +01:00
|
|
|
#include "cache.h"
|
2013-11-14 13:43:51 +01:00
|
|
|
#include "ewok.h"
|
|
|
|
|
2015-06-03 08:39:37 +02:00
|
|
|
/*
 * Helpers that map a bit position onto the word array:
 *
 *   EWAH_BLOCK(x) - index of the word that holds bit `x`
 *   EWAH_MASK(x)  - single-bit mask selecting bit `x` inside that word
 *
 * The argument is parenthesized so that compound expressions such as
 * EWAH_BLOCK(base + off) divide the whole sum rather than only `off`
 * (and, for EWAH_MASK, so the shift count always stays below
 * BITS_IN_EWORD).
 */
#define EWAH_MASK(x) ((eword_t)1 << ((x) % BITS_IN_EWORD))
#define EWAH_BLOCK(x) ((x) / BITS_IN_EWORD)
|
2013-11-14 13:43:51 +01:00
|
|
|
|
2019-12-18 12:25:38 +01:00
|
|
|
struct bitmap *bitmap_word_alloc(size_t word_alloc)
|
2013-11-14 13:43:51 +01:00
|
|
|
{
|
2016-02-22 23:45:12 +01:00
|
|
|
struct bitmap *bitmap = xmalloc(sizeof(struct bitmap));
|
2019-12-18 12:25:38 +01:00
|
|
|
bitmap->words = xcalloc(word_alloc, sizeof(eword_t));
|
|
|
|
bitmap->word_alloc = word_alloc;
|
2013-11-14 13:43:51 +01:00
|
|
|
return bitmap;
|
|
|
|
}
|
|
|
|
|
2019-12-18 12:25:38 +01:00
|
|
|
/* Create a bitmap with the default initial capacity of 32 words. */
struct bitmap *bitmap_new(void)
{
	const size_t default_words = 32;

	return bitmap_word_alloc(default_words);
}
|
|
|
|
|
2020-12-08 23:03:50 +01:00
|
|
|
struct bitmap *bitmap_dup(const struct bitmap *src)
|
|
|
|
{
|
|
|
|
struct bitmap *dst = bitmap_word_alloc(src->word_alloc);
|
|
|
|
COPY_ARRAY(dst->words, src->words, src->word_alloc);
|
|
|
|
return dst;
|
|
|
|
}
|
|
|
|
|
2020-12-08 23:03:38 +01:00
|
|
|
static void bitmap_grow(struct bitmap *self, size_t word_alloc)
|
2013-11-14 13:43:51 +01:00
|
|
|
{
|
ewah: make bitmap growth less aggressive
If you ask to set a bit in the Nth word and we haven't yet allocated
that many slots in our array, we'll increase the bitmap size to 2*N.
This means we might frequently end up with bitmaps that are twice the
necessary size (as soon as you ask for the biggest bit, we'll size up to
twice that).
But if we just allocate as many words as were asked for, we may not grow
fast enough. The worst case there is setting bit 0, then 1, etc. Each
time we grow we'd just extend by one more word, giving us linear
reallocations (and quadratic memory copies).
A middle ground is relying on alloc_nr(), which causes us to grow by a
factor of roughly 3/2 instead of 2. That's less aggressive than
doubling, and it may help avoid fragmenting memory. (If we start with N,
then grow twice, our total is N*(3/2)^2 = 9N/4. After growing twice,
that array of size 9N/4 can fit into the space vacated by the original
array and first growth, N+3N/2 = 10N/4 > 9N/4, leading to less
fragmentation in memory).
Our worst case is still 3/2N wasted bits (you set bit N-1, then setting
bit N causes us to grow by 3/2), but our average should be much better.
This isn't usually that big a deal, but it will matter as we shift the
reachability bitmap generation code to store more bitmaps in memory.
Signed-off-by: Jeff King <peff@peff.net>
Signed-off-by: Taylor Blau <me@ttaylorr.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
2020-12-08 23:03:42 +01:00
|
|
|
size_t old_size = self->word_alloc;
|
|
|
|
ALLOC_GROW(self->words, word_alloc, self->word_alloc);
|
|
|
|
memset(self->words + old_size, 0x0,
|
|
|
|
(self->word_alloc - old_size) * sizeof(eword_t));
|
2020-12-08 23:03:38 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
void bitmap_set(struct bitmap *self, size_t pos)
|
|
|
|
{
|
|
|
|
size_t block = EWAH_BLOCK(pos);
|
2013-11-14 13:43:51 +01:00
|
|
|
|
2020-12-08 23:03:38 +01:00
|
|
|
bitmap_grow(self, block + 1);
|
2015-06-03 08:39:17 +02:00
|
|
|
self->words[block] |= EWAH_MASK(pos);
|
2013-11-14 13:43:51 +01:00
|
|
|
}
|
|
|
|
|
2020-02-14 19:22:34 +01:00
|
|
|
void bitmap_unset(struct bitmap *self, size_t pos)
|
|
|
|
{
|
|
|
|
size_t block = EWAH_BLOCK(pos);
|
|
|
|
|
|
|
|
if (block < self->word_alloc)
|
|
|
|
self->words[block] &= ~EWAH_MASK(pos);
|
|
|
|
}
|
|
|
|
|
2013-11-14 13:43:51 +01:00
|
|
|
int bitmap_get(struct bitmap *self, size_t pos)
|
|
|
|
{
|
2015-06-03 08:39:17 +02:00
|
|
|
size_t block = EWAH_BLOCK(pos);
|
2013-11-14 13:43:51 +01:00
|
|
|
return block < self->word_alloc &&
|
2015-06-03 08:39:17 +02:00
|
|
|
(self->words[block] & EWAH_MASK(pos)) != 0;
|
2013-11-14 13:43:51 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
struct ewah_bitmap *bitmap_to_ewah(struct bitmap *bitmap)
|
|
|
|
{
|
|
|
|
struct ewah_bitmap *ewah = ewah_new();
|
|
|
|
size_t i, running_empty_words = 0;
|
|
|
|
eword_t last_word = 0;
|
|
|
|
|
|
|
|
for (i = 0; i < bitmap->word_alloc; ++i) {
|
|
|
|
if (bitmap->words[i] == 0) {
|
|
|
|
running_empty_words++;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (last_word != 0)
|
|
|
|
ewah_add(ewah, last_word);
|
|
|
|
|
|
|
|
if (running_empty_words > 0) {
|
|
|
|
ewah_add_empty_words(ewah, 0, running_empty_words);
|
|
|
|
running_empty_words = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
last_word = bitmap->words[i];
|
|
|
|
}
|
|
|
|
|
|
|
|
ewah_add(ewah, last_word);
|
|
|
|
return ewah;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct bitmap *ewah_to_bitmap(struct ewah_bitmap *ewah)
|
|
|
|
{
|
|
|
|
struct bitmap *bitmap = bitmap_new();
|
|
|
|
struct ewah_iterator it;
|
|
|
|
eword_t blowup;
|
|
|
|
size_t i = 0;
|
|
|
|
|
|
|
|
ewah_iterator_init(&it, ewah);
|
|
|
|
|
|
|
|
while (ewah_iterator_next(&blowup, &it)) {
|
2016-02-22 23:45:15 +01:00
|
|
|
ALLOC_GROW(bitmap->words, i + 1, bitmap->word_alloc);
|
2013-11-14 13:43:51 +01:00
|
|
|
bitmap->words[i++] = blowup;
|
|
|
|
}
|
|
|
|
|
|
|
|
bitmap->word_alloc = i;
|
|
|
|
return bitmap;
|
|
|
|
}
|
|
|
|
|
|
|
|
void bitmap_and_not(struct bitmap *self, struct bitmap *other)
|
|
|
|
{
|
|
|
|
const size_t count = (self->word_alloc < other->word_alloc) ?
|
|
|
|
self->word_alloc : other->word_alloc;
|
|
|
|
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
for (i = 0; i < count; ++i)
|
|
|
|
self->words[i] &= ~other->words[i];
|
|
|
|
}
|
|
|
|
|
2020-12-08 23:03:46 +01:00
|
|
|
void bitmap_or(struct bitmap *self, const struct bitmap *other)
|
|
|
|
{
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
bitmap_grow(self, other->word_alloc);
|
|
|
|
for (i = 0; i < other->word_alloc; i++)
|
|
|
|
self->words[i] |= other->words[i];
|
|
|
|
}
|
|
|
|
|
2013-11-14 13:43:51 +01:00
|
|
|
void bitmap_or_ewah(struct bitmap *self, struct ewah_bitmap *other)
|
|
|
|
{
|
|
|
|
size_t original_size = self->word_alloc;
|
2015-06-03 08:39:37 +02:00
|
|
|
size_t other_final = (other->bit_size / BITS_IN_EWORD) + 1;
|
2013-11-14 13:43:51 +01:00
|
|
|
size_t i = 0;
|
|
|
|
struct ewah_iterator it;
|
|
|
|
eword_t word;
|
|
|
|
|
|
|
|
if (self->word_alloc < other_final) {
|
|
|
|
self->word_alloc = other_final;
|
2016-02-22 23:45:15 +01:00
|
|
|
REALLOC_ARRAY(self->words, self->word_alloc);
|
2013-11-14 13:43:51 +01:00
|
|
|
memset(self->words + original_size, 0x0,
|
|
|
|
(self->word_alloc - original_size) * sizeof(eword_t));
|
|
|
|
}
|
|
|
|
|
|
|
|
ewah_iterator_init(&it, other);
|
|
|
|
|
|
|
|
while (ewah_iterator_next(&word, &it))
|
|
|
|
self->words[i++] |= word;
|
|
|
|
}
|
|
|
|
|
|
|
|
size_t bitmap_popcount(struct bitmap *self)
|
|
|
|
{
|
|
|
|
size_t i, count = 0;
|
|
|
|
|
|
|
|
for (i = 0; i < self->word_alloc; ++i)
|
|
|
|
count += ewah_bit_popcount64(self->words[i]);
|
|
|
|
|
|
|
|
return count;
|
|
|
|
}
|
|
|
|
|
|
|
|
int bitmap_equals(struct bitmap *self, struct bitmap *other)
|
|
|
|
{
|
|
|
|
struct bitmap *big, *small;
|
|
|
|
size_t i;
|
|
|
|
|
|
|
|
if (self->word_alloc < other->word_alloc) {
|
|
|
|
small = self;
|
|
|
|
big = other;
|
|
|
|
} else {
|
|
|
|
small = other;
|
|
|
|
big = self;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < small->word_alloc; ++i) {
|
|
|
|
if (small->words[i] != big->words[i])
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (; i < big->word_alloc; ++i) {
|
|
|
|
if (big->words[i] != 0)
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2020-12-08 23:04:08 +01:00
|
|
|
int bitmap_is_subset(struct bitmap *self, struct bitmap *other)
|
|
|
|
{
|
|
|
|
size_t common_size, i;
|
|
|
|
|
|
|
|
if (self->word_alloc < other->word_alloc)
|
|
|
|
common_size = self->word_alloc;
|
|
|
|
else {
|
|
|
|
common_size = other->word_alloc;
|
|
|
|
for (i = common_size; i < self->word_alloc; i++) {
|
|
|
|
if (self->words[i])
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
for (i = 0; i < common_size; i++) {
|
|
|
|
if (self->words[i] & ~other->words[i])
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2013-11-14 13:43:51 +01:00
|
|
|
void bitmap_reset(struct bitmap *bitmap)
|
|
|
|
{
|
|
|
|
memset(bitmap->words, 0x0, bitmap->word_alloc * sizeof(eword_t));
|
|
|
|
}
|
|
|
|
|
|
|
|
void bitmap_free(struct bitmap *bitmap)
|
|
|
|
{
|
|
|
|
if (bitmap == NULL)
|
|
|
|
return;
|
|
|
|
|
|
|
|
free(bitmap->words);
|
|
|
|
free(bitmap);
|
|
|
|
}
|