vcpe/srcs/libs/bitset/bitset.c

383 lines
13 KiB
C

#include <stdlib.h>
#include <stdint.h>
#include <string.h>
#include "bitset/bitset.h"
/* Create a new bitset. Return NULL in case of failure. */
bitset_t *bitset_create() {
bitset_t *bitset = NULL;
/* Allocate the bitset itself. */
if ((bitset = (bitset_t *)malloc(sizeof(bitset_t))) == NULL) {
return NULL;
}
bitset->array = NULL;
bitset->arraysize = 0;
bitset->capacity = 0;
return bitset;
}
/* Create a new bitset able to contain size bits. Return NULL in case of failure. */
bitset_t *bitset_create_with_capacity(size_t size) {
bitset_t *bitset = NULL;
/* Allocate the bitset itself. */
if ((bitset = (bitset_t *)malloc(sizeof(bitset_t))) == NULL) {
return NULL;
}
bitset->arraysize = (size + sizeof(uint64_t) * 8 - 1) / (sizeof(uint64_t) * 8);
bitset->capacity = bitset->arraysize;
if ((bitset->array = (uint64_t *)calloc(bitset->arraysize, sizeof(uint64_t))) == NULL) {
free(bitset);
return NULL;
}
return bitset;
}
/* Create a copy */
bitset_t *bitset_copy(const bitset_t *bitset) {
bitset_t *copy = NULL;
/* Allocate the bitset itself. */
if ((copy = (bitset_t *)malloc(sizeof(bitset_t))) == NULL) {
return NULL;
}
memcpy(copy, bitset, sizeof(bitset_t));
copy->capacity = copy->arraysize;
if ((copy->array = (uint64_t *)malloc(sizeof(uint64_t) * bitset->arraysize)) == NULL) {
free(copy);
return NULL;
}
memcpy(copy->array, bitset->array, sizeof(uint64_t) * bitset->arraysize);
return copy;
}
void bitset_clear(bitset_t *bitset) {
memset(bitset->array, 0, sizeof(uint64_t) * bitset->arraysize);
}
void bitset_shift_left(bitset_t *bitset, size_t s) {
size_t extra_words = s / 64;
int inword_shift = (int)(s % 64);
size_t as = bitset->arraysize;
if (inword_shift == 0) {
bitset_resize(bitset, as + extra_words, FALSE);
// could be done with a memmove
for (size_t i = as + extra_words; i > extra_words; i--) {
bitset->array[i - 1] = bitset->array[i - 1 - extra_words];
}
} else {
bitset_resize(bitset, as + extra_words + 1, TRUE);
bitset->array[as + extra_words] = bitset->array[as - 1] >> (64 - inword_shift);
for (size_t i = as + extra_words; i >= extra_words + 2; i--) {
bitset->array[i - 1] = (bitset->array[i - 1 - extra_words] << inword_shift) |
(bitset->array[i - 2 - extra_words] >> (64 - inword_shift));
}
bitset->array[extra_words] = bitset->array[0] << inword_shift;
}
for (size_t i = 0; i < extra_words; i++) {
bitset->array[i] = 0;
}
}
void bitset_shift_right(bitset_t *bitset, size_t s) {
size_t extra_words = s / 64;
int inword_shift = (int)(s % 64);
size_t as = bitset->arraysize;
if (inword_shift == 0) {
// could be done with a memmove
for (size_t i = 0; i < as - extra_words; i++) {
bitset->array[i] = bitset->array[i + extra_words];
}
bitset_resize(bitset, as - extra_words, FALSE);
} else {
for (size_t i = 0; i + extra_words + 1 < as; i++) {
bitset->array[i] = (bitset->array[i + extra_words] >> inword_shift) |
(bitset->array[i + extra_words + 1] << (64 - inword_shift));
}
bitset->array[as - extra_words - 1] = (bitset->array[as - 1] >> inword_shift);
bitset_resize(bitset, as - extra_words, FALSE);
}
}
/* Free memory. */
void bitset_free(bitset_t *bitset) {
free(bitset->array);
free(bitset);
}
/* Resize the bitset so that it can support newarraysize * 64 bits. Return TRUE in case of success, FALSE for failure. */
int bitset_resize(bitset_t *bitset, size_t newarraysize, int padwithzeroes) {
size_t smallest = newarraysize < bitset->arraysize ? newarraysize : bitset->arraysize;
if (bitset->capacity < newarraysize) {
uint64_t *newarray;
bitset->capacity = newarraysize * 2;
if ((newarray = (uint64_t *)realloc(bitset->array, sizeof(uint64_t) * bitset->capacity)) == NULL) {
free(bitset->array);
return FALSE;
}
bitset->array = newarray;
}
if (padwithzeroes && (newarraysize > smallest)) {
memset(bitset->array + smallest, 0, sizeof(uint64_t) * (newarraysize - smallest));
}
bitset->arraysize = newarraysize;
return TRUE; // success!
}
size_t bitset_count(const bitset_t *bitset) {
size_t card = 0;
size_t k = 0;
// assumes that long long is 8 bytes
for (; k + 7 < bitset->arraysize; k += 8) {
card += __builtin_popcountll(bitset->array[k]);
card += __builtin_popcountll(bitset->array[k + 1]);
card += __builtin_popcountll(bitset->array[k + 2]);
card += __builtin_popcountll(bitset->array[k + 3]);
card += __builtin_popcountll(bitset->array[k + 4]);
card += __builtin_popcountll(bitset->array[k + 5]);
card += __builtin_popcountll(bitset->array[k + 6]);
card += __builtin_popcountll(bitset->array[k + 7]);
}
for (; k + 3 < bitset->arraysize; k += 4) {
card += __builtin_popcountll(bitset->array[k]);
card += __builtin_popcountll(bitset->array[k + 1]);
card += __builtin_popcountll(bitset->array[k + 2]);
card += __builtin_popcountll(bitset->array[k + 3]);
}
for (; k < bitset->arraysize; k++) {
card += __builtin_popcountll(bitset->array[k]);
}
return card;
}
int bitset_inplace_union(bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
for (size_t k = 0; k < minlength; ++k) {
b1->array[k] |= b2->array[k];
}
if (b2->arraysize > b1->arraysize) {
size_t oldsize = b1->arraysize;
if (!bitset_resize(b1, b2->arraysize, FALSE)) {
return FALSE;
}
memcpy(b1->array + oldsize, b2->array + oldsize, (b2->arraysize - oldsize) * sizeof(uint64_t));
}
return TRUE;
}
size_t bitset_minimum(const bitset_t *bitset) {
for (size_t k = 0; k < bitset->arraysize; k++) {
uint64_t w = bitset->array[k];
if (w != 0) {
return __builtin_ctzll(w) + k * 64;
}
}
return 0;
}
size_t bitset_maximum(const bitset_t *bitset) {
for (size_t k = bitset->arraysize; k > 0; k--) {
uint64_t w = bitset->array[k - 1];
if (w != 0) {
return 63 - __builtin_clzll(w) + (k - 1) * 64;
}
}
return 0;
}
/* Returns TRUE if bitsets share no common elements, FALSE otherwise.
*
* Performs early-out if common element found. */
int bitsets_disjoint(const bitset_t *b1, const bitset_t *b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
for (size_t k = 0; k < minlength; k++) {
if ((b1->array[k] & b2->array[k]) != 0) {
return FALSE;
}
}
return TRUE;
}
/* Returns TRUE if bitsets contain at least 1 common element, FALSE if they are
* disjoint.
*
* Performs early-out if common element found. */
int bitsets_intersect(const bitset_t *b1, const bitset_t *b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
for (size_t k = 0; k < minlength; k++) {
if ((b1->array[k] & b2->array[k]) != 0) {
return TRUE;
}
}
return FALSE;
}
/* Returns TRUE if b has any bits set in or after b->array[starting_loc]. */
static int any_bits_set(const bitset_t *b, size_t starting_loc) {
if (starting_loc >= b->arraysize) {
return FALSE;
}
for (size_t k = starting_loc; k < b->arraysize; k++) {
if (b->array[k] != 0) {
return TRUE;
}
}
return FALSE;
}
/* Returns TRUE if b1 has all of b2's bits set.
*
* Performs early out if a bit is found in b2 that is not found in b1. */
int bitset_contains_all(const bitset_t *b1, const bitset_t *b2) {
for (size_t k = 0; k < b1->arraysize; k++) {
if ((b1->array[k] & b2->array[k]) != b2->array[k]) {
return FALSE;
}
}
if (b2->arraysize > b1->arraysize) {
/* Need to check if b2 has any bits set beyond b1's array */
return !any_bits_set(b2, b1->arraysize);
}
return TRUE;
}
size_t bitset_union_count(const bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t answer = 0;
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
size_t k = 0;
for (; k + 3 < minlength; k += 4) {
answer += __builtin_popcountll(b1->array[k] | b2->array[k]);
answer += __builtin_popcountll(b1->array[k + 1] | b2->array[k + 1]);
answer += __builtin_popcountll(b1->array[k + 2] | b2->array[k + 2]);
answer += __builtin_popcountll(b1->array[k + 3] | b2->array[k + 3]);
}
for (; k < minlength; ++k) {
answer += __builtin_popcountll(b1->array[k] | b2->array[k]);
}
if (b2->arraysize > b1->arraysize) {
//k = b1->arraysize;
for (; k + 3 < b2->arraysize; k += 4) {
answer += __builtin_popcountll(b2->array[k]);
answer += __builtin_popcountll(b2->array[k + 1]);
answer += __builtin_popcountll(b2->array[k + 2]);
answer += __builtin_popcountll(b2->array[k + 3]);
}
for (; k < b2->arraysize; ++k) {
answer += __builtin_popcountll(b2->array[k]);
}
} else {
//k = b2->arraysize;
for (; k + 3 < b1->arraysize; k += 4) {
answer += __builtin_popcountll(b1->array[k]);
answer += __builtin_popcountll(b1->array[k + 1]);
answer += __builtin_popcountll(b1->array[k + 2]);
answer += __builtin_popcountll(b1->array[k + 3]);
}
for (; k < b1->arraysize; ++k) {
answer += __builtin_popcountll(b1->array[k]);
}
}
return answer;
}
void bitset_inplace_intersection(bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
size_t k = 0;
for (; k < minlength; ++k) {
b1->array[k] &= b2->array[k];
}
for (; k < b1->arraysize; ++k) {
b1->array[k] = 0; // memset could, maybe, be a tiny bit faster
}
}
size_t bitset_intersection_count(const bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t answer = 0;
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
for (size_t k = 0; k < minlength; ++k) {
answer += __builtin_popcountll(b1->array[k] & b2->array[k]);
}
return answer;
}
void bitset_inplace_difference(bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
size_t k = 0;
for (; k < minlength; ++k) {
b1->array[k] &= ~(b2->array[k]);
}
}
size_t bitset_difference_count(const bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
size_t k = 0;
size_t answer = 0;
for (; k < minlength; ++k) {
answer += __builtin_popcountll(b1->array[k] & ~(b2->array[k]));
}
for (; k < b1->arraysize; ++k) {
answer += __builtin_popcountll(b1->array[k]);
}
return answer;
}
int bitset_inplace_symmetric_difference(bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
size_t k = 0;
for (; k < minlength; ++k) {
b1->array[k] ^= b2->array[k];
}
if (b2->arraysize > b1->arraysize) {
size_t oldsize = b1->arraysize;
if (!bitset_resize(b1, b2->arraysize, FALSE)) {
return FALSE;
}
memcpy(b1->array + oldsize, b2->array + oldsize, (b2->arraysize - oldsize) * sizeof(uint64_t));
}
return TRUE;
}
size_t bitset_symmetric_difference_count(const bitset_t *CBITSET_RESTRICT b1, const bitset_t *CBITSET_RESTRICT b2) {
size_t minlength = b1->arraysize < b2->arraysize ? b1->arraysize : b2->arraysize;
size_t k = 0;
size_t answer = 0;
for (; k < minlength; ++k) {
answer += __builtin_popcountll(b1->array[k] ^ b2->array[k]);
}
if (b2->arraysize > b1->arraysize) {
for (; k < b2->arraysize; ++k) {
answer += __builtin_popcountll(b2->array[k]);
}
} else {
for (; k < b1->arraysize; ++k) {
answer += __builtin_popcountll(b1->array[k]);
}
}
return answer;
}
int bitset_trim(bitset_t *bitset) {
size_t newsize = bitset->arraysize;
while (newsize > 0) {
if (bitset->array[newsize - 1] == 0) {
newsize -= 1;
} else {
break;
}
}
if (bitset->capacity == newsize) {
return TRUE; // nothing to do
}
bitset->capacity = newsize;
bitset->arraysize = newsize;
uint64_t *newarray;
if ((newarray = (uint64_t *)realloc(bitset->array, sizeof(uint64_t) * bitset->capacity)) == NULL) {
free(bitset->array);
return FALSE;
}
bitset->array = newarray;
return TRUE;
}