ref: 7f4f1776a930dc9b80f099ca869b0827bbc54383
parent: 6f1419495d556e914f5a4afa05c5f3cc8b0e1849
author: Ori Bernstein <[email protected]>
date: Wed Jan 4 11:43:43 EST 2017
Speed up bitset. Merge back Quentin's perf hacks.
--- a/util/bitset.c
+++ b/util/bitset.c
@@ -106,6 +106,31 @@
return n;
}
+inline static int firstbit(size_t b)
+{
+ int n;
+
+ n = 0;
+ if (!(b & 0xffffffff)) {
+ n += 32;
+ b >>= 32;
+ }
+ if (!(b & 0xffff)) {
+ n += 16;
+ b >>= 16;
+ }
+ if (!(b & 0xff)) {
+ n += 8;
+ b >>= 8;
+ }
+ if (!(b & 0xf)) {
+ n += 4;
+ b >>= 4;
+ }
+ n += (char[16]){4,0,1,0,2,0,1,0,3,0,1,0,2,0,1,0}[b & 0xf];
+ return n;
+}
+
/* A slightly tricky function to iterate over the contents
* of a bitset. It returns true immediately if 'elt' is in
* the bitset, otherwise it seeks forward to the next value
@@ -125,18 +150,24 @@
*/
int bsiter(Bitset *bs, size_t *elt)
{
- size_t i;
+ size_t b, t, i;
- for (i = *elt; i < bsmax(bs); i++) {
- while (i < bsmax(bs) && !bs->chunks[i / Sizetbits])
- i = (i + Sizetbits) & ~(Sizetbits - 1);
- if (bshas(bs, i)) {
- *elt = i;
- return 1;
- }
+ i = *elt;
+ t = i/Sizetbits;
+ if (t >= bs->nchunks)
+ return 0;
+ b = bs->chunks[t];
+ b &= ~((1ull << (i%Sizetbits)) - 1);
+ while (!b) {
+ ++t;
+ if (t >= bs->nchunks)
+ return 0;
+ b = bs->chunks[t];
}
- return 0;
+ *elt = Sizetbits*t + firstbit(b);
+ return 1;
}
+
/* Returns the largest value that the bitset can possibly
* hold. It's conservative, but scanning the entire bitset
--- a/util/util.h
+++ b/util/util.h
@@ -83,6 +83,7 @@
int bsiter(Bitset *bs, size_t *elt);
size_t bsmax(Bitset *bs);
size_t bscount(Bitset *bs);
+
/* inline for speed */
static inline int bshas(Bitset *bs, size_t elt)
{