Lucene 源码分析集------- BitUtil

const uint8_t BitUtil::ntzTable[] = {
    8, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    6, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    7, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    6, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0,
    5, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0, 4, 0, 1, 0, 2, 0, 1, 0, 3, 0, 1, 0, 2, 0, 1, 0
};

BitUtil::~BitUtil() {
}

// 对于64位的int,返回其bit为1的个数

int32_t BitUtil::pop(int64_t x) {
    x = x - (MiscUtils::unsignedShift(x, (int64_t)1) & 0x5555555555555555LL);
    x = (x & 0x3333333333333333LL) + (MiscUtils::unsignedShift(x, (int64_t)2) & 0x3333333333333333LL);
    x = (x + MiscUtils::unsignedShift(x, (int64_t)4)) & 0x0f0f0f0f0f0f0f0fLL;
    x = x + MiscUtils::unsignedShift(x, (int64_t)8);
    x = x + MiscUtils::unsignedShift(x, (int64_t)16);
    x = x + MiscUtils::unsignedShift(x, (int64_t)32);
    return (int32_t)x & 0x7f;
}

//对于64int的数组,从第wordOffset个开始,一直计算numWords个,计算其中bit为1的个数

int64_t BitUtil::pop_array(const int64_t* A, int32_t wordOffset, int32_t numWords) {
    int32_t n = wordOffset + numWords;
    int64_t tot = 0;
    int64_t tot8 = 0;
    int64_t ones = 0;
    int64_t twos = 0;
    int64_t fours = 0;

    int32_t i = wordOffset;
    for (; i <= n - 8; i += 8) {
        int64_t twosA;
        CSA(twosA, ones, ones, A[i], A[i + 1]);

        int64_t twosB;
        CSA(twosB, ones, ones, A[i + 2], A[i + 3]);

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        CSA(twosA, ones, ones, A[i + 4], A[i + 5]);

        CSA(twosB, ones, ones, A[i + 6], A[i + 7]);

        int64_t foursB;
        CSA(foursB, twos, twos, twosA, twosB);

        int64_t eights;
        CSA(eights, fours, fours, foursA, foursB);

        tot8 += pop(eights);
    }

    // Handle trailing words in a binary-search manner.
    // Derived from the loop above by setting specific elements to 0.

    if (i <= n - 4) {
        int64_t twosA;
        CSA(twosA, ones, ones, A[i], A[i + 1]);

        int64_t twosB;
        CSA(twosB, ones, ones, A[i + 2], A[i + 3]);

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 4;
    }

    if (i <= n - 2) {
        int64_t twosA;
        CSA(twosA, ones, ones, A[i], A[i + 1]);

        int64_t foursA = twos & twosA;
        twos = twos ^ twosA;

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 2;
    }

    if (i < n) {
        tot += pop(A[i]);
    }

    tot += (pop(fours) << 2) + (pop(twos) << 1) + pop(ones) + (tot8 << 3);

    return tot;
}

int64_t BitUtil::pop_intersect(const int64_t* A, const int64_t* B, int32_t wordOffset, int32_t numWords) {
    int32_t n = wordOffset + numWords;
    int64_t tot = 0;
    int64_t tot8 = 0;
    int64_t ones = 0;
    int64_t twos = 0;
    int64_t fours = 0;

    int32_t i = wordOffset;
    for (; i <= n - 8; i += 8) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] & B[i]), (A[i + 1] & B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] & B[i + 2]), (A[i + 3] & B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        CSA(twosA, ones, ones, (A[i + 4] & B[i + 4]), (A[i + 5] & B[i + 5]));

        CSA(twosB, ones, ones, (A[i + 6] & B[i + 6]), (A[i + 7] & B[i + 7]));

        int64_t foursB;
        CSA(foursB, twos, twos, twosA, twosB);

        int64_t eights;
        CSA(eights, fours, fours, foursA, foursB);

        tot8 += pop(eights);
    }

    if (i <= n - 4) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] & B[i]), (A[i + 1] & B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] & B[i + 2]), (A[i + 3] & B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 4;
    }

    if (i <= n - 2) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] & B[i]), (A[i + 1] & B[i + 1]));

        int64_t foursA = twos & twosA;
        twos = twos ^ twosA;

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 2;
    }

    if (i < n) {
        tot += pop((A[i] & B[i]));
    }

    tot += (pop(fours) << 2) + (pop(twos) << 1) + pop(ones) + (tot8 << 3);

    return tot;
}

int64_t BitUtil::pop_union(const int64_t* A, const int64_t* B, int32_t wordOffset, int32_t numWords) {
    int32_t n = wordOffset + numWords;
    int64_t tot = 0;
    int64_t tot8 = 0;
    int64_t ones = 0;
    int64_t twos = 0;
    int64_t fours = 0;

    int32_t i = wordOffset;
    for (; i <= n - 8; i += 8) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] | B[i]), (A[i + 1] | B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] | B[i + 2]), (A[i + 3] | B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        CSA(twosA, ones, ones, (A[i + 4] | B[i + 4]), (A[i + 5] | B[i + 5]));

        CSA(twosB, ones, ones, (A[i + 6] | B[i + 6]), (A[i + 7] | B[i + 7]));

        int64_t foursB;
        CSA(foursB, twos, twos, twosA, twosB);

        int64_t eights;
        CSA(eights, fours, fours, foursA, foursB);

        tot8 += pop(eights);
    }

    if (i <= n - 4) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] | B[i]), (A[i + 1] | B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] | B[i + 2]), (A[i + 3] | B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 4;
    }

    if (i <= n - 2) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] | B[i]), (A[i + 1] | B[i + 1]));

        int64_t foursA = twos & twosA;
        twos = twos ^ twosA;

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 2;
    }

    if (i < n) {
        tot += pop((A[i] | B[i]));
    }

    tot += (pop(fours) << 2) + (pop(twos) << 1) + pop(ones) + (tot8 << 3);

    return tot;
}

int64_t BitUtil::pop_andnot(const int64_t* A, const int64_t* B, int32_t wordOffset, int32_t numWords) {
    int32_t n = wordOffset + numWords;
    int64_t tot = 0;
    int64_t tot8 = 0;
    int64_t ones = 0;
    int64_t twos = 0;
    int64_t fours = 0;

    int32_t i = wordOffset;
    for (; i <= n - 8; i += 8) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] & ~B[i]), (A[i + 1] & ~B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] & ~B[i + 2]), (A[i + 3] & ~B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        CSA(twosA, ones, ones, (A[i + 4] & ~B[i + 4]), (A[i + 5] & ~B[i + 5]));

        CSA(twosB, ones, ones, (A[i + 6] & ~B[i + 6]), (A[i + 7] & ~B[i + 7]));

        int64_t foursB;
        CSA(foursB, twos, twos, twosA, twosB);

        int64_t eights;
        CSA(eights, fours, fours, foursA, foursB);

        tot8 += pop(eights);
    }

    if (i <= n - 4) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] & ~B[i]), (A[i + 1] & ~B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] & ~B[i + 2]), (A[i + 3] & ~B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 4;
    }

    if (i <= n - 2) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] & ~B[i]), (A[i + 1] & ~B[i + 1]));

        int64_t foursA = twos & twosA;
        twos = twos ^ twosA;

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 2;
    }

    if (i < n) {
        tot += pop((A[i] & ~B[i]));
    }

    tot += (pop(fours) << 2) + (pop(twos) << 1) + pop(ones) + (tot8 << 3);

    return tot;
}

int64_t BitUtil::pop_xor(const int64_t* A, const int64_t* B, int32_t wordOffset, int32_t numWords) {
    int32_t n = wordOffset + numWords;
    int64_t tot = 0;
    int64_t tot8 = 0;
    int64_t ones = 0;
    int64_t twos = 0;
    int64_t fours = 0;

    int32_t i = wordOffset;
    for (; i <= n - 8; i += 8) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] ^ B[i]), (A[i + 1] ^ B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] ^ B[i + 2]), (A[i + 3] ^ B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        CSA(twosA, ones, ones, (A[i + 4] ^ B[i + 4]), (A[i + 5] ^ B[i + 5]));

        CSA(twosB, ones, ones, (A[i + 6] ^ B[i + 6]), (A[i + 7] ^ B[i + 7]));

        int64_t foursB;
        CSA(foursB, twos, twos, twosA, twosB);

        int64_t eights;
        CSA(eights, fours, fours, foursA, foursB);

        tot8 += pop(eights);
    }

    if (i <= n - 4) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] ^ B[i]), (A[i + 1] ^ B[i + 1]));

        int64_t twosB;
        CSA(twosB, ones, ones, (A[i + 2] ^ B[i + 2]), (A[i + 3] ^ B[i + 3]));

        int64_t foursA;
        CSA(foursA, twos, twos, twosA, twosB);

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 4;
    }

    if (i <= n - 2) {
        int64_t twosA;
        CSA(twosA, ones, ones, (A[i] ^ B[i]), (A[i + 1] ^ B[i + 1]));

        int64_t foursA = twos & twosA;
        twos = twos ^ twosA;

        int64_t eights = fours & foursA;
        fours = fours ^ foursA;

        tot8 += pop(eights);
        i += 2;
    }

    if (i < n) {
        tot += pop((A[i] ^ B[i]));
    }

    tot += (pop(fours) << 2) + (pop(twos) << 1) + pop(ones) + (tot8 << 3);

    return tot;
}

void BitUtil::CSA(int64_t& h, int64_t& l, int64_t a, int64_t b, int64_t c) {
    int64_t u = a ^ b;
    h = (a & b) | (u & c);
    l = u ^ c;
}

//对于64位int,计算其二进制的尾部有几个0

int32_t BitUtil::ntz(int64_t val) {
    // A full binary search to determine the low byte was slower than a linear search for nextSetBit().
    // This is most likely because the implementation of nextSetBit() shifts bits to the right, increasing
    // the probability that the first non-zero byte is in the rhs.

    // This implementation does a single binary search at the top level only so that all other bit shifting
    // can be done on ints instead of longs to remain friendly to 32 bit architectures.  In addition, the
    // case of a non-zero first byte is checked for first because it is the most common in dense bit arrays.

    int32_t lower = (int32_t)val;
    int32_t lowByte = lower & 0xff;
    if (lowByte != 0) {
        return ntzTable[lowByte];
    }

    if (lower != 0) {
        lowByte = MiscUtils::unsignedShift(lower, 8) & 0xff;
        if (lowByte != 0) {
            return ntzTable[lowByte] + 8;
        }
        lowByte = MiscUtils::unsignedShift(lower, 16) & 0xff;
        if (lowByte != 0) {
            return ntzTable[lowByte] + 16;
        }
        // no need to mask off low byte for the last byte in the 32 bit word
        // no need to check for zero on the last byte either.
        return ntzTable[MiscUtils::unsignedShift(lower, 24)] + 24;
    } else {
        // grab upper 32 bits
        int32_t upper = (int32_t)(val >> 32);
        lowByte = upper & 0xff;
        if (lowByte != 0) {
            return ntzTable[lowByte] + 32;
        }
        lowByte = MiscUtils::unsignedShift(upper, 8) & 0xff;
        if (lowByte != 0) {
            return ntzTable[lowByte] + 40;
        }
        lowByte = MiscUtils::unsignedShift(upper, 16) & 0xff;
        if (lowByte != 0) {
            return ntzTable[lowByte] + 48;
        }
        // no need to mask off low byte for the last byte in the 32 bit word
        // no need to check for zero on the last byte either.
        return ntzTable[MiscUtils::unsignedShift(upper, 24)] + 56;
    }
}

int32_t BitUtil::ntz(int32_t val) {
    // This implementation does a single binary search at the top level only.  In addition, the case
    // of a non-zero first byte is checked for first because it is the most common in dense bit arrays.

    int32_t lowByte = val & 0xff;
    if (lowByte != 0) {
        return ntzTable[lowByte];
    }
    lowByte = MiscUtils::unsignedShift(val, 8) & 0xff;
    if (lowByte != 0) {
        return ntzTable[lowByte] + 8;
    }
    lowByte = MiscUtils::unsignedShift(val, 16) & 0xff;
    if (lowByte != 0) {
        return ntzTable[lowByte] + 16;
    }
    // no need to mask off low byte for the last byte.
    // no need to check for zero on the last byte either.
    return ntzTable[MiscUtils::unsignedShift(val, 24)] + 24;
}

int32_t BitUtil::ntz2(int64_t x) {
    int32_t n = 0;
    int32_t y = (int32_t)x;
    if (y == 0) { // the only 64 bit shift necessary
        n += 32;
        y = (int32_t)MiscUtils::unsignedShift(x, (int64_t)32);
    }
    if ((y & 0x0000ffff) == 0) {
        n += 16;
        y = MiscUtils::unsignedShift(y, 16);
    }
    if ((y & 0x000000ff) == 0) {
        n += 8;
        y = MiscUtils::unsignedShift(y, 8);
    }
    return (ntzTable[y & 0xff]) + n;
}

int32_t BitUtil::ntz3(int64_t x) {
    int32_t n = 1;

    // do the first step as a long, all others as ints.
    int32_t y = (int32_t)x;
    if (y == 0) {
        n += 32;
        y = (int32_t)MiscUtils::unsignedShift(x, (int64_t)32);
    }
    if ((y & 0x0000ffff) == 0) {
        n += 16;
        y = MiscUtils::unsignedShift(y, 16);
    }
    if ((y & 0x000000ff) == 0) {
        n += 8;
        y = MiscUtils::unsignedShift(y, 8);
    }
    if ((y & 0x0000000f) == 0) {
        n += 4;
        y = MiscUtils::unsignedShift(y, 4);
    }
    if ((y & 0x00000003) == 0) {
        n += 2;
        y = MiscUtils::unsignedShift(y, 2);
    }
    return n - (y & 1);
}

// 是否2的幂次方

bool BitUtil::isPowerOfTwo(int32_t v) {
    return ((v & (v - 1)) == 0);
}

bool BitUtil::isPowerOfTwo(int64_t v) {
    return ((v & (v - 1)) == 0);
}

//对于32位int,计算大于等于当前值的最近的一个2的幂次方

int32_t BitUtil::nextHighestPowerOfTwo(int32_t v) {
    --v;
    v |= v >> 1;
    v |= v >> 2;
    v |= v >> 4;
    v |= v >> 8;
    v |= v >> 16;
    return ++v;
}

int64_t BitUtil::nextHighestPowerOfTwo(int64_t v) {
    --v;
    v |= v >> 1;
    v |= v >> 2;
    v |= v >> 4;
    v |= v >> 8;
    v |= v >> 16;
    v |= v >> 32;
    return ++v;
}

 

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值