New bit manipulation functions and 128-bit value library (#7338)
Summary: These new functions and 128-bit value bit operations are expected to be used in a forthcoming Bloom filter alternative. No functional changes to production code, just new code only called by unit tests, cosmetic changes to existing headers, and fix an existing function for a yet-unused template instantiation (BitsSetToOne on something signed and smaller than 32 bits). Pull Request resolved: https://github.com/facebook/rocksdb/pull/7338 Test Plan: Unit tests included. Works with and without TEST_UINT128_COMPAT=1 to check compatibility with and without __uint128_t. Also added that parameter to the CircleCI build build-linux-shared_lib-alt_namespace-status_checked. Reviewed By: jay-zhuang Differential Revision: D23494945 Pulled By: pdillinger fbshipit-source-id: 5c0dc419100d9df5d4d9abb153b2855d5aea39e8
main
parent
a09c3cf13e
commit
c4d8838a2b
@ -0,0 +1,223 @@ |
|||||||
|
// Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
|
||||||
|
// This source code is licensed under both the GPLv2 (found in the
|
||||||
|
// COPYING file in the root directory) and Apache 2.0 License
|
||||||
|
// (found in the LICENSE.Apache file in the root directory).
|
||||||
|
|
||||||
|
#pragma once |
||||||
|
|
||||||
|
#include "util/coding.h" |
||||||
|
#include "util/math.h" |
||||||
|
|
||||||
|
#ifdef TEST_UINT128_COMPAT |
||||||
|
#undef HAVE_UINT128_EXTENSION |
||||||
|
#endif |
||||||
|
|
||||||
|
namespace ROCKSDB_NAMESPACE { |
||||||
|
|
||||||
|
// Unsigned128 is a 128 bit value supporting (at least) bitwise operators,
|
||||||
|
// shifts, and comparisons. __uint128_t is not always available.
|
||||||
|
|
||||||
|
#ifdef HAVE_UINT128_EXTENSION |
||||||
|
using Unsigned128 = __uint128_t; |
||||||
|
#else |
||||||
|
// Portable fallback representation of a 128-bit unsigned value, stored as
// two 64-bit halves. Only used when the __uint128_t extension is unavailable
// (or disabled for testing).
struct Unsigned128 {
  uint64_t lo;  // least-significant 64 bits
  uint64_t hi;  // most-significant 64 bits

  // Default construction yields the value zero.
  inline Unsigned128() : lo(0), hi(0) {
    // The struct must be exactly two packed 64-bit words.
    static_assert(sizeof(Unsigned128) == 2 * sizeof(uint64_t),
                  "unexpected overhead in representation");
  }

  // Widening conversion from a 64-bit value; the upper half is zero.
  // Deliberately not `explicit`, so 64-bit values convert implicitly
  // (mirroring how they convert to __uint128_t).
  inline Unsigned128(uint64_t lower) : lo(lower), hi(0) {}

  // Builds a value from its lower and upper 64-bit halves.
  inline Unsigned128(uint64_t lower, uint64_t upper) : lo(lower), hi(upper) {}
};
||||||
|
|
||||||
|
// Left shift of a 128-bit value. The shift count is reduced modulo 128.
inline Unsigned128 operator<<(const Unsigned128& lhs, unsigned shift) {
  const unsigned amount = shift & 127;
  if (amount >= 64) {
    // Everything in the lower half moves into the upper half; the lower
    // half becomes zero.
    return Unsigned128(0, lhs.lo << (amount - 64));
  }
  // Bits carried from the lower half into the upper half. The shift is
  // split as ">> 1 >> (63 - amount)" so that amount == 0 shifts away
  // everything without ever shifting a 64-bit value by 64, and without a
  // separate branch on amount == 0.
  const uint64_t carried = (lhs.lo >> 1) >> (63 - amount);
  return Unsigned128(lhs.lo << amount, carried | (lhs.hi << amount));
}
||||||
|
|
||||||
|
// In-place left shift; returns a reference to the updated operand.
inline Unsigned128& operator<<=(Unsigned128& lhs, unsigned shift) {
  return lhs = (lhs << shift);
}
||||||
|
|
||||||
|
// Logical right shift of a 128-bit value. The shift count is reduced
// modulo 128.
inline Unsigned128 operator>>(const Unsigned128& lhs, unsigned shift) {
  const unsigned amount = shift & 127;
  if (amount >= 64) {
    // Everything in the upper half moves into the lower half; the upper
    // half becomes zero.
    return Unsigned128(lhs.hi >> (amount - 64), 0);
  }
  // Bits carried from the upper half into the lower half. The shift is
  // split as "<< 1 << (63 - amount)" so that amount == 0 shifts away
  // everything without ever shifting a 64-bit value by 64.
  const uint64_t carried = (lhs.hi << 1) << (63 - amount);
  return Unsigned128(carried | (lhs.lo >> amount), lhs.hi >> amount);
}
||||||
|
|
||||||
|
// In-place right shift; returns a reference to the updated operand.
inline Unsigned128& operator>>=(Unsigned128& lhs, unsigned shift) {
  return lhs = (lhs >> shift);
}
||||||
|
|
||||||
|
// Bitwise AND, applied independently to each 64-bit half.
inline Unsigned128 operator&(const Unsigned128& lhs, const Unsigned128& rhs) {
  const uint64_t lower = lhs.lo & rhs.lo;
  const uint64_t upper = lhs.hi & rhs.hi;
  return Unsigned128(lower, upper);
}
||||||
|
|
||||||
|
// In-place bitwise AND; returns a reference to the updated operand.
inline Unsigned128& operator&=(Unsigned128& lhs, const Unsigned128& rhs) {
  lhs.lo &= rhs.lo;
  lhs.hi &= rhs.hi;
  return lhs;
}
||||||
|
|
||||||
|
// Bitwise OR, applied independently to each 64-bit half.
inline Unsigned128 operator|(const Unsigned128& lhs, const Unsigned128& rhs) {
  const uint64_t lower = lhs.lo | rhs.lo;
  const uint64_t upper = lhs.hi | rhs.hi;
  return Unsigned128(lower, upper);
}
||||||
|
|
||||||
|
// In-place bitwise OR; returns a reference to the updated operand.
inline Unsigned128& operator|=(Unsigned128& lhs, const Unsigned128& rhs) {
  lhs.lo |= rhs.lo;
  lhs.hi |= rhs.hi;
  return lhs;
}
||||||
|
|
||||||
|
// Bitwise XOR, applied independently to each 64-bit half.
inline Unsigned128 operator^(const Unsigned128& lhs, const Unsigned128& rhs) {
  const uint64_t lower = lhs.lo ^ rhs.lo;
  const uint64_t upper = lhs.hi ^ rhs.hi;
  return Unsigned128(lower, upper);
}
||||||
|
|
||||||
|
// In-place bitwise XOR; returns a reference to the updated operand.
inline Unsigned128& operator^=(Unsigned128& lhs, const Unsigned128& rhs) {
  lhs.lo ^= rhs.lo;
  lhs.hi ^= rhs.hi;
  return lhs;
}
||||||
|
|
||||||
|
// Bitwise complement of all 128 bits.
inline Unsigned128 operator~(const Unsigned128& v) {
  const uint64_t lower = ~v.lo;
  const uint64_t upper = ~v.hi;
  return Unsigned128(lower, upper);
}
||||||
|
|
||||||
|
// Two values are equal when both of their halves match.
inline bool operator==(const Unsigned128& lhs, const Unsigned128& rhs) {
  if (lhs.lo != rhs.lo) {
    return false;
  }
  return lhs.hi == rhs.hi;
}
||||||
|
|
||||||
|
// Two values differ when either of their halves differs.
inline bool operator!=(const Unsigned128& lhs, const Unsigned128& rhs) {
  if (lhs.lo != rhs.lo) {
    return true;
  }
  return lhs.hi != rhs.hi;
}
||||||
|
|
||||||
|
// Unsigned greater-than: the upper halves decide unless they are equal, in
// which case the lower halves decide.
inline bool operator>(const Unsigned128& lhs, const Unsigned128& rhs) {
  if (lhs.hi != rhs.hi) {
    return lhs.hi > rhs.hi;
  }
  return lhs.lo > rhs.lo;
}
||||||
|
|
||||||
|
// Unsigned less-than: the upper halves decide unless they are equal, in
// which case the lower halves decide.
inline bool operator<(const Unsigned128& lhs, const Unsigned128& rhs) {
  if (lhs.hi != rhs.hi) {
    return lhs.hi < rhs.hi;
  }
  return lhs.lo < rhs.lo;
}
||||||
|
|
||||||
|
// Unsigned greater-or-equal: the upper halves decide unless they are equal,
// in which case the lower halves decide.
inline bool operator>=(const Unsigned128& lhs, const Unsigned128& rhs) {
  if (lhs.hi != rhs.hi) {
    return lhs.hi > rhs.hi;
  }
  return lhs.lo >= rhs.lo;
}
||||||
|
|
||||||
|
// Unsigned less-or-equal: the upper halves decide unless they are equal, in
// which case the lower halves decide.
inline bool operator<=(const Unsigned128& lhs, const Unsigned128& rhs) {
  if (lhs.hi != rhs.hi) {
    return lhs.hi < rhs.hi;
  }
  return lhs.lo <= rhs.lo;
}
||||||
|
#endif |
||||||
|
|
||||||
|
// Returns the least-significant 64 bits of a 128-bit value.
inline uint64_t Lower64of128(Unsigned128 v) {
#ifndef HAVE_UINT128_EXTENSION
  // Fallback struct: the lower half is stored directly.
  return v.lo;
#else
  // Native 128-bit integer: truncation keeps the low 64 bits.
  return static_cast<uint64_t>(v);
#endif
}
||||||
|
|
||||||
|
// Returns the most-significant 64 bits of a 128-bit value.
inline uint64_t Upper64of128(Unsigned128 v) {
#ifndef HAVE_UINT128_EXTENSION
  // Fallback struct: the upper half is stored directly.
  return v.hi;
#else
  // Native 128-bit integer: move the high half down, then truncate.
  return static_cast<uint64_t>(v >> 64);
#endif
}
||||||
|
|
||||||
|
// This generally compiles down to a single fast instruction on 64-bit.
|
||||||
|
// This doesn't really make sense as operator* because it's not a
|
||||||
|
// general 128x128 multiply and provides more output than 64x64 multiply.
|
||||||
|
inline Unsigned128 Multiply64to128(uint64_t a, uint64_t b) { |
||||||
|
#ifdef HAVE_UINT128_EXTENSION |
||||||
|
return Unsigned128{a} * Unsigned128{b}; |
||||||
|
#else |
||||||
|
// Full decomposition
|
||||||
|
// NOTE: GCC seems to fully understand this code as 64-bit x 64-bit
|
||||||
|
// -> 128-bit multiplication and optimize it appropriately.
|
||||||
|
uint64_t tmp = uint64_t{b & 0xffffFFFF} * uint64_t{a & 0xffffFFFF}; |
||||||
|
uint64_t lower = tmp & 0xffffFFFF; |
||||||
|
tmp >>= 32; |
||||||
|
tmp += uint64_t{b & 0xffffFFFF} * uint64_t{a >> 32}; |
||||||
|
// Avoid overflow: first add lower 32 of tmp2, and later upper 32
|
||||||
|
uint64_t tmp2 = uint64_t{b >> 32} * uint64_t{a & 0xffffFFFF}; |
||||||
|
tmp += tmp2 & 0xffffFFFF; |
||||||
|
lower |= tmp << 32; |
||||||
|
tmp >>= 32; |
||||||
|
tmp += tmp2 >> 32; |
||||||
|
tmp += uint64_t{b >> 32} * uint64_t{a >> 32}; |
||||||
|
return Unsigned128(lower, tmp); |
||||||
|
#endif |
||||||
|
} |
||||||
|
|
||||||
|
template <> |
||||||
|
inline int FloorLog2(Unsigned128 v) { |
||||||
|
if (Upper64of128(v) == 0) { |
||||||
|
return FloorLog2(Lower64of128(v)); |
||||||
|
} else { |
||||||
|
return FloorLog2(Upper64of128(v)) + 64; |
||||||
|
} |
||||||
|
} |
||||||
|
|
||||||
|
template <> |
||||||
|
inline int CountTrailingZeroBits(Unsigned128 v) { |
||||||
|
if (Lower64of128(v) != 0) { |
||||||
|
return CountTrailingZeroBits(Lower64of128(v)); |
||||||
|
} else { |
||||||
|
return CountTrailingZeroBits(Upper64of128(v)) + 64; |
||||||
|
} |
||||||
|
} |
||||||
|
|
||||||
|
template <> |
||||||
|
inline int BitsSetToOne(Unsigned128 v) { |
||||||
|
return BitsSetToOne(Lower64of128(v)) + BitsSetToOne(Upper64of128(v)); |
||||||
|
} |
||||||
|
|
||||||
|
template <> |
||||||
|
inline int BitParity(Unsigned128 v) { |
||||||
|
return BitParity(Lower64of128(v)) ^ BitParity(Upper64of128(v)); |
||||||
|
} |
||||||
|
|
||||||
|
// Writes a 128-bit value into the 16 bytes at dst as two fixed 64-bit
// encodings: the lower half at dst, then the upper half at dst + 8.
inline void EncodeFixed128(char* dst, Unsigned128 value) {
  const uint64_t lower_half = Lower64of128(value);
  const uint64_t upper_half = Upper64of128(value);
  EncodeFixed64(dst, lower_half);
  EncodeFixed64(dst + 8, upper_half);
}
||||||
|
|
||||||
|
// Reads a 128-bit value from the 16 bytes at ptr: the lower half is decoded
// from ptr and the upper half from ptr + 8 (the layout EncodeFixed128
// writes).
inline Unsigned128 DecodeFixed128(const char* ptr) {
  const Unsigned128 lower_half = DecodeFixed64(ptr);
  const Unsigned128 upper_half = DecodeFixed64(ptr + 8);
  return (upper_half << 64) | lower_half;
}
||||||
|
|
||||||
|
} // namespace ROCKSDB_NAMESPACE
|
Loading…
Reference in new issue