New bit manipulation functions and 128-bit value library (#7338)
Summary: These new functions and 128-bit value bit operations are expected to be used in a forthcoming Bloom filter alternative. No functional changes to production code, just new code only called by unit tests, cosmetic changes to existing headers, and fix an existing function for a yet-unused template instantiation (BitsSetToOne on something signed and smaller than 32 bits). Pull Request resolved: https://github.com/facebook/rocksdb/pull/7338 Test Plan: Unit tests included. Works with and without TEST_UINT128_COMPAT=1 to check compatibility with and without __uint128_t. Also added that parameter to the CircleCI build build-linux-shared_lib-alt_namespace-status_checked. Reviewed By: jay-zhuang Differential Revision: D23494945 Pulled By: pdillinger fbshipit-source-id: 5c0dc419100d9df5d4d9abb153b2855d5aea39e8main
parent
a09c3cf13e
commit
c4d8838a2b
@ -0,0 +1,223 @@ |
||||
// Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved.
|
||||
// This source code is licensed under both the GPLv2 (found in the
|
||||
// COPYING file in the root directory) and Apache 2.0 License
|
||||
// (found in the LICENSE.Apache file in the root directory).
|
||||
|
||||
#pragma once |
||||
|
||||
#include "util/coding.h" |
||||
#include "util/math.h" |
||||
|
||||
#ifdef TEST_UINT128_COMPAT |
||||
#undef HAVE_UINT128_EXTENSION |
||||
#endif |
||||
|
||||
namespace ROCKSDB_NAMESPACE { |
||||
|
||||
// Unsigned128 is a 128 bit value supporting (at least) bitwise operators,
|
||||
// shifts, and comparisons. __uint128_t is not always available.
|
||||
|
||||
#ifdef HAVE_UINT128_EXTENSION |
||||
using Unsigned128 = __uint128_t; |
||||
#else |
||||
struct Unsigned128 { |
||||
uint64_t lo; |
||||
uint64_t hi; |
||||
|
||||
inline Unsigned128() { |
||||
static_assert(sizeof(Unsigned128) == 2 * sizeof(uint64_t), |
||||
"unexpected overhead in representation"); |
||||
lo = 0; |
||||
hi = 0; |
||||
} |
||||
|
||||
inline Unsigned128(uint64_t lower) { |
||||
lo = lower; |
||||
hi = 0; |
||||
} |
||||
|
||||
inline Unsigned128(uint64_t lower, uint64_t upper) { |
||||
lo = lower; |
||||
hi = upper; |
||||
} |
||||
}; |
||||
|
||||
inline Unsigned128 operator<<(const Unsigned128& lhs, unsigned shift) { |
||||
shift &= 127; |
||||
Unsigned128 rv; |
||||
if (shift >= 64) { |
||||
rv.lo = 0; |
||||
rv.hi = lhs.lo << (shift & 63); |
||||
} else { |
||||
uint64_t tmp = lhs.lo; |
||||
rv.lo = tmp << shift; |
||||
// Ensure shift==0 shifts away everything. (This avoids another
|
||||
// conditional branch on shift == 0.)
|
||||
tmp = tmp >> 1 >> (63 - shift); |
||||
rv.hi = tmp | (lhs.hi << shift); |
||||
} |
||||
return rv; |
||||
} |
||||
|
||||
inline Unsigned128& operator<<=(Unsigned128& lhs, unsigned shift) { |
||||
lhs = lhs << shift; |
||||
return lhs; |
||||
} |
||||
|
||||
inline Unsigned128 operator>>(const Unsigned128& lhs, unsigned shift) { |
||||
shift &= 127; |
||||
Unsigned128 rv; |
||||
if (shift >= 64) { |
||||
rv.hi = 0; |
||||
rv.lo = lhs.hi >> (shift & 63); |
||||
} else { |
||||
uint64_t tmp = lhs.hi; |
||||
rv.hi = tmp >> shift; |
||||
// Ensure shift==0 shifts away everything
|
||||
tmp = tmp << 1 << (63 - shift); |
||||
rv.lo = tmp | (lhs.lo >> shift); |
||||
} |
||||
return rv; |
||||
} |
||||
|
||||
inline Unsigned128& operator>>=(Unsigned128& lhs, unsigned shift) { |
||||
lhs = lhs >> shift; |
||||
return lhs; |
||||
} |
||||
|
||||
inline Unsigned128 operator&(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return Unsigned128(lhs.lo & rhs.lo, lhs.hi & rhs.hi); |
||||
} |
||||
|
||||
inline Unsigned128& operator&=(Unsigned128& lhs, const Unsigned128& rhs) { |
||||
lhs = lhs & rhs; |
||||
return lhs; |
||||
} |
||||
|
||||
inline Unsigned128 operator|(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return Unsigned128(lhs.lo | rhs.lo, lhs.hi | rhs.hi); |
||||
} |
||||
|
||||
inline Unsigned128& operator|=(Unsigned128& lhs, const Unsigned128& rhs) { |
||||
lhs = lhs | rhs; |
||||
return lhs; |
||||
} |
||||
|
||||
inline Unsigned128 operator^(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return Unsigned128(lhs.lo ^ rhs.lo, lhs.hi ^ rhs.hi); |
||||
} |
||||
|
||||
inline Unsigned128& operator^=(Unsigned128& lhs, const Unsigned128& rhs) { |
||||
lhs = lhs ^ rhs; |
||||
return lhs; |
||||
} |
||||
|
||||
inline Unsigned128 operator~(const Unsigned128& v) { |
||||
return Unsigned128(~v.lo, ~v.hi); |
||||
} |
||||
|
||||
inline bool operator==(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return lhs.lo == rhs.lo && lhs.hi == rhs.hi; |
||||
} |
||||
|
||||
inline bool operator!=(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return lhs.lo != rhs.lo || lhs.hi != rhs.hi; |
||||
} |
||||
|
||||
inline bool operator>(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return lhs.hi > rhs.hi || (lhs.hi == rhs.hi && lhs.lo > rhs.lo); |
||||
} |
||||
|
||||
inline bool operator<(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return lhs.hi < rhs.hi || (lhs.hi == rhs.hi && lhs.lo < rhs.lo); |
||||
} |
||||
|
||||
inline bool operator>=(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return lhs.hi > rhs.hi || (lhs.hi == rhs.hi && lhs.lo >= rhs.lo); |
||||
} |
||||
|
||||
inline bool operator<=(const Unsigned128& lhs, const Unsigned128& rhs) { |
||||
return lhs.hi < rhs.hi || (lhs.hi == rhs.hi && lhs.lo <= rhs.lo); |
||||
} |
||||
#endif |
||||
|
||||
inline uint64_t Lower64of128(Unsigned128 v) { |
||||
#ifdef HAVE_UINT128_EXTENSION |
||||
return static_cast<uint64_t>(v); |
||||
#else |
||||
return v.lo; |
||||
#endif |
||||
} |
||||
|
||||
inline uint64_t Upper64of128(Unsigned128 v) { |
||||
#ifdef HAVE_UINT128_EXTENSION |
||||
return static_cast<uint64_t>(v >> 64); |
||||
#else |
||||
return v.hi; |
||||
#endif |
||||
} |
||||
|
||||
// This generally compiles down to a single fast instruction on 64-bit.
|
||||
// This doesn't really make sense as operator* because it's not a
|
||||
// general 128x128 multiply and provides more output than 64x64 multiply.
|
||||
inline Unsigned128 Multiply64to128(uint64_t a, uint64_t b) { |
||||
#ifdef HAVE_UINT128_EXTENSION |
||||
return Unsigned128{a} * Unsigned128{b}; |
||||
#else |
||||
// Full decomposition
|
||||
// NOTE: GCC seems to fully understand this code as 64-bit x 64-bit
|
||||
// -> 128-bit multiplication and optimize it appropriately.
|
||||
uint64_t tmp = uint64_t{b & 0xffffFFFF} * uint64_t{a & 0xffffFFFF}; |
||||
uint64_t lower = tmp & 0xffffFFFF; |
||||
tmp >>= 32; |
||||
tmp += uint64_t{b & 0xffffFFFF} * uint64_t{a >> 32}; |
||||
// Avoid overflow: first add lower 32 of tmp2, and later upper 32
|
||||
uint64_t tmp2 = uint64_t{b >> 32} * uint64_t{a & 0xffffFFFF}; |
||||
tmp += tmp2 & 0xffffFFFF; |
||||
lower |= tmp << 32; |
||||
tmp >>= 32; |
||||
tmp += tmp2 >> 32; |
||||
tmp += uint64_t{b >> 32} * uint64_t{a >> 32}; |
||||
return Unsigned128(lower, tmp); |
||||
#endif |
||||
} |
||||
|
||||
template <> |
||||
inline int FloorLog2(Unsigned128 v) { |
||||
if (Upper64of128(v) == 0) { |
||||
return FloorLog2(Lower64of128(v)); |
||||
} else { |
||||
return FloorLog2(Upper64of128(v)) + 64; |
||||
} |
||||
} |
||||
|
||||
template <> |
||||
inline int CountTrailingZeroBits(Unsigned128 v) { |
||||
if (Lower64of128(v) != 0) { |
||||
return CountTrailingZeroBits(Lower64of128(v)); |
||||
} else { |
||||
return CountTrailingZeroBits(Upper64of128(v)) + 64; |
||||
} |
||||
} |
||||
|
||||
template <> |
||||
inline int BitsSetToOne(Unsigned128 v) { |
||||
return BitsSetToOne(Lower64of128(v)) + BitsSetToOne(Upper64of128(v)); |
||||
} |
||||
|
||||
template <> |
||||
inline int BitParity(Unsigned128 v) { |
||||
return BitParity(Lower64of128(v)) ^ BitParity(Upper64of128(v)); |
||||
} |
||||
|
||||
inline void EncodeFixed128(char* dst, Unsigned128 value) { |
||||
EncodeFixed64(dst, Lower64of128(value)); |
||||
EncodeFixed64(dst + 8, Upper64of128(value)); |
||||
} |
||||
|
||||
inline Unsigned128 DecodeFixed128(const char* ptr) { |
||||
Unsigned128 rv = DecodeFixed64(ptr + 8); |
||||
return (rv << 64) | DecodeFixed64(ptr); |
||||
} |
||||
|
||||
} // namespace ROCKSDB_NAMESPACE
|
Loading…
Reference in new issue