Optimize MayContainHash()

Summary:
In latest leaf's, MayContainHash() consistently consumes 5%~7% CPU usage.

I checked the code and did an experiment with/without inlining this method.

In release mode, with `1024 * 1024 * 256` bits and `1024 * 512` entries, both call 2^30 MayContainHash() with distinctive parameters.

As the result showed, this patch reduced the running time from 9.127 sec to 7.891 sec.

Test Plan: make check

Reviewers: sdong, haobo

CC: leveldb

Differential Revision: https://reviews.facebook.net/D15177
This commit is contained in:
Kai Liu 2014-01-14 21:30:13 -08:00
parent 9ea8bf90f1
commit cd535c2280
2 changed files with 35 additions and 45 deletions

View File

@ -20,50 +20,17 @@ DynamicBloom::DynamicBloom(uint32_t total_bits,
uint32_t (*hash_func)(const Slice& key), uint32_t (*hash_func)(const Slice& key),
uint32_t num_probes) uint32_t num_probes)
: hash_func_(hash_func), : hash_func_(hash_func),
total_bits_((total_bits + 7) / 8 * 8), kTotalBits((total_bits + 7) / 8 * 8),
num_probes_(num_probes) { kNumProbes(num_probes) {
assert(hash_func_); assert(hash_func_);
assert(num_probes_ > 0); assert(kNumProbes > 0);
assert(total_bits_ > 0); assert(kTotalBits > 0);
data_.reset(new unsigned char[total_bits_ / 8]()); data_.reset(new unsigned char[kTotalBits / 8]());
} }
DynamicBloom::DynamicBloom(uint32_t total_bits, DynamicBloom::DynamicBloom(uint32_t total_bits,
uint32_t num_probes) uint32_t num_probes)
: hash_func_(&BloomHash), : DynamicBloom(total_bits, &BloomHash, num_probes) {
total_bits_((total_bits + 7) / 8 * 8),
num_probes_(num_probes) {
assert(num_probes_ > 0);
assert(total_bits_ > 0);
data_.reset(new unsigned char[total_bits_ / 8]());
} }
void DynamicBloom::Add(const Slice& key) { } // rocksdb
AddHash(hash_func_(key));
}
void DynamicBloom::AddHash(uint32_t h) {
const uint32_t delta = (h >> 17) | (h << 15); // Rotate right 17 bits
for (uint32_t i = 0; i < num_probes_; i++) {
const uint32_t bitpos = h % total_bits_;
data_[bitpos/8] |= (1 << (bitpos % 8));
h += delta;
}
}
bool DynamicBloom::MayContain(const Slice& key) {
return (MayContainHash(hash_func_(key)));
}
bool DynamicBloom::MayContainHash(uint32_t h) {
const uint32_t delta = (h >> 17) | (h << 15); // Rotate right 17 bits
for (uint32_t i = 0; i < num_probes_; i++) {
const uint32_t bitpos = h % total_bits_;
if ((data_[bitpos/8] & (1 << (bitpos % 8)))
== 0) return false;
h += delta;
}
return true;
}
}

View File

@ -13,9 +13,7 @@ namespace rocksdb {
class Slice; class Slice;
class DynamicBloom { class DynamicBloom {
public: public:
// total_bits: fixed total bits for the bloom // total_bits: fixed total bits for the bloom
// hash_func: customized hash function // hash_func: customized hash function
// num_probes: number of hash probes for a single key // num_probes: number of hash probes for a single key
@ -26,7 +24,7 @@ class DynamicBloom {
explicit DynamicBloom(uint32_t total_bits, uint32_t num_probes = 6); explicit DynamicBloom(uint32_t total_bits, uint32_t num_probes = 6);
// Assuming single threaded access to Add // Assuming single threaded access to Add
void Add(const Slice& key); void Add(const Slice& key) { AddHash(hash_func_(key)); }
// Assuming single threaded access to Add // Assuming single threaded access to Add
void AddHash(uint32_t hash); void AddHash(uint32_t hash);
@ -39,9 +37,34 @@ class DynamicBloom {
private: private:
uint32_t (*hash_func_)(const Slice& key); uint32_t (*hash_func_)(const Slice& key);
uint32_t total_bits_; const uint32_t kTotalBits;
uint32_t num_probes_; const uint32_t kNumProbes;
std::unique_ptr<unsigned char[]> data_; std::unique_ptr<unsigned char[]> data_;
}; };
inline bool DynamicBloom::MayContain(const Slice& key) {
return (MayContainHash(hash_func_(key)));
} }
inline bool DynamicBloom::MayContainHash(uint32_t h) {
const uint32_t delta = (h >> 17) | (h << 15); // Rotate right 17 bits
for (uint32_t i = 0; i < kNumProbes; i++) {
const uint32_t bitpos = h % kTotalBits;
if (((data_[bitpos / 8]) & (1 << (bitpos % 8))) == 0) {
return false;
}
h += delta;
}
return true;
}
inline void DynamicBloom::AddHash(uint32_t h) {
const uint32_t delta = (h >> 17) | (h << 15); // Rotate right 17 bits
for (uint32_t i = 0; i < kNumProbes; i++) {
const uint32_t bitpos = h % kTotalBits;
data_[bitpos / 8] |= (1 << (bitpos % 8));
h += delta;
}
}
} // rocksdb