Fixed GetEstimatedActiveKeys

Summary:
Fixed a bug in GetEstimatedActiveKeys which does not normalized
the sampled information correctly.

Add a test in version_builder_test.

Test Plan: version_builder_test

Reviewers: ljin, igor, sdong

Reviewed By: sdong

Subscribers: dhruba, leveldb

Differential Revision: https://reviews.facebook.net/D28707
main
Yueh-Hsuan Chiang 10 years ago
parent 1f621e6abc
commit 5811419357
  1. 92
      db/version_builder_test.cc
  2. 9
      db/version_set.cc

@ -14,31 +14,31 @@ namespace rocksdb {
class VersionBuilderTest { class VersionBuilderTest {
public: public:
const Comparator* ucmp; const Comparator* ucmp_;
InternalKeyComparator icmp; InternalKeyComparator icmp_;
Options options; Options options_;
ImmutableCFOptions ioptions; ImmutableCFOptions ioptions_;
MutableCFOptions mutable_cf_options; MutableCFOptions mutable_cf_options_;
VersionStorageInfo vstorage; VersionStorageInfo vstorage_;
uint32_t file_num; uint32_t file_num_;
CompactionOptionsFIFO fifo_options; CompactionOptionsFIFO fifo_options_;
std::vector<uint64_t> size_being_compacted; std::vector<uint64_t> size_being_compacted_;
VersionBuilderTest() VersionBuilderTest()
: ucmp(BytewiseComparator()), : ucmp_(BytewiseComparator()),
icmp(ucmp), icmp_(ucmp_),
ioptions(options), ioptions_(options_),
mutable_cf_options(options, ioptions), mutable_cf_options_(options_, ioptions_),
vstorage(&icmp, ucmp, options.num_levels, kCompactionStyleLevel, vstorage_(&icmp_, ucmp_, options_.num_levels, kCompactionStyleLevel,
nullptr), nullptr),
file_num(1) { file_num_(1) {
mutable_cf_options.RefreshDerivedOptions(ioptions); mutable_cf_options_.RefreshDerivedOptions(ioptions_);
size_being_compacted.resize(options.num_levels); size_being_compacted_.resize(options_.num_levels);
} }
~VersionBuilderTest() { ~VersionBuilderTest() {
for (int i = 0; i < vstorage.num_levels(); i++) { for (int i = 0; i < vstorage_.num_levels(); i++) {
for (auto* f : vstorage.LevelFiles(i)) { for (auto* f : vstorage_.LevelFiles(i)) {
if (--f->refs == 0) { if (--f->refs == 0) {
delete f; delete f;
} }
@ -54,25 +54,33 @@ class VersionBuilderTest {
void Add(int level, uint32_t file_number, const char* smallest, void Add(int level, uint32_t file_number, const char* smallest,
const char* largest, uint64_t file_size = 0, uint32_t path_id = 0, const char* largest, uint64_t file_size = 0, uint32_t path_id = 0,
SequenceNumber smallest_seq = 100, SequenceNumber smallest_seq = 100,
SequenceNumber largest_seq = 100) { SequenceNumber largest_seq = 100,
assert(level < vstorage.num_levels()); uint64_t num_entries = 0, uint64_t num_deletions = 0,
bool sampled = false) {
assert(level < vstorage_.num_levels());
FileMetaData* f = new FileMetaData; FileMetaData* f = new FileMetaData;
f->fd = FileDescriptor(file_number, path_id, file_size); f->fd = FileDescriptor(file_number, path_id, file_size);
f->smallest = GetInternalKey(smallest, smallest_seq); f->smallest = GetInternalKey(smallest, smallest_seq);
f->largest = GetInternalKey(largest, largest_seq); f->largest = GetInternalKey(largest, largest_seq);
f->compensated_file_size = file_size; f->compensated_file_size = file_size;
f->refs = 0; f->refs = 0;
vstorage.MaybeAddFile(level, f); f->num_entries = num_entries;
f->num_deletions = num_deletions;
vstorage_.MaybeAddFile(level, f);
if (sampled) {
f->init_stats_from_file = true;
vstorage_.UpdateAccumulatedStats(f);
}
} }
void UpdateVersionStorageInfo() { void UpdateVersionStorageInfo() {
vstorage.ComputeCompactionScore(mutable_cf_options, fifo_options, vstorage_.ComputeCompactionScore(mutable_cf_options_, fifo_options_,
size_being_compacted); size_being_compacted_);
vstorage.UpdateFilesBySize(); vstorage_.UpdateFilesBySize();
vstorage.UpdateNumNonEmptyLevels(); vstorage_.UpdateNumNonEmptyLevels();
vstorage.GenerateFileIndexer(); vstorage_.GenerateFileIndexer();
vstorage.GenerateLevelFilesBrief(); vstorage_.GenerateLevelFilesBrief();
vstorage.SetFinalized(); vstorage_.SetFinalized();
} }
}; };
@ -99,9 +107,9 @@ TEST(VersionBuilderTest, ApplyAndSaveTo) {
EnvOptions env_options; EnvOptions env_options;
VersionBuilder version_builder(env_options, nullptr, &vstorage); VersionBuilder version_builder(env_options, nullptr, &vstorage_);
VersionStorageInfo new_vstorage(&icmp, ucmp, options.num_levels, VersionStorageInfo new_vstorage(&icmp_, ucmp_, options_.num_levels,
kCompactionStyleLevel, nullptr); kCompactionStyleLevel, nullptr);
version_builder.Apply(&version_edit); version_builder.Apply(&version_edit);
version_builder.SaveTo(&new_vstorage); version_builder.SaveTo(&new_vstorage);
@ -118,6 +126,28 @@ TEST(VersionBuilderTest, ApplyAndSaveTo) {
} }
} }
TEST(VersionBuilderTest, EstimatedActiveKeys) {
const uint64_t kTotalSamples = 20;
const uint64_t kNumLevels = 5;
const uint64_t kFilesPerLevel = 8;
const uint64_t kNumFiles = kNumLevels * kFilesPerLevel;
const uint64_t kEntriesPerFile = 1000;
const uint64_t kDeletionsPerFile = 100;
for (uint64_t i = 0; i < kNumFiles; ++i) {
Add(i / kFilesPerLevel, i + 1,
std::to_string((i + 100) * 1000).c_str(),
std::to_string((i + 100) * 1000 + 999).c_str(),
100U, 0, 100, 100,
kEntriesPerFile, kDeletionsPerFile,
(i < kTotalSamples));
}
// minus 2X for the number of deletion entries because:
// 1x for deletion entry does not count as a data entry.
// 1x for each deletion entry will actually remove one data entry.
ASSERT_EQ(vstorage_.GetEstimatedActiveKeys(),
(kEntriesPerFile - 2 * kDeletionsPerFile) * kNumFiles);
}
} // namespace rocksdb } // namespace rocksdb
int main(int argc, char** argv) { return rocksdb::test::RunAllTests(); } int main(int argc, char** argv) { return rocksdb::test::RunAllTests(); }

@ -658,11 +658,16 @@ uint64_t VersionStorageInfo::GetEstimatedActiveKeys() const {
return 0; return 0;
} }
if (num_samples_ < files_->size()) { uint64_t file_count = 0;
for (int level = 0; level < num_levels_; ++level) {
file_count += files_[level].size();
}
if (num_samples_ < file_count) {
// casting to avoid overflowing // casting to avoid overflowing
return static_cast<uint64_t>(static_cast<double>( return static_cast<uint64_t>(static_cast<double>(
accumulated_num_non_deletions_ - accumulated_num_deletions_) * accumulated_num_non_deletions_ - accumulated_num_deletions_) *
files_->size() / num_samples_); static_cast<double>(file_count) / num_samples_);
} else { } else {
return accumulated_num_non_deletions_ - accumulated_num_deletions_; return accumulated_num_non_deletions_ - accumulated_num_deletions_;
} }

Loading…
Cancel
Save