DBIter to use static allocated char array for saved_key_ (if it is not too long)

Summary: DBIter now uses a std::string for saved_key. Based on some profiling, it could be more expensive than we though. Optimize it with the same technique as LookupKey -- if it is short, we copy it to a static allocated char. Otherwise, dynamically allocate memory for it.

Test Plan: make all check

Reviewers: haobo, ljin

Reviewed By: haobo

CC: dhruba, igor, yhchiang, leveldb

Differential Revision: https://reviews.facebook.net/D17289
main
sdong 11 years ago
parent 807b2c2e02
commit e0a87c4cf1
  1. 119
      db/db_iter.cc
  2. 38
      db/db_test.cc
  3. 2
      db/dbformat.cc
  4. 2
      db/dbformat.h

@ -39,6 +39,71 @@ static void DumpInternalIter(Iterator* iter) {
namespace { namespace {
class IterLookupKey {
public:
IterLookupKey() : key_(space_), buf_size_(sizeof(space_)), key_size_(0) {}
~IterLookupKey() { Clear(); }
Slice GetKey() const {
if (key_ != nullptr) {
return Slice(key_, key_size_);
} else {
return Slice();
}
}
bool Valid() const { return key_ != nullptr; }
void Clear() {
if (key_ != nullptr && key_ != space_) {
delete[] key_;
}
key_ = space_;
buf_size_ = sizeof(buf_size_);
}
// Enlarge the buffer size if needed based on key_size.
// By default, static allocated buffer is used. Once there is a key
// larger than the static allocated buffer, another buffer is dynamically
// allocated, until a larger key buffer is requested. In that case, we
// reallocate buffer and delete the old one.
void EnlargeBufferIfNeeded(size_t key_size) {
// If size is smaller than buffer size, continue using current buffer,
// or the static allocated one, as default
if (key_size > buf_size_) {
// Need to enlarge the buffer.
Clear();
key_ = new char[key_size];
buf_size_ = key_size;
}
key_size_ = key_size;
}
void SetUserKey(const Slice& user_key) {
size_t size = user_key.size();
EnlargeBufferIfNeeded(size);
memcpy(key_, user_key.data(), size);
}
void SetInternalKey(const Slice& user_key, SequenceNumber s) {
size_t usize = user_key.size();
EnlargeBufferIfNeeded(usize + sizeof(uint64_t));
memcpy(key_, user_key.data(), usize);
EncodeFixed64(key_ + usize, PackSequenceAndType(s, kValueTypeForSeek));
}
private:
char* key_;
size_t buf_size_;
size_t key_size_;
char space_[32]; // Avoid allocation for short keys
// No copying allowed
IterLookupKey(const IterLookupKey&) = delete;
void operator=(const LookupKey&) = delete;
};
// Memtables and sstables that make the DB representation contain // Memtables and sstables that make the DB representation contain
// (userkey,seq,type) => uservalue entries. DBIter // (userkey,seq,type) => uservalue entries. DBIter
// combines multiple entries for the same userkey found in the DB // combines multiple entries for the same userkey found in the DB
@ -80,7 +145,7 @@ class DBIter: public Iterator {
virtual bool Valid() const { return valid_; } virtual bool Valid() const { return valid_; }
virtual Slice key() const { virtual Slice key() const {
assert(valid_); assert(valid_);
return saved_key_; return saved_key_.GetKey();
} }
virtual Slice value() const { virtual Slice value() const {
assert(valid_); assert(valid_);
@ -108,10 +173,6 @@ class DBIter: public Iterator {
bool ParseKey(ParsedInternalKey* key); bool ParseKey(ParsedInternalKey* key);
void MergeValuesNewToOld(); void MergeValuesNewToOld();
inline void SaveKey(const Slice& k, std::string* dst) {
dst->assign(k.data(), k.size());
}
inline void ClearSavedValue() { inline void ClearSavedValue() {
if (saved_value_.capacity() > 1048576) { if (saved_value_.capacity() > 1048576) {
std::string empty; std::string empty;
@ -130,7 +191,7 @@ class DBIter: public Iterator {
SequenceNumber const sequence_; SequenceNumber const sequence_;
Status status_; Status status_;
std::string saved_key_; // == current key when direction_==kReverse IterLookupKey saved_key_; // == current key when direction_==kReverse
std::string saved_value_; // == current raw value when direction_==kReverse std::string saved_value_; // == current raw value when direction_==kReverse
std::string skip_key_; std::string skip_key_;
Direction direction_; Direction direction_;
@ -170,7 +231,7 @@ void DBIter::Next() {
} }
if (!iter_->Valid()) { if (!iter_->Valid()) {
valid_ = false; valid_ = false;
saved_key_.clear(); saved_key_.Clear();
return; return;
} }
} }
@ -210,7 +271,7 @@ void DBIter::FindNextUserEntryInternal(bool skipping) {
ParsedInternalKey ikey; ParsedInternalKey ikey;
if (ParseKey(&ikey) && ikey.sequence <= sequence_) { if (ParseKey(&ikey) && ikey.sequence <= sequence_) {
if (skipping && if (skipping &&
user_comparator_->Compare(ikey.user_key, saved_key_) <= 0) { user_comparator_->Compare(ikey.user_key, saved_key_.GetKey()) <= 0) {
num_skipped++; // skip this entry num_skipped++; // skip this entry
BumpPerfCount(&perf_context.internal_key_skipped_count); BumpPerfCount(&perf_context.internal_key_skipped_count);
} else { } else {
@ -219,18 +280,18 @@ void DBIter::FindNextUserEntryInternal(bool skipping) {
case kTypeDeletion: case kTypeDeletion:
// Arrange to skip all upcoming entries for this key since // Arrange to skip all upcoming entries for this key since
// they are hidden by this deletion. // they are hidden by this deletion.
SaveKey(ikey.user_key, &saved_key_); saved_key_.SetUserKey(ikey.user_key);
skipping = true; skipping = true;
num_skipped = 0; num_skipped = 0;
BumpPerfCount(&perf_context.internal_delete_skipped_count); BumpPerfCount(&perf_context.internal_delete_skipped_count);
break; break;
case kTypeValue: case kTypeValue:
valid_ = true; valid_ = true;
SaveKey(ikey.user_key, &saved_key_); saved_key_.SetUserKey(ikey.user_key);
return; return;
case kTypeMerge: case kTypeMerge:
// By now, we are sure the current ikey is going to yield a value // By now, we are sure the current ikey is going to yield a value
SaveKey(ikey.user_key, &saved_key_); saved_key_.SetUserKey(ikey.user_key);
current_entry_is_merged_ = true; current_entry_is_merged_ = true;
valid_ = true; valid_ = true;
MergeValuesNewToOld(); // Go to a different state machine MergeValuesNewToOld(); // Go to a different state machine
@ -248,8 +309,8 @@ void DBIter::FindNextUserEntryInternal(bool skipping) {
if (skipping && num_skipped > max_skip_) { if (skipping && num_skipped > max_skip_) {
num_skipped = 0; num_skipped = 0;
std::string last_key; std::string last_key;
AppendInternalKey(&last_key, AppendInternalKey(&last_key, ParsedInternalKey(saved_key_.GetKey(), 0,
ParsedInternalKey(Slice(saved_key_), 0, kValueTypeForSeek)); kValueTypeForSeek));
iter_->Seek(last_key); iter_->Seek(last_key);
RecordTick(statistics_, NUMBER_OF_RESEEKS_IN_ITERATION); RecordTick(statistics_, NUMBER_OF_RESEEKS_IN_ITERATION);
} else { } else {
@ -284,7 +345,7 @@ void DBIter::MergeValuesNewToOld() {
continue; continue;
} }
if (user_comparator_->Compare(ikey.user_key, saved_key_) != 0) { if (user_comparator_->Compare(ikey.user_key, saved_key_.GetKey()) != 0) {
// hit the next user key, stop right here // hit the next user key, stop right here
break; break;
} }
@ -320,7 +381,7 @@ void DBIter::MergeValuesNewToOld() {
// a deletion marker. // a deletion marker.
// feed null as the existing value to the merge operator, such that // feed null as the existing value to the merge operator, such that
// client can differentiate this scenario and do things accordingly. // client can differentiate this scenario and do things accordingly.
user_merge_operator_->FullMerge(saved_key_, nullptr, operands, user_merge_operator_->FullMerge(saved_key_.GetKey(), nullptr, operands,
&saved_value_, logger_); &saved_value_, logger_);
} }
@ -339,17 +400,17 @@ void DBIter::Prev() {
// iter_ is pointing at the current entry. Scan backwards until // iter_ is pointing at the current entry. Scan backwards until
// the key changes so we can use the normal reverse scanning code. // the key changes so we can use the normal reverse scanning code.
assert(iter_->Valid()); // Otherwise valid_ would have been false assert(iter_->Valid()); // Otherwise valid_ would have been false
SaveKey(ExtractUserKey(iter_->key()), &saved_key_); saved_key_.SetUserKey(ExtractUserKey(iter_->key()));
while (true) { while (true) {
iter_->Prev(); iter_->Prev();
if (!iter_->Valid()) { if (!iter_->Valid()) {
valid_ = false; valid_ = false;
saved_key_.clear(); saved_key_.Clear();
ClearSavedValue(); ClearSavedValue();
return; return;
} }
if (user_comparator_->Compare(ExtractUserKey(iter_->key()), if (user_comparator_->Compare(ExtractUserKey(iter_->key()),
saved_key_) < 0) { saved_key_.GetKey()) < 0) {
break; break;
} }
} }
@ -370,13 +431,13 @@ void DBIter::FindPrevUserEntry() {
ParsedInternalKey ikey; ParsedInternalKey ikey;
if (ParseKey(&ikey) && ikey.sequence <= sequence_) { if (ParseKey(&ikey) && ikey.sequence <= sequence_) {
if ((value_type != kTypeDeletion) && if ((value_type != kTypeDeletion) &&
user_comparator_->Compare(ikey.user_key, saved_key_) < 0) { user_comparator_->Compare(ikey.user_key, saved_key_.GetKey()) < 0) {
// We encountered a non-deleted value in entries for previous keys, // We encountered a non-deleted value in entries for previous keys,
break; break;
} }
value_type = ikey.type; value_type = ikey.type;
if (value_type == kTypeDeletion) { if (value_type == kTypeDeletion) {
saved_key_.clear(); saved_key_.Clear();
ClearSavedValue(); ClearSavedValue();
saved_key_valid = false; saved_key_valid = false;
} else { } else {
@ -385,7 +446,7 @@ void DBIter::FindPrevUserEntry() {
std::string empty; std::string empty;
swap(empty, saved_value_); swap(empty, saved_value_);
} }
SaveKey(ExtractUserKey(iter_->key()), &saved_key_); saved_key_.SetUserKey(ExtractUserKey(iter_->key()));
saved_value_.assign(raw_value.data(), raw_value.size()); saved_value_.assign(raw_value.data(), raw_value.size());
} }
} else { } else {
@ -401,9 +462,9 @@ void DBIter::FindPrevUserEntry() {
if (saved_key_valid && num_skipped > max_skip_) { if (saved_key_valid && num_skipped > max_skip_) {
num_skipped = 0; num_skipped = 0;
std::string last_key; std::string last_key;
AppendInternalKey(&last_key, AppendInternalKey(&last_key, ParsedInternalKey(saved_key_.GetKey(),
ParsedInternalKey(Slice(saved_key_), kMaxSequenceNumber, kMaxSequenceNumber,
kValueTypeForSeek)); kValueTypeForSeek));
iter_->Seek(last_key); iter_->Seek(last_key);
RecordTick(statistics_, NUMBER_OF_RESEEKS_IN_ITERATION); RecordTick(statistics_, NUMBER_OF_RESEEKS_IN_ITERATION);
} else { } else {
@ -415,7 +476,7 @@ void DBIter::FindPrevUserEntry() {
if (value_type == kTypeDeletion) { if (value_type == kTypeDeletion) {
// End // End
valid_ = false; valid_ = false;
saved_key_.clear(); saved_key_.Clear();
ClearSavedValue(); ClearSavedValue();
direction_ = kForward; direction_ = kForward;
} else { } else {
@ -424,12 +485,12 @@ void DBIter::FindPrevUserEntry() {
} }
void DBIter::Seek(const Slice& target) { void DBIter::Seek(const Slice& target) {
saved_key_.clear(); saved_key_.Clear();
AppendInternalKey( // now savved_key is used to store internal key.
&saved_key_, ParsedInternalKey(target, sequence_, kValueTypeForSeek)); saved_key_.SetInternalKey(target, sequence_);
StopWatchNano internal_seek_timer(env_, false); StopWatchNano internal_seek_timer(env_, false);
StartPerfTimer(&internal_seek_timer); StartPerfTimer(&internal_seek_timer);
iter_->Seek(saved_key_); iter_->Seek(saved_key_.GetKey());
BumpPerfTime(&perf_context.seek_internal_seek_time, &internal_seek_timer); BumpPerfTime(&perf_context.seek_internal_seek_time, &internal_seek_timer);
if (iter_->Valid()) { if (iter_->Valid()) {
direction_ = kForward; direction_ = kForward;

@ -1372,6 +1372,44 @@ TEST(DBTest, IterSeekBeforePrev) {
delete iter; delete iter;
} }
std::string MakeLongKey(size_t length, char c) {
return std::string(length, c);
}
TEST(DBTest, IterLongKeys) {
ASSERT_OK(Put(MakeLongKey(20, 0), "0"));
ASSERT_OK(Put(MakeLongKey(32, 2), "2"));
ASSERT_OK(Put("a", "b"));
dbfull()->Flush(FlushOptions());
ASSERT_OK(Put(MakeLongKey(50, 1), "1"));
ASSERT_OK(Put(MakeLongKey(127, 3), "3"));
ASSERT_OK(Put(MakeLongKey(64, 4), "4"));
auto iter = db_->NewIterator(ReadOptions());
// Create a key that needs to be skipped for Seq too new
iter->Seek(MakeLongKey(20, 0));
ASSERT_EQ(IterStatus(iter), MakeLongKey(20, 0) + "->0");
iter->Next();
ASSERT_EQ(IterStatus(iter), MakeLongKey(50, 1) + "->1");
iter->Next();
ASSERT_EQ(IterStatus(iter), MakeLongKey(32, 2) + "->2");
iter->Next();
ASSERT_EQ(IterStatus(iter), MakeLongKey(127, 3) + "->3");
iter->Next();
ASSERT_EQ(IterStatus(iter), MakeLongKey(64, 4) + "->4");
delete iter;
iter = db_->NewIterator(ReadOptions());
iter->Seek(MakeLongKey(50, 1));
ASSERT_EQ(IterStatus(iter), MakeLongKey(50, 1) + "->1");
iter->Next();
ASSERT_EQ(IterStatus(iter), MakeLongKey(32, 2) + "->2");
iter->Next();
ASSERT_EQ(IterStatus(iter), MakeLongKey(127, 3) + "->3");
delete iter;
}
TEST(DBTest, IterNextWithNewerSeq) { TEST(DBTest, IterNextWithNewerSeq) {
ASSERT_OK(Put("0", "0")); ASSERT_OK(Put("0", "0"));
dbfull()->Flush(FlushOptions()); dbfull()->Flush(FlushOptions());

@ -15,7 +15,7 @@
namespace rocksdb { namespace rocksdb {
static uint64_t PackSequenceAndType(uint64_t seq, ValueType t) { uint64_t PackSequenceAndType(uint64_t seq, ValueType t) {
assert(seq <= kMaxSequenceNumber); assert(seq <= kMaxSequenceNumber);
assert(t <= kValueTypeForSeek); assert(t <= kValueTypeForSeek);
return (seq << 8) | t; return (seq << 8) | t;

@ -64,6 +64,8 @@ inline size_t InternalKeyEncodingLength(const ParsedInternalKey& key) {
return key.user_key.size() + 8; return key.user_key.size() + 8;
} }
extern uint64_t PackSequenceAndType(uint64_t seq, ValueType t);
// Append the serialization of "key" to *result. // Append the serialization of "key" to *result.
extern void AppendInternalKey(std::string* result, extern void AppendInternalKey(std::string* result,
const ParsedInternalKey& key); const ParsedInternalKey& key);

Loading…
Cancel
Save