db_stress: listners to implement all functions (#6197)

Summary:
Listners are one source of bugs because we frequently release some mutex to invoke them, which introduce race conditions. Implement all callback functions in db_stress's listener class, and randomly sleep.
Pull Request resolved: https://github.com/facebook/rocksdb/pull/6197

Test Plan: Run crash_test for a while and see no obvious problem.

Differential Revision: D19134015

fbshipit-source-id: b9ea8be9366e4501759119520cd4f204943538f6
main
sdong 5 years ago committed by Facebook Github Bot
parent 79cc8dc29b
commit 9d36c066c6
  1. 100
      db_stress_tool/db_stress_listener.h

@ -21,18 +21,29 @@ class DbStressListener : public EventListener {
db_paths_(db_paths), db_paths_(db_paths),
column_families_(column_families), column_families_(column_families),
num_pending_file_creations_(0) {} num_pending_file_creations_(0) {}
virtual ~DbStressListener() { assert(num_pending_file_creations_ == 0); }
#ifndef ROCKSDB_LITE #ifndef ROCKSDB_LITE
virtual void OnFlushCompleted(DB* /*db*/, const FlushJobInfo& info) override { ~DbStressListener() override { assert(num_pending_file_creations_ == 0); }
void OnFlushCompleted(DB* /*db*/, const FlushJobInfo& info) override {
assert(IsValidColumnFamilyName(info.cf_name)); assert(IsValidColumnFamilyName(info.cf_name));
VerifyFilePath(info.file_path); VerifyFilePath(info.file_path);
// pretending doing some work here // pretending doing some work here
std::this_thread::sleep_for( RandomSleep();
std::chrono::microseconds(Random::GetTLSInstance()->Uniform(5000))); }
void OnFlushBegin(DB* /*db*/,
const FlushJobInfo& /*flush_job_info*/) override {
RandomSleep();
}
void OnTableFileDeleted(const TableFileDeletionInfo& /*info*/) override {
RandomSleep();
}
void OnCompactionBegin(DB* /*db*/, const CompactionJobInfo& /*ci*/) override {
RandomSleep();
} }
virtual void OnCompactionCompleted(DB* /*db*/, void OnCompactionCompleted(DB* /*db*/, const CompactionJobInfo& ci) override {
const CompactionJobInfo& ci) override {
assert(IsValidColumnFamilyName(ci.cf_name)); assert(IsValidColumnFamilyName(ci.cf_name));
assert(ci.input_files.size() + ci.output_files.size() > 0U); assert(ci.input_files.size() + ci.output_files.size() > 0U);
for (const auto& file_path : ci.input_files) { for (const auto& file_path : ci.input_files) {
@ -42,15 +53,15 @@ class DbStressListener : public EventListener {
VerifyFilePath(file_path); VerifyFilePath(file_path);
} }
// pretending doing some work here // pretending doing some work here
std::this_thread::sleep_for( RandomSleep();
std::chrono::microseconds(Random::GetTLSInstance()->Uniform(5000)));
} }
virtual void OnTableFileCreationStarted( void OnTableFileCreationStarted(
const TableFileCreationBriefInfo& /*info*/) override { const TableFileCreationBriefInfo& /*info*/) override {
++num_pending_file_creations_; ++num_pending_file_creations_;
} }
virtual void OnTableFileCreated(const TableFileCreationInfo& info) override {
void OnTableFileCreated(const TableFileCreationInfo& info) override {
assert(info.db_name == db_name_); assert(info.db_name == db_name_);
assert(IsValidColumnFamilyName(info.cf_name)); assert(IsValidColumnFamilyName(info.cf_name));
if (info.file_size) { if (info.file_size) {
@ -66,6 +77,70 @@ class DbStressListener : public EventListener {
--num_pending_file_creations_; --num_pending_file_creations_;
} }
void OnMemTableSealed(const MemTableInfo& /*info*/) override {
RandomSleep();
}
void OnColumnFamilyHandleDeletionStarted(
ColumnFamilyHandle* /*handle*/) override {
RandomSleep();
}
void OnExternalFileIngested(
DB* /*db*/, const ExternalFileIngestionInfo& /*info*/) override {
RandomSleep();
}
void OnBackgroundError(BackgroundErrorReason /* reason */,
Status* /* bg_error */) override {
RandomSleep();
}
void OnStallConditionsChanged(const WriteStallInfo& /*info*/) override {
RandomSleep();
}
void OnFileReadFinish(const FileOperationInfo& info) override {
// Even empty callback is valuable because sometimes some locks are
// released in order to make the callback.
// Sleep carefully here as it is a frequent operation and we don't want
// to slow down the tests. We always sleep when the read is large.
// When read is small, sleep in a small chance.
size_t length_read = info.length;
if (length_read >= 1000000 || Random::GetTLSInstance()->OneIn(1000)) {
RandomSleep();
}
}
void OnFileWriteFinish(const FileOperationInfo& info) override {
// Even empty callback is valuable because sometimes some locks are
// released in order to make the callback.
// Sleep carefully here as it is a frequent operation and we don't want
// to slow down the tests. When the write is large, always sleep.
// Otherwise, sleep in a relatively small chance.
size_t length_write = info.length;
if (length_write >= 1000000 || Random::GetTLSInstance()->OneIn(64)) {
RandomSleep();
}
}
bool ShouldBeNotifiedOnFileIO() override {
RandomSleep();
return static_cast<bool>(Random::GetTLSInstance()->OneIn(1));
}
void OnErrorRecoveryBegin(BackgroundErrorReason /* reason */,
Status /* bg_error */,
bool* /* auto_recovery */) override {
RandomSleep();
}
void OnErrorRecoveryCompleted(Status /* old_bg_error */) override {
RandomSleep();
}
protected: protected:
bool IsValidColumnFamilyName(const std::string& cf_name) const { bool IsValidColumnFamilyName(const std::string& cf_name) const {
if (cf_name == kDefaultColumnFamilyName) { if (cf_name == kDefaultColumnFamilyName) {
@ -130,6 +205,11 @@ class DbStressListener : public EventListener {
(void)file_path; (void)file_path;
#endif // !NDEBUG #endif // !NDEBUG
} }
void RandomSleep() {
std::this_thread::sleep_for(
std::chrono::microseconds(Random::GetTLSInstance()->Uniform(5000)));
}
#endif // !ROCKSDB_LITE #endif // !ROCKSDB_LITE
private: private:

Loading…
Cancel
Save