Fix the potential deadlock in WriteImplWALOnly and UnorderedWriteMemtable (#7199)

Summary:
Pointed out by https://github.com/facebook/rocksdb/issues/7197 , there is a double lock in WriteImplWALOnly.
Also find another deadlock in UnorderedWriteMemtable. Move the check after switch_all_.notify_all().

Pull Request resolved: https://github.com/facebook/rocksdb/pull/7199

Test Plan: pass make check

Reviewed By: anand1976

Differential Revision: D22961714

Pulled By: zhichao-cao

fbshipit-source-id: 0707922dc50d28ea141a15a8cdcbd1c8993ea0d8
main
Zhichao Cao 4 years ago committed by Facebook GitHub Bot
parent 56f468b356
commit b79f13b2aa
  1. 4
      db/db_impl/db_impl.h
  2. 16
      db/db_impl/db_impl_write.cc

@ -1554,6 +1554,10 @@ class DBImpl : public DB {
uint64_t* log_used, uint64_t* log_used,
SequenceNumber* last_sequence, size_t seq_inc); SequenceNumber* last_sequence, size_t seq_inc);
// Used by WriteImpl to update bg_error_ if paranoid check is enabled.
// Caller must hold mutex_.
void WriteStatusCheckOnLocked(const Status& status);
// Used by WriteImpl to update bg_error_ if paranoid check is enabled. // Used by WriteImpl to update bg_error_ if paranoid check is enabled.
void WriteStatusCheck(const Status& status); void WriteStatusCheck(const Status& status);

@ -623,8 +623,6 @@ Status DBImpl::UnorderedWriteMemtable(const WriteOptions& write_options,
0 /*log_number*/, this, true /*concurrent_memtable_writes*/, 0 /*log_number*/, this, true /*concurrent_memtable_writes*/,
seq_per_batch_, sub_batch_cnt, true /*batch_per_txn*/, seq_per_batch_, sub_batch_cnt, true /*batch_per_txn*/,
write_options.memtable_insert_hint_per_batch); write_options.memtable_insert_hint_per_batch);
WriteStatusCheck(w.status);
if (write_options.disableWAL) { if (write_options.disableWAL) {
has_unpersisted_data_.store(true, std::memory_order_relaxed); has_unpersisted_data_.store(true, std::memory_order_relaxed);
} }
@ -639,6 +637,7 @@ Status DBImpl::UnorderedWriteMemtable(const WriteOptions& write_options,
std::lock_guard<std::mutex> lck(switch_mutex_); std::lock_guard<std::mutex> lck(switch_mutex_);
switch_cv_.notify_all(); switch_cv_.notify_all();
} }
WriteStatusCheck(w.status);
if (!w.FinalStatus().ok()) { if (!w.FinalStatus().ok()) {
return w.FinalStatus(); return w.FinalStatus();
@ -689,7 +688,7 @@ Status DBImpl::WriteImplWALOnly(
InstrumentedMutexLock l(&mutex_); InstrumentedMutexLock l(&mutex_);
bool need_log_sync = false; bool need_log_sync = false;
status = PreprocessWrite(write_options, &need_log_sync, &write_context); status = PreprocessWrite(write_options, &need_log_sync, &write_context);
WriteStatusCheck(status); WriteStatusCheckOnLocked(status);
} }
if (!status.ok()) { if (!status.ok()) {
WriteThread::WriteGroup write_group; WriteThread::WriteGroup write_group;
@ -830,6 +829,17 @@ Status DBImpl::WriteImplWALOnly(
return status; return status;
} }
void DBImpl::WriteStatusCheckOnLocked(const Status& status) {
// Is setting bg_error_ enough here? This will at least stop
// compaction and fail any further writes.
// Caller must hold mutex_.
mutex_.AssertHeld();
if (immutable_db_options_.paranoid_checks && !status.ok() &&
!status.IsBusy() && !status.IsIncomplete()) {
error_handler_.SetBGError(status, BackgroundErrorReason::kWriteCallback);
}
}
void DBImpl::WriteStatusCheck(const Status& status) { void DBImpl::WriteStatusCheck(const Status& status) {
// Is setting bg_error_ enough here? This will at least stop // Is setting bg_error_ enough here? This will at least stop
// compaction and fail any further writes. // compaction and fail any further writes.

Loading…
Cancel
Save