db_stress to add --open_metadata_write_fault_one_in (#8235)

Summary:
DB Stress to add --open_metadata_write_fault_one_in which would randomly fail in some file metadata modification operations during DB Open, including file creation, close, renaming and directory sync. Some operations can fail before and after the operations take place.
If DB open fails, db_stress would retry without the failure ingestion, and DB is expected to open successfully.
This option is enabled in crash test in half of the time.
Some follow up changes would allow write failures in open time, and ingesting those failures in non-DB open cases.

Pull Request resolved: https://github.com/facebook/rocksdb/pull/8235

Test Plan: Run stress tests for a while and see failures got triggered. This can reproduce the bug fixed by https://github.com/facebook/rocksdb/pull/8192 and a similar one that fails when fsyncing parent directory.

Reviewed By: anand1976

Differential Revision: D28010944

fbshipit-source-id: 36a96da4dc3633e5f7680cef3ea0a900fcdb5558
This commit is contained in:
sdong 2021-04-28 10:57:11 -07:00 committed by Facebook GitHub Bot
parent 3949731de3
commit cde69a7cfd
8 changed files with 233 additions and 55 deletions

View File

@ -28,7 +28,9 @@ class DbStressEnvWrapper : public EnvWrapper {
f.find(".restore") != std::string::npos) { f.find(".restore") != std::string::npos) {
return target()->DeleteFile(f); return target()->DeleteFile(f);
} }
return Status::OK(); // Rename the file instead of deletion to keep the history, and
// at the same time it is not visible to RocksDB.
return target()->RenameFile(f, f + "_renamed_");
} }
// If true, all manifest files will not be delted in DeleteFile(). // If true, all manifest files will not be delted in DeleteFile().

View File

@ -808,4 +808,8 @@ DEFINE_uint64(user_timestamp_size, 0,
"Number of bytes for a user-defined timestamp. Currently, only " "Number of bytes for a user-defined timestamp. Currently, only "
"8-byte is supported"); "8-byte is supported");
DEFINE_int32(open_metadata_write_fault_one_in, 0,
"On non-zero, enables fault injection on file metadata write "
"during DB reopen.");
#endif // GFLAGS #endif // GFLAGS

View File

@ -30,6 +30,7 @@ DECLARE_int32(compaction_thread_pool_adjust_interval);
DECLARE_int32(continuous_verification_interval); DECLARE_int32(continuous_verification_interval);
DECLARE_int32(read_fault_one_in); DECLARE_int32(read_fault_one_in);
DECLARE_int32(write_fault_one_in); DECLARE_int32(write_fault_one_in);
DECLARE_int32(open_metadata_write_fault_one_in);
namespace ROCKSDB_NAMESPACE { namespace ROCKSDB_NAMESPACE {
class StressTest; class StressTest;

View File

@ -2104,6 +2104,9 @@ void StressTest::PrintEnv() const {
static_cast<int>(FLAGS_level_compaction_dynamic_level_bytes)); static_cast<int>(FLAGS_level_compaction_dynamic_level_bytes));
fprintf(stdout, "Read fault one in : %d\n", FLAGS_read_fault_one_in); fprintf(stdout, "Read fault one in : %d\n", FLAGS_read_fault_one_in);
fprintf(stdout, "Write fault one in : %d\n", FLAGS_write_fault_one_in); fprintf(stdout, "Write fault one in : %d\n", FLAGS_write_fault_one_in);
fprintf(stdout, "Open metadata write fault one in:\n");
fprintf(stdout, " %d\n",
FLAGS_open_metadata_write_fault_one_in);
fprintf(stdout, "Sync fault injection : %d\n", FLAGS_sync_fault_injection); fprintf(stdout, "Sync fault injection : %d\n", FLAGS_sync_fault_injection);
fprintf(stdout, "Best efforts recovery : %d\n", fprintf(stdout, "Best efforts recovery : %d\n",
static_cast<int>(FLAGS_best_efforts_recovery)); static_cast<int>(FLAGS_best_efforts_recovery));
@ -2409,6 +2412,24 @@ void StressTest::Open() {
new DbStressListener(FLAGS_db, options_.db_paths, cf_descriptors)); new DbStressListener(FLAGS_db, options_.db_paths, cf_descriptors));
options_.create_missing_column_families = true; options_.create_missing_column_families = true;
if (!FLAGS_use_txn) { if (!FLAGS_use_txn) {
#ifndef NDEBUG
// Determine whether we need to ingest file metadata write failures
// during DB reopen. If it does, enable it.
// Only ingest metadata error if it is reopening, as initial open
// failure doesn't need to be handled.
// TODO cover transaction DB is not covered in this fault test too.
bool ingest_meta_error =
FLAGS_open_metadata_write_fault_one_in &&
fault_fs_guard
->FileExists(FLAGS_db + "/CURRENT", IOOptions(), nullptr)
.ok();
if (ingest_meta_error) {
fault_fs_guard->EnableMetadataWriteErrorInjection();
fault_fs_guard->SetRandomMetadataWriteError(
FLAGS_open_metadata_write_fault_one_in);
}
while (true) {
#endif // NDEBUG
#ifndef ROCKSDB_LITE #ifndef ROCKSDB_LITE
// StackableDB-based BlobDB // StackableDB-based BlobDB
if (FLAGS_use_blob_db) { if (FLAGS_use_blob_db) {
@ -2421,7 +2442,8 @@ void StressTest::Open() {
blob_db::BlobDB* blob_db = nullptr; blob_db::BlobDB* blob_db = nullptr;
s = blob_db::BlobDB::Open(options_, blob_db_options, FLAGS_db, s = blob_db::BlobDB::Open(options_, blob_db_options, FLAGS_db,
cf_descriptors, &column_families_, &blob_db); cf_descriptors, &column_families_,
&blob_db);
if (s.ok()) { if (s.ok()) {
db_ = blob_db; db_ = blob_db;
} }
@ -2429,13 +2451,39 @@ void StressTest::Open() {
#endif // !ROCKSDB_LITE #endif // !ROCKSDB_LITE
{ {
if (db_preload_finished_.load() && FLAGS_read_only) { if (db_preload_finished_.load() && FLAGS_read_only) {
s = DB::OpenForReadOnly(DBOptions(options_), FLAGS_db, cf_descriptors, s = DB::OpenForReadOnly(DBOptions(options_), FLAGS_db,
&column_families_, &db_); cf_descriptors, &column_families_, &db_);
} else { } else {
s = DB::Open(DBOptions(options_), FLAGS_db, cf_descriptors, s = DB::Open(DBOptions(options_), FLAGS_db, cf_descriptors,
&column_families_, &db_); &column_families_, &db_);
} }
} }
#ifndef NDEBUG
if (ingest_meta_error) {
fault_fs_guard->DisableMetadataWriteErrorInjection();
if (!s.ok()) {
// After failure to opening a DB due to IO error, retry should
// successfully open the DB with correct data if no IO error shows
// up.
ingest_meta_error = false;
Random rand(static_cast<uint32_t>(FLAGS_seed));
if (rand.OneIn(2)) {
fault_fs_guard->DeleteFilesCreatedAfterLastDirSync(IOOptions(),
nullptr);
}
if (rand.OneIn(3)) {
fault_fs_guard->DropUnsyncedFileData();
} else if (rand.OneIn(2)) {
fault_fs_guard->DropRandomUnsyncedFileData(&rand);
}
continue;
}
}
break;
}
#endif // NDEBUG
} else { } else {
#ifndef ROCKSDB_LITE #ifndef ROCKSDB_LITE
TransactionDBOptions txn_db_options; TransactionDBOptions txn_db_options;

View File

@ -98,7 +98,7 @@ int db_stress_tool(int argc, char** argv) {
#ifndef NDEBUG #ifndef NDEBUG
if (FLAGS_read_fault_one_in || FLAGS_sync_fault_injection || if (FLAGS_read_fault_one_in || FLAGS_sync_fault_injection ||
FLAGS_write_fault_one_in) { FLAGS_write_fault_one_in || FLAGS_open_metadata_write_fault_one_in) {
FaultInjectionTestFS* fs = FaultInjectionTestFS* fs =
new FaultInjectionTestFS(raw_env->GetFileSystem()); new FaultInjectionTestFS(raw_env->GetFileSystem());
fault_fs_guard.reset(fs); fault_fs_guard.reset(fs);

View File

@ -137,6 +137,7 @@ default_params = {
"max_key_len": 3, "max_key_len": 3,
"key_len_percent_dist": "1,30,69", "key_len_percent_dist": "1,30,69",
"read_fault_one_in": lambda: random.choice([0, 1000]), "read_fault_one_in": lambda: random.choice([0, 1000]),
"open_metadata_write_fault_one_in": lambda: random.choice([0, 8]),
"sync_fault_injection": False, "sync_fault_injection": False,
"get_property_one_in": 1000000, "get_property_one_in": 1000000,
"paranoid_file_checks": lambda: random.choice([0, 1, 1, 1]), "paranoid_file_checks": lambda: random.choice([0, 1, 1, 1]),

View File

@ -87,8 +87,21 @@ IOStatus TestFSDirectory::Fsync(const IOOptions& options, IODebugContext* dbg) {
if (!fs_->IsFilesystemActive()) { if (!fs_->IsFilesystemActive()) {
return fs_->GetError(); return fs_->GetError();
} }
{
IOStatus in_s = fs_->InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
fs_->SyncDir(dirname_); fs_->SyncDir(dirname_);
return dir_->Fsync(options, dbg); IOStatus s = dir_->Fsync(options, dbg);
{
IOStatus in_s = fs_->InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
return s;
} }
TestFSWritableFile::TestFSWritableFile(const std::string& fname, TestFSWritableFile::TestFSWritableFile(const std::string& fname,
@ -159,6 +172,12 @@ IOStatus TestFSWritableFile::Close(const IOOptions& options,
if (!fs_->IsFilesystemActive()) { if (!fs_->IsFilesystemActive()) {
return fs_->GetError(); return fs_->GetError();
} }
{
IOStatus in_s = fs_->InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
writable_file_opened_ = false; writable_file_opened_ = false;
IOStatus io_s; IOStatus io_s;
io_s = target_->Append(state_.buffer_, options, dbg); io_s = target_->Append(state_.buffer_, options, dbg);
@ -170,6 +189,10 @@ IOStatus TestFSWritableFile::Close(const IOOptions& options,
} }
if (io_s.ok()) { if (io_s.ok()) {
fs_->WritableFileClosed(state_); fs_->WritableFileClosed(state_);
IOStatus in_s = fs_->InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
} }
return io_s; return io_s;
} }
@ -294,6 +317,12 @@ IOStatus FaultInjectionTestFS::NewWritableFile(
if (!IsFilesystemActive()) { if (!IsFilesystemActive()) {
return GetError(); return GetError();
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
if (IsFilesystemDirectWritable()) { if (IsFilesystemDirectWritable()) {
return target()->NewWritableFile(fname, file_opts, result, dbg); return target()->NewWritableFile(fname, file_opts, result, dbg);
} }
@ -305,12 +334,20 @@ IOStatus FaultInjectionTestFS::NewWritableFile(
// WritableFileWriter* file is opened // WritableFileWriter* file is opened
// again then it will be truncated - so forget our saved state. // again then it will be truncated - so forget our saved state.
UntrackFile(fname); UntrackFile(fname);
{
MutexLock l(&mutex_); MutexLock l(&mutex_);
open_files_.insert(fname); open_files_.insert(fname);
auto dir_and_name = TestFSGetDirAndName(fname); auto dir_and_name = TestFSGetDirAndName(fname);
auto& list = dir_to_new_files_since_last_sync_[dir_and_name.first]; auto& list = dir_to_new_files_since_last_sync_[dir_and_name.first];
list.insert(dir_and_name.second); list.insert(dir_and_name.second);
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
}
return io_s; return io_s;
} }
@ -323,6 +360,12 @@ IOStatus FaultInjectionTestFS::ReopenWritableFile(
if (IsFilesystemDirectWritable()) { if (IsFilesystemDirectWritable()) {
return target()->ReopenWritableFile(fname, file_opts, result, dbg); return target()->ReopenWritableFile(fname, file_opts, result, dbg);
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
IOStatus io_s = target()->ReopenWritableFile(fname, file_opts, result, dbg); IOStatus io_s = target()->ReopenWritableFile(fname, file_opts, result, dbg);
if (io_s.ok()) { if (io_s.ok()) {
result->reset( result->reset(
@ -330,12 +373,20 @@ IOStatus FaultInjectionTestFS::ReopenWritableFile(
// WritableFileWriter* file is opened // WritableFileWriter* file is opened
// again then it will be truncated - so forget our saved state. // again then it will be truncated - so forget our saved state.
UntrackFile(fname); UntrackFile(fname);
{
MutexLock l(&mutex_); MutexLock l(&mutex_);
open_files_.insert(fname); open_files_.insert(fname);
auto dir_and_name = TestFSGetDirAndName(fname); auto dir_and_name = TestFSGetDirAndName(fname);
auto& list = dir_to_new_files_since_last_sync_[dir_and_name.first]; auto& list = dir_to_new_files_since_last_sync_[dir_and_name.first];
list.insert(dir_and_name.second); list.insert(dir_and_name.second);
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
}
return io_s; return io_s;
} }
@ -348,18 +399,32 @@ IOStatus FaultInjectionTestFS::NewRandomRWFile(
if (IsFilesystemDirectWritable()) { if (IsFilesystemDirectWritable()) {
return target()->NewRandomRWFile(fname, file_opts, result, dbg); return target()->NewRandomRWFile(fname, file_opts, result, dbg);
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
IOStatus io_s = target()->NewRandomRWFile(fname, file_opts, result, dbg); IOStatus io_s = target()->NewRandomRWFile(fname, file_opts, result, dbg);
if (io_s.ok()) { if (io_s.ok()) {
result->reset(new TestFSRandomRWFile(fname, std::move(*result), this)); result->reset(new TestFSRandomRWFile(fname, std::move(*result), this));
// WritableFileWriter* file is opened // WritableFileWriter* file is opened
// again then it will be truncated - so forget our saved state. // again then it will be truncated - so forget our saved state.
UntrackFile(fname); UntrackFile(fname);
{
MutexLock l(&mutex_); MutexLock l(&mutex_);
open_files_.insert(fname); open_files_.insert(fname);
auto dir_and_name = TestFSGetDirAndName(fname); auto dir_and_name = TestFSGetDirAndName(fname);
auto& list = dir_to_new_files_since_last_sync_[dir_and_name.first]; auto& list = dir_to_new_files_since_last_sync_[dir_and_name.first];
list.insert(dir_and_name.second); list.insert(dir_and_name.second);
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
}
return io_s; return io_s;
} }
@ -385,9 +450,21 @@ IOStatus FaultInjectionTestFS::DeleteFile(const std::string& f,
if (!IsFilesystemActive()) { if (!IsFilesystemActive()) {
return GetError(); return GetError();
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
IOStatus io_s = FileSystemWrapper::DeleteFile(f, options, dbg); IOStatus io_s = FileSystemWrapper::DeleteFile(f, options, dbg);
if (io_s.ok()) { if (io_s.ok()) {
UntrackFile(f); UntrackFile(f);
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
} }
return io_s; return io_s;
} }
@ -399,9 +476,16 @@ IOStatus FaultInjectionTestFS::RenameFile(const std::string& s,
if (!IsFilesystemActive()) { if (!IsFilesystemActive()) {
return GetError(); return GetError();
} }
{
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
IOStatus io_s = FileSystemWrapper::RenameFile(s, t, options, dbg); IOStatus io_s = FileSystemWrapper::RenameFile(s, t, options, dbg);
if (io_s.ok()) { if (io_s.ok()) {
{
MutexLock l(&mutex_); MutexLock l(&mutex_);
if (db_file_state_.find(s) != db_file_state_.end()) { if (db_file_state_.find(s) != db_file_state_.end()) {
db_file_state_[t] = db_file_state_[s]; db_file_state_[t] = db_file_state_[s];
@ -416,6 +500,11 @@ IOStatus FaultInjectionTestFS::RenameFile(const std::string& s,
tlist.insert(tdn.second); tlist.insert(tdn.second);
} }
} }
IOStatus in_s = InjectMetadataWriteError();
if (!in_s.ok()) {
return in_s;
}
}
return io_s; return io_s;
} }
@ -618,6 +707,16 @@ IOStatus FaultInjectionTestFS::InjectWriteError(const std::string& file_name) {
return IOStatus::OK(); return IOStatus::OK();
} }
IOStatus FaultInjectionTestFS::InjectMetadataWriteError() {
MutexLock l(&mutex_);
if (!enable_metadata_write_error_injection_ ||
!metadata_write_error_one_in_ ||
!write_error_rand_.OneIn(metadata_write_error_one_in_)) {
return IOStatus::OK();
}
return IOStatus::IOError();
}
void FaultInjectionTestFS::PrintFaultBacktrace() { void FaultInjectionTestFS::PrintFaultBacktrace() {
#if defined(OS_LINUX) #if defined(OS_LINUX)
ErrorContext* ctx = ErrorContext* ctx =

View File

@ -174,7 +174,10 @@ class FaultInjectionTestFS : public FileSystemWrapper {
filesystem_writable_(false), filesystem_writable_(false),
thread_local_error_(new ThreadLocalPtr(DeleteThreadLocalErrorContext)), thread_local_error_(new ThreadLocalPtr(DeleteThreadLocalErrorContext)),
enable_write_error_injection_(false), enable_write_error_injection_(false),
enable_metadata_write_error_injection_(false),
write_error_rand_(0), write_error_rand_(0),
write_error_one_in_(0),
metadata_write_error_one_in_(0),
ingest_data_corruption_before_write_(false) {} ingest_data_corruption_before_write_(false) {}
virtual ~FaultInjectionTestFS() { error_.PermitUncheckedError(); } virtual ~FaultInjectionTestFS() { error_.PermitUncheckedError(); }
@ -361,10 +364,18 @@ class FaultInjectionTestFS : public FileSystemWrapper {
write_error_allowed_types_ = types; write_error_allowed_types_ = types;
} }
void SetRandomMetadataWriteError(int one_in) {
MutexLock l(&mutex_);
metadata_write_error_one_in_ = one_in;
}
// Inject an write error with randomlized parameter and the predefined // Inject an write error with randomlized parameter and the predefined
// error type. Only the allowed file types will inject the write error // error type. Only the allowed file types will inject the write error
IOStatus InjectWriteError(const std::string& file_name); IOStatus InjectWriteError(const std::string& file_name);
// Ingest error to metadata operations.
IOStatus InjectMetadataWriteError();
// Inject an error. For a READ operation, a status of IOError(), a // Inject an error. For a READ operation, a status of IOError(), a
// corruption in the contents of scratch, or truncation of slice // corruption in the contents of scratch, or truncation of slice
// are the types of error with equal probability. For OPEN, // are the types of error with equal probability. For OPEN,
@ -397,6 +408,11 @@ class FaultInjectionTestFS : public FileSystemWrapper {
enable_write_error_injection_ = true; enable_write_error_injection_ = true;
} }
void EnableMetadataWriteErrorInjection() {
MutexLock l(&mutex_);
enable_metadata_write_error_injection_ = true;
}
void DisableWriteErrorInjection() { void DisableWriteErrorInjection() {
MutexLock l(&mutex_); MutexLock l(&mutex_);
enable_write_error_injection_ = false; enable_write_error_injection_ = false;
@ -410,6 +426,11 @@ class FaultInjectionTestFS : public FileSystemWrapper {
} }
} }
void DisableMetadataWriteErrorInjection() {
MutexLock l(&mutex_);
enable_metadata_write_error_injection_ = false;
}
// We capture a backtrace every time a fault is injected, for debugging // We capture a backtrace every time a fault is injected, for debugging
// purposes. This call prints the backtrace to stderr and frees the // purposes. This call prints the backtrace to stderr and frees the
// saved callstack // saved callstack
@ -456,8 +477,10 @@ class FaultInjectionTestFS : public FileSystemWrapper {
std::unique_ptr<ThreadLocalPtr> thread_local_error_; std::unique_ptr<ThreadLocalPtr> thread_local_error_;
bool enable_write_error_injection_; bool enable_write_error_injection_;
bool enable_metadata_write_error_injection_;
Random write_error_rand_; Random write_error_rand_;
int write_error_one_in_; int write_error_one_in_;
int metadata_write_error_one_in_;
std::vector<FileType> write_error_allowed_types_; std::vector<FileType> write_error_allowed_types_;
bool ingest_data_corruption_before_write_; bool ingest_data_corruption_before_write_;
ChecksumType checksum_handoff_func_tpye_; ChecksumType checksum_handoff_func_tpye_;