From ec43a8b9fbb71112e08cd6187eea63756b1320a2 Mon Sep 17 00:00:00 2001 From: sdong Date: Wed, 13 May 2015 10:29:49 -0700 Subject: [PATCH] Universal Compaction with multiple levels won't allocate up to output size Summary: Universal compactions with multiple levels should use file preallocation size based on file size if output level is not level 0 Test Plan: Run all tests. Reviewers: igor Reviewed By: igor Subscribers: leveldb, dhruba Differential Revision: https://reviews.facebook.net/D38439 --- db/compaction.cc | 11 ++++++----- db/db_test.cc | 21 ++++++++++++++++++++- include/rocksdb/env.h | 2 ++ 3 files changed, 28 insertions(+), 6 deletions(-) diff --git a/db/compaction.cc b/db/compaction.cc index f8f4cdbb5..7ece0c4e9 100644 --- a/db/compaction.cc +++ b/db/compaction.cc @@ -325,13 +325,14 @@ void Compaction::Summary(char* output, int len) { uint64_t Compaction::OutputFilePreallocationSize() { uint64_t preallocation_size = 0; - if (cfd_->ioptions()->compaction_style == kCompactionStyleLevel) { + if (cfd_->ioptions()->compaction_style == kCompactionStyleLevel || + output_level() > 0) { preallocation_size = max_output_file_size_; } else { - for (size_t level_iter = 0; level_iter < num_input_levels(); ++level_iter) { - for (const auto& f : inputs_[level_iter].files) { - preallocation_size += f->fd.GetFileSize(); - } + // output_level() == 0 + assert(num_input_levels() > 0); + for (const auto& f : inputs_[0].files) { + preallocation_size += f->fd.GetFileSize(); } } // Over-estimate slightly so we don't end up just barely crossing diff --git a/db/db_test.cc b/db/db_test.cc index 11aeeee9d..dd17fdc2f 100644 --- a/db/db_test.cc +++ b/db/db_test.cc @@ -200,7 +200,14 @@ class SpecialEnv : public EnvWrapper { return base_->Append(data); } } - Status Close() override { return base_->Close(); } + Status Close() override { + // Check preallocation size + // preallocation size is never passed to base file. + size_t preallocation_size = preallocation_block_size(); + TEST_SYNC_POINT_CALLBACK("DBTestWritableFile.GetPreallocationStatus", + &preallocation_size); + return base_->Close(); + } Status Flush() override { return base_->Flush(); } Status Sync() override { ++env_->sync_counter_; @@ -4067,6 +4074,16 @@ TEST_P(DBTestUniversalCompaction, UniversalCompactionTrigger) { DestroyAndReopen(options); CreateAndReopenWithCF({"pikachu"}, options); + rocksdb::SyncPoint::GetInstance()->SetCallBack( + "DBTestWritableFile.GetPreallocationStatus", [&](void* arg) { + ASSERT_TRUE(arg != nullptr); + size_t preallocation_size = *(static_cast(arg)); + if (num_levels_ > 3) { + ASSERT_LE(preallocation_size, options.target_file_size_base * 1.1); + } + }); + rocksdb::SyncPoint::GetInstance()->EnableProcessing(); + Random rnd(301); int key_idx = 0; @@ -4175,6 +4192,8 @@ TEST_P(DBTestUniversalCompaction, UniversalCompactionTrigger) { dbfull()->TEST_WaitForCompact(); // All files at level 0 will be compacted into a single one. ASSERT_EQ(NumSortedRuns(1), 1); + + rocksdb::SyncPoint::GetInstance()->DisableProcessing(); } TEST_P(DBTestUniversalCompaction, UniversalCompactionSizeAmplification) { diff --git a/include/rocksdb/env.h b/include/rocksdb/env.h index 64af02049..d7403f8c0 100644 --- a/include/rocksdb/env.h +++ b/include/rocksdb/env.h @@ -532,6 +532,8 @@ class WritableFile { return Status::OK(); } + size_t preallocation_block_size() { return preallocation_block_size_; } + private: size_t last_preallocated_block_; size_t preallocation_block_size_;