Revert to storing UncompressionDicts in the cache (#5645)
Summary: PR https://github.com/facebook/rocksdb/issues/5584 decoupled the uncompression dictionary object from the underlying block data; however, this defeats the purpose of the digested ZSTD dictionary, since the whole point of the digest is to create it once and reuse it over and over again. This patch goes back to storing the uncompression dictionary itself in the cache (which should be now safe to do, since it no longer includes a Statistics pointer), while preserving the rest of the refactoring. Pull Request resolved: https://github.com/facebook/rocksdb/pull/5645 Test Plan: make asan_check Differential Revision: D16551864 Pulled By: ltamasi fbshipit-source-id: 2a7e2d34bb16e70e3c816506d5afe1d842057800
This commit is contained in:
parent
d039c41b43
commit
fdc9b5248b
@ -68,6 +68,57 @@ BlockBasedTable::~BlockBasedTable() {
|
||||
|
||||
std::atomic<uint64_t> BlockBasedTable::next_cache_key_id_(0);
|
||||
|
||||
template <typename TBlocklike>
|
||||
class BlocklikeTraits;
|
||||
|
||||
template <>
|
||||
class BlocklikeTraits<BlockContents> {
|
||||
public:
|
||||
static BlockContents* Create(BlockContents&& contents,
|
||||
SequenceNumber /* global_seqno */,
|
||||
size_t /* read_amp_bytes_per_bit */,
|
||||
Statistics* /* statistics */,
|
||||
bool /* using_zstd */) {
|
||||
return new BlockContents(std::move(contents));
|
||||
}
|
||||
|
||||
static uint32_t GetNumRestarts(const BlockContents& /* contents */) {
|
||||
return 0;
|
||||
}
|
||||
};
|
||||
|
||||
template <>
|
||||
class BlocklikeTraits<Block> {
|
||||
public:
|
||||
static Block* Create(BlockContents&& contents, SequenceNumber global_seqno,
|
||||
size_t read_amp_bytes_per_bit, Statistics* statistics,
|
||||
bool /* using_zstd */) {
|
||||
return new Block(std::move(contents), global_seqno, read_amp_bytes_per_bit,
|
||||
statistics);
|
||||
}
|
||||
|
||||
static uint32_t GetNumRestarts(const Block& block) {
|
||||
return block.NumRestarts();
|
||||
}
|
||||
};
|
||||
|
||||
template <>
|
||||
class BlocklikeTraits<UncompressionDict> {
|
||||
public:
|
||||
static UncompressionDict* Create(BlockContents&& contents,
|
||||
SequenceNumber /* global_seqno */,
|
||||
size_t /* read_amp_bytes_per_bit */,
|
||||
Statistics* /* statistics */,
|
||||
bool using_zstd) {
|
||||
return new UncompressionDict(contents.data, std::move(contents.allocation),
|
||||
using_zstd);
|
||||
}
|
||||
|
||||
static uint32_t GetNumRestarts(const UncompressionDict& /* dict */) {
|
||||
return 0;
|
||||
}
|
||||
};
|
||||
|
||||
namespace {
|
||||
// Read the block identified by "handle" from "file".
|
||||
// The only relevant option is options.verify_checksums for now.
|
||||
@ -75,15 +126,16 @@ namespace {
|
||||
// On success fill *result and return OK - caller owns *result
|
||||
// @param uncompression_dict Data for presetting the compression library's
|
||||
// dictionary.
|
||||
template <typename TBlocklike>
|
||||
Status ReadBlockFromFile(
|
||||
RandomAccessFileReader* file, FilePrefetchBuffer* prefetch_buffer,
|
||||
const Footer& footer, const ReadOptions& options, const BlockHandle& handle,
|
||||
std::unique_ptr<Block>* result, const ImmutableCFOptions& ioptions,
|
||||
std::unique_ptr<TBlocklike>* result, const ImmutableCFOptions& ioptions,
|
||||
bool do_uncompress, bool maybe_compressed, BlockType block_type,
|
||||
const UncompressionDict& uncompression_dict,
|
||||
const PersistentCacheOptions& cache_options, SequenceNumber global_seqno,
|
||||
size_t read_amp_bytes_per_bit, MemoryAllocator* memory_allocator,
|
||||
bool for_compaction = false) {
|
||||
bool for_compaction, bool using_zstd) {
|
||||
assert(result);
|
||||
|
||||
BlockContents contents;
|
||||
@ -93,34 +145,9 @@ Status ReadBlockFromFile(
|
||||
cache_options, memory_allocator, nullptr, for_compaction);
|
||||
Status s = block_fetcher.ReadBlockContents();
|
||||
if (s.ok()) {
|
||||
result->reset(new Block(std::move(contents), global_seqno,
|
||||
read_amp_bytes_per_bit, ioptions.statistics));
|
||||
}
|
||||
|
||||
return s;
|
||||
}
|
||||
|
||||
Status ReadBlockFromFile(
|
||||
RandomAccessFileReader* file, FilePrefetchBuffer* prefetch_buffer,
|
||||
const Footer& footer, const ReadOptions& options, const BlockHandle& handle,
|
||||
std::unique_ptr<BlockContents>* result, const ImmutableCFOptions& ioptions,
|
||||
bool do_uncompress, bool maybe_compressed, BlockType block_type,
|
||||
const UncompressionDict& uncompression_dict,
|
||||
const PersistentCacheOptions& cache_options,
|
||||
SequenceNumber /* global_seqno */, size_t /* read_amp_bytes_per_bit */,
|
||||
MemoryAllocator* memory_allocator, bool for_compaction = false) {
|
||||
assert(result);
|
||||
|
||||
result->reset(new BlockContents);
|
||||
|
||||
BlockFetcher block_fetcher(
|
||||
file, prefetch_buffer, footer, options, handle, result->get(), ioptions,
|
||||
do_uncompress, maybe_compressed, block_type, uncompression_dict,
|
||||
cache_options, memory_allocator, nullptr, for_compaction);
|
||||
|
||||
const Status s = block_fetcher.ReadBlockContents();
|
||||
if (!s.ok()) {
|
||||
result->reset();
|
||||
result->reset(BlocklikeTraits<TBlocklike>::Create(
|
||||
std::move(contents), global_seqno, read_amp_bytes_per_bit,
|
||||
ioptions.statistics, using_zstd));
|
||||
}
|
||||
|
||||
return s;
|
||||
@ -1595,7 +1622,8 @@ Status BlockBasedTable::ReadMetaBlock(FilePrefetchBuffer* prefetch_buffer,
|
||||
true /* decompress */, true /*maybe_compressed*/, BlockType::kMetaIndex,
|
||||
UncompressionDict::GetEmptyDict(), rep_->persistent_cache_options,
|
||||
kDisableGlobalSequenceNumber, 0 /* read_amp_bytes_per_bit */,
|
||||
GetMemoryAllocator(rep_->table_options));
|
||||
GetMemoryAllocator(rep_->table_options), false /* for_compaction */,
|
||||
rep_->blocks_definitely_zstd_compressed);
|
||||
|
||||
if (!s.ok()) {
|
||||
ROCKS_LOG_ERROR(rep_->ioptions.info_log,
|
||||
@ -1612,38 +1640,6 @@ Status BlockBasedTable::ReadMetaBlock(FilePrefetchBuffer* prefetch_buffer,
|
||||
return Status::OK();
|
||||
}
|
||||
|
||||
template <typename TBlocklike>
|
||||
class BlocklikeTraits;
|
||||
|
||||
template <>
|
||||
class BlocklikeTraits<BlockContents> {
|
||||
public:
|
||||
static BlockContents* Create(BlockContents&& contents,
|
||||
SequenceNumber /* global_seqno */,
|
||||
size_t /* read_amp_bytes_per_bit */,
|
||||
Statistics* /* statistics */) {
|
||||
return new BlockContents(std::move(contents));
|
||||
}
|
||||
|
||||
static uint32_t GetNumRestarts(const BlockContents& /* contents */) {
|
||||
return 0;
|
||||
}
|
||||
};
|
||||
|
||||
template <>
|
||||
class BlocklikeTraits<Block> {
|
||||
public:
|
||||
static Block* Create(BlockContents&& contents, SequenceNumber global_seqno,
|
||||
size_t read_amp_bytes_per_bit, Statistics* statistics) {
|
||||
return new Block(std::move(contents), global_seqno, read_amp_bytes_per_bit,
|
||||
statistics);
|
||||
}
|
||||
|
||||
static uint32_t GetNumRestarts(const Block& block) {
|
||||
return block.NumRestarts();
|
||||
}
|
||||
};
|
||||
|
||||
template <typename TBlocklike>
|
||||
Status BlockBasedTable::GetDataBlockFromCache(
|
||||
const Slice& block_cache_key, const Slice& compressed_block_cache_key,
|
||||
@ -1715,7 +1711,8 @@ Status BlockBasedTable::GetDataBlockFromCache(
|
||||
std::unique_ptr<TBlocklike> block_holder(
|
||||
BlocklikeTraits<TBlocklike>::Create(
|
||||
std::move(contents), rep_->get_global_seqno(block_type),
|
||||
read_amp_bytes_per_bit, statistics)); // uncompressed block
|
||||
read_amp_bytes_per_bit, statistics,
|
||||
rep_->blocks_definitely_zstd_compressed)); // uncompressed block
|
||||
|
||||
if (block_cache != nullptr && block_holder->own_bytes() &&
|
||||
read_options.fill_cache) {
|
||||
@ -1786,11 +1783,11 @@ Status BlockBasedTable::PutDataBlockToCache(
|
||||
|
||||
block_holder.reset(BlocklikeTraits<TBlocklike>::Create(
|
||||
std::move(uncompressed_block_contents), seq_no, read_amp_bytes_per_bit,
|
||||
statistics));
|
||||
statistics, rep_->blocks_definitely_zstd_compressed));
|
||||
} else {
|
||||
block_holder.reset(BlocklikeTraits<TBlocklike>::Create(
|
||||
std::move(*raw_block_contents), seq_no, read_amp_bytes_per_bit,
|
||||
statistics));
|
||||
statistics, rep_->blocks_definitely_zstd_compressed));
|
||||
}
|
||||
|
||||
// Insert compressed block into compressed block cache.
|
||||
@ -1908,7 +1905,7 @@ TBlockIter* BlockBasedTable::NewDataBlockIterator(
|
||||
return iter;
|
||||
}
|
||||
|
||||
UncompressionDict uncompression_dict;
|
||||
CachableEntry<UncompressionDict> uncompression_dict;
|
||||
if (rep_->uncompression_dict_reader) {
|
||||
const bool no_io = (ro.read_tier == kBlockCacheTier);
|
||||
s = rep_->uncompression_dict_reader->GetOrReadUncompressionDictionary(
|
||||
@ -1920,9 +1917,13 @@ TBlockIter* BlockBasedTable::NewDataBlockIterator(
|
||||
}
|
||||
}
|
||||
|
||||
const UncompressionDict& dict = uncompression_dict.GetValue()
|
||||
? *uncompression_dict.GetValue()
|
||||
: UncompressionDict::GetEmptyDict();
|
||||
|
||||
CachableEntry<Block> block;
|
||||
s = RetrieveBlock(prefetch_buffer, ro, handle, uncompression_dict, &block,
|
||||
block_type, get_context, lookup_context, for_compaction,
|
||||
s = RetrieveBlock(prefetch_buffer, ro, handle, dict, &block, block_type,
|
||||
get_context, lookup_context, for_compaction,
|
||||
/* use_cache */ true);
|
||||
|
||||
if (!s.ok()) {
|
||||
@ -2272,15 +2273,11 @@ Status BlockBasedTable::MaybeReadBlockAndLoadToCache(
|
||||
// handles - A vector of block handles. Some of them me be NULL handles
|
||||
// scratch - An optional contiguous buffer to read compressed blocks into
|
||||
void BlockBasedTable::MaybeLoadBlocksToCache(
|
||||
const ReadOptions& options,
|
||||
const MultiGetRange* batch,
|
||||
const autovector<BlockHandle, MultiGetContext::MAX_BATCH_SIZE>* handles,
|
||||
const ReadOptions& options, const MultiGetRange* batch,
|
||||
const autovector<BlockHandle, MultiGetContext::MAX_BATCH_SIZE>* handles,
|
||||
autovector<Status, MultiGetContext::MAX_BATCH_SIZE>* statuses,
|
||||
autovector<
|
||||
CachableEntry<Block>, MultiGetContext::MAX_BATCH_SIZE>* results,
|
||||
char* scratch,
|
||||
const UncompressionDict& uncompression_dict) const {
|
||||
|
||||
autovector<CachableEntry<Block>, MultiGetContext::MAX_BATCH_SIZE>* results,
|
||||
char* scratch, const UncompressionDict& uncompression_dict) const {
|
||||
RandomAccessFileReader* file = rep_->file.get();
|
||||
const Footer& footer = rep_->footer;
|
||||
const ImmutableCFOptions& ioptions = rep_->ioptions;
|
||||
@ -2476,7 +2473,8 @@ Status BlockBasedTable::RetrieveBlock(
|
||||
block_type == BlockType::kData
|
||||
? rep_->table_options.read_amp_bytes_per_bit
|
||||
: 0,
|
||||
GetMemoryAllocator(rep_->table_options), for_compaction);
|
||||
GetMemoryAllocator(rep_->table_options), for_compaction,
|
||||
rep_->blocks_definitely_zstd_compressed);
|
||||
}
|
||||
|
||||
if (!s.ok()) {
|
||||
@ -2505,6 +2503,13 @@ template Status BlockBasedTable::RetrieveBlock<Block>(
|
||||
GetContext* get_context, BlockCacheLookupContext* lookup_context,
|
||||
bool for_compaction, bool use_cache) const;
|
||||
|
||||
template Status BlockBasedTable::RetrieveBlock<UncompressionDict>(
|
||||
FilePrefetchBuffer* prefetch_buffer, const ReadOptions& ro,
|
||||
const BlockHandle& handle, const UncompressionDict& uncompression_dict,
|
||||
CachableEntry<UncompressionDict>* block_entry, BlockType block_type,
|
||||
GetContext* get_context, BlockCacheLookupContext* lookup_context,
|
||||
bool for_compaction, bool use_cache) const;
|
||||
|
||||
BlockBasedTable::PartitionedIndexIteratorState::PartitionedIndexIteratorState(
|
||||
const BlockBasedTable* table,
|
||||
std::unordered_map<uint64_t, CachableEntry<Block>>* block_map)
|
||||
@ -3398,7 +3403,7 @@ void BlockBasedTable::MultiGet(const ReadOptions& read_options,
|
||||
MultiGetRange data_block_range(sst_file_range, sst_file_range.begin(),
|
||||
sst_file_range.end());
|
||||
|
||||
UncompressionDict uncompression_dict;
|
||||
CachableEntry<UncompressionDict> uncompression_dict;
|
||||
Status uncompression_dict_status;
|
||||
if (rep_->uncompression_dict_reader) {
|
||||
uncompression_dict_status =
|
||||
@ -3408,6 +3413,10 @@ void BlockBasedTable::MultiGet(const ReadOptions& read_options,
|
||||
&uncompression_dict);
|
||||
}
|
||||
|
||||
const UncompressionDict& dict = uncompression_dict.GetValue()
|
||||
? *uncompression_dict.GetValue()
|
||||
: UncompressionDict::GetEmptyDict();
|
||||
|
||||
size_t total_len = 0;
|
||||
ReadOptions ro = read_options;
|
||||
ro.read_tier = kBlockCacheTier;
|
||||
@ -3451,8 +3460,8 @@ void BlockBasedTable::MultiGet(const ReadOptions& read_options,
|
||||
}
|
||||
offset = v.handle.offset();
|
||||
BlockHandle handle = v.handle;
|
||||
Status s = GetDataBlockFromCache(ro, handle, uncompression_dict,
|
||||
&(results.back()), BlockType::kData, miter->get_context);
|
||||
Status s = GetDataBlockFromCache(ro, handle, dict, &(results.back()),
|
||||
BlockType::kData, miter->get_context);
|
||||
if (s.ok() && !results.back().IsEmpty()) {
|
||||
// Found it in the cache. Add NULL handle to indicate there is
|
||||
// nothing to read from disk
|
||||
@ -3483,9 +3492,8 @@ void BlockBasedTable::MultiGet(const ReadOptions& read_options,
|
||||
block_buf.reset(scratch);
|
||||
}
|
||||
}
|
||||
MaybeLoadBlocksToCache(read_options,
|
||||
&data_block_range, &block_handles, &statuses, &results,
|
||||
scratch, uncompression_dict);
|
||||
MaybeLoadBlocksToCache(read_options, &data_block_range, &block_handles,
|
||||
&statuses, &results, scratch, dict);
|
||||
}
|
||||
}
|
||||
|
||||
@ -4098,7 +4106,7 @@ Status BlockBasedTable::DumpTable(WritableFile* out_file) {
|
||||
|
||||
// Output compression dictionary
|
||||
if (rep_->uncompression_dict_reader) {
|
||||
UncompressionDict uncompression_dict;
|
||||
CachableEntry<UncompressionDict> uncompression_dict;
|
||||
s = rep_->uncompression_dict_reader->GetOrReadUncompressionDictionary(
|
||||
nullptr /* prefetch_buffer */, false /* no_io */,
|
||||
nullptr /* get_context */, nullptr /* lookup_context */,
|
||||
@ -4107,7 +4115,9 @@ Status BlockBasedTable::DumpTable(WritableFile* out_file) {
|
||||
return s;
|
||||
}
|
||||
|
||||
const Slice& raw_dict = uncompression_dict.GetRawDict();
|
||||
assert(uncompression_dict.GetValue());
|
||||
|
||||
const Slice& raw_dict = uncompression_dict.GetValue()->GetRawDict();
|
||||
out_file->Append(
|
||||
"Compression Dictionary:\n"
|
||||
"--------------------------------------\n");
|
||||
|
@ -309,10 +309,10 @@ class BlockBasedTable : public TableReader {
|
||||
|
||||
void MaybeLoadBlocksToCache(
|
||||
const ReadOptions& options, const MultiGetRange* batch,
|
||||
const autovector<BlockHandle, MultiGetContext::MAX_BATCH_SIZE>* handles,
|
||||
const autovector<BlockHandle, MultiGetContext::MAX_BATCH_SIZE>* handles,
|
||||
autovector<Status, MultiGetContext::MAX_BATCH_SIZE>* statuses,
|
||||
autovector<
|
||||
CachableEntry<Block>, MultiGetContext::MAX_BATCH_SIZE>* results,
|
||||
autovector<CachableEntry<Block>, MultiGetContext::MAX_BATCH_SIZE>*
|
||||
results,
|
||||
char* scratch, const UncompressionDict& uncompression_dict) const;
|
||||
|
||||
// Get the iterator from the index reader.
|
||||
|
@ -21,36 +21,36 @@ Status UncompressionDictReader::Create(
|
||||
assert(!pin || prefetch);
|
||||
assert(uncompression_dict_reader);
|
||||
|
||||
CachableEntry<BlockContents> uncompression_dict_block;
|
||||
CachableEntry<UncompressionDict> uncompression_dict;
|
||||
if (prefetch || !use_cache) {
|
||||
const Status s = ReadUncompressionDictionaryBlock(
|
||||
const Status s = ReadUncompressionDictionary(
|
||||
table, prefetch_buffer, ReadOptions(), use_cache,
|
||||
nullptr /* get_context */, lookup_context, &uncompression_dict_block);
|
||||
nullptr /* get_context */, lookup_context, &uncompression_dict);
|
||||
if (!s.ok()) {
|
||||
return s;
|
||||
}
|
||||
|
||||
if (use_cache && !pin) {
|
||||
uncompression_dict_block.Reset();
|
||||
uncompression_dict.Reset();
|
||||
}
|
||||
}
|
||||
|
||||
uncompression_dict_reader->reset(
|
||||
new UncompressionDictReader(table, std::move(uncompression_dict_block)));
|
||||
new UncompressionDictReader(table, std::move(uncompression_dict)));
|
||||
|
||||
return Status::OK();
|
||||
}
|
||||
|
||||
Status UncompressionDictReader::ReadUncompressionDictionaryBlock(
|
||||
Status UncompressionDictReader::ReadUncompressionDictionary(
|
||||
const BlockBasedTable* table, FilePrefetchBuffer* prefetch_buffer,
|
||||
const ReadOptions& read_options, bool use_cache, GetContext* get_context,
|
||||
BlockCacheLookupContext* lookup_context,
|
||||
CachableEntry<BlockContents>* uncompression_dict_block) {
|
||||
CachableEntry<UncompressionDict>* uncompression_dict) {
|
||||
// TODO: add perf counter for compression dictionary read time
|
||||
|
||||
assert(table);
|
||||
assert(uncompression_dict_block);
|
||||
assert(uncompression_dict_block->IsEmpty());
|
||||
assert(uncompression_dict);
|
||||
assert(uncompression_dict->IsEmpty());
|
||||
|
||||
const BlockBasedTable::Rep* const rep = table->get_rep();
|
||||
assert(rep);
|
||||
@ -58,7 +58,7 @@ Status UncompressionDictReader::ReadUncompressionDictionaryBlock(
|
||||
|
||||
const Status s = table->RetrieveBlock(
|
||||
prefetch_buffer, read_options, rep->compression_dict_handle,
|
||||
UncompressionDict::GetEmptyDict(), uncompression_dict_block,
|
||||
UncompressionDict::GetEmptyDict(), uncompression_dict,
|
||||
BlockType::kCompressionDictionary, get_context, lookup_context,
|
||||
/* for_compaction */ false, use_cache);
|
||||
|
||||
@ -73,15 +73,14 @@ Status UncompressionDictReader::ReadUncompressionDictionaryBlock(
|
||||
return s;
|
||||
}
|
||||
|
||||
Status UncompressionDictReader::GetOrReadUncompressionDictionaryBlock(
|
||||
Status UncompressionDictReader::GetOrReadUncompressionDictionary(
|
||||
FilePrefetchBuffer* prefetch_buffer, bool no_io, GetContext* get_context,
|
||||
BlockCacheLookupContext* lookup_context,
|
||||
CachableEntry<BlockContents>* uncompression_dict_block) const {
|
||||
assert(uncompression_dict_block);
|
||||
CachableEntry<UncompressionDict>* uncompression_dict) const {
|
||||
assert(uncompression_dict);
|
||||
|
||||
if (!uncompression_dict_block_.IsEmpty()) {
|
||||
uncompression_dict_block->SetUnownedValue(
|
||||
uncompression_dict_block_.GetValue());
|
||||
if (!uncompression_dict_.IsEmpty()) {
|
||||
uncompression_dict->SetUnownedValue(uncompression_dict_.GetValue());
|
||||
return Status::OK();
|
||||
}
|
||||
|
||||
@ -90,42 +89,17 @@ Status UncompressionDictReader::GetOrReadUncompressionDictionaryBlock(
|
||||
read_options.read_tier = kBlockCacheTier;
|
||||
}
|
||||
|
||||
return ReadUncompressionDictionaryBlock(
|
||||
table_, prefetch_buffer, read_options, cache_dictionary_blocks(),
|
||||
get_context, lookup_context, uncompression_dict_block);
|
||||
}
|
||||
|
||||
Status UncompressionDictReader::GetOrReadUncompressionDictionary(
|
||||
FilePrefetchBuffer* prefetch_buffer, bool no_io, GetContext* get_context,
|
||||
BlockCacheLookupContext* lookup_context,
|
||||
UncompressionDict* uncompression_dict) const {
|
||||
CachableEntry<BlockContents> uncompression_dict_block;
|
||||
const Status s = GetOrReadUncompressionDictionaryBlock(
|
||||
prefetch_buffer, no_io, get_context, lookup_context,
|
||||
&uncompression_dict_block);
|
||||
|
||||
if (!s.ok()) {
|
||||
return s;
|
||||
}
|
||||
|
||||
assert(uncompression_dict);
|
||||
assert(table_);
|
||||
assert(table_->get_rep());
|
||||
|
||||
UncompressionDict dict(uncompression_dict_block.GetValue()->data,
|
||||
table_->get_rep()->blocks_definitely_zstd_compressed);
|
||||
*uncompression_dict = std::move(dict);
|
||||
uncompression_dict_block.TransferTo(uncompression_dict);
|
||||
|
||||
return Status::OK();
|
||||
return ReadUncompressionDictionary(table_, prefetch_buffer, read_options,
|
||||
cache_dictionary_blocks(), get_context,
|
||||
lookup_context, uncompression_dict);
|
||||
}
|
||||
|
||||
size_t UncompressionDictReader::ApproximateMemoryUsage() const {
|
||||
assert(!uncompression_dict_block_.GetOwnValue() ||
|
||||
uncompression_dict_block_.GetValue() != nullptr);
|
||||
size_t usage = uncompression_dict_block_.GetOwnValue()
|
||||
? uncompression_dict_block_.GetValue()->ApproximateMemoryUsage()
|
||||
: 0;
|
||||
assert(!uncompression_dict_.GetOwnValue() ||
|
||||
uncompression_dict_.GetValue() != nullptr);
|
||||
size_t usage = uncompression_dict_.GetOwnValue()
|
||||
? uncompression_dict_.GetValue()->ApproximateMemoryUsage()
|
||||
: 0;
|
||||
|
||||
#ifdef ROCKSDB_MALLOC_USABLE_SIZE
|
||||
usage += malloc_usable_size(const_cast<UncompressionDictReader*>(this));
|
||||
|
@ -33,34 +33,27 @@ class UncompressionDictReader {
|
||||
Status GetOrReadUncompressionDictionary(
|
||||
FilePrefetchBuffer* prefetch_buffer, bool no_io, GetContext* get_context,
|
||||
BlockCacheLookupContext* lookup_context,
|
||||
UncompressionDict* uncompression_dict) const;
|
||||
CachableEntry<UncompressionDict>* uncompression_dict) const;
|
||||
|
||||
size_t ApproximateMemoryUsage() const;
|
||||
|
||||
private:
|
||||
UncompressionDictReader(
|
||||
const BlockBasedTable* t,
|
||||
CachableEntry<BlockContents>&& uncompression_dict_block)
|
||||
: table_(t),
|
||||
uncompression_dict_block_(std::move(uncompression_dict_block)) {
|
||||
UncompressionDictReader(const BlockBasedTable* t,
|
||||
CachableEntry<UncompressionDict>&& uncompression_dict)
|
||||
: table_(t), uncompression_dict_(std::move(uncompression_dict)) {
|
||||
assert(table_);
|
||||
}
|
||||
|
||||
bool cache_dictionary_blocks() const;
|
||||
|
||||
static Status ReadUncompressionDictionaryBlock(
|
||||
static Status ReadUncompressionDictionary(
|
||||
const BlockBasedTable* table, FilePrefetchBuffer* prefetch_buffer,
|
||||
const ReadOptions& read_options, bool use_cache, GetContext* get_context,
|
||||
BlockCacheLookupContext* lookup_context,
|
||||
CachableEntry<BlockContents>* uncompression_dict_block);
|
||||
|
||||
Status GetOrReadUncompressionDictionaryBlock(
|
||||
FilePrefetchBuffer* prefetch_buffer, bool no_io, GetContext* get_context,
|
||||
BlockCacheLookupContext* lookup_context,
|
||||
CachableEntry<BlockContents>* uncompression_dict_block) const;
|
||||
CachableEntry<UncompressionDict>* uncompression_dict);
|
||||
|
||||
const BlockBasedTable* table_;
|
||||
CachableEntry<BlockContents> uncompression_dict_block_;
|
||||
CachableEntry<UncompressionDict> uncompression_dict_;
|
||||
};
|
||||
|
||||
} // namespace rocksdb
|
||||
|
@ -21,7 +21,6 @@
|
||||
#include <string>
|
||||
|
||||
#include "memory/memory_allocator.h"
|
||||
#include "rocksdb/cleanable.h"
|
||||
#include "rocksdb/options.h"
|
||||
#include "rocksdb/table.h"
|
||||
#include "util/coding.h"
|
||||
@ -217,14 +216,19 @@ struct CompressionDict {
|
||||
|
||||
// Holds dictionary and related data, like ZSTD's digested uncompression
|
||||
// dictionary.
|
||||
struct UncompressionDict : public Cleanable {
|
||||
// Block containing the data for the compression dictionary. It is non-empty
|
||||
// only if the constructor that takes a string parameter is used.
|
||||
struct UncompressionDict {
|
||||
// Block containing the data for the compression dictionary in case the
|
||||
// constructor that takes a string parameter is used.
|
||||
std::string dict_;
|
||||
|
||||
// Slice pointing to the compression dictionary data. Points to
|
||||
// dict_ if the string constructor is used. In the case of the Slice
|
||||
// constructor, it is a copy of the Slice passed by the caller.
|
||||
// Block containing the data for the compression dictionary in case the
|
||||
// constructor that takes a Slice parameter is used and the passed in
|
||||
// CacheAllocationPtr is not nullptr.
|
||||
CacheAllocationPtr allocation_;
|
||||
|
||||
// Slice pointing to the compression dictionary data. Can point to
|
||||
// dict_, allocation_, or some other memory location, depending on how
|
||||
// the object was constructed.
|
||||
Slice slice_;
|
||||
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
@ -232,18 +236,12 @@ struct UncompressionDict : public Cleanable {
|
||||
ZSTD_DDict* zstd_ddict_ = nullptr;
|
||||
#endif // ROCKSDB_ZSTD_DDICT
|
||||
|
||||
// Slice constructor: it is the caller's responsibility to either
|
||||
// a) make sure slice remains valid throughout the lifecycle of this object OR
|
||||
// b) transfer the management of the underlying resource (e.g. cache handle)
|
||||
// to this object, in which case UncompressionDict is self-contained, and the
|
||||
// resource is guaranteed to be released (via the cleanup logic in Cleanable)
|
||||
// when UncompressionDict is destroyed.
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
UncompressionDict(Slice slice, bool using_zstd)
|
||||
UncompressionDict(std::string dict, bool using_zstd)
|
||||
#else // ROCKSDB_ZSTD_DDICT
|
||||
UncompressionDict(Slice slice, bool /*using_zstd*/)
|
||||
UncompressionDict(std::string dict, bool /* using_zstd */)
|
||||
#endif // ROCKSDB_ZSTD_DDICT
|
||||
: slice_(std::move(slice)) {
|
||||
: dict_(std::move(dict)), slice_(dict_) {
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
if (!slice_.empty() && using_zstd) {
|
||||
zstd_ddict_ = ZSTD_createDDict_byReference(slice_.data(), slice_.size());
|
||||
@ -252,14 +250,25 @@ struct UncompressionDict : public Cleanable {
|
||||
#endif // ROCKSDB_ZSTD_DDICT
|
||||
}
|
||||
|
||||
// String constructor: results in a self-contained UncompressionDict.
|
||||
UncompressionDict(std::string dict, bool using_zstd)
|
||||
: UncompressionDict(Slice(dict), using_zstd) {
|
||||
dict_ = std::move(dict);
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
UncompressionDict(Slice slice, CacheAllocationPtr&& allocation,
|
||||
bool using_zstd)
|
||||
#else // ROCKSDB_ZSTD_DDICT
|
||||
UncompressionDict(Slice slice, CacheAllocationPtr&& allocation,
|
||||
bool /* using_zstd */)
|
||||
#endif // ROCKSDB_ZSTD_DDICT
|
||||
: allocation_(std::move(allocation)), slice_(std::move(slice)) {
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
if (!slice_.empty() && using_zstd) {
|
||||
zstd_ddict_ = ZSTD_createDDict_byReference(slice_.data(), slice_.size());
|
||||
assert(zstd_ddict_ != nullptr);
|
||||
}
|
||||
#endif // ROCKSDB_ZSTD_DDICT
|
||||
}
|
||||
|
||||
UncompressionDict(UncompressionDict&& rhs)
|
||||
: dict_(std::move(rhs.dict_)),
|
||||
allocation_(std::move(rhs.allocation_)),
|
||||
slice_(std::move(rhs.slice_))
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
,
|
||||
@ -288,6 +297,7 @@ struct UncompressionDict : public Cleanable {
|
||||
}
|
||||
|
||||
dict_ = std::move(rhs.dict_);
|
||||
allocation_ = std::move(rhs.allocation_);
|
||||
slice_ = std::move(rhs.slice_);
|
||||
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
@ -298,6 +308,12 @@ struct UncompressionDict : public Cleanable {
|
||||
return *this;
|
||||
}
|
||||
|
||||
// The object is self-contained if the string constructor is used, or the
|
||||
// Slice constructor is invoked with a non-null allocation. Otherwise, it
|
||||
// is the caller's responsibility to ensure that the underlying storage
|
||||
// outlives this object.
|
||||
bool own_bytes() const { return !dict_.empty() || allocation_; }
|
||||
|
||||
const Slice& GetRawDict() const { return slice_; }
|
||||
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
@ -310,12 +326,19 @@ struct UncompressionDict : public Cleanable {
|
||||
}
|
||||
|
||||
size_t ApproximateMemoryUsage() const {
|
||||
size_t usage = 0;
|
||||
usage += sizeof(struct UncompressionDict);
|
||||
size_t usage = sizeof(struct UncompressionDict);
|
||||
usage += dict_.size();
|
||||
if (allocation_) {
|
||||
auto allocator = allocation_.get_deleter().allocator;
|
||||
if (allocator) {
|
||||
usage += allocator->UsableSize(allocation_.get(), slice_.size());
|
||||
} else {
|
||||
usage += slice_.size();
|
||||
}
|
||||
}
|
||||
#ifdef ROCKSDB_ZSTD_DDICT
|
||||
usage += ZSTD_sizeof_DDict(zstd_ddict_);
|
||||
#endif // ROCKSDB_ZSTD_DDICT
|
||||
usage += dict_.size();
|
||||
return usage;
|
||||
}
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user