22655a398b
Summary: The patch adds a class called `BlobFileReader` that can be used to retrieve blobs using the information available in blob references (e.g. blob file number, offset, and size). This will come in handy when implementing blob support for `Get`, `MultiGet`, and iterators, and also for compaction/garbage collection. When a `BlobFileReader` object is created (using the factory method `Create`), it first checks whether the specified file is potentially valid by comparing the file size against the combined size of the blob file header and footer (files smaller than the threshold are considered malformed). Then, it opens the file, and reads and verifies the header and footer. The verification involves magic number/CRC checks as well as checking for unexpected header/footer fields, e.g. incorrect column family ID or TTL blob files. Blobs can be retrieved using `GetBlob`. `GetBlob` validates the offset and compression type passed by the caller (because of the presence of the header and footer, the specified offset cannot be too close to the start/end of the file; also, the compression type has to match the one in the blob file header), and retrieves and potentially verifies and uncompresses the blob. In particular, when `ReadOptions::verify_checksums` is set, `BlobFileReader` reads the blob record header as well (as opposed to just the blob itself) and verifies the key/value size, the key itself, as well as the CRC of the blob record header and the key/value pair. In addition, the patch exposes the compression type from `BlobIndex` (both using an accessor and via `DebugString`), and adds a blob file read latency histogram to `InternalStats` that can be used with `BlobFileReader`. Pull Request resolved: https://github.com/facebook/rocksdb/pull/7461 Test Plan: `make check` Reviewed By: riversand963 Differential Revision: D23999219 Pulled By: ltamasi fbshipit-source-id: deb6b1160d251258b308d5156e2ec063c3e12e5e
185 lines
5.6 KiB
C++
185 lines
5.6 KiB
C++
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
|
// This source code is licensed under both the GPLv2 (found in the
|
|
// COPYING file in the root directory) and Apache 2.0 License
|
|
// (found in the LICENSE.Apache file in the root directory).
|
|
#pragma once
|
|
|
|
#include <sstream>
|
|
#include <string>
|
|
|
|
#include "rocksdb/compression_type.h"
|
|
#include "util/coding.h"
|
|
#include "util/compression.h"
|
|
#include "util/string_util.h"
|
|
|
|
namespace ROCKSDB_NAMESPACE {
|
|
|
|
// BlobIndex is a pointer to the blob and metadata of the blob. The index is
|
|
// stored in base DB as ValueType::kTypeBlobIndex.
|
|
// There are three types of blob index:
|
|
//
|
|
// kInlinedTTL:
|
|
// +------+------------+---------------+
|
|
// | type | expiration | value |
|
|
// +------+------------+---------------+
|
|
// | char | varint64 | variable size |
|
|
// +------+------------+---------------+
|
|
//
|
|
// kBlob:
|
|
// +------+-------------+----------+----------+-------------+
|
|
// | type | file number | offset | size | compression |
|
|
// +------+-------------+----------+----------+-------------+
|
|
// | char | varint64 | varint64 | varint64 | char |
|
|
// +------+-------------+----------+----------+-------------+
|
|
//
|
|
// kBlobTTL:
|
|
// +------+------------+-------------+----------+----------+-------------+
|
|
// | type | expiration | file number | offset | size | compression |
|
|
// +------+------------+-------------+----------+----------+-------------+
|
|
// | char | varint64 | varint64 | varint64 | varint64 | char |
|
|
// +------+------------+-------------+----------+----------+-------------+
|
|
//
|
|
// There isn't a kInlined (without TTL) type since we can store it as a plain
|
|
// value (i.e. ValueType::kTypeValue).
|
|
class BlobIndex {
|
|
public:
|
|
enum class Type : unsigned char {
|
|
kInlinedTTL = 0,
|
|
kBlob = 1,
|
|
kBlobTTL = 2,
|
|
kUnknown = 3,
|
|
};
|
|
|
|
BlobIndex() : type_(Type::kUnknown) {}
|
|
|
|
bool IsInlined() const { return type_ == Type::kInlinedTTL; }
|
|
|
|
bool HasTTL() const {
|
|
return type_ == Type::kInlinedTTL || type_ == Type::kBlobTTL;
|
|
}
|
|
|
|
uint64_t expiration() const {
|
|
assert(HasTTL());
|
|
return expiration_;
|
|
}
|
|
|
|
const Slice& value() const {
|
|
assert(IsInlined());
|
|
return value_;
|
|
}
|
|
|
|
uint64_t file_number() const {
|
|
assert(!IsInlined());
|
|
return file_number_;
|
|
}
|
|
|
|
uint64_t offset() const {
|
|
assert(!IsInlined());
|
|
return offset_;
|
|
}
|
|
|
|
uint64_t size() const {
|
|
assert(!IsInlined());
|
|
return size_;
|
|
}
|
|
|
|
CompressionType compression() const {
|
|
assert(!IsInlined());
|
|
return compression_;
|
|
}
|
|
|
|
Status DecodeFrom(Slice slice) {
|
|
static const std::string kErrorMessage = "Error while decoding blob index";
|
|
assert(slice.size() > 0);
|
|
type_ = static_cast<Type>(*slice.data());
|
|
if (type_ >= Type::kUnknown) {
|
|
return Status::Corruption(
|
|
kErrorMessage,
|
|
"Unknown blob index type: " + ToString(static_cast<char>(type_)));
|
|
}
|
|
slice = Slice(slice.data() + 1, slice.size() - 1);
|
|
if (HasTTL()) {
|
|
if (!GetVarint64(&slice, &expiration_)) {
|
|
return Status::Corruption(kErrorMessage, "Corrupted expiration");
|
|
}
|
|
}
|
|
if (IsInlined()) {
|
|
value_ = slice;
|
|
} else {
|
|
if (GetVarint64(&slice, &file_number_) && GetVarint64(&slice, &offset_) &&
|
|
GetVarint64(&slice, &size_) && slice.size() == 1) {
|
|
compression_ = static_cast<CompressionType>(*slice.data());
|
|
} else {
|
|
return Status::Corruption(kErrorMessage, "Corrupted blob offset");
|
|
}
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
std::string DebugString(bool output_hex) const {
|
|
std::ostringstream oss;
|
|
|
|
if (IsInlined()) {
|
|
oss << "[inlined blob] value:" << value_.ToString(output_hex);
|
|
} else {
|
|
oss << "[blob ref] file:" << file_number_ << " offset:" << offset_
|
|
<< " size:" << size_
|
|
<< " compression: " << CompressionTypeToString(compression_);
|
|
}
|
|
|
|
if (HasTTL()) {
|
|
oss << " exp:" << expiration_;
|
|
}
|
|
|
|
return oss.str();
|
|
}
|
|
|
|
static void EncodeInlinedTTL(std::string* dst, uint64_t expiration,
|
|
const Slice& value) {
|
|
assert(dst != nullptr);
|
|
dst->clear();
|
|
dst->reserve(1 + kMaxVarint64Length + value.size());
|
|
dst->push_back(static_cast<char>(Type::kInlinedTTL));
|
|
PutVarint64(dst, expiration);
|
|
dst->append(value.data(), value.size());
|
|
}
|
|
|
|
static void EncodeBlob(std::string* dst, uint64_t file_number,
|
|
uint64_t offset, uint64_t size,
|
|
CompressionType compression) {
|
|
assert(dst != nullptr);
|
|
dst->clear();
|
|
dst->reserve(kMaxVarint64Length * 3 + 2);
|
|
dst->push_back(static_cast<char>(Type::kBlob));
|
|
PutVarint64(dst, file_number);
|
|
PutVarint64(dst, offset);
|
|
PutVarint64(dst, size);
|
|
dst->push_back(static_cast<char>(compression));
|
|
}
|
|
|
|
static void EncodeBlobTTL(std::string* dst, uint64_t expiration,
|
|
uint64_t file_number, uint64_t offset,
|
|
uint64_t size, CompressionType compression) {
|
|
assert(dst != nullptr);
|
|
dst->clear();
|
|
dst->reserve(kMaxVarint64Length * 4 + 2);
|
|
dst->push_back(static_cast<char>(Type::kBlobTTL));
|
|
PutVarint64(dst, expiration);
|
|
PutVarint64(dst, file_number);
|
|
PutVarint64(dst, offset);
|
|
PutVarint64(dst, size);
|
|
dst->push_back(static_cast<char>(compression));
|
|
}
|
|
|
|
private:
|
|
Type type_ = Type::kUnknown;
|
|
uint64_t expiration_ = 0;
|
|
Slice value_;
|
|
uint64_t file_number_ = 0;
|
|
uint64_t offset_ = 0;
|
|
uint64_t size_ = 0;
|
|
CompressionType compression_ = kNoCompression;
|
|
};
|
|
|
|
} // namespace ROCKSDB_NAMESPACE
|