2020-11-17 12:55:27 -08:00
|
|
|
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
|
|
|
// This source code is licensed under both the GPLv2 (found in the
|
|
|
|
// COPYING file in the root directory) and Apache 2.0 License
|
|
|
|
// (found in the LICENSE.Apache file in the root directory).
|
|
|
|
|
|
|
|
#include <algorithm>
|
|
|
|
#include <iostream>
|
2020-12-11 16:07:48 -08:00
|
|
|
#include <memory>
|
|
|
|
#include <string>
|
2020-11-17 12:55:27 -08:00
|
|
|
|
|
|
|
#include "proto/gen/db_operation.pb.h"
|
|
|
|
#include "rocksdb/file_system.h"
|
|
|
|
#include "rocksdb/sst_file_writer.h"
|
|
|
|
#include "src/libfuzzer/libfuzzer_macro.h"
|
2022-02-01 10:29:56 -08:00
|
|
|
#include "table/table_builder.h"
|
2020-12-11 16:07:48 -08:00
|
|
|
#include "table/table_reader.h"
|
|
|
|
#include "util.h"
|
|
|
|
|
2022-02-01 10:29:56 -08:00
|
|
|
using ROCKSDB_NAMESPACE::BytewiseComparator;
|
|
|
|
using ROCKSDB_NAMESPACE::Comparator;
|
|
|
|
using ROCKSDB_NAMESPACE::EnvOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::ExternalSstFileInfo;
|
|
|
|
using ROCKSDB_NAMESPACE::FileOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::FileSystem;
|
|
|
|
using ROCKSDB_NAMESPACE::ImmutableCFOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::ImmutableOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::InternalIterator;
|
|
|
|
using ROCKSDB_NAMESPACE::IOOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::kMaxSequenceNumber;
|
|
|
|
using ROCKSDB_NAMESPACE::Options;
|
|
|
|
using ROCKSDB_NAMESPACE::ParsedInternalKey;
|
|
|
|
using ROCKSDB_NAMESPACE::ParseInternalKey;
|
|
|
|
using ROCKSDB_NAMESPACE::RandomAccessFileReader;
|
|
|
|
using ROCKSDB_NAMESPACE::ReadOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::SstFileWriter;
|
|
|
|
using ROCKSDB_NAMESPACE::Status;
|
|
|
|
using ROCKSDB_NAMESPACE::TableReader;
|
|
|
|
using ROCKSDB_NAMESPACE::TableReaderCaller;
|
|
|
|
using ROCKSDB_NAMESPACE::TableReaderOptions;
|
|
|
|
using ROCKSDB_NAMESPACE::ValueType;
|
|
|
|
|
2020-11-17 12:55:27 -08:00
|
|
|
// Keys in SST file writer operations must be unique and in ascending order.
|
|
|
|
// For each DBOperation generated by the fuzzer, this function is called on
|
|
|
|
// it to deduplicate and sort the keys in the DBOperations.
|
|
|
|
protobuf_mutator::libfuzzer::PostProcessorRegistration<DBOperations> reg = {
|
|
|
|
[](DBOperations* input, unsigned int /* seed */) {
|
2020-12-11 16:07:48 -08:00
|
|
|
const Comparator* comparator = BytewiseComparator();
|
2020-11-17 12:55:27 -08:00
|
|
|
auto ops = input->mutable_operations();
|
2020-12-11 16:07:48 -08:00
|
|
|
|
|
|
|
// Make sure begin <= end for DELETE_RANGE.
|
|
|
|
for (DBOperation& op : *ops) {
|
|
|
|
if (op.type() == OpType::DELETE_RANGE) {
|
|
|
|
auto begin = op.key();
|
|
|
|
auto end = op.value();
|
|
|
|
if (comparator->Compare(begin, end) > 0) {
|
|
|
|
std::swap(begin, end);
|
|
|
|
op.set_key(begin);
|
|
|
|
op.set_value(end);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-17 12:55:27 -08:00
|
|
|
std::sort(ops->begin(), ops->end(),
|
|
|
|
[&comparator](const DBOperation& a, const DBOperation& b) {
|
|
|
|
return comparator->Compare(a.key(), b.key()) < 0;
|
|
|
|
});
|
|
|
|
|
|
|
|
auto last = std::unique(
|
|
|
|
ops->begin(), ops->end(),
|
|
|
|
[&comparator](const DBOperation& a, const DBOperation& b) {
|
|
|
|
return comparator->Compare(a.key(), b.key()) == 0;
|
|
|
|
});
|
|
|
|
ops->erase(last, ops->end());
|
|
|
|
}};
|
|
|
|
|
2020-12-11 16:07:48 -08:00
|
|
|
TableReader* NewTableReader(const std::string& sst_file_path,
|
|
|
|
const Options& options,
|
|
|
|
const EnvOptions& env_options,
|
|
|
|
const ImmutableCFOptions& cf_ioptions) {
|
|
|
|
// This code block is similar to SstFileReader::Open.
|
|
|
|
|
|
|
|
uint64_t file_size = 0;
|
|
|
|
std::unique_ptr<RandomAccessFileReader> file_reader;
|
|
|
|
std::unique_ptr<TableReader> table_reader;
|
2021-01-28 22:08:46 -08:00
|
|
|
const auto& fs = options.env->GetFileSystem();
|
|
|
|
FileOptions fopts(env_options);
|
2022-02-01 10:29:56 -08:00
|
|
|
Status s = options.env->GetFileSize(sst_file_path, &file_size);
|
2020-12-11 16:07:48 -08:00
|
|
|
if (s.ok()) {
|
2021-01-28 22:08:46 -08:00
|
|
|
s = RandomAccessFileReader::Create(fs, sst_file_path, fopts, &file_reader,
|
|
|
|
nullptr);
|
2020-11-17 12:55:27 -08:00
|
|
|
}
|
2020-12-11 16:07:48 -08:00
|
|
|
if (s.ok()) {
|
2022-02-01 10:29:56 -08:00
|
|
|
ImmutableOptions iopts(options, cf_ioptions);
|
|
|
|
TableReaderOptions t_opt(iopts, /*prefix_extractor=*/nullptr, env_options,
|
|
|
|
cf_ioptions.internal_comparator);
|
2020-12-11 16:07:48 -08:00
|
|
|
t_opt.largest_seqno = kMaxSequenceNumber;
|
|
|
|
s = options.table_factory->NewTableReader(t_opt, std::move(file_reader),
|
|
|
|
file_size, &table_reader,
|
|
|
|
/*prefetch=*/false);
|
|
|
|
}
|
|
|
|
if (!s.ok()) {
|
|
|
|
std::cerr << "Failed to create TableReader for " << sst_file_path << ": "
|
|
|
|
<< s.ToString() << std::endl;
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
return table_reader.release();
|
|
|
|
}
|
|
|
|
|
|
|
|
ValueType ToValueType(OpType op_type) {
|
|
|
|
switch (op_type) {
|
|
|
|
case OpType::PUT:
|
|
|
|
return ValueType::kTypeValue;
|
|
|
|
case OpType::MERGE:
|
|
|
|
return ValueType::kTypeMerge;
|
|
|
|
case OpType::DELETE:
|
|
|
|
return ValueType::kTypeDeletion;
|
|
|
|
case OpType::DELETE_RANGE:
|
|
|
|
return ValueType::kTypeRangeDeletion;
|
|
|
|
default:
|
|
|
|
std::cerr << "Unknown operation type " << static_cast<int>(op_type)
|
|
|
|
<< std::endl;
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
}
|
2020-11-17 12:55:27 -08:00
|
|
|
|
|
|
|
// Fuzzes DB operations as input, let SstFileWriter generate a SST file
|
2020-12-11 16:07:48 -08:00
|
|
|
// according to the operations, then let TableReader read and check all the
|
|
|
|
// key-value pairs from the generated SST file.
|
2020-11-17 12:55:27 -08:00
|
|
|
DEFINE_PROTO_FUZZER(DBOperations& input) {
|
|
|
|
if (input.operations().empty()) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string sstfile;
|
|
|
|
{
|
2020-12-11 16:07:48 -08:00
|
|
|
auto fs = FileSystem::Default();
|
2020-11-17 12:55:27 -08:00
|
|
|
std::string dir;
|
2020-12-11 16:07:48 -08:00
|
|
|
IOOptions opt;
|
|
|
|
CHECK_OK(fs->GetTestDirectory(opt, &dir, nullptr));
|
2020-11-17 12:55:27 -08:00
|
|
|
sstfile = dir + "/SstFileWriterFuzzer.sst";
|
|
|
|
}
|
|
|
|
|
2020-12-11 16:07:48 -08:00
|
|
|
Options options;
|
|
|
|
EnvOptions env_options(options);
|
|
|
|
ImmutableCFOptions cf_ioptions(options);
|
|
|
|
|
2020-11-17 12:55:27 -08:00
|
|
|
// Generate sst file.
|
2020-12-11 16:07:48 -08:00
|
|
|
SstFileWriter writer(env_options, options);
|
|
|
|
CHECK_OK(writer.Open(sstfile));
|
2020-11-17 12:55:27 -08:00
|
|
|
for (const DBOperation& op : input.operations()) {
|
|
|
|
switch (op.type()) {
|
2020-12-11 16:07:48 -08:00
|
|
|
case OpType::PUT: {
|
|
|
|
CHECK_OK(writer.Put(op.key(), op.value()));
|
2020-11-17 12:55:27 -08:00
|
|
|
break;
|
2020-12-11 16:07:48 -08:00
|
|
|
}
|
|
|
|
case OpType::MERGE: {
|
|
|
|
CHECK_OK(writer.Merge(op.key(), op.value()));
|
2020-11-17 12:55:27 -08:00
|
|
|
break;
|
2020-12-11 16:07:48 -08:00
|
|
|
}
|
|
|
|
case OpType::DELETE: {
|
|
|
|
CHECK_OK(writer.Delete(op.key()));
|
2020-11-17 12:55:27 -08:00
|
|
|
break;
|
2020-12-11 16:07:48 -08:00
|
|
|
}
|
|
|
|
case OpType::DELETE_RANGE: {
|
|
|
|
CHECK_OK(writer.DeleteRange(op.key(), op.value()));
|
2020-11-17 12:55:27 -08:00
|
|
|
break;
|
2020-12-11 16:07:48 -08:00
|
|
|
}
|
|
|
|
default: {
|
|
|
|
std::cerr << "Unsupported operation" << static_cast<int>(op.type())
|
|
|
|
<< std::endl;
|
|
|
|
abort();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
ExternalSstFileInfo info;
|
|
|
|
CHECK_OK(writer.Finish(&info));
|
|
|
|
|
|
|
|
// Iterate and verify key-value pairs.
|
|
|
|
std::unique_ptr<TableReader> table_reader(
|
2022-02-01 10:29:56 -08:00
|
|
|
::NewTableReader(sstfile, options, env_options, cf_ioptions));
|
2020-12-11 16:07:48 -08:00
|
|
|
ReadOptions roptions;
|
|
|
|
CHECK_OK(table_reader->VerifyChecksum(roptions,
|
|
|
|
TableReaderCaller::kUncategorized));
|
|
|
|
std::unique_ptr<InternalIterator> it(
|
|
|
|
table_reader->NewIterator(roptions, /*prefix_extractor=*/nullptr,
|
|
|
|
/*arena=*/nullptr, /*skip_filters=*/true,
|
|
|
|
TableReaderCaller::kUncategorized));
|
|
|
|
it->SeekToFirst();
|
|
|
|
for (const DBOperation& op : input.operations()) {
|
|
|
|
if (op.type() == OpType::DELETE_RANGE) {
|
|
|
|
// InternalIterator cannot iterate over DELETE_RANGE entries.
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
CHECK_TRUE(it->Valid());
|
|
|
|
ParsedInternalKey ikey;
|
|
|
|
CHECK_OK(ParseInternalKey(it->key(), &ikey, /*log_err_key=*/true));
|
|
|
|
CHECK_EQ(ikey.user_key.ToString(), op.key());
|
|
|
|
CHECK_EQ(ikey.sequence, 0);
|
|
|
|
CHECK_EQ(ikey.type, ToValueType(op.type()));
|
|
|
|
if (op.type() != OpType::DELETE) {
|
|
|
|
CHECK_EQ(op.value(), it->value().ToString());
|
2020-11-17 12:55:27 -08:00
|
|
|
}
|
2020-12-11 16:07:48 -08:00
|
|
|
it->Next();
|
2020-11-17 12:55:27 -08:00
|
|
|
}
|
2020-12-11 16:07:48 -08:00
|
|
|
CHECK_TRUE(!it->Valid());
|
2020-11-17 12:55:27 -08:00
|
|
|
|
|
|
|
// Delete sst file.
|
|
|
|
remove(sstfile.c_str());
|
|
|
|
}
|