2016-02-10 00:12:00 +01:00
|
|
|
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
2017-07-16 01:03:42 +02:00
|
|
|
// This source code is licensed under both the GPLv2 (found in the
|
|
|
|
// COPYING file in the root directory) and Apache 2.0 License
|
|
|
|
// (found in the LICENSE.Apache file in the root directory).
|
2013-10-29 01:54:09 +01:00
|
|
|
//
|
|
|
|
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
|
|
// found in the LICENSE file. See the AUTHORS file for names of contributors.
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
#include <stdint.h>

#include <cstddef>
#include <memory>
#include <string>
#include <unordered_map>

#include "db/dbformat.h"
#include "options/options_helper.h"
#include "options/options_parser.h"
#include "rocksdb/flush_block_policy.h"
#include "rocksdb/table.h"
|
|
|
|
|
|
|
|
namespace rocksdb {
|
|
|
|
|
|
|
|
struct EnvOptions;
|
|
|
|
|
|
|
|
using std::unique_ptr;
|
|
|
|
class BlockBasedTableBuilder;
|
|
|
|
|
2018-07-20 23:31:27 +02:00
|
|
|
// A class used to track actual bytes written from the tail in the recent SST
|
|
|
|
// file opens, and provide a suggestion for following open.
|
|
|
|
class TailPrefetchStats {
|
|
|
|
public:
|
|
|
|
void RecordEffectiveSize(size_t len);
|
|
|
|
// 0 indicates no information to determine.
|
|
|
|
size_t GetSuggestedPrefetchSize();
|
|
|
|
|
|
|
|
private:
|
|
|
|
const static size_t kNumTracked = 32;
|
|
|
|
size_t records_[kNumTracked];
|
|
|
|
port::Mutex mutex_;
|
|
|
|
size_t next_ = 0;
|
|
|
|
size_t num_records_ = 0;
|
|
|
|
};
|
|
|
|
|
2014-01-28 06:58:46 +01:00
|
|
|
class BlockBasedTableFactory : public TableFactory {
|
2014-01-24 19:57:15 +01:00
|
|
|
public:
|
2014-01-28 06:58:46 +01:00
|
|
|
explicit BlockBasedTableFactory(
|
2014-03-01 01:39:27 +01:00
|
|
|
const BlockBasedTableOptions& table_options = BlockBasedTableOptions());
|
2013-11-21 03:42:12 +01:00
|
|
|
|
2014-01-24 19:57:15 +01:00
|
|
|
~BlockBasedTableFactory() {}
|
2013-11-20 07:00:48 +01:00
|
|
|
|
2017-07-29 01:23:50 +02:00
|
|
|
const char* Name() const override { return kName.c_str(); }
|
2013-11-20 07:00:48 +01:00
|
|
|
|
2016-07-20 20:23:31 +02:00
|
|
|
Status NewTableReader(
|
|
|
|
const TableReaderOptions& table_reader_options,
|
2018-11-09 20:17:34 +01:00
|
|
|
std::unique_ptr<RandomAccessFileReader>&& file, uint64_t file_size,
|
|
|
|
std::unique_ptr<TableReader>* table_reader,
|
2016-07-20 20:23:31 +02:00
|
|
|
bool prefetch_index_and_filter_in_cache = true) const override;
|
2013-10-29 01:54:09 +01:00
|
|
|
|
2014-01-27 22:53:22 +01:00
|
|
|
TableBuilder* NewTableBuilder(
|
A new call back to TablePropertiesCollector to allow users know the entry is add, delete or merge
Summary:
Currently users have no idea a key is add, delete or merge from TablePropertiesCollector call back. Add a new function to add it.
Also refactor the codes so that
(1) make table property collector and internal table property collector two separate data structures with the later one now exposed
(2) table builders only receive internal table properties
Test Plan: Add cases in table_properties_collector_test to cover both of old and new ways of using TablePropertiesCollector.
Reviewers: yhchiang, igor.sugak, rven, igor
Reviewed By: rven, igor
Subscribers: meyering, yoshinorim, maykov, leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D35373
2015-04-06 19:04:30 +02:00
|
|
|
const TableBuilderOptions& table_builder_options,
|
2015-10-09 01:57:35 +02:00
|
|
|
uint32_t column_family_id, WritableFileWriter* file) const override;
|
2013-11-20 07:00:48 +01:00
|
|
|
|
2014-08-21 00:53:39 +02:00
|
|
|
// Sanitizes the specified DB Options.
|
2014-10-18 06:18:36 +02:00
|
|
|
Status SanitizeOptions(const DBOptions& db_opts,
|
|
|
|
const ColumnFamilyOptions& cf_opts) const override;
|
2014-08-21 00:53:39 +02:00
|
|
|
|
2014-08-25 23:24:09 +02:00
|
|
|
std::string GetPrintableTableOptions() const override;
|
|
|
|
|
2017-07-29 01:23:50 +02:00
|
|
|
Status GetOptionString(std::string* opt_string,
|
|
|
|
const std::string& delimiter) const override;
|
|
|
|
|
2015-10-30 23:58:46 +01:00
|
|
|
const BlockBasedTableOptions& table_options() const;
|
2014-11-21 04:24:39 +01:00
|
|
|
|
Add OptionsUtil::LoadOptionsFromFile() API
Summary:
This patch adds OptionsUtil::LoadOptionsFromFile() and
OptionsUtil::LoadLatestOptionsFromDB(), which allow developers
to construct DBOptions and ColumnFamilyOptions from a RocksDB
options file. Note that most pointer-typed options such as
merge_operator will not be constructed.
With this API, developers no longer need to remember all the
options in order to reopen an existing rocksdb instance like
the following:
DBOptions db_options;
std::vector<std::string> cf_names;
std::vector<ColumnFamilyOptions> cf_opts;
// Load primitive-typed options from an existing DB
OptionsUtil::LoadLatestOptionsFromDB(
dbname, &db_options, &cf_names, &cf_opts);
// Initialize necessary pointer-typed options
cf_opts[0].merge_operator.reset(new MyMergeOperator());
...
// Construct the vector of ColumnFamilyDescriptor
std::vector<ColumnFamilyDescriptor> cf_descs;
for (size_t i = 0; i < cf_opts.size(); ++i) {
cf_descs.emplace_back(cf_names[i], cf_opts[i]);
}
// Open the DB
DB* db = nullptr;
std::vector<ColumnFamilyHandle*> cf_handles;
auto s = DB::Open(db_options, dbname, cf_descs,
&handles, &db);
Test Plan:
Augment existing tests in column_family_test
options_test
db_test
Reviewers: igor, IslamAbdelRahman, sdong, anthony
Reviewed By: anthony
Subscribers: dhruba, leveldb
Differential Revision: https://reviews.facebook.net/D49095
2015-11-12 15:52:43 +01:00
|
|
|
void* GetOptions() override { return &table_options_; }
|
|
|
|
|
2017-07-13 01:49:56 +02:00
|
|
|
bool IsDeleteRangeSupported() const override { return true; }
|
|
|
|
|
2017-07-29 01:23:50 +02:00
|
|
|
static const std::string kName;
|
|
|
|
|
2013-11-20 07:00:48 +01:00
|
|
|
private:
|
2014-01-24 19:57:15 +01:00
|
|
|
BlockBasedTableOptions table_options_;
|
2018-07-20 23:31:27 +02:00
|
|
|
mutable TailPrefetchStats tail_prefetch_stats_;
|
2013-10-29 01:54:09 +01:00
|
|
|
};
|
|
|
|
|
2014-05-15 23:09:03 +02:00
|
|
|
// String constants that are only declared here; their values are defined out
// of line.
//
// NOTE(review): judging by the names, these two identify the hash-index
// prefixes block and its metadata block -- confirm against the definitions.
extern const std::string kHashIndexPrefixesBlock;
extern const std::string kHashIndexPrefixesMetadataBlock;

// NOTE(review): presumably the string spellings used for boolean property
// values -- confirm against the definitions.
extern const std::string kPropTrue;
extern const std::string kPropFalse;
|
2014-05-15 23:09:03 +02:00
|
|
|
|
2017-07-29 01:23:50 +02:00
|
|
|
#ifndef ROCKSDB_LITE
|
|
|
|
// Declaration only; the function is defined out of line.
// NOTE(review): judging by the parameter names, this checks `file_tf` against
// `base_tf` at the strictness given by `sanity_check_level` and reports the
// outcome through the returned Status -- confirm against the definition.
extern Status VerifyBlockBasedTableFactory(
    const BlockBasedTableFactory* base_tf,
    const BlockBasedTableFactory* file_tf,
    OptionsSanityCheckLevel sanity_check_level);
|
|
|
|
|
|
|
|
static std::unordered_map<std::string, OptionTypeInfo>
|
|
|
|
block_based_table_type_info = {
|
|
|
|
/* currently not supported
|
|
|
|
std::shared_ptr<Cache> block_cache = nullptr;
|
|
|
|
std::shared_ptr<Cache> block_cache_compressed = nullptr;
|
2018-11-13 22:46:15 +01:00
|
|
|
std::shared_ptr<MemoryAllocator> memory_allocator = nullptr;
|
2017-07-29 01:23:50 +02:00
|
|
|
*/
|
|
|
|
{"flush_block_policy_factory",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, flush_block_policy_factory),
|
|
|
|
OptionType::kFlushBlockPolicyFactory, OptionVerificationType::kByName,
|
|
|
|
false, 0}},
|
|
|
|
{"cache_index_and_filter_blocks",
|
|
|
|
{offsetof(struct BlockBasedTableOptions,
|
|
|
|
cache_index_and_filter_blocks),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"cache_index_and_filter_blocks_with_high_priority",
|
|
|
|
{offsetof(struct BlockBasedTableOptions,
|
|
|
|
cache_index_and_filter_blocks_with_high_priority),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"pin_l0_filter_and_index_blocks_in_cache",
|
|
|
|
{offsetof(struct BlockBasedTableOptions,
|
|
|
|
pin_l0_filter_and_index_blocks_in_cache),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"index_type",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, index_type),
|
|
|
|
OptionType::kBlockBasedTableIndexType,
|
|
|
|
OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"hash_index_allow_collision",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, hash_index_allow_collision),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
2018-07-28 00:35:41 +02:00
|
|
|
{"data_block_index_type",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, data_block_index_type),
|
|
|
|
OptionType::kBlockBasedTableDataBlockIndexType,
|
|
|
|
OptionVerificationType::kNormal, false, 0}},
|
2018-08-15 23:27:47 +02:00
|
|
|
{"data_block_hash_table_util_ratio",
|
|
|
|
{offsetof(struct BlockBasedTableOptions,
|
|
|
|
data_block_hash_table_util_ratio),
|
|
|
|
OptionType::kDouble, OptionVerificationType::kNormal, false, 0}},
|
2017-07-29 01:23:50 +02:00
|
|
|
{"checksum",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, checksum),
|
|
|
|
OptionType::kChecksumType, OptionVerificationType::kNormal, false,
|
|
|
|
0}},
|
|
|
|
{"no_block_cache",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, no_block_cache),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"block_size",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, block_size),
|
|
|
|
OptionType::kSizeT, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"block_size_deviation",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, block_size_deviation),
|
|
|
|
OptionType::kInt, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"block_restart_interval",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, block_restart_interval),
|
|
|
|
OptionType::kInt, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"index_block_restart_interval",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, index_block_restart_interval),
|
|
|
|
OptionType::kInt, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"index_per_partition",
|
|
|
|
{0, OptionType::kUInt64T, OptionVerificationType::kDeprecated, false,
|
|
|
|
0}},
|
|
|
|
{"metadata_block_size",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, metadata_block_size),
|
|
|
|
OptionType::kUInt64T, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"partition_filters",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, partition_filters),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"filter_policy",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, filter_policy),
|
|
|
|
OptionType::kFilterPolicy, OptionVerificationType::kByName, false,
|
|
|
|
0}},
|
|
|
|
{"whole_key_filtering",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, whole_key_filtering),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"skip_table_builder_flush",
|
|
|
|
{0, OptionType::kBoolean, OptionVerificationType::kDeprecated, false,
|
|
|
|
0}},
|
|
|
|
{"format_version",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, format_version),
|
|
|
|
OptionType::kUInt32T, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"verify_compression",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, verify_compression),
|
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"read_amp_bytes_per_bit",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, read_amp_bytes_per_bit),
|
2018-01-11 00:06:29 +01:00
|
|
|
OptionType::kSizeT, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"enable_index_compression",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, enable_index_compression),
|
2018-03-27 05:14:24 +02:00
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"block_align",
|
|
|
|
{offsetof(struct BlockBasedTableOptions, block_align),
|
2018-06-23 00:14:05 +02:00
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
|
|
|
|
{"pin_top_level_index_and_filter",
|
|
|
|
{offsetof(struct BlockBasedTableOptions,
|
|
|
|
pin_top_level_index_and_filter),
|
2018-01-11 00:06:29 +01:00
|
|
|
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}}};
|
2017-07-29 01:23:50 +02:00
|
|
|
#endif // !ROCKSDB_LITE
|
2013-10-29 01:54:09 +01:00
|
|
|
} // namespace rocksdb
|