2014-01-27 21:58:46 -08:00
|
|
|
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
|
|
// found in the LICENSE file. See the AUTHORS file for names of contributors.
|
2013-11-19 16:29:42 -08:00
|
|
|
#pragma once
|
|
|
|
|
2015-07-01 16:13:49 -07:00
|
|
|
#include <stdint.h>
|
2013-11-19 16:29:42 -08:00
|
|
|
#include <string>
|
2014-02-12 13:14:59 -08:00
|
|
|
#include <map>
|
2013-11-19 16:29:42 -08:00
|
|
|
#include "rocksdb/status.h"
|
A new call back to TablePropertiesCollector to allow users know the entry is add, delete or merge
Summary:
Currently users have no idea a key is add, delete or merge from TablePropertiesCollector call back. Add a new function to add it.
Also refactor the codes so that
(1) make table property collector and internal table property collector two separate data structures with the later one now exposed
(2) table builders only receive internal table properties
Test Plan: Add cases in table_properties_collector_test to cover both of old and new ways of using TablePropertiesCollector.
Reviewers: yhchiang, igor.sugak, rven, igor
Reviewed By: rven, igor
Subscribers: meyering, yoshinorim, maykov, leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D35373
2015-04-06 10:04:30 -07:00
|
|
|
#include "rocksdb/types.h"
|
2013-11-19 16:29:42 -08:00
|
|
|
|
|
|
|
namespace rocksdb {
|
|
|
|
|
2014-01-27 21:58:46 -08:00
|
|
|
// -- Table Properties
|
2013-12-05 13:09:13 -08:00
|
|
|
// Other than basic table properties, each table may also have the user
|
|
|
|
// collected properties.
|
|
|
|
// The value of the user-collected properties are encoded as raw bytes --
|
|
|
|
// users have to interprete these values by themselves.
|
2014-02-12 13:14:59 -08:00
|
|
|
// Note: To do prefix seek/scan in `UserCollectedProperties`, you can do
|
|
|
|
// something similar to:
|
|
|
|
//
|
|
|
|
// UserCollectedProperties props = ...;
|
|
|
|
// for (auto pos = props.lower_bound(prefix);
|
|
|
|
// pos != props.end() && pos->first.compare(0, prefix.size(), prefix) == 0;
|
|
|
|
// ++pos) {
|
|
|
|
// ...
|
|
|
|
// }
|
2015-07-02 17:23:41 -07:00
|
|
|
typedef std::map<std::string, std::string> UserCollectedProperties;
|
2013-12-05 13:09:13 -08:00
|
|
|
|
2013-11-19 16:29:42 -08:00
|
|
|
// TableProperties contains a bunch of read-only properties of its associated
|
|
|
|
// table.
|
|
|
|
struct TableProperties {
|
|
|
|
public:
|
|
|
|
// the total size of all data blocks.
|
|
|
|
uint64_t data_size = 0;
|
|
|
|
// the size of index block.
|
|
|
|
uint64_t index_size = 0;
|
|
|
|
// the size of filter block.
|
|
|
|
uint64_t filter_size = 0;
|
|
|
|
// total raw key size
|
|
|
|
uint64_t raw_key_size = 0;
|
|
|
|
// total raw value size
|
|
|
|
uint64_t raw_value_size = 0;
|
|
|
|
// the number of blocks in this table
|
|
|
|
uint64_t num_data_blocks = 0;
|
|
|
|
// the number of entries in this table
|
|
|
|
uint64_t num_entries = 0;
|
2013-12-20 09:35:24 -08:00
|
|
|
// format version, reserved for backward compatibility
|
|
|
|
uint64_t format_version = 0;
|
|
|
|
// If 0, key is variable length. Otherwise number of bytes for each key.
|
|
|
|
uint64_t fixed_key_len = 0;
|
2013-11-19 16:29:42 -08:00
|
|
|
|
|
|
|
// The name of the filter policy used in this table.
|
|
|
|
// If no filter policy is used, `filter_policy_name` will be an empty string.
|
|
|
|
std::string filter_policy_name;
|
|
|
|
|
|
|
|
// user collected properties
|
|
|
|
UserCollectedProperties user_collected_properties;
|
|
|
|
|
|
|
|
// convert this object to a human readable form
|
|
|
|
// @prop_delim: delimiter for each property.
|
2014-01-27 21:58:46 -08:00
|
|
|
std::string ToString(const std::string& prop_delim = "; ",
|
|
|
|
const std::string& kv_delim = "=") const;
|
2015-08-25 12:03:54 -07:00
|
|
|
|
|
|
|
// Aggregate the numerical member variables of the specified
|
|
|
|
// TableProperties.
|
|
|
|
void Add(const TableProperties& tp);
|
2013-11-19 16:29:42 -08:00
|
|
|
};
|
|
|
|
|
2013-12-05 13:09:13 -08:00
|
|
|
// table properties' human-readable names in the property block.
|
|
|
|
struct TablePropertiesNames {
|
|
|
|
static const std::string kDataSize;
|
|
|
|
static const std::string kIndexSize;
|
|
|
|
static const std::string kFilterSize;
|
|
|
|
static const std::string kRawKeySize;
|
|
|
|
static const std::string kRawValueSize;
|
|
|
|
static const std::string kNumDataBlocks;
|
|
|
|
static const std::string kNumEntries;
|
2013-12-20 09:35:24 -08:00
|
|
|
static const std::string kFormatVersion;
|
|
|
|
static const std::string kFixedKeyLen;
|
2013-12-05 13:09:13 -08:00
|
|
|
static const std::string kFilterPolicy;
|
|
|
|
};
|
|
|
|
|
2013-12-05 16:51:26 -08:00
|
|
|
extern const std::string kPropertiesBlock;
|
2013-12-05 13:09:13 -08:00
|
|
|
|
A new call back to TablePropertiesCollector to allow users know the entry is add, delete or merge
Summary:
Currently users have no idea a key is add, delete or merge from TablePropertiesCollector call back. Add a new function to add it.
Also refactor the codes so that
(1) make table property collector and internal table property collector two separate data structures with the later one now exposed
(2) table builders only receive internal table properties
Test Plan: Add cases in table_properties_collector_test to cover both of old and new ways of using TablePropertiesCollector.
Reviewers: yhchiang, igor.sugak, rven, igor
Reviewed By: rven, igor
Subscribers: meyering, yoshinorim, maykov, leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D35373
2015-04-06 10:04:30 -07:00
|
|
|
enum EntryType {
|
|
|
|
kEntryPut,
|
|
|
|
kEntryDelete,
|
|
|
|
kEntryMerge,
|
|
|
|
kEntryOther,
|
|
|
|
};
|
|
|
|
|
2013-11-19 16:29:42 -08:00
|
|
|
// `TablePropertiesCollector` provides the mechanism for users to collect
|
2015-08-05 07:33:27 -07:00
|
|
|
// their own properties that they are interested in. This class is essentially
|
|
|
|
// a collection of callback functions that will be invoked during table
|
|
|
|
// building. It is construced with TablePropertiesCollectorFactory. The methods
|
|
|
|
// don't need to be thread-safe, as we will create exactly one
|
TablePropertiesCollectorFactory
Summary:
This diff addresses task #4296714 and rethinks how users provide us with TablePropertiesCollectors as part of Options.
Here's description of task #4296714:
I'm debugging #4295529 and noticed that our count of user properties kDeletedKeys is wrong. We're sharing one single InternalKeyPropertiesCollector with all Table Builders. In LOG Files, we're outputting number of kDeletedKeys as connected with a single table, while it's actually the total count of deleted keys since creation of the DB.
For example, this table has 3155 entries and 1391828 deleted keys.
The problem with current approach that we call methods on a single TablePropertiesCollector for all the tables we create. Even worse, we could do it from multiple threads at the same time and TablePropertiesCollector has no way of knowing which table we're calling it for.
Good part: Looks like nobody inside Facebook is using Options::table_properties_collectors. This means we should be able to painfully change the API.
In this change, I introduce TablePropertiesCollectorFactory. For every table we create, we call `CreateTablePropertiesCollector`, which creates a TablePropertiesCollector for a single table. We then use it sequentially from a single thread, which means it doesn't have to be thread-safe.
Test Plan:
Added a test in table_properties_collector_test that fails on master (build two tables, assert that kDeletedKeys count is correct for the second one).
Also, all other tests
Reviewers: sdong, dhruba, haobo, kailiu
Reviewed By: kailiu
CC: leveldb
Differential Revision: https://reviews.facebook.net/D18579
2014-05-13 12:30:55 -07:00
|
|
|
// TablePropertiesCollector object per table and then call it sequentially
|
2013-11-19 16:29:42 -08:00
|
|
|
class TablePropertiesCollector {
|
|
|
|
public:
|
2014-01-27 21:58:46 -08:00
|
|
|
virtual ~TablePropertiesCollector() {}
|
2013-11-19 16:29:42 -08:00
|
|
|
|
A new call back to TablePropertiesCollector to allow users know the entry is add, delete or merge
Summary:
Currently users have no idea a key is add, delete or merge from TablePropertiesCollector call back. Add a new function to add it.
Also refactor the codes so that
(1) make table property collector and internal table property collector two separate data structures with the later one now exposed
(2) table builders only receive internal table properties
Test Plan: Add cases in table_properties_collector_test to cover both of old and new ways of using TablePropertiesCollector.
Reviewers: yhchiang, igor.sugak, rven, igor
Reviewed By: rven, igor
Subscribers: meyering, yoshinorim, maykov, leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D35373
2015-04-06 10:04:30 -07:00
|
|
|
// DEPRECATE User defined collector should implement AddUserKey(), though
|
|
|
|
// this old function still works for backward compatible reason.
|
2013-11-19 16:29:42 -08:00
|
|
|
// Add() will be called when a new key/value pair is inserted into the table.
|
A new call back to TablePropertiesCollector to allow users know the entry is add, delete or merge
Summary:
Currently users have no idea a key is add, delete or merge from TablePropertiesCollector call back. Add a new function to add it.
Also refactor the codes so that
(1) make table property collector and internal table property collector two separate data structures with the later one now exposed
(2) table builders only receive internal table properties
Test Plan: Add cases in table_properties_collector_test to cover both of old and new ways of using TablePropertiesCollector.
Reviewers: yhchiang, igor.sugak, rven, igor
Reviewed By: rven, igor
Subscribers: meyering, yoshinorim, maykov, leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D35373
2015-04-06 10:04:30 -07:00
|
|
|
// @params key the user key that is inserted into the table.
|
|
|
|
// @params value the value that is inserted into the table.
|
|
|
|
virtual Status Add(const Slice& key, const Slice& value) {
|
|
|
|
return Status::InvalidArgument(
|
|
|
|
"TablePropertiesCollector::Add() deprecated.");
|
|
|
|
}
|
|
|
|
|
|
|
|
// AddUserKey() will be called when a new key/value pair is inserted into the
|
|
|
|
// table.
|
|
|
|
// @params key the user key that is inserted into the table.
|
|
|
|
// @params value the value that is inserted into the table.
|
|
|
|
// @params file_size file size up to now
|
|
|
|
virtual Status AddUserKey(const Slice& key, const Slice& value,
|
|
|
|
EntryType type, SequenceNumber seq,
|
|
|
|
uint64_t file_size) {
|
2015-08-05 07:33:27 -07:00
|
|
|
// For backwards-compatibility.
|
A new call back to TablePropertiesCollector to allow users know the entry is add, delete or merge
Summary:
Currently users have no idea a key is add, delete or merge from TablePropertiesCollector call back. Add a new function to add it.
Also refactor the codes so that
(1) make table property collector and internal table property collector two separate data structures with the later one now exposed
(2) table builders only receive internal table properties
Test Plan: Add cases in table_properties_collector_test to cover both of old and new ways of using TablePropertiesCollector.
Reviewers: yhchiang, igor.sugak, rven, igor
Reviewed By: rven, igor
Subscribers: meyering, yoshinorim, maykov, leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D35373
2015-04-06 10:04:30 -07:00
|
|
|
return Add(key, value);
|
|
|
|
}
|
2013-11-19 16:29:42 -08:00
|
|
|
|
|
|
|
// Finish() will be called when a table has already been built and is ready
|
|
|
|
// for writing the properties block.
|
|
|
|
// @params properties User will add their collected statistics to
|
|
|
|
// `properties`.
|
2013-12-05 13:09:13 -08:00
|
|
|
virtual Status Finish(UserCollectedProperties* properties) = 0;
|
2013-11-19 16:29:42 -08:00
|
|
|
|
|
|
|
// Return the human-readable properties, where the key is property name and
|
|
|
|
// the value is the human-readable form of value.
|
2013-12-05 13:09:13 -08:00
|
|
|
virtual UserCollectedProperties GetReadableProperties() const = 0;
|
TablePropertiesCollectorFactory
Summary:
This diff addresses task #4296714 and rethinks how users provide us with TablePropertiesCollectors as part of Options.
Here's description of task #4296714:
I'm debugging #4295529 and noticed that our count of user properties kDeletedKeys is wrong. We're sharing one single InternalKeyPropertiesCollector with all Table Builders. In LOG Files, we're outputting number of kDeletedKeys as connected with a single table, while it's actually the total count of deleted keys since creation of the DB.
For example, this table has 3155 entries and 1391828 deleted keys.
The problem with current approach that we call methods on a single TablePropertiesCollector for all the tables we create. Even worse, we could do it from multiple threads at the same time and TablePropertiesCollector has no way of knowing which table we're calling it for.
Good part: Looks like nobody inside Facebook is using Options::table_properties_collectors. This means we should be able to painfully change the API.
In this change, I introduce TablePropertiesCollectorFactory. For every table we create, we call `CreateTablePropertiesCollector`, which creates a TablePropertiesCollector for a single table. We then use it sequentially from a single thread, which means it doesn't have to be thread-safe.
Test Plan:
Added a test in table_properties_collector_test that fails on master (build two tables, assert that kDeletedKeys count is correct for the second one).
Also, all other tests
Reviewers: sdong, dhruba, haobo, kailiu
Reviewed By: kailiu
CC: leveldb
Differential Revision: https://reviews.facebook.net/D18579
2014-05-13 12:30:55 -07:00
|
|
|
|
|
|
|
// The name of the properties collector can be used for debugging purpose.
|
|
|
|
virtual const char* Name() const = 0;
|
2015-06-04 12:03:40 -07:00
|
|
|
|
|
|
|
// EXPERIMENTAL Return whether the output file should be further compacted
|
|
|
|
virtual bool NeedCompact() const { return false; }
|
TablePropertiesCollectorFactory
Summary:
This diff addresses task #4296714 and rethinks how users provide us with TablePropertiesCollectors as part of Options.
Here's description of task #4296714:
I'm debugging #4295529 and noticed that our count of user properties kDeletedKeys is wrong. We're sharing one single InternalKeyPropertiesCollector with all Table Builders. In LOG Files, we're outputting number of kDeletedKeys as connected with a single table, while it's actually the total count of deleted keys since creation of the DB.
For example, this table has 3155 entries and 1391828 deleted keys.
The problem with current approach that we call methods on a single TablePropertiesCollector for all the tables we create. Even worse, we could do it from multiple threads at the same time and TablePropertiesCollector has no way of knowing which table we're calling it for.
Good part: Looks like nobody inside Facebook is using Options::table_properties_collectors. This means we should be able to painfully change the API.
In this change, I introduce TablePropertiesCollectorFactory. For every table we create, we call `CreateTablePropertiesCollector`, which creates a TablePropertiesCollector for a single table. We then use it sequentially from a single thread, which means it doesn't have to be thread-safe.
Test Plan:
Added a test in table_properties_collector_test that fails on master (build two tables, assert that kDeletedKeys count is correct for the second one).
Also, all other tests
Reviewers: sdong, dhruba, haobo, kailiu
Reviewed By: kailiu
CC: leveldb
Differential Revision: https://reviews.facebook.net/D18579
2014-05-13 12:30:55 -07:00
|
|
|
};
|
|
|
|
|
|
|
|
// Constructs TablePropertiesCollector. Internals create a new
|
|
|
|
// TablePropertiesCollector for each new table
|
|
|
|
class TablePropertiesCollectorFactory {
|
|
|
|
public:
|
|
|
|
virtual ~TablePropertiesCollectorFactory() {}
|
|
|
|
// has to be thread-safe
|
|
|
|
virtual TablePropertiesCollector* CreateTablePropertiesCollector() = 0;
|
|
|
|
|
|
|
|
// The name of the properties collector can be used for debugging purpose.
|
|
|
|
virtual const char* Name() const = 0;
|
2013-11-19 16:29:42 -08:00
|
|
|
};
|
|
|
|
|
|
|
|
// Extra properties
|
|
|
|
// Below is a list of non-basic properties that are collected by database
|
|
|
|
// itself. Especially some properties regarding to the internal keys (which
|
|
|
|
// is unknown to `table`).
|
2013-12-05 13:09:13 -08:00
|
|
|
extern uint64_t GetDeletedKeys(const UserCollectedProperties& props);
|
2013-11-19 16:29:42 -08:00
|
|
|
|
|
|
|
} // namespace rocksdb
|