2016-02-09 15:12:00 -08:00
|
|
|
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
2014-01-17 12:46:06 -08:00
|
|
|
// This source code is licensed under the BSD-style license found in the
|
|
|
|
// LICENSE file in the root directory of this source tree. An additional grant
|
|
|
|
// of patent rights can be found in the PATENTS file in the same directory.
|
2017-04-27 17:50:56 -07:00
|
|
|
// This source code is also licensed under the GPLv2 license found in the
|
|
|
|
// COPYING file in the root directory of this source tree.
|
2014-01-17 12:46:06 -08:00
|
|
|
//
|
|
|
|
#pragma once
|
|
|
|
#include "rocksdb/statistics.h"
|
|
|
|
|
2014-01-23 16:11:55 -08:00
|
|
|
#include <vector>
|
|
|
|
#include <atomic>
|
2014-07-28 12:05:36 -07:00
|
|
|
#include <string>
|
|
|
|
|
2017-04-05 19:02:00 -07:00
|
|
|
#include "monitoring/histogram.h"
|
2016-08-24 15:42:31 -07:00
|
|
|
#include "port/likely.h"
|
|
|
|
#include "port/port.h"
|
2017-05-23 10:29:14 -07:00
|
|
|
#include "util/core_local.h"
|
2014-07-28 12:05:36 -07:00
|
|
|
#include "util/mutexlock.h"
|
2017-05-23 10:29:14 -07:00
|
|
|
|
|
|
|
// ROCKSDB_FIELD_UNUSED is written after a data member declarator. When the
// compiler defines __clang__ it expands to the `unused` attribute; with any
// other compiler it expands to nothing.
// NOTE(review): presumably this silences clang's unused-private-field
// diagnostic for padding members -- confirm against the build flags.
#if defined(__clang__)
#define ROCKSDB_FIELD_UNUSED __attribute__((__unused__))
#else  // !defined(__clang__)
#define ROCKSDB_FIELD_UNUSED
#endif  // defined(__clang__)
|
2014-01-17 12:46:06 -08:00
|
|
|
|
|
|
|
namespace rocksdb {
|
|
|
|
|
2014-07-28 12:05:36 -07:00
|
|
|
enum TickersInternal : uint32_t {
|
|
|
|
INTERNAL_TICKER_ENUM_START = TICKER_ENUM_MAX,
|
|
|
|
INTERNAL_TICKER_ENUM_MAX
|
|
|
|
};
|
|
|
|
|
|
|
|
enum HistogramsInternal : uint32_t {
|
|
|
|
INTERNAL_HISTOGRAM_START = HISTOGRAM_ENUM_MAX,
|
|
|
|
INTERNAL_HISTOGRAM_ENUM_MAX
|
|
|
|
};
|
|
|
|
|
|
|
|
|
2014-01-17 12:46:06 -08:00
|
|
|
class StatisticsImpl : public Statistics {
|
|
|
|
public:
|
2014-07-28 12:05:36 -07:00
|
|
|
StatisticsImpl(std::shared_ptr<Statistics> stats,
|
|
|
|
bool enable_internal_stats);
|
2014-01-17 12:46:06 -08:00
|
|
|
virtual ~StatisticsImpl();
|
|
|
|
|
2014-07-28 12:05:36 -07:00
|
|
|
virtual uint64_t getTickerCount(uint32_t ticker_type) const override;
|
|
|
|
virtual void histogramData(uint32_t histogram_type,
|
|
|
|
HistogramData* const data) const override;
|
Add Statistics.getHistogramString() to print more detailed outputs of a histogram
Summary:
Provide a way for users to know more detailed ditribution of a histogram metrics. Example outputs:
Manually add statement
fprintf(stdout, "%s\n", dbstats->getHistogramString(SST_READ_MICROS).c_str());
Will print out something like:
Count: 989151 Average: 1.7659 StdDev: 1.52
Min: 0.0000 Median: 1.2071 Max: 860.0000
Percentiles: P50: 1.21 P75: 1.70 P99: 5.12 P99.9: 13.67 P99.99: 21.70
------------------------------------------------------
[ 0, 1 ) 390839 39.513% 39.513% ########
[ 1, 2 ) 500918 50.641% 90.154% ##########
[ 2, 3 ) 79358 8.023% 98.177% ##
[ 3, 4 ) 6297 0.637% 98.813%
[ 4, 5 ) 1712 0.173% 98.986%
[ 5, 6 ) 1134 0.115% 99.101%
[ 6, 7 ) 1222 0.124% 99.224%
[ 7, 8 ) 1529 0.155% 99.379%
[ 8, 9 ) 1264 0.128% 99.507%
[ 9, 10 ) 988 0.100% 99.607%
[ 10, 12 ) 1378 0.139% 99.746%
[ 12, 14 ) 1828 0.185% 99.931%
[ 14, 16 ) 410 0.041% 99.972%
[ 16, 18 ) 72 0.007% 99.980%
[ 18, 20 ) 67 0.007% 99.986%
[ 20, 25 ) 106 0.011% 99.997%
[ 25, 30 ) 24 0.002% 99.999%
[ 30, 35 ) 1 0.000% 100.000%
[ 250, 300 ) 2 0.000% 100.000%
[ 300, 350 ) 1 0.000% 100.000%
[ 800, 900 ) 1 0.000% 100.000%
Test Plan: Manually add a print in db_bench and make sure it prints out as expected. Will add some codes to cover the function
Subscribers: leveldb, dhruba
Differential Revision: https://reviews.facebook.net/D43611
2015-08-05 13:14:28 -07:00
|
|
|
std::string getHistogramString(uint32_t histogram_type) const override;
|
2014-07-28 12:05:36 -07:00
|
|
|
|
|
|
|
virtual void setTickerCount(uint32_t ticker_type, uint64_t count) override;
|
2016-10-11 10:54:11 -07:00
|
|
|
virtual uint64_t getAndResetTickerCount(uint32_t ticker_type) override;
|
2014-07-28 12:05:36 -07:00
|
|
|
virtual void recordTick(uint32_t ticker_type, uint64_t count) override;
|
|
|
|
virtual void measureTime(uint32_t histogram_type, uint64_t value) override;
|
|
|
|
|
2017-04-26 15:19:50 -07:00
|
|
|
virtual Status Reset() override;
|
2014-07-28 12:05:36 -07:00
|
|
|
virtual std::string ToString() const override;
|
|
|
|
virtual bool HistEnabledForType(uint32_t type) const override;
|
2014-01-17 12:46:06 -08:00
|
|
|
|
|
|
|
private:
|
2017-05-23 10:29:14 -07:00
|
|
|
// If non-nullptr, forwards updates to the object pointed to by `stats_`.
|
|
|
|
std::shared_ptr<Statistics> stats_;
|
|
|
|
// TODO(ajkr): clean this up since there are no internal stats anymore
|
2014-07-28 12:05:36 -07:00
|
|
|
bool enable_internal_stats_;
|
2017-05-23 10:29:14 -07:00
|
|
|
// Synchronizes anything that operates across other cores' local data,
|
2017-04-26 15:19:50 -07:00
|
|
|
// such that operations like Reset() can be performed atomically.
|
2016-08-24 15:42:31 -07:00
|
|
|
mutable port::Mutex aggregate_lock_;
|
2014-07-28 12:05:36 -07:00
|
|
|
|
2017-05-23 10:29:14 -07:00
|
|
|
// The ticker/histogram data are stored in this structure, which we will store
|
|
|
|
// per-core. It is cache-aligned, so tickers/histograms belonging to different
|
|
|
|
// cores can never share the same cache line.
|
|
|
|
//
|
|
|
|
// Alignment attributes expand to nothing depending on the platform
|
|
|
|
struct StatisticsData {
|
|
|
|
std::atomic_uint_fast64_t tickers_[INTERNAL_TICKER_ENUM_MAX] = {{0}};
|
|
|
|
HistogramImpl histograms_[INTERNAL_HISTOGRAM_ENUM_MAX];
|
|
|
|
char
|
|
|
|
padding[(CACHE_LINE_SIZE -
|
|
|
|
(INTERNAL_TICKER_ENUM_MAX * sizeof(std::atomic_uint_fast64_t) +
|
|
|
|
INTERNAL_HISTOGRAM_ENUM_MAX * sizeof(HistogramImpl)) %
|
|
|
|
CACHE_LINE_SIZE) %
|
|
|
|
CACHE_LINE_SIZE] ROCKSDB_FIELD_UNUSED;
|
2014-01-29 15:08:41 -08:00
|
|
|
};
|
|
|
|
|
2017-05-23 10:29:14 -07:00
|
|
|
static_assert(sizeof(StatisticsData) % 64 == 0, "Expected 64-byte aligned");
|
Thread-specific histogram statistics
Summary:
To reduce contention for atomics when HistogramStats are shared across
threads, this diff makes them thread-specific so updates are faster. This comes
at the expense of slower reads (much less frequent), which now require merging
all histograms. In this diff,
- Thread-specific HistogramImpl is created upon the thread's first measureTime()
- Thread-specific HistogramImpl are merged and deleted upon thread termination or ThreadLocalPtr destruction, whichever comes first
- getHistogramString() and histogramData() merge all histograms, both thread-specific and previously merged ones
Test Plan:
unit tests, ran db_bench and verified histograms look similar
before:
$ TEST_TMPDIR=/dev/shm/ perf record -g ./db_bench --benchmarks=readwhilewriting --statistics --num=1000000 --use_existing_db --threads=64 --cache_size=250000000 --compression_type=lz4
...
+ 7.63% db_bench db_bench [.] rocksdb::HistogramStat::Add
after:
$ TEST_TMPDIR=/dev/shm/ perf record -g ./db_bench --benchmarks=readwhilewriting --statistics --num=1000000 --use_existing_db --threads=64 --cache_size=250000000 --compression_type=lz4
...
+ 0.98% db_bench db_bench [.] rocksdb::HistogramStat::Add
Reviewers: sdong, MarkCallaghan, kradhakrishnan, IslamAbdelRahman
Reviewed By: IslamAbdelRahman
Subscribers: andrewkr, dhruba, leveldb
Differential Revision: https://reviews.facebook.net/D62649
2016-08-31 14:02:09 -07:00
|
|
|
|
2017-05-23 10:29:14 -07:00
|
|
|
CoreLocalArray<StatisticsData> per_core_stats_;
|
Thread-specific histogram statistics
Summary:
To reduce contention for atomics when HistogramStats are shared across
threads, this diff makes them thread-specific so updates are faster. This comes
at the expense of slower reads (much less frequent), which now require merging
all histograms. In this diff,
- Thread-specific HistogramImpl is created upon the thread's first measureTime()
- Thread-specific HistogramImpl are merged and deleted upon thread termination or ThreadLocalPtr destruction, whichever comes first
- getHistogramString() and histogramData() merge all histograms, both thread-specific and previously merged ones
Test Plan:
unit tests, ran db_bench and verified histograms look similar
before:
$ TEST_TMPDIR=/dev/shm/ perf record -g ./db_bench --benchmarks=readwhilewriting --statistics --num=1000000 --use_existing_db --threads=64 --cache_size=250000000 --compression_type=lz4
...
+ 7.63% db_bench db_bench [.] rocksdb::HistogramStat::Add
after:
$ TEST_TMPDIR=/dev/shm/ perf record -g ./db_bench --benchmarks=readwhilewriting --statistics --num=1000000 --use_existing_db --threads=64 --cache_size=250000000 --compression_type=lz4
...
+ 0.98% db_bench db_bench [.] rocksdb::HistogramStat::Add
Reviewers: sdong, MarkCallaghan, kradhakrishnan, IslamAbdelRahman
Reviewed By: IslamAbdelRahman
Subscribers: andrewkr, dhruba, leveldb
Differential Revision: https://reviews.facebook.net/D62649
2016-08-31 14:02:09 -07:00
|
|
|
|
2017-04-26 15:19:50 -07:00
|
|
|
uint64_t getTickerCountLocked(uint32_t ticker_type) const;
|
2017-05-23 10:29:14 -07:00
|
|
|
std::unique_ptr<HistogramImpl> getHistogramImplLocked(
|
|
|
|
uint32_t histogram_type) const;
|
2017-04-26 15:19:50 -07:00
|
|
|
void setTickerCountLocked(uint32_t ticker_type, uint64_t count);
|
2014-01-17 12:46:06 -08:00
|
|
|
};
|
|
|
|
|
|
|
|
// Utility functions
|
2014-07-28 12:05:36 -07:00
|
|
|
inline void MeasureTime(Statistics* statistics, uint32_t histogram_type,
|
2014-01-17 12:46:06 -08:00
|
|
|
uint64_t value) {
|
|
|
|
if (statistics) {
|
2014-07-28 12:05:36 -07:00
|
|
|
statistics->measureTime(histogram_type, value);
|
2014-01-17 12:46:06 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-28 12:05:36 -07:00
|
|
|
inline void RecordTick(Statistics* statistics, uint32_t ticker_type,
|
2014-01-17 12:46:06 -08:00
|
|
|
uint64_t count = 1) {
|
|
|
|
if (statistics) {
|
2014-07-28 12:05:36 -07:00
|
|
|
statistics->recordTick(ticker_type, count);
|
2014-01-17 12:46:06 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-28 12:05:36 -07:00
|
|
|
inline void SetTickerCount(Statistics* statistics, uint32_t ticker_type,
|
2014-01-17 12:46:06 -08:00
|
|
|
uint64_t count) {
|
|
|
|
if (statistics) {
|
2014-07-28 12:05:36 -07:00
|
|
|
statistics->setTickerCount(ticker_type, count);
|
2014-01-17 12:46:06 -08:00
|
|
|
}
|
|
|
|
}
|
2014-07-28 12:10:49 -07:00
|
|
|
|
2014-01-17 12:46:06 -08:00
|
|
|
}
|