// Copyright (c) 2013, Facebook, Inc. All rights reserved. // This source code is licensed under the BSD-style license found in the // LICENSE file in the root directory of this source tree. An additional grant // of patent rights can be found in the PATENTS file in the same directory. // // Copyright (c) 2011 The LevelDB Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. See the AUTHORS file for names of contributors. // #pragma once #include "db/version_set.h" #include #include class ColumnFamilyData; namespace rocksdb { class MemTableList; class DBImpl; enum DBPropertyType : uint32_t { kUnknown, kNumFilesAtLevel, // Number of files at a specific level kLevelStats, // Return number of files and total sizes of each level kCFStats, // Return general statitistics of CF kDBStats, // Return general statitistics of DB kStats, // Return general statitistics of both DB and CF kSsTables, // Return a human readable string of current SST files kStartIntTypes, // ---- Dummy value to indicate the start of integer values kNumImmutableMemTable, // Return number of immutable mem tables kMemtableFlushPending, // Return 1 if mem table flushing is pending, // otherwise 0. kCompactionPending, // Return 1 if a compaction is pending. Otherwise 0. kBackgroundErrors, // Return accumulated background errors encountered. kCurSizeActiveMemTable, // Return current size of the active memtable kCurSizeAllMemTables, // Return current size of all (active + immutable) // memtables kNumEntriesInMutableMemtable, // Return number of entries in the mutable // memtable. kNumEntriesInImmutableMemtable, // Return sum of number of entries in all // the immutable mem tables. kEstimatedNumKeys, // Estimated total number of keys in the database. kEstimatedUsageByTableReaders, // Estimated memory by table readers. kIsFileDeletionEnabled, // Equals disable_delete_obsolete_files_, // 0 means file deletions enabled }; extern DBPropertyType GetPropertyType(const Slice& property, bool* is_int_property, bool* need_out_of_mutex); class InternalStats { public: enum InternalCFStatsType { LEVEL0_SLOWDOWN, MEMTABLE_COMPACTION, LEVEL0_NUM_FILES, WRITE_STALLS_ENUM_MAX, BYTES_FLUSHED, INTERNAL_CF_STATS_ENUM_MAX, }; enum InternalDBStatsType { WAL_FILE_BYTES, WAL_FILE_SYNCED, BYTES_WRITTEN, NUMBER_KEYS_WRITTEN, WRITE_DONE_BY_OTHER, WRITE_DONE_BY_SELF, WRITE_WITH_WAL, INTERNAL_DB_STATS_ENUM_MAX, }; InternalStats(int num_levels, Env* env, ColumnFamilyData* cfd) : db_stats_(INTERNAL_DB_STATS_ENUM_MAX), cf_stats_value_(INTERNAL_CF_STATS_ENUM_MAX), cf_stats_count_(INTERNAL_CF_STATS_ENUM_MAX), comp_stats_(num_levels), stall_leveln_slowdown_hard_(num_levels), stall_leveln_slowdown_count_hard_(num_levels), stall_leveln_slowdown_soft_(num_levels), stall_leveln_slowdown_count_soft_(num_levels), bg_error_count_(0), number_levels_(num_levels), env_(env), cfd_(cfd), started_at_(env->NowMicros()) { for (int i = 0; i< INTERNAL_DB_STATS_ENUM_MAX; ++i) { db_stats_[i] = 0; } for (int i = 0; i< INTERNAL_CF_STATS_ENUM_MAX; ++i) { cf_stats_value_[i] = 0; cf_stats_count_[i] = 0; } for (int i = 0; i < num_levels; ++i) { stall_leveln_slowdown_hard_[i] = 0; stall_leveln_slowdown_count_hard_[i] = 0; stall_leveln_slowdown_soft_[i] = 0; stall_leveln_slowdown_count_soft_[i] = 0; } } // Per level compaction stats. comp_stats_[level] stores the stats for // compactions that produced data for the specified "level". struct CompactionStats { uint64_t micros; // Bytes read from level N during compaction between levels N and N+1 uint64_t bytes_readn; // Bytes read from level N+1 during compaction between levels N and N+1 uint64_t bytes_readnp1; // Total bytes written during compaction between levels N and N+1 uint64_t bytes_written; // Files read from level N during compaction between levels N and N+1 int files_in_leveln; // Files read from level N+1 during compaction between levels N and N+1 int files_in_levelnp1; // Files written during compaction between levels N and N+1 int files_out_levelnp1; // Total incoming entries during compaction between levels N and N+1 uint64_t num_input_records; // Accumulated diff number of entries // (num input entries - num output entires) for compaction levels N and N+1 uint64_t num_dropped_records; // Number of compactions done int count; explicit CompactionStats(int _count = 0) : micros(0), bytes_readn(0), bytes_readnp1(0), bytes_written(0), files_in_leveln(0), files_in_levelnp1(0), files_out_levelnp1(0), num_input_records(0), num_dropped_records(0), count(_count) {} explicit CompactionStats(const CompactionStats& c) : micros(c.micros), bytes_readn(c.bytes_readn), bytes_readnp1(c.bytes_readnp1), bytes_written(c.bytes_written), files_in_leveln(c.files_in_leveln), files_in_levelnp1(c.files_in_levelnp1), files_out_levelnp1(c.files_out_levelnp1), num_input_records(c.num_input_records), num_dropped_records(c.num_dropped_records), count(c.count) {} void Add(const CompactionStats& c) { this->micros += c.micros; this->bytes_readn += c.bytes_readn; this->bytes_readnp1 += c.bytes_readnp1; this->bytes_written += c.bytes_written; this->files_in_leveln += c.files_in_leveln; this->files_in_levelnp1 += c.files_in_levelnp1; this->files_out_levelnp1 += c.files_out_levelnp1; this->num_input_records += c.num_input_records; this->num_dropped_records += c.num_dropped_records; this->count += c.count; } void Subtract(const CompactionStats& c) { this->micros -= c.micros; this->bytes_readn -= c.bytes_readn; this->bytes_readnp1 -= c.bytes_readnp1; this->bytes_written -= c.bytes_written; this->files_in_leveln -= c.files_in_leveln; this->files_in_levelnp1 -= c.files_in_levelnp1; this->files_out_levelnp1 -= c.files_out_levelnp1; this->num_input_records -= c.num_input_records; this->num_dropped_records -= c.num_dropped_records; this->count -= c.count; } }; void AddCompactionStats(int level, const CompactionStats& stats) { comp_stats_[level].Add(stats); } void RecordLevelNSlowdown(int level, uint64_t micros, bool soft) { if (soft) { stall_leveln_slowdown_soft_[level] += micros; ++stall_leveln_slowdown_count_soft_[level]; } else { stall_leveln_slowdown_hard_[level] += micros; ++stall_leveln_slowdown_count_hard_[level]; } } void AddCFStats(InternalCFStatsType type, uint64_t value) { cf_stats_value_[type] += value; ++cf_stats_count_[type]; } void AddDBStats(InternalDBStatsType type, uint64_t value) { db_stats_[type] += value; } uint64_t GetBackgroundErrorCount() const { return bg_error_count_; } uint64_t BumpAndGetBackgroundErrorCount() { return ++bg_error_count_; } bool GetStringProperty(DBPropertyType property_type, const Slice& property, std::string* value); bool GetIntProperty(DBPropertyType property_type, uint64_t* value, DBImpl* db) const; bool GetIntPropertyOutOfMutex(DBPropertyType property_type, Version* version, uint64_t* value) const; private: void DumpDBStats(std::string* value); void DumpCFStats(std::string* value); // Per-DB stats std::vector db_stats_; // Per-ColumnFamily stats std::vector cf_stats_value_; std::vector cf_stats_count_; // Per-ColumnFamily/level compaction stats std::vector comp_stats_; // These count the number of microseconds for which MakeRoomForWrite stalls. std::vector stall_leveln_slowdown_hard_; std::vector stall_leveln_slowdown_count_hard_; std::vector stall_leveln_slowdown_soft_; std::vector stall_leveln_slowdown_count_soft_; // Used to compute per-interval statistics struct CFStatsSnapshot { // ColumnFamily-level stats CompactionStats comp_stats; uint64_t ingest_bytes; // Bytes written to L0 uint64_t stall_us; // Stall time in micro-seconds uint64_t stall_count; // Stall count CFStatsSnapshot() : comp_stats(0), ingest_bytes(0), stall_us(0), stall_count(0) {} } cf_stats_snapshot_; struct DBStatsSnapshot { // DB-level stats uint64_t ingest_bytes; // Bytes written by user uint64_t wal_bytes; // Bytes written to WAL uint64_t wal_synced; // Number of times WAL is synced uint64_t write_with_wal; // Number of writes that request WAL // These count the number of writes processed by the calling thread or // another thread. uint64_t write_other; uint64_t write_self; // Total number of keys written. write_self and write_other measure number // of write requests written, Each of the write request can contain updates // to multiple keys. num_keys_written is total number of keys updated by all // those writes. uint64_t num_keys_written; double seconds_up; DBStatsSnapshot() : ingest_bytes(0), wal_bytes(0), wal_synced(0), write_with_wal(0), write_other(0), write_self(0), num_keys_written(0), seconds_up(0) {} } db_stats_snapshot_; // Total number of background errors encountered. Every time a flush task // or compaction task fails, this counter is incremented. The failure can // be caused by any possible reason, including file system errors, out of // resources, or input file corruption. Failing when retrying the same flush // or compaction will cause the counter to increase too. uint64_t bg_error_count_; const int number_levels_; Env* env_; ColumnFamilyData* cfd_; const uint64_t started_at_; }; } // namespace rocksdb