//  Copyright (c) 2013, Facebook, Inc.  All rights reserved.
//  This source code is licensed under the BSD-style license found in the
//  LICENSE file in the root directory of this source tree. An additional grant
//  of patent rights can be found in the PATENTS file in the same directory.
//
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file. See the AUTHORS file for names of contributors.
//

#pragma once
#include "db/version_set.h"

#include <vector>
#include <string>

class ColumnFamilyData;

namespace rocksdb {

class MemTableList;
class DBImpl;

// Internal identifiers for the DB properties that can be queried.
//
// Enumerators rely on implicit numbering, so their order is significant:
// kStartIntTypes is a marker and the enumerators after it are documented as
// the integer-valued properties. Only append/insert with that in mind.
//
// IMPORTANT: If you add a new property here, also add it to the list in
//            include/rocksdb/db.h
enum DBPropertyType : uint32_t {
  kUnknown,
  kNumFilesAtLevel,  // Number of files at a specific level
  kLevelStats,       // Return number of files and total sizes of each level
  kCFStats,          // Return general statistics of CF
  kDBStats,          // Return general statistics of DB
  kStats,            // Return general statistics of both DB and CF
  kSsTables,         // Return a human readable string of current SST files
  kStartIntTypes,    // ---- Dummy value to indicate the start of integer values
  kNumImmutableMemTable,         // Return number of immutable mem tables that
                                 // have not been flushed.
  kNumImmutableMemTableFlushed,  // Return number of immutable mem tables
                                 // in memory that have already been flushed
  kMemtableFlushPending,         // Return 1 if mem table flushing is pending,
                                 // otherwise 0.
  kNumRunningFlushes,      // Return the number of currently running flushes.
  kCompactionPending,      // Return 1 if a compaction is pending. Otherwise 0.
  kNumRunningCompactions,  // Return the number of currently running
                           // compactions.
  kBackgroundErrors,       // Return accumulated background errors encountered.
  kCurSizeActiveMemTable,  // Return current size of the active memtable
  kCurSizeAllMemTables,    // Return current size of unflushed
                           // (active + immutable) memtables
  kSizeAllMemTables,       // Return current size of all (active + immutable
                           // + pinned) memtables
  kNumEntriesInMutableMemtable,    // Return number of entries in the mutable
                                   // memtable.
  kNumEntriesInImmutableMemtable,  // Return sum of number of entries in all
                                   // the immutable mem tables.
  kNumDeletesInMutableMemtable,    // Return number of deletion entries in the
                                   // mutable memtable.
  kNumDeletesInImmutableMemtable,  // Return the total number of deletion
                                   // entries in all the immutable mem tables.
  kEstimatedNumKeys,  // Estimated total number of keys in the database.
  kEstimatedUsageByTableReaders,  // Estimated memory by table readers.
  kIsFileDeletionEnabled,         // Equals disable_delete_obsolete_files_,
                                  // 0 means file deletions enabled
  kNumSnapshots,                  // Number of snapshots in the system
  kOldestSnapshotTime,            // Unix timestamp of the first snapshot
  kNumLiveVersions,
  kEstimateLiveDataSize,            // Estimated amount of live data in bytes
  kTotalSstFilesSize,               // Total size of all sst files.
  kBaseLevel,                       // The level that L0 data is compacted to
  kEstimatePendingCompactionBytes,  // Estimated bytes to compaction
  kAggregatedTableProperties,  // Return a string that contains the aggregated
                               // table properties.
  kAggregatedTablePropertiesAtLevel,  // Return a string that contains the
                                      // aggregated table properties at the
                                      // specified level.
};

// Translates the textual `property` name into its DBPropertyType.
// NOTE(review): the definition is not in this header. Presumably
// *is_int_property reports whether the property is integer-valued and
// *need_out_of_mutex whether it has to be served through
// InternalStats::GetIntPropertyOutOfMutex() -- confirm against the .cc file.
DBPropertyType GetPropertyType(const Slice& property, bool* is_int_property,
                               bool* need_out_of_mutex);

#ifndef ROCKSDB_LITE
class InternalStats {
 public:
85
  enum InternalCFStatsType {
86 87
    LEVEL0_SLOWDOWN_TOTAL,
    LEVEL0_SLOWDOWN_WITH_COMPACTION,
I
Igor Canadi 已提交
88
    MEMTABLE_COMPACTION,
89 90
    LEVEL0_NUM_FILES_TOTAL,
    LEVEL0_NUM_FILES_WITH_COMPACTION,
91
    HARD_PENDING_COMPACTION_BYTES_LIMIT,
I
Igor Canadi 已提交
92
    WRITE_STALLS_ENUM_MAX,
93 94
    BYTES_FLUSHED,
    INTERNAL_CF_STATS_ENUM_MAX,
I
Igor Canadi 已提交
95 96
  };

97 98 99 100
  enum InternalDBStatsType {
    WAL_FILE_BYTES,
    WAL_FILE_SYNCED,
    BYTES_WRITTEN,
S
sdong 已提交
101
    NUMBER_KEYS_WRITTEN,
102 103 104
    WRITE_DONE_BY_OTHER,
    WRITE_DONE_BY_SELF,
    WRITE_WITH_WAL,
S
sdong 已提交
105
    WRITE_STALL_MICROS,
106 107 108
    INTERNAL_DB_STATS_ENUM_MAX,
  };

109
  InternalStats(int num_levels, Env* env, ColumnFamilyData* cfd)
110 111 112 113 114 115
      : db_stats_(INTERNAL_DB_STATS_ENUM_MAX),
        cf_stats_value_(INTERNAL_CF_STATS_ENUM_MAX),
        cf_stats_count_(INTERNAL_CF_STATS_ENUM_MAX),
        comp_stats_(num_levels),
        stall_leveln_slowdown_count_hard_(num_levels),
        stall_leveln_slowdown_count_soft_(num_levels),
116
        file_read_latency_(num_levels),
117
        bg_error_count_(0),
I
Igor Canadi 已提交
118 119
        number_levels_(num_levels),
        env_(env),
120
        cfd_(cfd),
121 122 123 124 125 126 127 128 129 130 131 132 133
        started_at_(env->NowMicros()) {
    for (int i = 0; i< INTERNAL_DB_STATS_ENUM_MAX; ++i) {
      db_stats_[i] = 0;
    }
    for (int i = 0; i< INTERNAL_CF_STATS_ENUM_MAX; ++i) {
      cf_stats_value_[i] = 0;
      cf_stats_count_[i] = 0;
    }
    for (int i = 0; i < num_levels; ++i) {
      stall_leveln_slowdown_count_hard_[i] = 0;
      stall_leveln_slowdown_count_soft_[i] = 0;
    }
  }
I
Igor Canadi 已提交
134

135
  // Per level compaction stats.  comp_stats_[level] stores the stats for
I
Igor Canadi 已提交
136 137 138 139
  // compactions that produced data for the specified "level".
  struct CompactionStats {
    uint64_t micros;

140 141
    // The number of bytes read from all non-output levels
    uint64_t bytes_read_non_output_levels;
I
Igor Canadi 已提交
142

143 144
    // The number of bytes read from the compaction output level.
    uint64_t bytes_read_output_level;
I
Igor Canadi 已提交
145

146
    // Total number of bytes written during compaction
147
    uint64_t bytes_written;
I
Igor Canadi 已提交
148

149
    // Total number of bytes moved to the output level
150 151
    uint64_t bytes_moved;

152 153
    // The number of compaction input files in all non-output levels.
    int num_input_files_in_non_output_levels;
I
Igor Canadi 已提交
154

155 156
    // The number of compaction input files in the output level.
    int num_input_files_in_output_level;
I
Igor Canadi 已提交
157

158 159
    // The number of compaction output files.
    int num_output_files;
I
Igor Canadi 已提交
160

161
    // Total incoming entries during compaction between levels N and N+1
S
sdong 已提交
162
    uint64_t num_input_records;
163 164 165

    // Accumulated diff number of entries
    // (num input entries - num output entires) for compaction  levels N and N+1
S
sdong 已提交
166
    uint64_t num_dropped_records;
167

I
Igor Canadi 已提交
168 169 170
    // Number of compactions done
    int count;

I
Igor Canadi 已提交
171
    explicit CompactionStats(int _count = 0)
I
Igor Canadi 已提交
172
        : micros(0),
173 174
          bytes_read_non_output_levels(0),
          bytes_read_output_level(0),
I
Igor Canadi 已提交
175
          bytes_written(0),
176
          bytes_moved(0),
177 178 179
          num_input_files_in_non_output_levels(0),
          num_input_files_in_output_level(0),
          num_output_files(0),
180 181
          num_input_records(0),
          num_dropped_records(0),
I
Igor Canadi 已提交
182
          count(_count) {}
I
Igor Canadi 已提交
183

184 185
    explicit CompactionStats(const CompactionStats& c)
        : micros(c.micros),
186 187
          bytes_read_non_output_levels(c.bytes_read_non_output_levels),
          bytes_read_output_level(c.bytes_read_output_level),
188
          bytes_written(c.bytes_written),
189
          bytes_moved(c.bytes_moved),
190 191 192 193 194
          num_input_files_in_non_output_levels(
              c.num_input_files_in_non_output_levels),
          num_input_files_in_output_level(
              c.num_input_files_in_output_level),
          num_output_files(c.num_output_files),
195 196
          num_input_records(c.num_input_records),
          num_dropped_records(c.num_dropped_records),
197 198
          count(c.count) {}

I
Igor Canadi 已提交
199 200
    void Add(const CompactionStats& c) {
      this->micros += c.micros;
201 202
      this->bytes_read_non_output_levels += c.bytes_read_non_output_levels;
      this->bytes_read_output_level += c.bytes_read_output_level;
I
Igor Canadi 已提交
203
      this->bytes_written += c.bytes_written;
204
      this->bytes_moved += c.bytes_moved;
205 206 207 208 209
      this->num_input_files_in_non_output_levels +=
          c.num_input_files_in_non_output_levels;
      this->num_input_files_in_output_level +=
          c.num_input_files_in_output_level;
      this->num_output_files += c.num_output_files;
210 211
      this->num_input_records += c.num_input_records;
      this->num_dropped_records += c.num_dropped_records;
L
Lei Jin 已提交
212
      this->count += c.count;
I
Igor Canadi 已提交
213
    }
214 215 216

    void Subtract(const CompactionStats& c) {
      this->micros -= c.micros;
217 218
      this->bytes_read_non_output_levels -= c.bytes_read_non_output_levels;
      this->bytes_read_output_level -= c.bytes_read_output_level;
219
      this->bytes_written -= c.bytes_written;
220
      this->bytes_moved -= c.bytes_moved;
221 222 223 224 225
      this->num_input_files_in_non_output_levels -=
          c.num_input_files_in_non_output_levels;
      this->num_input_files_in_output_level -=
          c.num_input_files_in_output_level;
      this->num_output_files -= c.num_output_files;
226 227
      this->num_input_records -= c.num_input_records;
      this->num_dropped_records -= c.num_dropped_records;
228 229
      this->count -= c.count;
    }
I
Igor Canadi 已提交
230 231 232
  };

  void AddCompactionStats(int level, const CompactionStats& stats) {
233
    comp_stats_[level].Add(stats);
I
Igor Canadi 已提交
234 235
  }

236 237 238 239
  void IncBytesMoved(int level, uint64_t amount) {
    comp_stats_[level].bytes_moved += amount;
  }

240
  void RecordLevelNSlowdown(int level, bool soft) {
241 242 243 244 245 246 247 248 249 250
    if (soft) {
      ++stall_leveln_slowdown_count_soft_[level];
    } else {
      ++stall_leveln_slowdown_count_hard_[level];
    }
  }

  void AddCFStats(InternalCFStatsType type, uint64_t value) {
    cf_stats_value_[type] += value;
    ++cf_stats_count_[type];
I
Igor Canadi 已提交
251 252
  }

253 254
  void AddDBStats(InternalDBStatsType type, uint64_t value) {
    db_stats_[type] += value;
I
Igor Canadi 已提交
255 256
  }

257 258 259 260
  HistogramImpl* GetFileReadHist(int level) {
    return &file_read_latency_[level];
  }

261 262 263 264
  uint64_t GetBackgroundErrorCount() const { return bg_error_count_; }

  uint64_t BumpAndGetBackgroundErrorCount() { return ++bg_error_count_; }

265 266
  bool GetStringProperty(DBPropertyType property_type, const Slice& property,
                         std::string* value);
I
Igor Canadi 已提交
267

268 269
  bool GetIntProperty(DBPropertyType property_type, uint64_t* value,
                      DBImpl* db) const;
270 271 272

  bool GetIntPropertyOutOfMutex(DBPropertyType property_type, Version* version,
                                uint64_t* value) const;
273

I
Igor Canadi 已提交
274
 private:
275
  void DumpDBStats(std::string* value);
276
  void DumpCFStats(std::string* value);
277 278 279 280 281 282 283 284 285 286 287

  // Per-DB stats
  std::vector<uint64_t> db_stats_;
  // Per-ColumnFamily stats
  std::vector<uint64_t> cf_stats_value_;
  std::vector<uint64_t> cf_stats_count_;
  // Per-ColumnFamily/level compaction stats
  std::vector<CompactionStats> comp_stats_;
  // These count the number of microseconds for which MakeRoomForWrite stalls.
  std::vector<uint64_t> stall_leveln_slowdown_count_hard_;
  std::vector<uint64_t> stall_leveln_slowdown_count_soft_;
288
  std::vector<HistogramImpl> file_read_latency_;
I
Igor Canadi 已提交
289 290

  // Used to compute per-interval statistics
291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308
  struct CFStatsSnapshot {
    // ColumnFamily-level stats
    CompactionStats comp_stats;
    uint64_t ingest_bytes;            // Bytes written to L0
    uint64_t stall_count;             // Stall count

    CFStatsSnapshot()
        : comp_stats(0),
          ingest_bytes(0),
          stall_count(0) {}
  } cf_stats_snapshot_;

  struct DBStatsSnapshot {
    // DB-level stats
    uint64_t ingest_bytes;            // Bytes written by user
    uint64_t wal_bytes;               // Bytes written to WAL
    uint64_t wal_synced;              // Number of times WAL is synced
    uint64_t write_with_wal;          // Number of writes that request WAL
I
Igor Canadi 已提交
309 310
    // These count the number of writes processed by the calling thread or
    // another thread.
311 312
    uint64_t write_other;
    uint64_t write_self;
313 314 315 316
    // Stats from compaction jobs - bytes written, bytes read, duration.
    uint64_t compact_bytes_write;
    uint64_t compact_bytes_read;
    uint64_t compact_micros;
S
sdong 已提交
317 318 319 320 321
    // Total number of keys written. write_self and write_other measure number
    // of write requests written, Each of the write request can contain updates
    // to multiple keys. num_keys_written is total number of keys updated by all
    // those writes.
    uint64_t num_keys_written;
S
sdong 已提交
322 323
    // Total time writes delayed by stalls.
    uint64_t write_stall_micros;
324 325 326 327 328 329 330 331 332
    double seconds_up;

    DBStatsSnapshot()
        : ingest_bytes(0),
          wal_bytes(0),
          wal_synced(0),
          write_with_wal(0),
          write_other(0),
          write_self(0),
333 334 335
          compact_bytes_write(0),
          compact_bytes_read(0),
          compact_micros(0),
336
          num_keys_written(0),
S
sdong 已提交
337
          write_stall_micros(0),
338 339
          seconds_up(0) {}
  } db_stats_snapshot_;
I
Igor Canadi 已提交
340

341 342 343 344 345 346 347
  // Total number of background errors encountered. Every time a flush task
  // or compaction task fails, this counter is incremented. The failure can
  // be caused by any possible reason, including file system errors, out of
  // resources, or input file corruption. Failing when retrying the same flush
  // or compaction will cause the counter to increase too.
  uint64_t bg_error_count_;

348
  const int number_levels_;
I
Igor Canadi 已提交
349
  Env* env_;
350
  ColumnFamilyData* cfd_;
351
  const uint64_t started_at_;
I
Igor Canadi 已提交
352 353
};

#else

class InternalStats {
 public:
  enum InternalCFStatsType {
359 360
    LEVEL0_SLOWDOWN_TOTAL,
    LEVEL0_SLOWDOWN_WITH_COMPACTION,
361
    MEMTABLE_COMPACTION,
362 363
    LEVEL0_NUM_FILES_TOTAL,
    LEVEL0_NUM_FILES_WITH_COMPACTION,
364
    HARD_PENDING_COMPACTION_BYTES_LIMIT,
365 366 367 368 369 370 371 372 373 374 375 376 377
    WRITE_STALLS_ENUM_MAX,
    BYTES_FLUSHED,
    INTERNAL_CF_STATS_ENUM_MAX,
  };

  enum InternalDBStatsType {
    WAL_FILE_BYTES,
    WAL_FILE_SYNCED,
    BYTES_WRITTEN,
    NUMBER_KEYS_WRITTEN,
    WRITE_DONE_BY_OTHER,
    WRITE_DONE_BY_SELF,
    WRITE_WITH_WAL,
S
sdong 已提交
378
    WRITE_STALL_MICROS,
379 380 381 382 383 384 385
    INTERNAL_DB_STATS_ENUM_MAX,
  };

  InternalStats(int num_levels, Env* env, ColumnFamilyData* cfd) {}

  struct CompactionStats {
    uint64_t micros;
386 387
    uint64_t bytes_read_non_output_levels;
    uint64_t bytes_read_output_level;
388
    uint64_t bytes_written;
389
    uint64_t bytes_moved;
390 391 392
    int num_input_files_in_non_output_levels;
    int num_input_files_in_output_level;
    int num_output_files;
393 394 395 396 397 398 399 400 401 402 403 404 405 406 407
    uint64_t num_input_records;
    uint64_t num_dropped_records;
    int count;

    explicit CompactionStats(int _count = 0) {}

    explicit CompactionStats(const CompactionStats& c) {}

    void Add(const CompactionStats& c) {}

    void Subtract(const CompactionStats& c) {}
  };

  void AddCompactionStats(int level, const CompactionStats& stats) {}

408 409
  void IncBytesMoved(int level, uint64_t amount) {}

410
  void RecordLevelNSlowdown(int level, bool soft) {}
411 412 413 414 415

  void AddCFStats(InternalCFStatsType type, uint64_t value) {}

  void AddDBStats(InternalDBStatsType type, uint64_t value) {}

416 417
  HistogramImpl* GetFileReadHist(int level) { return nullptr; }

418 419 420 421 422 423 424 425 426 427 428 429 430 431 432
  uint64_t GetBackgroundErrorCount() const { return 0; }

  uint64_t BumpAndGetBackgroundErrorCount() { return 0; }

  bool GetStringProperty(DBPropertyType property_type, const Slice& property,
                         std::string* value) { return false; }

  bool GetIntProperty(DBPropertyType property_type, uint64_t* value,
                      DBImpl* db) const { return false; }

  bool GetIntPropertyOutOfMutex(DBPropertyType property_type, Version* version,
                                uint64_t* value) const { return false; }
};
#endif  // !ROCKSDB_LITE

}  // namespace rocksdb