db_bench.cc 85.3 KB
Newer Older
J
jorlow@chromium.org 已提交
1 2 3 4
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file. See the AUTHORS file for names of contributors.

5
#include <cstddef>
J
jorlow@chromium.org 已提交
6 7 8 9 10
#include <sys/types.h>
#include <stdio.h>
#include <stdlib.h>
#include "db/db_impl.h"
#include "db/version_set.h"
11
#include "db/db_statistics.h"
12 13 14 15 16 17
#include "rocksdb/options.h"
#include "rocksdb/cache.h"
#include "rocksdb/db.h"
#include "rocksdb/env.h"
#include "rocksdb/write_batch.h"
#include "rocksdb/statistics.h"
J
jorlow@chromium.org 已提交
18
#include "port/port.h"
19
#include "util/bit_set.h"
J
jorlow@chromium.org 已提交
20
#include "util/crc32c.h"
J
jorlow@chromium.org 已提交
21
#include "util/histogram.h"
22
#include "util/mutexlock.h"
J
jorlow@chromium.org 已提交
23
#include "util/random.h"
24
#include "util/stack_trace.h"
25
#include "util/string_util.h"
J
jorlow@chromium.org 已提交
26
#include "util/testutil.h"
27
#include "hdfs/env_hdfs.h"
D
Deon Nicholas 已提交
28
#include "utilities/merge_operators.h"
J
jorlow@chromium.org 已提交
29 30 31

// Comma-separated list of operations to run in the specified order
//   Actual benchmarks:
32 33 34 35 36
//      fillseq       -- write N values in sequential key order in async mode
//      fillrandom    -- write N values in random key order in async mode
//      overwrite     -- overwrite N values in random key order in async mode
//      fillsync      -- write N/100 values in random key order in sync mode
//      fill100K      -- write N/1000 100K values in random order in async mode
S
Sanjay Ghemawat 已提交
37 38
//      deleteseq     -- delete N keys in sequential order
//      deleterandom  -- delete N keys in random order
39 40 41
//      readseq       -- read N times sequentially
//      readreverse   -- read N times in reverse order
//      readrandom    -- read N times in random order
S
Sanjay Ghemawat 已提交
42
//      readmissing   -- read N missing keys in random order
43
//      readhot       -- read N times in random order from 1% section of DB
T
Tyler Harter 已提交
44 45 46
//      readwhilewriting      -- 1 writer, N threads doing random reads
//      readrandomwriterandom -- N threads doing random-read, random-write
//      prefixscanrandom      -- prefix scan N times in random order
47
//      updaterandom  -- N threads doing read-modify-write for random keys
D
Deon Nicholas 已提交
48 49 50
//      appendrandom  -- N threads doing read-modify-write with growing values
//      mergerandom   -- same as updaterandom/appendrandom using merge operator
//                    -- must be used with FLAGS_merge_operator (see below)
S
Sanjay Ghemawat 已提交
51
//      seekrandom    -- N random seeks
J
jorlow@chromium.org 已提交
52
//      crc32c        -- repeated crc32c of 4K of data
53
//      acquireload   -- load N*1000 times
J
jorlow@chromium.org 已提交
54 55
//   Meta operations:
//      compact     -- Compact the entire DB
56
//      stats       -- Print DB stats
57
//      levelstats  -- Print the number of files and bytes per level
S
Sanjay Ghemawat 已提交
58
//      sstables    -- Print sstable info
J
jorlow@chromium.org 已提交
59 60
//      heapprofile -- Dump a heap profile (if supported by this port)
static const char* FLAGS_benchmarks =
61
    "fillseq,"
J
jorlow@chromium.org 已提交
62
    "fillsync,"
63 64
    "fillrandom,"
    "overwrite,"
J
jorlow@chromium.org 已提交
65 66
    "readrandom,"
    "readrandom,"  // Extra run to allow previous compactions to quiesce
J
jorlow@chromium.org 已提交
67
    "readseq,"
J
jorlow@chromium.org 已提交
68
    "readreverse,"
J
jorlow@chromium.org 已提交
69
    "compact,"
J
jorlow@chromium.org 已提交
70
    "readrandom,"
J
jorlow@chromium.org 已提交
71
    "readseq,"
J
jorlow@chromium.org 已提交
72
    "readreverse,"
73
    "readwhilewriting,"
74
    "readrandomwriterandom," // mix reads and writes based on FLAGS_readwritepercent
M
Mark Callaghan 已提交
75
    "updaterandom," // read-modify-write for random keys
76
    "randomwithverify," // random reads and writes with some verification
J
jorlow@chromium.org 已提交
77 78
    "fill100K,"
    "crc32c,"
79 80
    "snappycomp,"
    "snappyuncomp,"
81
    "acquireload,"
J
jorlow@chromium.org 已提交
82
    ;
83 84
// the maximum size of key in bytes
static const int MAX_KEY_SIZE = 128;
J
jorlow@chromium.org 已提交
85
// Number of key/values to place in database
86
static long long FLAGS_num = 1000000;
J
jorlow@chromium.org 已提交
87

88 89 90
// Number of distinct keys to use. Used in RandomWithVerify to read/write
// on fewer keys so that gets are more likely to find the key and puts
// are more likely to update the same key
91
static long long FLAGS_numdistinct = 1000;
92

93
// Number of read operations to do.  If negative, do FLAGS_num reads.
94
static long FLAGS_reads = -1;
95

96 97 98
// When ==1 reads use ::Get, when >1 reads use an iterator
static long FLAGS_read_range = 1;

T
Tyler Harter 已提交
99 100 101 102 103 104 105
// Whether to place prefixes in blooms
static bool FLAGS_use_prefix_blooms = false;

// Whether to set ReadOptions.prefix for prefixscanrandom.  If this is
// true, use_prefix_blooms must also be true.
static bool FLAGS_use_prefix_api = false;

106 107 108
// Seed base for random number generators. When 0 it is deterministic.
static long FLAGS_seed = 0;

109 110 111
// Number of concurrent threads to run.
static int FLAGS_threads = 1;

M
Mark Callaghan 已提交
112 113 114 115
// Time in seconds for the random-ops tests to run. When 0 then
// FLAGS_num & FLAGS_reads determine the test duration
static int FLAGS_duration = 0;

J
jorlow@chromium.org 已提交
116 117 118
// Size of each value
static int FLAGS_value_size = 100;

119 120 121
// Size of each key
static int FLAGS_key_size = 16;

J
jorlow@chromium.org 已提交
122 123
// Arrange to generate values that shrink to this fraction of
// their original size after compression
124
static double FLAGS_compression_ratio = 0.5;
J
jorlow@chromium.org 已提交
125 126 127 128 129

// Print histogram of operation timings
static bool FLAGS_histogram = false;

// Number of bytes to buffer in memtable before compacting
130 131 132
// (initialized to default value by "main")
static int FLAGS_write_buffer_size = 0;

A
Abhishek Kona 已提交
133
// The number of in-memory memtables.
134 135 136 137
// Each memtable is of size FLAGS_write_buffer_size.
// This is initialized to default value of 2 in "main" function.
static int FLAGS_max_write_buffer_number = 0;

138 139 140
// The minimum number of write buffers that will be merged together
// before writing to storage. This is cheap because it is an
// in-memory merge. If this feature is not enabled, then all these
X
Xing Jin 已提交
141
// write buffers are flushed to L0 as separate files and this increases
142
// read amplification because a get request has to check in all of these
X
Xing Jin 已提交
143
// files. Also, an in-memory merge may result in writing less
144 145 146 147
// data to storage if there are duplicate records in each of these
// individual write buffers.
static int FLAGS_min_write_buffer_number_to_merge = 0;

148 149 150 151 152
// The maximum number of concurrent background compactions
// that can occur in parallel.
// This is initialized to default value of 1 in "main" function.
static int FLAGS_max_background_compactions = 0;

153 154
// style of compaction: level-based vs universal
static leveldb::CompactionStyle FLAGS_compaction_style = leveldb::kCompactionStyleLevel;
155

X
Xing Jin 已提交
156 157
// Percentage flexibility while comparing file size
// (for universal compaction only).
158
static int FLAGS_universal_size_ratio = 1;
159

X
Xing Jin 已提交
160 161
// The minimum number of files in a single compaction run
// (for universal compaction only).
162
static int FLAGS_compaction_universal_min_merge_width = 2;
163

164 165
// Number of bytes to use as a cache of uncompressed data.
// Negative means use default settings.
D
Dhruba Borthakur 已提交
166
static long FLAGS_cache_size = -1;
J
jorlow@chromium.org 已提交
167

168 169 170
// Number of bytes in a block.
static int FLAGS_block_size = 0;

171 172 173
// Maximum number of files to keep open at the same time (use default if == 0)
static int FLAGS_open_files = 0;

S
Sanjay Ghemawat 已提交
174 175 176 177
// Bloom filter bits per key.
// Negative means use default settings.
static int FLAGS_bloom_bits = -1;

178 179 180 181 182
// If true, do not destroy the existing database.  If you set this
// flag and also specify a benchmark that wants a fresh database, that
// benchmark will fail.
static bool FLAGS_use_existing_db = false;

183
// Use the db with the following name.
184
static const char* FLAGS_db = nullptr;
185

186 187 188 189 190
// Number of shards for the block cache is 2 ** FLAGS_cache_numshardbits.
// Negative means use default settings. This is applied only
// if FLAGS_cache_size is non-negative.
static int FLAGS_cache_numshardbits = -1;

191 192 193
// Verify checksum for every block read from storage
static bool FLAGS_verify_checksum = false;

194 195
// Database statistics
static bool FLAGS_statistics = false;
A
Abhishek Kona 已提交
196
static class std::shared_ptr<leveldb::Statistics> dbstats;
197

198 199 200
// Number of write operations to do.  If negative, do FLAGS_num writes.
static long FLAGS_writes = -1;

201 202 203 204
// Per-thread rate limit on writes per second. No limit when <= 0.
// Only for the readwhilewriting test.
static int FLAGS_writes_per_second = 0;

H
heyongqiang 已提交
205 206
// These default values might change if the hardcoded

207 208 209
// Sync all writes to disk
static bool FLAGS_sync = false;

H
heyongqiang 已提交
210 211 212
// If true, do not wait until data is synced to disk.
static bool FLAGS_disable_data_sync = false;

213 214 215
// If true, issue fsync instead of fdatasync
static bool FLAGS_use_fsync = false;

H
heyongqiang 已提交
216 217 218
// If true, do not write WAL for write.
static bool FLAGS_disable_wal = false;

M
Mark Callaghan 已提交
219 220 221 222 223 224 225
// If true, create a snapshot per query when randomread benchmark is used
static bool FLAGS_use_snapshot = false;

// If true, call GetApproximateSizes per query when FLAGS_read_range is > 1
// and randomread benchmark is used
static bool FLAGS_get_approx = false;

226
// The total number of levels
227
static int FLAGS_num_levels = 7;
228

X
Xing Jin 已提交
229
// Target file size at level-1
H
heyongqiang 已提交
230 231
static int FLAGS_target_file_size_base = 2 * 1048576;

X
Xing Jin 已提交
232
// A multiplier to compute target level-N file size (N >= 2)
H
heyongqiang 已提交
233 234
static int FLAGS_target_file_size_multiplier = 1;

235
// Max bytes for level-1
236
static uint64_t FLAGS_max_bytes_for_level_base = 10 * 1048576;
H
heyongqiang 已提交
237

X
Xing Jin 已提交
238
// A multiplier to compute max bytes for level-N (N >= 2)
H
heyongqiang 已提交
239 240
static int FLAGS_max_bytes_for_level_multiplier = 10;

241 242 243
// A vector that specifies additional fanout per level
static std::vector<int> FLAGS_max_bytes_for_level_multiplier_additional;

H
heyongqiang 已提交
244 245 246
// Number of files in level-0 that will trigger put stop.
static int FLAGS_level0_stop_writes_trigger = 12;

247 248
// Number of files in level-0 that will slow down writes.
static int FLAGS_level0_slowdown_writes_trigger = 8;
H
heyongqiang 已提交
249

250 251 252
// Number of files in level-0 when compactions start
static int FLAGS_level0_file_num_compaction_trigger = 4;

X
Xing Jin 已提交
253 254 255 256
// Ratio of reads to reads/writes (expressed as percentage) for the
// ReadRandomWriteRandom workload. The default value 90 means 90% operations
// out of all reads and writes operations are reads. In other words, 9 gets
// for every 1 put.
257 258
static int FLAGS_readwritepercent = 90;

X
Xing Jin 已提交
259 260 261 262
// Percentage of deletes out of reads/writes/deletes (used in RandomWithVerify
// only). RandomWithVerify calculates writepercent as
// (100 - FLAGS_readwritepercent - FLAGS_deletepercent), so FLAGS_deletepercent
// must be smaller than (100 - FLAGS_readwritepercent)
263 264
static int FLAGS_deletepercent = 2;

X
Xing Jin 已提交
265
// Option to disable compaction triggered by read.
266 267
static int FLAGS_disable_seek_compaction = false;

268 269 270 271 272
// Option to delete obsolete files periodically
// Default: 0 which means that obsolete files are
// deleted after every compaction run.
static uint64_t FLAGS_delete_obsolete_files_period_micros = 0;

X
Xing Jin 已提交
273
// Algorithm used to compress the database
274 275 276
static enum leveldb::CompressionType FLAGS_compression_type =
    leveldb::kSnappyCompression;

X
Xing Jin 已提交
277 278 279
// If non-negative, compression starts from this level. Levels with number
// < FLAGS_min_level_to_compress are not compressed.
// Otherwise, apply FLAGS_compression_type to all levels.
280
static int FLAGS_min_level_to_compress = -1;
281

282 283
static int FLAGS_table_cache_numshardbits = 4;

284 285 286
// posix or hdfs environment
static leveldb::Env* FLAGS_env = leveldb::Env::Default();

287 288
// Stats are reported every N operations when this is greater
// than zero. When 0 the interval grows over time.
289
static long long FLAGS_stats_interval = 0;
290

291 292 293 294
// Reports additional stats per interval when this is greater
// than 0.
static int FLAGS_stats_per_interval = 0;

J
Jim Paton 已提交
295 296
static double FLAGS_soft_rate_limit = 0;

297 298 299
// When not equal to 0 this makes threads sleep at each stats
// reporting interval until the compaction score for all levels is
// less than or equal to this value.
J
Jim Paton 已提交
300
static double FLAGS_hard_rate_limit = 0;
301

J
Jim Paton 已提交
302 303 304
// When FLAGS_hard_rate_limit is set then this is the max time a put will be
// stalled.
static int FLAGS_rate_limit_delay_max_milliseconds = 1000;
305

306 307
// Control maximum bytes of overlaps in grandparent (i.e., level+2) before we
// stop building a single file in a level->level+1 compaction.
308
static int FLAGS_max_grandparent_overlap_factor = 10;
309

H
heyongqiang 已提交
310 311 312
// Run read only benchmarks.
static bool FLAGS_read_only = false;

313 314 315
// Do not auto trigger compactions
static bool FLAGS_disable_auto_compactions = false;

X
Xing Jin 已提交
316 317
// Cap the size of data in level-K for a compaction run
// that compacts Level-K with Level-(K+1) (for K >= 1)
318 319
static int FLAGS_source_compaction_factor = 1;

320 321 322
// Set the TTL for the WAL Files.
static uint64_t FLAGS_WAL_ttl_seconds = 0;

323 324 325 326 327 328 329 330 331
// Allow buffered io using OS buffers
static bool FLAGS_use_os_buffer;

// Allow reads to occur via mmap-ing files
static bool FLAGS_use_mmap_reads;

// Allow writes to occur via mmap-ing files
static bool FLAGS_use_mmap_writes;

332 333 334 335 336 337 338 339
// Advise random access on table file open
static bool FLAGS_advise_random_on_open =
  leveldb::Options().advise_random_on_open;

// Access pattern advice when a file is compacted
static auto FLAGS_compaction_fadvice =
  leveldb::Options().access_hint_on_compaction_start;

340 341 342 343 344 345 346 347 348 349 350
// Use multiget to access a series of keys instead of get
static bool FLAGS_use_multiget = false;

// If FLAGS_use_multiget is true, determines number of keys to group per call
// Arbitrary default. 90 is good because it agrees with FLAGS_readwritepercent
static long FLAGS_keys_per_multiget = 90;

// Print a message to user when a key is missing in a Get/MultiGet call
// TODO: Apply this flag to generic Get calls too. Currently only with Multiget
static bool FLAGS_warn_missing_keys = true;

H
Haobo Xu 已提交
351 352 353 354
// Use adaptive mutex
static auto FLAGS_use_adaptive_mutex =
  leveldb::Options().use_adaptive_mutex;

H
Haobo Xu 已提交
355 356 357 358 359 360
// Allows OS to incrementally sync files to disk while they are being
// written, in the background. Issue one request for every bytes_per_sync
// written. 0 turns it off.
static auto FLAGS_bytes_per_sync =
  leveldb::Options().bytes_per_sync;

361
// On true, deletes use bloom-filter and drop the delete if key not present
362
static bool FLAGS_filter_deletes = false;
363

J
Jim Paton 已提交
364 365 366 367 368 369 370 371 372 373 374 375
// Control the prefix size for PrefixHashRep.
// Stored as an int: a bool would collapse every non-zero size to 1.
static int FLAGS_prefix_size = 0;

// Memtable representations known to the benchmark.  PrintHeader() reports
// the selected one on its "Memtablerep: ..." line.
enum RepFactory {
  kSkipList,     // reported as "skip_list"
  kPrefixHash,   // reported as "prefix_hash"
  kUnsorted,     // reported as "unsorted"
  kVectorRep     // reported as "vector"
};

// Currently selected memtable representation.  There is no initializer, so
// static zero-initialization applies, which corresponds to kSkipList.
static enum RepFactory FLAGS_rep_factory;

D
Deon Nicholas 已提交
376 377 378 379 380
// The merge operator to use with the database.
// If a new merge operator is specified, be sure to use fresh database
// The possible merge operators are defined in utilities/merge_operators.h
static std::string FLAGS_merge_operator = "";

J
jorlow@chromium.org 已提交
381 382
namespace leveldb {

383
// Helper for quickly generating random data.
J
jorlow@chromium.org 已提交
384 385 386
class RandomGenerator {
 private:
  std::string data_;
387
  unsigned int pos_;
J
jorlow@chromium.org 已提交
388 389 390 391 392 393 394 395

 public:
  RandomGenerator() {
    // We use a limited amount of data over and over again and ensure
    // that it is larger than the compression window (32KB), and also
    // large enough to serve all typical value sizes we want to write.
    Random rnd(301);
    std::string piece;
396
    while (data_.size() < (unsigned)std::max(1048576, FLAGS_value_size)) {
J
jorlow@chromium.org 已提交
397 398 399 400 401 402 403 404
      // Add a short fragment that is as compressible as specified
      // by FLAGS_compression_ratio.
      test::CompressibleString(&rnd, FLAGS_compression_ratio, 100, &piece);
      data_.append(piece);
    }
    pos_ = 0;
  }

405
  Slice Generate(unsigned int len) {
J
jorlow@chromium.org 已提交
406 407 408 409 410 411 412
    if (pos_ + len > data_.size()) {
      pos_ = 0;
      assert(len < data_.size());
    }
    pos_ += len;
    return Slice(data_.data() + pos_ - len, len);
  }
413
};
X
Xing Jin 已提交
414

415
// Returns the portion of s that remains after dropping leading and trailing
// characters for which isspace() is true.  The result refers to the same
// underlying bytes as s; nothing is copied.
static Slice TrimSpace(Slice s) {
  // size_t avoids truncating s.size(); the unsigned char cast is required
  // because isspace() is undefined for negative char values.
  size_t start = 0;
  while (start < s.size() &&
         isspace(static_cast<unsigned char>(s[start]))) {
    start++;
  }
  size_t limit = s.size();
  while (limit > start &&
         isspace(static_cast<unsigned char>(s[limit - 1]))) {
    limit--;
  }
  return Slice(s.data() + start, limit - start);
}

427 428 429 430 431 432 433 434 435 436
// Appends msg to *str, inserting a single space first when *str already has
// content.  An empty msg leaves *str untouched.
static void AppendWithSpace(std::string* str, Slice msg) {
  if (!msg.empty()) {
    if (!str->empty()) {
      str->push_back(' ');
    }
    str->append(msg.data(), msg.size());
  }
}

class Stats {
 private:
437
  int id_;
438 439 440
  double start_;
  double finish_;
  double seconds_;
441 442 443
  long long done_;
  long long last_report_done_;
  long long next_report_;
444 445
  int64_t bytes_;
  double last_op_finish_;
446
  double last_report_finish_;
447
  HistogramImpl hist_;
448
  std::string message_;
449
  bool exclude_from_merge_;
450 451

 public:
452
  Stats() { Start(-1); }
453

454 455 456
  void Start(int id) {
    id_ = id;
    next_report_ = FLAGS_stats_interval ? FLAGS_stats_interval : 100;
457 458 459
    last_op_finish_ = start_;
    hist_.Clear();
    done_ = 0;
460
    last_report_done_ = 0;
461 462
    bytes_ = 0;
    seconds_ = 0;
463
    start_ = FLAGS_env->NowMicros();
464
    finish_ = start_;
465
    last_report_finish_ = start_;
466
    message_.clear();
467 468
    // When set, stats from this thread won't be merged with others.
    exclude_from_merge_ = false;
469 470 471
  }

  void Merge(const Stats& other) {
472 473 474
    if (other.exclude_from_merge_)
      return;

475 476 477 478 479 480 481 482 483 484 485 486
    hist_.Merge(other.hist_);
    done_ += other.done_;
    bytes_ += other.bytes_;
    seconds_ += other.seconds_;
    if (other.start_ < start_) start_ = other.start_;
    if (other.finish_ > finish_) finish_ = other.finish_;

    // Just keep the messages from one thread
    if (message_.empty()) message_ = other.message_;
  }

  void Stop() {
487
    finish_ = FLAGS_env->NowMicros();
488 489 490 491 492 493 494
    seconds_ = (finish_ - start_) * 1e-6;
  }

  void AddMessage(Slice msg) {
    AppendWithSpace(&message_, msg);
  }

495
  void SetId(int id) { id_ = id; }
496
  void SetExcludeFromMerge() { exclude_from_merge_ = true; }
497

M
Mark Callaghan 已提交
498
  void FinishedSingleOp(DB* db) {
499
    if (FLAGS_histogram) {
500
      double now = FLAGS_env->NowMicros();
501 502
      double micros = now - last_op_finish_;
      hist_.Add(micros);
503
      if (micros > 20000 && !FLAGS_stats_interval) {
504 505 506 507 508 509 510 511
        fprintf(stderr, "long op: %.1f micros%30s\r", micros, "");
        fflush(stderr);
      }
      last_op_finish_ = now;
    }

    done_++;
    if (done_ >= next_report_) {
512 513 514 515 516 517 518 519
      if (!FLAGS_stats_interval) {
        if      (next_report_ < 1000)   next_report_ += 100;
        else if (next_report_ < 5000)   next_report_ += 500;
        else if (next_report_ < 10000)  next_report_ += 1000;
        else if (next_report_ < 50000)  next_report_ += 5000;
        else if (next_report_ < 100000) next_report_ += 10000;
        else if (next_report_ < 500000) next_report_ += 50000;
        else                            next_report_ += 100000;
520
        fprintf(stderr, "... finished %lld ops%30s\r", done_, "");
521 522 523 524
        fflush(stderr);
      } else {
        double now = FLAGS_env->NowMicros();
        fprintf(stderr,
525 526
                "%s ... thread %d: (%lld,%lld) ops and "
                "(%.1f,%.1f) ops/second in (%.6f,%.6f) seconds\n",
527
                FLAGS_env->TimeToString((uint64_t) now/1000000).c_str(),
528
                id_,
M
Mark Callaghan 已提交
529
                done_ - last_report_done_, done_,
530
                (done_ - last_report_done_) /
M
Mark Callaghan 已提交
531 532 533 534
                ((now - last_report_finish_) / 1000000.0),
                done_ / ((now - start_) / 1000000.0),
                (now - last_report_finish_) / 1000000.0,
                (now - start_) / 1000000.0);
M
Mark Callaghan 已提交
535

536 537 538
        if (FLAGS_stats_per_interval) {
          std::string stats;
          if (db && db->GetProperty("leveldb.stats", &stats))
539
            fprintf(stderr, "%s\n", stats.c_str());
540
        }
M
Mark Callaghan 已提交
541

542 543 544 545 546
        fflush(stderr);
        next_report_ += FLAGS_stats_interval;
        last_report_finish_ = now;
        last_report_done_ = done_;
      }
547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569
    }
  }

  void AddBytes(int64_t n) {
    bytes_ += n;
  }

  void Report(const Slice& name) {
    // Pretend at least one op was done in case we are running a benchmark
    // that does not call FinishedSingleOp().
    if (done_ < 1) done_ = 1;

    std::string extra;
    if (bytes_ > 0) {
      // Rate is computed on actual elapsed time, not the sum of per-thread
      // elapsed times.
      double elapsed = (finish_ - start_) * 1e-6;
      char rate[100];
      snprintf(rate, sizeof(rate), "%6.1f MB/s",
               (bytes_ / 1048576.0) / elapsed);
      extra = rate;
    }
    AppendWithSpace(&extra, message_);
570 571
    double elapsed = (finish_ - start_) * 1e-6;
    double throughput = (double)done_/elapsed;
572

D
Dhruba Borthakur 已提交
573
    fprintf(stdout, "%-12s : %11.3f micros/op %ld ops/sec;%s%s\n",
574
            name.ToString().c_str(),
575
            elapsed * 1e6 / done_,
D
Dhruba Borthakur 已提交
576
            (long)throughput,
577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597
            (extra.empty() ? "" : " "),
            extra.c_str());
    if (FLAGS_histogram) {
      fprintf(stdout, "Microseconds per op:\n%s\n", hist_.ToString().c_str());
    }
    fflush(stdout);
  }
};

// State shared by all concurrent executions of the same benchmark.
struct SharedState {
  port::Mutex mu;
  port::CondVar cv;  // Bound to mu by the constructor
  int total;

  // Lifecycle of every participating thread:
  //    (1) initializing
  //    (2) waiting for others to be initialized
  //    (3) running
  //    (4) done

  // NOTE(review): the counters and the flag below are not initialized by the
  // constructor; presumably the code that launches the threads sets them.
  long num_initialized;
  long num_done;
  bool start;

  SharedState() : cv(&mu) {}
};

// Per-thread state for concurrent executions of the same benchmark.
struct ThreadState {
  int tid;             // 0..n-1 when running in n threads
608
  Random64 rand;         // Has different seeds for different threads
609
  Stats stats;
610
  SharedState* shared;
611

A
Abhishek Kona 已提交
612
  /* implicit */ ThreadState(int index)
613
      : tid(index),
614
        rand((FLAGS_seed ? FLAGS_seed : 1000) + index) {
615 616 617
  }
};

M
Mark Callaghan 已提交
618 619
class Duration {
 public:
620
  Duration(int max_seconds, long long max_ops) {
M
Mark Callaghan 已提交
621 622 623 624 625 626 627
    max_seconds_ = max_seconds;
    max_ops_= max_ops;
    ops_ = 0;
    start_at_ = FLAGS_env->NowMicros();
  }

  bool Done(int increment) {
628
    if (increment <= 0) increment = 1;    // avoid Done(0) and infinite loops
M
Mark Callaghan 已提交
629 630 631
    ops_ += increment;

    if (max_seconds_) {
632 633
      // Recheck every appx 1000 ops (exact iff increment is factor of 1000)
      if ((ops_/1000) != ((ops_-increment)/1000)) {
M
Mark Callaghan 已提交
634 635 636 637 638 639 640 641 642 643 644 645
        double now = FLAGS_env->NowMicros();
        return ((now - start_at_) / 1000000.0) >= max_seconds_;
      } else {
        return false;
      }
    } else {
      return ops_ > max_ops_;
    }
  }

 private:
  int max_seconds_;
646 647
  long long max_ops_;
  long long ops_;
M
Mark Callaghan 已提交
648 649 650
  double start_at_;
};

J
jorlow@chromium.org 已提交
651 652
class Benchmark {
 private:
653
  shared_ptr<Cache> cache_;
S
Sanjay Ghemawat 已提交
654
  const FilterPolicy* filter_policy_;
T
Tyler Harter 已提交
655
  const SliceTransform* prefix_extractor_;
J
jorlow@chromium.org 已提交
656
  DB* db_;
657
  long long num_;
658
  int value_size_;
659
  int key_size_;
660 661
  int entries_per_batch_;
  WriteOptions write_options_;
662 663 664
  long long reads_;
  long long writes_;
  long long readwrites_;
J
jorlow@chromium.org 已提交
665
  int heap_counter_;
666
  char keyFormat_[100]; // this string will contain the format of key. e.g "%016d"
667 668
  void PrintHeader() {
    PrintEnvironment();
669
    fprintf(stdout, "Keys:       %d bytes each\n", FLAGS_key_size);
670 671 672
    fprintf(stdout, "Values:     %d bytes each (%d bytes after compression)\n",
            FLAGS_value_size,
            static_cast<int>(FLAGS_value_size * FLAGS_compression_ratio + 0.5));
673
    fprintf(stdout, "Entries:    %lld\n", num_);
674
    fprintf(stdout, "RawSize:    %.1f MB (estimated)\n",
675
            ((static_cast<int64_t>(FLAGS_key_size + FLAGS_value_size) * num_)
676
             / 1048576.0));
677
    fprintf(stdout, "FileSize:   %.1f MB (estimated)\n",
678
            (((FLAGS_key_size + FLAGS_value_size * FLAGS_compression_ratio) * num_)
679
             / 1048576.0));
680
    fprintf(stdout, "Write rate limit: %d\n", FLAGS_writes_per_second);
681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696

    switch (FLAGS_compression_type) {
      case leveldb::kNoCompression:
        fprintf(stdout, "Compression: none\n");
        break;
      case leveldb::kSnappyCompression:
        fprintf(stdout, "Compression: snappy\n");
        break;
      case leveldb::kZlibCompression:
        fprintf(stdout, "Compression: zlib\n");
        break;
      case leveldb::kBZip2Compression:
        fprintf(stdout, "Compression: bzip2\n");
        break;
    }

J
Jim Paton 已提交
697 698 699 700 701 702 703 704 705 706 707 708 709 710 711
    switch (FLAGS_rep_factory) {
      case kPrefixHash:
        fprintf(stdout, "Memtablerep: prefix_hash\n");
        break;
      case kSkipList:
        fprintf(stdout, "Memtablerep: skip_list\n");
        break;
      case kUnsorted:
        fprintf(stdout, "Memtablerep: unsorted\n");
        break;
      case kVectorRep:
        fprintf(stdout, "Memtablerep: vector\n");
        break;
    }

712 713 714 715 716 717 718 719 720 721 722 723 724 725
    PrintWarnings();
    fprintf(stdout, "------------------------------------------------\n");
  }

  void PrintWarnings() {
#if defined(__GNUC__) && !defined(__OPTIMIZE__)
    fprintf(stdout,
            "WARNING: Optimization is disabled: benchmarks unnecessarily slow\n"
            );
#endif
#ifndef NDEBUG
    fprintf(stdout,
            "WARNING: Assertions are enabled; benchmarks unnecessarily slow\n");
#endif
726

727 728 729 730 731
    if (FLAGS_compression_type != leveldb::kNoCompression) {
      // The test string should not be too small.
      const int len = FLAGS_block_size;
      char* text = (char*) malloc(len+1);
      bool result = true;
732
      const char* name = nullptr;
733 734 735 736 737 738 739
      std::string compressed;

      memset(text, (int) 'y', len);
      text[len] = '\0';

      switch (FLAGS_compression_type) {
        case kSnappyCompression:
740 741
          result = port::Snappy_Compress(Options().compression_opts, text,
                                         strlen(text), &compressed);
742 743 744
          name = "Snappy";
          break;
        case kZlibCompression:
745 746
          result = port::Zlib_Compress(Options().compression_opts, text,
                                       strlen(text), &compressed);
747 748 749
          name = "Zlib";
          break;
        case kBZip2Compression:
750 751
          result = port::BZip2_Compress(Options().compression_opts, text,
                                        strlen(text), &compressed);
752 753
          name = "BZip2";
          break;
754 755 756
        case kNoCompression:
          assert(false); // cannot happen
          break;
757 758 759 760 761 762 763 764 765
      }

      if (!result) {
        fprintf(stdout, "WARNING: %s compression is not enabled\n", name);
      } else if (name && compressed.size() >= strlen(text)) {
        fprintf(stdout, "WARNING: %s compression is not effective\n", name);
      }

      free(text);
766
    }
767 768 769 770 771 772 773
  }

  void PrintEnvironment() {
    fprintf(stderr, "LevelDB:    version %d.%d\n",
            kMajorVersion, kMinorVersion);

#if defined(__linux)
774
    time_t now = time(nullptr);
775 776 777
    fprintf(stderr, "Date:       %s", ctime(&now));  // ctime() adds newline

    FILE* cpuinfo = fopen("/proc/cpuinfo", "r");
778
    if (cpuinfo != nullptr) {
779 780 781 782
      char line[1000];
      int num_cpus = 0;
      std::string cpu_type;
      std::string cache_size;
783
      while (fgets(line, sizeof(line), cpuinfo) != nullptr) {
784
        const char* sep = strchr(line, ':');
785
        if (sep == nullptr) {
786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803
          continue;
        }
        Slice key = TrimSpace(Slice(line, sep - 1 - line));
        Slice val = TrimSpace(Slice(sep + 1));
        if (key == "model name") {
          ++num_cpus;
          cpu_type = val.ToString();
        } else if (key == "cache size") {
          cache_size = val.ToString();
        }
      }
      fclose(cpuinfo);
      fprintf(stderr, "CPU:        %d * %s\n", num_cpus, cpu_type.c_str());
      fprintf(stderr, "CPUCache:   %s\n", cache_size.c_str());
    }
#endif
  }

J
jorlow@chromium.org 已提交
804
 public:
805
  Benchmark()
806 807 808
  : cache_(FLAGS_cache_size >= 0 ?
           (FLAGS_cache_numshardbits >= 1 ?
            NewLRUCache(FLAGS_cache_size, FLAGS_cache_numshardbits) :
809
            NewLRUCache(FLAGS_cache_size)) : nullptr),
S
Sanjay Ghemawat 已提交
810 811
    filter_policy_(FLAGS_bloom_bits >= 0
                   ? NewBloomFilterPolicy(FLAGS_bloom_bits)
812
                   : nullptr),
T
Tyler Harter 已提交
813
    prefix_extractor_(NewFixedPrefixTransform(FLAGS_key_size-1)),
814
    db_(nullptr),
815
    num_(FLAGS_num),
816
    value_size_(FLAGS_value_size),
817
    key_size_(FLAGS_key_size),
818
    entries_per_batch_(1),
819
    reads_(FLAGS_reads < 0 ? FLAGS_num : FLAGS_reads),
820
    writes_(FLAGS_writes < 0 ? FLAGS_num : FLAGS_writes),
821
    readwrites_((FLAGS_writes < 0  && FLAGS_reads < 0)? FLAGS_num :
822
                ((FLAGS_writes > FLAGS_reads) ? FLAGS_writes : FLAGS_reads)
823
               ),
824
    heap_counter_(0) {
J
jorlow@chromium.org 已提交
825
    std::vector<std::string> files;
826
    FLAGS_env->GetChildren(FLAGS_db, &files);
827
    for (unsigned int i = 0; i < files.size(); i++) {
J
jorlow@chromium.org 已提交
828
      if (Slice(files[i]).starts_with("heap-")) {
829
        FLAGS_env->DeleteFile(std::string(FLAGS_db) + "/" + files[i]);
J
jorlow@chromium.org 已提交
830 831
      }
    }
832
    if (!FLAGS_use_existing_db) {
833
      DestroyDB(FLAGS_db, Options());
834
    }
J
jorlow@chromium.org 已提交
835 836 837 838
  }

  // Frees the objects held through raw pointers.  The database handle is
  // deleted first, ahead of the filter policy and prefix extractor that were
  // handed to it through Options in Open().
  ~Benchmark() {
    delete db_;
    delete filter_policy_;
    delete prefix_extractor_;
  }

843
  // Writes into `str` the printf-style format used to render keys:
  // "%0<keySize>lld%s", e.g. "%016lld%s" for keySize == 16.  The leading
  // conversion zero-pads the integer key to keySize digits; the trailing
  // "%s" receives an optional suffix.
  // `str` must be large enough for the result; no bound is enforced here.
  void ConstructStrFormatForKey(char* str, int keySize) {
    // "%%" emits a literal '%', so only the width is substituted.
    sprintf(str, "%%0%dlld%%s", keySize);
  }

850
  // Renders `v` followed by `suffix` through keyFormat_ into a newly
  // allocated buffer of MAX_KEY_SIZE bytes and hands ownership of that
  // buffer to the caller.  Output is bounded by MAX_KEY_SIZE via snprintf.
  unique_ptr<char []> GenerateKeyFromInt(long long v, const char* suffix = "") {
    char* const buf = new char[MAX_KEY_SIZE];
    snprintf(buf, MAX_KEY_SIZE, keyFormat_, v, suffix);
    return unique_ptr<char []>(buf);
  }

J
jorlow@chromium.org 已提交
856
  void Run() {
857 858
    PrintHeader();
    Open();
J
jorlow@chromium.org 已提交
859 860

    const char* benchmarks = FLAGS_benchmarks;
861
    while (benchmarks != nullptr) {
J
jorlow@chromium.org 已提交
862 863
      const char* sep = strchr(benchmarks, ',');
      Slice name;
864
      if (sep == nullptr) {
J
jorlow@chromium.org 已提交
865
        name = benchmarks;
866
        benchmarks = nullptr;
J
jorlow@chromium.org 已提交
867 868 869 870 871
      } else {
        name = Slice(benchmarks, sep - benchmarks);
        benchmarks = sep + 1;
      }

X
Xing Jin 已提交
872
      // Sanitize parameters
873
      num_ = FLAGS_num;
874
      reads_ = (FLAGS_reads < 0 ? FLAGS_num : FLAGS_reads);
875
      writes_ = (FLAGS_writes < 0 ? FLAGS_num : FLAGS_writes);
876
      value_size_ = FLAGS_value_size;
877 878
      key_size_ = FLAGS_key_size;
      ConstructStrFormatForKey(keyFormat_, key_size_);
879 880
      entries_per_batch_ = 1;
      write_options_ = WriteOptions();
881 882 883
      if (FLAGS_sync) {
        write_options_.sync = true;
      }
H
heyongqiang 已提交
884 885
      write_options_.disableWAL = FLAGS_disable_wal;

886
      void (Benchmark::*method)(ThreadState*) = nullptr;
887
      bool fresh_db = false;
888
      int num_threads = FLAGS_threads;
889 890

      if (name == Slice("fillseq")) {
891 892
        fresh_db = true;
        method = &Benchmark::WriteSeq;
893
      } else if (name == Slice("fillbatch")) {
894 895 896
        fresh_db = true;
        entries_per_batch_ = 1000;
        method = &Benchmark::WriteSeq;
897
      } else if (name == Slice("fillrandom")) {
898 899
        fresh_db = true;
        method = &Benchmark::WriteRandom;
900 901 902 903 904 905 906 907
      } else if (name == Slice("filluniquerandom")) {
        fresh_db = true;
        if (num_threads > 1) {
          fprintf(stderr, "filluniquerandom multithreaded not supported"
                           " set --threads=1");
          exit(1);
        }
        method = &Benchmark::WriteUniqueRandom;
908
      } else if (name == Slice("overwrite")) {
909 910
        fresh_db = false;
        method = &Benchmark::WriteRandom;
911
      } else if (name == Slice("fillsync")) {
912 913 914 915
        fresh_db = true;
        num_ /= 1000;
        write_options_.sync = true;
        method = &Benchmark::WriteRandom;
916
      } else if (name == Slice("fill100K")) {
917 918 919 920
        fresh_db = true;
        num_ /= 1000;
        value_size_ = 100 * 1000;
        method = &Benchmark::WriteRandom;
J
jorlow@chromium.org 已提交
921
      } else if (name == Slice("readseq")) {
922
        method = &Benchmark::ReadSequential;
J
jorlow@chromium.org 已提交
923
      } else if (name == Slice("readreverse")) {
924
        method = &Benchmark::ReadReverse;
J
jorlow@chromium.org 已提交
925
      } else if (name == Slice("readrandom")) {
926
        method = &Benchmark::ReadRandom;
S
Sanjay Ghemawat 已提交
927 928 929 930
      } else if (name == Slice("readmissing")) {
        method = &Benchmark::ReadMissing;
      } else if (name == Slice("seekrandom")) {
        method = &Benchmark::SeekRandom;
931
      } else if (name == Slice("readhot")) {
932
        method = &Benchmark::ReadHot;
933
      } else if (name == Slice("readrandomsmall")) {
934
        reads_ /= 1000;
935
        method = &Benchmark::ReadRandom;
T
Tyler Harter 已提交
936 937
      } else if (name == Slice("prefixscanrandom")) {
        method = &Benchmark::PrefixScanRandom;
S
Sanjay Ghemawat 已提交
938 939 940 941
      } else if (name == Slice("deleteseq")) {
        method = &Benchmark::DeleteSeq;
      } else if (name == Slice("deleterandom")) {
        method = &Benchmark::DeleteRandom;
942 943 944
      } else if (name == Slice("readwhilewriting")) {
        num_threads++;  // Add extra thread for writing
        method = &Benchmark::ReadWhileWriting;
945 946
      } else if (name == Slice("readrandomwriterandom")) {
        method = &Benchmark::ReadRandomWriteRandom;
M
Mark Callaghan 已提交
947 948
      } else if (name == Slice("updaterandom")) {
        method = &Benchmark::UpdateRandom;
D
Deon Nicholas 已提交
949 950 951 952 953 954 955 956 957 958
      } else if (name == Slice("appendrandom")) {
        method = &Benchmark::AppendRandom;
      } else if (name == Slice("mergerandom")) {
        if (FLAGS_merge_operator.empty()) {
          fprintf(stdout, "%-12s : skipped (--merge_operator is unknown)\n",
                  name.ToString().c_str());
          method = nullptr;
        } else {
          method = &Benchmark::MergeRandom;
        }
959 960
      } else if (name == Slice("randomwithverify")) {
        method = &Benchmark::RandomWithVerify;
J
jorlow@chromium.org 已提交
961
      } else if (name == Slice("compact")) {
962
        method = &Benchmark::Compact;
J
jorlow@chromium.org 已提交
963
      } else if (name == Slice("crc32c")) {
964
        method = &Benchmark::Crc32c;
965
      } else if (name == Slice("acquireload")) {
966
        method = &Benchmark::AcquireLoad;
967
      } else if (name == Slice("snappycomp")) {
968
        method = &Benchmark::SnappyCompress;
969
      } else if (name == Slice("snappyuncomp")) {
970
        method = &Benchmark::SnappyUncompress;
J
jorlow@chromium.org 已提交
971 972
      } else if (name == Slice("heapprofile")) {
        HeapProfile();
973
      } else if (name == Slice("stats")) {
S
Sanjay Ghemawat 已提交
974
        PrintStats("leveldb.stats");
975 976
      } else if (name == Slice("levelstats")) {
        PrintStats("leveldb.levelstats");
S
Sanjay Ghemawat 已提交
977 978
      } else if (name == Slice("sstables")) {
        PrintStats("leveldb.sstables");
J
jorlow@chromium.org 已提交
979
      } else {
980 981 982 983
        if (name != Slice()) {  // No error message for empty name
          fprintf(stderr, "unknown benchmark '%s'\n", name.ToString().c_str());
        }
      }
984 985 986 987 988

      if (fresh_db) {
        if (FLAGS_use_existing_db) {
          fprintf(stdout, "%-12s : skipped (--use_existing_db is true)\n",
                  name.ToString().c_str());
989
          method = nullptr;
990 991
        } else {
          delete db_;
992
          db_ = nullptr;
993 994 995 996 997
          DestroyDB(FLAGS_db, Options());
          Open();
        }
      }

998
      if (method != nullptr) {
999
        fprintf(stdout, "DB path: [%s]\n", FLAGS_db);
1000
        RunBenchmark(num_threads, name, method);
J
jorlow@chromium.org 已提交
1001 1002
      }
    }
1003 1004 1005
    if (FLAGS_statistics) {
     fprintf(stdout, "STATISTICS:\n%s\n", dbstats->ToString().c_str());
    }
J
jorlow@chromium.org 已提交
1006 1007
  }

1008
 private:
1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024 1025 1026 1027 1028 1029 1030
  // Per-thread argument bundle passed (as void*) to ThreadBody().
  struct ThreadArg {
    Benchmark* bm;        // benchmark object on which `method` is invoked
    SharedState* shared;  // start/finish rendezvous state common to all threads
    ThreadState* thread;  // this thread's own state, including its stats
    void (Benchmark::*method)(ThreadState*);  // benchmark method to run
  };

  static void ThreadBody(void* v) {
    ThreadArg* arg = reinterpret_cast<ThreadArg*>(v);
    SharedState* shared = arg->shared;
    ThreadState* thread = arg->thread;
    {
      MutexLock l(&shared->mu);
      shared->num_initialized++;
      if (shared->num_initialized >= shared->total) {
        shared->cv.SignalAll();
      }
      while (!shared->start) {
        shared->cv.Wait();
      }
    }

1031
    thread->stats.Start(thread->tid);
1032 1033 1034 1035 1036 1037 1038 1039 1040 1041 1042 1043
    (arg->bm->*(arg->method))(thread);
    thread->stats.Stop();

    {
      MutexLock l(&shared->mu);
      shared->num_done++;
      if (shared->num_done >= shared->total) {
        shared->cv.SignalAll();
      }
    }
  }

1044 1045
  // Runs `method` concurrently on `n` threads and reports the merged
  // statistics under `name`.
  //
  // All threads are started first; the benchmark begins only after every
  // thread has checked in, and this function returns only after every thread
  // has finished.
  void RunBenchmark(int n, Slice name,
                    void (Benchmark::*method)(ThreadState*)) {
    SharedState shared;
    shared.total = n;
    shared.num_initialized = 0;
    shared.num_done = 0;
    shared.start = false;

    // One argument bundle (and one ThreadState) per thread.
    ThreadArg* const args = new ThreadArg[n];
    for (int t = 0; t < n; ++t) {
      ThreadArg& a = args[t];
      a.bm = this;
      a.method = method;
      a.shared = &shared;
      a.thread = new ThreadState(t);
      a.thread->shared = &shared;
      FLAGS_env->StartThread(ThreadBody, &a);
    }

    {
      MutexLock guard(&shared.mu);
      // Wait for every thread to check in ...
      while (shared.num_initialized < n) {
        shared.cv.Wait();
      }
      // ... release them all at once ...
      shared.start = true;
      shared.cv.SignalAll();
      // ... and wait for every thread to finish.
      while (shared.num_done < n) {
        shared.cv.Wait();
      }
    }

    // Fold the per-thread stats into one report.
    Stats merged;
    for (int t = 0; t < n; ++t) {
      merged.Merge(args[t].thread->stats);
    }
    merged.Report(name);

    for (int t = 0; t < n; ++t) {
      delete args[t].thread;
    }
    delete[] args;
  }

  // CRC32C micro-benchmark: repeatedly checksums one 4096-byte buffer of
  // 'x' characters until about 500MB have been processed.  Each checksum
  // counts as one operation.
  void Crc32c(ThreadState* thread) {
    const int kBlockSize = 4096;
    const std::string block(kBlockSize, 'x');

    uint32_t crc = 0;
    int64_t done = 0;
    for (; done < 500 * 1048576; done += kBlockSize) {
      crc = crc32c::Value(block.data(), kBlockSize);
      thread->stats.FinishedSingleOp(nullptr);
    }
    // Print the checksum so the computation cannot be optimized away.
    fprintf(stderr, "... crc=0x%x\r", static_cast<unsigned int>(crc));

    thread->stats.AddBytes(done);
    thread->stats.AddMessage("(4K per op)");
  }

1106
  // Micro-benchmark for port::AtomicPointer::Acquire_Load(): performs
  // 100000 operations, each consisting of 1000 acquire-loads.
  void AcquireLoad(ThreadState* thread) {
    int dummy;
    port::AtomicPointer ap(&dummy);
    void* last = nullptr;
    thread->stats.AddMessage("(each op is 1000 loads)");
    for (int op = 0; op < 100000; ++op) {
      for (int load = 0; load < 1000; ++load) {
        last = ap.Acquire_Load();
      }
      thread->stats.FinishedSingleOp(nullptr);
    }
    // Consume the loaded value so the compiler does not flag it as unused.
    if (last == nullptr) exit(1);
  }

1122 1123 1124
  // Snappy compression micro-benchmark: compresses one generated block of
  // Options().block_size bytes over and over until 1G of input has been
  // consumed (or a compression call fails), then reports the output/input
  // size ratio.
  void SnappyCompress(ThreadState* thread) {
    RandomGenerator gen;
    Slice input = gen.Generate(Options().block_size);

    std::string out;
    int64_t consumed = 0;  // input bytes fed to the compressor
    int64_t emitted = 0;   // compressed bytes produced
    bool ok = true;
    while (ok && consumed < 1024 * 1048576) {  // Compress 1G
      ok = port::Snappy_Compress(Options().compression_opts, input.data(),
                                 input.size(), &out);
      emitted += out.size();
      consumed += input.size();
      thread->stats.FinishedSingleOp(nullptr);
    }

    if (ok) {
      char buf[100];
      snprintf(buf, sizeof(buf), "(output: %.1f%%)",
               (emitted * 100.0) / consumed);
      thread->stats.AddMessage(buf);
      thread->stats.AddBytes(consumed);
    } else {
      thread->stats.AddMessage("(snappy failure)");
    }
  }

1148 1149 1150
  // Snappy decompression micro-benchmark: compresses one generated block
  // once, then decompresses it repeatedly until 1G of uncompressed data has
  // been produced (or a call fails).
  void SnappyUncompress(ThreadState* thread) {
    RandomGenerator gen;
    Slice input = gen.Generate(Options().block_size);

    std::string compressed;
    bool ok = port::Snappy_Compress(Options().compression_opts, input.data(),
                                    input.size(), &compressed);

    int64_t bytes = 0;
    {
      // Scratch output buffer; released when this scope ends, before the
      // results are recorded.
      unique_ptr<char []> scratch(new char[input.size()]);
      while (ok && bytes < 1024 * 1048576) {  // Uncompress 1G
        ok = port::Snappy_Uncompress(compressed.data(), compressed.size(),
                                     scratch.get());
        bytes += input.size();
        thread->stats.FinishedSingleOp(nullptr);
      }
    }

    if (ok) {
      thread->stats.AddBytes(bytes);
    } else {
      thread->stats.AddMessage("(snappy failure)");
    }
  }

1171
  void Open() {
1172
    assert(db_ == nullptr);
1173
    Options options;
1174
    options.create_if_missing = !FLAGS_use_existing_db;
1175
    options.block_cache = cache_;
1176
    if (cache_ == nullptr) {
1177 1178
      options.no_block_cache = true;
    }
1179
    options.write_buffer_size = FLAGS_write_buffer_size;
1180
    options.max_write_buffer_number = FLAGS_max_write_buffer_number;
1181 1182
    options.min_write_buffer_number_to_merge =
      FLAGS_min_write_buffer_number_to_merge;
1183
    options.max_background_compactions = FLAGS_max_background_compactions;
1184 1185 1186 1187
    options.compaction_style = FLAGS_compaction_style;
    options.compaction_options_universal.size_ratio = FLAGS_universal_size_ratio;
    options.compaction_options_universal.min_merge_width =
      FLAGS_compaction_universal_min_merge_width;
1188
    options.block_size = FLAGS_block_size;
S
Sanjay Ghemawat 已提交
1189
    options.filter_policy = filter_policy_;
T
Tyler Harter 已提交
1190 1191
    options.prefix_extractor = FLAGS_use_prefix_blooms ? prefix_extractor_
                                                       : nullptr;
1192 1193
    options.max_open_files = FLAGS_open_files;
    options.statistics = dbstats;
1194
    options.env = FLAGS_env;
H
heyongqiang 已提交
1195
    options.disableDataSync = FLAGS_disable_data_sync;
1196
    options.use_fsync = FLAGS_use_fsync;
1197
    options.num_levels = FLAGS_num_levels;
H
heyongqiang 已提交
1198 1199 1200 1201 1202
    options.target_file_size_base = FLAGS_target_file_size_base;
    options.target_file_size_multiplier = FLAGS_target_file_size_multiplier;
    options.max_bytes_for_level_base = FLAGS_max_bytes_for_level_base;
    options.max_bytes_for_level_multiplier =
        FLAGS_max_bytes_for_level_multiplier;
1203
    options.filter_deletes = FLAGS_filter_deletes;
J
Jim Paton 已提交
1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228
    if ((FLAGS_prefix_size == 0) == (FLAGS_rep_factory == kPrefixHash)) {
      fprintf(stderr,
            "prefix_size should be non-zero iff memtablerep == prefix_hash\n");
      exit(1);
    }
    switch (FLAGS_rep_factory) {
      case kPrefixHash:
        options.memtable_factory.reset(
          new PrefixHashRepFactory(NewFixedPrefixTransform(FLAGS_prefix_size))
        );
        break;
      case kUnsorted:
        options.memtable_factory.reset(
          new UnsortedRepFactory
        );
        break;
      case kSkipList:
        // no need to do anything
        break;
      case kVectorRep:
        options.memtable_factory.reset(
          new VectorRepFactory
        );
        break;
    }
1229 1230 1231 1232 1233 1234 1235 1236 1237 1238
    if (FLAGS_max_bytes_for_level_multiplier_additional.size() > 0) {
      if (FLAGS_max_bytes_for_level_multiplier_additional.size() !=
          (unsigned int)FLAGS_num_levels) {
        fprintf(stderr, "Insufficient number of fanouts specified %d\n",
                (int)FLAGS_max_bytes_for_level_multiplier_additional.size());
        exit(1);
      }
      options.max_bytes_for_level_multiplier_additional =
        FLAGS_max_bytes_for_level_multiplier_additional;
    }
H
heyongqiang 已提交
1239
    options.level0_stop_writes_trigger = FLAGS_level0_stop_writes_trigger;
M
Mark Callaghan 已提交
1240
    options.level0_file_num_compaction_trigger =
1241
        FLAGS_level0_file_num_compaction_trigger;
H
heyongqiang 已提交
1242 1243
    options.level0_slowdown_writes_trigger =
      FLAGS_level0_slowdown_writes_trigger;
1244
    options.compression = FLAGS_compression_type;
1245
    options.WAL_ttl_seconds = FLAGS_WAL_ttl_seconds;
1246 1247
    if (FLAGS_min_level_to_compress >= 0) {
      assert(FLAGS_min_level_to_compress <= FLAGS_num_levels);
1248
      options.compression_per_level.resize(FLAGS_num_levels);
1249
      for (int i = 0; i < FLAGS_min_level_to_compress; i++) {
1250 1251
        options.compression_per_level[i] = kNoCompression;
      }
1252
      for (int i = FLAGS_min_level_to_compress;
1253 1254 1255 1256
           i < FLAGS_num_levels; i++) {
        options.compression_per_level[i] = FLAGS_compression_type;
      }
    }
1257
    options.disable_seek_compaction = FLAGS_disable_seek_compaction;
1258 1259
    options.delete_obsolete_files_period_micros =
      FLAGS_delete_obsolete_files_period_micros;
J
Jim Paton 已提交
1260 1261 1262 1263
    options.soft_rate_limit = FLAGS_soft_rate_limit;
    options.hard_rate_limit = FLAGS_hard_rate_limit;
    options.rate_limit_delay_max_milliseconds =
      FLAGS_rate_limit_delay_max_milliseconds;
1264
    options.table_cache_numshardbits = FLAGS_table_cache_numshardbits;
A
Abhishek Kona 已提交
1265
    options.max_grandparent_overlap_factor =
1266
      FLAGS_max_grandparent_overlap_factor;
1267
    options.disable_auto_compactions = FLAGS_disable_auto_compactions;
1268
    options.source_compaction_factor = FLAGS_source_compaction_factor;
1269 1270 1271 1272 1273

    // fill storage options
    options.allow_os_buffer = FLAGS_use_os_buffer;
    options.allow_mmap_reads = FLAGS_use_mmap_reads;
    options.allow_mmap_writes = FLAGS_use_mmap_writes;
1274 1275
    options.advise_random_on_open = FLAGS_advise_random_on_open;
    options.access_hint_on_compaction_start = FLAGS_compaction_fadvice;
H
Haobo Xu 已提交
1276 1277

    options.use_adaptive_mutex = FLAGS_use_adaptive_mutex;
H
Haobo Xu 已提交
1278
    options.bytes_per_sync = FLAGS_bytes_per_sync;
H
Haobo Xu 已提交
1279

D
Deon Nicholas 已提交
1280
    // merge operator options
1281 1282 1283
    options.merge_operator = MergeOperators::CreateFromStringId(
        FLAGS_merge_operator);
    if (options.merge_operator == nullptr && !FLAGS_merge_operator.empty()) {
D
Deon Nicholas 已提交
1284 1285 1286 1287 1288
      fprintf(stderr, "invalid merge operator: %s\n",
              FLAGS_merge_operator.c_str());
      exit(1);
    }

H
heyongqiang 已提交
1289 1290 1291 1292 1293 1294
    Status s;
    if(FLAGS_read_only) {
      s = DB::OpenForReadOnly(options, FLAGS_db, &db_);
    } else {
      s = DB::Open(options, FLAGS_db, &db_);
    }
1295 1296 1297 1298
    if (!s.ok()) {
      fprintf(stderr, "open error: %s\n", s.ToString().c_str());
      exit(1);
    }
1299
    if (FLAGS_min_level_to_compress >= 0) {
1300
      options.compression_per_level.clear();
1301
    }
1302 1303
  }

1304 1305 1306 1307
  // Key-selection strategy used by DoWrite().
  enum WriteMode {
    RANDOM,        // each key is a random draw modulo FLAGS_num
    SEQUENTIAL,    // keys follow the running write counter
    UNIQUE_RANDOM  // random draw, steered away from keys already written
  };

1308
  // Write benchmark using sequentially increasing keys.
  void WriteSeq(ThreadState* thread) {
    DoWrite(thread, SEQUENTIAL);
  }
1311

1312
  // Write benchmark using randomly chosen keys (repeats are possible).
  void WriteRandom(ThreadState* thread) {
    DoWrite(thread, RANDOM);
  }

1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328
  // Write benchmark using randomly chosen keys, where DoWrite() tracks the
  // keys already written and steers each draw to an unused one.
  void WriteUniqueRandom(ThreadState* thread) {
    DoWrite(thread, UNIQUE_RANDOM);
  }

  // Shared implementation of the write benchmarks.
  //
  // Writes batches of entries_per_batch_ key/value pairs until `duration`
  // reports completion.  Only RANDOM mode honours FLAGS_duration; the other
  // modes are bounded purely by the operation count (writes_, or num_ when
  // writes_ is 0).  Key choice depends on `write_mode`:
  //   SEQUENTIAL    - running counter of entries written so far
  //   RANDOM        - random draw modulo FLAGS_num
  //   UNIQUE_RANDOM - random draw modulo FLAGS_num; if that key was already
  //                   used, the nearest unused key above it is taken, or
  //                   failing that the nearest unused key below it
  // A failed batch write terminates the process.
  void DoWrite(ThreadState* thread, WriteMode write_mode) {
    const int test_duration = (write_mode == RANDOM) ? FLAGS_duration : 0;
    const int num_ops = (writes_ == 0) ? num_ : writes_;
    Duration duration(test_duration, num_ops);

    // Tracks which keys have been written; only needed for UNIQUE_RANDOM.
    unique_ptr<BitSet> used_keys;
    if (write_mode == UNIQUE_RANDOM) {
      used_keys.reset(new BitSet(num_ops));
    }

    // Note in the report when the op count differs from --num.
    if (num_ != FLAGS_num) {
      char msg[100];
      snprintf(msg, sizeof(msg), "(%lld ops)", num_);
      thread->stats.AddMessage(msg);
    }

    RandomGenerator gen;
    WriteBatch batch;
    Status s;
    int64_t bytes = 0;
    int batch_base = 0;  // entries written before the current batch
    while (!duration.Done(entries_per_batch_)) {
      batch.Clear();
      for (int j = 0; j < entries_per_batch_; j++) {
        long long k = 0;
        if (write_mode == SEQUENTIAL) {
          k = batch_base + j;
        } else if (write_mode == RANDOM) {
          k = thread->rand.Next() % FLAGS_num;
        } else if (write_mode == UNIQUE_RANDOM) {
          const long long t = thread->rand.Next() % FLAGS_num;
          if (!used_keys->test(t)) {
            // Best case: the drawn key is still free.
            k = t;
          } else {
            // Scan upwards for the nearest free key ...
            bool found = false;
            for (size_t up = t + 1; up < used_keys->size(); ++up) {
              if (!used_keys->test(up)) {
                found = true;
                k = up;
                break;
              }
            }
            // ... and fall back to scanning downwards from t - 1 to 0.
            if (!found) {
              for (size_t down = t; down-- > 0;) {
                if (!used_keys->test(down)) {
                  k = down;
                  break;
                }
              }
            }
          }
          used_keys->set(k);
        }

        unique_ptr<char []> key = GenerateKeyFromInt(k);
        batch.Put(key.get(), gen.Generate(value_size_));
        bytes += value_size_ + strlen(key.get());
        thread->stats.FinishedSingleOp(db_);
      }

      s = db_->Write(write_options_, &batch);
      if (!s.ok()) {
        fprintf(stderr, "put error: %s\n", s.ToString().c_str());
        exit(1);
      }
      batch_base += entries_per_batch_;
    }
    thread->stats.AddBytes(bytes);
  }

1397
  // Iterates forward from the first entry, visiting at most reads_ entries,
  // and records the total key + value bytes seen.
  void ReadSequential(ThreadState* thread) {
    Iterator* iter = db_->NewIterator(ReadOptions(FLAGS_verify_checksum, true));
    int64_t bytes = 0;
    long long visited = 0;

    iter->SeekToFirst();
    while (visited < reads_ && iter->Valid()) {
      bytes += iter->key().size() + iter->value().size();
      thread->stats.FinishedSingleOp(db_);
      ++visited;
      iter->Next();
    }

    delete iter;
    thread->stats.AddBytes(bytes);
  }

1410
  // Iterates backward from the last entry, visiting at most reads_ entries,
  // and records the total key + value bytes seen.
  void ReadReverse(ThreadState* thread) {
    Iterator* iter = db_->NewIterator(ReadOptions(FLAGS_verify_checksum, true));
    int64_t bytes = 0;
    long long visited = 0;

    iter->SeekToLast();
    while (visited < reads_ && iter->Valid()) {
      bytes += iter->key().size() + iter->value().size();
      thread->stats.FinishedSingleOp(db_);
      ++visited;
      iter->Prev();
    }

    delete iter;
    thread->stats.AddBytes(bytes);
  }

1423 1424 1425
  // Calls MultiGet over a list of keys from a random distribution.
  // Returns the total number of keys found.
  long MultiGetRandom(ReadOptions& options, int num_keys,
1426
                     Random64& rand, long long range, const char* suffix) {
1427 1428 1429 1430 1431 1432
    assert(num_keys > 0);
    std::vector<Slice> keys(num_keys);
    std::vector<std::string> values(num_keys);
    std::vector<unique_ptr<char []> > gen_keys(num_keys);

    int i;
1433
    long long k;
1434 1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468 1469 1470

    // Fill the keys vector
    for(i=0; i<num_keys; ++i) {
      k = rand.Next() % range;
      gen_keys[i] = GenerateKeyFromInt(k,suffix);
      keys[i] = gen_keys[i].get();
    }

    if (FLAGS_use_snapshot) {
      options.snapshot = db_->GetSnapshot();
    }

    // Apply the operation
    std::vector<Status> statuses = db_->MultiGet(options, keys, &values);
    assert((long)statuses.size() == num_keys);
    assert((long)keys.size() == num_keys);  // Should always be the case.
    assert((long)values.size() == num_keys);

    if (FLAGS_use_snapshot) {
      db_->ReleaseSnapshot(options.snapshot);
      options.snapshot = nullptr;
    }

    // Count number found
    long found = 0;
    for(i=0; i<num_keys; ++i) {
      if (statuses[i].ok()){
        ++found;
      } else if (FLAGS_warn_missing_keys == true) {
        // Key not found, or error.
        fprintf(stderr, "get error: %s\n", statuses[i].ToString().c_str());
      }
    }

    return found;
  }

1471
  // Random-read benchmark over keys drawn modulo FLAGS_num.
  //
  // With FLAGS_use_multiget, keys are fetched in groups of up to
  // FLAGS_keys_per_multiget via MultiGetRandom(); each group counts as one
  // operation.  Otherwise each operation is either a single Get
  // (FLAGS_read_range < 2) or a short forward scan of up to FLAGS_read_range
  // entries starting at the key, optionally preceded by a
  // GetApproximateSizes call (FLAGS_get_approx).  The number of entries
  // found is added to the report message.
  void ReadRandom(ThreadState* thread) {
    ReadOptions options(FLAGS_verify_checksum, true);
    Duration duration(FLAGS_duration, reads_);

    long long found = 0;

    if (FLAGS_use_multiget) {
      const long kpg = FLAGS_keys_per_multiget;  // keys per multiget group
      long keys_left = reads_;

      // Each round fetches min(keys_left, kpg) keys, until `duration` says
      // the run is over.
      for (;;) {
        const long num_keys = std::min(keys_left, kpg);
        if (duration.Done(num_keys)) {
          break;
        }
        found += MultiGetRandom(options, num_keys, thread->rand, FLAGS_num, "");
        thread->stats.FinishedSingleOp(db_);
        keys_left -= num_keys;
      }
    } else {
      // One lookup (or short scan) per operation.
      Iterator* iter = db_->NewIterator(options);
      std::string value;
      while (!duration.Done(1)) {
        const long long k = thread->rand.Next() % FLAGS_num;
        unique_ptr<char []> key = GenerateKeyFromInt(k);
        if (FLAGS_use_snapshot) {
          options.snapshot = db_->GetSnapshot();
        }

        if (FLAGS_read_range >= 2) {
          Slice skey(key.get());

          if (FLAGS_get_approx) {
            // Also exercise GetApproximateSizes over [k, k + read_range).
            unique_ptr<char []> key2 =
                GenerateKeyFromInt(k + (int) FLAGS_read_range);
            Slice skey2(key2.get());
            Range range(skey, skey2);
            uint64_t sizes;
            db_->GetApproximateSizes(&range, 1, &sizes);
          }

          // Scan forward over at most FLAGS_read_range entries.
          int count = 1;
          iter->Seek(skey);
          while (iter->Valid() && count <= FLAGS_read_range) {
            found++;
            ++count;
            iter->Next();
          }
        } else if (db_->Get(options, key.get(), &value).ok()) {
          found++;
        }

        if (FLAGS_use_snapshot) {
          db_->ReleaseSnapshot(options.snapshot);
          options.snapshot = nullptr;
        }

        thread->stats.FinishedSingleOp(db_);
      }

      delete iter;
    }

    char msg[100];
    snprintf(msg, sizeof(msg), "(%lld of %lld found)", found, reads_);
    thread->stats.AddMessage(msg);
  }

T
Tyler Harter 已提交
1538 1539 1540 1541 1542 1543 1544 1545 1546 1547 1548 1549 1550 1551 1552 1553 1554 1555 1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572
  // Prefix-scan benchmark: each operation picks a random key (modulo
  // FLAGS_num), seeks to it with a fresh iterator and counts the entries
  // that share the key's prefix as computed by prefix_extractor_.  When
  // FLAGS_use_prefix_api is set the prefix is also passed through
  // ReadOptions::prefix, which requires prefix blooms with at least one
  // bloom bit.  The number of entries found is added to the report message.
  void PrefixScanRandom(ThreadState* thread) {
    if (FLAGS_use_prefix_api) {
      assert(FLAGS_use_prefix_blooms);
      assert(FLAGS_bloom_bits >= 1);
    }

    ReadOptions options(FLAGS_verify_checksum, true);
    Duration duration(FLAGS_duration, reads_);

    long long found = 0;

    while (!duration.Done(1)) {
      // long long, like the other random-read benchmarks: an int would
      // truncate the key index once FLAGS_num exceeds INT_MAX.
      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);
      Slice skey(key.get());
      Slice prefix = prefix_extractor_->Transform(skey);
      // `prefix` outlives the iterator created below.
      options.prefix = FLAGS_use_prefix_api ? &prefix : nullptr;

      Iterator* iter = db_->NewIterator(options);
      for (iter->Seek(skey);
           iter->Valid() && iter->key().starts_with(prefix);
           iter->Next()) {
        found++;
      }
      delete iter;

      thread->stats.FinishedSingleOp(db_);
    }

    char msg[100];
    snprintf(msg, sizeof(msg), "(%lld of %lld found)", found, reads_);
    thread->stats.AddMessage(msg);
  }

X
Xing Jin 已提交
1573
  // Benchmark for lookups of keys that are not in the database: every key
  // is generated with a "." suffix, and each lookup is asserted to miss.
  // Side effect: clears FLAGS_warn_missing_keys so the expected misses are
  // not logged.
  void ReadMissing(ThreadState* thread) {
    FLAGS_warn_missing_keys = false;    // Never warn about missing keys

    Duration duration(FLAGS_duration, reads_);
    ReadOptions options(FLAGS_verify_checksum, true);

    if (!FLAGS_use_multiget) {
      // Regular case: one Get per operation.
      std::string value;
      Status s;
      while (!duration.Done(1)) {
        const long long k = thread->rand.Next() % FLAGS_num;
        unique_ptr<char []> key = GenerateKeyFromInt(k, ".");
        s = db_->Get(options, key.get(), &value);
        assert(!s.ok() && s.IsNotFound());
        thread->stats.FinishedSingleOp(db_);
      }
      return;
    }

    // MultiGet case: groups of up to FLAGS_keys_per_multiget keys.
    const long kpg = FLAGS_keys_per_multiget;  // keys per multiget group
    long keys_left = reads_;
    for (;;) {
      const long num_keys = std::min(keys_left, kpg);
      if (duration.Done(num_keys)) {
        break;
      }
      const long found =
          MultiGetRandom(options, num_keys, thread->rand, FLAGS_num, ".");

      // Nothing should be found, since the keys carry a different suffix.
      if (found) {
        assert(false);
      }

      thread->stats.FinishedSingleOp(db_);
      keys_left -= num_keys;
    }
  }

1611
  // Benchmark: random reads restricted to the first (FLAGS_num + 99) / 100
  // keys, i.e. roughly 1% of the key space. Reports how many were found.
  void ReadHot(ThreadState* thread) {
    Duration duration(FLAGS_duration, reads_);
    ReadOptions options(FLAGS_verify_checksum, true);
    const long long range = (FLAGS_num + 99) / 100;
    long long found = 0;

    if (!FLAGS_use_multiget) {
      // One random hot key per Get.
      std::string value;
      while (!duration.Done(1)) {
        const long long k = thread->rand.Next() % range;
        unique_ptr<char []> key = GenerateKeyFromInt(k);
        const Status s = db_->Get(options, key.get(), &value);
        if (s.ok()) {
          ++found;
        }
        thread->stats.FinishedSingleOp(db_);
      }
    } else {
      // Read in groups of at most FLAGS_keys_per_multiget keys.
      const long long kpg = FLAGS_keys_per_multiget;
      long long remaining = reads_;
      long group_size;
      for (;;) {
        // Recomputed every round so that the last group can be smaller.
        group_size = std::min(remaining, kpg);
        if (duration.Done(group_size)) {
          break;
        }
        found += MultiGetRandom(options, group_size, thread->rand, range, "");
        thread->stats.FinishedSingleOp(db_);
        remaining -= group_size;
      }
    }

    char msg[100];
    snprintf(msg, sizeof(msg), "(%lld of %lld found)", found, reads_);
    thread->stats.AddMessage(msg);
  }

S
Sanjay Ghemawat 已提交
1645
  // Benchmark: for every operation, creates a fresh iterator, seeks to a
  // random key in [0, FLAGS_num) and counts the seek as "found" when the
  // iterator lands exactly on that key.
  void SeekRandom(ThreadState* thread) {
    Duration duration(FLAGS_duration, reads_);
    ReadOptions options(FLAGS_verify_checksum, true);
    long long found = 0;
    while (!duration.Done(1)) {
      // A new iterator per seek is part of what is being measured.
      unique_ptr<Iterator> iter(db_->NewIterator(options));
      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);
      iter->Seek(key.get());
      if (iter->Valid() && iter->key() == key.get()) {
        found++;
      }
      // Release the iterator before the operation is recorded.
      iter.reset();
      thread->stats.FinishedSingleOp(db_);
    }
    char msg[100];
    // The loop above is bounded by reads_, so that is the total to report
    // (this matches the summary printed by ReadHot).
    snprintf(msg, sizeof(msg), "(%lld of %lld found)", found, reads_);
    thread->stats.AddMessage(msg);
  }

  // Deletes keys in write batches of entries_per_batch_ keys each.
  //   seq == true : keys 0, 1, 2, ... in increasing order; the run is bounded
  //                 by num_ operations only (no time limit).
  //   seq == false: random keys in [0, FLAGS_num); bounded by FLAGS_duration
  //                 and num_.
  // Exits the process if a batch write fails.
  void DoDelete(ThreadState* thread, bool seq) {
    WriteBatch batch;
    Status s;
    Duration duration(seq ? 0 : FLAGS_duration, num_);
    long long i = 0;  // first key of the current batch (sequential mode)
    while (!duration.Done(entries_per_batch_)) {
      batch.Clear();
      for (int j = 0; j < entries_per_batch_; j++) {
        const long long k = seq ? i+j : (thread->rand.Next() % FLAGS_num);
        unique_ptr<char []> key = GenerateKeyFromInt(k);
        batch.Delete(key.get());
        thread->stats.FinishedSingleOp(db_);
      }
      s = db_->Write(write_options_, &batch);
      if (!s.ok()) {
        fprintf(stderr, "del error: %s\n", s.ToString().c_str());
        exit(1);
      }
      // Advance by a whole batch. Stepping by one made consecutive batches
      // overlap, so sequential deletes never reached most of the keys when
      // entries_per_batch_ > 1.
      i += entries_per_batch_;
    }
  }

  // Benchmark entry point: runs DoDelete in sequential-key mode.
  void DeleteSeq(ThreadState* thread) {
    const bool sequential = true;
    DoDelete(thread, sequential);
  }

  // Benchmark entry point: runs DoDelete in random-key mode.
  void DeleteRandom(ThreadState* thread) {
    const bool sequential = false;
    DoDelete(thread, sequential);
  }

1694 1695 1696 1697 1698 1699
  // Threads with tid > 0 run ReadRandom. The remaining thread issues random
  // Puts until every other thread has finished, optionally throttled by
  // FLAGS_writes_per_second.
  void ReadWhileWriting(ThreadState* thread) {
    if (thread->tid > 0) {
      ReadRandom(thread);
      return;
    }

    // Special thread that keeps writing until other threads are done.
    RandomGenerator gen;
    double last = FLAGS_env->NowMicros();
    int num_writes = 0;

    // --writes_per_second rate limit is enforced per 100 milliseconds
    // intervals to avoid a burst of writes at the start of each second.
    // A value of zero means "no limit".
    const int writes_per_second_by_10 =
        (FLAGS_writes_per_second > 0) ? FLAGS_writes_per_second / 10 : 0;

    // Don't merge stats from this thread with the readers.
    thread->stats.SetExcludeFromMerge();

    for (;;) {
      bool others_finished;
      {
        // Hold the shared mutex only while inspecting the counters.
        MutexLock l(&thread->shared->mu);
        others_finished =
            thread->shared->num_done + 1 >= thread->shared->num_initialized;
      }
      if (others_finished) {
        break;
      }

      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);
      Status s = db_->Put(write_options_, key.get(), gen.Generate(value_size_));
      if (!s.ok()) {
        fprintf(stderr, "put error: %s\n", s.ToString().c_str());
        exit(1);
      }
      thread->stats.FinishedSingleOp(db_);

      ++num_writes;
      if (!writes_per_second_by_10 || num_writes < writes_per_second_by_10) {
        continue;  // unthrottled, or quota for this interval not yet used up
      }

      // Quota reached: start a new interval, sleeping off whatever remains
      // of the current 100 ms window.
      double now = FLAGS_env->NowMicros();
      double usecs_since_last = now - last;

      num_writes = 0;
      last = now;

      if (usecs_since_last < 100000.0) {
        FLAGS_env->SleepForMicroseconds(100000.0 - usecs_since_last);
        last = FLAGS_env->NowMicros();
      }
    }
  }

1748
  // Given a key K and value V, this puts (K+"0", V), (K+"1", V), (K+"2", V)
1749 1750
  // in DB atomically i.e in a single batch. Also refer GetMany.
  Status PutMany(const WriteOptions& writeoptions,
                  const Slice& key, const Slice& value) {
    // Order in which the suffixed keys are added to the batch.
    const char* const suffixes[3] = {"2", "1", "0"};
    const std::string base = key.ToString();

    // The key strings stay alive until the batch has been written.
    std::string keys[3];
    WriteBatch batch;
    for (int i = 0; i < 3; i++) {
      keys[i] = base + suffixes[i];
      batch.Put(keys[i], value);
    }

    // A single Write applies all three puts together.
    return db_->Write(writeoptions, &batch);
  }


  // Given a key K, this deletes (K+"0", V), (K+"1", V), (K+"2", V)
1768 1769
  // in DB atomically i.e in a single batch. Also refer GetMany.
  Status DeleteMany(const WriteOptions& writeoptions,
                  const Slice& key) {
    // Order in which the suffixed keys are added to the batch.
    const char* const suffixes[3] = {"1", "2", "0"};
    const std::string base = key.ToString();

    // The key strings stay alive until the batch has been written.
    std::string keys[3];
    WriteBatch batch;
    for (int i = 0; i < 3; i++) {
      keys[i] = base + suffixes[i];
      batch.Delete(keys[i]);
    }

    // A single Write applies all three deletes together.
    return db_->Write(writeoptions, &batch);
  }

  // Given a key K and value V, this gets values for K+"0", K+"1" and K+"2"
  // in the same snapshot, and verifies that all the values are identical.
1787 1788
  // ASSUMES that PutMany was used to put (K, V) into the DB.
  Status GetMany(const ReadOptions& readoptions,
                  const Slice& key, std::string* value) {
    const char* const suffixes[3] = {"0", "1", "2"};
    std::string values[3];  // stays "" for keys that are missing or errored

    // Read all three keys through one snapshot of the DB.
    ReadOptions snapshot_options = readoptions;
    snapshot_options.snapshot = db_->GetSnapshot();

    Status s;
    for (int i = 0; i < 3; i++) {
      const std::string full_key = key.ToString() + suffixes[i];
      s = db_->Get(snapshot_options, Slice(full_key), value);
      if (s.ok()) {
        values[i] = *value;
      } else if (!s.IsNotFound()) {
        // we continue after error rather than exiting so that we can
        // find more errors if any
        fprintf(stderr, "get error: %s\n", s.ToString().c_str());
      }
    }
    db_->ReleaseSnapshot(snapshot_options.snapshot);

    const bool consistent =
        (values[0] == values[1]) && (values[1] == values[2]);
    if (!consistent) {
      // Reported but not fatal, so that further inconsistencies can surface.
      fprintf(stderr, "inconsistent values for key %s: %s, %s, %s\n",
              key.ToString().c_str(), values[0].c_str(), values[1].c_str(),
              values[2].c_str());
    }

    // Note: this is the status of the last of the three reads.
    return s;
  }

  // Differs from readrandomwriterandom in the following ways:
1826
  // (a) Uses GetMany/PutMany to read/write key values. Refer to those funcs.
1827 1828 1829 1830
  // (b) Does deletes as well (per FLAGS_deletepercent)
  // (c) In order to achieve high % of 'found' during lookups, and to do
  //     multiple writes (including puts and deletes) it uses up to
  //     FLAGS_numdistinct distinct keys instead of FLAGS_num distinct keys.
1831
  // (d) Does not have a MultiGet option.
1832 1833 1834 1835
  void RandomWithVerify(ThreadState* thread) {
    ReadOptions options(FLAGS_verify_checksum, true);
    RandomGenerator gen;
    std::string value;

    long long found = 0;
    long long gets_done = 0;
    long long puts_done = 0;
    long long deletes_done = 0;

    // Operations of each kind still owed in the current batch of 100.
    int get_weight = 0;
    int put_weight = 0;
    int delete_weight = 0;

    // the number of iterations is the larger of read_ or write_
    for (long long i = 0; i < readwrites_; i++) {
      const long long k = thread->rand.Next() % (FLAGS_numdistinct);
      unique_ptr<char []> key = GenerateKeyFromInt(k);

      const bool batch_complete =
          (get_weight == 0 && put_weight == 0 && delete_weight == 0);
      if (batch_complete) {
        // Refill the per-kind budgets for the next batch.
        get_weight = FLAGS_readwritepercent;
        delete_weight = FLAGS_deletepercent;
        put_weight = 100 - get_weight - delete_weight;
      }

      if (get_weight > 0) {
        // Gets are issued first within a batch.
        const Status s = GetMany(options, key.get(), &value);
        if (s.ok()) {
          found++;
        } else if (!s.IsNotFound()) {
          // we continue after error rather than exiting so that we can
          // find more errors if any
          fprintf(stderr, "getmany error: %s\n", s.ToString().c_str());
        }
        get_weight--;
        gets_done++;
      } else if (put_weight > 0) {
        // Then the puts that belong to the same batch.
        const Status s =
            PutMany(write_options_, key.get(), gen.Generate(value_size_));
        if (!s.ok()) {
          fprintf(stderr, "putmany error: %s\n", s.ToString().c_str());
          exit(1);
        }
        put_weight--;
        puts_done++;
      } else if (delete_weight > 0) {
        // Deletes come last.
        const Status s = DeleteMany(write_options_, key.get());
        if (!s.ok()) {
          fprintf(stderr, "deletemany error: %s\n", s.ToString().c_str());
          exit(1);
        }
        delete_weight--;
        deletes_done++;
      }

      thread->stats.FinishedSingleOp(db_);
    }

    char msg[100];
    snprintf(msg, sizeof(msg),
             "( get:%lld put:%lld del:%lld total:%lld found:%lld)",
             gets_done, puts_done, deletes_done, readwrites_, found);
    thread->stats.AddMessage(msg);
  }

X
Xing Jin 已提交
1895
  // This is different from ReadWhileWriting because it does not use
1896
  // an extra thread.
1897
  // Mixes random Gets and Puts on a single thread. Within each batch of 100
  // operations, FLAGS_readwritepercent Gets are issued first, followed by
  // the remaining Puts. Delegates to ReadRandomWriteRandomMultiGet when
  // FLAGS_use_multiget is set. Exits the process if a Put fails.
  void ReadRandomWriteRandom(ThreadState* thread) {
    if (FLAGS_use_multiget){
      // Separate function for multiget (for ease of reading)
      ReadRandomWriteRandomMultiGet(thread);
      return;
    }

    ReadOptions options(FLAGS_verify_checksum, true);
    RandomGenerator gen;
    std::string value;
    long long found = 0;
    int get_weight = 0;
    int put_weight = 0;
    long long reads_done = 0;
    long long writes_done = 0;
    Duration duration(FLAGS_duration, readwrites_);

    // the number of iterations is the larger of read_ or write_
    while (!duration.Done(1)) {
      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);
      if (get_weight == 0 && put_weight == 0) {
        // one batch completed, reinitialize for next batch
        get_weight = FLAGS_readwritepercent;
        put_weight = 100 - get_weight;
      }
      if (get_weight > 0) {

        if (FLAGS_use_snapshot) {
          options.snapshot = db_->GetSnapshot();
        }

        if (FLAGS_get_approx) {
          // Ask for the approximate size of the range that starts at the
          // current key and ends at the key generated for k + 1. Both
          // endpoints used to be built from the same buffer, which made the
          // range empty.
          unique_ptr<char []> next_key = GenerateKeyFromInt(k + 1);
          Slice skey(key.get());
          Slice skey2(next_key.get());
          Range range(skey, skey2);
          uint64_t sizes;
          db_->GetApproximateSizes(&range, 1, &sizes);
        }

        // do all the gets first
        Status s = db_->Get(options, key.get(), &value);
        if (!s.ok() && !s.IsNotFound()) {
          fprintf(stderr, "get error: %s\n", s.ToString().c_str());
          // we continue after error rather than exiting so that we can
          // find more errors if any
        } else if (!s.IsNotFound()) {
          found++;
        }

        get_weight--;
        reads_done++;

        if (FLAGS_use_snapshot) {
          db_->ReleaseSnapshot(options.snapshot);
        }

      } else  if (put_weight > 0) {
        // then do all the corresponding number of puts
        // for all the gets we have done earlier
        Status s = db_->Put(write_options_, key.get(), gen.Generate(value_size_));
        if (!s.ok()) {
          fprintf(stderr, "put error: %s\n", s.ToString().c_str());
          exit(1);
        }
        put_weight--;
        writes_done++;
      }
      thread->stats.FinishedSingleOp(db_);
    }
    char msg[100];
    snprintf(msg, sizeof(msg),
             "( reads:%lld writes:%lld total:%lld found:%lld)",
             reads_done, writes_done, readwrites_, found);
    thread->stats.AddMessage(msg);
  }

1976 1977 1978 1979 1980 1981 1982 1983 1984 1985 1986 1987 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020
  // ReadRandomWriteRandom (with multiget)
  // Does FLAGS_keys_per_multiget reads (per multiget), followed by some puts.
  // FLAGS_readwritepercent will specify the ratio of gets to puts.
  // e.g.: If FLAGS_keys_per_multiget == 100 and FLAGS_readwritepercent == 75
  // Then each block will do 100 multigets and 33 puts
  // So there are 133 operations in-total: 100 of them (75%) are gets, and 33
  // of them (25%) are puts.
  void ReadRandomWriteRandomMultiGet(ThreadState* thread) {
    ReadOptions options(FLAGS_verify_checksum, true);
    RandomGenerator gen;

    // Upper bound on the number of keys in one MultiGet group.
    const long& kpg = FLAGS_keys_per_multiget;

    long keys_left = readwrites_;  // operations not yet accounted for

    // Counters reported in the summary message.
    long found = 0;
    long reads_done = 0;
    long writes_done = 0;
    long multigets_done = 0;

    // the number of iterations is the larger of read_ or write_
    Duration duration(FLAGS_duration, readwrites_);
    for (;;) {
      // Each round reads num_keys keys and then writes num_put_keys keys.
      // num_keys is capped at kpg, and num_put_keys is derived from it so
      // that the read/write mix follows FLAGS_readwritepercent.
      // Note: On the final iteration, num_keys and num_put_keys will be smaller
      long num_keys =
          std::min(keys_left*(FLAGS_readwritepercent + 99)/100, kpg);
      long num_put_keys = num_keys * (100-FLAGS_readwritepercent)
                          / FLAGS_readwritepercent;

      // Stop once the duration/operation budget is used up.
      if (duration.Done(num_keys + num_put_keys)) {
        break;
      }

      // A quick check to make sure our formula doesn't break on edge cases
      assert(num_keys >= 1);
      assert(num_keys + num_put_keys <= keys_left);

      // Read phase: a single MultiGet over num_keys random keys.
      found += MultiGetRandom(options, num_keys, thread->rand, FLAGS_num, "");
      ++multigets_done;
      reads_done += num_keys;
      thread->stats.FinishedSingleOp(db_);

      // Write phase: num_put_keys individual Puts to random keys.
      for (int i = 0; i < num_put_keys; ++i) {
        const long long k = thread->rand.Next() % FLAGS_num;
        unique_ptr<char []> key = GenerateKeyFromInt(k);
        Status s = db_->Put(write_options_, key.get(),
                            gen.Generate(value_size_));
        if (!s.ok()) {
          fprintf(stderr, "put error: %s\n", s.ToString().c_str());
          exit(1);
        }
        writes_done++;
        thread->stats.FinishedSingleOp(db_);
      }

      keys_left -= (num_keys + num_put_keys);
    }

    char msg[100];
    snprintf(msg, sizeof(msg),
             "( reads:%ld writes:%ld total:%lld multiget_ops:%ld found:%ld)",
             reads_done, writes_done, readwrites_, multigets_done, found);
    thread->stats.AddMessage(msg);
  }

M
Mark Callaghan 已提交
2051 2052 2053 2054 2055 2056
  //
  // Read-modify-write for random keys
  // For each operation: reads a random key (counting successful reads in
  // `found`), then overwrites that key with a freshly generated value.
  // Exits the process if the Put fails.
  void UpdateRandom(ThreadState* thread) {
    ReadOptions options(FLAGS_verify_checksum, true);
    RandomGenerator gen;
    std::string value;
    long long found = 0;
    Duration duration(FLAGS_duration, readwrites_);

    // the number of iterations is the larger of read_ or write_
    while (!duration.Done(1)) {
      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);

      if (FLAGS_use_snapshot) {
        options.snapshot = db_->GetSnapshot();
      }

      if (FLAGS_get_approx) {
        // Ask for the approximate size of the range that starts at the
        // current key and ends at the key generated for k + 1. Both
        // endpoints used to be built from the same buffer, which made the
        // range empty.
        unique_ptr<char []> next_key = GenerateKeyFromInt(k + 1);
        Slice skey(key.get());
        Slice skey2(next_key.get());
        Range range(skey, skey2);
        uint64_t sizes;
        db_->GetApproximateSizes(&range, 1, &sizes);
      }

      // Any non-ok status (including errors) is simply not counted.
      if (db_->Get(options, key.get(), &value).ok()) {
        found++;
      }

      if (FLAGS_use_snapshot) {
        db_->ReleaseSnapshot(options.snapshot);
      }

      Status s = db_->Put(write_options_, key.get(), gen.Generate(value_size_));
      if (!s.ok()) {
        fprintf(stderr, "put error: %s\n", s.ToString().c_str());
        exit(1);
      }
      thread->stats.FinishedSingleOp(db_);
    }
    char msg[100];
    snprintf(msg, sizeof(msg),
             "( updates:%lld found:%lld)", readwrites_, found);
    thread->stats.AddMessage(msg);
  }

D
Deon Nicholas 已提交
2100 2101 2102 2103 2104 2105 2106 2107 2108 2109 2110 2111
  // Read-modify-write for random keys.
  // Each operation causes the key grow by value_size (simulating an append).
  // Generally used for benchmarking against merges of similar type
  void AppendRandom(ThreadState* thread) {
    ReadOptions options(FLAGS_verify_checksum, true);
    RandomGenerator gen;
    std::string value;
    long found = 0;

    // The number of iterations is the larger of read_ or write_
    Duration duration(FLAGS_duration, readwrites_);
    while (!duration.Done(1)) {
      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);

      if (FLAGS_use_snapshot) {
        options.snapshot = db_->GetSnapshot();
      }

      if (FLAGS_get_approx) {
        // Ask for the approximate size of the range that starts at the
        // current key and ends at the key generated for k + 1. Both
        // endpoints used to be built from the same buffer, which made the
        // range empty.
        unique_ptr<char []> next_key = GenerateKeyFromInt(k + 1);
        Slice skey(key.get());
        Slice skey2(next_key.get());
        Range range(skey, skey2);
        uint64_t sizes;
        db_->GetApproximateSizes(&range, 1, &sizes);
      }

      // Get the existing value
      if (db_->Get(options, key.get(), &value).ok()) {
        found++;
      } else {
        // If not existing, then just assume an empty string of data
        value.clear();
      }

      if (FLAGS_use_snapshot) {
        db_->ReleaseSnapshot(options.snapshot);
      }

      // Update the value (by appending data)
      Slice operand = gen.Generate(value_size_);
      if (value.size() > 0) {
        // Use a delimiter to match the semantics for StringAppendOperator
        value.append(1,',');
      }
      value.append(operand.data(), operand.size());

      // Write back to the database
      Status s = db_->Put(write_options_, key.get(), value);
      if (!s.ok()) {
        fprintf(stderr, "put error: %s\n", s.ToString().c_str());
        exit(1);
      }
      thread->stats.FinishedSingleOp(db_);
    }
    char msg[100];
    snprintf(msg, sizeof(msg), "( updates:%lld found:%ld)", readwrites_, found);
    thread->stats.AddMessage(msg);
  }

  // Read-modify-write for random keys (using MergeOperator)
  // The merge operator to use should be defined by FLAGS_merge_operator
  // Adjust FLAGS_value_size so that the keys are reasonable for this operator
  // Assumes that the merge operator is non-null (i.e.: is well-defined)
  //
  // For example, use FLAGS_merge_operator="uint64add" and FLAGS_value_size=8
  // to simulate random additions over 64-bit integers using merge.
  void MergeRandom(ThreadState* thread) {
    RandomGenerator gen;

    // The number of iterations is the larger of read_ or write_
    for (Duration duration(FLAGS_duration, readwrites_); !duration.Done(1); ) {
      const long long k = thread->rand.Next() % FLAGS_num;
      unique_ptr<char []> key = GenerateKeyFromInt(k);

      // Submit a generated operand of value_size_ bytes for a random key.
      const Status s = db_->Merge(write_options_, key.get(),
                                  gen.Generate(value_size_));
      if (!s.ok()) {
        fprintf(stderr, "merge error: %s\n", s.ToString().c_str());
        exit(1);
      }
      thread->stats.FinishedSingleOp(db_);
    }

    // Report the configured operation count.
    char msg[100];
    snprintf(msg, sizeof(msg), "( updates:%lld)", readwrites_);
    thread->stats.AddMessage(msg);
  }

2194
  // Calls CompactRange with null begin and end bounds. The thread argument
  // is not used.
  void Compact(ThreadState* thread) {
    const Slice* const no_bound = nullptr;
    db_->CompactRange(no_bound, no_bound);
  }

S
Sanjay Ghemawat 已提交
2198
  void PrintStats(const char* key) {
2199
    std::string stats;
S
Sanjay Ghemawat 已提交
2200
    if (!db_->GetProperty(key, &stats)) {
2201
      stats = "(failed)";
2202
    }
2203
    fprintf(stdout, "\n%s\n", stats.c_str());
2204 2205
  }

J
jorlow@chromium.org 已提交
2206 2207 2208 2209 2210 2211
  static void WriteToFile(void* arg, const char* buf, int n) {
    reinterpret_cast<WritableFile*>(arg)->Append(Slice(buf, n));
  }

  void HeapProfile() {
    char fname[100];
H
Haobo Xu 已提交
2212
    EnvOptions soptions;
2213
    snprintf(fname, sizeof(fname), "%s/heap-%04d", FLAGS_db, ++heap_counter_);
2214
    unique_ptr<WritableFile> file;
2215
    Status s = FLAGS_env->NewWritableFile(fname, &file, soptions);
J
jorlow@chromium.org 已提交
2216
    if (!s.ok()) {
2217
      fprintf(stderr, "%s\n", s.ToString().c_str());
J
jorlow@chromium.org 已提交
2218 2219
      return;
    }
2220
    bool ok = port::GetHeapProfile(WriteToFile, file.get());
J
jorlow@chromium.org 已提交
2221
    if (!ok) {
2222
      fprintf(stderr, "heap profiling not supported\n");
2223
      FLAGS_env->DeleteFile(fname);
J
jorlow@chromium.org 已提交
2224 2225 2226 2227
    }
  }
};

H
Hans Wennborg 已提交
2228
}  // namespace leveldb
J
jorlow@chromium.org 已提交
2229 2230

int main(int argc, char** argv) {
2231 2232
  leveldb::InstallStackTraceHandler();

2233
  FLAGS_write_buffer_size = leveldb::Options().write_buffer_size;
2234
  FLAGS_max_write_buffer_number = leveldb::Options().max_write_buffer_number;
2235 2236
  FLAGS_min_write_buffer_number_to_merge =
    leveldb::Options().min_write_buffer_number_to_merge;
2237
  FLAGS_open_files = leveldb::Options().max_open_files;
A
Abhishek Kona 已提交
2238
  FLAGS_max_background_compactions =
2239
    leveldb::Options().max_background_compactions;
2240 2241 2242 2243 2244
  FLAGS_compaction_style = leveldb::Options().compaction_style;
  FLAGS_universal_size_ratio =
    leveldb::Options().compaction_options_universal.size_ratio;
  FLAGS_compaction_universal_min_merge_width =
    leveldb::Options().compaction_options_universal.min_merge_width;
2245 2246
  // Compression test code above refers to FLAGS_block_size
  FLAGS_block_size = leveldb::Options().block_size;
H
Haobo Xu 已提交
2247 2248 2249
  FLAGS_use_os_buffer = leveldb::EnvOptions().use_os_buffer;
  FLAGS_use_mmap_reads = leveldb::EnvOptions().use_mmap_reads;
  FLAGS_use_mmap_writes = leveldb::EnvOptions().use_mmap_writes;
2250

H
heyongqiang 已提交
2251
  std::string default_db_path;
2252

J
jorlow@chromium.org 已提交
2253 2254 2255
  for (int i = 1; i < argc; i++) {
    double d;
    int n;
2256
    long l;
2257
    long long ll;
J
jorlow@chromium.org 已提交
2258
    char junk;
2259
    char buf[2048];
2260
    char str[512];
2261

J
jorlow@chromium.org 已提交
2262 2263 2264 2265 2266 2267 2268
    if (leveldb::Slice(argv[i]).starts_with("--benchmarks=")) {
      FLAGS_benchmarks = argv[i] + strlen("--benchmarks=");
    } else if (sscanf(argv[i], "--compression_ratio=%lf%c", &d, &junk) == 1) {
      FLAGS_compression_ratio = d;
    } else if (sscanf(argv[i], "--histogram=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_histogram = n;
2269 2270 2271
    } else if (sscanf(argv[i], "--use_existing_db=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_use_existing_db = n;
2272 2273 2274 2275 2276 2277
    } else if (sscanf(argv[i], "--num=%lld%c", &ll, &junk) == 1) {
      FLAGS_num = ll;
    } else if (sscanf(argv[i], "--numdistinct=%lld%c", &ll, &junk) == 1) {
      FLAGS_numdistinct = ll;
    } else if (sscanf(argv[i], "--reads=%lld%c", &ll, &junk) == 1) {
      FLAGS_reads = ll;
2278 2279
    } else if (sscanf(argv[i], "--read_range=%d%c", &n, &junk) == 1) {
      FLAGS_read_range = n;
T
Tyler Harter 已提交
2280 2281 2282 2283 2284 2285 2286

    } else if (sscanf(argv[i], "--use_prefix_blooms=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_use_prefix_blooms = n;
    } else if (sscanf(argv[i], "--use_prefix_api=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_use_prefix_api = n;
M
Mark Callaghan 已提交
2287 2288
    } else if (sscanf(argv[i], "--duration=%d%c", &n, &junk) == 1) {
      FLAGS_duration = n;
2289 2290
    } else if (sscanf(argv[i], "--seed=%ld%c", &l, &junk) == 1) {
      FLAGS_seed = l;
2291 2292
    } else if (sscanf(argv[i], "--threads=%d%c", &n, &junk) == 1) {
      FLAGS_threads = n;
J
jorlow@chromium.org 已提交
2293 2294
    } else if (sscanf(argv[i], "--value_size=%d%c", &n, &junk) == 1) {
      FLAGS_value_size = n;
2295 2296 2297 2298 2299 2300 2301
    } else if (sscanf(argv[i], "--key_size=%d%c", &n, &junk) == 1) {
      if (MAX_KEY_SIZE < n) {
         fprintf(stderr, "key_size should not be larger than %d\n", MAX_KEY_SIZE);
         exit(1);
      } else {
        FLAGS_key_size = n;
      }
J
jorlow@chromium.org 已提交
2302 2303
    } else if (sscanf(argv[i], "--write_buffer_size=%d%c", &n, &junk) == 1) {
      FLAGS_write_buffer_size = n;
2304 2305
    } else if (sscanf(argv[i], "--max_write_buffer_number=%d%c", &n, &junk) == 1) {
      FLAGS_max_write_buffer_number = n;
2306 2307 2308
    } else if (sscanf(argv[i], "--min_write_buffer_number_to_merge=%d%c",
               &n, &junk) == 1) {
      FLAGS_min_write_buffer_number_to_merge = n;
J
Jim Paton 已提交
2309 2310
    } else if (sscanf(argv[i], "--max_background_compactions=%d%c", &n, &junk)
               == 1) {
2311
      FLAGS_max_background_compactions = n;
2312 2313 2314 2315 2316
    } else if (sscanf(argv[i], "--compaction_style=%d%c", &n, &junk) == 1) {
      FLAGS_compaction_style = (leveldb::CompactionStyle)n;
    } else if (sscanf(argv[i], "--universal_size_ratio=%d%c", &n, &junk) == 1) {
      FLAGS_universal_size_ratio = n;
    } else if (sscanf(argv[i], "--universal_min_merge_width=%d%c",
2317
               &n, &junk) == 1) {
2318
      FLAGS_compaction_universal_min_merge_width = n;
2319 2320
    } else if (sscanf(argv[i], "--cache_size=%ld%c", &l, &junk) == 1) {
      FLAGS_cache_size = l;
2321 2322
    } else if (sscanf(argv[i], "--block_size=%d%c", &n, &junk) == 1) {
      FLAGS_block_size = n;
2323
    } else if (sscanf(argv[i], "--cache_numshardbits=%d%c", &n, &junk) == 1) {
2324 2325 2326 2327 2328 2329
      if (n < 20) {
        FLAGS_cache_numshardbits = n;
      } else {
        fprintf(stderr, "The cache cannot be sharded into 2**%d pieces\n", n);
        exit(1);
      }
2330
    } else if (sscanf(argv[i], "--table_cache_numshardbits=%d%c",
A
Abhishek Kona 已提交
2331
          &n, &junk) == 1) {
2332 2333 2334 2335 2336
      if (n <= 0 || n > 20) {
        fprintf(stderr, "The cache cannot be sharded into 2**%d pieces\n", n);
        exit(1);
      }
      FLAGS_table_cache_numshardbits = n;
S
Sanjay Ghemawat 已提交
2337 2338
    } else if (sscanf(argv[i], "--bloom_bits=%d%c", &n, &junk) == 1) {
      FLAGS_bloom_bits = n;
2339 2340
    } else if (sscanf(argv[i], "--open_files=%d%c", &n, &junk) == 1) {
      FLAGS_open_files = n;
2341 2342
    } else if (strncmp(argv[i], "--db=", 5) == 0) {
      FLAGS_db = argv[i] + 5;
2343 2344 2345
    } else if (sscanf(argv[i], "--verify_checksum=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_verify_checksum = n;
2346 2347
    } else if (sscanf(argv[i], "--bufferedio=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
2348
      FLAGS_use_os_buffer = n;
2349 2350
    } else if (sscanf(argv[i], "--mmap_read=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
2351
      FLAGS_use_mmap_reads = n;
2352 2353
    } else if (sscanf(argv[i], "--mmap_write=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
2354
      FLAGS_use_mmap_writes = n;
2355 2356 2357
    } else if (sscanf(argv[i], "--statistics=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      if (n == 1) {
H
Haobo Xu 已提交
2358
        dbstats = leveldb::CreateDBStatistics();
2359 2360
        FLAGS_statistics = true;
      }
2361 2362
    } else if (sscanf(argv[i], "--writes=%lld%c", &ll, &junk) == 1) {
      FLAGS_writes = ll;
2363 2364
    } else if (sscanf(argv[i], "--writes_per_second=%d%c", &n, &junk) == 1) {
      FLAGS_writes_per_second = n;
2365 2366 2367
    } else if (sscanf(argv[i], "--sync=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_sync = n;
2368
    } else if (sscanf(argv[i], "--readwritepercent=%d%c", &n, &junk) == 1 &&
2369
               n > 0 && n < 100) {
2370
      FLAGS_readwritepercent = n;
2371 2372 2373
    } else if (sscanf(argv[i], "--deletepercent=%d%c", &n, &junk) == 1 &&
               n > 0 && n < 100) {
      FLAGS_deletepercent = n;
H
heyongqiang 已提交
2374 2375 2376
    } else if (sscanf(argv[i], "--disable_data_sync=%d%c", &n, &junk) == 1 &&
        (n == 0 || n == 1)) {
      FLAGS_disable_data_sync = n;
2377 2378 2379
    } else if (sscanf(argv[i], "--use_fsync=%d%c", &n, &junk) == 1 &&
        (n == 0 || n == 1)) {
      FLAGS_use_fsync = n;
H
heyongqiang 已提交
2380
    } else if (sscanf(argv[i], "--disable_wal=%d%c", &n, &junk) == 1 &&
2381
        (n == 0 || n == 1)) {
H
heyongqiang 已提交
2382
      FLAGS_disable_wal = n;
M
Mark Callaghan 已提交
2383 2384 2385 2386 2387 2388
    } else if (sscanf(argv[i], "--use_snapshot=%d%c", &n, &junk) == 1 &&
        (n == 0 || n == 1)) {
      FLAGS_use_snapshot = n;
    } else if (sscanf(argv[i], "--get_approx=%d%c", &n, &junk) == 1 &&
        (n == 0 || n == 1)) {
      FLAGS_get_approx = n;
2389 2390
    } else if (sscanf(argv[i], "--hdfs=%s", buf) == 1) {
      FLAGS_env  = new leveldb::HdfsEnv(buf);
2391 2392 2393
    } else if (sscanf(argv[i], "--num_levels=%d%c",
        &n, &junk) == 1) {
      FLAGS_num_levels = n;
H
heyongqiang 已提交
2394 2395 2396 2397 2398 2399 2400
    } else if (sscanf(argv[i], "--target_file_size_base=%d%c",
        &n, &junk) == 1) {
      FLAGS_target_file_size_base = n;
    } else if ( sscanf(argv[i], "--target_file_size_multiplier=%d%c",
        &n, &junk) == 1) {
      FLAGS_target_file_size_multiplier = n;
    } else if (
2401 2402
        sscanf(argv[i], "--max_bytes_for_level_base=%ld%c", &l, &junk) == 1) {
      FLAGS_max_bytes_for_level_base = l;
H
heyongqiang 已提交
2403 2404 2405
    } else if (sscanf(argv[i], "--max_bytes_for_level_multiplier=%d%c",
        &n, &junk) == 1) {
      FLAGS_max_bytes_for_level_multiplier = n;
H
heyongqiang 已提交
2406 2407 2408
    } else if (sscanf(argv[i],"--level0_stop_writes_trigger=%d%c",
        &n, &junk) == 1) {
      FLAGS_level0_stop_writes_trigger = n;
2409 2410 2411 2412 2413 2414 2415 2416
    } else if (sscanf(argv[i],
                "--max_bytes_for_level_multiplier_additional=%s%c",
                str, &junk) == 1) {
      std::vector<std::string> fanout = leveldb::stringSplit(str, ',');
      for (unsigned int j= 0; j < fanout.size(); j++) {
        FLAGS_max_bytes_for_level_multiplier_additional.push_back(
          std::stoi(fanout[j]));
      }
H
heyongqiang 已提交
2417 2418 2419
    } else if (sscanf(argv[i],"--level0_slowdown_writes_trigger=%d%c",
        &n, &junk) == 1) {
      FLAGS_level0_slowdown_writes_trigger = n;
2420 2421 2422
    } else if (sscanf(argv[i],"--level0_file_num_compaction_trigger=%d%c",
        &n, &junk) == 1) {
      FLAGS_level0_file_num_compaction_trigger = n;
2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433 2434 2435
    } else if (strncmp(argv[i], "--compression_type=", 19) == 0) {
      const char* ctype = argv[i] + 19;
      if (!strcasecmp(ctype, "none"))
        FLAGS_compression_type = leveldb::kNoCompression;
      else if (!strcasecmp(ctype, "snappy"))
        FLAGS_compression_type = leveldb::kSnappyCompression;
      else if (!strcasecmp(ctype, "zlib"))
        FLAGS_compression_type = leveldb::kZlibCompression;
      else if (!strcasecmp(ctype, "bzip2"))
        FLAGS_compression_type = leveldb::kBZip2Compression;
      else {
        fprintf(stdout, "Cannot parse %s\n", argv[i]);
      }
J
Jim Paton 已提交
2436 2437 2438 2439 2440 2441 2442 2443 2444 2445 2446 2447 2448
    } else if (strncmp(argv[i], "--memtablerep=", 14) == 0) {
      const char* ctype = argv[i] + 14;
      if (!strcasecmp(ctype, "skip_list"))
        FLAGS_rep_factory = kSkipList;
      else if (!strcasecmp(ctype, "prefix_hash"))
        FLAGS_rep_factory = kPrefixHash;
      else if (!strcasecmp(ctype, "unsorted"))
        FLAGS_rep_factory = kUnsorted;
      else if (!strcasecmp(ctype, "vector"))
        FLAGS_rep_factory = kVectorRep;
      else {
        fprintf(stdout, "Cannot parse %s\n", argv[i]);
      }
2449 2450
    } else if (sscanf(argv[i], "--min_level_to_compress=%d%c", &n, &junk) == 1
        && n >= 0) {
2451
      FLAGS_min_level_to_compress = n;
2452 2453 2454
    } else if (sscanf(argv[i], "--disable_seek_compaction=%d%c", &n, &junk) == 1
        && (n == 0 || n == 1)) {
      FLAGS_disable_seek_compaction = n;
2455 2456
    } else if (sscanf(argv[i], "--delete_obsolete_files_period_micros=%ld%c",
                      &l, &junk) == 1) {
2457
      FLAGS_delete_obsolete_files_period_micros = l;
2458 2459
    } else if (sscanf(argv[i], "--stats_interval=%lld%c", &ll, &junk) == 1) {
      FLAGS_stats_interval = ll;
2460 2461 2462
    } else if (sscanf(argv[i], "--stats_per_interval=%d%c", &n, &junk) == 1
        && (n == 0 || n == 1)) {
      FLAGS_stats_per_interval = n;
J
Jim Paton 已提交
2463 2464 2465
    } else if (sscanf(argv[i], "--prefix_size=%d%c", &n, &junk) == 1 &&
               n >= 0 && n < 2000000000) {
      FLAGS_prefix_size = n;
J
Jim Paton 已提交
2466 2467 2468 2469
    } else if (sscanf(argv[i], "--soft_rate_limit=%lf%c", &d, &junk) == 1 &&
               d > 0.0) {
      FLAGS_soft_rate_limit = d;
    } else if (sscanf(argv[i], "--hard_rate_limit=%lf%c", &d, &junk) == 1 &&
2470
               d > 1.0) {
J
Jim Paton 已提交
2471
      FLAGS_hard_rate_limit = d;
2472
    } else if (sscanf(argv[i],
J
Jim Paton 已提交
2473 2474 2475
               "--rate_limit_delay_max_milliseconds=%d%c", &n, &junk) == 1
        && n >= 0) {
      FLAGS_rate_limit_delay_max_milliseconds = n;
H
heyongqiang 已提交
2476 2477 2478
    } else if (sscanf(argv[i], "--readonly=%d%c", &n, &junk) == 1 &&
        (n == 0 || n ==1 )) {
      FLAGS_read_only = n;
2479 2480 2481
    } else if (sscanf(argv[i], "--max_grandparent_overlap_factor=%d%c",
               &n, &junk) == 1) {
      FLAGS_max_grandparent_overlap_factor = n;
A
Abhishek Kona 已提交
2482
    } else if (sscanf(argv[i], "--disable_auto_compactions=%d%c",
2483 2484
               &n, &junk) == 1 && (n == 0 || n ==1)) {
      FLAGS_disable_auto_compactions = n;
A
Abhishek Kona 已提交
2485
    } else if (sscanf(argv[i], "--source_compaction_factor=%d%c",
2486 2487
               &n, &junk) == 1 && n > 0) {
      FLAGS_source_compaction_factor = n;
2488 2489
    } else if (sscanf(argv[i], "--wal_ttl=%d%c", &n, &junk) == 1) {
      FLAGS_WAL_ttl_seconds = static_cast<uint64_t>(n);
2490 2491 2492 2493 2494 2495 2496 2497 2498 2499 2500 2501 2502 2503 2504
    } else if (sscanf(argv[i], "--advise_random_on_open=%d%c", &n, &junk) == 1
               && (n == 0 || n ==1 )) {
      FLAGS_advise_random_on_open = n;
    } else if (sscanf(argv[i], "--compaction_fadvice=%s", buf) == 1) {
      if (!strcasecmp(buf, "NONE"))
        FLAGS_compaction_fadvice = leveldb::Options::NONE;
      else if (!strcasecmp(buf, "NORMAL"))
        FLAGS_compaction_fadvice = leveldb::Options::NORMAL;
      else if (!strcasecmp(buf, "SEQUENTIAL"))
        FLAGS_compaction_fadvice = leveldb::Options::SEQUENTIAL;
      else if (!strcasecmp(buf, "WILLNEED"))
        FLAGS_compaction_fadvice = leveldb::Options::WILLNEED;
      else {
        fprintf(stdout, "Unknown compaction fadvice:%s\n", buf);
      }
H
Haobo Xu 已提交
2505 2506 2507
    } else if (sscanf(argv[i], "--use_adaptive_mutex=%d%c", &n, &junk) == 1
               && (n == 0 || n ==1 )) {
      FLAGS_use_adaptive_mutex = n;
2508 2509 2510 2511 2512 2513
    } else if (sscanf(argv[i], "--use_multiget=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_use_multiget = n;
    } else if (sscanf(argv[i], "--keys_per_multiget=%d%c",
               &n, &junk) == 1) {
      FLAGS_keys_per_multiget = n;
D
Deon Nicholas 已提交
2514
    } else if (sscanf(argv[i], "--bytes_per_sync=%ld%c", &l, &junk) == 1) {
H
Haobo Xu 已提交
2515
      FLAGS_bytes_per_sync = l;
2516
    } else if (sscanf(argv[i], "--filter_deletes=%d%c", &n, &junk)
2517
               == 1 && (n == 0 || n ==1 )) {
2518
      FLAGS_filter_deletes = n;
D
Deon Nicholas 已提交
2519 2520
    } else if (sscanf(argv[i], "--merge_operator=%s", buf) == 1) {
      FLAGS_merge_operator = buf;
2521
    } else {
J
jorlow@chromium.org 已提交
2522 2523 2524 2525 2526
      fprintf(stderr, "Invalid flag '%s'\n", argv[i]);
      exit(1);
    }
  }

2527 2528 2529 2530
  // The number of background threads should be at least as much the
  // max number of concurrent compactions.
  FLAGS_env->SetBackgroundThreads(FLAGS_max_background_compactions);

H
heyongqiang 已提交
2531
  // Choose a location for the test database if none given with --db=<path>
2532
  if (FLAGS_db == nullptr) {
H
heyongqiang 已提交
2533 2534 2535 2536 2537
      leveldb::Env::Default()->GetTestDirectory(&default_db_path);
      default_db_path += "/dbbench";
      FLAGS_db = default_db_path.c_str();
  }

J
jorlow@chromium.org 已提交
2538 2539 2540 2541
  leveldb::Benchmark benchmark;
  benchmark.Run();
  return 0;
}