db_bench.cc 29.1 KB
Newer Older
J
jorlow@chromium.org 已提交
1 2 3 4 5 6 7 8 9
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file. See the AUTHORS file for names of contributors.

#include <sys/types.h>
#include <stdio.h>
#include <stdlib.h>
#include "db/db_impl.h"
#include "db/version_set.h"
10 11 12 13
#include "leveldb/cache.h"
#include "leveldb/db.h"
#include "leveldb/env.h"
#include "leveldb/write_batch.h"
J
jorlow@chromium.org 已提交
14 15
#include "port/port.h"
#include "util/crc32c.h"
J
jorlow@chromium.org 已提交
16
#include "util/histogram.h"
17
#include "util/mutexlock.h"
J
jorlow@chromium.org 已提交
18 19 20 21 22
#include "util/random.h"
#include "util/testutil.h"

// Comma-separated list of operations to run in the specified order
//   Actual benchmarks:
23 24 25 26 27
//      fillseq       -- write N values in sequential key order in async mode
//      fillrandom    -- write N values in random key order in async mode
//      overwrite     -- overwrite N values in random key order in async mode
//      fillsync      -- write N/100 values in random key order in sync mode
//      fill100K      -- write N/1000 100K values in random order in async mode
S
Sanjay Ghemawat 已提交
28 29
//      deleteseq     -- delete N keys in sequential order
//      deleterandom  -- delete N keys in random order
30 31 32
//      readseq       -- read N times sequentially
//      readreverse   -- read N times in reverse order
//      readrandom    -- read N times in random order
S
Sanjay Ghemawat 已提交
33
//      readmissing   -- read N missing keys in random order
34
//      readhot       -- read N times in random order from 1% section of DB
S
Sanjay Ghemawat 已提交
35
//      seekrandom    -- N random seeks
J
jorlow@chromium.org 已提交
36
//      crc32c        -- repeated crc32c of 4K of data
37
//      acquireload   -- load N*1000 times
J
jorlow@chromium.org 已提交
38 39
//   Meta operations:
//      compact     -- Compact the entire DB
40
//      stats       -- Print DB stats
S
Sanjay Ghemawat 已提交
41
//      sstables    -- Print sstable info
J
jorlow@chromium.org 已提交
42 43
//      heapprofile -- Dump a heap profile (if supported by this port)
static const char* FLAGS_benchmarks =
44
    "fillseq,"
J
jorlow@chromium.org 已提交
45
    "fillsync,"
46 47
    "fillrandom,"
    "overwrite,"
J
jorlow@chromium.org 已提交
48 49
    "readrandom,"
    "readrandom,"  // Extra run to allow previous compactions to quiesce
J
jorlow@chromium.org 已提交
50
    "readseq,"
J
jorlow@chromium.org 已提交
51
    "readreverse,"
J
jorlow@chromium.org 已提交
52
    "compact,"
J
jorlow@chromium.org 已提交
53
    "readrandom,"
J
jorlow@chromium.org 已提交
54
    "readseq,"
J
jorlow@chromium.org 已提交
55
    "readreverse,"
J
jorlow@chromium.org 已提交
56 57
    "fill100K,"
    "crc32c,"
58 59
    "snappycomp,"
    "snappyuncomp,"
60
    "acquireload,"
J
jorlow@chromium.org 已提交
61
    ;
J
jorlow@chromium.org 已提交
62 63

// Number of key/values to place in database
64
static long FLAGS_num = 1000000;
J
jorlow@chromium.org 已提交
65

66
// Number of read operations to do.  If negative, do FLAGS_num reads.
67
static long FLAGS_reads = -1;
68

69 70 71
// Number of concurrent threads to run.
static int FLAGS_threads = 1;

J
jorlow@chromium.org 已提交
72 73 74 75 76
// Size of each value
static int FLAGS_value_size = 100;

// Arrange to generate values that shrink to this fraction of
// their original size after compression
77
static double FLAGS_compression_ratio = 0.5;
J
jorlow@chromium.org 已提交
78 79 80 81 82

// Print histogram of operation timings
static bool FLAGS_histogram = false;

// Number of bytes to buffer in memtable before compacting
83 84 85 86 87
// (initialized to default value by "main")
static int FLAGS_write_buffer_size = 0;

// Number of bytes to use as a cache of uncompressed data.
// Negative means use default settings.
D
Dhruba Borthakur 已提交
88
static long FLAGS_cache_size = -1;
J
jorlow@chromium.org 已提交
89

90 91 92
// Maximum number of files to keep open at the same time (use default if == 0)
static int FLAGS_open_files = 0;

S
Sanjay Ghemawat 已提交
93 94 95 96
// Bloom filter bits per key.
// Negative means use default settings.
static int FLAGS_bloom_bits = -1;

97 98 99 100 101
// If true, do not destroy the existing database.  If you set this
// flag and also specify a benchmark that wants a fresh database, that
// benchmark will fail.
static bool FLAGS_use_existing_db = false;

102 103 104
// Use the db with the following name.
static const char* FLAGS_db = "/tmp/dbbench";

105 106 107 108 109
// Number of shards for the block cache is 2 ** FLAGS_cache_numshardbits.
// Negative means use default settings. This is applied only
// if FLAGS_cache_size is non-negative.
static int FLAGS_cache_numshardbits = -1;

110 111 112
// Verify checksum for every block read from storage
static bool FLAGS_verify_checksum = false;

J
jorlow@chromium.org 已提交
113 114 115
namespace leveldb {

namespace {
116 117

// Helper for quickly generating random data.
J
jorlow@chromium.org 已提交
118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147
class RandomGenerator {
 private:
  std::string data_;
  int pos_;

 public:
  RandomGenerator() {
    // We use a limited amount of data over and over again and ensure
    // that it is larger than the compression window (32KB), and also
    // large enough to serve all typical value sizes we want to write.
    Random rnd(301);
    std::string piece;
    while (data_.size() < 1048576) {
      // Add a short fragment that is as compressible as specified
      // by FLAGS_compression_ratio.
      test::CompressibleString(&rnd, FLAGS_compression_ratio, 100, &piece);
      data_.append(piece);
    }
    pos_ = 0;
  }

  Slice Generate(int len) {
    if (pos_ + len > data_.size()) {
      pos_ = 0;
      assert(len < data_.size());
    }
    pos_ += len;
    return Slice(data_.data() + pos_ - len, len);
  }
};
148 149 150 151 152 153 154 155 156 157 158 159 160

static Slice TrimSpace(Slice s) {
  int start = 0;
  while (start < s.size() && isspace(s[start])) {
    start++;
  }
  int limit = s.size();
  while (limit > start && isspace(s[limit-1])) {
    limit--;
  }
  return Slice(s.data() + start, limit - start);
}

161 162 163 164 165 166 167 168 169 170 171 172 173
static void AppendWithSpace(std::string* str, Slice msg) {
  if (msg.empty()) return;
  if (!str->empty()) {
    str->push_back(' ');
  }
  str->append(msg.data(), msg.size());
}

class Stats {
 private:
  double start_;
  double finish_;
  double seconds_;
174
  long done_;
175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237
  int next_report_;
  int64_t bytes_;
  double last_op_finish_;
  Histogram hist_;
  std::string message_;

 public:
  Stats() { Start(); }

  void Start() {
    next_report_ = 100;
    last_op_finish_ = start_;
    hist_.Clear();
    done_ = 0;
    bytes_ = 0;
    seconds_ = 0;
    start_ = Env::Default()->NowMicros();
    finish_ = start_;
    message_.clear();
  }

  void Merge(const Stats& other) {
    hist_.Merge(other.hist_);
    done_ += other.done_;
    bytes_ += other.bytes_;
    seconds_ += other.seconds_;
    if (other.start_ < start_) start_ = other.start_;
    if (other.finish_ > finish_) finish_ = other.finish_;

    // Just keep the messages from one thread
    if (message_.empty()) message_ = other.message_;
  }

  void Stop() {
    finish_ = Env::Default()->NowMicros();
    seconds_ = (finish_ - start_) * 1e-6;
  }

  void AddMessage(Slice msg) {
    AppendWithSpace(&message_, msg);
  }

  void FinishedSingleOp() {
    if (FLAGS_histogram) {
      double now = Env::Default()->NowMicros();
      double micros = now - last_op_finish_;
      hist_.Add(micros);
      if (micros > 20000) {
        fprintf(stderr, "long op: %.1f micros%30s\r", micros, "");
        fflush(stderr);
      }
      last_op_finish_ = now;
    }

    done_++;
    if (done_ >= next_report_) {
      if      (next_report_ < 1000)   next_report_ += 100;
      else if (next_report_ < 5000)   next_report_ += 500;
      else if (next_report_ < 10000)  next_report_ += 1000;
      else if (next_report_ < 50000)  next_report_ += 5000;
      else if (next_report_ < 100000) next_report_ += 10000;
      else if (next_report_ < 500000) next_report_ += 50000;
      else                            next_report_ += 100000;
238
      fprintf(stderr, "... finished %ld ops%30s\r", done_, "");
239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262
      fflush(stderr);
    }
  }

  void AddBytes(int64_t n) {
    bytes_ += n;
  }

  void Report(const Slice& name) {
    // Pretend at least one op was done in case we are running a benchmark
    // that does not call FinishedSingleOp().
    if (done_ < 1) done_ = 1;

    std::string extra;
    if (bytes_ > 0) {
      // Rate is computed on actual elapsed time, not the sum of per-thread
      // elapsed times.
      double elapsed = (finish_ - start_) * 1e-6;
      char rate[100];
      snprintf(rate, sizeof(rate), "%6.1f MB/s",
               (bytes_ / 1048576.0) / elapsed);
      extra = rate;
    }
    AppendWithSpace(&extra, message_);
263 264
    double elapsed = (finish_ - start_) * 1e-6;
    double throughput = (double)done_/elapsed;
265

D
Dhruba Borthakur 已提交
266
    fprintf(stdout, "%-12s : %11.3f micros/op %ld ops/sec;%s%s\n",
267 268
            name.ToString().c_str(),
            seconds_ * 1e6 / done_,
D
Dhruba Borthakur 已提交
269
            (long)throughput,
270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290
            (extra.empty() ? "" : " "),
            extra.c_str());
    if (FLAGS_histogram) {
      fprintf(stdout, "Microseconds per op:\n%s\n", hist_.ToString().c_str());
    }
    fflush(stdout);
  }
};

// State shared by all concurrent executions of the same benchmark.
struct SharedState {
  port::Mutex mu;
  port::CondVar cv;
  int total;

  // Each thread goes through the following states:
  //    (1) initializing
  //    (2) waiting for others to be initialized
  //    (3) running
  //    (4) done

291 292
  long num_initialized;
  long num_done;
293 294 295 296 297 298 299 300 301 302
  bool start;

  SharedState() : cv(&mu) { }
};

// Per-thread state for concurrent executions of the same benchmark.
struct ThreadState {
  int tid;             // 0..n-1 when running in n threads
  Random rand;         // Has different seeds for different threads
  Stats stats;
303
  SharedState* shared;
304 305 306 307 308 309 310

  ThreadState(int index)
      : tid(index),
        rand(1000 + index) {
  }
};

H
Hans Wennborg 已提交
311
}  // namespace
J
jorlow@chromium.org 已提交
312 313 314 315

class Benchmark {
 private:
  Cache* cache_;
S
Sanjay Ghemawat 已提交
316
  const FilterPolicy* filter_policy_;
J
jorlow@chromium.org 已提交
317
  DB* db_;
318
  long num_;
319 320 321
  int value_size_;
  int entries_per_batch_;
  WriteOptions write_options_;
322
  long reads_;
J
jorlow@chromium.org 已提交
323 324
  int heap_counter_;

325 326 327 328 329 330 331
  void PrintHeader() {
    const int kKeySize = 16;
    PrintEnvironment();
    fprintf(stdout, "Keys:       %d bytes each\n", kKeySize);
    fprintf(stdout, "Values:     %d bytes each (%d bytes after compression)\n",
            FLAGS_value_size,
            static_cast<int>(FLAGS_value_size * FLAGS_compression_ratio + 0.5));
332
    fprintf(stdout, "Entries:    %ld\n", num_);
333
    fprintf(stdout, "RawSize:    %.1f MB (estimated)\n",
334 335
            ((static_cast<int64_t>(kKeySize + FLAGS_value_size) * num_)
             / 1048576.0));
336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352
    fprintf(stdout, "FileSize:   %.1f MB (estimated)\n",
            (((kKeySize + FLAGS_value_size * FLAGS_compression_ratio) * num_)
             / 1048576.0));
    PrintWarnings();
    fprintf(stdout, "------------------------------------------------\n");
  }

  void PrintWarnings() {
#if defined(__GNUC__) && !defined(__OPTIMIZE__)
    fprintf(stdout,
            "WARNING: Optimization is disabled: benchmarks unnecessarily slow\n"
            );
#endif
#ifndef NDEBUG
    fprintf(stdout,
            "WARNING: Assertions are enabled; benchmarks unnecessarily slow\n");
#endif
353 354 355 356 357 358 359 360 361

    // See if snappy is working by attempting to compress a compressible string
    const char text[] = "yyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyyy";
    std::string compressed;
    if (!port::Snappy_Compress(text, sizeof(text), &compressed)) {
      fprintf(stdout, "WARNING: Snappy compression is not enabled\n");
    } else if (compressed.size() >= sizeof(text)) {
      fprintf(stdout, "WARNING: Snappy compression is not effective\n");
    }
362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398
  }

  void PrintEnvironment() {
    fprintf(stderr, "LevelDB:    version %d.%d\n",
            kMajorVersion, kMinorVersion);

#if defined(__linux)
    time_t now = time(NULL);
    fprintf(stderr, "Date:       %s", ctime(&now));  // ctime() adds newline

    FILE* cpuinfo = fopen("/proc/cpuinfo", "r");
    if (cpuinfo != NULL) {
      char line[1000];
      int num_cpus = 0;
      std::string cpu_type;
      std::string cache_size;
      while (fgets(line, sizeof(line), cpuinfo) != NULL) {
        const char* sep = strchr(line, ':');
        if (sep == NULL) {
          continue;
        }
        Slice key = TrimSpace(Slice(line, sep - 1 - line));
        Slice val = TrimSpace(Slice(sep + 1));
        if (key == "model name") {
          ++num_cpus;
          cpu_type = val.ToString();
        } else if (key == "cache size") {
          cache_size = val.ToString();
        }
      }
      fclose(cpuinfo);
      fprintf(stderr, "CPU:        %d * %s\n", num_cpus, cpu_type.c_str());
      fprintf(stderr, "CPUCache:   %s\n", cache_size.c_str());
    }
#endif
  }

J
jorlow@chromium.org 已提交
399
 public:
400
  Benchmark()
401 402 403 404
  : cache_(FLAGS_cache_size >= 0 ? 
           (FLAGS_cache_numshardbits >= 1 ? 
            NewLRUCache(FLAGS_cache_size, FLAGS_cache_numshardbits) : 
            NewLRUCache(FLAGS_cache_size)) : NULL),
S
Sanjay Ghemawat 已提交
405 406 407
    filter_policy_(FLAGS_bloom_bits >= 0
                   ? NewBloomFilterPolicy(FLAGS_bloom_bits)
                   : NULL),
408 409
    db_(NULL),
    num_(FLAGS_num),
410 411
    value_size_(FLAGS_value_size),
    entries_per_batch_(1),
412
    reads_(FLAGS_reads < 0 ? FLAGS_num : FLAGS_reads),
413
    heap_counter_(0) {
J
jorlow@chromium.org 已提交
414
    std::vector<std::string> files;
415
    Env::Default()->GetChildren(FLAGS_db, &files);
J
jorlow@chromium.org 已提交
416 417
    for (int i = 0; i < files.size(); i++) {
      if (Slice(files[i]).starts_with("heap-")) {
418
        Env::Default()->DeleteFile(std::string(FLAGS_db) + "/" + files[i]);
J
jorlow@chromium.org 已提交
419 420
      }
    }
421
    if (!FLAGS_use_existing_db) {
422
      DestroyDB(FLAGS_db, Options());
423
    }
J
jorlow@chromium.org 已提交
424 425 426 427 428
  }

  ~Benchmark() {
    delete db_;
    delete cache_;
S
Sanjay Ghemawat 已提交
429
    delete filter_policy_;
J
jorlow@chromium.org 已提交
430 431 432
  }

  void Run() {
433 434
    PrintHeader();
    Open();
J
jorlow@chromium.org 已提交
435 436 437 438 439 440 441 442 443 444 445 446 447

    const char* benchmarks = FLAGS_benchmarks;
    while (benchmarks != NULL) {
      const char* sep = strchr(benchmarks, ',');
      Slice name;
      if (sep == NULL) {
        name = benchmarks;
        benchmarks = NULL;
      } else {
        name = Slice(benchmarks, sep - benchmarks);
        benchmarks = sep + 1;
      }

448 449
      // Reset parameters that may be overriddden bwlow
      num_ = FLAGS_num;
450
      reads_ = (FLAGS_reads < 0 ? FLAGS_num : FLAGS_reads);
451 452 453 454 455 456
      value_size_ = FLAGS_value_size;
      entries_per_batch_ = 1;
      write_options_ = WriteOptions();

      void (Benchmark::*method)(ThreadState*) = NULL;
      bool fresh_db = false;
457
      int num_threads = FLAGS_threads;
458 459

      if (name == Slice("fillseq")) {
460 461
        fresh_db = true;
        method = &Benchmark::WriteSeq;
462
      } else if (name == Slice("fillbatch")) {
463 464 465
        fresh_db = true;
        entries_per_batch_ = 1000;
        method = &Benchmark::WriteSeq;
466
      } else if (name == Slice("fillrandom")) {
467 468
        fresh_db = true;
        method = &Benchmark::WriteRandom;
469
      } else if (name == Slice("overwrite")) {
470 471
        fresh_db = false;
        method = &Benchmark::WriteRandom;
472
      } else if (name == Slice("fillsync")) {
473 474 475 476
        fresh_db = true;
        num_ /= 1000;
        write_options_.sync = true;
        method = &Benchmark::WriteRandom;
477
      } else if (name == Slice("fill100K")) {
478 479 480 481
        fresh_db = true;
        num_ /= 1000;
        value_size_ = 100 * 1000;
        method = &Benchmark::WriteRandom;
J
jorlow@chromium.org 已提交
482
      } else if (name == Slice("readseq")) {
483
        method = &Benchmark::ReadSequential;
J
jorlow@chromium.org 已提交
484
      } else if (name == Slice("readreverse")) {
485
        method = &Benchmark::ReadReverse;
J
jorlow@chromium.org 已提交
486
      } else if (name == Slice("readrandom")) {
487
        method = &Benchmark::ReadRandom;
S
Sanjay Ghemawat 已提交
488 489 490 491
      } else if (name == Slice("readmissing")) {
        method = &Benchmark::ReadMissing;
      } else if (name == Slice("seekrandom")) {
        method = &Benchmark::SeekRandom;
492
      } else if (name == Slice("readhot")) {
493
        method = &Benchmark::ReadHot;
494
      } else if (name == Slice("readrandomsmall")) {
495
        reads_ /= 1000;
496
        method = &Benchmark::ReadRandom;
S
Sanjay Ghemawat 已提交
497 498 499 500
      } else if (name == Slice("deleteseq")) {
        method = &Benchmark::DeleteSeq;
      } else if (name == Slice("deleterandom")) {
        method = &Benchmark::DeleteRandom;
501 502 503
      } else if (name == Slice("readwhilewriting")) {
        num_threads++;  // Add extra thread for writing
        method = &Benchmark::ReadWhileWriting;
J
jorlow@chromium.org 已提交
504
      } else if (name == Slice("compact")) {
505
        method = &Benchmark::Compact;
J
jorlow@chromium.org 已提交
506
      } else if (name == Slice("crc32c")) {
507
        method = &Benchmark::Crc32c;
508
      } else if (name == Slice("acquireload")) {
509
        method = &Benchmark::AcquireLoad;
510
      } else if (name == Slice("snappycomp")) {
511
        method = &Benchmark::SnappyCompress;
512
      } else if (name == Slice("snappyuncomp")) {
513
        method = &Benchmark::SnappyUncompress;
J
jorlow@chromium.org 已提交
514 515
      } else if (name == Slice("heapprofile")) {
        HeapProfile();
516
      } else if (name == Slice("stats")) {
S
Sanjay Ghemawat 已提交
517 518 519
        PrintStats("leveldb.stats");
      } else if (name == Slice("sstables")) {
        PrintStats("leveldb.sstables");
J
jorlow@chromium.org 已提交
520
      } else {
521 522 523 524
        if (name != Slice()) {  // No error message for empty name
          fprintf(stderr, "unknown benchmark '%s'\n", name.ToString().c_str());
        }
      }
525 526 527 528 529 530 531 532 533 534 535 536 537 538 539

      if (fresh_db) {
        if (FLAGS_use_existing_db) {
          fprintf(stdout, "%-12s : skipped (--use_existing_db is true)\n",
                  name.ToString().c_str());
          method = NULL;
        } else {
          delete db_;
          db_ = NULL;
          DestroyDB(FLAGS_db, Options());
          Open();
        }
      }

      if (method != NULL) {
540
        RunBenchmark(num_threads, name, method);
J
jorlow@chromium.org 已提交
541 542 543 544
      }
    }
  }

545
 private:
546 547 548 549 550 551 552 553 554 555 556 557 558 559 560 561 562 563 564 565 566 567 568 569 570 571 572 573 574 575 576 577 578 579 580
  struct ThreadArg {
    Benchmark* bm;
    SharedState* shared;
    ThreadState* thread;
    void (Benchmark::*method)(ThreadState*);
  };

  static void ThreadBody(void* v) {
    ThreadArg* arg = reinterpret_cast<ThreadArg*>(v);
    SharedState* shared = arg->shared;
    ThreadState* thread = arg->thread;
    {
      MutexLock l(&shared->mu);
      shared->num_initialized++;
      if (shared->num_initialized >= shared->total) {
        shared->cv.SignalAll();
      }
      while (!shared->start) {
        shared->cv.Wait();
      }
    }

    thread->stats.Start();
    (arg->bm->*(arg->method))(thread);
    thread->stats.Stop();

    {
      MutexLock l(&shared->mu);
      shared->num_done++;
      if (shared->num_done >= shared->total) {
        shared->cv.SignalAll();
      }
    }
  }

581 582
  void RunBenchmark(int n, Slice name,
                    void (Benchmark::*method)(ThreadState*)) {
583 584 585 586 587 588 589 590 591 592 593 594
    SharedState shared;
    shared.total = n;
    shared.num_initialized = 0;
    shared.num_done = 0;
    shared.start = false;

    ThreadArg* arg = new ThreadArg[n];
    for (int i = 0; i < n; i++) {
      arg[i].bm = this;
      arg[i].method = method;
      arg[i].shared = &shared;
      arg[i].thread = new ThreadState(i);
595
      arg[i].thread->shared = &shared;
596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622
      Env::Default()->StartThread(ThreadBody, &arg[i]);
    }

    shared.mu.Lock();
    while (shared.num_initialized < n) {
      shared.cv.Wait();
    }

    shared.start = true;
    shared.cv.SignalAll();
    while (shared.num_done < n) {
      shared.cv.Wait();
    }
    shared.mu.Unlock();

    for (int i = 1; i < n; i++) {
      arg[0].thread->stats.Merge(arg[i].thread->stats);
    }
    arg[0].thread->stats.Report(name);

    for (int i = 0; i < n; i++) {
      delete arg[i].thread;
    }
    delete[] arg;
  }

  void Crc32c(ThreadState* thread) {
J
jorlow@chromium.org 已提交
623
    // Checksum about 500MB of data total
624 625
    const int size = 4096;
    const char* label = "(4K per op)";
J
jorlow@chromium.org 已提交
626
    std::string data(size, 'x');
J
jorlow@chromium.org 已提交
627 628 629 630
    int64_t bytes = 0;
    uint32_t crc = 0;
    while (bytes < 500 * 1048576) {
      crc = crc32c::Value(data.data(), size);
631
      thread->stats.FinishedSingleOp();
J
jorlow@chromium.org 已提交
632 633 634 635 636
      bytes += size;
    }
    // Print so result is not dead
    fprintf(stderr, "... crc=0x%x\r", static_cast<unsigned int>(crc));

637 638
    thread->stats.AddBytes(bytes);
    thread->stats.AddMessage(label);
J
jorlow@chromium.org 已提交
639 640
  }

641
  void AcquireLoad(ThreadState* thread) {
642 643 644 645
    int dummy;
    port::AtomicPointer ap(&dummy);
    int count = 0;
    void *ptr = NULL;
646
    thread->stats.AddMessage("(each op is 1000 loads)");
647 648 649 650 651
    while (count < 100000) {
      for (int i = 0; i < 1000; i++) {
        ptr = ap.Acquire_Load();
      }
      count++;
652
      thread->stats.FinishedSingleOp();
653 654 655 656
    }
    if (ptr == NULL) exit(1); // Disable unused variable warning.
  }

657 658 659
  void SnappyCompress(ThreadState* thread) {
    RandomGenerator gen;
    Slice input = gen.Generate(Options().block_size);
660 661 662 663 664 665 666 667
    int64_t bytes = 0;
    int64_t produced = 0;
    bool ok = true;
    std::string compressed;
    while (ok && bytes < 1024 * 1048576) {  // Compress 1G
      ok = port::Snappy_Compress(input.data(), input.size(), &compressed);
      produced += compressed.size();
      bytes += input.size();
668
      thread->stats.FinishedSingleOp();
669 670 671
    }

    if (!ok) {
672
      thread->stats.AddMessage("(snappy failure)");
673 674 675 676
    } else {
      char buf[100];
      snprintf(buf, sizeof(buf), "(output: %.1f%%)",
               (produced * 100.0) / bytes);
677 678
      thread->stats.AddMessage(buf);
      thread->stats.AddBytes(bytes);
679 680 681
    }
  }

682 683 684
  void SnappyUncompress(ThreadState* thread) {
    RandomGenerator gen;
    Slice input = gen.Generate(Options().block_size);
685 686 687
    std::string compressed;
    bool ok = port::Snappy_Compress(input.data(), input.size(), &compressed);
    int64_t bytes = 0;
688
    char* uncompressed = new char[input.size()];
689 690
    while (ok && bytes < 1024 * 1048576) {  // Compress 1G
      ok =  port::Snappy_Uncompress(compressed.data(), compressed.size(),
691 692
                                    uncompressed);
      bytes += input.size();
693
      thread->stats.FinishedSingleOp();
694
    }
695
    delete[] uncompressed;
696 697

    if (!ok) {
698
      thread->stats.AddMessage("(snappy failure)");
699
    } else {
700
      thread->stats.AddBytes(bytes);
701 702 703
    }
  }

704 705 706
  void Open() {
    assert(db_ == NULL);
    Options options;
707
    options.create_if_missing = !FLAGS_use_existing_db;
708 709
    options.block_cache = cache_;
    options.write_buffer_size = FLAGS_write_buffer_size;
S
Sanjay Ghemawat 已提交
710
    options.filter_policy = filter_policy_;
711
    Status s = DB::Open(options, FLAGS_db, &db_);
712 713 714 715 716 717
    if (!s.ok()) {
      fprintf(stderr, "open error: %s\n", s.ToString().c_str());
      exit(1);
    }
  }

718 719 720
  void WriteSeq(ThreadState* thread) {
    DoWrite(thread, true);
  }
721

722 723 724 725 726 727
  void WriteRandom(ThreadState* thread) {
    DoWrite(thread, false);
  }

  void DoWrite(ThreadState* thread, bool seq) {
    if (num_ != FLAGS_num) {
728
      char msg[100];
729 730
      snprintf(msg, sizeof(msg), "(%d ops)", num_);
      thread->stats.AddMessage(msg);
731 732
    }

733
    RandomGenerator gen;
J
jorlow@chromium.org 已提交
734 735
    WriteBatch batch;
    Status s;
736 737
    int64_t bytes = 0;
    for (int i = 0; i < num_; i += entries_per_batch_) {
J
jorlow@chromium.org 已提交
738
      batch.Clear();
739 740
      for (int j = 0; j < entries_per_batch_; j++) {
        const int k = seq ? i+j : (thread->rand.Next() % FLAGS_num);
741 742
        char key[100];
        snprintf(key, sizeof(key), "%016d", k);
743 744 745
        batch.Put(key, gen.Generate(value_size_));
        bytes += value_size_ + strlen(key);
        thread->stats.FinishedSingleOp();
746
      }
747
      s = db_->Write(write_options_, &batch);
J
jorlow@chromium.org 已提交
748 749 750 751 752
      if (!s.ok()) {
        fprintf(stderr, "put error: %s\n", s.ToString().c_str());
        exit(1);
      }
    }
753
    thread->stats.AddBytes(bytes);
J
jorlow@chromium.org 已提交
754 755
  }

756
  void ReadSequential(ThreadState* thread) {
757
    Iterator* iter = db_->NewIterator(ReadOptions(FLAGS_verify_checksum, true));
758
    long i = 0;
759
    int64_t bytes = 0;
760
    for (iter->SeekToFirst(); i < reads_ && iter->Valid(); iter->Next()) {
761 762
      bytes += iter->key().size() + iter->value().size();
      thread->stats.FinishedSingleOp();
763 764 765
      ++i;
    }
    delete iter;
766
    thread->stats.AddBytes(bytes);
767 768
  }

769
  void ReadReverse(ThreadState* thread) {
770
    Iterator* iter = db_->NewIterator(ReadOptions(FLAGS_verify_checksum, true));
771
    long i = 0;
772
    int64_t bytes = 0;
773
    for (iter->SeekToLast(); i < reads_ && iter->Valid(); iter->Prev()) {
774 775
      bytes += iter->key().size() + iter->value().size();
      thread->stats.FinishedSingleOp();
776 777 778
      ++i;
    }
    delete iter;
779
    thread->stats.AddBytes(bytes);
780 781
  }

782
  void ReadRandom(ThreadState* thread) {
783
    ReadOptions options(FLAGS_verify_checksum, true);
784
    std::string value;
S
Sanjay Ghemawat 已提交
785
    int found = 0;
786
    for (long i = 0; i < reads_; i++) {
787
      char key[100];
788
      const int k = thread->rand.Next() % FLAGS_num;
789
      snprintf(key, sizeof(key), "%016d", k);
S
Sanjay Ghemawat 已提交
790 791 792 793 794 795 796 797 798 799 800
      if (db_->Get(options, key, &value).ok()) {
        found++;
      }
      thread->stats.FinishedSingleOp();
    }
    char msg[100];
    snprintf(msg, sizeof(msg), "(%d of %d found)", found, num_);
    thread->stats.AddMessage(msg);
  }

  void ReadMissing(ThreadState* thread) {
801
    ReadOptions options(FLAGS_verify_checksum, true);
S
Sanjay Ghemawat 已提交
802
    std::string value;
803
    for (long i = 0; i < reads_; i++) {
S
Sanjay Ghemawat 已提交
804 805 806
      char key[100];
      const int k = thread->rand.Next() % FLAGS_num;
      snprintf(key, sizeof(key), "%016d.", k);
807
      db_->Get(options, key, &value);
808
      thread->stats.FinishedSingleOp();
J
jorlow@chromium.org 已提交
809 810 811
    }
  }

812
  void ReadHot(ThreadState* thread) {
813
    ReadOptions options(FLAGS_verify_checksum, true);
814
    std::string value;
815 816
    const long range = (FLAGS_num + 99) / 100;
    for (long i = 0; i < reads_; i++) {
817
      char key[100];
818
      const int k = thread->rand.Next() % range;
819 820
      snprintf(key, sizeof(key), "%016d", k);
      db_->Get(options, key, &value);
821
      thread->stats.FinishedSingleOp();
822 823 824
    }
  }

S
Sanjay Ghemawat 已提交
825
  void SeekRandom(ThreadState* thread) {
826
    ReadOptions options(FLAGS_verify_checksum, true);
S
Sanjay Ghemawat 已提交
827 828
    std::string value;
    int found = 0;
829
    for (long i = 0; i < reads_; i++) {
S
Sanjay Ghemawat 已提交
830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872
      Iterator* iter = db_->NewIterator(options);
      char key[100];
      const int k = thread->rand.Next() % FLAGS_num;
      snprintf(key, sizeof(key), "%016d", k);
      iter->Seek(key);
      if (iter->Valid() && iter->key() == key) found++;
      delete iter;
      thread->stats.FinishedSingleOp();
    }
    char msg[100];
    snprintf(msg, sizeof(msg), "(%d of %d found)", found, num_);
    thread->stats.AddMessage(msg);
  }

  void DoDelete(ThreadState* thread, bool seq) {
    RandomGenerator gen;
    WriteBatch batch;
    Status s;
    for (int i = 0; i < num_; i += entries_per_batch_) {
      batch.Clear();
      for (int j = 0; j < entries_per_batch_; j++) {
        const int k = seq ? i+j : (thread->rand.Next() % FLAGS_num);
        char key[100];
        snprintf(key, sizeof(key), "%016d", k);
        batch.Delete(key);
        thread->stats.FinishedSingleOp();
      }
      s = db_->Write(write_options_, &batch);
      if (!s.ok()) {
        fprintf(stderr, "del error: %s\n", s.ToString().c_str());
        exit(1);
      }
    }
  }

  void DeleteSeq(ThreadState* thread) {
    DoDelete(thread, true);
  }

  void DeleteRandom(ThreadState* thread) {
    DoDelete(thread, false);
  }

873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902
  void ReadWhileWriting(ThreadState* thread) {
    if (thread->tid > 0) {
      ReadRandom(thread);
    } else {
      // Special thread that keeps writing until other threads are done.
      RandomGenerator gen;
      while (true) {
        {
          MutexLock l(&thread->shared->mu);
          if (thread->shared->num_done + 1 >= thread->shared->num_initialized) {
            // Other threads have finished
            break;
          }
        }

        const int k = thread->rand.Next() % FLAGS_num;
        char key[100];
        snprintf(key, sizeof(key), "%016d", k);
        Status s = db_->Put(write_options_, key, gen.Generate(value_size_));
        if (!s.ok()) {
          fprintf(stderr, "put error: %s\n", s.ToString().c_str());
          exit(1);
        }
      }

      // Do not count any of the preceding work/delay in stats.
      thread->stats.Start();
    }
  }

903
  void Compact(ThreadState* thread) {
G
Gabor Cselle 已提交
904
    db_->CompactRange(NULL, NULL);
J
jorlow@chromium.org 已提交
905 906
  }

S
Sanjay Ghemawat 已提交
907
  void PrintStats(const char* key) {
908
    std::string stats;
S
Sanjay Ghemawat 已提交
909
    if (!db_->GetProperty(key, &stats)) {
910
      stats = "(failed)";
911
    }
912
    fprintf(stdout, "\n%s\n", stats.c_str());
913 914
  }

J
jorlow@chromium.org 已提交
915 916 917 918 919 920
  static void WriteToFile(void* arg, const char* buf, int n) {
    reinterpret_cast<WritableFile*>(arg)->Append(Slice(buf, n));
  }

  void HeapProfile() {
    char fname[100];
921
    snprintf(fname, sizeof(fname), "%s/heap-%04d", FLAGS_db, ++heap_counter_);
J
jorlow@chromium.org 已提交
922 923 924
    WritableFile* file;
    Status s = Env::Default()->NewWritableFile(fname, &file);
    if (!s.ok()) {
925
      fprintf(stderr, "%s\n", s.ToString().c_str());
J
jorlow@chromium.org 已提交
926 927 928 929 930
      return;
    }
    bool ok = port::GetHeapProfile(WriteToFile, file);
    delete file;
    if (!ok) {
931
      fprintf(stderr, "heap profiling not supported\n");
J
jorlow@chromium.org 已提交
932 933 934 935 936
      Env::Default()->DeleteFile(fname);
    }
  }
};

H
Hans Wennborg 已提交
937
}  // namespace leveldb
J
jorlow@chromium.org 已提交
938 939

int main(int argc, char** argv) {
940
  FLAGS_write_buffer_size = leveldb::Options().write_buffer_size;
941 942
  FLAGS_open_files = leveldb::Options().max_open_files;

J
jorlow@chromium.org 已提交
943 944 945
  for (int i = 1; i < argc; i++) {
    double d;
    int n;
946
    long l;
J
jorlow@chromium.org 已提交
947 948 949 950 951 952 953 954
    char junk;
    if (leveldb::Slice(argv[i]).starts_with("--benchmarks=")) {
      FLAGS_benchmarks = argv[i] + strlen("--benchmarks=");
    } else if (sscanf(argv[i], "--compression_ratio=%lf%c", &d, &junk) == 1) {
      FLAGS_compression_ratio = d;
    } else if (sscanf(argv[i], "--histogram=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_histogram = n;
955 956 957
    } else if (sscanf(argv[i], "--use_existing_db=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_use_existing_db = n;
958 959
    } else if (sscanf(argv[i], "--num=%ld%c", &l, &junk) == 1) {
      FLAGS_num = l;
960 961
    } else if (sscanf(argv[i], "--reads=%d%c", &n, &junk) == 1) {
      FLAGS_reads = n;
962 963
    } else if (sscanf(argv[i], "--threads=%d%c", &n, &junk) == 1) {
      FLAGS_threads = n;
J
jorlow@chromium.org 已提交
964 965 966 967
    } else if (sscanf(argv[i], "--value_size=%d%c", &n, &junk) == 1) {
      FLAGS_value_size = n;
    } else if (sscanf(argv[i], "--write_buffer_size=%d%c", &n, &junk) == 1) {
      FLAGS_write_buffer_size = n;
D
Dhruba Borthakur 已提交
968
    } else if (sscanf(argv[i], "--cache_size=%ld%c", &n, &junk) == 1) {
969
      FLAGS_cache_size = n;
970 971
    } else if (sscanf(argv[i], "--cache_numshardbits=%d%c", &n, &junk) == 1) {
      FLAGS_cache_numshardbits = n;
S
Sanjay Ghemawat 已提交
972 973
    } else if (sscanf(argv[i], "--bloom_bits=%d%c", &n, &junk) == 1) {
      FLAGS_bloom_bits = n;
974 975
    } else if (sscanf(argv[i], "--open_files=%d%c", &n, &junk) == 1) {
      FLAGS_open_files = n;
976 977
    } else if (strncmp(argv[i], "--db=", 5) == 0) {
      FLAGS_db = argv[i] + 5;
978 979 980
    } else if (sscanf(argv[i], "--verify_checksum=%d%c", &n, &junk) == 1 &&
               (n == 0 || n == 1)) {
      FLAGS_verify_checksum = n;
981
    } else {
J
jorlow@chromium.org 已提交
982 983 984 985 986 987 988 989 990
      fprintf(stderr, "Invalid flag '%s'\n", argv[i]);
      exit(1);
    }
  }

  leveldb::Benchmark benchmark;
  benchmark.Run();
  return 0;
}