corruption_test.cc 9.7 KB
Newer Older
J
jorlow@chromium.org 已提交
1 2 3 4
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file. See the AUTHORS file for names of contributors.

5
#include "rocksdb/db.h"
J
jorlow@chromium.org 已提交
6 7 8 9 10

#include <errno.h>
#include <fcntl.h>
#include <sys/stat.h>
#include <sys/types.h>
11 12 13
#include "rocksdb/cache.h"
#include "rocksdb/env.h"
#include "rocksdb/write_batch.h"
J
jorlow@chromium.org 已提交
14 15
#include "db/db_impl.h"
#include "db/filename.h"
J
jorlow@chromium.org 已提交
16
#include "db/log_format.h"
J
jorlow@chromium.org 已提交
17
#include "db/version_set.h"
H
Haobo Xu 已提交
18
#include "table/table.h"
J
jorlow@chromium.org 已提交
19 20 21 22
#include "util/logging.h"
#include "util/testharness.h"
#include "util/testutil.h"

23
namespace rocksdb {
J
jorlow@chromium.org 已提交
24 25 26 27 28 29 30

// Length passed to test::RandomString() by CorruptionTest::Value() for every
// generated value.
static const int kValueSize = 1000;

class CorruptionTest {
 public:
  test::ErrorEnv env_;
  std::string dbname_;
31
  shared_ptr<Cache> tiny_cache_;
J
jorlow@chromium.org 已提交
32 33 34
  Options options_;
  DB* db_;

35
  CorruptionTest() {
36
    tiny_cache_ = NewLRUCache(100);
J
jorlow@chromium.org 已提交
37 38 39 40
    options_.env = &env_;
    dbname_ = test::TmpDir() + "/db_test";
    DestroyDB(dbname_, options_);

A
Abhishek Kona 已提交
41
    db_ = nullptr;
J
jorlow@chromium.org 已提交
42
    options_.create_if_missing = true;
H
Haobo Xu 已提交
43
    options_.block_size_deviation = 0; // make unit test pass for now
J
jorlow@chromium.org 已提交
44 45 46 47 48 49 50 51 52
    Reopen();
    options_.create_if_missing = false;
  }

  ~CorruptionTest() {
     delete db_;
     DestroyDB(dbname_, Options());
  }

A
Abhishek Kona 已提交
53
  Status TryReopen(Options* options = nullptr) {
J
jorlow@chromium.org 已提交
54
    delete db_;
A
Abhishek Kona 已提交
55
    db_ = nullptr;
J
jorlow@chromium.org 已提交
56 57
    Options opt = (options ? *options : options_);
    opt.env = &env_;
58
    opt.block_cache = tiny_cache_;
H
Haobo Xu 已提交
59
    opt.block_size_deviation = 0;
X
Xing Jin 已提交
60
    opt.arena_block_size = 4096;
J
jorlow@chromium.org 已提交
61 62 63
    return DB::Open(opt, dbname_, &db_);
  }

A
Abhishek Kona 已提交
64
  void Reopen(Options* options = nullptr) {
J
jorlow@chromium.org 已提交
65 66 67 68 69
    ASSERT_OK(TryReopen(options));
  }

  void RepairDB() {
    delete db_;
A
Abhishek Kona 已提交
70
    db_ = nullptr;
71
    ASSERT_OK(::rocksdb::RepairDB(dbname_, options_));
J
jorlow@chromium.org 已提交
72 73 74 75 76 77 78 79 80 81 82 83 84 85 86
  }

  void Build(int n) {
    std::string key_space, value_space;
    WriteBatch batch;
    for (int i = 0; i < n; i++) {
      //if ((i % 100) == 0) fprintf(stderr, "@ %d of %d\n", i, n);
      Slice key = Key(i, &key_space);
      batch.Clear();
      batch.Put(key, Value(i, &value_space));
      ASSERT_OK(db_->Write(WriteOptions(), &batch));
    }
  }

  void Check(int min_expected, int max_expected) {
87
    unsigned int next_expected = 0;
J
jorlow@chromium.org 已提交
88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125
    int missed = 0;
    int bad_keys = 0;
    int bad_values = 0;
    int correct = 0;
    std::string value_space;
    Iterator* iter = db_->NewIterator(ReadOptions());
    for (iter->SeekToFirst(); iter->Valid(); iter->Next()) {
      uint64_t key;
      Slice in(iter->key());
      if (!ConsumeDecimalNumber(&in, &key) ||
          !in.empty() ||
          key < next_expected) {
        bad_keys++;
        continue;
      }
      missed += (key - next_expected);
      next_expected = key + 1;
      if (iter->value() != Value(key, &value_space)) {
        bad_values++;
      } else {
        correct++;
      }
    }
    delete iter;

    fprintf(stderr,
            "expected=%d..%d; got=%d; bad_keys=%d; bad_values=%d; missed=%d\n",
            min_expected, max_expected, correct, bad_keys, bad_values, missed);
    ASSERT_LE(min_expected, correct);
    ASSERT_GE(max_expected, correct);
  }

  void Corrupt(FileType filetype, int offset, int bytes_to_corrupt) {
    // Pick file to corrupt
    std::vector<std::string> filenames;
    ASSERT_OK(env_.GetChildren(dbname_, &filenames));
    uint64_t number;
    FileType type;
126 127
    std::string fname;
    int picked_number = -1;
128
    for (unsigned int i = 0; i < filenames.size(); i++) {
D
dgrogan@chromium.org 已提交
129
      if (ParseFileName(filenames[i], &number, &type) &&
130 131 132 133
          type == filetype &&
          int(number) > picked_number) {  // Pick latest file
        fname = dbname_ + "/" + filenames[i];
        picked_number = number;
J
jorlow@chromium.org 已提交
134 135
      }
    }
136
    ASSERT_TRUE(!fname.empty()) << filetype;
J
jorlow@chromium.org 已提交
137 138

    struct stat sbuf;
J
jorlow@chromium.org 已提交
139 140 141 142 143 144 145 146 147 148 149
    if (stat(fname.c_str(), &sbuf) != 0) {
      const char* msg = strerror(errno);
      ASSERT_TRUE(false) << fname << ": " << msg;
    }

    if (offset < 0) {
      // Relative to end of file; make it absolute
      if (-offset > sbuf.st_size) {
        offset = 0;
      } else {
        offset = sbuf.st_size + offset;
J
jorlow@chromium.org 已提交
150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169
      }
    }
    if (offset > sbuf.st_size) {
      offset = sbuf.st_size;
    }
    if (offset + bytes_to_corrupt > sbuf.st_size) {
      bytes_to_corrupt = sbuf.st_size - offset;
    }

    // Do it
    std::string contents;
    Status s = ReadFileToString(Env::Default(), fname, &contents);
    ASSERT_TRUE(s.ok()) << s.ToString();
    for (int i = 0; i < bytes_to_corrupt; i++) {
      contents[i + offset] ^= 0x80;
    }
    s = WriteStringToFile(Env::Default(), contents, fname);
    ASSERT_TRUE(s.ok()) << s.ToString();
  }

170 171 172 173 174 175 176 177
  int Property(const std::string& name) {
    std::string property;
    int result;
    if (db_->GetProperty(name, &property) &&
        sscanf(property.c_str(), "%d", &result) == 1) {
      return result;
    } else {
      return -1;
J
jorlow@chromium.org 已提交
178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196
    }
  }

  // Return the ith key
  Slice Key(int i, std::string* storage) {
    char buf[100];
    snprintf(buf, sizeof(buf), "%016d", i);
    storage->assign(buf, strlen(buf));
    return Slice(*storage);
  }

  // Return the value to associate with the specified key
  Slice Value(int k, std::string* storage) {
    Random r(k);
    return test::RandomString(&r, kValueSize, storage);
  }
};

// Damages two places in the log file and verifies that reopening recovers
// exactly the records outside the affected log blocks.
TEST(CorruptionTest, Recovery) {
  const int kWritten = 100;
  Build(kWritten);
  Check(kWritten, kWritten);

  Corrupt(kLogFile, 19, 1);      // WriteBatch tag for first record
  Corrupt(kLogFile, log::kBlockSize + 1000, 1);  // Somewhere in second block
  Reopen();

  // The 64 records in the first two log blocks are completely lost.
  const int kSurviving = 36;
  Check(kSurviving, kSurviving);
}

// With the env's writable_file_error_ flag set, reopening the database must
// report a failure instead of succeeding.
TEST(CorruptionTest, RecoverWriteError) {
  env_.writable_file_error_ = true;
  const Status reopen_status = TryReopen();
  ASSERT_TRUE(!reopen_status.ok());
}

// Keeps writing while the env's writable_file_error_ flag is set until a
// write fails, then checks that the env counted at least one such error and
// that the database can be reopened once the flag is cleared.
TEST(CorruptionTest, NewFileErrorDuringWrite) {
  // Do enough writing to force minor compaction
  env_.writable_file_error_ = true;
  const int num = 3 + (Options().write_buffer_size / kValueSize);
  std::string value_storage;
  Status write_status;
  int attempts = 0;
  while (write_status.ok() && attempts < num) {
    WriteBatch batch;
    batch.Put("a", Value(100, &value_storage));
    write_status = db_->Write(WriteOptions(), &batch);
    attempts++;
  }
  ASSERT_TRUE(!write_status.ok());
  ASSERT_GE(env_.num_writable_file_errors_, 1);

  env_.writable_file_error_ = false;
  Reopen();
}

// Flushes 100 records into table files, flips one byte in the newest table
// file and expects exactly one record to become unreadable.
TEST(CorruptionTest, TableFile) {
  Build(100);
  // Downcast to reach the TEST_* hooks; static_cast is the appropriate named
  // cast for a base-to-derived pointer conversion.
  DBImpl* dbi = static_cast<DBImpl*>(db_);
  dbi->TEST_FlushMemTable();
  dbi->TEST_CompactRange(0, nullptr, nullptr);
  dbi->TEST_CompactRange(1, nullptr, nullptr);

  Corrupt(kTableFile, 100, 1);
  Check(99, 99);
}

// Corrupts 500 bytes starting 2000 bytes before the end of the newest table
// file and expects between 5000 and 9999 of the 10000 records to survive a
// reopen.
TEST(CorruptionTest, TableFileIndexData) {
  Build(10000);  // Enough to build multiple Tables
  // Downcast to reach the TEST_* hooks; static_cast is the appropriate named
  // cast for a base-to-derived pointer conversion.
  DBImpl* dbi = static_cast<DBImpl*>(db_);
  dbi->TEST_FlushMemTable();

  Corrupt(kTableFile, -2000, 500);
  Reopen();
  Check(5000, 9999);
}

// Runs RepairDB() on a database holding 1000 records and expects all of them
// to be readable after reopening.
TEST(CorruptionTest, MissingDescriptor) {
  const int kRecords = 1000;
  Build(kRecords);
  RepairDB();
  Reopen();
  Check(kRecords, kRecords);
}

// Overwrites one key several times, repairs the database, and verifies that
// a write made after the repair is the one that is visible, both immediately
// and after another reopen.
TEST(CorruptionTest, SequenceNumberRecovery) {
  const char* const kVersions[] = {"v1", "v2", "v3", "v4", "v5"};
  for (const char* version : kVersions) {
    ASSERT_OK(db_->Put(WriteOptions(), "foo", version));
  }
  RepairDB();
  Reopen();

  std::string stored;
  ASSERT_OK(db_->Get(ReadOptions(), "foo", &stored));
  ASSERT_EQ("v5", stored);

  // Write something.  If sequence number was not recovered properly,
  // it will be hidden by an earlier write.
  ASSERT_OK(db_->Put(WriteOptions(), "foo", "v6"));
  ASSERT_OK(db_->Get(ReadOptions(), "foo", &stored));
  ASSERT_EQ("v6", stored);

  Reopen();
  ASSERT_OK(db_->Get(ReadOptions(), "foo", &stored));
  ASSERT_EQ("v6", stored);
}

// Corrupts the start of the descriptor file, expects a plain reopen to fail,
// and then expects RepairDB() to make the stored value readable again.
TEST(CorruptionTest, CorruptedDescriptor) {
  ASSERT_OK(db_->Put(WriteOptions(), "foo", "hello"));
  // Downcast to reach the TEST_* hooks; static_cast is the appropriate named
  // cast for a base-to-derived pointer conversion.
  DBImpl* dbi = static_cast<DBImpl*>(db_);
  dbi->TEST_FlushMemTable();
  dbi->TEST_CompactRange(0, nullptr, nullptr);

  Corrupt(kDescriptorFile, 0, 1000);
  Status s = TryReopen();
  ASSERT_TRUE(!s.ok());

  RepairDB();
  Reopen();
  std::string v;
  ASSERT_OK(db_->Get(ReadOptions(), "foo", &v));
  ASSERT_EQ("hello", v);
}

// Corrupts one byte of a flushed table file, then writes enough data to
// trigger compactions and expects all of the newly written records to be
// readable afterwards.
TEST(CorruptionTest, CompactionInputError) {
  Build(10);
  // Downcast to reach the TEST_* hooks; static_cast is the appropriate named
  // cast for a base-to-derived pointer conversion.
  DBImpl* dbi = static_cast<DBImpl*>(db_);
  dbi->TEST_FlushMemTable();
  // The flush is expected to have produced exactly one file at the level
  // reported by MaxMemCompactionLevel().
  const int last = dbi->MaxMemCompactionLevel();
  ASSERT_EQ(1, Property("rocksdb.num-files-at-level" + NumberToString(last)));

  Corrupt(kTableFile, 100, 1);
  Check(9, 9);

  // Force compactions by writing lots of values
  Build(10000);
  Check(10000, 10000);
}

// With paranoid_checks enabled, a corrupted table file must eventually make
// writes fail.
TEST(CorruptionTest, CompactionInputErrorParanoid) {
  Options options;
  options.paranoid_checks = true;
  options.write_buffer_size = 1048576;
  Reopen(&options);
  // Downcast to reach the TEST_* hooks; static_cast is the appropriate named
  // cast for a base-to-derived pointer conversion.
  DBImpl* dbi = static_cast<DBImpl*>(db_);

  // Fill levels >= 1 so memtable compaction outputs to level 1
  for (int level = 1; level < dbi->NumberLevels(); level++) {
    // A failed setup write would invalidate the rest of the test, so check
    // the returned status instead of dropping it.
    ASSERT_OK(dbi->Put(WriteOptions(), "", "begin"));
    ASSERT_OK(dbi->Put(WriteOptions(), "~", "end"));
    dbi->TEST_FlushMemTable();
  }

  Build(10);
  dbi->TEST_FlushMemTable();
  ASSERT_EQ(1, Property("rocksdb.num-files-at-level0"));

  Corrupt(kTableFile, 100, 1);
  Check(9, 9);

  // Write must eventually fail because of corrupted table
  Status s;
  std::string tmp1, tmp2;
  for (int i = 0; i < 10000 && s.ok(); i++) {
    s = db_->Put(WriteOptions(), Key(i, &tmp1), Value(i, &tmp2));
  }
  ASSERT_TRUE(!s.ok()) << "write did not fail in corrupted paranoid db";
}

// After a table file has been corrupted, a key written afterwards must still
// be readable, both before and after the memtable holding it is flushed.
TEST(CorruptionTest, UnrelatedKeys) {
  Build(10);
  // Downcast to reach the TEST_* hooks; static_cast is the appropriate named
  // cast for a base-to-derived pointer conversion.
  DBImpl* dbi = static_cast<DBImpl*>(db_);
  dbi->TEST_FlushMemTable();
  Corrupt(kTableFile, 100, 1);

  std::string tmp1, tmp2;
  ASSERT_OK(db_->Put(WriteOptions(), Key(1000, &tmp1), Value(1000, &tmp2)));
  std::string v;
  ASSERT_OK(db_->Get(ReadOptions(), Key(1000, &tmp1), &v));
  ASSERT_EQ(Value(1000, &tmp2).ToString(), v);
  dbi->TEST_FlushMemTable();
  ASSERT_OK(db_->Get(ReadOptions(), Key(1000, &tmp1), &v));
  ASSERT_EQ(Value(1000, &tmp2).ToString(), v);
}

357
}  // namespace rocksdb
J
jorlow@chromium.org 已提交
358 359

int main(int argc, char** argv) {
360
  return rocksdb::test::RunAllTests();
J
jorlow@chromium.org 已提交
361
}