提交 11943e8b 编写于 作者: Y Yanqin Jin 提交者: Facebook GitHub Bot

Exclude timestamp when checking compaction boundaries (#10787)

Summary:
When checking if a range [start, end) overlaps with a compaction whose range is [start1, end1), always exclude timestamp from start, end, start1 and end1, otherwise some versions of one user key may be compacted to bottommost layer while others remain in the original level.

Pull Request resolved: https://github.com/facebook/rocksdb/pull/10787

Test Plan: make check

Reviewed By: ltamasi

Differential Revision: D40187672

Pulled By: ltamasi

fbshipit-source-id: 81226267fd3e33ffa79665c62abadf2ebec45496
上级 7af47c53
...@@ -342,6 +342,8 @@ bool Compaction::SupportsPerKeyPlacement() const { ...@@ -342,6 +342,8 @@ bool Compaction::SupportsPerKeyPlacement() const {
int Compaction::GetPenultimateLevel() const { return penultimate_level_; } int Compaction::GetPenultimateLevel() const { return penultimate_level_; }
// smallest_key and largest_key include timestamps if user-defined timestamp is
// enabled.
bool Compaction::OverlapPenultimateLevelOutputRange( bool Compaction::OverlapPenultimateLevelOutputRange(
const Slice& smallest_key, const Slice& largest_key) const { const Slice& smallest_key, const Slice& largest_key) const {
if (!SupportsPerKeyPlacement()) { if (!SupportsPerKeyPlacement()) {
...@@ -350,11 +352,13 @@ bool Compaction::OverlapPenultimateLevelOutputRange( ...@@ -350,11 +352,13 @@ bool Compaction::OverlapPenultimateLevelOutputRange(
const Comparator* ucmp = const Comparator* ucmp =
input_vstorage_->InternalComparator()->user_comparator(); input_vstorage_->InternalComparator()->user_comparator();
return ucmp->Compare(smallest_key, penultimate_level_largest_user_key_) <= return ucmp->CompareWithoutTimestamp(
0 && smallest_key, penultimate_level_largest_user_key_) <= 0 &&
ucmp->Compare(largest_key, penultimate_level_smallest_user_key_) >= 0; ucmp->CompareWithoutTimestamp(
largest_key, penultimate_level_smallest_user_key_) >= 0;
} }
// key includes timestamp if user-defined timestamp is enabled.
bool Compaction::WithinPenultimateLevelOutputRange(const Slice& key) const { bool Compaction::WithinPenultimateLevelOutputRange(const Slice& key) const {
if (!SupportsPerKeyPlacement()) { if (!SupportsPerKeyPlacement()) {
return false; return false;
...@@ -363,8 +367,10 @@ bool Compaction::WithinPenultimateLevelOutputRange(const Slice& key) const { ...@@ -363,8 +367,10 @@ bool Compaction::WithinPenultimateLevelOutputRange(const Slice& key) const {
const Comparator* ucmp = const Comparator* ucmp =
input_vstorage_->InternalComparator()->user_comparator(); input_vstorage_->InternalComparator()->user_comparator();
return ucmp->Compare(key, penultimate_level_smallest_user_key_) >= 0 && return ucmp->CompareWithoutTimestamp(
ucmp->Compare(key, penultimate_level_largest_user_key_) <= 0; key, penultimate_level_smallest_user_key_) >= 0 &&
ucmp->CompareWithoutTimestamp(
key, penultimate_level_largest_user_key_) <= 0;
} }
bool Compaction::InputCompressionMatchesOutput() const { bool Compaction::InputCompressionMatchesOutput() const {
......
...@@ -319,6 +319,8 @@ class Compaction { ...@@ -319,6 +319,8 @@ class Compaction {
// Return true if the given range is overlap with penultimate level output // Return true if the given range is overlap with penultimate level output
// range. // range.
// Both smallest_key and largest_key include timestamps if user-defined
// timestamp is enabled.
bool OverlapPenultimateLevelOutputRange(const Slice& smallest_key, bool OverlapPenultimateLevelOutputRange(const Slice& smallest_key,
const Slice& largest_key) const; const Slice& largest_key) const;
...@@ -328,6 +330,7 @@ class Compaction { ...@@ -328,6 +330,7 @@ class Compaction {
// If per_key_placement is not supported, always return false. // If per_key_placement is not supported, always return false.
// TODO: currently it doesn't support moving data from the last level to the // TODO: currently it doesn't support moving data from the last level to the
// penultimate level // penultimate level
// key includes timestamp if user-defined timestamp is enabled.
bool WithinPenultimateLevelOutputRange(const Slice& key) const; bool WithinPenultimateLevelOutputRange(const Slice& key) const;
CompactionReason compaction_reason() const { return compaction_reason_; } CompactionReason compaction_reason() const { return compaction_reason_; }
...@@ -474,9 +477,11 @@ class Compaction { ...@@ -474,9 +477,11 @@ class Compaction {
TablePropertiesCollection output_table_properties_; TablePropertiesCollection output_table_properties_;
// smallest user keys in compaction // smallest user keys in compaction
// includes timestamp if user-defined timestamp is enabled.
Slice smallest_user_key_; Slice smallest_user_key_;
// largest user keys in compaction // largest user keys in compaction
// includes timestamp if user-defined timestamp is enabled.
Slice largest_user_key_; Slice largest_user_key_;
// Reason for compaction // Reason for compaction
...@@ -497,6 +502,7 @@ class Compaction { ...@@ -497,6 +502,7 @@ class Compaction {
const int penultimate_level_; const int penultimate_level_;
// Key range for penultimate level output // Key range for penultimate level output
// includes timestamp if user-defined timestamp is enabled.
Slice penultimate_level_smallest_user_key_; Slice penultimate_level_smallest_user_key_;
Slice penultimate_level_largest_user_key_; Slice penultimate_level_largest_user_key_;
}; };
......
...@@ -88,6 +88,7 @@ class CompactionIterator { ...@@ -88,6 +88,7 @@ class CompactionIterator {
virtual int number_levels() const = 0; virtual int number_levels() const = 0;
// Result includes timestamp if user-defined timestamp is enabled.
virtual Slice GetLargestUserKey() const = 0; virtual Slice GetLargestUserKey() const = 0;
virtual bool allow_ingest_behind() const = 0; virtual bool allow_ingest_behind() const = 0;
...@@ -108,6 +109,7 @@ class CompactionIterator { ...@@ -108,6 +109,7 @@ class CompactionIterator {
virtual bool SupportsPerKeyPlacement() const = 0; virtual bool SupportsPerKeyPlacement() const = 0;
// `key` includes timestamp if user-defined timestamp is enabled.
virtual bool WithinPenultimateLevelOutputRange(const Slice& key) const = 0; virtual bool WithinPenultimateLevelOutputRange(const Slice& key) const = 0;
}; };
...@@ -133,6 +135,7 @@ class CompactionIterator { ...@@ -133,6 +135,7 @@ class CompactionIterator {
int number_levels() const override { return compaction_->number_levels(); } int number_levels() const override { return compaction_->number_levels(); }
// Result includes timestamp if user-defined timestamp is enabled.
Slice GetLargestUserKey() const override { Slice GetLargestUserKey() const override {
return compaction_->GetLargestUserKey(); return compaction_->GetLargestUserKey();
} }
...@@ -173,6 +176,7 @@ class CompactionIterator { ...@@ -173,6 +176,7 @@ class CompactionIterator {
// Check if key is within penultimate level output range, to see if it's // Check if key is within penultimate level output range, to see if it's
// safe to output to the penultimate level for per_key_placement feature. // safe to output to the penultimate level for per_key_placement feature.
// `key` includes timestamp if user-defined timestamp is enabled.
bool WithinPenultimateLevelOutputRange(const Slice& key) const override { bool WithinPenultimateLevelOutputRange(const Slice& key) const override {
return compaction_->WithinPenultimateLevelOutputRange(key); return compaction_->WithinPenultimateLevelOutputRange(key);
} }
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册