bplus_tree.cpp 57.0 KB
Newer Older
羽飞's avatar
羽飞 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40
/* Copyright (c) 2021 Xie Meiyi(xiemeiyi@hust.edu.cn) and OceanBase and/or its affiliates. All rights reserved.
miniob is licensed under Mulan PSL v2.
You can use this software according to the terms and conditions of the Mulan PSL v2.
You may obtain a copy of Mulan PSL v2 at:
         http://license.coscl.org.cn/MulanPSL2
THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
See the Mulan PSL v2 for more details. */

//
// Created by Xie Meiyi
// Rewritten by Longda & Wangyunlai
//
#include "storage/index/bplus_tree.h"
#include "storage/default/disk_buffer_pool.h"
#include "rc.h"
#include "common/log/log.h"
#include "sql/parser/parse_defs.h"

#define FIRST_INDEX_PAGE 1

int calc_internal_page_capacity(int attr_length)
{
  int item_size = attr_length + sizeof(RID) + sizeof(PageNum);

  int capacity =
    ((int)BP_PAGE_DATA_SIZE - InternalIndexNode::HEADER_SIZE) / item_size;
  return capacity;
}

int calc_leaf_page_capacity(int attr_length)
{
  int item_size = attr_length + sizeof(RID) + sizeof(RID);
  int capacity =
    ((int)BP_PAGE_DATA_SIZE - LeafIndexNode::HEADER_SIZE) / item_size;
  return capacity;
}

/////////////////////////////////////////////////////////////////////////////////
羽飞's avatar
羽飞 已提交
41 42
IndexNodeHandler::IndexNodeHandler(const IndexFileHeader &header, Frame *frame)
  : header_(header), page_num_(frame->page_num()), node_((IndexNode *)frame->data())
羽飞's avatar
羽飞 已提交
43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124
{}

bool IndexNodeHandler::is_leaf() const
{
  return node_->is_leaf;
}
void IndexNodeHandler::init_empty(bool leaf)
{
  node_->is_leaf = leaf;
  node_->key_num = 0;
  node_->parent = BP_INVALID_PAGE_NUM;
}
PageNum IndexNodeHandler::page_num() const
{
  return page_num_;
}

int IndexNodeHandler::key_size() const
{
  return header_.key_length;
}

int IndexNodeHandler::value_size() const
{
  // return header_.value_size;
  return sizeof(RID);
}

int IndexNodeHandler::item_size() const
{
  return key_size() + value_size();
}

int IndexNodeHandler::size() const
{
  return node_->key_num;
}

void IndexNodeHandler::increase_size(int n)
{
  node_->key_num += n;
}

PageNum IndexNodeHandler::parent_page_num() const
{
  return node_->parent;
}

void IndexNodeHandler::set_parent_page_num(PageNum page_num)
{
  this->node_->parent = page_num;
}
std::string to_string(const IndexNodeHandler &handler)
{
  std::stringstream ss;

  ss << "PageNum:" << handler.page_num()
     << ",is_leaf:" << handler.is_leaf() << ","
     << "key_num:" << handler.size() << ","
     << "parent:" << handler.parent_page_num() << ",";

  return ss.str();
}

bool IndexNodeHandler::validate() const
{
  if (parent_page_num() == BP_INVALID_PAGE_NUM) {
    // this is a root page
    if (size() < 1) {
      LOG_WARN("root page has no item");
      return false;
    }

    if (!is_leaf() && size() < 2) {
      LOG_WARN("root page internal node has less than 2 child. size=%d", size());
      return false;
    }
  }
  return true;
}

/////////////////////////////////////////////////////////////////////////////////
羽飞's avatar
羽飞 已提交
125 126
LeafIndexNodeHandler::LeafIndexNodeHandler(const IndexFileHeader &header, Frame *frame)
  : IndexNodeHandler(header, frame), leaf_node_((LeafIndexNode *)frame->data())
羽飞's avatar
羽飞 已提交
127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226
{}

void LeafIndexNodeHandler::init_empty()
{
  IndexNodeHandler::init_empty(true);
  leaf_node_->prev_brother = BP_INVALID_PAGE_NUM;
  leaf_node_->next_brother = BP_INVALID_PAGE_NUM;
}

void LeafIndexNodeHandler::set_next_page(PageNum page_num)
{
  leaf_node_->next_brother = page_num;
}

void LeafIndexNodeHandler::set_prev_page(PageNum page_num)
{
  leaf_node_->prev_brother = page_num;
}
PageNum LeafIndexNodeHandler::next_page() const
{
  return leaf_node_->next_brother;
}
PageNum LeafIndexNodeHandler::prev_page() const
{
  return leaf_node_->prev_brother;
}

char *LeafIndexNodeHandler::key_at(int index)
{
  assert(index >= 0 && index < size());
  return __key_at(index);
}

char *LeafIndexNodeHandler::value_at(int index)
{
  assert(index >= 0 && index < size());
  return __value_at(index);
}

int LeafIndexNodeHandler::max_size() const
{
  return header_.leaf_max_size;
}

int LeafIndexNodeHandler::min_size() const
{
  return header_.leaf_max_size - header_.leaf_max_size / 2;
}

int LeafIndexNodeHandler::lookup(const KeyComparator &comparator, const char *key, bool *found /* = nullptr */) const
{
  const int size = this->size();
  int i = 0;
  for ( ; i < size; i++) {
    int result = comparator(key, __key_at(i));
    if (0 == result) {
      if (found) {
	*found = true;
      }
      return i;
    }
    if (result < 0) {
      break;
    }
  }
  if (found) {
    *found = false;
  }
  return i;
}

void LeafIndexNodeHandler::insert(int index, const char *key, const char *value)
{
  if (index < size()) {
    memmove(__item_at(index + 1), __item_at(index), (size() - index) * item_size());
  }
  memcpy(__item_at(index), key, key_size());
  memcpy(__item_at(index) + key_size(), value, value_size());
  increase_size(1);
}
void LeafIndexNodeHandler::remove(int index)
{
  assert(index >= 0 && index < size());
  if (index < size() - 1) {
    memmove(__item_at(index), __item_at(index + 1), (size() - index - 1) * item_size());
  }
  increase_size(-1);
}

int LeafIndexNodeHandler::remove(const char *key, const KeyComparator &comparator)
{
  bool found = false;
  int index = lookup(comparator, key, &found);
  if (found) {
    this->remove(index);
    return 1;
  }
  return 0;
}

羽飞's avatar
羽飞 已提交
227
RC LeafIndexNodeHandler::move_half_to(LeafIndexNodeHandler &other, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
228 229 230 231 232 233 234 235 236
{
  const int size = this->size();
  const int move_index = size / 2;

  memcpy(other.__item_at(0), this->__item_at(move_index), item_size() * (size - move_index));
  other.increase_size(size - move_index);
  this->increase_size(- ( size - move_index));
  return RC::SUCCESS;
}
羽飞's avatar
羽飞 已提交
237
RC LeafIndexNodeHandler::move_first_to_end(LeafIndexNodeHandler &other, DiskBufferPool *disk_buffer_pool)
羽飞's avatar
羽飞 已提交
238 239 240 241 242 243 244 245 246 247
{
  other.append(__item_at(0));

  if (size() >= 1) {
    memmove(__item_at(0), __item_at(1), (size() - 1) * item_size() );
  }
  increase_size(-1);
  return RC::SUCCESS;
}

羽飞's avatar
羽飞 已提交
248
RC LeafIndexNodeHandler::move_last_to_front(LeafIndexNodeHandler &other, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
249 250 251 252 253 254 255 256 257
{
  other.preappend(__item_at(size() - 1));

  increase_size(-1);
  return RC::SUCCESS;
}
/**
 * move all items to left page
 */
羽飞's avatar
羽飞 已提交
258
RC LeafIndexNodeHandler::move_to(LeafIndexNodeHandler &other, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
259 260 261 262 263 264 265 266 267
{
  memcpy(other.__item_at(other.size()), this->__item_at(0), this->size() * item_size());
  other.increase_size(this->size());
  this->increase_size(- this->size());

  other.set_next_page(this->next_page());

  PageNum next_right_page_num = this->next_page();
  if (next_right_page_num != BP_INVALID_PAGE_NUM) {
羽飞's avatar
羽飞 已提交
268 269
    Frame *next_right_frame;
    RC rc = bp->get_this_page(next_right_page_num, &next_right_frame);
羽飞's avatar
羽飞 已提交
270 271 272 273 274
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to fetch next right page. page number:%d. rc=%d:%s", next_right_page_num, rc, strrc(rc));
      return rc;
    }

羽飞's avatar
羽飞 已提交
275
    LeafIndexNodeHandler next_right_node(header_, next_right_frame);
羽飞's avatar
羽飞 已提交
276
    next_right_node.set_prev_page(other.page_num());
羽飞's avatar
羽飞 已提交
277 278
    next_right_frame->mark_dirty();
    bp->unpin_page(next_right_frame);
羽飞's avatar
羽飞 已提交
279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324
  }
  return RC::SUCCESS;
}

void LeafIndexNodeHandler::append(const char *item)
{
  memcpy(__item_at(size()), item, item_size());
  increase_size(1);
}

void LeafIndexNodeHandler::preappend(const char *item)
{
  if (size() > 0) {
    memmove(__item_at(1), __item_at(0), size() * item_size());
  }
  memcpy(__item_at(0), item, item_size());
  increase_size(1);
}

char *LeafIndexNodeHandler::__item_at(int index) const
{
  return leaf_node_->array + (index * item_size());
}
char *LeafIndexNodeHandler::__key_at(int index) const
{
  return __item_at(index);
}
char *LeafIndexNodeHandler::__value_at(int index) const
{
  return __item_at(index) + key_size();
}

std::string to_string(const LeafIndexNodeHandler &handler, const KeyPrinter &printer)
{
  std::stringstream ss;
  ss << to_string((const IndexNodeHandler &)handler)
     << ",prev page:" << handler.prev_page()
     << ",next page:" << handler.next_page();
  ss << ",values=[" << printer(handler.__key_at(0)) ;
  for (int i = 1; i < handler.size(); i++) {
    ss << "," << printer(handler.__key_at(i));
  }
  ss << "]";
  return ss.str();
}

羽飞's avatar
羽飞 已提交
325
bool LeafIndexNodeHandler::validate(const KeyComparator &comparator, DiskBufferPool *bp) const
羽飞's avatar
羽飞 已提交
326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345
{
  bool result = IndexNodeHandler::validate();
  if (false == result) {
    return false;
  }

  const int node_size = size();
  for (int i = 1; i < node_size; i++) {
    if (comparator(__key_at(i - 1), __key_at(i)) >= 0) {
      LOG_WARN("page number = %d, invalid key order. id1=%d,id2=%d, this=%s",
	       page_num(), i-1, i, to_string(*this).c_str());
      return false;
    }
  }

  PageNum parent_page_num = this->parent_page_num();
  if (parent_page_num == BP_INVALID_PAGE_NUM) {
    return true;
  }

羽飞's avatar
羽飞 已提交
346 347
  Frame *parent_frame;
  RC rc = bp->get_this_page(parent_page_num, &parent_frame);
羽飞's avatar
羽飞 已提交
348 349 350 351 352 353
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch parent page. page num=%d, rc=%d:%s",
	     parent_page_num, rc, strrc(rc));
    return false;
  }

羽飞's avatar
羽飞 已提交
354
  InternalIndexNodeHandler parent_node(header_, parent_frame);
羽飞's avatar
羽飞 已提交
355 356 357 358
  int index_in_parent = parent_node.value_index(this->page_num());
  if (index_in_parent < 0) {
    LOG_WARN("invalid leaf node. cannot find index in parent. this page num=%d, parent page num=%d",
	     this->page_num(), parent_page_num);
羽飞's avatar
羽飞 已提交
359
    bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
360 361 362 363 364 365 366 367 368
    return false;
  }

  if (0 != index_in_parent) {
    int cmp_result = comparator(__key_at(0), parent_node.key_at(index_in_parent));
    if (cmp_result < 0) {
      LOG_WARN("invalid leaf node. first item should be greate than or equal to parent item. " \
	       "this page num=%d, parent page num=%d, index in parent=%d",
	       this->page_num(), parent_node.page_num(), index_in_parent);
羽飞's avatar
羽飞 已提交
369
      bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
370 371 372 373 374 375 376 377 378 379
      return false;
    }
  }

  if (index_in_parent < parent_node.size() - 1) {
    int cmp_result = comparator(__key_at(size() - 1), parent_node.key_at(index_in_parent + 1));
    if (cmp_result >= 0) {
      LOG_WARN("invalid leaf node. last item should be less than the item at the first after item in parent." \
	       "this page num=%d, parent page num=%d, parent item to compare=%d",
	       this->page_num(), parent_node.page_num(), index_in_parent + 1);
羽飞's avatar
羽飞 已提交
380
      bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
381 382 383
      return false;
    }
  }
羽飞's avatar
羽飞 已提交
384
  bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
385 386 387 388
  return true;
}

/////////////////////////////////////////////////////////////////////////////////
羽飞's avatar
羽飞 已提交
389 390
InternalIndexNodeHandler::InternalIndexNodeHandler(const IndexFileHeader &header, Frame *frame)
  : IndexNodeHandler(header, frame), internal_node_((InternalIndexNode *)frame->data())
羽飞's avatar
羽飞 已提交
391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438
{}

std::string to_string(const InternalIndexNodeHandler &node, const KeyPrinter &printer)
{
  std::stringstream ss;
  ss << to_string((const IndexNodeHandler &)node);
  ss << ",children:["
     << "{key:" << printer(node.__key_at(0)) << ","
     << "value:" << *(PageNum *)node.__value_at(0) << "}";

  for (int i = 1; i < node.size(); i++) {
    ss << ",{key:" << printer(node.__key_at(i))
       << ",value:"<< *(PageNum *)node.__value_at(i) << "}";
  }
  ss << "]";
  return ss.str();
}

void InternalIndexNodeHandler::init_empty()
{
  IndexNodeHandler::init_empty(false);
}
void InternalIndexNodeHandler::create_new_root(PageNum first_page_num, const char *key, PageNum page_num)
{
  memset(__key_at(0), 0, key_size());
  memcpy(__value_at(0), &first_page_num, value_size());
  memcpy(__item_at(1), key, key_size());
  memcpy(__value_at(1), &page_num, value_size());
  increase_size(2);
}

/**
 * insert one entry
 * the entry to be inserted will never at the first slot.
 * the right child page after split will always have bigger keys.
 */
void InternalIndexNodeHandler::insert(const char *key, PageNum page_num, const KeyComparator &comparator)
{
  int insert_position = -1;
  lookup(comparator, key, nullptr, &insert_position);
  if (insert_position < size()) {
    memmove(__item_at(insert_position + 1), __item_at(insert_position), (size() - insert_position) * item_size());
  }
  memcpy(__item_at(insert_position), key, key_size());
  memcpy(__value_at(insert_position), &page_num, value_size());
  increase_size(1);
}

羽飞's avatar
羽飞 已提交
439
RC InternalIndexNodeHandler::move_half_to(InternalIndexNodeHandler &other, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
440 441 442
{
  const int size = this->size();
  const int move_index = size / 2;
羽飞's avatar
羽飞 已提交
443
  RC rc = other.copy_from(this->__item_at(move_index), size - move_index, bp);
羽飞's avatar
羽飞 已提交
444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519 520 521 522 523 524 525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to copy item to new node. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

  increase_size(- (size - move_index));
  return rc;
}

int InternalIndexNodeHandler::max_size() const
{
  return header_.internal_max_size;
}

int InternalIndexNodeHandler::min_size() const
{
  return header_.internal_max_size - header_.internal_max_size / 2;
}

/**
 * lookup the first item which key <= item
 * @return unlike the leafNode, the return value is not the insert position,
 * but only the index of child to find. 
 */
int InternalIndexNodeHandler::lookup(const KeyComparator &comparator, const char *key,
				     bool *found /* = nullptr */, int *insert_position /*= nullptr */) const
{
  int i = 1;
  const int size = this->size();
  for ( ; i < size; i++) {
    int result = comparator(key, __key_at(i));
    if (result == 0) {
      if (found) {
	*found = true;
      }
      if (insert_position) {
	*insert_position = i;
      }
      return i;
    }
    if (result < 0) {
      if (found) {
	*found = false;
      }
      if (insert_position) {
	*insert_position = i;
      }

      return i - 1;
    }
  }
  if (found) {
    *found = false;
  }
  if (insert_position) {
    *insert_position = size;
  }
  return size - 1;
}

char *InternalIndexNodeHandler::key_at(int index)
{
  assert(index >= 0 && index < size());
  return __key_at(index);
}

void InternalIndexNodeHandler::set_key_at(int index, const char *key)
{
  assert(index >= 0 && index < size());
  memcpy(__key_at(index), key, key_size());
}

PageNum InternalIndexNodeHandler::value_at(int index)
{
  assert(index >= 0 && index < size());
  return *(PageNum *)__value_at(index);
}

int InternalIndexNodeHandler::value_index(PageNum page_num)
{
  for (int i = 0; i < size(); i++) {
    if (page_num == *(PageNum*)__value_at(i)) {
      return i;
    }
  }
  return -1;
}

void InternalIndexNodeHandler::remove(int index)
{
  assert(index >= 0 && index < size());
  if (index < size() - 1) {
    memmove(__item_at(index), __item_at(index + 1), (size() - index - 1) * item_size());
  }
  increase_size(-1);
}

羽飞's avatar
羽飞 已提交
541
RC InternalIndexNodeHandler::move_to(InternalIndexNodeHandler &other, DiskBufferPool *disk_buffer_pool)
羽飞's avatar
羽飞 已提交
542
{
羽飞's avatar
羽飞 已提交
543
  RC rc = other.copy_from(__item_at(0), size(), disk_buffer_pool);
羽飞's avatar
羽飞 已提交
544 545 546 547 548 549 550 551 552
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to copy items to other node. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

  increase_size(- this->size());
  return RC::SUCCESS;
}

羽飞's avatar
羽飞 已提交
553
RC InternalIndexNodeHandler::move_first_to_end(InternalIndexNodeHandler &other, DiskBufferPool *disk_buffer_pool)
羽飞's avatar
羽飞 已提交
554
{
羽飞's avatar
羽飞 已提交
555
  RC rc = other.append(__item_at(0), disk_buffer_pool);
羽飞's avatar
羽飞 已提交
556 557 558 559 560 561 562 563 564 565 566 567
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to append item to others.");
    return rc;
  }

  if (size() >= 1) {
    memmove(__item_at(0), __item_at(1), (size() - 1) * item_size() );
  }
  increase_size(-1);
  return rc;
}

羽飞's avatar
羽飞 已提交
568
RC InternalIndexNodeHandler::move_last_to_front(InternalIndexNodeHandler &other, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
569
{
羽飞's avatar
羽飞 已提交
570
  RC rc = other.preappend(__item_at(size() - 1), bp);
羽飞's avatar
羽飞 已提交
571 572 573 574 575 576 577 578 579 580 581
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to preappend to others");
    return rc;
  }

  increase_size(-1);
  return rc;
}
/**
 * copy items from other node to self's right
 */
羽飞's avatar
羽飞 已提交
582
RC InternalIndexNodeHandler::copy_from(const char *items, int num, DiskBufferPool *disk_buffer_pool)
羽飞's avatar
羽飞 已提交
583 584 585 586 587
{
  memcpy(__item_at(this->size()), items, num * item_size());

  RC rc = RC::SUCCESS;
  PageNum this_page_num = this->page_num();
羽飞's avatar
羽飞 已提交
588
  Frame *frame = nullptr;
羽飞's avatar
羽飞 已提交
589 590
  for (int i = 0; i < num; i++) {
    const PageNum page_num = *(const PageNum *)((items + i * item_size()) + key_size());
羽飞's avatar
羽飞 已提交
591
    rc = disk_buffer_pool->get_this_page(page_num, &frame);
羽飞's avatar
羽飞 已提交
592 593 594 595 596
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to set child's page num. child page num:%d, this page num=%d, rc=%d:%s",
	       page_num, this_page_num, rc, strrc(rc));
      return rc;
    }
羽飞's avatar
羽飞 已提交
597
    IndexNodeHandler child_node(header_, frame);
羽飞's avatar
羽飞 已提交
598
    child_node.set_parent_page_num(this_page_num);
羽飞's avatar
羽飞 已提交
599 600
    frame->mark_dirty();
    disk_buffer_pool->unpin_page(frame);
羽飞's avatar
羽飞 已提交
601 602 603 604 605
  }
  increase_size(num);
  return rc;
}

羽飞's avatar
羽飞 已提交
606
RC InternalIndexNodeHandler::append(const char *item, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
607
{
羽飞's avatar
羽飞 已提交
608
  return this->copy_from(item, 1, bp);
羽飞's avatar
羽飞 已提交
609 610
}

羽飞's avatar
羽飞 已提交
611
RC InternalIndexNodeHandler::preappend(const char *item, DiskBufferPool *bp)
羽飞's avatar
羽飞 已提交
612 613
{
  PageNum child_page_num = *(PageNum *)(item + key_size());
羽飞's avatar
羽飞 已提交
614 615
  Frame *frame = nullptr;
  RC rc = bp->get_this_page(child_page_num, &frame);
羽飞's avatar
羽飞 已提交
616 617 618 619 620
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch child page. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
621
  IndexNodeHandler child_node(header_, frame);
羽飞's avatar
羽飞 已提交
622 623
  child_node.set_parent_page_num(this->page_num());

羽飞's avatar
羽飞 已提交
624 625
  frame->mark_dirty();
  bp->unpin_page(frame);
羽飞's avatar
羽飞 已提交
626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660

  if (this->size() > 0) {
    memmove(__item_at(1), __item_at(0), this->size() * item_size());
  }

  memcpy(__item_at(0), item, item_size());
  increase_size(1);
  return RC::SUCCESS;
}

char *InternalIndexNodeHandler::__item_at(int index) const
{
  return internal_node_->array + (index * item_size());
}

char *InternalIndexNodeHandler::__key_at(int index) const
{
  return __item_at(index);
}

char *InternalIndexNodeHandler::__value_at(int index) const
{
  return __item_at(index) + key_size();
}

int InternalIndexNodeHandler::value_size() const
{
  return sizeof(PageNum);
}

int InternalIndexNodeHandler::item_size() const
{
  return key_size() + this->value_size();
}

羽飞's avatar
羽飞 已提交
661
bool InternalIndexNodeHandler::validate(const KeyComparator &comparator, DiskBufferPool *bp) const
羽飞's avatar
羽飞 已提交
662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681
{
  bool result = IndexNodeHandler::validate();
  if (false == result) {
    return false;
  }

  const int node_size = size();
  for (int i = 2; i < node_size; i++) {
    if (comparator(__key_at(i - 1), __key_at(i)) >= 0) {
      LOG_WARN("page number = %d, invalid key order. id1=%d,id2=%d, this=%s",
	       page_num(), i-1, i, to_string(*this).c_str());
      return false;
    }
  }

  for (int i = 0; result && i < node_size; i++) {
    PageNum page_num = *(PageNum *)__value_at(i);
    if (page_num < 0) {
      LOG_WARN("this page num=%d, got invalid child page. page num=%d", this->page_num(), page_num);
    } else {
羽飞's avatar
羽飞 已提交
682 683
      Frame *child_frame;
      RC rc = bp->get_this_page(page_num, &child_frame);
羽飞's avatar
羽飞 已提交
684 685 686 687
      if (rc != RC::SUCCESS) {
	LOG_WARN("failed to fetch child page while validate internal page. page num=%d, rc=%d:%s",
		 page_num, rc, strrc(rc));
      } else {
羽飞's avatar
羽飞 已提交
688
	IndexNodeHandler child_node(header_, child_frame);
羽飞's avatar
羽飞 已提交
689 690 691 692 693
	if (child_node.parent_page_num() != this->page_num()) {
	  LOG_WARN("child's parent page num is invalid. child page num=%d, parent page num=%d, this page num=%d",
		   child_node.page_num(), child_node.parent_page_num(), this->page_num());
	  result = false;
	}
羽飞's avatar
羽飞 已提交
694
	bp->unpin_page(child_frame);
羽飞's avatar
羽飞 已提交
695 696 697 698 699 700 701 702 703 704 705 706 707
      }
    }
  }

  if (!result) {
    return result;
  }

  const PageNum parent_page_num = this->parent_page_num();
  if (parent_page_num == BP_INVALID_PAGE_NUM) {
    return result;
  }

羽飞's avatar
羽飞 已提交
708 709
  Frame *parent_frame;
  RC rc = bp->get_this_page(parent_page_num, &parent_frame);
羽飞's avatar
羽飞 已提交
710 711 712 713 714
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch parent page. page num=%d, rc=%d:%s", parent_page_num, rc, strrc(rc));
    return false;
  }

羽飞's avatar
羽飞 已提交
715
  InternalIndexNodeHandler parent_node(header_, parent_frame);
羽飞's avatar
羽飞 已提交
716 717 718 719
  int index_in_parent = parent_node.value_index(this->page_num());
  if (index_in_parent < 0) {
    LOG_WARN("invalid internal node. cannot find index in parent. this page num=%d, parent page num=%d",
	     this->page_num(), parent_page_num);
羽飞's avatar
羽飞 已提交
720
    bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
721 722 723 724 725 726 727 728 729
    return false;
  }

  if (0 != index_in_parent) {
    int cmp_result = comparator(__key_at(1), parent_node.key_at(index_in_parent));
    if (cmp_result < 0) {
      LOG_WARN("invalid internal node. the second item should be greate than or equal to parent item. " \
	       "this page num=%d, parent page num=%d, index in parent=%d",
	       this->page_num(), parent_node.page_num(), index_in_parent);
羽飞's avatar
羽飞 已提交
730
      bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
731 732 733 734 735 736 737 738 739 740
      return false;
    }
  }

  if (index_in_parent < parent_node.size() - 1) {
    int cmp_result = comparator(__key_at(size() - 1), parent_node.key_at(index_in_parent + 1));
    if (cmp_result >= 0) {
      LOG_WARN("invalid internal node. last item should be less than the item at the first after item in parent." \
	       "this page num=%d, parent page num=%d, parent item to compare=%d",
	       this->page_num(), parent_node.page_num(), index_in_parent + 1);
羽飞's avatar
羽飞 已提交
741
      bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
742 743 744
      return false;
    }
  }
羽飞's avatar
羽飞 已提交
745
  bp->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
746 747 748 749 750 751 752 753

  return result;
}

/////////////////////////////////////////////////////////////////////////////////

RC BplusTreeHandler::sync()
{
羽飞's avatar
羽飞 已提交
754
  return disk_buffer_pool_->purge_all_pages();
羽飞's avatar
羽飞 已提交
755 756 757 758 759
}

RC BplusTreeHandler::create(const char *file_name, AttrType attr_type, int attr_length,
			    int internal_max_size /* = -1*/, int leaf_max_size /* = -1 */)
{
羽飞's avatar
羽飞 已提交
760 761
  BufferPoolManager &bpm = BufferPoolManager::instance();
  RC rc = bpm.create_file(file_name);
羽飞's avatar
羽飞 已提交
762 763 764 765 766 767
  if (rc != RC::SUCCESS) {
    LOG_WARN("Failed to create file. file name=%s, rc=%d:%s", file_name, rc, strrc(rc));
    return rc;
  }
  LOG_INFO("Successfully create index file:%s", file_name);

羽飞's avatar
羽飞 已提交
768 769
  DiskBufferPool *bp = nullptr;
  rc = bpm.open_file(file_name, bp);
羽飞's avatar
羽飞 已提交
770 771 772 773 774 775
  if (rc != RC::SUCCESS) {
    LOG_WARN("Failed to open file. file name=%s, rc=%d:%s", file_name, rc, strrc(rc));
    return rc;
  }
  LOG_INFO("Successfully open index file %s.", file_name);

羽飞's avatar
羽飞 已提交
776 777
  Frame *header_frame;
  rc = bp->allocate_page(&header_frame);
羽飞's avatar
羽飞 已提交
778 779
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to allocate header page for bplus tree. rc=%d:%s", rc, strrc(rc));
羽飞's avatar
羽飞 已提交
780
    bpm.close_file(file_name);
羽飞's avatar
羽飞 已提交
781 782 783
    return rc;
  }

羽飞's avatar
羽飞 已提交
784
  if (header_frame->page_num() != FIRST_INDEX_PAGE) {
羽飞's avatar
羽飞 已提交
785
    LOG_WARN("header page num should be %d but got %d. is it a new file : %s",
羽飞's avatar
羽飞 已提交
786 787
	     FIRST_INDEX_PAGE, header_frame->page_num(), file_name);
    bpm.close_file(file_name);
羽飞's avatar
羽飞 已提交
788 789 790 791 792 793 794 795 796
    return RC::INTERNAL;
  }

  if (internal_max_size < 0) {
    internal_max_size = calc_internal_page_capacity(attr_length);
  }
  if (leaf_max_size < 0) {
    leaf_max_size = calc_leaf_page_capacity(attr_length);
  }
羽飞's avatar
羽飞 已提交
797 798

  char *pdata = header_frame->data();
羽飞's avatar
羽飞 已提交
799 800 801 802 803 804 805 806
  IndexFileHeader *file_header = (IndexFileHeader *)pdata;
  file_header->attr_length = attr_length;
  file_header->key_length = attr_length + sizeof(RID);
  file_header->attr_type = attr_type;
  file_header->internal_max_size = internal_max_size;
  file_header->leaf_max_size = leaf_max_size;
  file_header->root_page = BP_INVALID_PAGE_NUM;

羽飞's avatar
羽飞 已提交
807
  header_frame->mark_dirty();
羽飞's avatar
羽飞 已提交
808

羽飞's avatar
羽飞 已提交
809
  disk_buffer_pool_ = bp;
羽飞's avatar
羽飞 已提交
810 811 812

  memcpy(&file_header_, pdata, sizeof(file_header_));
  header_dirty_ = false;
羽飞's avatar
羽飞 已提交
813
  bp->unpin_page(header_frame);
羽飞's avatar
羽飞 已提交
814 815 816 817 818 819 820 821 822 823 824 825 826 827 828 829

  mem_pool_item_ = new common::MemPoolItem(file_name);
  if (mem_pool_item_->init(file_header->key_length) < 0) {
    LOG_WARN("Failed to init memory pool for index %s", file_name);
    close();
    return RC::NOMEM;
  }

  key_comparator_.init(file_header->attr_type, file_header->attr_length);
  key_printer_.init(file_header->attr_type, file_header->attr_length);
  LOG_INFO("Successfully create index %s", file_name);
  return RC::SUCCESS;
}

RC BplusTreeHandler::open(const char *file_name)
{
羽飞's avatar
羽飞 已提交
830
  if (disk_buffer_pool_ != nullptr) {
羽飞's avatar
羽飞 已提交
831 832 833 834
    LOG_WARN("%s has been opened before index.open.", file_name);
    return RC::RECORD_OPENNED;
  }

羽飞's avatar
羽飞 已提交
835 836 837
  BufferPoolManager &bpm = BufferPoolManager::instance();
  DiskBufferPool *disk_buffer_pool;
  RC rc = bpm.open_file(file_name, disk_buffer_pool);
羽飞's avatar
羽飞 已提交
838 839 840 841 842
  if (rc != RC::SUCCESS) {
    LOG_WARN("Failed to open file name=%s, rc=%d:%s", file_name, rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
843 844
  Frame *frame;
  rc = disk_buffer_pool->get_this_page(FIRST_INDEX_PAGE, &frame);
羽飞's avatar
羽飞 已提交
845 846
  if (rc != RC::SUCCESS) {
    LOG_WARN("Failed to get first page file name=%s, rc=%d:%s", file_name, rc, strrc(rc));
羽飞's avatar
羽飞 已提交
847
    bpm.close_file(file_name);
羽飞's avatar
羽飞 已提交
848 849 850
    return rc;
  }

羽飞's avatar
羽飞 已提交
851
  char *pdata = frame->data();
羽飞's avatar
羽飞 已提交
852 853 854 855 856 857 858 859 860 861 862 863
  memcpy(&file_header_, pdata, sizeof(IndexFileHeader));
  header_dirty_ = false;
  disk_buffer_pool_ = disk_buffer_pool;

  mem_pool_item_ = new common::MemPoolItem(file_name);
  if (mem_pool_item_->init(file_header_.key_length) < 0) {
    LOG_WARN("Failed to init memory pool for index %s", file_name);
    close();
    return RC::NOMEM;
  }

  // close old page_handle
羽飞's avatar
羽飞 已提交
864
  disk_buffer_pool->unpin_page(frame);
羽飞's avatar
羽飞 已提交
865 866

  key_comparator_.init(file_header_.attr_type, file_header_.attr_length);
羽飞's avatar
羽飞 已提交
867
  key_printer_.init(file_header_.attr_type, file_header_.attr_length);
羽飞's avatar
羽飞 已提交
868 869 870 871 872 873
  LOG_INFO("Successfully open index %s", file_name);
  return RC::SUCCESS;
}

RC BplusTreeHandler::close()
{
羽飞's avatar
羽飞 已提交
874
  if (disk_buffer_pool_ != nullptr) {
羽飞's avatar
羽飞 已提交
875

羽飞's avatar
羽飞 已提交
876
    disk_buffer_pool_->close_file(); // TODO
羽飞's avatar
羽飞 已提交
877 878 879 880 881 882 883 884 885

    delete mem_pool_item_;
    mem_pool_item_ = nullptr;
  }

  disk_buffer_pool_ = nullptr;
  return RC::SUCCESS;
}

羽飞's avatar
羽飞 已提交
886
RC BplusTreeHandler::print_leaf(Frame *frame)
羽飞's avatar
羽飞 已提交
887
{
羽飞's avatar
羽飞 已提交
888
  LeafIndexNodeHandler leaf_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
889
  LOG_INFO("leaf node: %s", to_string(leaf_node, key_printer_).c_str());
羽飞's avatar
羽飞 已提交
890
  disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
891 892 893
  return RC::SUCCESS;
}

羽飞's avatar
羽飞 已提交
894
RC BplusTreeHandler::print_internal_node_recursive(Frame *frame)
羽飞's avatar
羽飞 已提交
895 896 897
{
  RC rc = RC::SUCCESS;
  LOG_INFO("bplus tree. file header: %s", file_header_.to_string().c_str());
羽飞's avatar
羽飞 已提交
898
  InternalIndexNodeHandler internal_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
899 900 901 902 903
  LOG_INFO("internal node: %s", to_string(internal_node, key_printer_).c_str());

  int node_size = internal_node.size();
  for (int i = 0; i < node_size; i++) {
    PageNum page_num = internal_node.value_at(i);
羽飞's avatar
羽飞 已提交
904 905
    Frame *child_frame;
    rc = disk_buffer_pool_->get_this_page(page_num, &child_frame);
羽飞's avatar
羽飞 已提交
906 907
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to fetch child page. page id=%d, rc=%d:%s", page_num, rc, strrc(rc));
羽飞's avatar
羽飞 已提交
908
      disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
909 910 911
      return rc;
    }

羽飞's avatar
羽飞 已提交
912
    IndexNodeHandler node(file_header_, child_frame);
羽飞's avatar
羽飞 已提交
913
    if (node.is_leaf()) {
羽飞's avatar
羽飞 已提交
914
      rc = print_leaf(child_frame);
羽飞's avatar
羽飞 已提交
915
    } else {
羽飞's avatar
羽飞 已提交
916
      rc = print_internal_node_recursive(child_frame);
羽飞's avatar
羽飞 已提交
917 918
    }
    if (rc != RC::SUCCESS) {
羽飞's avatar
羽飞 已提交
919 920
      LOG_WARN("failed to print node. page id=%d, rc=%d:%s", child_frame->page_num(), rc, strrc(rc));
      disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
921 922 923 924
      return rc;
    }
  }

羽飞's avatar
羽飞 已提交
925
  disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
926 927 928 929 930
  return RC::SUCCESS;
}

RC BplusTreeHandler::print_tree()
{
羽飞's avatar
羽飞 已提交
931
  if (disk_buffer_pool_ == nullptr) {
羽飞's avatar
羽飞 已提交
932 933 934 935 936 937 938 939
    LOG_WARN("Index hasn't been created or opened, fail to print");
    return RC::SUCCESS;
  }
  if (is_empty()) {
    LOG_INFO("tree is empty");
    return RC::SUCCESS;
  }

羽飞's avatar
羽飞 已提交
940
  Frame *frame;
羽飞's avatar
羽飞 已提交
941
  PageNum page_num = file_header_.root_page;
羽飞's avatar
羽飞 已提交
942
  RC rc = disk_buffer_pool_->get_this_page(page_num, &frame);
羽飞's avatar
羽飞 已提交
943 944 945 946 947
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch page. page id=%d, rc=%d:%s", page_num, rc, strrc(rc));
    return rc;
  }
  
羽飞's avatar
羽飞 已提交
948
  IndexNodeHandler node(file_header_, frame);
羽飞's avatar
羽飞 已提交
949
  if (node.is_leaf()) {
羽飞's avatar
羽飞 已提交
950
    rc = print_leaf(frame);
羽飞's avatar
羽飞 已提交
951
  } else {
羽飞's avatar
羽飞 已提交
952
    rc = print_internal_node_recursive(frame);
羽飞's avatar
羽飞 已提交
953 954 955 956 957 958 959 960 961 962 963
  }
  return rc;
}

RC BplusTreeHandler::print_leafs()
{
  if (is_empty()) {
    LOG_INFO("empty tree");
    return RC::SUCCESS;
  }

羽飞's avatar
羽飞 已提交
964
  Frame *frame;
羽飞's avatar
羽飞 已提交
965
  
羽飞's avatar
羽飞 已提交
966
  RC rc = left_most_page(frame);
羽飞's avatar
羽飞 已提交
967 968 969 970 971
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to get left most page. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
972 973
  while (frame->page_num() != BP_INVALID_PAGE_NUM) {
    LeafIndexNodeHandler leaf_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
974 975 976
    LOG_INFO("leaf info: %s", to_string(leaf_node, key_printer_).c_str());

    PageNum next_page_num = leaf_node.next_page();
羽飞's avatar
羽飞 已提交
977
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
978 979 980 981 982

    if (next_page_num == BP_INVALID_PAGE_NUM) {
      break;
    }

羽飞's avatar
羽飞 已提交
983
    rc = disk_buffer_pool_->get_this_page(next_page_num, &frame);
羽飞's avatar
羽飞 已提交
984 985 986 987 988 989 990 991
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to get next page. page id=%d, rc=%d:%s", next_page_num, rc, strrc(rc));
      return rc;
    }
  }
  return rc;
}

羽飞's avatar
羽飞 已提交
992
bool BplusTreeHandler::validate_node_recursive(Frame *frame)
羽飞's avatar
羽飞 已提交
993 994
{
  bool result = true;
羽飞's avatar
羽飞 已提交
995
  IndexNodeHandler node(file_header_, frame);
羽飞's avatar
羽飞 已提交
996
  if (node.is_leaf()) {
羽飞's avatar
羽飞 已提交
997 998
    LeafIndexNodeHandler leaf_node(file_header_, frame);
    result = leaf_node.validate(key_comparator_, disk_buffer_pool_);
羽飞's avatar
羽飞 已提交
999
  } else {
羽飞's avatar
羽飞 已提交
1000 1001
    InternalIndexNodeHandler internal_node(file_header_, frame);
    result = internal_node.validate(key_comparator_, disk_buffer_pool_);
羽飞's avatar
羽飞 已提交
1002 1003
    for (int i = 0; result && i < internal_node.size(); i++) {
      PageNum page_num = internal_node.value_at(i);
羽飞's avatar
羽飞 已提交
1004 1005
      Frame *child_frame;
      RC rc = disk_buffer_pool_->get_this_page(page_num, &child_frame);
羽飞's avatar
羽飞 已提交
1006 1007 1008 1009 1010 1011
      if (rc != RC::SUCCESS) {
        LOG_WARN("failed to fetch child page.page id=%d, rc=%d:%s", page_num, rc, strrc(rc));
        result = false;
        break;
      }

羽飞's avatar
羽飞 已提交
1012
      result = validate_node_recursive(child_frame);
羽飞's avatar
羽飞 已提交
1013 1014 1015
    }
  }

羽飞's avatar
羽飞 已提交
1016
  disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1017 1018 1019 1020 1021 1022 1023 1024 1025
  return result;
}

bool BplusTreeHandler::validate_leaf_link()
{
  if (is_empty()) {
    return true;
  }

羽飞's avatar
羽飞 已提交
1026 1027
  Frame *frame;
  RC rc = left_most_page(frame);
羽飞's avatar
羽飞 已提交
1028 1029 1030 1031 1032 1033 1034
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch left most page. rc=%d:%s", rc, strrc(rc));
    return false;
  }

  PageNum prev_page_num = BP_INVALID_PAGE_NUM;

羽飞's avatar
羽飞 已提交
1035
  LeafIndexNodeHandler leaf_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1036 1037
  if (leaf_node.prev_page() != prev_page_num) {
    LOG_WARN("invalid page. current_page_num=%d, prev page num should be %d but got %d",
羽飞's avatar
羽飞 已提交
1038
  	       frame->page_num(), prev_page_num, leaf_node.prev_page());
羽飞's avatar
羽飞 已提交
1039 1040 1041 1042
    return false;
  }
  PageNum next_page_num = leaf_node.next_page();

羽飞's avatar
羽飞 已提交
1043
  prev_page_num = frame->page_num();
羽飞's avatar
羽飞 已提交
1044 1045
  char *prev_key = (char *)mem_pool_item_->alloc();
  memcpy(prev_key, leaf_node.key_at(leaf_node.size() - 1), file_header_.key_length);
羽飞's avatar
羽飞 已提交
1046
  disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1047 1048 1049

  bool result = true;
  while (result && next_page_num != BP_INVALID_PAGE_NUM) {
羽飞's avatar
羽飞 已提交
1050
    rc = disk_buffer_pool_->get_this_page(next_page_num, &frame);
羽飞's avatar
羽飞 已提交
1051 1052 1053 1054 1055
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to fetch next page. page num=%d, rc=%d:%s", next_page_num, rc, strrc(rc));
      return false;
    }

羽飞's avatar
羽飞 已提交
1056
    LeafIndexNodeHandler leaf_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1057 1058
    if (leaf_node.prev_page() != prev_page_num) {
      LOG_WARN("invalid page. current_page_num=%d, prev page num should be %d but got %d",
羽飞's avatar
羽飞 已提交
1059
	       frame->page_num(), prev_page_num, leaf_node.prev_page());
羽飞's avatar
羽飞 已提交
1060 1061 1062 1063 1064 1065 1066 1067 1068
      result = false;
    }
    if (key_comparator_(prev_key, leaf_node.key_at(0)) >= 0) {
      LOG_WARN("invalid page. current first key is not bigger than last");
      result = false;
    }

    next_page_num = leaf_node.next_page();
    memcpy(prev_key, leaf_node.key_at(leaf_node.size() - 1), file_header_.key_length);
羽飞's avatar
羽飞 已提交
1069 1070
    prev_page_num = frame->page_num();
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1071 1072 1073 1074 1075 1076 1077 1078 1079 1080 1081 1082 1083
  }

  free_key(prev_key);
  // can do more things
  return result;
}

bool BplusTreeHandler::validate_tree()
{
  if (is_empty()) {
    return true;
  }

羽飞's avatar
羽飞 已提交
1084 1085
  Frame *frame;
  RC rc = disk_buffer_pool_->get_this_page(file_header_.root_page, &frame);
羽飞's avatar
羽飞 已提交
1086 1087 1088 1089 1090
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch root page. page id=%d, rc=%d:%s", file_header_.root_page, rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
1091
  if (!validate_node_recursive(frame) || !validate_leaf_link()) {
羽飞's avatar
羽飞 已提交
1092 1093 1094 1095 1096 1097 1098 1099 1100 1101 1102 1103 1104 1105
    LOG_WARN("Current B+ Tree is invalid");
    print_tree();
    return false;
  }

  LOG_INFO("great! current tree is valid");
  return true;
}

bool BplusTreeHandler::is_empty() const
{
  return file_header_.root_page == BP_INVALID_PAGE_NUM;
}

羽飞's avatar
羽飞 已提交
1106
RC BplusTreeHandler::find_leaf(const char *key, Frame *&frame)
羽飞's avatar
羽飞 已提交
1107 1108 1109 1110 1111
{
  return find_leaf_internal(
			    [&](InternalIndexNodeHandler &internal_node) {
			      return internal_node.value_at(internal_node.lookup(key_comparator_, key));
			    },
羽飞's avatar
羽飞 已提交
1112
			    frame);
羽飞's avatar
羽飞 已提交
1113 1114
}

羽飞's avatar
羽飞 已提交
1115
RC BplusTreeHandler::left_most_page(Frame *&frame)
羽飞's avatar
羽飞 已提交
1116 1117 1118 1119 1120
{
  return find_leaf_internal(
			    [&](InternalIndexNodeHandler &internal_node) {
			      return internal_node.value_at(0);
			    },
羽飞's avatar
羽飞 已提交
1121
			    frame
羽飞's avatar
羽飞 已提交
1122 1123
			    );
}
羽飞's avatar
羽飞 已提交
1124
RC BplusTreeHandler::right_most_page(Frame *&frame)
羽飞's avatar
羽飞 已提交
1125 1126 1127 1128 1129
{
  return find_leaf_internal(
			    [&](InternalIndexNodeHandler &internal_node) {
			      return internal_node.value_at(internal_node.size() - 1);
			    },
羽飞's avatar
羽飞 已提交
1130
			    frame
羽飞's avatar
羽飞 已提交
1131 1132 1133 1134
			    );
}

RC BplusTreeHandler::find_leaf_internal(const std::function<PageNum(InternalIndexNodeHandler &)> &child_page_getter,
羽飞's avatar
羽飞 已提交
1135
					Frame *&frame)
羽飞's avatar
羽飞 已提交
1136 1137 1138 1139 1140
{
  if (is_empty()) {
    return RC::EMPTY;
  }

羽飞's avatar
羽飞 已提交
1141
  RC rc = disk_buffer_pool_->get_this_page(file_header_.root_page, &frame);
羽飞's avatar
羽飞 已提交
1142 1143 1144 1145 1146
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch root page. page id=%d, rc=%d:%s", file_header_.root_page, rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
1147
  IndexNode *node = (IndexNode *)frame->data();
羽飞's avatar
羽飞 已提交
1148
  while (false == node->is_leaf) {
羽飞's avatar
羽飞 已提交
1149
    InternalIndexNodeHandler internal_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1150 1151
    PageNum page_num = child_page_getter(internal_node);

羽飞's avatar
羽飞 已提交
1152
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1153

羽飞's avatar
羽飞 已提交
1154
    rc = disk_buffer_pool_->get_this_page(page_num, &frame);
羽飞's avatar
羽飞 已提交
1155
    if (rc != RC::SUCCESS) {
羽飞's avatar
羽飞 已提交
1156
      LOG_WARN("Failed to load page page_num:%d", page_num);
羽飞's avatar
羽飞 已提交
1157 1158
      return rc;
    }
羽飞's avatar
羽飞 已提交
1159
    node = (IndexNode *)frame->data();
羽飞's avatar
羽飞 已提交
1160 1161 1162 1163 1164
  }

  return RC::SUCCESS;
}

羽飞's avatar
羽飞 已提交
1165
RC BplusTreeHandler::insert_entry_into_leaf_node(Frame *frame, const char *key, const RID *rid)
羽飞's avatar
羽飞 已提交
1166
{
羽飞's avatar
羽飞 已提交
1167
  LeafIndexNodeHandler leaf_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1168 1169 1170 1171 1172 1173 1174 1175 1176
  bool exists = false;
  int insert_position = leaf_node.lookup(key_comparator_, key, &exists);
  if (exists) {
    LOG_TRACE("entry exists");
    return RC::RECORD_DUPLICATE_KEY;
  }

  if (leaf_node.size() < leaf_node.max_size()) {
    leaf_node.insert(insert_position, key, (const char *)rid);
羽飞's avatar
羽飞 已提交
1177 1178
    frame->mark_dirty();
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1179 1180 1181
    return RC::SUCCESS;
  }

羽飞's avatar
羽飞 已提交
1182 1183
  Frame * new_frame = nullptr;
  RC rc = split<LeafIndexNodeHandler>(frame, new_frame);
羽飞's avatar
羽飞 已提交
1184 1185 1186 1187 1188
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to split leaf node. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
1189 1190
  LeafIndexNodeHandler new_index_node(file_header_, new_frame);
  new_index_node.set_prev_page(frame->page_num());
羽飞's avatar
羽飞 已提交
1191 1192
  new_index_node.set_next_page(leaf_node.next_page());
  new_index_node.set_parent_page_num(leaf_node.parent_page_num());
羽飞's avatar
羽飞 已提交
1193
  leaf_node.set_next_page(new_frame->page_num());
羽飞's avatar
羽飞 已提交
1194 1195 1196

  PageNum next_page_num = new_index_node.next_page();
  if (next_page_num != BP_INVALID_PAGE_NUM) {
羽飞's avatar
羽飞 已提交
1197 1198
    Frame * next_frame;
    rc = disk_buffer_pool_->get_this_page(next_page_num, &next_frame);
羽飞's avatar
羽飞 已提交
1199 1200 1201 1202 1203
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to fetch next page. page num=%d, rc=%d:%s", next_page_num, rc, strrc(rc));
      return rc;
    }

羽飞's avatar
羽飞 已提交
1204 1205 1206
    LeafIndexNodeHandler next_node(file_header_, next_frame);
    next_node.set_prev_page(new_frame->page_num());
    disk_buffer_pool_->unpin_page(next_frame);
羽飞's avatar
羽飞 已提交
1207 1208 1209 1210 1211 1212 1213 1214
  }

  if (insert_position < leaf_node.size()) {
    leaf_node.insert(insert_position, key, (const char *)rid);
  } else {
    new_index_node.insert(insert_position - leaf_node.size(), key, (const char *)rid);
  }

羽飞's avatar
羽飞 已提交
1215
  return insert_entry_into_parent(frame, new_frame, new_index_node.key_at(0));
羽飞's avatar
羽飞 已提交
1216 1217
}

羽飞's avatar
羽飞 已提交
1218
RC BplusTreeHandler::insert_entry_into_parent(Frame *frame, Frame *new_frame, const char *key)
羽飞's avatar
羽飞 已提交
1219 1220 1221
{
  RC rc = RC::SUCCESS;

羽飞's avatar
羽飞 已提交
1222 1223
  IndexNodeHandler node_handler(file_header_, frame);
  IndexNodeHandler new_node_handler(file_header_, new_frame);
羽飞's avatar
羽飞 已提交
1224 1225 1226 1227 1228
  PageNum parent_page_num = node_handler.parent_page_num();

  if (parent_page_num == BP_INVALID_PAGE_NUM) {

    // create new root page
羽飞's avatar
羽飞 已提交
1229 1230
    Frame *root_frame;
    rc = disk_buffer_pool_->allocate_page(&root_frame);
羽飞's avatar
羽飞 已提交
1231 1232 1233 1234 1235
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to allocate new root page. rc=%d:%s", rc, strrc(rc));
      return rc;
    }

羽飞's avatar
羽飞 已提交
1236
    InternalIndexNodeHandler root_node(file_header_, root_frame);
羽飞's avatar
羽飞 已提交
1237
    root_node.init_empty();
羽飞's avatar
羽飞 已提交
1238 1239 1240
    root_node.create_new_root(frame->page_num(), key, new_frame->page_num());
    node_handler.set_parent_page_num(root_frame->page_num());
    new_node_handler.set_parent_page_num(root_frame->page_num());
羽飞's avatar
羽飞 已提交
1241

羽飞's avatar
羽飞 已提交
1242 1243 1244 1245
    frame->mark_dirty();
    new_frame->mark_dirty();
    disk_buffer_pool_->unpin_page(frame);
    disk_buffer_pool_->unpin_page(new_frame);
羽飞's avatar
羽飞 已提交
1246

羽飞's avatar
羽飞 已提交
1247
    file_header_.root_page = root_frame->page_num();
羽飞's avatar
羽飞 已提交
1248
    update_root_page_num(); // TODO
羽飞's avatar
羽飞 已提交
1249 1250
    root_frame->mark_dirty();
    disk_buffer_pool_->unpin_page(root_frame);
羽飞's avatar
羽飞 已提交
1251 1252 1253 1254 1255

    return RC::SUCCESS;

  } else {

羽飞's avatar
羽飞 已提交
1256 1257
    Frame *parent_frame;
    rc = disk_buffer_pool_->get_this_page(parent_page_num, &parent_frame);
羽飞's avatar
羽飞 已提交
1258 1259 1260 1261 1262 1263
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to insert entry into leaf. rc=%d:%s", rc, strrc(rc));
      // should do more things to recover
      return rc;
    }

羽飞's avatar
羽飞 已提交
1264
    InternalIndexNodeHandler node(file_header_, parent_frame);
羽飞's avatar
羽飞 已提交
1265 1266 1267

    /// current node is not in full mode, insert the entry and return
    if (node.size() < node.max_size()) {
羽飞's avatar
羽飞 已提交
1268
      node.insert(key, new_frame->page_num(), key_comparator_);
羽飞's avatar
羽飞 已提交
1269 1270
      new_node_handler.set_parent_page_num(parent_page_num);

羽飞's avatar
羽飞 已提交
1271 1272 1273 1274 1275 1276
      frame->mark_dirty();
      new_frame->mark_dirty();
      parent_frame->mark_dirty();
      disk_buffer_pool_->unpin_page(frame);
      disk_buffer_pool_->unpin_page(new_frame);
      disk_buffer_pool_->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
1277 1278 1279 1280

    } else {

      // we should split the node and insert the entry and then insert new entry to current node's parent
羽飞's avatar
羽飞 已提交
1281 1282
      Frame * new_parent_frame;
      rc = split<InternalIndexNodeHandler>(parent_frame, new_parent_frame);
羽飞's avatar
羽飞 已提交
1283 1284
      if (rc != RC::SUCCESS) {
	LOG_WARN("failed to split internal node. rc=%d:%s", rc, strrc(rc));
羽飞's avatar
羽飞 已提交
1285 1286 1287
	disk_buffer_pool_->unpin_page(frame);
	disk_buffer_pool_->unpin_page(new_frame);
	disk_buffer_pool_->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
1288 1289
      } else {
	// insert into left or right ? decide by key compare result
羽飞's avatar
羽飞 已提交
1290
	InternalIndexNodeHandler new_node(file_header_, new_parent_frame);
羽飞's avatar
羽飞 已提交
1291
	if (key_comparator_(key, new_node.key_at(0)) > 0) {
羽飞's avatar
羽飞 已提交
1292
	  new_node.insert(key, new_frame->page_num(), key_comparator_);
羽飞's avatar
羽飞 已提交
1293 1294
          new_node_handler.set_parent_page_num(new_node.page_num());
	} else {
羽飞's avatar
羽飞 已提交
1295
	  node.insert(key, new_frame->page_num(), key_comparator_);
羽飞's avatar
羽飞 已提交
1296 1297 1298
          new_node_handler.set_parent_page_num(node.page_num());
	}

羽飞's avatar
羽飞 已提交
1299 1300
	disk_buffer_pool_->unpin_page(frame);
	disk_buffer_pool_->unpin_page(new_frame);
羽飞's avatar
羽飞 已提交
1301
	
羽飞's avatar
羽飞 已提交
1302
	rc = insert_entry_into_parent(parent_frame, new_parent_frame, new_node.key_at(0));
羽飞's avatar
羽飞 已提交
1303 1304 1305 1306 1307 1308 1309 1310 1311 1312 1313 1314 1315
      }
    }
  }
  return rc;
}

/**
 * split one full node into two
 * @param page_handle[inout] the node to split
 * @param new_page_handle[out] the new node after split
 * @param intert_position the intert position of new key
 */
template <typename IndexNodeHandlerType>
羽飞's avatar
羽飞 已提交
1316
RC BplusTreeHandler::split(Frame *frame, Frame *&new_frame)
羽飞's avatar
羽飞 已提交
1317
{
羽飞's avatar
羽飞 已提交
1318
  IndexNodeHandlerType old_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1319 1320 1321 1322 1323 1324 1325 1326

  char *new_parent_key = (char *)mem_pool_item_->alloc();
  if (new_parent_key == nullptr) {
    LOG_WARN("Failed to alloc memory for new key. size=%d", file_header_.key_length);
    return RC::NOMEM;
  }

  // add a new node
羽飞's avatar
羽飞 已提交
1327
  RC rc = disk_buffer_pool_->allocate_page(&new_frame);
羽飞's avatar
羽飞 已提交
1328
  if (rc != RC::SUCCESS) {
羽飞's avatar
羽飞 已提交
1329
    LOG_WARN("Failed to split index page due to failed to allocate page, rc=%d:%s", rc, strrc(rc));
羽飞's avatar
羽飞 已提交
1330 1331 1332
    return rc;
  }

羽飞's avatar
羽飞 已提交
1333
  IndexNodeHandlerType new_node(file_header_, new_frame);
羽飞's avatar
羽飞 已提交
1334 1335 1336
  new_node.init_empty();
  new_node.set_parent_page_num(old_node.parent_page_num());

羽飞's avatar
羽飞 已提交
1337
  old_node.move_half_to(new_node, disk_buffer_pool_);
羽飞's avatar
羽飞 已提交
1338

羽飞's avatar
羽飞 已提交
1339 1340
  frame->mark_dirty();
  new_frame->mark_dirty();
羽飞's avatar
羽飞 已提交
1341 1342 1343 1344 1345
  return RC::SUCCESS;
}

RC BplusTreeHandler::update_root_page_num()
{
羽飞's avatar
羽飞 已提交
1346 1347
  Frame * header_frame;
  RC rc = disk_buffer_pool_->get_this_page(FIRST_INDEX_PAGE, &header_frame);
羽飞's avatar
羽飞 已提交
1348 1349 1350 1351 1352
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch header page. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
1353
  IndexFileHeader *header = (IndexFileHeader *)header_frame->data();
羽飞's avatar
羽飞 已提交
1354
  header->root_page = file_header_.root_page;
羽飞's avatar
羽飞 已提交
1355 1356
  header_frame->mark_dirty();
  disk_buffer_pool_->unpin_page(header_frame);
羽飞's avatar
羽飞 已提交
1357 1358 1359 1360 1361 1362 1363 1364 1365 1366 1367 1368 1369
  return rc;
}


RC BplusTreeHandler::create_new_tree(const char *key, const RID *rid)
{
  RC rc = RC::SUCCESS;
  if (file_header_.root_page != BP_INVALID_PAGE_NUM) {
    rc = RC::INTERNAL;
    LOG_WARN("cannot create new tree while root page is valid. root page id=%d", file_header_.root_page);
    return rc;
  }

羽飞's avatar
羽飞 已提交
1370 1371
  Frame *frame;
  rc = disk_buffer_pool_->allocate_page(&frame);
羽飞's avatar
羽飞 已提交
1372 1373 1374 1375 1376
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to allocate root page. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

羽飞's avatar
羽飞 已提交
1377
  LeafIndexNodeHandler leaf_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1378 1379
  leaf_node.init_empty();
  leaf_node.insert(0, key, (const char *)rid);
羽飞's avatar
羽飞 已提交
1380 1381 1382
  file_header_.root_page = frame->page_num();
  frame->mark_dirty();
  disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1383 1384 1385 1386 1387 1388 1389 1390 1391 1392

  rc = update_root_page_num();
  // disk_buffer_pool_->check_all_pages_unpinned(file_id_);
  return rc;
}

char *BplusTreeHandler::make_key(const char *user_key, const RID &rid)
{
  char *key = (char *)mem_pool_item_->alloc();
  if (key == nullptr) {
羽飞's avatar
羽飞 已提交
1393
    LOG_WARN("Failed to alloc memory for key.");
羽飞's avatar
羽飞 已提交
1394 1395 1396 1397 1398 1399 1400 1401 1402 1403 1404 1405 1406 1407 1408 1409 1410 1411 1412 1413 1414
    return nullptr;
  }
  memcpy(key, user_key, file_header_.attr_length);
  memcpy(key + file_header_.attr_length, &rid, sizeof(rid));
  return key;
}

void BplusTreeHandler::free_key(char *key)
{
  mem_pool_item_->free(key);
}

RC BplusTreeHandler::insert_entry(const char *user_key, const RID *rid)
{
  if (user_key == nullptr || rid == nullptr) {
    LOG_WARN("Invalid arguments, key is empty or rid is empty");
    return RC::INVALID_ARGUMENT;
  }

  char *key = make_key(user_key, *rid);
  if (key == nullptr) {
羽飞's avatar
羽飞 已提交
1415
    LOG_WARN("Failed to alloc memory for key.");
羽飞's avatar
羽飞 已提交
1416 1417 1418 1419 1420 1421 1422
    return RC::NOMEM;
  }

  if (is_empty()) {
    return create_new_tree(key, rid);
  }

羽飞's avatar
羽飞 已提交
1423 1424
  Frame *frame;
  RC rc = find_leaf(key, frame);
羽飞's avatar
羽飞 已提交
1425
  if (rc != RC::SUCCESS) {
羽飞's avatar
羽飞 已提交
1426
    LOG_WARN("Failed to find leaf %s. rc=%d:%s", rid->to_string().c_str(), rc, strrc(rc));
羽飞's avatar
羽飞 已提交
1427 1428 1429 1430
    mem_pool_item_->free(key);
    return rc;
  }

羽飞's avatar
羽飞 已提交
1431
  rc = insert_entry_into_leaf_node(frame, key, rid);
羽飞's avatar
羽飞 已提交
1432
  if (rc != RC::SUCCESS) {
羽飞's avatar
羽飞 已提交
1433 1434
    LOG_TRACE("Failed to insert into leaf of index, rid:%s", rid->to_string().c_str());
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1435 1436 1437 1438 1439 1440 1441 1442 1443 1444 1445 1446 1447 1448 1449 1450 1451 1452 1453 1454 1455 1456 1457 1458 1459 1460 1461 1462 1463 1464 1465 1466 1467 1468
    mem_pool_item_->free(key);
    // disk_buffer_pool_->check_all_pages_unpinned(file_id_);
    return rc;
  }

  mem_pool_item_->free(key);
  LOG_TRACE("insert entry success");
  // disk_buffer_pool_->check_all_pages_unpinned(file_id_);
  return RC::SUCCESS;
}

RC BplusTreeHandler::get_entry(const char *user_key, std::list<RID> &rids)
{
  BplusTreeScanner scanner(*this);
  RC rc = scanner.open(user_key, true/*left_inclusive*/, user_key, true/*right_inclusive*/);
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to open scanner. rc=%d:%s", rc, strrc(rc));
    return rc;
  }

  RID rid;
  while ((rc = scanner.next_entry(&rid)) == RC::SUCCESS) {
    rids.push_back(rid);
  }

  scanner.close();
  if (rc != RC::RECORD_EOF) {
    LOG_WARN("scanner return error. rc=%d:%s", rc, strrc(rc));
  } else {
    rc = RC::SUCCESS;
  }
  return rc;
}

羽飞's avatar
羽飞 已提交
1469
RC BplusTreeHandler::adjust_root(Frame *root_frame)
羽飞's avatar
羽飞 已提交
1470
{
羽飞's avatar
羽飞 已提交
1471
  IndexNodeHandler root_node(file_header_, root_frame);
羽飞's avatar
羽飞 已提交
1472
  if (root_node.is_leaf() && root_node.size() > 0) {
羽飞's avatar
羽飞 已提交
1473 1474
    root_frame->mark_dirty();
    disk_buffer_pool_->unpin_page(root_frame);
羽飞's avatar
羽飞 已提交
1475 1476 1477 1478 1479 1480 1481 1482
    return RC::SUCCESS;
  }

  if (root_node.is_leaf()) {
    // this is a leaf and an empty node
    file_header_.root_page = BP_INVALID_PAGE_NUM;
  } else {
    // this is an internal node and has only one child node
羽飞's avatar
羽飞 已提交
1483
    InternalIndexNodeHandler internal_node(file_header_, root_frame);
羽飞's avatar
羽飞 已提交
1484 1485

    const PageNum child_page_num = internal_node.value_at(0);
羽飞's avatar
羽飞 已提交
1486 1487
    Frame * child_frame;
    RC rc = disk_buffer_pool_->get_this_page(child_page_num, &child_frame);
羽飞's avatar
羽飞 已提交
1488 1489 1490 1491 1492
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to fetch child page. page num=%d, rc=%d:%s", child_page_num, rc, strrc(rc));
      return rc;
    }

羽飞's avatar
羽飞 已提交
1493
    IndexNodeHandler child_node(file_header_, child_frame);
羽飞's avatar
羽飞 已提交
1494
    child_node.set_parent_page_num(BP_INVALID_PAGE_NUM);
羽飞's avatar
羽飞 已提交
1495
    disk_buffer_pool_->unpin_page(child_frame);
羽飞's avatar
羽飞 已提交
1496 1497 1498 1499 1500 1501
    
    file_header_.root_page = child_page_num;
  }

  update_root_page_num();

羽飞's avatar
羽飞 已提交
1502 1503 1504
  PageNum old_root_page_num = root_frame->page_num();
  disk_buffer_pool_->unpin_page(root_frame);
  disk_buffer_pool_->dispose_page(old_root_page_num);
羽飞's avatar
羽飞 已提交
1505 1506 1507
  return RC::SUCCESS;
}
template <typename IndexNodeHandlerType>
羽飞's avatar
羽飞 已提交
1508
RC BplusTreeHandler::coalesce_or_redistribute(Frame *frame)
羽飞's avatar
羽飞 已提交
1509
{
羽飞's avatar
羽飞 已提交
1510
  IndexNodeHandlerType index_node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1511
  if (index_node.size() >= index_node.min_size()) {
羽飞's avatar
羽飞 已提交
1512
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1513 1514 1515 1516 1517 1518 1519
    return RC::SUCCESS;
  }

  const PageNum parent_page_num = index_node.parent_page_num();
  if (BP_INVALID_PAGE_NUM == parent_page_num) {
    // this is the root page
    if (index_node.size() > 1) {
羽飞's avatar
羽飞 已提交
1520
      disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1521 1522
    } else {
      // adjust the root node
羽飞's avatar
羽飞 已提交
1523
      adjust_root(frame);
羽飞's avatar
羽飞 已提交
1524 1525 1526 1527
    }
    return RC::SUCCESS;
  }

羽飞's avatar
羽飞 已提交
1528 1529
  Frame * parent_frame;
  RC rc = disk_buffer_pool_->get_this_page(parent_page_num, &parent_frame);
羽飞's avatar
羽飞 已提交
1530 1531
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch parent page. page id=%d, rc=%d:%s", parent_page_num, rc, strrc(rc));
羽飞's avatar
羽飞 已提交
1532
    disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1533 1534 1535
    return rc;
  }

羽飞's avatar
羽飞 已提交
1536
  InternalIndexNodeHandler parent_index_node(file_header_, parent_frame);
羽飞's avatar
羽飞 已提交
1537
  int index = parent_index_node.lookup(key_comparator_, index_node.key_at(index_node.size() - 1));
羽飞's avatar
羽飞 已提交
1538
  if (parent_index_node.value_at(index) != frame->page_num()) {
羽飞's avatar
羽飞 已提交
1539
    LOG_ERROR("lookup return an invalid value. index=%d, this page num=%d, but got %d",
羽飞's avatar
羽飞 已提交
1540
	      index, frame->page_num(), parent_index_node.value_at(index));
羽飞's avatar
羽飞 已提交
1541 1542 1543 1544 1545 1546 1547 1548
  }
  PageNum neighbor_page_num;
  if (index == 0) {
    neighbor_page_num = parent_index_node.value_at(1);
  } else {
    neighbor_page_num = parent_index_node.value_at(index - 1);
  }

羽飞's avatar
羽飞 已提交
1549 1550
  Frame * neighbor_frame;
  rc = disk_buffer_pool_->get_this_page(neighbor_page_num, &neighbor_frame);
羽飞's avatar
羽飞 已提交
1551 1552 1553
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to fetch neighbor page. page id=%d, rc=%d:%s", neighbor_page_num, rc, strrc(rc));
    // TODO do more thing to release resource
羽飞's avatar
羽飞 已提交
1554 1555
    disk_buffer_pool_->unpin_page(frame);
    disk_buffer_pool_->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
1556 1557 1558
    return rc;
  }

羽飞's avatar
羽飞 已提交
1559
  IndexNodeHandlerType neighbor_node(file_header_, neighbor_frame);
羽飞's avatar
羽飞 已提交
1560
  if (index_node.size() + neighbor_node.size() > index_node.max_size()) {
羽飞's avatar
羽飞 已提交
1561
    rc = redistribute<IndexNodeHandlerType>(neighbor_frame, frame, parent_frame, index);
羽飞's avatar
羽飞 已提交
1562
  } else {
羽飞's avatar
羽飞 已提交
1563
    rc = coalesce<IndexNodeHandlerType>(neighbor_frame, frame, parent_frame, index);
羽飞's avatar
羽飞 已提交
1564 1565 1566 1567 1568
  }
  return rc;
}

template <typename IndexNodeHandlerType>
羽飞's avatar
羽飞 已提交
1569
RC BplusTreeHandler::coalesce(Frame *neighbor_frame, Frame *frame, Frame *parent_frame, int index)
羽飞's avatar
羽飞 已提交
1570
{
羽飞's avatar
羽飞 已提交
1571 1572
  IndexNodeHandlerType neighbor_node(file_header_, neighbor_frame);
  IndexNodeHandlerType node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1573

羽飞's avatar
羽飞 已提交
1574
  InternalIndexNodeHandler parent_node(file_header_, parent_frame);
羽飞's avatar
羽飞 已提交
1575

羽飞's avatar
羽飞 已提交
1576 1577
  Frame *left_frame = nullptr;
  Frame *right_frame = nullptr;
羽飞's avatar
羽飞 已提交
1578 1579
  if (index == 0) {
    // neighbor node is at right
羽飞's avatar
羽飞 已提交
1580 1581
    left_frame  = frame;
    right_frame = neighbor_frame;
羽飞's avatar
羽飞 已提交
1582 1583
    index++;
  } else {
羽飞's avatar
羽飞 已提交
1584 1585
    left_frame  = neighbor_frame;
    right_frame = frame;
羽飞's avatar
羽飞 已提交
1586 1587 1588
    // neighbor is at left
  }

羽飞's avatar
羽飞 已提交
1589 1590
  IndexNodeHandlerType left_node(file_header_, left_frame);
  IndexNodeHandlerType right_node(file_header_, right_frame);
羽飞's avatar
羽飞 已提交
1591 1592 1593

  parent_node.remove(index);
  // parent_node.validate(key_comparator_, disk_buffer_pool_, file_id_);
羽飞's avatar
羽飞 已提交
1594
  RC rc = right_node.move_to(left_node, disk_buffer_pool_);
羽飞's avatar
羽飞 已提交
1595 1596 1597 1598 1599 1600 1601
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to move right node to left. rc=%d:%s", rc, strrc(rc));
    return rc;
  }
  // left_node.validate(key_comparator_);

  if (left_node.is_leaf()) {
羽飞's avatar
羽飞 已提交
1602 1603
    LeafIndexNodeHandler left_leaf_node(file_header_, left_frame);
    LeafIndexNodeHandler right_leaf_node(file_header_, right_frame);
羽飞's avatar
羽飞 已提交
1604 1605 1606 1607
    left_leaf_node.set_next_page(right_leaf_node.next_page());

    PageNum next_right_page_num = right_leaf_node.next_page();
    if (next_right_page_num != BP_INVALID_PAGE_NUM) {
羽飞's avatar
羽飞 已提交
1608 1609
      Frame *next_right_frame;
      rc = disk_buffer_pool_->get_this_page(next_right_page_num, &next_right_frame);
羽飞's avatar
羽飞 已提交
1610 1611
      if (rc != RC::SUCCESS) {
        LOG_WARN("failed to fetch next right page. page number:%d. rc=%d:%s", next_right_page_num, rc, strrc(rc));
羽飞's avatar
羽飞 已提交
1612 1613 1614
	disk_buffer_pool_->unpin_page(frame);
	disk_buffer_pool_->unpin_page(neighbor_frame);
	disk_buffer_pool_->unpin_page(parent_frame);
羽飞's avatar
羽飞 已提交
1615 1616 1617
        return rc;
      }

羽飞's avatar
羽飞 已提交
1618
      LeafIndexNodeHandler next_right_node(file_header_, next_right_frame);
羽飞's avatar
羽飞 已提交
1619
      next_right_node.set_prev_page(left_node.page_num());
羽飞's avatar
羽飞 已提交
1620
      disk_buffer_pool_->unpin_page(next_right_frame);
羽飞's avatar
羽飞 已提交
1621 1622 1623 1624
    }
    
  }

羽飞's avatar
羽飞 已提交
1625 1626 1627 1628 1629
  PageNum right_page_num = right_frame->page_num();
  disk_buffer_pool_->unpin_page(left_frame);
  disk_buffer_pool_->unpin_page(right_frame);
  disk_buffer_pool_->dispose_page(right_page_num);
  return coalesce_or_redistribute<InternalIndexNodeHandler>(parent_frame);
羽飞's avatar
羽飞 已提交
1630 1631 1632
}

template <typename IndexNodeHandlerType>
羽飞's avatar
羽飞 已提交
1633
RC BplusTreeHandler::redistribute(Frame *neighbor_frame, Frame *frame, Frame *parent_frame, int index)
羽飞's avatar
羽飞 已提交
1634
{
羽飞's avatar
羽飞 已提交
1635 1636 1637
  InternalIndexNodeHandler parent_node(file_header_, parent_frame);
  IndexNodeHandlerType neighbor_node(file_header_, neighbor_frame);
  IndexNodeHandlerType node(file_header_, frame);
羽飞's avatar
羽飞 已提交
1638 1639 1640 1641 1642 1643
  if (neighbor_node.size() < node.size()) {
    LOG_ERROR("got invalid nodes. neighbor node size %d, this node size %d",
	      neighbor_node.size(), node.size());
  }
  if (index == 0) {
    // the neighbor is at right
羽飞's avatar
羽飞 已提交
1644
    neighbor_node.move_first_to_end(node, disk_buffer_pool_);
羽飞's avatar
羽飞 已提交
1645 1646 1647 1648 1649 1650
    // neighbor_node.validate(key_comparator_, disk_buffer_pool_, file_id_);
    // node.validate(key_comparator_, disk_buffer_pool_, file_id_);
    parent_node.set_key_at(index + 1, neighbor_node.key_at(0));
    // parent_node.validate(key_comparator_, disk_buffer_pool_, file_id_);
  } else {
    // the neighbor is at left
羽飞's avatar
羽飞 已提交
1651
    neighbor_node.move_last_to_front(node, disk_buffer_pool_);
羽飞's avatar
羽飞 已提交
1652 1653 1654 1655 1656 1657
    // neighbor_node.validate(key_comparator_, disk_buffer_pool_, file_id_);
    // node.validate(key_comparator_, disk_buffer_pool_, file_id_);
    parent_node.set_key_at(index, node.key_at(0));
    // parent_node.validate(key_comparator_, disk_buffer_pool_, file_id_);
  }

羽飞's avatar
羽飞 已提交
1658 1659 1660 1661 1662 1663
  neighbor_frame->mark_dirty();
  frame->mark_dirty();
  parent_frame->mark_dirty();
  disk_buffer_pool_->unpin_page(parent_frame);
  disk_buffer_pool_->unpin_page(neighbor_frame);
  disk_buffer_pool_->unpin_page(frame);
羽飞's avatar
羽飞 已提交
1664 1665 1666
  return RC::SUCCESS;
}

羽飞's avatar
羽飞 已提交
1667
RC BplusTreeHandler::delete_entry_internal(Frame *leaf_frame, const char *key)
羽飞's avatar
羽飞 已提交
1668
{
羽飞's avatar
羽飞 已提交
1669
  LeafIndexNodeHandler leaf_index_node(file_header_, leaf_frame);
羽飞's avatar
羽飞 已提交
1670 1671 1672 1673

  const int remove_count = leaf_index_node.remove(key, key_comparator_);
  if (remove_count == 0) {
    LOG_TRACE("no data to remove");
羽飞's avatar
羽飞 已提交
1674
    disk_buffer_pool_->unpin_page(leaf_frame);
羽飞's avatar
羽飞 已提交
1675 1676 1677 1678
    return RC::RECORD_RECORD_NOT_EXIST;
  }
  // leaf_index_node.validate(key_comparator_, disk_buffer_pool_, file_id_);

羽飞's avatar
羽飞 已提交
1679
  leaf_frame->mark_dirty();
羽飞's avatar
羽飞 已提交
1680 1681

  if (leaf_index_node.size() >= leaf_index_node.min_size()) {
羽飞's avatar
羽飞 已提交
1682
    disk_buffer_pool_->unpin_page(leaf_frame);
羽飞's avatar
羽飞 已提交
1683 1684 1685
    return RC::SUCCESS;
  }

羽飞's avatar
羽飞 已提交
1686
  return coalesce_or_redistribute<LeafIndexNodeHandler>(leaf_frame);
羽飞's avatar
羽飞 已提交
1687 1688 1689 1690 1691 1692 1693 1694 1695 1696 1697 1698
}

RC BplusTreeHandler::delete_entry(const char *user_key, const RID *rid)
{
  char *key = (char *)mem_pool_item_->alloc();
  if (nullptr == key) {
    LOG_WARN("Failed to alloc memory for key. size=%d", file_header_.key_length);
    return RC::NOMEM;
  }
  memcpy(key, user_key, file_header_.attr_length);
  memcpy(key + file_header_.attr_length, rid, sizeof(*rid));

羽飞's avatar
羽飞 已提交
1699 1700
  Frame *leaf_frame;
  RC rc = find_leaf(key, leaf_frame);
羽飞's avatar
羽飞 已提交
1701 1702 1703 1704 1705
  if (rc != RC::SUCCESS) {
    LOG_WARN("failed to find leaf page. rc =%d:%s", rc, strrc(rc));
    mem_pool_item_->free(key);
    return rc;
  }
羽飞's avatar
羽飞 已提交
1706
  rc = delete_entry_internal(leaf_frame, key);
羽飞's avatar
羽飞 已提交
1707
  if (rc != RC::SUCCESS) {
羽飞's avatar
羽飞 已提交
1708
    LOG_WARN("Failed to delete index");
羽飞's avatar
羽飞 已提交
1709 1710 1711 1712 1713 1714 1715 1716 1717 1718 1719 1720 1721 1722 1723 1724 1725 1726 1727 1728 1729 1730 1731 1732 1733 1734 1735 1736 1737 1738 1739 1740 1741 1742 1743 1744 1745 1746
    mem_pool_item_->free(key);
    return rc;
  }
  mem_pool_item_->free(key);
  return RC::SUCCESS;
}

BplusTreeScanner::BplusTreeScanner(BplusTreeHandler &tree_handler) : tree_handler_(tree_handler)
{}

BplusTreeScanner::~BplusTreeScanner()
{
  close();
}

RC BplusTreeScanner::open(const char *left_user_key, bool left_inclusive,
                          const char *right_user_key, bool right_inclusive)
{
  RC rc = RC::SUCCESS;
  if (inited_) {
    LOG_WARN("tree scanner has been inited");
    return RC::INTERNAL;
  }

  inited_ = true;
  
  // 校验输入的键值是否是合法范围
  if (left_user_key && right_user_key) {
    const auto &attr_comparator = tree_handler_.key_comparator_.attr_comparator();
    const int result = attr_comparator(left_user_key, right_user_key);
    if (result > 0 || // left < right
         // left == right but is (left,right)/[left,right) or (left,right]
	(result == 0 && (left_inclusive == false || right_inclusive == false))) { 
      return RC::INVALID_ARGUMENT;
    }
  }

  if (nullptr == left_user_key) {
羽飞's avatar
羽飞 已提交
1747
    rc = tree_handler_.left_most_page(left_frame_);
羽飞's avatar
羽飞 已提交
1748 1749 1750 1751 1752 1753 1754 1755 1756 1757 1758 1759 1760
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to find left most page. rc=%d:%s", rc, strrc(rc));
      return rc;
    }

    iter_index_ = 0;
  } else {
    char *left_key = nullptr;
    if (left_inclusive) { 
      left_key = tree_handler_.make_key(left_user_key, *RID::min());
    } else {
      left_key = tree_handler_.make_key(left_user_key, *RID::max());
    }
羽飞's avatar
羽飞 已提交
1761
    rc = tree_handler_.find_leaf(left_key, left_frame_);
羽飞's avatar
羽飞 已提交
1762 1763 1764 1765 1766 1767

    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to find left page. rc=%d:%s", rc, strrc(rc));
      tree_handler_.free_key(left_key);
      return rc;
    }
羽飞's avatar
羽飞 已提交
1768
    LeafIndexNodeHandler left_node(tree_handler_.file_header_, left_frame_);
羽飞's avatar
羽飞 已提交
1769 1770 1771 1772 1773 1774 1775 1776 1777
    int left_index = left_node.lookup(tree_handler_.key_comparator_, left_key);
    tree_handler_.free_key(left_key);
    // lookup 返回的是适合插入的位置,还需要判断一下是否在合适的边界范围内
    if (left_index >= left_node.size()) { // 超出了当前页,就需要向后移动一个位置
      const PageNum next_page_num = left_node.next_page();
      if (next_page_num == BP_INVALID_PAGE_NUM) { // 这里已经是最后一页,说明当前扫描,没有数据
	return RC::SUCCESS;
      }

羽飞's avatar
羽飞 已提交
1778 1779
      tree_handler_.disk_buffer_pool_->unpin_page(left_frame_);
      rc = tree_handler_.disk_buffer_pool_->get_this_page(next_page_num, &left_frame_);
羽飞's avatar
羽飞 已提交
1780 1781 1782 1783 1784 1785 1786 1787 1788 1789 1790 1791
      if (rc != RC::SUCCESS) {
	LOG_WARN("failed to fetch next page. page num=%d, rc=%d:%s", next_page_num, rc, strrc(rc));
	return rc;
      }

      left_index = 0;
    }
    iter_index_ = left_index;
  }

  // 没有指定右边界范围,那么就返回右边界最大值
  if (nullptr == right_user_key) {
羽飞's avatar
羽飞 已提交
1792
    rc = tree_handler_.right_most_page(right_frame_);
羽飞's avatar
羽飞 已提交
1793 1794 1795 1796 1797
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to fetch right most page. rc=%d:%s", rc, strrc(rc));
      return rc;
    }

羽飞's avatar
羽飞 已提交
1798
    LeafIndexNodeHandler node(tree_handler_.file_header_, right_frame_);
羽飞's avatar
羽飞 已提交
1799 1800 1801 1802 1803 1804 1805 1806 1807 1808
    end_index_ = node.size() - 1;
  } else {

    char *right_key = nullptr;
    if (right_inclusive) {
      right_key = tree_handler_.make_key(right_user_key, *RID::max());
    } else {
      right_key = tree_handler_.make_key(right_user_key, *RID::min());
    }

羽飞's avatar
羽飞 已提交
1809
    rc = tree_handler_.find_leaf(right_key, right_frame_);
羽飞's avatar
羽飞 已提交
1810 1811 1812 1813 1814 1815
    if (rc != RC::SUCCESS) {
      LOG_WARN("failed to find left page. rc=%d:%s", rc, strrc(rc));
      tree_handler_.free_key(right_key);
      return rc;
    }

羽飞's avatar
羽飞 已提交
1816
    LeafIndexNodeHandler right_node(tree_handler_.file_header_, right_frame_);
羽飞's avatar
羽飞 已提交
1817 1818 1819 1820 1821 1822 1823 1824 1825 1826 1827 1828 1829 1830 1831
    int right_index = right_node.lookup(tree_handler_.key_comparator_, right_key);
    tree_handler_.free_key(right_key);
    // lookup 返回的是适合插入的位置,需要根据实际情况做调整
    // 通常情况下需要找到上一个位置
    if (right_index > 0) {
      right_index--;
    } else {
      // 实际上,只有最左边的叶子节点查找时,lookup 才可能返回0
      // 其它的叶子节点都不可能返回0,所以这段逻辑其实是可以简化的
      const PageNum prev_page_num = right_node.prev_page();
      if (prev_page_num == BP_INVALID_PAGE_NUM) {
	end_index_ = -1;
	return RC::SUCCESS;
      }

羽飞's avatar
羽飞 已提交
1832 1833
      tree_handler_.disk_buffer_pool_->unpin_page(right_frame_);
      rc = tree_handler_.disk_buffer_pool_->get_this_page(prev_page_num, &right_frame_);
羽飞's avatar
羽飞 已提交
1834 1835 1836 1837 1838
      if (rc != RC::SUCCESS) {
	LOG_WARN("failed to fetch prev page num. page num=%d, rc=%d:%s", prev_page_num, rc, strrc(rc));
	return rc;
      }

羽飞's avatar
羽飞 已提交
1839
      LeafIndexNodeHandler tmp_node(tree_handler_.file_header_, right_frame_);
羽飞's avatar
羽飞 已提交
1840 1841 1842 1843 1844 1845 1846 1847
      right_index = tmp_node.size() - 1;
    }
    end_index_ = right_index;
  }

  // 判断是否左边界比右边界要靠后
  // 两个边界最多会多一页
  // 查找不存在的元素,或者不存在的范围数据时,可能会存在这个问题
羽飞's avatar
羽飞 已提交
1848
  if (left_frame_->page_num() == right_frame_->page_num() &&
羽飞's avatar
羽飞 已提交
1849 1850 1851
      iter_index_ > end_index_) {
    end_index_ = -1;
  } else {
羽飞's avatar
羽飞 已提交
1852 1853
    LeafIndexNodeHandler left_node(tree_handler_.file_header_, left_frame_);
    LeafIndexNodeHandler right_node(tree_handler_.file_header_, right_frame_);
羽飞's avatar
羽飞 已提交
1854 1855 1856 1857 1858 1859 1860 1861 1862 1863 1864 1865 1866
    if (left_node.prev_page() == right_node.page_num()) {
      end_index_ = -1;
    }
  }
  return RC::SUCCESS;
}

RC BplusTreeScanner::next_entry(RID *rid)
{
  if (-1 == end_index_) {
    return RC::RECORD_EOF;
  }

羽飞's avatar
羽飞 已提交
1867
  LeafIndexNodeHandler node(tree_handler_.file_header_, left_frame_);
羽飞's avatar
羽飞 已提交
1868 1869
  memcpy(rid, node.value_at(iter_index_), sizeof(*rid));

羽飞's avatar
羽飞 已提交
1870
  if (left_frame_->page_num() == right_frame_->page_num() &&
羽飞's avatar
羽飞 已提交
1871 1872 1873 1874 1875 1876 1877 1878 1879 1880 1881
      iter_index_ == end_index_) {
    end_index_ = -1;
    return RC::SUCCESS;
  }

  if (iter_index_ < node.size() - 1) {
    ++iter_index_;
    return RC::SUCCESS;
  }

  RC rc = RC::SUCCESS;
羽飞's avatar
羽飞 已提交
1882
  if (left_frame_->page_num() != right_frame_->page_num()) {
羽飞's avatar
羽飞 已提交
1883
    PageNum page_num = node.next_page();
羽飞's avatar
羽飞 已提交
1884
    tree_handler_.disk_buffer_pool_->unpin_page(left_frame_);
羽飞's avatar
羽飞 已提交
1885 1886 1887 1888
    if (page_num == BP_INVALID_PAGE_NUM) {
      LOG_WARN("got invalid next page. page num=%d", page_num);
      rc = RC::INTERNAL;
    } else {
羽飞's avatar
羽飞 已提交
1889
      rc = tree_handler_.disk_buffer_pool_->get_this_page(page_num, &left_frame_);
羽飞's avatar
羽飞 已提交
1890 1891 1892 1893 1894 1895 1896 1897 1898
      if (rc != RC::SUCCESS) {
        LOG_WARN("failed to fetch next page. page num=%d, rc=%d:%s", page_num, rc, strrc(rc));
        return rc;
      }

      iter_index_ = 0;
    }
  } else if (end_index_ != -1) {
    LOG_WARN("should have more pages but not. left page=%d, right page=%d",
羽飞's avatar
羽飞 已提交
1899
	     left_frame_->page_num(), right_frame_->page_num());
羽飞's avatar
羽飞 已提交
1900 1901 1902 1903 1904 1905 1906
    rc = RC::INTERNAL;
  }
  return rc;
}

RC BplusTreeScanner::close()
{
羽飞's avatar
羽飞 已提交
1907 1908
  if (left_frame_ != nullptr) {
    tree_handler_.disk_buffer_pool_->unpin_page(left_frame_);
羽飞's avatar
羽飞 已提交
1909
  }
羽飞's avatar
羽飞 已提交
1910 1911
  if (right_frame_ != nullptr) {
    tree_handler_.disk_buffer_pool_->unpin_page(right_frame_);
羽飞's avatar
羽飞 已提交
1912 1913 1914 1915 1916 1917
  }
  end_index_ = -1;
  inited_ = false;
  LOG_INFO("bplus tree scanner closed");
  return RC::SUCCESS;
}