9 #include "index/bpTree_block.h"
10 #include "buffer/buffer_manager.h"
11 #include "share/err_type.h"
14 #define BP_TREE_T Bp_tree<key_t, value_t>
15 #define BP_TREE_BLOCK_T bpTree_Block
16 #define BP_TREE_LEAF_T bpTree_Leaf<key_t, value_t>
17 #define BP_TREE_INTERNAL_T bpTree_Internal<key_t, blockId_t>
35 void InitRoot(std::string indexFileName);
37 const std::string& getName()
const {
49 bool Insert(
const key_t &key,
const value_t &val);
60 bool Delete(
const key_t &key);
68 bool Delete(
const key_t &key, value_t &deleted);
78 bool FindValue(
const key_t &key, value_t &result)
const;
89 bool FindRange(
const key_t& lower_key,
const key_t& upper_key, std::vector<value_t>& result)
const;
97 bool UpdateKey(
const key_t &former_key,
const key_t &new_key);
105 bool UpdateValue(
const key_t &key,
const value_t &new_val);
108 blockId_t _root_id = INVALID_BLOCK_ID;
109 std::string _index_fname;
110 db_size_t _file_block_count;
116 blockId_t FindRootBlockId(BP_TREE_BLOCK_T* block);
126 BP_TREE_LEAF_T* FindNode(
const key_t &key, pageId_t &leaf_pageId)
const;
137 bool Insert_in_Leaf(
const key_t &key,
const value_t &val, BP_TREE_LEAF_T* leaf);
147 bool Insert_in_Parent(
const key_t &key, BP_TREE_BLOCK_T* prev_leaf, BP_TREE_BLOCK_T* split);
157 bool Delete_in_Parent(BP_TREE_BLOCK_T* parent, db_size_t pos_sep);
159 void loadPointer(BP_TREE_LEAF_T*& leaf, pageId_t& leaf_pageId, blockId_t b_id)
const{
160 char* raw = _bfm->
getPage(_index_fname, b_id, leaf_pageId);
161 leaf =
reinterpret_cast<BP_TREE_LEAF_T*
>(raw);
164 void loadPointer(BP_TREE_INTERNAL_T*&
internal, pageId_t& internal_pageId, blockId_t b_id)
const{
165 char* raw = _bfm->
getPage(_index_fname, b_id, internal_pageId);
166 internal =
reinterpret_cast<BP_TREE_INTERNAL_T*
>(raw);
169 void loadPointer(BP_TREE_BLOCK_T*& block, blockId_t b_id)
const{
170 char* raw = _bfm->
getPage(_index_fname, b_id);
171 block =
reinterpret_cast<BP_TREE_BLOCK_T*
>(raw);
174 void loadPointer(BP_TREE_BLOCK_T*& block, pageId_t& pageId, blockId_t b_id)
const {
175 char* raw = _bfm->
getPage(_index_fname, b_id, pageId);
176 block =
reinterpret_cast<BP_TREE_BLOCK_T*
>(raw);
179 void setChildrenParent(BP_TREE_INTERNAL_T*
internal){
180 for(db_size_t i = 0; i <
internal->_size; ++i){
181 BP_TREE_BLOCK_T* child;
182 loadPointer(child, internal->_k_child_pair[i].second);
183 child->_parent_block_id =
internal->_block_id;
187 std::pair<key_t, value_t>& getKeyRowidPair(
const key_t &key);
191 void BP_TREE_T::InitRoot(std::string indexFileName) {
192 _index_fname = indexFileName;
195 BP_TREE_BLOCK_T* headBlock;
196 loadPointer(headBlock, headPageId, 0);
197 _bfm->pinPage(headPageId);
201 if (headBlock->_blockType == INVALID_BLOCK){
202 _root_id = INVALID_BLOCK_ID;
205 _root_id = FindRootBlockId(headBlock);
208 _file_block_count = (_bfm->getFileSize(indexFileName) + PAGESIZE - 1) / PAGESIZE;
209 _bfm->unpinPage(headPageId);
213 blockId_t BP_TREE_T::FindRootBlockId(
bpTree_Block *block) {
214 assert(block->_blockType != INVALID_BLOCK);
216 while (block->_parent_block_id != INVALID_BLOCK_ID){
217 loadPointer(block, block->_parent_block_id);
220 return block->_block_id;
224 bool BP_TREE_T::FindValue(
const key_t &key, value_t &result)
const {
226 BP_TREE_LEAF_T* n = FindNode(key, p_Id);
228 if (n ==
nullptr)
throw DB_BPTREE_EMPTY;
230 db_size_t pos = n->leaf_biSearch(key);
232 result = n->_k_rowid_pair[pos].second;
234 if (pos < n->_size && n->_k_rowid_pair[pos].first == key){
235 _bfm->unpinPage(p_Id);
239 _bfm->unpinPage(p_Id);
245 bool BP_TREE_T::FindRange(
const key_t &lower_key,
const key_t &upper_key, std::vector<value_t> &result)
const {
246 assert(lower_key < upper_key);
249 BP_TREE_LEAF_T* lkey_leaf = FindNode(lower_key, lkey_pId);
252 BP_TREE_LEAF_T* rkey_leaf = FindNode(upper_key, rkey_pId);
254 if (rkey_leaf ==
nullptr || lkey_leaf ==
nullptr)
throw DB_BPTREE_EMPTY;
256 db_size_t l_pos = lkey_leaf->leaf_biSearch(lower_key);
258 db_size_t r_pos = rkey_leaf->leaf_biSearch(upper_key);
260 if (r_pos >= rkey_leaf->_size || rkey_leaf->_k_rowid_pair[r_pos].first != upper_key) {
261 if(r_pos != 0) --r_pos;
263 std::cout <<
"BP Tree Error! -- Contact CGF" << std::endl;
267 if (lkey_leaf->_block_id == rkey_leaf->_block_id){
268 for (db_size_t pos = l_pos; pos <= r_pos; ++pos){
269 result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
273 for (db_size_t pos = l_pos; pos < lkey_leaf->_size; ++pos){
274 result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
276 BP_TREE_LEAF_T* next_node;
278 while(lkey_leaf->_next_block_id != rkey_leaf->_block_id){
279 loadPointer(next_node, next_pId, lkey_leaf->_next_block_id);
280 _bfm->unpinPage(lkey_pId);
281 lkey_leaf = next_node;
284 for (db_size_t pos = 0; pos < lkey_leaf->_size; ++pos){
285 result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
289 _bfm->unpinPage(lkey_pId);
291 for (db_size_t pos = 0; pos <= r_pos; ++pos){
292 result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
294 _bfm->unpinPage(rkey_pId);
300 BP_TREE_LEAF_T* BP_TREE_T::FindNode(
const key_t &key, pageId_t& leaf_pageId)
const{
301 pageId_t temp_pageId;
302 BP_TREE_BLOCK_T* root;
303 if (_root_id == INVALID_BLOCK_ID){
306 loadPointer(root, temp_pageId, _root_id);
308 BP_TREE_INTERNAL_T* internal_ptr;
309 if (root->_blockType == INVALID_BLOCK){
312 else if(root->isLeaf()){
313 internal_ptr = (BP_TREE_INTERNAL_T*)root;
316 internal_ptr =
static_cast<BP_TREE_INTERNAL_T*
>(root);
317 while(!internal_ptr->isLeaf()){
319 db_size_t pos = internal_ptr->internal_biSearch(key);
320 blockId_t child_b_id = internal_ptr->_k_child_pair[pos].second;
321 loadPointer(internal_ptr, temp_pageId, child_b_id);
326 leaf_pageId = temp_pageId;
327 _bfm->pinPage(leaf_pageId);
329 return reinterpret_cast<BP_TREE_LEAF_T*
>(internal_ptr);
333 bool BP_TREE_T::Insert_in_Parent(
const key_t &key, BP_TREE_BLOCK_T* prev_leaf, BP_TREE_BLOCK_T* split){
334 if (prev_leaf->_block_id == _root_id){
335 pageId_t newRoot_pageId;
336 BP_TREE_INTERNAL_T* newRoot;
337 loadPointer(newRoot, newRoot_pageId, _file_block_count);
338 _bfm->modifyPage(newRoot_pageId);
340 _file_block_count += 1;
342 _root_id = _file_block_count - 1;
343 newRoot->init(_file_block_count - 1, INVALID_BLOCK_ID);
346 newRoot->_k_child_pair[0] = std::make_pair(trash, prev_leaf->_block_id);
347 newRoot->_k_child_pair[1] = std::make_pair(key, split->_block_id);
350 prev_leaf->_parent_block_id = newRoot->_block_id;
351 split->_parent_block_id = newRoot->_block_id;
357 BP_TREE_INTERNAL_T* parent;
358 pageId_t parent_pageId;
359 loadPointer(parent, parent_pageId, prev_leaf->_parent_block_id);
361 if(parent->_blockType != INTERNAL_BLOCK){
362 loadPointer(parent, parent_pageId, prev_leaf->_parent_block_id);
365 _bfm->pinPage(parent_pageId);
366 _bfm->modifyPage(parent_pageId);
369 db_size_t pos = parent->internal_biSearch(key);
371 db_size_t move_len = parent->_size - pos;
373 memmove(parent->_k_child_pair + pos + 1, parent->_k_child_pair + pos, move_len *
sizeof(parent->_k_child_pair[0]));
375 parent->_k_child_pair[pos] = std::make_pair(key, split->_block_id);
376 split->_parent_block_id = parent->_block_id;
377 prev_leaf->_parent_block_id = parent->_block_id;
379 if (parent->_size > parent->_max_size){
380 assert(parent->_size == parent->_max_size + 1);
382 BP_TREE_INTERNAL_T* split_parent;
383 pageId_t split_pageId;
385 loadPointer(split_parent, split_pageId, _file_block_count);
386 _bfm->pinPage(split_pageId);
387 _bfm->modifyPage(split_pageId);
389 _file_block_count += 1;
391 split_parent->init(_file_block_count - 1, parent->_parent_block_id);
394 db_size_t mid = (parent->_max_size + 1) / 2;
395 key_t right_smallest_key = parent->_k_child_pair[mid].first;
396 db_size_t move_len_split = (parent->_max_size + 1) - mid;
399 memcpy(split_parent->_k_child_pair, parent->_k_child_pair + mid, move_len_split *
sizeof(parent->_k_child_pair[0]));
400 split_parent->_size = move_len_split;
404 setChildrenParent(split_parent);
406 ret = Insert_in_Parent(right_smallest_key, parent, split_parent);
407 _bfm->unpinPage(split_pageId);
408 _bfm->unpinPage(parent_pageId);
412 _bfm->unpinPage(parent_pageId);
419 bool BP_TREE_T::Insert_in_Leaf(
const key_t &key,
const value_t &val, BP_TREE_LEAF_T* leaf){
420 assert(leaf->isLeaf());
423 db_size_t pos = leaf->leaf_biSearch(key);
427 if (pos < leaf->_size && leaf->_k_rowid_pair[pos].first == key)
return false;
430 memmove((
void*)(leaf->_k_rowid_pair + pos + 1), (
void*)(leaf->_k_rowid_pair + pos),
sizeof(leaf->_k_rowid_pair[0]) * (leaf->_size - pos));
431 leaf->_k_rowid_pair[pos] = std::make_pair(key, val);
438 bool BP_TREE_T::Insert(
const key_t &key,
const value_t &val){
439 if (_root_id == INVALID_BLOCK_ID){
441 pageId_t root_pageId;
442 BP_TREE_LEAF_T* root;
443 loadPointer(root, root_pageId, 0);
445 _bfm->pinPage(root_pageId);
446 _bfm->modifyPage(root_pageId);
447 root->init(0, INVALID_BLOCK_ID, INVALID_BLOCK_ID);
449 Insert_in_Leaf(key, val, root);
450 _bfm->unpinPage(root_pageId);
454 pageId_t leaf_pageId;
455 BP_TREE_LEAF_T* leaf = FindNode(key, leaf_pageId);
456 if (leaf ==
nullptr){
460 _bfm->modifyPage(leaf_pageId);
462 if (leaf->_size < leaf->_max_size){
463 Insert_in_Leaf(key, val, leaf);
464 _bfm->unpinPage(leaf_pageId);
467 assert(leaf->_size == leaf->_max_size);
470 BP_TREE_INTERNAL_T* p2;
472 if(leaf->_block_id != _root_id){
473 loadPointer(p, leaf->_parent_block_id);
474 assert(p->_blockType == INTERNAL_BLOCK);
476 loadPointer(p2, trash, leaf->_parent_block_id);
477 assert(p2->_blockType == INTERNAL_BLOCK);
480 pageId_t split_pageId;
481 BP_TREE_LEAF_T* split;
482 loadPointer(split, split_pageId, _file_block_count);
483 _file_block_count += 1;
484 _bfm->pinPage(split_pageId);
486 _bfm->modifyPage(split_pageId);
488 split->init(_file_block_count - 1, leaf->_parent_block_id, leaf->_next_block_id);
489 leaf->_next_block_id = split->_block_id;
492 Insert_in_Leaf(key, val, leaf);
496 db_size_t i = (leaf->_max_size + 1) / 2;
497 db_size_t copy_len = (leaf->_max_size + 1) - i;
499 memcpy(split->_k_rowid_pair, leaf->_k_rowid_pair + i,
sizeof(leaf->_k_rowid_pair[0]) * copy_len);
501 split->_size = copy_len;
503 Insert_in_Parent(split->_k_rowid_pair[0].first, leaf, split);
505 _bfm->unpinPage(split_pageId);
506 _bfm->unpinPage(leaf_pageId);
513 bool BP_TREE_T::Delete_in_Parent(BP_TREE_BLOCK_T* _parent, db_size_t pos_sep){
515 auto parent =
static_cast<BP_TREE_INTERNAL_T*
>(_parent);
519 memmove(parent->_k_child_pair + pos_sep, parent->_k_child_pair + pos_sep + 1,
520 (parent->_size - (pos_sep + 1)) *
sizeof(parent->_k_child_pair[0]));
523 if (parent->_block_id == _root_id){
524 if (parent->_size == 1){
525 _root_id = parent->_k_child_pair[0].second;
527 parent->_blockType = INVALID_BLOCK;
532 else if (parent->_size < (parent->_max_size + 1) / 2){
533 BP_TREE_INTERNAL_T* grandparent;
534 pageId_t grandparent_pageId;
536 BP_TREE_INTERNAL_T* parent_sibling;
537 pageId_t parentSib_pageId;
539 loadPointer(grandparent, grandparent_pageId, parent->_parent_block_id);
540 _bfm->pinPage(grandparent_pageId);
542 assert(grandparent->_blockType == INTERNAL_BLOCK);
544 key_t sep_key_in_grandparent;
545 db_size_t pos_sep_grand = grandparent->internal_biSearch(parent->_k_child_pair[0].first);
548 assert(grandparent->_k_child_pair[pos_sep_grand].second == parent->_block_id);
550 if (pos_sep_grand == grandparent->_size - 1){
551 loadPointer(parent_sibling, parentSib_pageId, grandparent->_k_child_pair[pos_sep_grand - 1].second);
552 is_predecessor =
false;
553 sep_key_in_grandparent = grandparent->_k_child_pair[pos_sep_grand].first;
555 assert(grandparent->_k_child_pair[pos_sep_grand].first == parent->_k_child_pair[0].first);
559 loadPointer(parent_sibling, parentSib_pageId, grandparent->_k_child_pair[pos_sep_grand].second);
560 is_predecessor =
true;
561 sep_key_in_grandparent = grandparent->_k_child_pair[pos_sep_grand].first;
563 assert(grandparent->_k_child_pair[pos_sep_grand].first == parent_sibling->_k_child_pair[0].first);
565 _bfm->pinPage(parentSib_pageId);
568 if (parent->_size + parent_sibling->_size < parent->_max_size){
569 if (is_predecessor) {
571 parent = parent_sibling;
572 parent_sibling = temp;
575 memcpy(parent_sibling->_k_child_pair + parent_sibling->_size, parent->_k_child_pair,
576 parent->_size *
sizeof(parent->_k_child_pair[0]));
577 parent_sibling->_size += parent->_size;
581 for(db_size_t i = parent_sibling->_size - parent->_size; i < parent_sibling->_size; ++i){
582 BP_TREE_BLOCK_T* child;
583 loadPointer(child, parent_sibling->_k_child_pair[i].second);
584 child->_parent_block_id = parent_sibling->_block_id;
586 _bfm->unpinPage(parentSib_pageId);
587 Delete_in_Parent(grandparent, pos_sep_grand);
589 parent->_blockType = INVALID_BLOCK;
595 parent->_k_child_pair[parent->_size] = parent_sibling->_k_child_pair[0];
597 parent_sibling->_size -= 1;
598 memmove(parent_sibling->_k_child_pair, parent_sibling->_k_child_pair + 1,
599 parent_sibling->_size *
sizeof(parent->_k_child_pair[0]));
602 BP_TREE_BLOCK_T* child;
603 loadPointer(child, parent->_k_child_pair[parent->_size - 1].second);
604 child->_parent_block_id = parent_sibling->_block_id;
606 grandparent->_k_child_pair[pos_sep_grand].first = parent_sibling->_k_child_pair[0].first;
609 memmove(parent->_k_child_pair + 1, parent->_k_child_pair,
610 parent->_size *
sizeof(parent->_k_child_pair[0]));
611 parent->_k_child_pair[0] = parent_sibling->_k_child_pair[parent_sibling->_size - 1];
612 parent_sibling->_size -= 1;
616 BP_TREE_BLOCK_T* child;
617 loadPointer(child, parent->_k_child_pair[0].second);
618 child->_parent_block_id = parent->_block_id;
620 grandparent->_k_child_pair[pos_sep_grand].first = parent->_k_child_pair[0].first;
622 _bfm->unpinPage(parentSib_pageId);
629 bool BP_TREE_T::Delete(
const key_t &key) {
630 pageId_t leaf_pageId;
631 BP_TREE_LEAF_T* leaf = FindNode(key, leaf_pageId);
632 if (leaf ==
nullptr){
633 throw DB_KEY_NOT_FOUND;
636 _bfm->modifyPage(leaf_pageId);
639 db_size_t pos = leaf->leaf_biSearch(key);
640 if(leaf->_k_rowid_pair[pos].first != key){
641 throw DB_KEY_NOT_FOUND;
645 memmove(leaf->_k_rowid_pair + pos, leaf->_k_rowid_pair + pos + 1,
646 sizeof(leaf->_k_rowid_pair[0]) * (leaf->_size - (pos + 1)));
649 if (leaf->_block_id == _root_id) {
650 if (leaf->_size == 0){
651 leaf->_blockType = INVALID_BLOCK;
652 _root_id = INVALID_BLOCK_ID;
657 else if (leaf->_size < (leaf->_max_size + 1) / 2){
659 assert(leaf->_size == (leaf->_max_size + 1) / 2 - 1);
661 BP_TREE_LEAF_T *sibling;
662 pageId_t sibling_pageId;
663 BP_TREE_INTERNAL_T *parent;
664 pageId_t parent_pageId;
666 loadPointer(parent, parent_pageId, leaf->_parent_block_id);
667 _bfm->pinPage(parent_pageId);
670 key_t sep_key_in_parent;
672 db_size_t pos_sep = parent->internal_biSearch(leaf->_k_rowid_pair[0].first);
673 assert(parent->_k_child_pair[pos_sep].second == leaf->_block_id);
675 if (pos_sep == parent->_size - 1){
676 loadPointer(sibling, sibling_pageId, parent->_k_child_pair[pos_sep - 1].second);
677 sep_key_in_parent = parent->_k_child_pair[pos_sep].first;
679 assert(parent->_k_child_pair[pos_sep].first == leaf->_k_rowid_pair[0].first);
680 is_predecessor =
false;
684 loadPointer(sibling, sibling_pageId, parent->_k_child_pair[pos_sep].second);
685 sep_key_in_parent = parent->_k_child_pair[pos_sep].first;
687 assert(parent->_k_child_pair[pos_sep].first == sibling->_k_rowid_pair[0].first);
688 is_predecessor =
true;
690 _bfm->pinPage(sibling_pageId);
693 if (sibling->_size + leaf->_size < sibling->_max_size){
694 _bfm->modifyPage(sibling_pageId);
695 _bfm->modifyPage(leaf_pageId);
696 _bfm->modifyPage(parent_pageId);
706 sibling->_next_block_id = leaf->_next_block_id;
708 memcpy(sibling->_k_rowid_pair + sibling->_size, leaf->_k_rowid_pair,
709 leaf->_size *
sizeof(leaf->_k_rowid_pair[0]));
710 sibling->_size += leaf->_size;
713 _bfm->unpinPage(sibling_pageId);
714 _bfm->unpinPage(leaf_pageId);
716 Delete_in_Parent(parent, pos_sep);
718 leaf->_blockType = INVALID_BLOCK;
723 leaf->_k_rowid_pair[leaf->_size] = sibling->_k_rowid_pair[0];
726 memmove(sibling->_k_rowid_pair, sibling->_k_rowid_pair + 1,
727 sibling->_size *
sizeof(sibling->_k_rowid_pair[0]));
729 parent->_k_child_pair[pos_sep].first = sibling->_k_rowid_pair[0].first;
732 memmove(leaf->_k_rowid_pair + 1, leaf->_k_rowid_pair,
733 leaf->_size *
sizeof(sibling->_k_rowid_pair[0]));
734 leaf->_k_rowid_pair[0] = sibling->_k_rowid_pair[sibling->_size - 1];
738 parent->_k_child_pair[pos_sep].first = leaf->_k_rowid_pair[0].first;
741 _bfm->unpinPage(sibling_pageId);
742 _bfm->unpinPage(leaf_pageId);
745 _bfm->unpinPage(parent_pageId);
758 bool BP_TREE_T::UpdateKey(
const key_t &former_key,
const key_t &new_key) {
760 BP_TREE_LEAF_T* n = FindNode(former_key, key_pageId);
761 db_size_t pos = n->leaf_biSearch(former_key);
762 if (n->_k_rowid_pair[pos].first != former_key)
throw DB_KEY_NOT_FOUND;
763 value_t val = n->_k_rowid_pair[pos].second;
764 _bfm->unpinPage(key_pageId);
768 success_flg = Delete(former_key);
770 success_flg = Insert(new_key, val);
776 bool BP_TREE_T::UpdateValue(
const key_t &key,
const value_t &new_val) {
778 BP_TREE_LEAF_T* n = FindNode(key, key_pageId);
779 db_size_t pos = n->leaf_biSearch(key);
780 if (n->_k_rowid_pair[pos].first != key)
throw DB_KEY_NOT_FOUND;
781 n->_k_rowid_pair[pos].second = new_val;
782 _bfm->unpinPage(key_pageId);