tinySQL  0.1
A self-contained database management system
bpTree_disk.h
1 #ifndef BPTREE_DISK_H
2 #define BPTREE_DISK_H
3 
4 #include <vector>
5 #include <iostream>
6 #include <cassert>
7 #include <cstring>
8 
9 #include "index/bpTree_block.h"
10 #include "buffer/buffer_manager.h"
11 #include "share/err_type.h"
12 
13 
14 #define BP_TREE_T Bp_tree<key_t, value_t>
15 #define BP_TREE_BLOCK_T bpTree_Block
16 #define BP_TREE_LEAF_T bpTree_Leaf<key_t, value_t>
17 #define BP_TREE_INTERNAL_T bpTree_Internal<key_t, blockId_t>
18 
19 // TODO : Check if every pin is eliminated after use.
20 
25 KEY_VALUE_T_DECLARE
26 class Bp_tree{
27 public:
28  Bp_tree(BufferManager* buf_manager):_bfm(buf_manager){};
29 
35  void InitRoot(std::string indexFileName);
36 
37  const std::string& getName() const {
38  return _index_fname;
39  }
40 
49  bool Insert(const key_t &key, const value_t &val);
50 
60  bool Delete(const key_t &key);
61 
68  bool Delete(const key_t &key, value_t &deleted);
69 
78  bool FindValue(const key_t &key, value_t &result) const;
79 
89  bool FindRange(const key_t& lower_key, const key_t& upper_key, std::vector<value_t>& result) const;
90 
97  bool UpdateKey(const key_t &former_key, const key_t &new_key);
98 
105  bool UpdateValue(const key_t &key, const value_t &new_val);
106 
107 private:
108  blockId_t _root_id = INVALID_BLOCK_ID;
109  std::string _index_fname;
110  db_size_t _file_block_count;
111 // BP_TREE_BLOCK_T* header_ptr;
112 // pageId_t header_pageId; ///< The header page id in the buffer pool. The page is pinned.
113 
114  BufferManager* _bfm;
115 
116  blockId_t FindRootBlockId(BP_TREE_BLOCK_T* block);
117 
126  BP_TREE_LEAF_T* FindNode(const key_t &key, pageId_t &leaf_pageId) const;
127 
137  bool Insert_in_Leaf(const key_t &key, const value_t &val, BP_TREE_LEAF_T* leaf);
138 
147  bool Insert_in_Parent(const key_t &key, BP_TREE_BLOCK_T* prev_leaf, BP_TREE_BLOCK_T* split);
148 
157  bool Delete_in_Parent(BP_TREE_BLOCK_T* parent, db_size_t pos_sep);
158 
159  void loadPointer(BP_TREE_LEAF_T*& leaf, pageId_t& leaf_pageId, blockId_t b_id) const{
160  char* raw = _bfm->getPage(_index_fname, b_id, leaf_pageId);
161  leaf = reinterpret_cast<BP_TREE_LEAF_T*>(raw);
162  }
163 
164  void loadPointer(BP_TREE_INTERNAL_T*& internal, pageId_t& internal_pageId, blockId_t b_id) const{
165  char* raw = _bfm->getPage(_index_fname, b_id, internal_pageId);
166  internal = reinterpret_cast<BP_TREE_INTERNAL_T*>(raw);
167  }
168 
169  void loadPointer(BP_TREE_BLOCK_T*& block, blockId_t b_id) const{
170  char* raw = _bfm->getPage(_index_fname, b_id);
171  block = reinterpret_cast<BP_TREE_BLOCK_T*>(raw);
172  }
173 
174  void loadPointer(BP_TREE_BLOCK_T*& block, pageId_t& pageId, blockId_t b_id) const {
175  char* raw = _bfm->getPage(_index_fname, b_id, pageId);
176  block = reinterpret_cast<BP_TREE_BLOCK_T*>(raw);
177  }
178 
179  void setChildrenParent(BP_TREE_INTERNAL_T* internal){
180  for(db_size_t i = 0; i < internal->_size; ++i){
181  BP_TREE_BLOCK_T* child;
182  loadPointer(child, internal->_k_child_pair[i].second);
183  child->_parent_block_id = internal->_block_id;
184  }
185  }
186 
187  std::pair<key_t, value_t>& getKeyRowidPair(const key_t &key);
188 };
189 
190 KEY_VALUE_T_DECLARE
191 void BP_TREE_T::InitRoot(std::string indexFileName) {
192  _index_fname = indexFileName;
193 
194  pageId_t headPageId;
195  BP_TREE_BLOCK_T* headBlock;
196  loadPointer(headBlock, headPageId, 0); // May throw here
197  _bfm->pinPage(headPageId);
198 
199  // Set _root_id to avoid expensive operations later;
200  // and set the initial total block count of the file
201  if (headBlock->_blockType == INVALID_BLOCK){ // Happens when no content except the header is in the file
202  _root_id = INVALID_BLOCK_ID;
203  }
204  else{
205  _root_id = FindRootBlockId(headBlock);
206  }
207  // Upper bound of the integer: fileSize / PAGESIZE
208  _file_block_count = (_bfm->getFileSize(indexFileName) + PAGESIZE - 1) / PAGESIZE;
209  _bfm->unpinPage(headPageId);
210 }
211 
212 KEY_VALUE_T_DECLARE
213 blockId_t BP_TREE_T::FindRootBlockId(bpTree_Block *block) {
214  assert(block->_blockType != INVALID_BLOCK);
215 
216  while (block->_parent_block_id != INVALID_BLOCK_ID){
217  loadPointer(block, block->_parent_block_id);
218  }
219 
220  return block->_block_id;
221 }
222 
223 KEY_VALUE_T_DECLARE
224 bool BP_TREE_T::FindValue(const key_t &key, value_t &result) const {
225  pageId_t p_Id;
226  BP_TREE_LEAF_T* n = FindNode(key, p_Id);
227 
228  if (n == nullptr) throw DB_BPTREE_EMPTY;
229 
230  db_size_t pos = n->leaf_biSearch(key);
231  if (pos < n->_size){
232  result = n->_k_rowid_pair[pos].second;
233  }
234  if (pos < n->_size && n->_k_rowid_pair[pos].first == key){
235  _bfm->unpinPage(p_Id);
236  return true;
237  }
238  else {
239  _bfm->unpinPage(p_Id);
240  return false;
241  }
242 }
243 
244 KEY_VALUE_T_DECLARE
245 bool BP_TREE_T::FindRange(const key_t &lower_key, const key_t &upper_key, std::vector<value_t> &result) const {
246  assert(lower_key < upper_key);
247 
248  pageId_t lkey_pId;
249  BP_TREE_LEAF_T* lkey_leaf = FindNode(lower_key, lkey_pId);
250 
251  pageId_t rkey_pId;
252  BP_TREE_LEAF_T* rkey_leaf = FindNode(upper_key, rkey_pId);
253 
254  if (rkey_leaf == nullptr || lkey_leaf == nullptr) throw DB_BPTREE_EMPTY;
255 
256  db_size_t l_pos = lkey_leaf->leaf_biSearch(lower_key);
257 // if (lkey_leaf->_k_rowid_pair[l_pos].first != lower_key) return false;
258  db_size_t r_pos = rkey_leaf->leaf_biSearch(upper_key);
259 
260  if (r_pos >= rkey_leaf->_size || rkey_leaf->_k_rowid_pair[r_pos].first != upper_key) {
261  if(r_pos != 0) --r_pos;
262  else{
263  std::cout << "BP Tree Error! -- Contact CGF" << std::endl;
264  }
265  }
266 
267  if (lkey_leaf->_block_id == rkey_leaf->_block_id){
268  for (db_size_t pos = l_pos; pos <= r_pos; ++pos){
269  result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
270  }
271  }
272  else{
273  for (db_size_t pos = l_pos; pos < lkey_leaf->_size; ++pos){
274  result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
275  }
276  BP_TREE_LEAF_T* next_node;
277  pageId_t next_pId;
278  while(lkey_leaf->_next_block_id != rkey_leaf->_block_id){
279  loadPointer(next_node, next_pId, lkey_leaf->_next_block_id);
280  _bfm->unpinPage(lkey_pId);
281  lkey_leaf = next_node;
282  lkey_pId = next_pId;
283 
284  for (db_size_t pos = 0; pos < lkey_leaf->_size; ++pos){
285  result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
286  }
287  }
288 
289  _bfm->unpinPage(lkey_pId);
290 
291  for (db_size_t pos = 0; pos <= r_pos; ++pos){
292  result.push_back(lkey_leaf->_k_rowid_pair[pos].second);
293  }
294  _bfm->unpinPage(rkey_pId);
295  }
296  return true;
297 }
298 
299 KEY_VALUE_T_DECLARE
300 BP_TREE_LEAF_T* BP_TREE_T::FindNode(const key_t &key, pageId_t& leaf_pageId) const{
301  pageId_t temp_pageId;
302  BP_TREE_BLOCK_T* root;
303  if (_root_id == INVALID_BLOCK_ID){
304  return nullptr;
305  }
306  loadPointer(root, temp_pageId, _root_id);
307 
308  BP_TREE_INTERNAL_T* internal_ptr;
309  if (root->_blockType == INVALID_BLOCK){
310  return nullptr;
311  }
312  else if(root->isLeaf()){
313  internal_ptr = (BP_TREE_INTERNAL_T*)root; // Simply init. Make no sense.
314  }
315  else{
316  internal_ptr = static_cast<BP_TREE_INTERNAL_T*>(root);
317  while(!internal_ptr->isLeaf()){
318  //The greatest key pos that is smaller or equal to the key.
319  db_size_t pos = internal_ptr->internal_biSearch(key);
320  blockId_t child_b_id = internal_ptr->_k_child_pair[pos].second;
321  loadPointer(internal_ptr, temp_pageId, child_b_id);
322  }
323  }
324 
325  // Make sure the page that internal_ptr pointing at is pinned!!!
326  leaf_pageId = temp_pageId;
327  _bfm->pinPage(leaf_pageId);
328  // internal_ptr is actually leaf pointer here.
329  return reinterpret_cast<BP_TREE_LEAF_T*>(internal_ptr);
330 }
331 
332 KEY_VALUE_T_DECLARE
333 bool BP_TREE_T::Insert_in_Parent(const key_t &key, BP_TREE_BLOCK_T* prev_leaf, BP_TREE_BLOCK_T* split){
334  if (prev_leaf->_block_id == _root_id){
335  pageId_t newRoot_pageId;
336  BP_TREE_INTERNAL_T* newRoot;
337  loadPointer(newRoot, newRoot_pageId, _file_block_count);
338  _bfm->modifyPage(newRoot_pageId);
339  // TODO : Add pin page and not pin page for concurrency. Assume the page is not likely to be changed here.
340  _file_block_count += 1;
341 
342  _root_id = _file_block_count - 1;
343  newRoot->init(_file_block_count - 1, INVALID_BLOCK_ID);
344  newRoot->_size = 2;
345  key_t trash;
346  newRoot->_k_child_pair[0] = std::make_pair(trash, prev_leaf->_block_id);
347  newRoot->_k_child_pair[1] = std::make_pair(key, split->_block_id);
348 
349  // CAUTION : Remember to reset the _parent_block_id
350  prev_leaf->_parent_block_id = newRoot->_block_id;
351  split->_parent_block_id = newRoot->_block_id;
352  return true;
353  }
354  else{
355  bool ret;
356 
357  BP_TREE_INTERNAL_T* parent;
358  pageId_t parent_pageId;
359  loadPointer(parent, parent_pageId, prev_leaf->_parent_block_id);
360 
361  if(parent->_blockType != INTERNAL_BLOCK){
362  loadPointer(parent, parent_pageId, prev_leaf->_parent_block_id);
363  }
364 
365  _bfm->pinPage(parent_pageId);
366  _bfm->modifyPage(parent_pageId);
367 
368  // Directly insert the current key and pointer temporarily
369  db_size_t pos = parent->internal_biSearch(key); // This position should exactly be the separator of prev_leaf and its sibling
370  pos += 1; // The correct starting point to move.
371  db_size_t move_len = parent->_size - pos;
372 
373  memmove(parent->_k_child_pair + pos + 1, parent->_k_child_pair + pos, move_len * sizeof(parent->_k_child_pair[0]));
374  parent->_size += 1;
375  parent->_k_child_pair[pos] = std::make_pair(key, split->_block_id);
376  split->_parent_block_id = parent->_block_id;
377  prev_leaf->_parent_block_id = parent->_block_id;
378 
379  if (parent->_size > parent->_max_size){ // Not enough space. Split parent.
380  assert(parent->_size == parent->_max_size + 1);
381 
382  BP_TREE_INTERNAL_T* split_parent;
383  pageId_t split_pageId;
384 
385  loadPointer(split_parent, split_pageId, _file_block_count); // Assign a new block the node
386  _bfm->pinPage(split_pageId);
387  _bfm->modifyPage(split_pageId);
388 
389  _file_block_count += 1;
390  // CAUTION : remember to init the newly assigned block.
391  split_parent->init(_file_block_count - 1, parent->_parent_block_id);
392 
393  // Move keys and pointers to split.
394  db_size_t mid = (parent->_max_size + 1) / 2;
395  key_t right_smallest_key = parent->_k_child_pair[mid].first;
396  db_size_t move_len_split = (parent->_max_size + 1) - mid;
397 
398  // Because the first key is not used, we in fact abandoned the first key in split node.
399  memcpy(split_parent->_k_child_pair, parent->_k_child_pair + mid, move_len_split * sizeof(parent->_k_child_pair[0]));
400  split_parent->_size = move_len_split;
401  parent->_size = mid;
402 
403  // CAUTION: Always remember to reset its children's parent
404  setChildrenParent(split_parent);
405 
406  ret = Insert_in_Parent(right_smallest_key, parent, split_parent);
407  _bfm->unpinPage(split_pageId);
408  _bfm->unpinPage(parent_pageId);
409  return ret;
410  }
411  else{
412  _bfm->unpinPage(parent_pageId);
413  return true;
414  }
415  }
416 }
417 
418 KEY_VALUE_T_DECLARE
419 bool BP_TREE_T::Insert_in_Leaf(const key_t &key, const value_t &val, BP_TREE_LEAF_T* leaf){
420  assert(leaf->isLeaf());
421 // assert(leaf->_size < leaf->_max_size);
422 
423  db_size_t pos = leaf->leaf_biSearch(key);
424 
425  // TODO : Change this to throw
426  // Only allow is_unique key
427  if (pos < leaf->_size /*&& leaf->_size > 0*/ && leaf->_k_rowid_pair[pos].first == key) return false;
428 
429  // Insert the key-val pair. The space should be pre-allocated at the initialization of node pages.
430  memmove((void*)(leaf->_k_rowid_pair + pos + 1), (void*)(leaf->_k_rowid_pair + pos), sizeof(leaf->_k_rowid_pair[0]) * (leaf->_size - pos));
431  leaf->_k_rowid_pair[pos] = std::make_pair(key, val);
432  leaf->_size += 1;
433 
434  return true;
435 }
436 
437 KEY_VALUE_T_DECLARE
438 bool BP_TREE_T::Insert(const key_t &key, const value_t &val){
439  if (_root_id == INVALID_BLOCK_ID){ // Create a new root at block 0 of B+ tree file.
440  _root_id = 0;
441  pageId_t root_pageId;
442  BP_TREE_LEAF_T* root;
443  loadPointer(root, root_pageId, 0);
444 
445  _bfm->pinPage(root_pageId);
446  _bfm->modifyPage(root_pageId);
447  root->init(0, INVALID_BLOCK_ID, INVALID_BLOCK_ID);
448 
449  Insert_in_Leaf(key, val, root);
450  _bfm->unpinPage(root_pageId);
451  return true;
452  }
453  else{
454  pageId_t leaf_pageId;
455  BP_TREE_LEAF_T* leaf = FindNode(key, leaf_pageId); // The page is already pinned in the function.
456  if (leaf == nullptr){
457  return false;
458  }
459 
460  _bfm->modifyPage(leaf_pageId);
461 
462  if (leaf->_size < leaf->_max_size){ // Still have space
463  Insert_in_Leaf(key, val, leaf);
464  _bfm->unpinPage(leaf_pageId);
465  }
466  else{
467  assert(leaf->_size == leaf->_max_size);
468 
469  BP_TREE_BLOCK_T* p;
470  BP_TREE_INTERNAL_T* p2;
471  pageId_t trash;
472  if(leaf->_block_id != _root_id){
473  loadPointer(p, leaf->_parent_block_id);
474  assert(p->_blockType == INTERNAL_BLOCK);
475 
476  loadPointer(p2, trash, leaf->_parent_block_id);
477  assert(p2->_blockType == INTERNAL_BLOCK);
478  }
479 
480  pageId_t split_pageId;
481  BP_TREE_LEAF_T* split;
482  loadPointer(split, split_pageId, _file_block_count);
483  _file_block_count += 1;
484  _bfm->pinPage(split_pageId);
485 
486  _bfm->modifyPage(split_pageId);
487  // Set the block_id, root_id, sibling, parent
488  split->init(_file_block_count - 1, leaf->_parent_block_id, leaf->_next_block_id);
489  leaf->_next_block_id = split->_block_id;
490 
491  // Insert in leaf first
492  Insert_in_Leaf(key, val, leaf);
493 
495  // The position right after the (max_size + 1)/2 th element. In this way, both split nodes contains more than max_size/2 elements
496  db_size_t i = (leaf->_max_size + 1) / 2;
497  db_size_t copy_len = (leaf->_max_size + 1) - i;
498 
499  memcpy(split->_k_rowid_pair, leaf->_k_rowid_pair + i, sizeof(leaf->_k_rowid_pair[0]) * copy_len);
500  leaf->_size = i;
501  split->_size = copy_len;
502 
503  Insert_in_Parent(split->_k_rowid_pair[0].first, leaf, split);
504 
505  _bfm->unpinPage(split_pageId);
506  _bfm->unpinPage(leaf_pageId);
507  }
508  return true;
509  }
510 }
511 
512 KEY_VALUE_T_DECLARE
513 bool BP_TREE_T::Delete_in_Parent(BP_TREE_BLOCK_T* _parent, db_size_t pos_sep){
514  // Caller has set the modifyPage flag for these pointers!
515  auto parent = static_cast<BP_TREE_INTERNAL_T*>(_parent);
516 
517  // Delete the pointer to the child from its parent, and its "separation key"
518  // Caller need to make sure that the abandoned child is the latter one in merging
519  memmove(parent->_k_child_pair + pos_sep, parent->_k_child_pair + pos_sep + 1,
520  (parent->_size - (pos_sep + 1)) * sizeof(parent->_k_child_pair[0]));
521  parent->_size -= 1;
522 
523  if (parent->_block_id == _root_id){
524  if (parent->_size == 1){
525  _root_id = parent->_k_child_pair[0].second;
526  // TODO : Check the lazy delete (reorganize file)
527  parent->_blockType = INVALID_BLOCK;
528 // delete parent;
529  }
530  return true;
531  }
532  else if (parent->_size < (parent->_max_size + 1) / 2){ // (int)(degree + 1)/2 is equivalent to degree/2 's upper integer
533  BP_TREE_INTERNAL_T* grandparent;
534  pageId_t grandparent_pageId;
535 
536  BP_TREE_INTERNAL_T* parent_sibling;
537  pageId_t parentSib_pageId;
538 
539  loadPointer(grandparent, grandparent_pageId, parent->_parent_block_id);
540  _bfm->pinPage(grandparent_pageId);
541 
542  assert(grandparent->_blockType == INTERNAL_BLOCK); // Avoid invalid_block debug
543 
544  key_t sep_key_in_grandparent;
545  db_size_t pos_sep_grand = grandparent->internal_biSearch(parent->_k_child_pair[0].first);
546  bool is_predecessor;
547 
548  assert(grandparent->_k_child_pair[pos_sep_grand].second == parent->_block_id);
549 
550  if (pos_sep_grand == grandparent->_size - 1){ // The last child
551  loadPointer(parent_sibling, parentSib_pageId, grandparent->_k_child_pair[pos_sep_grand - 1].second);
552  is_predecessor = false;
553  sep_key_in_grandparent = grandparent->_k_child_pair[pos_sep_grand].first;
554 
555  assert(grandparent->_k_child_pair[pos_sep_grand].first == parent->_k_child_pair[0].first);
556  }
557  else{
558  pos_sep_grand += 1;
559  loadPointer(parent_sibling, parentSib_pageId, grandparent->_k_child_pair[pos_sep_grand].second);
560  is_predecessor = true;
561  sep_key_in_grandparent = grandparent->_k_child_pair[pos_sep_grand].first;
562 
563  assert(grandparent->_k_child_pair[pos_sep_grand].first == parent_sibling->_k_child_pair[0].first);
564  }
565  _bfm->pinPage(parentSib_pageId);
566 
567  // At most n - 1 keys in non-leaves
568  if (parent->_size + parent_sibling->_size < parent->_max_size){ // Merge leaf and sibling
569  if (is_predecessor) { // Parent is the predecessor
570  auto temp = parent;
571  parent = parent_sibling;
572  parent_sibling = temp;
573  }
574  // Move the content in parent to sibling, and
575  memcpy(parent_sibling->_k_child_pair + parent_sibling->_size, parent->_k_child_pair,
576  parent->_size * sizeof(parent->_k_child_pair[0]));
577  parent_sibling->_size += parent->_size;
578  parent->_size = 0;
579 
580  // set the child->parent pointer
581  for(db_size_t i = parent_sibling->_size - parent->_size; i < parent_sibling->_size; ++i){
582  BP_TREE_BLOCK_T* child;
583  loadPointer(child, parent_sibling->_k_child_pair[i].second);
584  child->_parent_block_id = parent_sibling->_block_id;
585  }
586  _bfm->unpinPage(parentSib_pageId);
587  Delete_in_Parent(grandparent, pos_sep_grand);
588  // Lazy delete
589  parent->_blockType = INVALID_BLOCK;
590 // delete parent;
591  return true;
592  }
593  else{ // Redistribute the keys and pointers
594  if (is_predecessor){
595  parent->_k_child_pair[parent->_size] = parent_sibling->_k_child_pair[0];
596  parent->_size += 1;
597  parent_sibling->_size -= 1;
598  memmove(parent_sibling->_k_child_pair, parent_sibling->_k_child_pair + 1,
599  parent_sibling->_size * sizeof(parent->_k_child_pair[0]));
600 
601  // Set the moved child's parent
602  BP_TREE_BLOCK_T* child;
603  loadPointer(child, parent->_k_child_pair[parent->_size - 1].second);
604  child->_parent_block_id = parent_sibling->_block_id;
605 
606  grandparent->_k_child_pair[pos_sep_grand].first = parent_sibling->_k_child_pair[0].first;
607  }
608  else{
609  memmove(parent->_k_child_pair + 1, parent->_k_child_pair,
610  parent->_size * sizeof(parent->_k_child_pair[0]));
611  parent->_k_child_pair[0] = parent_sibling->_k_child_pair[parent_sibling->_size - 1];
612  parent_sibling->_size -= 1;
613  parent->_size += 1;
614 
615  // Set the moved child's parent
616  BP_TREE_BLOCK_T* child;
617  loadPointer(child, parent->_k_child_pair[0].second);
618  child->_parent_block_id = parent->_block_id;
619 
620  grandparent->_k_child_pair[pos_sep_grand].first = parent->_k_child_pair[0].first;
621  }
622  _bfm->unpinPage(parentSib_pageId);
623  return true;
624  }
625  }
626 }
627 
628 KEY_VALUE_T_DECLARE
629 bool BP_TREE_T::Delete(const key_t &key) {
630  pageId_t leaf_pageId;
631  BP_TREE_LEAF_T* leaf = FindNode(key, leaf_pageId); // The page should be already pinned
632  if (leaf == nullptr){ // Usually happens when tree is empty
633  throw DB_KEY_NOT_FOUND;
634  }
635 
636  _bfm->modifyPage(leaf_pageId);
637 
638  // Delete the key and value from leaf
639  db_size_t pos = leaf->leaf_biSearch(key);
640  if(leaf->_k_rowid_pair[pos].first != key){ // Delete must match
641  throw DB_KEY_NOT_FOUND;
642  }
643 
644  // Remove the key and value
645  memmove(leaf->_k_rowid_pair + pos, leaf->_k_rowid_pair + pos + 1,
646  sizeof(leaf->_k_rowid_pair[0]) * (leaf->_size - (pos + 1)));
647  leaf->_size -= 1;
648 
649  if (leaf->_block_id == _root_id) {
650  if (leaf->_size == 0){ // Empty tree
651  leaf->_blockType = INVALID_BLOCK;
652  _root_id = INVALID_BLOCK_ID;
653  }
654  return true;
655  }
656  // Violate capacity constraint for leaf and non-root node
657  else if (leaf->_size < (leaf->_max_size + 1) / 2){ // The upper bound of _max_size / 2
658  // Make sure of the safety.
659  assert(leaf->_size == (leaf->_max_size + 1) / 2 - 1);
660 
661  BP_TREE_LEAF_T *sibling;
662  pageId_t sibling_pageId;
663  BP_TREE_INTERNAL_T *parent;
664  pageId_t parent_pageId;
665 
666  loadPointer(parent, parent_pageId, leaf->_parent_block_id);
667  _bfm->pinPage(parent_pageId);
668  // We have to know whether to choose the sibling forward or backward.
669  // I choose the sibling backward, unless leaf is the tail child of its parent
670  key_t sep_key_in_parent;
671  bool is_predecessor;
672  db_size_t pos_sep = parent->internal_biSearch(leaf->_k_rowid_pair[0].first);
673  assert(parent->_k_child_pair[pos_sep].second == leaf->_block_id);
674 
675  if (pos_sep == parent->_size - 1){ // The tail child.
676  loadPointer(sibling, sibling_pageId, parent->_k_child_pair[pos_sep - 1].second);
677  sep_key_in_parent = parent->_k_child_pair[pos_sep].first;
678  // For safety and debug purpose.
679  assert(parent->_k_child_pair[pos_sep].first == leaf->_k_rowid_pair[0].first);
680  is_predecessor = false;
681  }
682  else{
683  pos_sep += 1;
684  loadPointer(sibling, sibling_pageId, parent->_k_child_pair[pos_sep].second);
685  sep_key_in_parent = parent->_k_child_pair[pos_sep].first;
686 
687  assert(parent->_k_child_pair[pos_sep].first == sibling->_k_rowid_pair[0].first);
688  is_predecessor = true;
689  }
690  _bfm->pinPage(sibling_pageId);
691 
692  // At most n - 1 keys in leaves.
693  if (sibling->_size + leaf->_size < sibling->_max_size){ // Merge leaf and sibling
694  _bfm->modifyPage(sibling_pageId);
695  _bfm->modifyPage(leaf_pageId);
696  _bfm->modifyPage(parent_pageId);
697  // Make sure leaf is the latter one
698  if (is_predecessor){
699  auto temp1 = leaf;
700  leaf = sibling;
701  sibling = temp1;
702  }
703 
704  // Move the content in leaf to sibling
705  // 1. move the sibling pointer to the next node
706  sibling->_next_block_id = leaf->_next_block_id;
707  // 2. move the _k_rowid_pair
708  memcpy(sibling->_k_rowid_pair + sibling->_size, leaf->_k_rowid_pair,
709  leaf->_size * sizeof(leaf->_k_rowid_pair[0]));
710  sibling->_size += leaf->_size;
711  leaf->_size = 0;
712 
713  _bfm->unpinPage(sibling_pageId);
714  _bfm->unpinPage(leaf_pageId);
715 
716  Delete_in_Parent(parent, pos_sep);
717  // Lazy delete here. Forget about leaf block_id.
718  leaf->_blockType = INVALID_BLOCK;
719 // delete leaf;
720  }
721  else{ // Redistribution between two leaves
722  if (is_predecessor){ // leaf is the predecessor of sibling
723  leaf->_k_rowid_pair[leaf->_size] = sibling->_k_rowid_pair[0];
724  leaf->_size += 1;
725  sibling->_size -= 1;
726  memmove(sibling->_k_rowid_pair, sibling->_k_rowid_pair + 1,
727  sibling->_size * sizeof(sibling->_k_rowid_pair[0]));
728  // The separation key
729  parent->_k_child_pair[pos_sep].first = sibling->_k_rowid_pair[0].first;
730  }
731  else{ // leaf is the successor of sibling
732  memmove(leaf->_k_rowid_pair + 1, leaf->_k_rowid_pair,
733  leaf->_size * sizeof(sibling->_k_rowid_pair[0]));
734  leaf->_k_rowid_pair[0] = sibling->_k_rowid_pair[sibling->_size - 1];
735  leaf->_size += 1;
736  sibling->_size -= 1;
737 
738  parent->_k_child_pair[pos_sep].first = leaf->_k_rowid_pair[0].first;
739  }
740 
741  _bfm->unpinPage(sibling_pageId);
742  _bfm->unpinPage(leaf_pageId);
743  }
744  // TODO : Check if it is necessary to optimize the pin and unpin
745  _bfm->unpinPage(parent_pageId);
746 
747  return true;
748  }
749 }
750 
751 //KEY_VALUE_T_DECLARE
752 //std::pair<key_t, value_t>& BP_TREE_T::getKeyRowidPair(const key_t &key) {
753 //
754 // FindNode(key, )
755 //}
756 
757 KEY_VALUE_T_DECLARE
758 bool BP_TREE_T::UpdateKey(const key_t &former_key, const key_t &new_key) {
759  pageId_t key_pageId;
760  BP_TREE_LEAF_T* n = FindNode(former_key, key_pageId);
761  db_size_t pos = n->leaf_biSearch(former_key);
762  if (n->_k_rowid_pair[pos].first != former_key) throw DB_KEY_NOT_FOUND;
763  value_t val = n->_k_rowid_pair[pos].second;
764  _bfm->unpinPage(key_pageId);
765 
766  bool success_flg;
767  // TODO : Make it more efficient. Redundant search
768  success_flg = Delete(former_key);
769  if (success_flg){
770  success_flg = Insert(new_key, val);
771  }
772  return success_flg;
773 }
774 
775 KEY_VALUE_T_DECLARE
776 bool BP_TREE_T::UpdateValue(const key_t &key, const value_t &new_val) {
777  pageId_t key_pageId;
778  BP_TREE_LEAF_T* n = FindNode(key, key_pageId);
779  db_size_t pos = n->leaf_biSearch(key);
780  if (n->_k_rowid_pair[pos].first != key) throw DB_KEY_NOT_FOUND;
781  n->_k_rowid_pair[pos].second = new_val;
782  _bfm->unpinPage(key_pageId);
783  return true;
784 }
785 
786 //KEY_VALUE_T_DECLARE
787 //bool BP_TREE_T::FindRange(key_t lower_key, key_t upper_key, std::vector<value_t>& result) {
788 // const BP_NODE_T* lower_node = FindNode(lower_key);
789 // const BP_NODE_T* upper_node = FindNode(upper_key);
790 //
791 // db_size_t start_id = lower_node->FindPos_at_Node(lower_key);
792 // db_size_t end_id = upper_node->FindPos_at_Node(upper_key);
793 //
794 // if (start_id == -1 || end_id == -1){
795 // return false;
796 // }
797 // else{
798 // if (lower_node == upper_node){
799 // for (db_size_t i = start_id; i <= end_id; ++i){
800 // result.push_back(lower_node->value_field.at(i));
801 // }
802 // }
803 // else{
804 // for (db_size_t i = start_id; i < lower_node->value_field.size(); ++i){
805 // result.push_back(lower_node->value_field.at(i));
806 // }
807 // const BP_NODE_T* next = lower_node->ptr_field.front();
808 // while(next != upper_node){
809 // for (auto value : next->value_field){
810 // result.push_back(value);
811 // }
812 // next = next->ptr_field.front();
813 // }
814 // for (db_size_t i = 0; i <= end_id; ++i) {
815 // result.push_back(upper_node->value_field.at(i));
816 // }
817 // }
818 // return true;
819 // }
820 //}
821 
822 #endif
Bp_tree::Delete
bool Delete(const key_t &key)
Basic deletion from the tree.
Bp_tree::Insert
bool Insert(const key_t &key, const value_t &val)
Basic insertion to the tree.
Bp_tree::InitRoot
void InitRoot(std::string indexFileName)
Bp_tree::FindValue
bool FindValue(const key_t &key, value_t &result) const
Find the values by key (normally, we may say "pointers" for "values")
BufferManager
Buffer manager is an abstraction of memory on computer for modules at higher level.
Definition: buffer_manager.h:69
Bp_tree::UpdateValue
bool UpdateValue(const key_t &key, const value_t &new_val)
Update a certain value.
Bp_tree
The B-plus-tree storage details on the disk.
Definition: bpTree_disk.h:26
BufferManager::getPage
char * getPage(const std::string &file_name, int block_id)
获取一页
Definition: buffer_manager.cpp:130
bpTree_Block
The storage detail of the header of each page in index files.
Definition: bpTree_block.h:39
Bp_tree::FindRange
bool FindRange(const key_t &lower_key, const key_t &upper_key, std::vector< value_t > &result) const
Find the value(pointer) based on the given lower and upper key.
Bp_tree::UpdateKey
bool UpdateKey(const key_t &former_key, const key_t &new_key)
Update a certain key.