Move from dataset_dev branch to here

This commit is contained in:
Jesse Lee 2020-04-28 17:11:34 -04:00
parent 2bc3fcb1c1
commit 3c643e7298
5 changed files with 480 additions and 160 deletions

View File

@ -18,6 +18,7 @@
#include <atomic>
#include <memory>
#include <utility>
#include <vector>
#include "dataset/util/btree.h"
@ -25,19 +26,20 @@
namespace mindspore {
namespace dataset {
// This is a B+ tree with generated uint64_t value as key.
// Use minKey() function to query the min key.
// Use maxKey() function to query the max key.
// @tparam T
template <typename T>
class AutoIndexObj : public BPlusTree<uint64_t, T> {
/// This is a B+ tree with generated int64_t value as key.
/// Use minKey() function to query the min key.
/// Use maxKey() function to query the max key.
/// @tparam T
template <typename T, typename A = std::allocator<T>>
class AutoIndexObj : public BPlusTree<int64_t, T, A> {
public:
using my_tree = BPlusTree<uint64_t, T>;
using my_tree = BPlusTree<int64_t, T, A>;
using key_type = typename my_tree::key_type;
using value_type = typename my_tree::value_type;
explicit AutoIndexObj(const typename my_tree::value_allocator &alloc = Allocator<T>{std::make_shared<SystemPool>()})
: my_tree::BPlusTree(alloc), inx_(kMinKey) {}
AutoIndexObj() : my_tree::BPlusTree(), inx_(kMinKey) {}
explicit AutoIndexObj(const Allocator<T> &alloc) : my_tree::BPlusTree(alloc), inx_(kMinKey) {}
~AutoIndexObj() = default;
@ -52,6 +54,14 @@ class AutoIndexObj : public BPlusTree<uint64_t, T> {
return my_tree::DoInsert(my_inx, val);
}
Status insert(std::unique_ptr<value_type> &&val, key_type *key = nullptr) {
key_type my_inx = inx_.fetch_add(1);
if (key) {
*key = my_inx;
}
return my_tree::DoInsert(my_inx, std::move(val));
}
// Insert a vector of objects into the tree.
// @param v
// @return

View File

@ -44,12 +44,14 @@ struct BPlusTreeTraits {
static constexpr bool kAppendMode = false;
};
// Implementation of B+ tree
// @tparam K
// @tparam V
// @tparam C
// @tparam T
template <typename K, typename V, typename C = std::less<K>, typename T = BPlusTreeTraits>
/// Implementation of B+ tree
/// @tparam K -- the type of key
/// @tparam V -- the type of value
/// @tparam A -- allocator
/// @tparam C -- comparison class
/// @tparam T -- trait
template <typename K, typename V, typename A = std::allocator<V>, typename C = std::less<K>,
typename T = BPlusTreeTraits>
class BPlusTree {
public:
enum class IndexRc : char {
@ -87,11 +89,13 @@ class BPlusTree {
using key_compare = C;
using slot_type = typename T::slot_type;
using traits = T;
using key_allocator = Allocator<key_type>;
using value_allocator = Allocator<value_type>;
using slot_allocator = Allocator<slot_type>;
using value_allocator = A;
using key_allocator = typename value_allocator::template rebind<key_type>::other;
using slot_allocator = typename value_allocator::template rebind<slot_type>::other;
explicit BPlusTree(const value_allocator &alloc);
BPlusTree();
explicit BPlusTree(const Allocator<V> &alloc);
~BPlusTree() noexcept;
@ -109,10 +113,15 @@ class BPlusTree {
bool empty() const { return (size() == 0); }
// @param key
// @param value
// @return
/// @param key
/// @param value
/// @return
Status DoInsert(const key_type &key, const value_type &value);
Status DoInsert(const key_type &key, std::unique_ptr<value_type> &&value);
// Update a new value for a given key.
std::unique_ptr<value_type> DoUpdate(const key_type &key, const value_type &new_value);
std::unique_ptr<value_type> DoUpdate(const key_type &key, std::unique_ptr<value_type> &&new_value);
void PopulateNumKeys();
@ -144,7 +153,7 @@ class BPlusTree {
virtual ~BaseNode() = default;
protected:
RWLock rw_lock_;
mutable RWLock rw_lock_;
value_allocator alloc_;
private:
@ -267,7 +276,7 @@ class BPlusTree {
// 50/50 split
IndexRc Split(LeafNode *to);
IndexRc InsertIntoSlot(LockPathCB *insCB, slot_type slot, const key_type &key, std::shared_ptr<value_type> value);
IndexRc InsertIntoSlot(LockPathCB *insCB, slot_type slot, const key_type &key, std::unique_ptr<value_type> &&value);
explicit LeafNode(const value_allocator &alloc) : BaseNode::BaseNode(alloc), slotuse_(0) {}
@ -275,11 +284,11 @@ class BPlusTree {
slot_type slot_dir_[traits::kLeafSlots];
key_type keys_[traits::kLeafSlots];
std::shared_ptr<value_type> data_[traits::kLeafSlots];
std::unique_ptr<value_type> data_[traits::kLeafSlots];
slot_type slotuse_;
};
RWLock rw_lock_;
mutable RWLock rw_lock_;
value_allocator alloc_;
// All the leaf nodes. Used by the iterator to traverse all the key/values.
List<LeafNode> leaf_nodes_;
@ -319,8 +328,8 @@ class BPlusTree {
return lo;
}
IndexRc LeafInsertKeyValue(LockPathCB *ins_cb, LeafNode *node, const key_type &key, std::shared_ptr<value_type> value,
key_type *split_key, LeafNode **split_node);
IndexRc LeafInsertKeyValue(LockPathCB *ins_cb, LeafNode *node, const key_type &key,
std::unique_ptr<value_type> &&value, key_type *split_key, LeafNode **split_node);
IndexRc InnerInsertKeyChild(InnerNode *node, const key_type &key, BaseNode *ptr, key_type *split_key,
InnerNode **split_node);
@ -335,10 +344,11 @@ class BPlusTree {
return child;
}
IndexRc InsertKeyValue(LockPathCB *ins_cb, BaseNode *n, const key_type &key, std::shared_ptr<value_type> value,
IndexRc InsertKeyValue(LockPathCB *ins_cb, BaseNode *n, const key_type &key, std::unique_ptr<value_type> &&value,
key_type *split_key, BaseNode **split_node);
IndexRc Locate(BaseNode *top, const key_type &key, LeafNode **ln, slot_type *s) const;
IndexRc Locate(RWLock *parent_lock, bool forUpdate, BaseNode *top, const key_type &key, LeafNode **ln,
slot_type *s) const;
public:
class Iterator : public std::iterator<std::bidirectional_iterator_tag, value_type> {
@ -346,19 +356,27 @@ class BPlusTree {
using reference = BPlusTree::value_type &;
using pointer = BPlusTree::value_type *;
explicit Iterator(BPlusTree *btree) : cur_(btree->leaf_nodes_.head), slot_(0) {}
explicit Iterator(BPlusTree *btree) : cur_(btree->leaf_nodes_.head), slot_(0), locked_(false) {}
Iterator(LeafNode *leaf, slot_type slot) : cur_(leaf), slot_(slot) {}
Iterator(LeafNode *leaf, slot_type slot, bool locked = false) : cur_(leaf), slot_(slot), locked_(locked) {}
~Iterator() = default;
~Iterator();
explicit Iterator(const Iterator &);
Iterator &operator=(const Iterator &lhs);
Iterator(Iterator &&);
Iterator &operator=(Iterator &&lhs);
pointer operator->() const { return cur_->data_[cur_->slot_dir_[slot_]].get(); }
reference operator*() const { return *(cur_->data_[cur_->slot_dir_[slot_]].get()); }
const key_type &key() { return cur_->keys_[cur_->slot_dir_[slot_]]; }
const key_type &key() const { return cur_->keys_[cur_->slot_dir_[slot_]]; }
const value_type &value() { return *(cur_->data_[cur_->slot_dir_[slot_]].get()); }
value_type &value() const { return *(cur_->data_[cur_->slot_dir_[slot_]].get()); }
// Prefix++
Iterator &operator++();
@ -379,6 +397,7 @@ class BPlusTree {
private:
typename BPlusTree::LeafNode *cur_;
slot_type slot_;
bool locked_;
};
class ConstIterator : public std::iterator<std::bidirectional_iterator_tag, value_type> {
@ -386,11 +405,20 @@ class BPlusTree {
using reference = BPlusTree::value_type &;
using pointer = BPlusTree::value_type *;
explicit ConstIterator(const BPlusTree *btree) : cur_(btree->leaf_nodes_.head), slot_(0) {}
explicit ConstIterator(const BPlusTree *btree) : cur_(btree->leaf_nodes_.head), slot_(0), locked_(false) {}
~ConstIterator() = default;
~ConstIterator();
ConstIterator(const LeafNode *leaf, slot_type slot) : cur_(leaf), slot_(slot) {}
ConstIterator(const LeafNode *leaf, slot_type slot, bool locked = false)
: cur_(leaf), slot_(slot), locked_(locked) {}
explicit ConstIterator(const ConstIterator &);
ConstIterator &operator=(const ConstIterator &lhs);
ConstIterator(ConstIterator &&);
ConstIterator &operator=(ConstIterator &&lhs);
pointer operator->() const { return cur_->data_[cur_->slot_dir_[slot_]].get(); }
@ -398,7 +426,7 @@ class BPlusTree {
const key_type &key() const { return cur_->keys_[cur_->slot_dir_[slot_]]; }
const value_type &value() const { return *(cur_->data_[cur_->slot_dir_[slot_]].get()); }
value_type &value() const { return *(cur_->data_[cur_->slot_dir_[slot_]].get()); }
// Prefix++
ConstIterator &operator++();
@ -419,6 +447,7 @@ class BPlusTree {
private:
const typename BPlusTree::LeafNode *cur_;
slot_type slot_;
bool locked_;
};
Iterator begin();
@ -435,6 +464,7 @@ class BPlusTree {
// Locate the entry with key
ConstIterator Search(const key_type &key) const;
Iterator Search(const key_type &key);
value_type operator[](key_type key);
};

View File

@ -19,10 +19,10 @@
namespace mindspore {
namespace dataset {
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::InnerNode::Sort() {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::InnerNode::Sort() {
// Build an inverse map. Basically it means keys[i] should be relocated to keys[inverse[i]];
Allocator<slot_type> alloc(this->alloc_);
slot_allocator alloc(this->alloc_);
slot_type *inverse = nullptr;
try {
inverse = alloc.allocate(traits::kInnerSlots);
@ -51,15 +51,15 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::InnerNode::Sort()
slot_dir_[i] = i;
}
if (inverse != nullptr) {
alloc.deallocate(inverse);
alloc.deallocate(inverse, traits::kInnerSlots);
inverse = nullptr;
}
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::InnerNode::Split(BPlusTree<K, V, C, T>::InnerNode *to,
key_type *split_key) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::InnerNode::Split(
BPlusTree<K, V, A, C, T>::InnerNode *to, key_type *split_key) {
DS_ASSERT(to);
DS_ASSERT(to->slotuse_ == 0);
// It is simpler to sort first, then split. Other alternative is to move key by key to the
@ -72,7 +72,7 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::InnerNode::Split(
if (err != EOK) {
return IndexRc::kUnexpectedError;
}
err = memcpy_s(to->data_, sizeof(to->data_), data_ + mid + 1, (num_keys_to_move + 1) * sizeof(BaseNode * ));
err = memcpy_s(to->data_, sizeof(to->data_), data_ + mid + 1, (num_keys_to_move + 1) * sizeof(BaseNode *));
if (err != EOK) {
return IndexRc::kUnexpectedError;
}
@ -84,10 +84,9 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::InnerNode::Split(
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc
BPlusTree<K, V, C, T>::InnerNode::InsertIntoSlot(slot_type slot, const key_type &key,
BPlusTree<K, V, C, T>::BaseNode *ptr) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::InnerNode::InsertIntoSlot(
slot_type slot, const key_type &key, BPlusTree<K, V, A, C, T>::BaseNode *ptr) {
if (is_full()) {
return IndexRc::kSlotFull;
}
@ -111,10 +110,10 @@ BPlusTree<K, V, C, T>::InnerNode::InsertIntoSlot(slot_type slot, const key_type
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::LeafNode::Sort() {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::LeafNode::Sort() {
// Build an inverse map. Basically it means keys[i] should be relocated to keys[inverse[i]];
Allocator<slot_type> alloc(this->alloc_);
slot_allocator alloc(this->alloc_);
slot_type *inverse = nullptr;
try {
inverse = alloc.allocate(traits::kLeafSlots);
@ -143,14 +142,15 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::LeafNode::Sort()
slot_dir_[i] = i;
}
if (inverse != nullptr) {
alloc.deallocate(inverse);
alloc.deallocate(inverse, traits::kLeafSlots);
inverse = nullptr;
}
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::LeafNode::Split(BPlusTree<K, V, C, T>::LeafNode *to) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::LeafNode::Split(
BPlusTree<K, V, A, C, T>::LeafNode *to) {
DS_ASSERT(to);
DS_ASSERT(to->slotuse_ == 0);
// It is simpler to sort first, then split. Other alternative is to move key by key to the
@ -171,11 +171,10 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::LeafNode::Split(B
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc
BPlusTree<K, V, C, T>::LeafNode::InsertIntoSlot(BPlusTree<K, V, C, T>::LockPathCB *insCB, slot_type slot,
const key_type &key,
std::shared_ptr<value_type> value) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::LeafNode::InsertIntoSlot(
BPlusTree<K, V, A, C, T>::LockPathCB *insCB, slot_type slot, const key_type &key,
std::unique_ptr<value_type> &&value) {
if (is_full()) {
// If we need to do node split, we need to ensure all the intermediate nodes are locked exclusive.
// Otherwise we need to do a retry.
@ -210,8 +209,9 @@ BPlusTree<K, V, C, T>::LeafNode::InsertIntoSlot(BPlusTree<K, V, C, T>::LockPathC
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::AllocateInner(BPlusTree<K, V, C, T>::InnerNode **p) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::AllocateInner(
BPlusTree<K, V, A, C, T>::InnerNode **p) {
if (p == nullptr) {
return IndexRc::kNullPointer;
}
@ -224,14 +224,15 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::AllocateInner(BPl
} catch (std::exception &e) {
return IndexRc::kUnexpectedError;
}
*p = new(ptr) InnerNode(alloc_);
*p = new (ptr) InnerNode(alloc_);
all_.Prepend(ptr);
stats_.inner_nodes_++;
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::AllocateLeaf(BPlusTree<K, V, C, T>::LeafNode **p) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::AllocateLeaf(
BPlusTree<K, V, A, C, T>::LeafNode **p) {
if (p == nullptr) {
return IndexRc::kNullPointer;
}
@ -244,24 +245,22 @@ typename BPlusTree<K, V, C, T>::IndexRc BPlusTree<K, V, C, T>::AllocateLeaf(BPlu
} catch (std::exception &e) {
return IndexRc::kUnexpectedError;
}
*p = new(ptr) LeafNode(alloc_);
*p = new (ptr) LeafNode(alloc_);
all_.Prepend(ptr);
stats_.leaves_++;
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc
BPlusTree<K, V, C, T>::LeafInsertKeyValue(BPlusTree<K, V, C, T>::LockPathCB *ins_cb,
BPlusTree<K, V, C, T>::LeafNode *node, const key_type &key,
std::shared_ptr<value_type> value, key_type *split_key,
BPlusTree<K, V, C, T>::LeafNode **split_node) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::LeafInsertKeyValue(
BPlusTree<K, V, A, C, T>::LockPathCB *ins_cb, BPlusTree<K, V, A, C, T>::LeafNode *node, const key_type &key,
std::unique_ptr<value_type> &&value, key_type *split_key, BPlusTree<K, V, A, C, T>::LeafNode **split_node) {
bool duplicate;
slot_type slot = FindSlot(node, key, &duplicate);
if (duplicate) {
return IndexRc::kDuplicateKey;
}
IndexRc rc = node->InsertIntoSlot(ins_cb, slot, key, value);
IndexRc rc = node->InsertIntoSlot(ins_cb, slot, key, std::move(value));
if (rc == IndexRc::kSlotFull) {
LeafNode *new_leaf = nullptr;
rc = AllocateLeaf(&new_leaf);
@ -273,7 +272,7 @@ BPlusTree<K, V, C, T>::LeafInsertKeyValue(BPlusTree<K, V, C, T>::LockPathCB *ins
*split_key = key;
// Just insert the new key to the new leaf. No further need to move the keys
// from one leaf to the other.
rc = new_leaf->InsertIntoSlot(nullptr, 0, key, value);
rc = new_leaf->InsertIntoSlot(nullptr, 0, key, std::move(value));
RETURN_IF_BAD_RC(rc);
} else {
// 50/50 split
@ -281,11 +280,11 @@ BPlusTree<K, V, C, T>::LeafInsertKeyValue(BPlusTree<K, V, C, T>::LockPathCB *ins
RETURN_IF_BAD_RC(rc);
*split_key = new_leaf->keys_[0];
if (LessThan(key, *split_key)) {
rc = node->InsertIntoSlot(nullptr, slot, key, value);
rc = node->InsertIntoSlot(nullptr, slot, key, std::move(value));
RETURN_IF_BAD_RC(rc);
} else {
slot -= node->slotuse_;
rc = new_leaf->InsertIntoSlot(nullptr, slot, key, value);
rc = new_leaf->InsertIntoSlot(nullptr, slot, key, std::move(value));
RETURN_IF_BAD_RC(rc);
}
}
@ -293,11 +292,10 @@ BPlusTree<K, V, C, T>::LeafInsertKeyValue(BPlusTree<K, V, C, T>::LockPathCB *ins
return rc;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc
BPlusTree<K, V, C, T>::InnerInsertKeyChild(BPlusTree<K, V, C, T>::InnerNode *node, const key_type &key,
BPlusTree<K, V, C, T>::BaseNode *ptr,
key_type *split_key, BPlusTree<K, V, C, T>::InnerNode **split_node) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::InnerInsertKeyChild(
BPlusTree<K, V, A, C, T>::InnerNode *node, const key_type &key, BPlusTree<K, V, A, C, T>::BaseNode *ptr,
key_type *split_key, BPlusTree<K, V, A, C, T>::InnerNode **split_node) {
bool duplicate;
slot_type slot = FindSlot(node, key, &duplicate);
if (duplicate) {
@ -333,12 +331,10 @@ BPlusTree<K, V, C, T>::InnerInsertKeyChild(BPlusTree<K, V, C, T>::InnerNode *nod
return rc;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc
BPlusTree<K, V, C, T>::InsertKeyValue(BPlusTree<K, V, C, T>::LockPathCB *ins_cb, BPlusTree<K, V, C, T>::BaseNode *n,
const key_type &key,
std::shared_ptr<value_type> value, key_type *split_key,
BPlusTree<K, V, C, T>::BaseNode **split_node) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::InsertKeyValue(
BPlusTree<K, V, A, C, T>::LockPathCB *ins_cb, BPlusTree<K, V, A, C, T>::BaseNode *n, const key_type &key,
std::unique_ptr<value_type> &&value, key_type *split_key, BPlusTree<K, V, A, C, T>::BaseNode **split_node) {
if (split_key == nullptr || split_node == nullptr) {
return IndexRc::kUnexpectedError;
}
@ -378,17 +374,36 @@ BPlusTree<K, V, C, T>::InsertKeyValue(BPlusTree<K, V, C, T>::LockPathCB *ins_cb,
return IndexRc::kOk;
}
template<typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::IndexRc
BPlusTree<K, V, C, T>::Locate(BPlusTree<K, V, C, T>::BaseNode *top, const key_type &key,
BPlusTree<K, V, C, T>::LeafNode **ln,
slot_type *s) const {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::IndexRc BPlusTree<K, V, A, C, T>::Locate(RWLock *parent_lock,
bool forUpdate,
BPlusTree<K, V, A, C, T>::BaseNode *top,
const key_type &key,
BPlusTree<K, V, A, C, T>::LeafNode **ln,
slot_type *s) const {
if (ln == nullptr || s == nullptr) {
return IndexRc::kNullPointer;
}
if (top == nullptr) {
return IndexRc::kKeyNotFound;
}
RWLock *myLock = nullptr;
if (parent_lock != nullptr) {
// Crabbing. Lock this node first, then unlock the parent.
myLock = &top->rw_lock_;
if (top->is_leafnode()) {
if (forUpdate) {
// We are holding the parent lock in S and try to lock this node with X. It is not possible to run
// into deadlock because no one will hold the child in X and trying to lock the parent in that order.
myLock->LockExclusive();
} else {
myLock->LockShared();
}
} else {
myLock->LockShared();
}
parent_lock->Unlock();
}
if (top->is_leafnode()) {
bool duplicate;
auto *leaf = static_cast<LeafNode *>(top);
@ -398,22 +413,29 @@ BPlusTree<K, V, C, T>::Locate(BPlusTree<K, V, C, T>::BaseNode *top, const key_ty
*ln = leaf;
*s = slot;
} else {
if (myLock != nullptr) {
myLock->Unlock();
}
return IndexRc::kKeyNotFound;
}
} else {
auto *inner = static_cast<InnerNode *>(top);
slot_type slot = FindSlot(inner, key);
return Locate(FindBranch(inner, slot), key, ln, s);
return Locate(myLock, forUpdate, FindBranch(inner, slot), key, ln, s);
}
// We still have a S lock on the leaf node. Leave it there. The iterator will unlock it for us.
return IndexRc::kOk;
}
template <typename K, typename V, typename C, typename T>
BPlusTree<K, V, C, T>::BPlusTree(const value_allocator &alloc)
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::BPlusTree() : leaf_nodes_(&LeafNode::link_), all_(&BaseNode::lru_), root_(nullptr) {}
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::BPlusTree(const Allocator<V> &alloc)
: alloc_(alloc), leaf_nodes_(&LeafNode::link_), all_(&BaseNode::lru_), root_(nullptr) {}
template<typename K, typename V, typename C, typename T>
BPlusTree<K, V, C, T>::~BPlusTree() noexcept {
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::~BPlusTree() noexcept {
// We have a list of all the nodes allocated. Traverse them and free all the memory
BaseNode *n = all_.head;
BaseNode *t = nullptr;
@ -436,8 +458,8 @@ BPlusTree<K, V, C, T>::~BPlusTree() noexcept {
root_ = nullptr;
}
template<typename K, typename V, typename C, typename T>
Status BPlusTree<K, V, C, T>::DoInsert(const key_type &key, const value_type &value) {
template <typename K, typename V, typename A, typename C, typename T>
Status BPlusTree<K, V, A, C, T>::DoInsert(const key_type &key, std::unique_ptr<value_type> &&value) {
IndexRc rc;
if (root_ == nullptr) {
UniqueLock lck(&rw_lock_);
@ -464,10 +486,7 @@ Status BPlusTree<K, V, C, T>::DoInsert(const key_type &key, const value_type &va
retry = false;
BaseNode *new_child = nullptr;
key_type new_key = key_type();
// We don't store the value directly into the leaf node as it is expensive to move it during node split.
// Rather we store a pointer instead. The value_type must support the copy constructor.
std::shared_ptr<value_type> ptr_value = std::make_shared<value_type>(value);
rc = InsertKeyValue(&InsCB, root_, key, std::move(ptr_value), &new_key, &new_child);
rc = InsertKeyValue(&InsCB, root_, key, std::move(value), &new_key, &new_child);
if (rc == IndexRc::kRetry) {
retry = true;
} else if (rc != IndexRc::kOk) {
@ -489,12 +508,50 @@ Status BPlusTree<K, V, C, T>::DoInsert(const key_type &key, const value_type &va
}
}
} while (retry);
(void) stats_.size_++;
(void)stats_.size_++;
return Status::OK();
}
template <typename K, typename V, typename C, typename T>
void BPlusTree<K, V, C, T>::PopulateNumKeys() {
template <typename K, typename V, typename A, typename C, typename T>
Status BPlusTree<K, V, A, C, T>::DoInsert(const key_type &key, const value_type &value) {
// We don't store the value directly into the leaf node as it is expensive to move it during node split.
// Rather we store a pointer instead.
return DoInsert(key, std::make_unique<value_type>(value));
}
template <typename K, typename V, typename A, typename C, typename T>
std::unique_ptr<V> BPlusTree<K, V, A, C, T>::DoUpdate(const key_type &key, const value_type &new_value) {
return DoUpdate(key, std::make_unique<value_type>(new_value));
}
template <typename K, typename V, typename A, typename C, typename T>
std::unique_ptr<V> BPlusTree<K, V, A, C, T>::DoUpdate(const key_type &key, std::unique_ptr<value_type> &&new_value) {
if (root_ != nullptr) {
LeafNode *leaf = nullptr;
slot_type slot;
RWLock *myLock = &this->rw_lock_;
// Lock the tree in S, pass the lock to Locate which will unlock it for us underneath.
myLock->LockShared();
IndexRc rc = Locate(myLock, true, root_, key, &leaf, &slot);
if (rc == IndexRc::kOk) {
// All locks from the tree to the parent of leaf are all gone. We still have a X lock
// on the leaf.
// Swap out the old value and replace it with new value.
std::unique_ptr<value_type> old = std::move(leaf->data_[leaf->slot_dir_[slot]]);
leaf->data_[leaf->slot_dir_[slot]] = std::move(new_value);
leaf->rw_lock_.Unlock();
return old;
} else {
MS_LOG(INFO) << "Key not found. rc = " << static_cast<int>(rc) << ".";
return nullptr;
}
} else {
return nullptr;
}
}
template <typename K, typename V, typename A, typename C, typename T>
void BPlusTree<K, V, A, C, T>::PopulateNumKeys() {
// Start from the root and we calculate how many leaf nodes as pointed to by each inner node.
// The results are stored in the numKeys array in each inner node.
(void)PopulateNumKeys(root_);
@ -502,8 +559,8 @@ void BPlusTree<K, V, C, T>::PopulateNumKeys() {
stats_.num_keys_array_valid_ = true;
}
template <typename K, typename V, typename C, typename T>
uint64_t BPlusTree<K, V, C, T>::PopulateNumKeys(BPlusTree<K, V, C, T>::BaseNode *n) {
template <typename K, typename V, typename A, typename C, typename T>
uint64_t BPlusTree<K, V, A, C, T>::PopulateNumKeys(BPlusTree<K, V, A, C, T>::BaseNode *n) {
if (n->is_leafnode()) {
auto *leaf = static_cast<LeafNode *>(n);
return leaf->slotuse_;
@ -518,8 +575,8 @@ uint64_t BPlusTree<K, V, C, T>::PopulateNumKeys(BPlusTree<K, V, C, T>::BaseNode
}
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::key_type BPlusTree<K, V, C, T>::KeyAtPos(uint64_t inx) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::key_type BPlusTree<K, V, A, C, T>::KeyAtPos(uint64_t inx) {
if (stats_.num_keys_array_valid_ == false) {
// We need exclusive access to the tree. If concurrent insert is going on, it is hard to get accurate numbers
UniqueLock lck(&rw_lock_);
@ -532,8 +589,9 @@ typename BPlusTree<K, V, C, T>::key_type BPlusTree<K, V, C, T>::KeyAtPos(uint64_
return KeyAtPos(root_, inx);
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::key_type BPlusTree<K, V, C, T>::KeyAtPos(BPlusTree<K, V, C, T>::BaseNode *n, uint64_t inx) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::key_type BPlusTree<K, V, A, C, T>::KeyAtPos(BPlusTree<K, V, A, C, T>::BaseNode *n,
uint64_t inx) {
if (n->is_leafnode()) {
auto *leaf = static_cast<LeafNode *>(n);
return leaf->keys_[leaf->slot_dir_[inx]];
@ -546,7 +604,7 @@ typename BPlusTree<K, V, C, T>::key_type BPlusTree<K, V, C, T>::KeyAtPos(BPlusTr
}
for (auto i = 0; i < inner->slotuse_; i++) {
if ((inx + 1) > inner->num_keys_[inner->slot_dir_[i] + 1]) {
inx -= inner->num_keys_[inner->slot_dir_[i]+1];
inx -= inner->num_keys_[inner->slot_dir_[i] + 1];
} else {
return KeyAtPos(inner->data_[inner->slot_dir_[i] + 1], inx);
}

View File

@ -21,11 +21,23 @@
namespace mindspore {
namespace dataset {
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::Iterator &BPlusTree<K, V, C, T>::Iterator::operator++() {
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::Iterator::~Iterator() {
if (locked_) {
cur_->rw_lock_.Unlock();
locked_ = false;
}
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator &BPlusTree<K, V, A, C, T>::Iterator::operator++() {
if (slot_ + 1u < cur_->slotuse_) {
++slot_;
} else if (cur_->link_.next) {
if (locked_) {
cur_->link_.next->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.next;
slot_ = 0;
} else {
@ -34,12 +46,16 @@ typename BPlusTree<K, V, C, T>::Iterator &BPlusTree<K, V, C, T>::Iterator::opera
return *this;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::Iterator BPlusTree<K, V, C, T>::Iterator::operator++(int) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator BPlusTree<K, V, A, C, T>::Iterator::operator++(int) {
Iterator tmp = *this;
if (slot_ + 1u < cur_->slotuse_) {
++slot_;
} else if (cur_->link_.next) {
if (locked_) {
cur_->link_.next->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.next;
slot_ = 0;
} else {
@ -48,11 +64,15 @@ typename BPlusTree<K, V, C, T>::Iterator BPlusTree<K, V, C, T>::Iterator::operat
return tmp;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::Iterator &BPlusTree<K, V, C, T>::Iterator::operator--() {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator &BPlusTree<K, V, A, C, T>::Iterator::operator--() {
if (slot_ > 0) {
--slot_;
} else if (cur_->link_.prev) {
if (locked_) {
cur_->link_.prev->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.prev;
slot_ = cur_->slotuse_ - 1;
} else {
@ -61,12 +81,16 @@ typename BPlusTree<K, V, C, T>::Iterator &BPlusTree<K, V, C, T>::Iterator::opera
return *this;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::Iterator BPlusTree<K, V, C, T>::Iterator::operator--(int) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator BPlusTree<K, V, A, C, T>::Iterator::operator--(int) {
Iterator tmp = *this;
if (slot_ > 0) {
--slot_;
} else if (cur_->link_.prev) {
if (locked_) {
cur_->link_.prev->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.prev;
slot_ = cur_->slotuse_ - 1;
} else {
@ -75,11 +99,77 @@ typename BPlusTree<K, V, C, T>::Iterator BPlusTree<K, V, C, T>::Iterator::operat
return tmp;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator &BPlusTree<K, V, C, T>::ConstIterator::operator++() {
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::Iterator::Iterator(const BPlusTree<K, V, A, C, T>::Iterator &lhs) {
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
if (this->locked_) {
this->cur_->rw_lock_.LockShared();
}
}
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::Iterator::Iterator(BPlusTree<K, V, A, C, T>::Iterator &&lhs) {
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
lhs.locked_ = false;
lhs.slot_ = 0;
lhs.cur_ = nullptr;
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator &BPlusTree<K, V, A, C, T>::Iterator::operator=(
const BPlusTree<K, V, A, C, T>::Iterator &lhs) {
if (*this != lhs) {
if (this->locked_) {
this->cur_->rw_lock_.Unlock();
}
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
if (this->locked_) {
this->cur_->rw_lock_.LockShared();
}
}
return *this;
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator &BPlusTree<K, V, A, C, T>::Iterator::operator=(
BPlusTree<K, V, A, C, T>::Iterator &&lhs) {
if (*this != lhs) {
if (this->locked_) {
this->cur_->rw_lock_.Unlock();
}
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
lhs.locked_ = false;
lhs.slot_ = 0;
lhs.cur_ = nullptr;
}
return *this;
}
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::ConstIterator::~ConstIterator() {
if (locked_) {
cur_->rw_lock_.Unlock();
locked_ = false;
}
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator &BPlusTree<K, V, A, C, T>::ConstIterator::operator++() {
if (slot_ + 1u < cur_->slotuse_) {
++slot_;
} else if (cur_->link_.next) {
if (locked_) {
cur_->link_.next->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.next;
slot_ = 0;
} else {
@ -88,12 +178,16 @@ typename BPlusTree<K, V, C, T>::ConstIterator &BPlusTree<K, V, C, T>::ConstItera
return *this;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::ConstIterator::operator++(int) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::ConstIterator::operator++(int) {
Iterator tmp = *this;
if (slot_ + 1u < cur_->slotuse_) {
++slot_;
} else if (cur_->link_.next) {
if (locked_) {
cur_->link_.next->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.next;
slot_ = 0;
} else {
@ -102,11 +196,15 @@ typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::ConstIterat
return tmp;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator &BPlusTree<K, V, C, T>::ConstIterator::operator--() {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator &BPlusTree<K, V, A, C, T>::ConstIterator::operator--() {
if (slot_ > 0) {
--slot_;
} else if (cur_->link_.prev) {
if (locked_) {
cur_->link_.prev->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.prev;
slot_ = cur_->slotuse_ - 1;
} else {
@ -115,12 +213,16 @@ typename BPlusTree<K, V, C, T>::ConstIterator &BPlusTree<K, V, C, T>::ConstItera
return *this;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::ConstIterator::operator--(int) {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::ConstIterator::operator--(int) {
Iterator tmp = *this;
if (slot_ > 0) {
--slot_;
} else if (cur_->link_.prev) {
if (locked_) {
cur_->link_.prev->rw_lock_.LockShared();
cur_->rw_lock_.Unlock();
}
cur_ = cur_->link_.prev;
slot_ = cur_->slotuse_ - 1;
} else {
@ -129,14 +231,95 @@ typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::ConstIterat
return tmp;
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::Search(const key_type &key) const {
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::ConstIterator::ConstIterator(const BPlusTree<K, V, A, C, T>::ConstIterator &lhs) {
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
if (this->locked_) {
this->cur_->rw_lock_.LockShared();
}
}
template <typename K, typename V, typename A, typename C, typename T>
BPlusTree<K, V, A, C, T>::ConstIterator::ConstIterator(BPlusTree<K, V, A, C, T>::ConstIterator &&lhs) {
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
lhs.locked_ = false;
lhs.slot_ = 0;
lhs.cur_ = nullptr;
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator &BPlusTree<K, V, A, C, T>::ConstIterator::operator=(
const BPlusTree<K, V, A, C, T>::ConstIterator &lhs) {
if (*this != lhs) {
if (this->locked_) {
this->cur_->rw_lock_.Unlock();
}
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
if (this->locked_) {
this->cur_->rw_lock_.LockShared();
}
}
return *this;
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator &BPlusTree<K, V, A, C, T>::ConstIterator::operator=(
BPlusTree<K, V, A, C, T>::ConstIterator &&lhs) {
if (*this != lhs) {
if (this->locked_) {
this->cur_->rw_lock_.Unlock();
}
this->cur_ = lhs.cur_;
this->slot_ = lhs.slot_;
this->locked_ = lhs.locked_;
lhs.locked_ = false;
lhs.slot_ = 0;
lhs.cur_ = nullptr;
}
return *this;
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::Search(const key_type &key) const {
if (root_ != nullptr) {
LeafNode *leaf = nullptr;
slot_type slot;
IndexRc rc = Locate(root_, key, &leaf, &slot);
RWLock *myLock = &this->rw_lock_;
// Lock the tree in S, pass the lock to Locate which will unlock it for us underneath.
myLock->LockShared();
IndexRc rc = Locate(myLock, false, root_, key, &leaf, &slot);
if (rc == IndexRc::kOk) {
return ConstIterator(leaf, slot);
// All locks from the tree to the parent of leaf are all gone. We still have a S lock
// on the leaf. The unlock will be handled by the iterator when it goes out of scope.
return ConstIterator(leaf, slot, true);
} else {
MS_LOG(INFO) << "Key not found. rc = " << static_cast<int>(rc) << ".";
return cend();
}
} else {
return cend();
}
}
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator BPlusTree<K, V, A, C, T>::Search(const key_type &key) {
if (root_ != nullptr) {
LeafNode *leaf = nullptr;
slot_type slot;
RWLock *myLock = &this->rw_lock_;
// Lock the tree in S, pass the lock to Locate which will unlock it for us underneath.
myLock->LockShared();
IndexRc rc = Locate(myLock, false, root_, key, &leaf, &slot);
if (rc == IndexRc::kOk) {
// All locks from the tree to the parent of leaf are all gone. We still have a S lock
// on the leaf. The unlock will be handled by the iterator when it goes out of scope.
return Iterator(leaf, slot, true);
} else {
MS_LOG(INFO) << "Key not found. rc = " << static_cast<int>(rc) << ".";
return end();
@ -146,39 +329,39 @@ typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::Search(cons
}
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::value_type BPlusTree<K, V, C, T>::operator[](key_type key) {
ConstIterator it = Search(key);
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::value_type BPlusTree<K, V, A, C, T>::operator[](key_type key) {
Iterator it = Search(key);
return it.value();
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::Iterator BPlusTree<K, V, C, T>::begin() {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator BPlusTree<K, V, A, C, T>::begin() {
return Iterator(this);
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::Iterator BPlusTree<K, V, C, T>::end() {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::Iterator BPlusTree<K, V, A, C, T>::end() {
return Iterator(this->leaf_nodes_.tail, this->leaf_nodes_.tail ? this->leaf_nodes_.tail->slotuse_ : 0);
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::begin() const {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::begin() const {
return ConstIterator(this);
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::end() const {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::end() const {
return ConstIterator(this->leaf_nodes_.tail, this->leaf_nodes_.tail ? this->leaf_nodes_.tail->slotuse_ : 0);
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::cbegin() const {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::cbegin() const {
return ConstIterator(this);
}
template <typename K, typename V, typename C, typename T>
typename BPlusTree<K, V, C, T>::ConstIterator BPlusTree<K, V, C, T>::cend() const {
template <typename K, typename V, typename A, typename C, typename T>
typename BPlusTree<K, V, A, C, T>::ConstIterator BPlusTree<K, V, A, C, T>::cend() const {
return ConstIterator(this->leaf_nodes_.tail, this->leaf_nodes_.tail ? this->leaf_nodes_.tail->slotuse_ : 0);
}
} // namespace dataset

View File

@ -50,7 +50,7 @@ class MindDataTestBPlusTree : public UT::Common {
// Test serial insert.
TEST_F(MindDataTestBPlusTree, Test1) {
Allocator<std::string> alloc(std::make_shared<SystemPool>());
BPlusTree<uint64_t, std::string, std::less<uint64_t>, mytraits> btree(alloc);
BPlusTree<uint64_t, std::string, Allocator<std::string>, std::less<uint64_t>, mytraits> btree(alloc);
Status rc;
for (int i = 0; i < 100; i++) {
uint64_t key = 2 * i;
@ -92,16 +92,16 @@ TEST_F(MindDataTestBPlusTree, Test1) {
}
}
// Test nearch
// Test search
{
MS_LOG(INFO) << "Locate key " << 100 << " Expect found.";
auto it = btree.Search(100);
EXPECT_FALSE(it == btree.cend());
EXPECT_FALSE(it == btree.end());
EXPECT_EQ(it.key(), 100);
EXPECT_EQ(it.value(), "Hello World. I am 100");
MS_LOG(INFO) << "Locate key " << 300 << " Expect not found.";
it = btree.Search(300);
EXPECT_TRUE(it == btree.cend());
EXPECT_TRUE(it == btree.end());
}
// Test duplicate key
@ -114,7 +114,7 @@ TEST_F(MindDataTestBPlusTree, Test1) {
// Test concurrent insert.
TEST_F(MindDataTestBPlusTree, Test2) {
Allocator<std::string> alloc(std::make_shared<SystemPool>());
BPlusTree<uint64_t, std::string, std::less<uint64_t>, mytraits> btree(alloc);
BPlusTree<uint64_t, std::string, Allocator<std::string>, std::less<uint64_t>, mytraits> btree(alloc);
TaskGroup vg;
auto f = [&](int k) -> Status {
TaskManager::FindMe()->Post();
@ -127,10 +127,22 @@ TEST_F(MindDataTestBPlusTree, Test2) {
}
return Status::OK();
};
// Spawn two threads. One insert the odd numbers and the other insert the even numbers just like Test1
auto g = [&](int k) -> Status {
TaskManager::FindMe()->Post();
for (int i = 0; i < 1000; i++) {
uint64_t key = rand() % 10000;;
auto it = btree.Search(key);
}
return Status::OK();
};
// Spawn multiple threads to do insert.
for (int k = 0; k < 100; k++) {
vg.CreateAsyncTask("Concurrent Insert", std::bind(f, k));
}
// Spawn a few threads to do random search.
for (int k = 0; k < 2; k++) {
vg.CreateAsyncTask("Concurrent search", std::bind(g, k));
}
vg.join_all();
EXPECT_EQ(btree.size(), 10000);
@ -158,7 +170,7 @@ TEST_F(MindDataTestBPlusTree, Test2) {
MS_LOG(INFO) << "Locating key from 0 to 9999. Expect found.";
for (int i = 0; i < 10000; i++) {
auto it = btree.Search(i);
bool eoS = (it == btree.cend());
bool eoS = (it == btree.end());
EXPECT_FALSE(eoS);
if (!eoS) {
EXPECT_EQ(it.key(), i);
@ -168,7 +180,7 @@ TEST_F(MindDataTestBPlusTree, Test2) {
}
MS_LOG(INFO) << "Locate key " << 10000 << ". Expect not found";
auto it = btree.Search(10000);
EXPECT_TRUE(it == btree.cend());
EXPECT_TRUE(it == btree.end());
}
// Test to retrieve key at certain position.
@ -182,11 +194,11 @@ TEST_F(MindDataTestBPlusTree, Test2) {
TEST_F(MindDataTestBPlusTree, Test3) {
Allocator<std::string> alloc(std::make_shared<SystemPool>());
AutoIndexObj<std::string> ai(alloc);
AutoIndexObj<std::string, Allocator<std::string>> ai(alloc);
Status rc;
rc = ai.insert("Hello World");
EXPECT_TRUE(rc.IsOk());
ai.insert({"a", "b", "c"});
rc = ai.insert({"a", "b", "c"});
EXPECT_TRUE(rc.IsOk());
uint64_t min = ai.min_key();
uint64_t max = ai.max_key();
@ -199,3 +211,30 @@ TEST_F(MindDataTestBPlusTree, Test3) {
MS_LOG(DEBUG) << ai[i] << std::endl;
}
}
TEST_F(MindDataTestBPlusTree, Test4) {
Allocator<int64_t> alloc(std::make_shared<SystemPool>());
AutoIndexObj<int64_t, Allocator<int64_t>> ai(alloc);
Status rc;
for (int i = 0; i < 1000; i++) {
rc = ai.insert(std::make_unique<int64_t>(i));
EXPECT_TRUE(rc.IsOk());
}
// Test iterator
{
int cnt = 0;
auto it = ai.begin();
uint64_t prev = it.key();
++it;
++cnt;
while (it != ai.end()) {
uint64_t cur = it.key();
EXPECT_TRUE(prev < cur);
EXPECT_EQ(it.value(), cnt);
prev = cur;
++it;
++cnt;
}
EXPECT_EQ(cnt, 1000);
}
}