2017-05-26 04:48:44 +08:00
|
|
|
/*
|
|
|
|
* IndexedSet.h
|
|
|
|
*
|
|
|
|
* This source file is part of the FoundationDB open source project
|
|
|
|
*
|
|
|
|
* Copyright 2013-2018 Apple Inc. and the FoundationDB project authors
|
2018-02-22 02:25:11 +08:00
|
|
|
*
|
2017-05-26 04:48:44 +08:00
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
2018-02-22 02:25:11 +08:00
|
|
|
*
|
2017-05-26 04:48:44 +08:00
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
2018-02-22 02:25:11 +08:00
|
|
|
*
|
2017-05-26 04:48:44 +08:00
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef FLOW_INDEXEDSET_H
|
|
|
|
#define FLOW_INDEXEDSET_H
|
|
|
|
#pragma once
|
|
|
|
|
2020-04-04 02:18:06 +08:00
|
|
|
#include "flow/Arena.h"
|
2018-10-20 01:30:13 +08:00
|
|
|
#include "flow/Platform.h"
|
|
|
|
#include "flow/FastAlloc.h"
|
|
|
|
#include "flow/Trace.h"
|
|
|
|
#include "flow/Error.h"
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
#include <deque>
|
2020-05-17 01:34:36 +08:00
|
|
|
#include <type_traits>
|
2017-05-26 04:48:44 +08:00
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
// IndexedSet<T, Metric> is similar to a std::set<T>, with the following additional features:
|
|
|
|
// - Each element in the set is associated with a value of type Metric
|
|
|
|
// - sumTo() and sumRange() can report the sum of the metric values associated with a
|
|
|
|
// contiguous range of elements in O(lg N) time
|
|
|
|
// - index() can be used to find an element having a given sumTo() in O(lg N) time
|
|
|
|
// - Search functions (find(), lower_bound(), etc) can accept a type comparable to T instead of T
|
|
|
|
// (e.g. StringRef when T is std::string or Standalone<StringRef>). This can save a lot of needless
|
|
|
|
// copying at query time for read-mostly sets with string keys.
|
|
|
|
// - the size() function is missing; if the metric being used is a count sumTo(end()) will do instead
|
|
|
|
// A number of STL compatibility features are missing and should be added as needed.
|
|
|
|
// T must define operator <, which must define a total order. Unlike std::set,
|
|
|
|
// a user-defined predicate is not currently supported as a template parameter.
|
|
|
|
// Metric is required to have operators + and - and <, and behavior is undefined if
|
|
|
|
// the sum of metrics for all elements of a set overflows the Metric type.
|
|
|
|
|
|
|
|
// Map<Key,Value> is similar to a std::map<Key,Value>, except that it inherits the search key type
|
|
|
|
// flexibility of IndexedSet<>, uses MapPair<Key,Value> by default instead of pair<Key,Value>
|
|
|
|
// (use iterator->key instead of iterator->first), and uses FastAllocator for nodes.
|
|
|
|
|
|
|
|
template <class T>
|
|
|
|
class Future;
|
|
|
|
|
|
|
|
class Void;
|
|
|
|
|
2019-01-10 10:03:54 +08:00
|
|
|
class StringRef;
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
struct IndexedSet {
|
2017-05-26 04:48:44 +08:00
|
|
|
typedef T value_type;
|
|
|
|
typedef T key_type;
|
|
|
|
|
|
|
|
private: // Forward-declare IndexedSet::Node because Clang is much stricter about this ordering.
|
|
|
|
struct Node : FastAllocated<Node> {
|
2017-10-04 11:07:29 +08:00
|
|
|
// Here, and throughout all code that indirectly instantiates a Node, we rely on forwarding
|
|
|
|
// references so that we don't need to maintain the set of 2^arity lvalue and rvalue reference
|
|
|
|
// combinations, but still take advantage of move constructors when available (or required).
|
|
|
|
template <class T_, class Metric_>
|
2021-03-11 02:06:03 +08:00
|
|
|
Node(T_&& data, Metric_&& m, Node* parent = 0)
|
|
|
|
: data(std::forward<T_>(data)), total(std::forward<Metric_>(m)), parent(parent), balance(0) {
|
2020-05-17 01:34:36 +08:00
|
|
|
child[0] = child[1] = nullptr;
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2020-05-17 01:34:36 +08:00
|
|
|
Node(Node const&) = delete;
|
|
|
|
Node& operator=(Node const&) = delete;
|
2021-03-11 02:06:03 +08:00
|
|
|
~Node() {
|
2017-05-26 04:48:44 +08:00
|
|
|
delete child[0];
|
|
|
|
delete child[1];
|
|
|
|
}
|
|
|
|
|
|
|
|
T data;
|
2021-03-11 02:06:03 +08:00
|
|
|
signed char balance; // right height - left height
|
|
|
|
Metric total; // this + child[0] + child[1]
|
|
|
|
Node* child[2]; // left, right
|
|
|
|
Node* parent;
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
|
|
|
struct IteratorImpl {
|
2020-05-17 05:25:13 +08:00
|
|
|
typename std::conditional_t<isConst, const IndexedSet::Node, IndexedSet::Node>* node;
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-18 03:47:32 +08:00
|
|
|
explicit IteratorImpl<isConst>(const IteratorImpl<!isConst>& nonConstIter) : node(nonConstIter.node) {
|
|
|
|
static_assert(isConst);
|
|
|
|
}
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-17 05:25:13 +08:00
|
|
|
explicit IteratorImpl(decltype(node) n = nullptr) : node(n){};
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-18 03:47:32 +08:00
|
|
|
typename std::conditional_t<isConst, const T, T>& operator*() const { return node->data; }
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-18 03:47:32 +08:00
|
|
|
typename std::conditional_t<isConst, const T, T>* operator->() const { return &node->data; }
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
void operator++();
|
|
|
|
void decrementNonEnd();
|
2020-05-18 03:47:32 +08:00
|
|
|
bool operator==(const IteratorImpl<isConst>& r) const { return node == r.node; }
|
|
|
|
bool operator!=(const IteratorImpl<isConst>& r) const { return node != r.node; }
|
2019-01-10 10:03:54 +08:00
|
|
|
// following two methods are for memory storage engine(KeyValueStoreMemory class) use only
|
|
|
|
// in order to have same interface as radixtree
|
2020-05-18 04:29:22 +08:00
|
|
|
typename std::conditional_t<isConst, const StringRef, StringRef>& getKey(uint8_t* dummyContent) const {
|
|
|
|
return node->data.key;
|
|
|
|
}
|
|
|
|
typename std::conditional_t<isConst, const StringRef, StringRef>& getValue() const { return node->data.value; }
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
|
|
|
struct Impl {
|
2020-05-17 03:53:36 +08:00
|
|
|
using NodeT = std::conditional_t<isConst, const Node, Node>;
|
2020-05-17 01:34:36 +08:00
|
|
|
using IteratorT = IteratorImpl<isConst>;
|
|
|
|
using SetT = std::conditional_t<isConst, const IndexedSet<T, Metric>, IndexedSet<T, Metric>>;
|
|
|
|
|
|
|
|
static IteratorT begin(SetT&);
|
|
|
|
|
|
|
|
template <bool constIterator>
|
|
|
|
static IteratorImpl<isConst || constIterator> previous(SetT&, IteratorImpl<constIterator>);
|
|
|
|
|
|
|
|
template <class M>
|
|
|
|
static IteratorT index(SetT&, const M&);
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
static IteratorT find(SetT&, const Key&);
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
static IteratorT upper_bound(SetT&, const Key&);
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
static IteratorT lower_bound(SetT&, const Key&);
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
static IteratorT lastLessOrEqual(SetT&, const Key&);
|
|
|
|
|
|
|
|
static IteratorT lastItem(SetT&);
|
|
|
|
};
|
|
|
|
|
2020-05-17 01:38:42 +08:00
|
|
|
using ConstImpl = Impl<true>;
|
|
|
|
using NonConstImpl = Impl<false>;
|
|
|
|
|
2020-05-17 01:34:36 +08:00
|
|
|
public:
|
|
|
|
using iterator = IteratorImpl<false>;
|
|
|
|
using const_iterator = IteratorImpl<true>;
|
|
|
|
|
2020-05-17 06:00:15 +08:00
|
|
|
IndexedSet() : root(nullptr){};
|
2017-05-26 04:48:44 +08:00
|
|
|
~IndexedSet() { delete root; }
|
2020-06-10 08:33:41 +08:00
|
|
|
IndexedSet(IndexedSet&& r) noexcept : root(r.root) { r.root = nullptr; }
|
|
|
|
IndexedSet& operator=(IndexedSet&& r) noexcept {
|
|
|
|
delete root;
|
|
|
|
root = r.root;
|
|
|
|
r.root = 0;
|
|
|
|
return *this;
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-05-17 01:38:42 +08:00
|
|
|
const_iterator begin() const { return ConstImpl::begin(*this); };
|
|
|
|
iterator begin() { return NonConstImpl::begin(*this); };
|
2020-05-17 09:01:07 +08:00
|
|
|
const_iterator cbegin() const { return begin(); }
|
|
|
|
|
2020-05-17 05:29:38 +08:00
|
|
|
const_iterator end() const { return const_iterator{}; }
|
|
|
|
iterator end() { return iterator{}; }
|
2020-05-17 09:01:07 +08:00
|
|
|
const_iterator cend() const { return end(); }
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-17 01:38:42 +08:00
|
|
|
const_iterator previous(const_iterator i) const { return ConstImpl::previous(*this, i); }
|
2020-05-17 08:01:26 +08:00
|
|
|
const_iterator previous(iterator i) const { return ConstImpl::previous(*this, const_iterator{ i }); }
|
2020-05-17 03:53:36 +08:00
|
|
|
iterator previous(iterator i) { return NonConstImpl::previous(*this, i); }
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-17 01:38:42 +08:00
|
|
|
const_iterator lastItem() const { return ConstImpl::lastItem(*this); }
|
|
|
|
iterator lastItem() { return NonConstImpl::lastItem(*this); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
bool empty() const { return !root; }
|
2020-05-17 06:00:15 +08:00
|
|
|
void clear() {
|
|
|
|
delete root;
|
|
|
|
root = nullptr;
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
void swap(IndexedSet& r) { std::swap(root, r.root); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Place data in the set with the given metric. If an item equal to data is already in the set and,
|
|
|
|
// replaceExisting == true, it will be overwritten (and its metric will be replaced)
|
2017-10-04 11:07:29 +08:00
|
|
|
template <class T_, class Metric_>
|
2021-03-11 02:06:03 +08:00
|
|
|
iterator insert(T_&& data, Metric_&& metric, bool replaceExisting = true);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// Insert all items from data into set. All items will use metric. If an item equal to data is already in the set
|
|
|
|
// and,
|
|
|
|
// replaceExisting == true, it will be overwritten (and its metric will be replaced). returns the number of items
|
|
|
|
// inserted.
|
|
|
|
int insert(const std::vector<std::pair<T, Metric>>& data, bool replaceExisting = true);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Increase the metric for the given item by the given amount. Inserts data into the set if it
|
|
|
|
// doesn't exist. Returns the new sum.
|
2017-10-04 11:07:29 +08:00
|
|
|
template <class T_, class Metric_>
|
2021-03-11 02:06:03 +08:00
|
|
|
Metric addMetric(T_&& data, Metric_&& metric);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Remove the data item, if any, which is equal to key
|
|
|
|
template <class Key>
|
2021-03-11 02:06:03 +08:00
|
|
|
void erase(const Key& key) {
|
|
|
|
erase(find(key));
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Erase the indicated item. No effect if item == end().
|
|
|
|
// SOMEDAY: Return ++item
|
|
|
|
void erase(iterator item);
|
|
|
|
|
|
|
|
// Erase all data items x for which begin<=x<end
|
|
|
|
template <class Key>
|
2021-03-11 02:06:03 +08:00
|
|
|
void erase(const Key& begin, const Key& end) {
|
|
|
|
erase(lower_bound(begin), lower_bound(end));
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Erase data items with a deferred (async) free process. The data structure has the items removed
|
|
|
|
// synchronously with the invocation of this method so any subsequent call will see this new state.
|
|
|
|
template <class Key>
|
|
|
|
Future<Void> eraseAsync(const Key& begin, const Key& end);
|
|
|
|
|
|
|
|
// Erase the items in the indicated range.
|
|
|
|
void erase(iterator begin, iterator end);
|
|
|
|
|
|
|
|
// Erase data items with a deferred (async) free process. The data structure has the items removed
|
|
|
|
// synchronously with the invocation of this method so any subsequent call will see this new state.
|
|
|
|
Future<Void> eraseAsync(iterator begin, iterator end);
|
|
|
|
|
|
|
|
// Returns the number of items equal to key (either 0 or 1)
|
|
|
|
template <class Key>
|
2021-03-11 02:06:03 +08:00
|
|
|
int count(const Key& key) const {
|
|
|
|
return find(key) != end();
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Returns x such that key==*x, or end()
|
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator find(const Key& key) const {
|
2020-05-17 01:38:42 +08:00
|
|
|
return ConstImpl::find(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
iterator find(const Key& key) {
|
2020-05-17 01:38:42 +08:00
|
|
|
return NonConstImpl::find(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Returns the smallest x such that *x>=key, or end()
|
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator lower_bound(const Key& key) const {
|
2020-05-17 01:38:42 +08:00
|
|
|
return ConstImpl::lower_bound(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
iterator lower_bound(const Key& key) {
|
2020-05-17 01:38:42 +08:00
|
|
|
return NonConstImpl::lower_bound(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
};
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Returns the smallest x such that *x>key, or end()
|
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator upper_bound(const Key& key) const {
|
2020-05-17 01:38:42 +08:00
|
|
|
return ConstImpl::upper_bound(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
iterator upper_bound(const Key& key) {
|
2020-05-17 01:38:42 +08:00
|
|
|
return NonConstImpl::upper_bound(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
};
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Returns the largest x such that *x<=key, or end()
|
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator lastLessOrEqual(const Key& key) const {
|
2020-05-17 01:38:42 +08:00
|
|
|
return ConstImpl::lastLessOrEqual(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
template <class Key>
|
|
|
|
iterator lastLessOrEqual(const Key& key) {
|
2020-05-17 01:38:42 +08:00
|
|
|
return NonConstImpl::lastLessOrEqual(*this, key);
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Returns smallest x such that sumTo(x+1) > metric, or end()
|
|
|
|
template <class M>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator index(M const& metric) const {
|
2020-05-17 01:38:42 +08:00
|
|
|
return ConstImpl::index(*this, metric);
|
2020-05-17 01:34:36 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
template <class M>
|
|
|
|
iterator index(M const& metric) {
|
2020-05-17 01:38:42 +08:00
|
|
|
return NonConstImpl::index(*this, metric);
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Return the metric inserted with item x
|
2020-05-17 01:34:36 +08:00
|
|
|
Metric getMetric(const_iterator x) const;
|
2020-05-18 02:23:10 +08:00
|
|
|
Metric getMetric(iterator x) const { return getMetric(const_iterator{ x }); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Return the sum of getMetric(x) for begin()<=x<to
|
2020-05-17 01:34:36 +08:00
|
|
|
Metric sumTo(const_iterator to) const;
|
2020-05-18 02:23:10 +08:00
|
|
|
Metric sumTo(iterator to) const { return sumTo(const_iterator{ to }); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Return the sum of getMetric(x) for begin<=x<end
|
2020-05-17 01:34:36 +08:00
|
|
|
Metric sumRange(const_iterator begin, const_iterator end) const { return sumTo(end) - sumTo(begin); }
|
2020-05-17 04:01:57 +08:00
|
|
|
Metric sumRange(iterator begin, iterator end) const {
|
|
|
|
return sumTo(const_iterator{ end }) - sumTo(const_iterator{ begin });
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Return the sum of getMetric(x) for all x s.t. begin <= *x && *x < end
|
2020-05-17 01:34:36 +08:00
|
|
|
template <class Key>
|
|
|
|
Metric sumRange(const Key& begin, const Key& end) const {
|
|
|
|
return sumRange(lower_bound(begin), lower_bound(end));
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Return the amount of memory used by an entry in the IndexedSet
|
2020-06-18 09:08:43 +08:00
|
|
|
constexpr static int getElementBytes() { return sizeof(Node); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
private:
|
|
|
|
// Copy operations unimplemented. SOMEDAY: Implement and make public.
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet(const IndexedSet&);
|
|
|
|
IndexedSet& operator=(const IndexedSet&);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* root;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-04-04 02:18:06 +08:00
|
|
|
Metric eraseHalf(Node* start, Node* end, int eraseDir, int& heightDelta, std::vector<Node*>& toFree);
|
2021-03-11 02:06:03 +08:00
|
|
|
void erase(iterator begin, iterator end, std::vector<Node*>& toFree);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
void replacePointer(Node* oldNode, Node* newNode) {
|
2017-05-26 04:48:44 +08:00
|
|
|
if (oldNode->parent)
|
2021-03-11 02:06:03 +08:00
|
|
|
oldNode->parent->child[oldNode->parent->child[1] == oldNode] = newNode;
|
2017-05-26 04:48:44 +08:00
|
|
|
else
|
|
|
|
root = newNode;
|
|
|
|
if (newNode)
|
|
|
|
newNode->parent = oldNode->parent;
|
|
|
|
}
|
|
|
|
|
2020-05-17 02:31:15 +08:00
|
|
|
template <int direction, bool isConst>
|
2020-05-17 05:58:09 +08:00
|
|
|
static void moveIteratorImpl(std::conditional_t<isConst, const Node, Node>*& node) {
|
2020-05-17 02:31:15 +08:00
|
|
|
if (node->child[0 ^ direction]) {
|
|
|
|
node = node->child[0 ^ direction];
|
2021-03-11 02:06:03 +08:00
|
|
|
while (node->child[1 ^ direction])
|
|
|
|
node = node->child[1 ^ direction];
|
2020-05-17 01:34:36 +08:00
|
|
|
} else {
|
2021-03-11 02:06:03 +08:00
|
|
|
while (node->parent && node->parent->child[0 ^ direction] == node)
|
|
|
|
node = node->parent;
|
2020-05-17 02:31:15 +08:00
|
|
|
node = node->parent;
|
2020-05-17 01:34:36 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-05-17 02:31:15 +08:00
|
|
|
// direction 0 = left, 1 = right
|
2020-05-17 01:34:36 +08:00
|
|
|
template <int direction>
|
2020-05-17 02:31:15 +08:00
|
|
|
static void moveIterator(Node const*& node) {
|
2020-05-17 05:58:09 +08:00
|
|
|
moveIteratorImpl<direction, true>(node);
|
2020-05-17 02:31:15 +08:00
|
|
|
}
|
|
|
|
template <int direction>
|
|
|
|
static void moveIterator(Node*& node) {
|
2020-05-17 05:58:09 +08:00
|
|
|
moveIteratorImpl<direction, false>(node);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
public: // but testonly
|
2021-03-11 02:06:03 +08:00
|
|
|
std::pair<int, int> testonly_assertBalanced(Node* n = 0, int d = 0, bool a = true);
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
// Placeholder metric that carries no information: it can be built from nothing or from any
// int, adding or subtracting two of them yields another NoMetric, and no NoMetric ever
// compares less than another.
class NoMetric {
public:
    NoMetric() {}
    NoMetric(int) {} // NoMetric(1)

    bool operator<(NoMetric const&) const { return false; }

    NoMetric operator+(NoMetric const&) const { return {}; }
    NoMetric operator-(NoMetric const&) const { return {}; }
};
|
|
|
|
|
|
|
|
template <class Key, class Value>
|
|
|
|
class MapPair {
|
|
|
|
public:
|
|
|
|
Key key;
|
|
|
|
Value value;
|
|
|
|
|
2017-10-04 11:07:29 +08:00
|
|
|
template <class Key_, class Value_>
|
2021-03-11 02:06:03 +08:00
|
|
|
MapPair(Key_&& key, Value_&& value) : key(std::forward<Key_>(key)), value(std::forward<Value_>(value)) {}
|
|
|
|
void operator=(MapPair const& rhs) {
|
|
|
|
key = rhs.key;
|
|
|
|
value = rhs.value;
|
|
|
|
}
|
|
|
|
MapPair(MapPair const& rhs) : key(rhs.key), value(rhs.value) {}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-06-10 08:33:41 +08:00
|
|
|
MapPair(MapPair&& r) noexcept : key(std::move(r.key)), value(std::move(r.value)) {}
|
|
|
|
void operator=(MapPair&& r) noexcept {
|
|
|
|
key = std::move(r.key);
|
|
|
|
value = std::move(r.value);
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-04-04 02:18:06 +08:00
|
|
|
int compare(MapPair<Key, Value> const& r) const { return ::compare(key, r.key); }
|
|
|
|
template <class CompatibleWithKey>
|
|
|
|
int compare(CompatibleWithKey const& r) const {
|
|
|
|
return ::compare(key, r);
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
bool operator<(MapPair<Key, Value> const& r) const { return key < r.key; }
|
2020-07-11 05:37:47 +08:00
|
|
|
bool operator>(MapPair<Key, Value> const& r) const { return key > r.key; }
|
2021-03-11 02:06:03 +08:00
|
|
|
bool operator<=(MapPair<Key, Value> const& r) const { return key <= r.key; }
|
2020-07-11 05:37:47 +08:00
|
|
|
bool operator>=(MapPair<Key, Value> const& r) const { return key >= r.key; }
|
2021-03-11 02:06:03 +08:00
|
|
|
bool operator==(MapPair<Key, Value> const& r) const { return key == r.key; }
|
|
|
|
bool operator!=(MapPair<Key, Value> const& r) const { return key != r.key; }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// private: MapPair( const MapPair& );
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
2020-04-04 02:18:06 +08:00
|
|
|
template <class Key, class Value, class CompatibleWithKey>
|
|
|
|
inline int compare(CompatibleWithKey const& l, MapPair<Key, Value> const& r) {
|
|
|
|
return compare(l, r.key);
|
|
|
|
}
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class Key, class Value>
|
2021-03-11 02:06:03 +08:00
|
|
|
inline MapPair<typename std::decay<Key>::type, typename std::decay<Value>::type> mapPair(Key&& key, Value&& value) {
|
|
|
|
return MapPair<typename std::decay<Key>::type, typename std::decay<Value>::type>(std::forward<Key>(key),
|
|
|
|
std::forward<Value>(value));
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
template <class Key, class Value, class CompatibleWithKey>
|
2021-03-11 02:06:03 +08:00
|
|
|
bool operator<(MapPair<Key, Value> const& l, CompatibleWithKey const& r) {
|
|
|
|
return l.key < r;
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
template <class Key, class Value, class CompatibleWithKey>
|
2021-03-11 02:06:03 +08:00
|
|
|
bool operator<(CompatibleWithKey const& l, MapPair<Key, Value> const& r) {
|
|
|
|
return l < r.key;
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
template <class Key, class Value, class Pair = MapPair<Key, Value>, class Metric = NoMetric>
|
2017-05-26 04:48:44 +08:00
|
|
|
class Map {
|
|
|
|
public:
|
2021-03-11 02:06:03 +08:00
|
|
|
typedef typename IndexedSet<Pair, Metric>::iterator iterator;
|
2020-05-17 01:34:36 +08:00
|
|
|
typedef typename IndexedSet<Pair, Metric>::const_iterator const_iterator;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
Map() {}
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator begin() const { return set.begin(); }
|
|
|
|
iterator begin() { return set.begin(); }
|
2020-05-17 09:01:07 +08:00
|
|
|
const_iterator cbegin() const { return begin(); }
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator end() const { return set.end(); }
|
|
|
|
iterator end() { return set.end(); }
|
2020-05-17 09:01:07 +08:00
|
|
|
const_iterator cend() const { return end(); }
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator lastItem() const { return set.lastItem(); }
|
|
|
|
iterator lastItem() { return set.lastItem(); }
|
|
|
|
const_iterator previous(const_iterator i) const { return set.previous(i); }
|
|
|
|
iterator previous(iterator i) { return set.previous(i); }
|
2017-05-26 04:48:44 +08:00
|
|
|
bool empty() const { return set.empty(); }
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Value& operator[](const Key& key) {
|
|
|
|
iterator i = set.insert(Pair(key, Value()), Metric(1), false);
|
2017-05-26 04:48:44 +08:00
|
|
|
return i->value;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Value& get(const Key& key, Metric m = Metric(1)) {
|
|
|
|
iterator i = set.insert(Pair(key, Value()), m, false);
|
2017-05-26 04:48:44 +08:00
|
|
|
return i->value;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
iterator insert(const Pair& p, bool replaceExisting = true, Metric m = Metric(1)) {
|
|
|
|
return set.insert(p, m, replaceExisting);
|
|
|
|
}
|
|
|
|
iterator insert(Pair&& p, bool replaceExisting = true, Metric m = Metric(1)) {
|
|
|
|
return set.insert(std::move(p), m, replaceExisting);
|
|
|
|
}
|
|
|
|
int insert(const std::vector<std::pair<MapPair<Key, Value>, Metric>>& pairs, bool replaceExisting = true) {
|
|
|
|
return set.insert(pairs, replaceExisting);
|
|
|
|
}
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class KeyCompatible>
|
2021-03-11 02:06:03 +08:00
|
|
|
void erase(KeyCompatible const& k) {
|
|
|
|
set.erase(k);
|
|
|
|
}
|
|
|
|
void erase(iterator b, iterator e) { set.erase(b, e); }
|
|
|
|
void erase(iterator x) { set.erase(x); }
|
2017-05-26 04:48:44 +08:00
|
|
|
void clear() { set.clear(); }
|
|
|
|
Metric size() const {
|
|
|
|
static_assert(!std::is_same<Metric, NoMetric>::value, "size() on Map with NoMetric is not valid!");
|
|
|
|
return sumTo(end());
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class KeyCompatible>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator find(KeyCompatible const& k) const {
|
|
|
|
return set.find(k);
|
|
|
|
}
|
|
|
|
template <class KeyCompatible>
|
|
|
|
iterator find(KeyCompatible const& k) {
|
|
|
|
return set.find(k);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class KeyCompatible>
|
|
|
|
const_iterator lower_bound(KeyCompatible const& k) const {
|
|
|
|
return set.lower_bound(k);
|
|
|
|
}
|
|
|
|
template <class KeyCompatible>
|
|
|
|
iterator lower_bound(KeyCompatible const& k) {
|
|
|
|
return set.lower_bound(k);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class KeyCompatible>
|
|
|
|
const_iterator upper_bound(KeyCompatible const& k) const {
|
|
|
|
return set.upper_bound(k);
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class KeyCompatible>
|
2020-05-17 01:34:36 +08:00
|
|
|
iterator upper_bound(KeyCompatible const& k) {
|
|
|
|
return set.upper_bound(k);
|
|
|
|
}
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class KeyCompatible>
|
2020-05-17 01:34:36 +08:00
|
|
|
const_iterator lastLessOrEqual(KeyCompatible const& k) const {
|
|
|
|
return set.lastLessOrEqual(k);
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class KeyCompatible>
|
2020-05-17 01:34:36 +08:00
|
|
|
iterator lastLessOrEqual(KeyCompatible const& k) {
|
|
|
|
return set.lastLessOrEqual(k);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class M>
|
|
|
|
const_iterator index(M const& metric) const {
|
|
|
|
return set.index(metric);
|
|
|
|
}
|
|
|
|
template <class M>
|
|
|
|
iterator index(M const& metric) {
|
|
|
|
return set.index(metric);
|
|
|
|
}
|
|
|
|
|
|
|
|
Metric getMetric(const_iterator x) const { return set.getMetric(x); }
|
|
|
|
Metric getMetric(iterator x) const { return getMetric(const_iterator{ x }); }
|
|
|
|
|
|
|
|
Metric sumTo(const_iterator to) const { return set.sumTo(to); }
|
|
|
|
Metric sumTo(iterator to) const { return sumTo(const_iterator{ to }); }
|
|
|
|
|
|
|
|
Metric sumRange(const_iterator begin, const_iterator end) const { return set.sumRange(begin, end); }
|
|
|
|
Metric sumRange(iterator begin, iterator end) const { return set.sumRange(begin, end); }
|
2021-03-11 02:06:03 +08:00
|
|
|
template <class KeyCompatible>
|
|
|
|
Metric sumRange(const KeyCompatible& begin, const KeyCompatible& end) const {
|
|
|
|
return set.sumRange(begin, end);
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
static int getElementBytes() { return IndexedSet<Pair, Metric>::getElementBytes(); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-06-10 08:33:41 +08:00
|
|
|
Map(Map&& r) noexcept : set(std::move(r.set)) {}
|
|
|
|
void operator=(Map&& r) noexcept { set = std::move(r.set); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-10-01 03:22:23 +08:00
|
|
|
Future<Void> clearAsync();
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
private:
|
2021-03-11 02:06:03 +08:00
|
|
|
Map(Map<Key, Value, Pair> const&); // unimplemented
|
|
|
|
void operator=(Map<Key, Value, Pair> const&); // unimplemented
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<Pair, Metric> set;
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/////////////////////// implementation //////////////////////////
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
|
|
|
void IndexedSet<T, Metric>::IteratorImpl<isConst>::operator++() {
|
2020-05-17 05:25:13 +08:00
|
|
|
moveIterator<1>(node);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
|
|
|
void IndexedSet<T, Metric>::IteratorImpl<isConst>::decrementNonEnd() {
|
2020-05-17 05:25:13 +08:00
|
|
|
moveIterator<0>(node);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Rotates the subtree referenced by oldRootRef in direction d.
//
// The child on side (1 - d) of the current subtree root is promoted to subtree root and the
// old root becomes its child on side d. The promoted node's former side-d subtree is handed
// to the old root on side (1 - d). Subtree metric totals and parent links are updated, and
// oldRootRef is overwritten with the promoted node. Balance factors are NOT touched here.
//
// Requires oldRootRef and its child on side (1 - d) to be non-null.
template <class Node>
void ISRotate(Node*& oldRootRef, int d) {
    const int opposite = 1 - d;
    Node* const demoted = oldRootRef;
    Node* const promoted = demoted->child[opposite];
    Node* const transferred = promoted->child[d]; // subtree that changes owner; may be null

    // Metrics: the demoted node loses everything under the promoted node except the
    // transferred subtree, while the promoted node now spans the whole original subtree.
    auto demotedTotal = demoted->total - promoted->total;
    if (transferred)
        demotedTotal = demotedTotal + transferred->total;
    promoted->total = demoted->total;
    demoted->total = demotedTotal;

    // Pointers: re-hang the transferred subtree, then swap the two nodes' roles.
    demoted->child[opposite] = transferred;
    if (transferred)
        transferred->parent = demoted;
    promoted->child[d] = demoted;
    promoted->parent = demoted->parent;
    demoted->parent = promoted;
    oldRootRef = promoted;
}
|
|
|
|
|
|
|
|
// Rewrites the balance factors of three nodes: root, its child on side d, and that child's
// child on side (1 - d). The new values depend only on the grandchild's current balance:
//   grandchild balance == 0    -> root = 0,    child = 0
//   grandchild balance == bal  -> root = -bal, child = 0
//   anything else              -> root = 0,    child = bal
// The grandchild's balance is always reset to 0. No pointers or totals are modified.
//
// Requires root->child[d] and its child on side (1 - d) to be non-null.
template <class Node>
void ISAdjustBalance(Node* root, int d, int bal) {
    Node* const child = root->child[d];
    Node* const grandchild = child->child[1 - d];

    int rootBalance = 0;
    int childBalance = 0;
    if (grandchild->balance) {
        if (grandchild->balance == bal)
            rootBalance = -bal;
        else
            childBalance = bal;
    }

    child->balance = childBalance;
    root->balance = rootBalance;
    grandchild->balance = 0;
}
|
|
|
|
|
|
|
|
template <class Node>
|
2021-03-11 02:06:03 +08:00
|
|
|
int ISRebalance(Node*& root) {
|
|
|
|
// Pre: root is a tree having the BST, metric, and balance invariants but not (necessarily) the AVL invariant.
//      root->child[0] and root->child[1] are AVL.
// Post: root is an AVL tree with the same nodes.
// Returns: the change in height of root.
// rebalance is O(1) if abs(root->balance)<=2, and probably O(log N) otherwise. (The rare "still
// unbalanced" recursion is hard to analyze)
|
2017-05-26 04:48:44 +08:00
|
|
|
//
|
|
|
|
// The documentation of this function will be referencing the following tree (where
|
2021-03-11 02:06:03 +08:00
|
|
|
// nodes A, C, E, and G represent subtrees of unspecified height). Thus for each node X,
|
2017-05-26 04:48:44 +08:00
|
|
|
// we know the value of balance(X), but not height(X).
|
|
|
|
//
|
|
|
|
// We will assume that balance(F) < 0 (so we will be rotating right).
|
|
|
|
// Trees that rotate to the left will perform analogous operations.
|
2021-03-11 02:06:03 +08:00
|
|
|
//
|
2017-05-26 04:48:44 +08:00
|
|
|
// F
|
|
|
|
// / \
|
|
|
|
// B G
|
|
|
|
// / \
|
2021-03-11 02:06:03 +08:00
|
|
|
// A D
|
2017-05-26 04:48:44 +08:00
|
|
|
// / \
|
|
|
|
// C E
|
|
|
|
|
|
|
|
if (!root || (root->balance >= -1 && root->balance <= +1))
|
|
|
|
return 0;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
int rebalanceDir = root->balance < 0; // 1 if rotating right, 0 if rotating left
|
|
|
|
auto* n = root->child[1 - rebalanceDir]; // Node B
|
2017-05-26 04:48:44 +08:00
|
|
|
int bal = rebalanceDir ? +1 : -1; // 1 if rotating right, -1 if rotating left
|
|
|
|
int rootBal = root->balance;
|
|
|
|
|
|
|
|
// Depending on the balance at B, we will be required to do one or two rotations.
|
|
|
|
// If balance(B) <= 0, then we do only one rotation (the second of the two).
|
|
|
|
//
|
|
|
|
// In a tree where balance(B) == +1, we are required to do both rotations.
|
|
|
|
// The result of the first rotation will be:
|
|
|
|
//
|
|
|
|
// F
|
|
|
|
// / \
|
|
|
|
// D G
|
|
|
|
// / \
|
2021-03-11 02:06:03 +08:00
|
|
|
// B E
|
2017-05-26 04:48:44 +08:00
|
|
|
// / \
|
|
|
|
// A C
|
|
|
|
//
|
|
|
|
bool doubleRotation = n->balance == bal;
|
|
|
|
if (doubleRotation) {
|
|
|
|
int x = n->child[rebalanceDir]->balance; // balance of Node D
|
2021-03-11 02:06:03 +08:00
|
|
|
ISRotate(root->child[1 - rebalanceDir], 1 - rebalanceDir); // Rotate at Node B
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Change node pointed to by 'n' to prepare for the second rotation
|
|
|
|
// After this first rotation, Node D will be the left child of the root
|
2021-03-11 02:06:03 +08:00
|
|
|
n = root->child[1 - rebalanceDir];
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Compute the balance at the new root node D' of our rotation
|
|
|
|
// We know that height(A) == max(height(C), height(E)) because B had balance of +1
|
|
|
|
// If height(E) >= height(C), then height(E) == height(A) and balance(D') = -1
|
|
|
|
// Otherwise height(C) == height(E) + 1, and therefore balance(D') = -2
|
2021-03-11 02:06:03 +08:00
|
|
|
n->balance = ((x == -bal) ? -2 : -1) * bal;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Compute the balance at the old root node B' of our rotation
|
|
|
|
// As stated above, height(A) == max(height(C), height(E))
|
|
|
|
// If height(C) >= height(E), then height(A) == height(C) and balance(B') = 0
|
|
|
|
// Otherwise height(A) == height(E) == height(C) + 1, and therefore balance(B') = -1
|
2021-03-11 02:06:03 +08:00
|
|
|
n->child[1 - rebalanceDir]->balance = ((x == bal) ? -1 : 0) * bal;
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// At this point, we perform the "second" rotation (which may actually be the first
|
|
|
|
// if the "first" rotation was not performed). The rotation that is performed is the
|
|
|
|
// same for both trees, but the result will be different depending on which tree we
|
|
|
|
// started with:
|
|
|
|
//
|
|
|
|
// If unrotated: If once rotated:
|
|
|
|
//
|
|
|
|
// B D
|
|
|
|
// / \ / \
|
|
|
|
// A F B F
|
|
|
|
// / \ / \ / \
|
|
|
|
// D G A C E G
|
|
|
|
// / \
|
|
|
|
// C E
|
|
|
|
//
|
|
|
|
// The documentation for this second rotation will be based on the unrotated original tree.
|
|
|
|
|
|
|
|
// Compute the balance at the new root node B'.
|
|
|
|
// balance(B') = 1 + max(height(D), height(G)) - height(A) = 1 + max(height(D) - height(A), height(G) - height(A))
|
|
|
|
// balance(B') = 1 + max(balance(B), height(G) - height(A))
|
|
|
|
//
|
|
|
|
// Now, we must find height(G) - height(A):
|
|
|
|
// If height(A) >= height(D) (i.e. balance(B) <= 0), then
|
|
|
|
// height(G) - height(A) = height(G) - height(B) + 1 = balance(F) + 1
|
|
|
|
//
|
|
|
|
// Otherwise, height(A) = height(D) - balance(B) = height(B) - 1 - balance(B), so
|
2021-03-11 02:06:03 +08:00
|
|
|
// height(G) - height(A) = height(G) - height(B) + 1 + balance(B) = balance(F) + 1 + balance(B)
|
2017-05-26 04:48:44 +08:00
|
|
|
//
|
|
|
|
// balance(B') = 1 + max(balance(B), balance(F) + 1 + max(balance(B), 0))
|
|
|
|
//
|
|
|
|
int nBal = n->balance * bal; // Direction corrected balance at Node B
|
|
|
|
int newRootBalance = bal * (1 + std::max(nBal, bal * root->balance + 1 + std::max(nBal, 0)));
|
|
|
|
|
|
|
|
// Compute the balance at the old root node F' (which becomes a child of the new root).
|
|
|
|
// balance(F') = height(G) - height(D)
|
|
|
|
//
|
|
|
|
// If height(D) >= height(A) (i.e. balance(B) >= 0), then height(D) = height(B) - 1, so
|
|
|
|
// balance(F') = height(G) - height(B) + 1 = balance(F) + 1
|
|
|
|
//
|
2021-03-11 02:06:03 +08:00
|
|
|
// Otherwise, height(D) = height(A) + balance(B) = height(B) - 1 + balance(B), so
|
|
|
|
// balance(F') = height(G) - height(B) + 1 - balance(B) = balance(F) + 1 - balance(B)
|
2017-05-26 04:48:44 +08:00
|
|
|
//
|
|
|
|
// balance(F') = balance(F) + 1 - min(balance(B), 0)
|
|
|
|
//
|
|
|
|
int newChildBalance = root->balance + bal * (1 - std::min(nBal, 0));
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ISRotate(root, rebalanceDir);
|
2017-05-26 04:48:44 +08:00
|
|
|
root->balance = newRootBalance;
|
|
|
|
root->child[rebalanceDir]->balance = newChildBalance;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// If the original tree is very unbalanced, the unbalance may have been "pushed" down into this subtree, so
|
|
|
|
// recursively rebalance that if necessary.
|
2017-05-26 04:48:44 +08:00
|
|
|
int childHeightChange = ISRebalance(root->child[rebalanceDir]);
|
|
|
|
root->balance += childHeightChange * bal;
|
|
|
|
|
|
|
|
newRootBalance *= bal;
|
|
|
|
|
|
|
|
// Compute the change in height at the root
|
|
|
|
// We will look at the single and double rotation cases separately
|
|
|
|
//
|
|
|
|
// If we did a single rotation, then height(A) >= height(D).
|
|
|
|
// As a result, height(A) >= height(G) + 1; otherwise the tree would be balanced and we wouldn't do any rotations.
|
2021-03-11 02:06:03 +08:00
|
|
|
//
|
|
|
|
// Then the original height of the tree is height(A) + 2,
|
2017-05-26 04:48:44 +08:00
|
|
|
// and the new height is max(height(D) + 2 + childHeightChange, height(A) + 1), so
|
|
|
|
//
|
|
|
|
// heightChange_single = max(height(D) + 2 + childHeightChange, height(A) + 1) - (height(A) + 2)
|
|
|
|
// heightChange_single = max(height(D) - height(A) + childHeightChange, -1)
|
|
|
|
// heightChange_single = max(balance(B) + childHeightChange, -1)
|
|
|
|
//
|
|
|
|
// If we did a double rotation, then height(D) = height(A) + 1 in the original tree.
|
|
|
|
// As a result, height(D) >= height(G) + 1; otherwise the tree would be balanced and we wouldn't do any rotations.
|
|
|
|
//
|
|
|
|
// Then the original height of the tree is height(D) + 2,
|
|
|
|
// and the new height is max(height(A), height(C), height(E), height(G)) + 2
|
|
|
|
//
|
|
|
|
// balance(B) == 1, so height(A) == max(height(C), height(E)).
|
|
|
|
// Also, height(A) = height(D) - 1 >= height(G)
|
|
|
|
// Therefore the new height is height(A) + 2
|
|
|
|
//
|
|
|
|
// heightChange_double = height(A) + 2 - (height(D) + 2)
|
|
|
|
// heightChange_double = height(A) - height(D)
|
|
|
|
// heightChange_double = -1
|
|
|
|
//
|
|
|
|
int heightChange = doubleRotation ? -1 : std::max(nBal + childHeightChange, -1);
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// If the root is still unbalanced, then it should at least be more balanced than before. Recursively rebalance the
|
|
|
|
// root until we get a balanced tree.
|
|
|
|
if (root->balance < -1 || root->balance > +1) {
|
2017-05-26 04:48:44 +08:00
|
|
|
ASSERT(abs(root->balance) < abs(rootBal));
|
|
|
|
heightChange += ISRebalance(root);
|
|
|
|
}
|
|
|
|
|
|
|
|
return heightChange;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class Node>
Node* ISCommonSubtreeRoot(Node* first, Node* last) {
	// Returns the root of the smallest subtree that contains both first and last, found by following
	// parent pointers only. Yields nullptr when the two parent chains never meet.

	// depthGap = depth(first) - depth(last), where depth counts the nodes on the path up to the root
	int depthGap = 0;
	for (Node* walker = first; walker; walker = walker->parent)
		++depthGap;
	for (Node* walker = last; walker; walker = walker->parent)
		--depthGap;

	// Lift whichever node is deeper until both sit at the same depth
	Node* lhs = first;
	Node* rhs = last;
	for (; depthGap > 0; --depthGap)
		lhs = lhs->parent;
	for (; depthGap < 0; ++depthGap)
		rhs = rhs->parent;

	// Climb in lock step; the first node at which the two paths coincide is the answer
	while (lhs != rhs) {
		lhs = lhs->parent;
		rhs = rhs->parent;
	}

	return lhs;
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::begin(
|
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self) {
|
|
|
|
NodeT* x = self.root;
|
2021-03-11 02:06:03 +08:00
|
|
|
while (x && x->child[0])
|
|
|
|
x = x->child[0];
|
2020-05-17 03:53:36 +08:00
|
|
|
return IteratorT{ x };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2020-05-17 01:34:36 +08:00
|
|
|
template <class T, class Metric>
|
|
|
|
template <bool isConst>
|
|
|
|
template <bool constIterator>
|
|
|
|
typename IndexedSet<T, Metric>::template IteratorImpl<isConst || constIterator>
|
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::previous(IndexedSet<T, Metric>::Impl<isConst>::SetT& self,
|
|
|
|
IndexedSet<T, Metric>::IteratorImpl<constIterator> iter) {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (iter == self.end())
|
|
|
|
return self.lastItem();
|
2020-05-17 01:34:36 +08:00
|
|
|
|
2020-05-17 05:25:13 +08:00
|
|
|
moveIterator<0>(iter.node);
|
2020-05-17 01:34:36 +08:00
|
|
|
return iter;
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::lastItem(
|
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self) {
|
|
|
|
NodeT* x = self.root;
|
2021-03-11 02:06:03 +08:00
|
|
|
while (x && x->child[1])
|
|
|
|
x = x->child[1];
|
2020-05-17 03:53:36 +08:00
|
|
|
return IteratorT{ x };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
template <class T, class Metric>
|
|
|
|
template <class T_, class Metric_>
|
|
|
|
Metric IndexedSet<T, Metric>::addMetric(T_&& data, Metric_&& metric) {
|
|
|
|
auto i = find(data);
|
2017-05-26 04:48:44 +08:00
|
|
|
if (i == end()) {
|
2021-03-11 02:06:03 +08:00
|
|
|
insert(std::forward<T_>(data), std::forward<Metric_>(metric));
|
2017-05-26 04:48:44 +08:00
|
|
|
return metric;
|
|
|
|
} else {
|
|
|
|
Metric m = metric + getMetric(i);
|
2021-03-11 02:06:03 +08:00
|
|
|
insert(std::forward<T_>(data), m);
|
2017-05-26 04:48:44 +08:00
|
|
|
return m;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
template <class T, class Metric>
|
|
|
|
template <class T_, class Metric_>
|
|
|
|
typename IndexedSet<T, Metric>::iterator IndexedSet<T, Metric>::insert(T_&& data,
|
|
|
|
Metric_&& metric,
|
|
|
|
bool replaceExisting) {
|
2020-05-17 03:53:36 +08:00
|
|
|
if (root == nullptr) {
|
2017-10-04 11:07:29 +08:00
|
|
|
root = new Node(std::forward<T_>(data), std::forward<Metric_>(metric));
|
2020-05-17 03:53:36 +08:00
|
|
|
return iterator{ root };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* t = root;
|
2017-05-26 04:48:44 +08:00
|
|
|
int d; // direction
|
|
|
|
// traverse to find insert point
|
2021-03-11 02:06:03 +08:00
|
|
|
while (true) {
|
2020-04-04 02:18:06 +08:00
|
|
|
int cmp = compare(data, t->data);
|
|
|
|
if (cmp == 0) {
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* returnNode = t;
|
|
|
|
if (replaceExisting) {
|
2017-10-12 08:35:10 +08:00
|
|
|
t->data = std::forward<T_>(data);
|
2017-05-26 04:48:44 +08:00
|
|
|
Metric delta = t->total;
|
2017-10-12 08:40:48 +08:00
|
|
|
t->total = std::forward<Metric_>(metric);
|
2021-03-11 02:06:03 +08:00
|
|
|
if (t->child[0])
|
|
|
|
t->total = t->total + t->child[0]->total;
|
|
|
|
if (t->child[1])
|
|
|
|
t->total = t->total + t->child[1]->total;
|
2017-05-26 04:48:44 +08:00
|
|
|
delta = t->total - delta;
|
|
|
|
while (true) {
|
|
|
|
t = t->parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t->total = t->total + delta;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-05-17 03:53:36 +08:00
|
|
|
return iterator{ returnNode };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2020-04-04 02:18:06 +08:00
|
|
|
d = cmp > 0;
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* nextT = t->child[d];
|
|
|
|
if (!nextT)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t = nextT;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* newNode = new Node(std::forward<T_>(data), std::forward<Metric_>(metric), t);
|
2017-05-26 04:48:44 +08:00
|
|
|
t->child[d] = newNode;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
while (true) {
|
2017-05-26 04:48:44 +08:00
|
|
|
t->balance += d ? 1 : -1;
|
|
|
|
t->total = t->total + metric;
|
|
|
|
if (t->balance == 0)
|
|
|
|
break;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (t->balance != 1 && t->balance != -1) {
|
|
|
|
Node** parent = t->parent ? &t->parent->child[t->parent->child[1] == t] : &root;
|
|
|
|
// assert( *parent == t );
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* n = t->child[d];
|
2017-05-26 04:48:44 +08:00
|
|
|
int bal = d ? 1 : -1;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (n->balance == bal) {
|
2017-05-26 04:48:44 +08:00
|
|
|
t->balance = n->balance = 0;
|
|
|
|
} else {
|
|
|
|
ISAdjustBalance(t, d, bal);
|
|
|
|
ISRotate(t->child[d], d);
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
ISRotate(*parent, 1 - d);
|
2017-05-26 04:48:44 +08:00
|
|
|
t = *parent;
|
|
|
|
break;
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t->parent)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
d = t->parent->child[1] == t;
|
|
|
|
t = t->parent;
|
|
|
|
}
|
|
|
|
while (true) {
|
|
|
|
t = t->parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t->total = t->total + metric;
|
|
|
|
}
|
|
|
|
|
2020-05-17 03:53:36 +08:00
|
|
|
return iterator{ newNode };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
int IndexedSet<T, Metric>::insert(const std::vector<std::pair<T, Metric>>& dataVector, bool replaceExisting) {
|
2017-05-26 04:48:44 +08:00
|
|
|
int num_inserted = 0;
|
2020-05-17 06:00:15 +08:00
|
|
|
Node* blockStart = nullptr;
|
|
|
|
Node* blockEnd = nullptr;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
for (int i = 0; i < dataVector.size(); ++i) {
|
2017-05-26 04:48:44 +08:00
|
|
|
Metric metric = dataVector[i].second;
|
|
|
|
T data = std::move(dataVector[i].first);
|
|
|
|
|
|
|
|
int d = 1; // direction
|
2020-05-17 06:00:15 +08:00
|
|
|
if (blockStart == nullptr || (blockEnd != nullptr && data >= blockEnd->data)) {
|
|
|
|
blockEnd = nullptr;
|
|
|
|
if (root == nullptr) {
|
2017-05-26 04:48:44 +08:00
|
|
|
root = new Node(std::move(data), metric);
|
|
|
|
num_inserted++;
|
|
|
|
blockStart = root;
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* t = root;
|
2017-05-26 04:48:44 +08:00
|
|
|
// traverse to find insert point
|
|
|
|
bool foundNode = false;
|
2020-04-04 02:18:06 +08:00
|
|
|
while (true) {
|
|
|
|
int cmp = compare(data, t->data);
|
2020-05-08 06:50:40 +08:00
|
|
|
d = cmp > 0;
|
2020-05-08 08:22:04 +08:00
|
|
|
if (d == 0)
|
2017-05-26 04:48:44 +08:00
|
|
|
blockEnd = t;
|
2020-04-04 02:18:06 +08:00
|
|
|
if (cmp == 0) {
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* returnNode = t;
|
|
|
|
if (replaceExisting) {
|
2017-05-26 04:48:44 +08:00
|
|
|
num_inserted++;
|
|
|
|
t->data = std::move(data);
|
|
|
|
Metric delta = t->total;
|
|
|
|
t->total = metric;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (t->child[0])
|
|
|
|
t->total = t->total + t->child[0]->total;
|
|
|
|
if (t->child[1])
|
|
|
|
t->total = t->total + t->child[1]->total;
|
2017-05-26 04:48:44 +08:00
|
|
|
delta = t->total - delta;
|
|
|
|
while (true) {
|
|
|
|
t = t->parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t->total = t->total + delta;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
blockStart = returnNode;
|
|
|
|
foundNode = true;
|
|
|
|
break;
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* nextT = t->child[d];
|
|
|
|
if (!nextT) {
|
2017-05-26 04:48:44 +08:00
|
|
|
blockStart = t;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
t = nextT;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (foundNode)
|
2017-05-26 04:48:44 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* t = blockStart;
|
|
|
|
while (t->child[d]) {
|
2017-05-26 04:48:44 +08:00
|
|
|
t = t->child[d];
|
|
|
|
d = 0;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* newNode = new Node(std::move(data), metric, t);
|
2017-05-26 04:48:44 +08:00
|
|
|
num_inserted++;
|
|
|
|
|
|
|
|
t->child[d] = newNode;
|
|
|
|
blockStart = newNode;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
while (true) {
|
2017-05-26 04:48:44 +08:00
|
|
|
t->balance += d ? 1 : -1;
|
|
|
|
t->total = t->total + metric;
|
|
|
|
if (t->balance == 0)
|
|
|
|
break;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (t->balance != 1 && t->balance != -1) {
|
|
|
|
Node** parent = t->parent ? &t->parent->child[t->parent->child[1] == t] : &root;
|
|
|
|
// assert( *parent == t );
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Node* n = t->child[d];
|
2017-05-26 04:48:44 +08:00
|
|
|
int bal = d ? 1 : -1;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (n->balance == bal) {
|
2017-05-26 04:48:44 +08:00
|
|
|
t->balance = n->balance = 0;
|
|
|
|
} else {
|
|
|
|
ISAdjustBalance(t, d, bal);
|
|
|
|
ISRotate(t->child[d], d);
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
ISRotate(*parent, 1 - d);
|
2017-05-26 04:48:44 +08:00
|
|
|
t = *parent;
|
|
|
|
break;
|
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t->parent)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
d = t->parent->child[1] == t;
|
|
|
|
t = t->parent;
|
|
|
|
}
|
|
|
|
while (true) {
|
|
|
|
t = t->parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t->total = t->total + metric;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return num_inserted;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
Metric IndexedSet<T, Metric>::eraseHalf(Node* start,
|
|
|
|
Node* end,
|
|
|
|
int eraseDir,
|
|
|
|
int& heightDelta,
|
2020-04-04 02:18:06 +08:00
|
|
|
std::vector<Node*>& toFree) {
|
2021-03-11 02:06:03 +08:00
|
|
|
// Removes all nodes between start (inclusive) and end (exclusive) from the set, where start is equal to end or one
|
|
|
|
// of its descendants eraseDir 1 means erase the right half (nodes > at) of the left subtree of end. eraseDir 0
|
|
|
|
// means the left half of the right subtree toFree is extended with the roots of completely removed subtrees
|
2017-05-26 04:48:44 +08:00
|
|
|
// heightDelta will be set to the change in height of the end node
|
2021-03-11 02:06:03 +08:00
|
|
|
// Returns the amount that should be subtracted from end node's metric value (and, by extension, the metric values
|
|
|
|
// of all ancestors of the end node).
|
2017-05-26 04:48:44 +08:00
|
|
|
//
|
|
|
|
// The end node may be left unbalanced (AVL invariant broken)
|
2021-03-11 02:06:03 +08:00
|
|
|
// The end node may be left with the incorrect metric total (the correct value is end->total = end->total +
|
|
|
|
// metricDelta) scare quotes in comments mean the values when eraseDir==1 (when eraseDir==0, "left" means right etc)
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// metricDelta measures how much should be subtracted from the current node's metrics
|
|
|
|
Metric metricDelta = 0;
|
|
|
|
heightDelta = 0;
|
|
|
|
|
|
|
|
int fromDir = 1 - eraseDir;
|
|
|
|
|
|
|
|
// Begin removing nodes at start continuing up until we get to end
|
2021-03-11 02:06:03 +08:00
|
|
|
while (start != end) {
|
2017-05-26 04:48:44 +08:00
|
|
|
start->total = start->total - metricDelta;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Node* parent = start->parent;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// Obtain the child pointer to start, which rebalance will update with the new root of the subtree currently
|
|
|
|
// rooted at start
|
|
|
|
IndexedSet<T, Metric>::Node*& node = parent->child[parent->child[1] == start];
|
2017-05-26 04:48:44 +08:00
|
|
|
int nextDir = parent->child[1] == start;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (fromDir == eraseDir) {
|
2017-05-26 04:48:44 +08:00
|
|
|
// The "right" subtree has been half-erased, and the "left" subtree doesn't need to be (nor does node).
|
|
|
|
// But this node might be unbalanced by the shrinking "right" subtree. Rebalance and continue up.
|
2021-03-11 02:06:03 +08:00
|
|
|
heightDelta += ISRebalance(node);
|
2017-05-26 04:48:44 +08:00
|
|
|
} else {
|
|
|
|
// The "left" subtree has been half-erased. `start' and its "right" subtree will be completely erased,
|
|
|
|
// leaving only the "left" subtree in its place (which is already AVL balanced).
|
|
|
|
heightDelta += -1 - std::max<int>(0, node->balance * (eraseDir ? +1 : -1));
|
|
|
|
metricDelta = metricDelta + start->total;
|
|
|
|
|
|
|
|
// If there is a surviving subtree of start, then connect it to start->parent
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Node* n = node->child[fromDir];
|
2017-05-26 04:48:44 +08:00
|
|
|
node = n; // This updates the appropriate child pointer of start->parent
|
|
|
|
if (n) {
|
|
|
|
metricDelta = metricDelta - n->total;
|
|
|
|
n->parent = start->parent;
|
|
|
|
}
|
2020-05-17 01:34:36 +08:00
|
|
|
|
|
|
|
start->child[fromDir] = nullptr;
|
2021-03-11 02:06:03 +08:00
|
|
|
toFree.push_back(start);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
int dir = (nextDir ? +1 : -1);
|
|
|
|
int oldBalance = parent->balance;
|
|
|
|
|
|
|
|
// The change in height from removing nodes should never increase our height
|
|
|
|
ASSERT(heightDelta <= 0);
|
|
|
|
parent->balance += heightDelta * dir;
|
|
|
|
|
|
|
|
// Compute the change in height of start's parent based on its change in balance.
|
2021-03-11 02:06:03 +08:00
|
|
|
// Because we can only be (possibly) shrinking one subtree of parent:
|
|
|
|
// If we were originally heavier on the shrunken size (oldBalance * dir > 0), then the change in height is at
|
|
|
|
// most abs(oldBalance) == oldBalance * dir. If we were lighter on the shrunken side, then height cannot
|
|
|
|
// change.
|
2017-05-26 04:48:44 +08:00
|
|
|
int maxHeightChange = std::max(oldBalance * dir, 0);
|
|
|
|
int balanceChange = (oldBalance - parent->balance) * dir;
|
|
|
|
heightDelta = -std::min(maxHeightChange, balanceChange);
|
|
|
|
|
|
|
|
start = parent;
|
|
|
|
fromDir = nextDir;
|
|
|
|
}
|
|
|
|
|
|
|
|
return metricDelta;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
void IndexedSet<T, Metric>::erase(typename IndexedSet<T, Metric>::iterator begin,
|
|
|
|
typename IndexedSet<T, Metric>::iterator end,
|
|
|
|
std::vector<Node*>& toFree) {
|
2017-05-26 04:48:44 +08:00
|
|
|
// Removes all nodes in the set between first and last, inclusive.
|
|
|
|
// toFree is extended with the roots of completely removed subtrees.
|
|
|
|
|
2020-05-17 05:25:13 +08:00
|
|
|
ASSERT(!end.node || (begin.node && (::compare(*begin, *end) <= 0)));
|
2020-04-24 05:05:59 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (begin == end)
|
2017-05-26 04:48:44 +08:00
|
|
|
return;
|
2020-05-17 05:25:13 +08:00
|
|
|
|
|
|
|
IndexedSet<T, Metric>::Node* first = begin.node;
|
|
|
|
IndexedSet<T, Metric>::Node* last = previous(end).node;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Node* subRoot = ISCommonSubtreeRoot(first, last);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
Metric metricDelta = 0;
|
|
|
|
int leftHeightDelta = 0;
|
|
|
|
int rightHeightDelta = 0;
|
2021-03-11 02:06:03 +08:00
|
|
|
|
|
|
|
// Erase all matching nodes that descend from subRoot, by first erasing descendants of subRoot->child[0] and then
|
|
|
|
// erasing the descendants of subRoot->child[1] subRoot is not removed from the tree at this time
|
2020-04-04 02:18:06 +08:00
|
|
|
metricDelta = metricDelta + eraseHalf(first, subRoot, 1, leftHeightDelta, toFree);
|
|
|
|
metricDelta = metricDelta + eraseHalf(last, subRoot, 0, rightHeightDelta, toFree);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// Change in the height of subRoot due to past activity, before subRoot is rebalanced. subRoot->balance already
|
|
|
|
// reflects changes in height to its children.
|
|
|
|
int heightDelta = leftHeightDelta + rightHeightDelta;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// Rebalance and update metrics for all nodes from subRoot up to the root
|
2020-05-17 06:00:15 +08:00
|
|
|
for (auto p = subRoot; p != nullptr; p = p->parent) {
|
2017-05-26 04:48:44 +08:00
|
|
|
p->total = p->total - metricDelta;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
auto& pc = p->parent ? p->parent->child[p->parent->child[1] == p] : root;
|
2017-05-26 04:48:44 +08:00
|
|
|
heightDelta += ISRebalance(pc);
|
|
|
|
p = pc;
|
|
|
|
|
|
|
|
// Update the balance and compute heightDelta for p->parent
|
|
|
|
if (p->parent) {
|
|
|
|
int oldb = p->parent->balance;
|
2021-03-11 02:06:03 +08:00
|
|
|
int dir = (p->parent->child[1] == p ? +1 : -1);
|
2017-05-26 04:48:44 +08:00
|
|
|
p->parent->balance += heightDelta * dir;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
heightDelta = (std::max(p->parent->balance * dir, 0) - std::max(oldb * dir, 0));
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Erase the subRoot using the single node erase implementation
|
2021-03-11 02:06:03 +08:00
|
|
|
erase(IndexedSet<T, Metric>::iterator(subRoot));
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
void IndexedSet<T, Metric>::erase(iterator toErase) {
|
2017-05-26 04:48:44 +08:00
|
|
|
Node* rebalanceNode;
|
|
|
|
int rebalanceDir;
|
|
|
|
|
|
|
|
{
|
|
|
|
// Find the node to erase
|
2020-05-17 05:25:13 +08:00
|
|
|
Node* t = toErase.node;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
return;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
if (!t->child[0] || !t->child[1]) {
|
|
|
|
Metric tMetric = t->total;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (t->child[0])
|
|
|
|
tMetric = tMetric - t->child[0]->total;
|
|
|
|
if (t->child[1])
|
|
|
|
tMetric = tMetric - t->child[1]->total;
|
|
|
|
for (Node* p = t->parent; p; p = p->parent)
|
2017-05-26 04:48:44 +08:00
|
|
|
p->total = p->total - tMetric;
|
|
|
|
rebalanceNode = t->parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (rebalanceNode)
|
|
|
|
rebalanceDir = rebalanceNode->child[1] == t;
|
|
|
|
int d = !t->child[0]; // Only one child, on this side (or no children!)
|
2017-05-26 04:48:44 +08:00
|
|
|
replacePointer(t, t->child[d]);
|
|
|
|
t->child[d] = 0;
|
|
|
|
delete t;
|
2021-03-11 02:06:03 +08:00
|
|
|
} else { // Remove node with two children
|
2017-05-26 04:48:44 +08:00
|
|
|
Node* predecessor = t->child[0];
|
2021-03-11 02:06:03 +08:00
|
|
|
while (predecessor->child[1])
|
2017-05-26 04:48:44 +08:00
|
|
|
predecessor = predecessor->child[1];
|
|
|
|
rebalanceNode = predecessor->parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (rebalanceNode == t)
|
|
|
|
rebalanceNode = predecessor;
|
|
|
|
if (rebalanceNode)
|
|
|
|
rebalanceDir = rebalanceNode->child[1] == predecessor;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
Metric tMetric = t->total - t->child[0]->total - t->child[1]->total;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (predecessor->child[0])
|
|
|
|
predecessor->total = predecessor->total - predecessor->child[0]->total;
|
|
|
|
for (Node* p = predecessor->parent; p != t; p = p->parent)
|
2017-05-26 04:48:44 +08:00
|
|
|
p->total = p->total - predecessor->total;
|
2021-03-11 02:06:03 +08:00
|
|
|
for (Node* p = t->parent; p; p = p->parent)
|
2017-05-26 04:48:44 +08:00
|
|
|
p->total = p->total - tMetric;
|
|
|
|
|
|
|
|
// Replace t with predecessor
|
2021-03-11 02:06:03 +08:00
|
|
|
replacePointer(predecessor, predecessor->child[0]);
|
|
|
|
replacePointer(t, predecessor);
|
2017-05-26 04:48:44 +08:00
|
|
|
predecessor->balance = t->balance;
|
2021-03-11 02:06:03 +08:00
|
|
|
for (int i = 0; i < 2; i++) {
|
2017-05-26 04:48:44 +08:00
|
|
|
Node* c = predecessor->child[i] = t->child[i];
|
|
|
|
if (c) {
|
|
|
|
c->parent = predecessor;
|
|
|
|
predecessor->total = predecessor->total + c->total;
|
|
|
|
t->child[i] = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
delete t;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!rebalanceNode)
|
|
|
|
return;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
while (true) {
|
|
|
|
rebalanceNode->balance += rebalanceDir ? -1 : +1;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (rebalanceNode->balance < -1 || rebalanceNode->balance > +1) {
|
|
|
|
Node** parent = rebalanceNode->parent
|
|
|
|
? &rebalanceNode->parent->child[rebalanceNode->parent->child[1] == rebalanceNode]
|
|
|
|
: &root;
|
|
|
|
Node* n = rebalanceNode->child[1 - rebalanceDir];
|
2017-05-26 04:48:44 +08:00
|
|
|
int bal = rebalanceDir ? +1 : -1;
|
|
|
|
if (n->balance == -bal) {
|
|
|
|
rebalanceNode->balance = n->balance = 0;
|
2021-03-11 02:06:03 +08:00
|
|
|
ISRotate(*parent, rebalanceDir);
|
2017-05-26 04:48:44 +08:00
|
|
|
} else if (n->balance == bal) {
|
2021-03-11 02:06:03 +08:00
|
|
|
ISAdjustBalance(rebalanceNode, 1 - rebalanceDir, -bal);
|
|
|
|
ISRotate(rebalanceNode->child[1 - rebalanceDir], 1 - rebalanceDir);
|
|
|
|
ISRotate(*parent, rebalanceDir);
|
|
|
|
} else { // n->balance == 0
|
2017-05-26 04:48:44 +08:00
|
|
|
rebalanceNode->balance = -bal;
|
|
|
|
n->balance = bal;
|
2021-03-11 02:06:03 +08:00
|
|
|
ISRotate(*parent, rebalanceDir);
|
2017-05-26 04:48:44 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
rebalanceNode = *parent;
|
2021-03-11 02:06:03 +08:00
|
|
|
} else if (rebalanceNode->balance) // +/- 1, we are done
|
2017-05-26 04:48:44 +08:00
|
|
|
break;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!rebalanceNode->parent)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
rebalanceDir = rebalanceNode->parent->child[1] == rebalanceNode;
|
|
|
|
rebalanceNode = rebalanceNode->parent;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Returns x such that key==*x, or end()
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::find(
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self,
|
|
|
|
const Key& key) {
|
2020-05-17 01:34:36 +08:00
|
|
|
NodeT* t = self.root;
|
2021-03-11 02:06:03 +08:00
|
|
|
while (t) {
|
2020-04-04 02:18:06 +08:00
|
|
|
int cmp = compare(key, t->data);
|
2021-03-11 02:06:03 +08:00
|
|
|
if (cmp == 0)
|
|
|
|
return IteratorT{ t };
|
2020-04-04 02:18:06 +08:00
|
|
|
t = t->child[cmp > 0];
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2020-05-17 01:34:36 +08:00
|
|
|
return self.end();
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Returns the smallest x such that *x>=key, or end()
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::lower_bound(
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self,
|
|
|
|
const Key& key) {
|
2020-05-17 01:34:36 +08:00
|
|
|
NodeT* t = self.root;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
return self.end();
|
2020-03-31 07:13:37 +08:00
|
|
|
bool less;
|
2017-05-26 04:48:44 +08:00
|
|
|
while (true) {
|
2020-03-31 07:13:37 +08:00
|
|
|
less = t->data < key;
|
2020-05-17 01:34:36 +08:00
|
|
|
NodeT* n = t->child[less];
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!n)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t = n;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (less)
|
|
|
|
moveIterator<1>(t);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-05-17 03:53:36 +08:00
|
|
|
return IteratorT{ t };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Returns the smallest x such that *x>key, or end()
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::upper_bound(
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self,
|
|
|
|
const Key& key) {
|
2020-05-17 01:34:36 +08:00
|
|
|
NodeT* t = self.root;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!t)
|
|
|
|
return self.end();
|
2020-03-31 07:13:37 +08:00
|
|
|
bool not_less;
|
2017-05-26 04:48:44 +08:00
|
|
|
while (true) {
|
2020-03-31 07:13:37 +08:00
|
|
|
not_less = !(key < t->data);
|
2020-05-17 01:34:36 +08:00
|
|
|
NodeT* n = t->child[not_less];
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!n)
|
|
|
|
break;
|
2017-05-26 04:48:44 +08:00
|
|
|
t = n;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (not_less)
|
|
|
|
moveIterator<1>(t);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-05-17 03:53:36 +08:00
|
|
|
return IteratorT{ t };
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class Key>
|
2020-05-17 01:34:36 +08:00
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::lastLessOrEqual(
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self,
|
|
|
|
const Key& key) {
|
2020-05-17 01:34:36 +08:00
|
|
|
auto i = self.upper_bound(key);
|
2021-03-11 02:06:03 +08:00
|
|
|
if (i == self.begin())
|
|
|
|
return self.end();
|
2020-05-17 01:34:36 +08:00
|
|
|
return self.previous(i);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Returns first x such that metric < sum(begin(), x+1), or end()
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
template <bool isConst>
|
2017-05-26 04:48:44 +08:00
|
|
|
template <class M>
|
2020-05-17 01:34:36 +08:00
|
|
|
typename IndexedSet<T, Metric>::template Impl<isConst>::IteratorT IndexedSet<T, Metric>::Impl<isConst>::index(
|
2021-03-11 02:06:03 +08:00
|
|
|
IndexedSet<T, Metric>::Impl<isConst>::SetT& self,
|
|
|
|
const M& metric) {
|
2017-05-26 04:48:44 +08:00
|
|
|
M m = metric;
|
2020-05-17 01:34:36 +08:00
|
|
|
NodeT* t = self.root;
|
2017-05-26 04:48:44 +08:00
|
|
|
while (t) {
|
|
|
|
if (t->child[0] && m < t->child[0]->total)
|
|
|
|
t = t->child[0];
|
|
|
|
else {
|
|
|
|
m = m - t->total;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (t->child[1])
|
|
|
|
m = m + t->child[1]->total;
|
|
|
|
if (m < M())
|
|
|
|
return IteratorT{ t };
|
2017-05-26 04:48:44 +08:00
|
|
|
t = t->child[1];
|
|
|
|
}
|
|
|
|
}
|
2020-05-17 01:34:36 +08:00
|
|
|
return self.end();
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
Metric IndexedSet<T, Metric>::getMetric(typename IndexedSet<T, Metric>::const_iterator x) const {
|
2020-05-17 05:25:13 +08:00
|
|
|
Metric m = x.node->total;
|
2021-03-11 02:06:03 +08:00
|
|
|
for (int i = 0; i < 2; i++)
|
|
|
|
if (x.node->child[i])
|
|
|
|
m = m - x.node->child[i]->total;
|
2017-05-26 04:48:44 +08:00
|
|
|
return m;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2020-05-17 01:34:36 +08:00
|
|
|
Metric IndexedSet<T, Metric>::sumTo(typename IndexedSet<T, Metric>::const_iterator end) const {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!end.node)
|
|
|
|
return root ? root->total : Metric();
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-05-17 05:25:13 +08:00
|
|
|
Metric m = end.node->child[0] ? end.node->child[0]->total : Metric();
|
|
|
|
for (const Node* p = end.node; p->parent; p = p->parent) {
|
2017-05-26 04:48:44 +08:00
|
|
|
if (p->parent->child[1] == p) {
|
|
|
|
m = m - p->total;
|
|
|
|
m = m + p->parent->total;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return m;
|
|
|
|
}
|
|
|
|
|
2018-10-20 01:30:13 +08:00
|
|
|
#include "flow/flow.h"
|
|
|
|
#include "flow/IndexedSet.actor.h"
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
void IndexedSet<T, Metric>::erase(typename IndexedSet<T, Metric>::iterator begin,
|
|
|
|
typename IndexedSet<T, Metric>::iterator end) {
|
|
|
|
std::vector<IndexedSet<T, Metric>::Node*> toFree;
|
2017-05-26 04:48:44 +08:00
|
|
|
erase(begin, end, toFree);
|
|
|
|
|
|
|
|
ISFreeNodes(toFree, true);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
|
|
|
template <class Key>
|
2021-03-11 02:06:03 +08:00
|
|
|
Future<Void> IndexedSet<T, Metric>::eraseAsync(const Key& begin, const Key& end) {
|
|
|
|
return eraseAsync(lower_bound(begin), lower_bound(end));
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class T, class Metric>
|
2021-03-11 02:06:03 +08:00
|
|
|
Future<Void> IndexedSet<T, Metric>::eraseAsync(typename IndexedSet<T, Metric>::iterator begin,
|
|
|
|
typename IndexedSet<T, Metric>::iterator end) {
|
|
|
|
std::vector<IndexedSet<T, Metric>::Node*> toFree;
|
2017-05-26 04:48:44 +08:00
|
|
|
erase(begin, end, toFree);
|
|
|
|
|
|
|
|
return uncancellable(ISFreeNodes(toFree, false));
|
|
|
|
}
|
|
|
|
|
2020-10-01 03:22:23 +08:00
|
|
|
template <class Key, class Value, class Pair, class Metric>
|
|
|
|
Future<Void> Map<Key, Value, Pair, Metric>::clearAsync() {
|
|
|
|
return set.eraseAsync(set.begin(), set.end());
|
|
|
|
}
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
#endif
|