2016-08-14 20:45:47 +08:00
|
|
|
#pragma mark
|
|
|
|
|
|
|
|
#include <cstring>
|
|
|
|
#include <functional>
|
2016-08-19 18:28:10 +08:00
|
|
|
#include "data_structures/map/rh_common.hpp"
|
2016-08-09 23:44:39 +08:00
|
|
|
#include "utils/crtp.hpp"
|
2016-08-11 21:08:11 +08:00
|
|
|
#include "utils/likely.hpp"
|
2016-08-15 07:09:58 +08:00
|
|
|
#include "utils/option.hpp"
|
2016-08-09 23:44:39 +08:00
|
|
|
#include "utils/option_ptr.hpp"
|
|
|
|
|
|
|
|
// HashMultiMap with RobinHood collision resolution policy.
|
|
|
|
// Single threaded.
|
2016-08-11 03:02:54 +08:00
|
|
|
// Entries are POINTERS aligned to 8B.
|
2016-08-09 23:44:39 +08:00
|
|
|
// Entries must know their key.
|
|
|
|
// D must have method K& get_key()
|
|
|
|
// K must be comparable with ==.
|
|
|
|
// HashMap behaves as if it isn't the owner of the entries.
|
2016-09-19 06:22:36 +08:00
|
|
|
//
|
|
|
|
// Main idea of this MultiMap is a tweak of logic in RobinHood.
|
|
|
|
// RobinHood offset from preferred slot is equal to the number of slots between
|
|
|
|
// [current slot and preferred slot>.
|
|
|
|
// While in this flavour of "multi RobinHood" offset from preferred slot is equal
|
|
|
|
// to the number of differently keyed elements between its current slot and
|
|
|
|
// preferred slot.
|
|
|
|
// In the following examples slots will have keys as characters. So something
|
|
|
|
// like this: |a| will mean that in this slot there is data with key 'a'.
|
|
|
|
// like this: | | will mean empty slot.
|
|
|
|
// like this: |...| will mean arbitrary number of slots.
|
|
|
|
// like this: |b:a| will mean that a wants to be in this slot but b is in it.
|
|
|
|
//
|
|
|
|
// Examples:
|
|
|
|
// |...|a:a|...| => off(a) = 0
|
|
|
|
// |...|a:a|a|...|a|...| => off(a) = 0
|
|
|
|
// |...|b:a|a|...| => off(a) = 1
|
|
|
|
// |...|b:a|b|...|b|a|...| => off(a) = 1
|
|
|
|
// |...|c:a|b|a|...| => off(a) = 2
|
|
|
|
// |...|c:a|c|...|c|b|...|b|a|...|a|...| => off(a) = 2
|
|
|
|
// ...
|
2016-08-09 23:44:39 +08:00
|
|
|
template <class K, class D, size_t init_size_pow2 = 2>
|
2016-08-11 21:08:11 +08:00
|
|
|
class RhHashMultiMap : public RhBase<K, D, init_size_pow2>
|
2016-08-09 23:44:39 +08:00
|
|
|
{
|
2016-08-11 21:08:11 +08:00
|
|
|
typedef RhBase<K, D, init_size_pow2> base;
|
|
|
|
using base::array;
|
|
|
|
using base::index;
|
|
|
|
using base::capacity;
|
|
|
|
using base::count;
|
|
|
|
using typename base::Combined;
|
|
|
|
using base::before_index;
|
|
|
|
using base::create_it;
|
2016-08-09 23:44:39 +08:00
|
|
|
|
|
|
|
void increase_size()
|
|
|
|
{
|
|
|
|
size_t old_size = capacity;
|
|
|
|
auto a = array;
|
2016-08-11 21:08:11 +08:00
|
|
|
if (base::increase_size()) {
|
|
|
|
for (int i = 0; i < old_size; i++) {
|
|
|
|
if (a[i].valid()) {
|
|
|
|
add(a[i].ptr());
|
|
|
|
}
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
free(a);
|
|
|
|
}
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
public:
|
|
|
|
using base::RhBase;
|
|
|
|
using base::end;
|
|
|
|
using typename base::ConstIterator;
|
|
|
|
using typename base::Iterator;
|
|
|
|
|
2016-08-15 07:09:58 +08:00
|
|
|
bool contains(const K &key) const { return find_index(key).is_present(); }
|
2016-08-10 03:29:03 +08:00
|
|
|
|
2016-08-11 03:02:54 +08:00
|
|
|
Iterator find(const K &key_in)
|
2016-08-15 07:09:58 +08:00
|
|
|
{
|
|
|
|
auto index = find_index(key_in);
|
|
|
|
if (index) {
|
|
|
|
return create_it(index.get());
|
|
|
|
} else {
|
|
|
|
return end();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
ConstIterator find(const K &key_in) const
|
|
|
|
{
|
|
|
|
auto index = find_index(key_in);
|
|
|
|
if (index) {
|
|
|
|
return create_it(index.get());
|
|
|
|
} else {
|
|
|
|
return end();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
Option<size_t> find_index(const K &key_in) const
|
2016-08-09 23:44:39 +08:00
|
|
|
{
|
2016-08-11 03:02:54 +08:00
|
|
|
if (count > 0) {
|
|
|
|
auto key = std::ref(key_in);
|
|
|
|
size_t mask = this->mask();
|
|
|
|
size_t now = index(key, mask);
|
|
|
|
size_t off = 0;
|
|
|
|
size_t border = 8 <= capacity ? 8 : capacity;
|
2016-08-09 23:44:39 +08:00
|
|
|
Combined other = array[now];
|
2016-08-11 03:02:54 +08:00
|
|
|
while (other.valid() && off < border) {
|
2016-08-09 23:44:39 +08:00
|
|
|
auto other_off = other.off();
|
2016-08-11 03:02:54 +08:00
|
|
|
if (other_off == off && key == other.ptr()->get_key()) {
|
2016-08-15 07:09:58 +08:00
|
|
|
return Option<size_t>(now);
|
2016-08-09 23:44:39 +08:00
|
|
|
|
|
|
|
} else if (other_off < off) { // Other is rich
|
|
|
|
break;
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
} else { // Else other has equal or greater off, so he is poor.
|
|
|
|
if (UNLIKELY(skip(now, other, other_off, mask))) {
|
|
|
|
break;
|
|
|
|
}
|
2016-08-09 23:44:39 +08:00
|
|
|
off++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-08-11 03:02:54 +08:00
|
|
|
|
2016-08-15 07:09:58 +08:00
|
|
|
return Option<size_t>();
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
|
2016-08-15 07:09:58 +08:00
|
|
|
public:
|
2016-08-11 06:05:24 +08:00
|
|
|
// Inserts element.
|
|
|
|
void add(D *data) { add(data->get_key(), data); }
|
|
|
|
|
2016-08-09 23:44:39 +08:00
|
|
|
// Inserts element with the given key.
|
2016-08-11 03:02:54 +08:00
|
|
|
void add(const K &key_in, D *data)
|
2016-08-09 23:44:39 +08:00
|
|
|
{
|
2016-08-11 03:02:54 +08:00
|
|
|
assert(key_in == data->get_key());
|
2016-08-09 23:44:39 +08:00
|
|
|
|
2016-08-11 03:02:54 +08:00
|
|
|
if (count < capacity) {
|
|
|
|
auto key = std::ref(key_in);
|
|
|
|
size_t mask = this->mask();
|
|
|
|
size_t now = index(key, mask);
|
|
|
|
size_t start = now;
|
|
|
|
size_t off = 0;
|
|
|
|
size_t border = 8 <= capacity ? 8 : capacity;
|
2016-08-09 23:44:39 +08:00
|
|
|
|
|
|
|
Combined other = array[now];
|
2016-08-11 03:02:54 +08:00
|
|
|
while (off < border) {
|
|
|
|
if (other.valid()) {
|
2016-08-11 21:08:11 +08:00
|
|
|
const size_t other_off = other.off();
|
2016-08-11 06:05:24 +08:00
|
|
|
bool multi = false;
|
2016-08-11 21:08:11 +08:00
|
|
|
if (other_off == off && other.ptr()->get_key() == key) {
|
|
|
|
// Found the same
|
2016-09-19 06:22:36 +08:00
|
|
|
// Must skip same keyd values to insert new value at the
|
|
|
|
// end.
|
2016-08-11 21:08:11 +08:00
|
|
|
do {
|
2016-08-11 03:02:54 +08:00
|
|
|
now = (now + 1) & mask;
|
|
|
|
other = array[now];
|
|
|
|
if (!other.valid()) {
|
2016-09-19 06:22:36 +08:00
|
|
|
// Found empty slot in which data ca be added.
|
2016-08-11 03:02:54 +08:00
|
|
|
set(now, data, off);
|
|
|
|
return;
|
|
|
|
}
|
2016-08-11 21:08:11 +08:00
|
|
|
} while (other.equal(key, off));
|
2016-09-19 06:22:36 +08:00
|
|
|
// There is no empty slot after same keyed values.
|
2016-08-11 03:02:54 +08:00
|
|
|
multi = true;
|
|
|
|
} else if (other_off > off ||
|
|
|
|
other_poor(other, mask, start,
|
2016-08-11 21:08:11 +08:00
|
|
|
now)) { // Else other has equal or
|
|
|
|
// greater off, so he is poor.
|
|
|
|
skip(now, other, other_off, mask); // TRUE IS IMPOSSIBLE
|
2016-08-11 03:02:54 +08:00
|
|
|
off++;
|
|
|
|
continue;
|
|
|
|
}
|
2016-08-09 23:44:39 +08:00
|
|
|
|
2016-09-19 06:22:36 +08:00
|
|
|
// Data will be insrted at current slot and all other data
|
|
|
|
// will be displaced for one slot.
|
2016-08-09 23:44:39 +08:00
|
|
|
array[now] = Combined(data, off);
|
2016-08-11 06:05:24 +08:00
|
|
|
auto start_insert = now;
|
|
|
|
while (is_off_adjusted(other, mask, start_insert, now,
|
|
|
|
multi) ||
|
|
|
|
other.increment_off()) {
|
2016-08-11 03:02:54 +08:00
|
|
|
now = (now + 1) & mask;
|
|
|
|
auto tmp = array[now];
|
|
|
|
array[now] = other;
|
|
|
|
other = tmp;
|
|
|
|
if (!other.valid()) {
|
2016-09-19 06:22:36 +08:00
|
|
|
// Found empty slot which means i can finish now.
|
2016-08-11 03:02:54 +08:00
|
|
|
count++;
|
|
|
|
return;
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
}
|
2016-08-11 03:02:54 +08:00
|
|
|
data = other.ptr();
|
|
|
|
break; // Cant insert removed element
|
2016-08-09 23:44:39 +08:00
|
|
|
} else {
|
2016-09-19 06:22:36 +08:00
|
|
|
// Found empty slot for data.
|
2016-08-11 03:02:54 +08:00
|
|
|
set(now, data, off);
|
|
|
|
return;
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-19 06:22:36 +08:00
|
|
|
// There is't enough space for data.
|
2016-08-09 23:44:39 +08:00
|
|
|
increase_size();
|
|
|
|
add(data);
|
|
|
|
}
|
|
|
|
|
2016-08-11 06:05:24 +08:00
|
|
|
// Removes element equal by key and value. Returns true if it existed.
|
|
|
|
bool remove(D *data)
|
|
|
|
{
|
|
|
|
if (count > 0) {
|
|
|
|
auto key = std::ref(data->get_key());
|
|
|
|
size_t mask = this->mask();
|
|
|
|
size_t now = index(key, mask);
|
|
|
|
size_t off = 0;
|
|
|
|
size_t border = 8 <= capacity ? 8 : capacity;
|
|
|
|
Combined other = array[now];
|
2016-09-19 06:22:36 +08:00
|
|
|
|
2016-08-11 06:05:24 +08:00
|
|
|
while (other.valid() && off < border) {
|
2016-08-11 21:08:11 +08:00
|
|
|
const size_t other_off = other.off();
|
2016-08-11 06:05:24 +08:00
|
|
|
if (other_off == off && key == other.ptr()->get_key()) {
|
2016-09-19 06:22:36 +08:00
|
|
|
// Found same key data.
|
2016-08-11 06:05:24 +08:00
|
|
|
auto founded = capacity;
|
2016-08-11 21:08:11 +08:00
|
|
|
size_t started = now;
|
|
|
|
bool multi = false;
|
2016-09-19 06:22:36 +08:00
|
|
|
// Must find slot with searched data.
|
2016-08-11 06:05:24 +08:00
|
|
|
do {
|
|
|
|
if (other.ptr() == data) {
|
2016-09-19 06:22:36 +08:00
|
|
|
// founded it.
|
2016-08-11 06:05:24 +08:00
|
|
|
founded = now;
|
|
|
|
}
|
|
|
|
now = (now + 1) & mask;
|
|
|
|
other = array[now];
|
2016-08-11 21:08:11 +08:00
|
|
|
if (!other.valid() || UNLIKELY(started == now)) {
|
|
|
|
// Reason is possibility of map full of same values.
|
2016-08-11 06:05:24 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-08-11 21:08:11 +08:00
|
|
|
} while (other.equal(key, off) && (multi = true));
|
2016-09-19 06:22:36 +08:00
|
|
|
|
2016-08-11 06:05:24 +08:00
|
|
|
if (founded == capacity) {
|
2016-09-19 06:22:36 +08:00
|
|
|
// Didn't found the data.
|
2016-08-11 06:05:24 +08:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-09-19 06:22:36 +08:00
|
|
|
// Data will be removed by moving other data by one slot
|
|
|
|
// before.
|
2016-08-11 06:05:24 +08:00
|
|
|
auto bef = before_index(now, mask);
|
|
|
|
array[founded] = array[bef];
|
|
|
|
|
|
|
|
auto start_rem = bef;
|
|
|
|
while (other.valid() &&
|
|
|
|
(is_off_adjusted_rem(other, mask, start_rem, bef,
|
|
|
|
now, multi) ||
|
|
|
|
other.decrement_off())) {
|
|
|
|
array[bef] = other;
|
|
|
|
bef = now;
|
|
|
|
now = (now + 1) & mask;
|
|
|
|
other = array[now];
|
|
|
|
}
|
|
|
|
|
|
|
|
array[bef] = Combined();
|
|
|
|
count--;
|
|
|
|
return true;
|
|
|
|
|
|
|
|
} else if (other_off < off) { // Other is rich
|
|
|
|
break;
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
} else { // Else other has equal or greater off, so he is poor.
|
2016-09-19 06:22:36 +08:00
|
|
|
// Must skip values of same keys but different key than
|
|
|
|
// data.
|
2016-08-11 21:08:11 +08:00
|
|
|
if (UNLIKELY(skip(now, other, other_off, mask))) {
|
|
|
|
break;
|
|
|
|
}
|
2016-08-11 06:05:24 +08:00
|
|
|
off++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
private:
|
|
|
|
// Skips same key valus as other. true if whole map is full of same key
|
|
|
|
// values.
|
2016-08-15 07:09:58 +08:00
|
|
|
bool skip(size_t &now, Combined &other, size_t other_off, size_t mask) const
|
2016-08-09 23:44:39 +08:00
|
|
|
{
|
2016-08-11 21:08:11 +08:00
|
|
|
auto other_key = other.ptr()->get_key();
|
|
|
|
size_t start = now;
|
|
|
|
do {
|
|
|
|
now = (now + 1) & mask;
|
|
|
|
other = array[now];
|
|
|
|
if (UNLIKELY(start == now)) { // Reason is possibility of map
|
|
|
|
// full of same values.
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
} while (other.valid() && other.equal(other_key, other_off));
|
|
|
|
return false;
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
void set(size_t now, D *data, size_t off)
|
2016-08-11 03:02:54 +08:00
|
|
|
{
|
2016-08-11 21:08:11 +08:00
|
|
|
array[now] = Combined(data, off);
|
|
|
|
count++;
|
2016-08-11 03:02:54 +08:00
|
|
|
}
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
// True if no adjusment is needed, false otherwise.
|
|
|
|
bool is_off_adjusted(Combined &com, size_t mask, size_t start, size_t now,
|
|
|
|
bool multi)
|
2016-08-09 23:44:39 +08:00
|
|
|
{
|
2016-08-11 21:08:11 +08:00
|
|
|
if (com.off() == 0) { // Must be adjusted
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
size_t cin = index(com.ptr()->get_key(), mask);
|
|
|
|
if (outside(start, now, cin)) { // Outside [start,now] interval
|
|
|
|
return multi;
|
|
|
|
}
|
|
|
|
auto a = array[cin];
|
|
|
|
auto b = array[(cin + 1) & mask];
|
|
|
|
return a == b;
|
|
|
|
// Check if different key has eneterd in to
|
|
|
|
// range of other.
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
bool other_poor(Combined other, size_t mask, size_t start, size_t now)
|
2016-08-09 23:44:39 +08:00
|
|
|
{
|
2016-08-11 21:08:11 +08:00
|
|
|
// If other index is smaller then he is poorer.
|
|
|
|
return outside_left_weak(start, now,
|
|
|
|
index(other.ptr()->get_key(), mask));
|
2016-08-09 23:44:39 +08:00
|
|
|
}
|
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
// True if no adjusment is needed, false otherwise.
|
|
|
|
bool is_off_adjusted_rem(Combined &com, size_t mask, size_t start,
|
|
|
|
size_t bef, size_t now, bool multi)
|
|
|
|
{
|
|
|
|
if (com.off() == 0) { // Must be adjusted
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
size_t cin = index(com.ptr()->get_key(), mask);
|
|
|
|
if (cin == bef) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
if (outside(start, now, cin)) {
|
|
|
|
return multi;
|
|
|
|
}
|
|
|
|
auto a = array[cin];
|
|
|
|
auto b = array[before_index(cin, mask)];
|
|
|
|
return b.valid() && a == b;
|
|
|
|
// Check if different key has eneterd in to
|
|
|
|
// range of other.
|
|
|
|
}
|
2016-08-09 23:44:39 +08:00
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
// True if p is uutside [start,end] interval
|
|
|
|
bool outside(size_t start, size_t end, size_t p)
|
|
|
|
{
|
|
|
|
return (start <= end && (p < start || p > end)) ||
|
|
|
|
(end < start && p < start && p > end);
|
|
|
|
}
|
2016-08-09 23:44:39 +08:00
|
|
|
|
2016-08-11 21:08:11 +08:00
|
|
|
// True if p is outside <start,end] interval
|
|
|
|
bool outside_left_weak(size_t start, size_t end, size_t p)
|
|
|
|
{
|
|
|
|
return (start <= end && (p <= start || p > end)) ||
|
|
|
|
(end < start && p <= start && p > end);
|
|
|
|
}
|
2016-08-09 23:44:39 +08:00
|
|
|
};
|