hashmap.h 16.1 KB
Newer Older
1
// Copyright 2012 the V8 project authors. All rights reserved.
2 3
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4

lpy's avatar
lpy committed
5 6 7 8 9 10
// We implement our own hash map instead of using std::unordered_map because
// STL containers use a mutex pool in debug builds, which leads to deadlock
// when we are using an async signal handler.

#ifndef V8_BASE_HASHMAP_H_
#define V8_BASE_HASHMAP_H_
11

12 13
#include <stdlib.h>

14
#include "src/base/bits.h"
15
#include "src/base/hashmap-entry.h"
16
#include "src/base/logging.h"
17

18
namespace v8 {
lpy's avatar
lpy committed
19 20 21 22 23 24 25
namespace base {

// Allocation policy that forwards directly to the C heap (malloc/free).
class DefaultAllocationPolicy {
 public:
  // Requests |size| bytes from malloc() and returns the result unchanged, so
  // a null return is passed on to the caller.
  V8_INLINE void* New(size_t size) {
    void* const block = malloc(size);
    return block;
  }

  // Gives |p| back to free().
  V8_INLINE static void Delete(void* p) {
    free(p);
  }
};
26

27
template <typename Key, typename Value, class MatchFun, class AllocationPolicy>
28
class TemplateHashMapImpl {
29
 public:
30
  typedef TemplateHashMapEntry<Key, Value> Entry;
31

32 33 34 35 36
  // The default capacity.  This is used by the call sites which want
  // to pass in a non-default AllocationPolicy but want to use the
  // default value of capacity specified by the implementation.
  static const uint32_t kDefaultHashMapCapacity = 8;

37 38
  // initial_capacity is the size of the initial hash map;
  // it must be a power of 2 (and thus must not be 0).
39 40
  TemplateHashMapImpl(uint32_t capacity = kDefaultHashMapCapacity,
                      MatchFun match = MatchFun(),
41
                      AllocationPolicy allocator = AllocationPolicy());
42

43
  ~TemplateHashMapImpl();
44

45
  // If an entry with matching key is found, returns that entry.
46 47
  // Otherwise, nullptr is returned.
  Entry* Lookup(const Key& key, uint32_t hash) const;
48 49 50

  // If an entry with matching key is found, returns that entry.
  // If no matching entry is found, a new entry is inserted with
51
  // corresponding key, key hash, and default initialized value.
52 53
  Entry* LookupOrInsert(const Key& key, uint32_t hash,
                        AllocationPolicy allocator = AllocationPolicy());
54

55 56 57 58 59 60 61
  // If an entry with matching key is found, returns that entry.
  // If no matching entry is found, a new entry is inserted with
  // corresponding key, key hash, and value created by func.
  template <typename Func>
  Entry* LookupOrInsert(const Key& key, uint32_t hash, const Func& value_func,
                        AllocationPolicy allocator = AllocationPolicy());

62 63
  Entry* InsertNew(const Key& key, uint32_t hash,
                   AllocationPolicy allocator = AllocationPolicy());
64

65
  // Removes the entry with matching key.
66 67
  // It returns the value of the deleted entry
  // or null if there is no value for such key.
68
  Value Remove(const Key& key, uint32_t hash);
69

70 71 72
  // Empties the hash map (occupancy() == 0).
  void Clear();

73 74 75 76 77 78 79 80
  // Empties the map and makes it unusable for allocation.
  void Invalidate() {
    AllocationPolicy::Delete(map_);
    map_ = nullptr;
    occupancy_ = 0;
    capacity_ = 0;
  }

81
  // The number of (non-empty) entries in the table.
82
  uint32_t occupancy() const { return occupancy_; }
83 84 85 86

  // The capacity of the table. The implementation
  // makes sure that occupancy is at most 80% of
  // the table capacity.
87
  uint32_t capacity() const { return capacity_; }
88 89 90

  // Iteration
  //
91
  // for (Entry* p = map.Start(); p != nullptr; p = map.Next(p)) {
92 93 94 95 96 97
  //   ...
  // }
  //
  // If entries are inserted during iteration, the effect of
  // calling Next() is undefined.
  Entry* Start() const;
98
  Entry* Next(Entry* entry) const;
99

100 101 102 103 104 105 106 107
  void Reset(AllocationPolicy allocator) {
    Initialize(capacity_, allocator);
    occupancy_ = 0;
  }

 protected:
  void Initialize(uint32_t capacity, AllocationPolicy allocator);

108 109 110 111
 private:
  Entry* map_;
  uint32_t capacity_;
  uint32_t occupancy_;
112 113
  // TODO(leszeks): This takes up space even if it has no state, maybe replace
  // with something that does the empty base optimisation e.g. std::tuple
114
  MatchFun match_;
115

116
  Entry* map_end() const { return map_ + capacity_; }
117
  Entry* Probe(const Key& key, uint32_t hash) const;
118
  Entry* FillEmptyEntry(Entry* entry, const Key& key, const Value& value,
119 120 121
                        uint32_t hash,
                        AllocationPolicy allocator = AllocationPolicy());
  void Resize(AllocationPolicy allocator);
122
};
123 124 125
// Builds an empty map that compares keys with |match| and whose backing array
// of |initial_capacity| entries comes from |allocator|. |initial_capacity|
// must be a power of two (checked by Initialize()).
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::
    TemplateHashMapImpl(uint32_t initial_capacity, MatchFun match,
                        AllocationPolicy allocator)
    : match_(match) {
  Initialize(initial_capacity, allocator);
}

132 133 134 135
// Hands the backing array back to the allocation policy.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
TemplateHashMapImpl<Key, Value, MatchFun,
                    AllocationPolicy>::~TemplateHashMapImpl() {
  AllocationPolicy::Delete(map_);
}

139 140 141 142 143
// Returns the entry whose key matches |key|, or nullptr when probing ends on
// an empty slot (the key is not in the map).
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Lookup(
    const Key& key, uint32_t hash) const {
  Entry* entry = Probe(key, hash);
  return entry->exists() ? entry : nullptr;
}

148 149 150 151
// Returns the entry matching |key|, inserting one with a value-initialized
// Value() if none exists. Delegates to the functor overload.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::LookupOrInsert(
    const Key& key, uint32_t hash, AllocationPolicy allocator) {
  return LookupOrInsert(key, hash, []() { return Value(); }, allocator);
}

// Returns the entry matching |key|. When there is none, inserts a new entry
// whose value is produced by |value_func|; the functor is invoked only on the
// insertion path.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
template <typename Func>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::LookupOrInsert(
    const Key& key, uint32_t hash, const Func& value_func,
    AllocationPolicy allocator) {
  // Find a matching entry.
  Entry* entry = Probe(key, hash);
  if (entry->exists()) {
    return entry;
  }

  // Probe() stopped on the empty slot where the key belongs; fill it.
  return FillEmptyEntry(entry, key, value_func(), hash, allocator);
}

172 173 174 175
// Inserts an entry for |key| with a value-initialized Value() into the slot
// found by probing. No check for an existing match is made here;
// FillEmptyEntry() DCHECKs that the probed slot is empty.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::InsertNew(
    const Key& key, uint32_t hash, AllocationPolicy allocator) {
  Entry* entry = Probe(key, hash);
  return FillEmptyEntry(entry, key, Value(), hash, allocator);
}

181 182 183 184
// Removes the entry matching |key| and returns a copy of its value, or
// nullptr when the key is absent. Because the not-found path returns nullptr,
// this member can only be instantiated for a Value that is constructible from
// nullptr.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
Value TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Remove(
    const Key& key, uint32_t hash) {
  // Lookup the entry for the key to remove.
  Entry* p = Probe(key, hash);
  if (!p->exists()) {
    // Key not found, nothing to remove.
    return nullptr;
  }

  Value value = p->value;
  // To remove an entry we need to ensure that it does not create an empty
  // entry that will cause the search for another entry to stop too soon. If all
  // the entries between the entry to remove and the next empty slot have their
  // initial position inside this interval, clearing the entry to remove will
  // not break the search. If, while searching for the next empty entry, an
  // entry is encountered which does not have its initial position between the
  // entry to remove and the position looked at, then this entry can be moved to
  // the place of the entry to remove without breaking the search for it. The
  // entry made vacant by this move is now the entry to remove and the process
  // starts over.
  // Algorithm from http://en.wikipedia.org/wiki/Open_addressing.

  // This guarantees loop termination as there is at least one empty entry so
  // eventually the removed entry will have an empty entry after it.
  DCHECK(occupancy_ < capacity_);

  // p is the candidate entry to clear. q is used to scan forwards.
  Entry* q = p;  // Start at the entry to remove.
  while (true) {
    // Move q to the next entry, wrapping around at the end of the table.
    q = q + 1;
    if (q == map_end()) {
      q = map_;
    }

    // All entries between p and q have their initial position between p and q
    // and the entry p can be cleared without breaking the search for these
    // entries.
    if (!q->exists()) {
      break;
    }

    // Find the initial position for the entry at position q.
    Entry* r = map_ + (q->hash & (capacity_ - 1));

    // If the entry at position q has its initial position outside the range
    // between p and q it can be moved forward to position p and will still be
    // found. There is now a new candidate entry for clearing.
    if ((q > p && (r <= p || r > q)) || (q < p && (r <= p && r > q))) {
      *p = *q;
      p = q;
    }
  }

  // Clear the entry which is allowed to be emptied.
  p->clear();
  occupancy_--;
  return value;
}

243 244 245
// Empties the map in place: every slot of the backing array is cleared and
// the occupancy is reset to zero. The capacity is unchanged.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
void TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Clear() {
  // Mark all entries as empty.
  for (size_t i = 0; i < capacity_; ++i) {
    map_[i].clear();
  }
  occupancy_ = 0;
}

253 254 255 256
// Returns the first occupied entry in table order, or nullptr if the map holds
// no entries. The table is scanned directly from map_ rather than by calling
// Next(map_ - 1), so no pointer before the start of the backing array is ever
// formed.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Start() const {
  Entry* const end = map_end();
  for (Entry* entry = map_; entry < end; entry++) {
    if (entry->exists()) {
      return entry;
    }
  }
  return nullptr;
}

260 261 262 263 264
// Returns the first occupied entry located after |entry| in table order, or
// nullptr once the end of the table is reached. |entry| must point into the
// table; the position just before the first slot is also accepted by the
// DCHECK below.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Next(
    Entry* entry) const {
  const Entry* end = map_end();
  DCHECK(map_ - 1 <= entry && entry < end);
  for (entry++; entry < end; entry++) {
    if (entry->exists()) {
      return entry;
    }
  }
  return nullptr;
}

275 276 277 278 279
// Linear probe starting at the slot selected by |hash|. Returns either the
// occupied slot whose stored (hash, key) is accepted by match_, or the first
// empty slot encountered. Never returns nullptr.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Probe(
    const Key& key, uint32_t hash) const {
  DCHECK(base::bits::IsPowerOfTwo32(capacity_));
  // capacity_ is a power of two, so masking is equivalent to hash % capacity_.
  size_t i = hash & (capacity_ - 1);
  DCHECK(i < capacity_);

  DCHECK(occupancy_ < capacity_);  // Guarantees loop termination.
  while (map_[i].exists() && !match_(hash, map_[i].hash, key, map_[i].key)) {
    i = (i + 1) & (capacity_ - 1);
  }

  return &map_[i];
}

292 293 294 295
// Constructs a new entry (key, value, hash) in the empty slot |entry| and
// bumps the occupancy. If that pushes the table to the growth threshold, the
// table is resized and the entry is looked up again, since resizing moves it.
// Returns the entry's final location.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
typename TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Entry*
TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::FillEmptyEntry(
    Entry* entry, const Key& key, const Value& value, uint32_t hash,
    AllocationPolicy allocator) {
  DCHECK(!entry->exists());

  new (entry) Entry(key, value, hash);
  occupancy_++;

  // Grow the map if we reached >= 80% occupancy.
  if (occupancy_ + occupancy_ / 4 >= capacity_) {
    Resize(allocator);
    entry = Probe(key, hash);
  }

  return entry;
}

312 313 314
// Obtains a backing array of |capacity| entries from |allocator|, stores it in
// map_ and marks every slot empty. |capacity| must be a power of two. Any
// array previously held in map_ is overwritten without being released here.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
void TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Initialize(
    uint32_t capacity, AllocationPolicy allocator) {
  DCHECK(base::bits::IsPowerOfTwo32(capacity));
  map_ = reinterpret_cast<Entry*>(allocator.New(capacity * sizeof(Entry)));
  if (map_ == nullptr) {
    FATAL("Out of memory: HashMap::Initialize");
    return;
  }
  capacity_ = capacity;
  Clear();
}

326 327 328
// Doubles the table capacity: allocates a new backing array, re-inserts every
// existing entry into it, then releases the old array.
template <typename Key, typename Value, typename MatchFun,
          class AllocationPolicy>
void TemplateHashMapImpl<Key, Value, MatchFun, AllocationPolicy>::Resize(
    AllocationPolicy allocator) {
  Entry* old_map = map_;
  // Initialize() resets occupancy_ (via Clear()), so remember how many
  // entries have to be moved.
  uint32_t n = occupancy_;

  // Allocate larger map.
  Initialize(capacity_ * 2, allocator);

  // Rehash all current entries; stop as soon as all n have been moved.
  for (Entry* entry = old_map; n > 0; entry++) {
    if (entry->exists()) {
      FillEmptyEntry(Probe(entry->key, entry->hash), entry->key, entry->value,
                     entry->hash, allocator);
      n--;
    }
  }

  // Delete old map.
  AllocationPolicy::Delete(old_map);
}
349

350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365
// Matcher that first checks the two hashes for equality and only consults the
// wrapped (potentially expensive) key comparison when the hashes agree.
template <typename Key, typename MatchFun>
struct HashEqualityThenKeyMatcher {
  explicit HashEqualityThenKeyMatcher(MatchFun match) : match_(match) {}

  // Returns true iff the hashes are equal and the wrapped comparison accepts
  // the two keys. The comparison is not invoked when the hashes differ.
  bool operator()(uint32_t lhs_hash, uint32_t rhs_hash, const Key& lhs_key,
                  const Key& rhs_key) const {
    const bool hashes_agree = (lhs_hash == rhs_hash);
    return hashes_agree && match_(lhs_key, rhs_key);
  }

 private:
  MatchFun match_;
};

// Hashmap<void*, void*> which takes a custom key comparison function pointer.
366
template <typename AllocationPolicy>
367
class CustomMatcherTemplateHashMapImpl
368 369 370 371 372 373 374
    : public TemplateHashMapImpl<
          void*, void*,
          HashEqualityThenKeyMatcher<void*, bool (*)(void*, void*)>,
          AllocationPolicy> {
  typedef TemplateHashMapImpl<
      void*, void*, HashEqualityThenKeyMatcher<void*, bool (*)(void*, void*)>,
      AllocationPolicy>
375 376 377 378 379
      Base;

 public:
  typedef bool (*MatchFun)(void*, void*);

380 381 382
  CustomMatcherTemplateHashMapImpl(
      MatchFun match, uint32_t capacity = Base::kDefaultHashMapCapacity,
      AllocationPolicy allocator = AllocationPolicy())
383 384
      : Base(capacity, HashEqualityThenKeyMatcher<void*, MatchFun>(match),
             allocator) {}
385 386 387 388 389
};

// CustomMatcherTemplateHashMapImpl instantiated with DefaultAllocationPolicy.
typedef CustomMatcherTemplateHashMapImpl<DefaultAllocationPolicy>
    CustomMatcherHashMap;

390 391 392 393 394 395 396 397 398 399
// Matcher that ignores both hashes and decides solely on operator== between
// the two keys.
template <typename Key>
struct KeyEqualityMatcher {
  bool operator()(uint32_t /* hash1 */, uint32_t /* hash2 */, const Key& lhs,
                  const Key& rhs) const {
    const bool keys_equal = (lhs == rhs);
    return keys_equal;
  }
};

// Hashmap<void*, void*> which compares the key pointers directly.
400 401
template <typename AllocationPolicy>
class PointerTemplateHashMapImpl
402
    : public TemplateHashMapImpl<void*, void*, KeyEqualityMatcher<void*>,
403
                                 AllocationPolicy> {
404
  typedef TemplateHashMapImpl<void*, void*, KeyEqualityMatcher<void*>,
405 406
                              AllocationPolicy>
      Base;
407

408 409 410
 public:
  PointerTemplateHashMapImpl(uint32_t capacity = Base::kDefaultHashMapCapacity,
                             AllocationPolicy allocator = AllocationPolicy())
411
      : Base(capacity, KeyEqualityMatcher<void*>(), allocator) {}
412 413 414 415
};

// PointerTemplateHashMapImpl instantiated with DefaultAllocationPolicy.
typedef PointerTemplateHashMapImpl<DefaultAllocationPolicy> HashMap;

416
// A hash map for pointer keys and values with an STL-like interface.
417 418
template <class Key, class Value, class MatchFun, class AllocationPolicy>
class TemplateHashMap
419 420 421 422 423 424 425
    : private TemplateHashMapImpl<void*, void*,
                                  HashEqualityThenKeyMatcher<void*, MatchFun>,
                                  AllocationPolicy> {
  typedef TemplateHashMapImpl<void*, void*,
                              HashEqualityThenKeyMatcher<void*, MatchFun>,
                              AllocationPolicy>
      Base;
426

427
 public:
lpy's avatar
lpy committed
428
  STATIC_ASSERT(sizeof(Key*) == sizeof(void*));    // NOLINT
429 430 431 432 433 434 435 436 437 438 439 440 441 442
  STATIC_ASSERT(sizeof(Value*) == sizeof(void*));  // NOLINT
  struct value_type {
    Key* first;
    Value* second;
  };

  class Iterator {
   public:
    Iterator& operator++() {
      entry_ = map_->Next(entry_);
      return *this;
    }

    value_type* operator->() { return reinterpret_cast<value_type*>(entry_); }
lpy's avatar
lpy committed
443
    bool operator!=(const Iterator& other) { return entry_ != other.entry_; }
444 445

   private:
446
    Iterator(const Base* map, typename Base::Entry* entry)
lpy's avatar
lpy committed
447
        : map_(map), entry_(entry) {}
448

449 450
    const Base* map_;
    typename Base::Entry* entry_;
451 452 453 454

    friend class TemplateHashMap;
  };

455
  TemplateHashMap(MatchFun match,
456
                  AllocationPolicy allocator = AllocationPolicy())
457 458
      : Base(Base::kDefaultHashMapCapacity,
             HashEqualityThenKeyMatcher<void*, MatchFun>(match), allocator) {}
459 460

  Iterator begin() const { return Iterator(this, this->Start()); }
461
  Iterator end() const { return Iterator(this, nullptr); }
462 463
  Iterator find(Key* key, bool insert = false,
                AllocationPolicy allocator = AllocationPolicy()) {
464
    if (insert) {
465
      return Iterator(this, this->LookupOrInsert(key, key->Hash(), allocator));
466 467
    }
    return Iterator(this, this->Lookup(key, key->Hash()));
468 469 470
  }
};

lpy's avatar
lpy committed
471
}  // namespace base
472
}  // namespace v8
473

lpy's avatar
lpy committed
474
#endif  // V8_BASE_HASHMAP_H_