1*7c3d14c8STreehugger Robot //===-- sanitizer_addrhashmap.h ---------------------------------*- C++ -*-===//
2*7c3d14c8STreehugger Robot //
3*7c3d14c8STreehugger Robot // The LLVM Compiler Infrastructure
4*7c3d14c8STreehugger Robot //
5*7c3d14c8STreehugger Robot // This file is distributed under the University of Illinois Open Source
6*7c3d14c8STreehugger Robot // License. See LICENSE.TXT for details.
7*7c3d14c8STreehugger Robot //
8*7c3d14c8STreehugger Robot //===----------------------------------------------------------------------===//
9*7c3d14c8STreehugger Robot //
10*7c3d14c8STreehugger Robot // Concurrent uptr->T hashmap.
11*7c3d14c8STreehugger Robot //
12*7c3d14c8STreehugger Robot //===----------------------------------------------------------------------===//
13*7c3d14c8STreehugger Robot
14*7c3d14c8STreehugger Robot #ifndef SANITIZER_ADDRHASHMAP_H
15*7c3d14c8STreehugger Robot #define SANITIZER_ADDRHASHMAP_H
16*7c3d14c8STreehugger Robot
17*7c3d14c8STreehugger Robot #include "sanitizer_common.h"
18*7c3d14c8STreehugger Robot #include "sanitizer_mutex.h"
19*7c3d14c8STreehugger Robot #include "sanitizer_atomic.h"
20*7c3d14c8STreehugger Robot #include "sanitizer_allocator_internal.h"
21*7c3d14c8STreehugger Robot
22*7c3d14c8STreehugger Robot namespace __sanitizer {
23*7c3d14c8STreehugger Robot
24*7c3d14c8STreehugger Robot // Concurrent uptr->T hashmap.
25*7c3d14c8STreehugger Robot // T must be a POD type, kSize is preferably a prime but can be any number.
26*7c3d14c8STreehugger Robot // Usage example:
27*7c3d14c8STreehugger Robot //
28*7c3d14c8STreehugger Robot // typedef AddrHashMap<uptr, 11> Map;
29*7c3d14c8STreehugger Robot // Map m;
30*7c3d14c8STreehugger Robot // {
31*7c3d14c8STreehugger Robot // Map::Handle h(&m, addr);
32*7c3d14c8STreehugger Robot // use h.operator->() to access the data
33*7c3d14c8STreehugger Robot // if h.created() then the element was just created, and the current thread
34*7c3d14c8STreehugger Robot // has exclusive access to it
35*7c3d14c8STreehugger Robot // otherwise the current thread has only read access to the data
36*7c3d14c8STreehugger Robot // }
37*7c3d14c8STreehugger Robot // {
38*7c3d14c8STreehugger Robot // Map::Handle h(&m, addr, true);
39*7c3d14c8STreehugger Robot // this will remove the data from the map in Handle dtor
40*7c3d14c8STreehugger Robot // the current thread has exclusive access to the data
41*7c3d14c8STreehugger Robot // if !h.exists() then the element never existed
42*7c3d14c8STreehugger Robot // }
43*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
44*7c3d14c8STreehugger Robot class AddrHashMap {
45*7c3d14c8STreehugger Robot private:
46*7c3d14c8STreehugger Robot struct Cell {
47*7c3d14c8STreehugger Robot atomic_uintptr_t addr;
48*7c3d14c8STreehugger Robot T val;
49*7c3d14c8STreehugger Robot };
50*7c3d14c8STreehugger Robot
51*7c3d14c8STreehugger Robot struct AddBucket {
52*7c3d14c8STreehugger Robot uptr cap;
53*7c3d14c8STreehugger Robot uptr size;
54*7c3d14c8STreehugger Robot Cell cells[1]; // variable len
55*7c3d14c8STreehugger Robot };
56*7c3d14c8STreehugger Robot
57*7c3d14c8STreehugger Robot static const uptr kBucketSize = 3;
58*7c3d14c8STreehugger Robot
59*7c3d14c8STreehugger Robot struct Bucket {
60*7c3d14c8STreehugger Robot RWMutex mtx;
61*7c3d14c8STreehugger Robot atomic_uintptr_t add;
62*7c3d14c8STreehugger Robot Cell cells[kBucketSize];
63*7c3d14c8STreehugger Robot };
64*7c3d14c8STreehugger Robot
65*7c3d14c8STreehugger Robot public:
66*7c3d14c8STreehugger Robot AddrHashMap();
67*7c3d14c8STreehugger Robot
68*7c3d14c8STreehugger Robot class Handle {
69*7c3d14c8STreehugger Robot public:
70*7c3d14c8STreehugger Robot Handle(AddrHashMap<T, kSize> *map, uptr addr);
71*7c3d14c8STreehugger Robot Handle(AddrHashMap<T, kSize> *map, uptr addr, bool remove);
72*7c3d14c8STreehugger Robot Handle(AddrHashMap<T, kSize> *map, uptr addr, bool remove, bool create);
73*7c3d14c8STreehugger Robot
74*7c3d14c8STreehugger Robot ~Handle();
75*7c3d14c8STreehugger Robot T *operator->();
76*7c3d14c8STreehugger Robot bool created() const;
77*7c3d14c8STreehugger Robot bool exists() const;
78*7c3d14c8STreehugger Robot
79*7c3d14c8STreehugger Robot private:
80*7c3d14c8STreehugger Robot friend AddrHashMap<T, kSize>;
81*7c3d14c8STreehugger Robot AddrHashMap<T, kSize> *map_;
82*7c3d14c8STreehugger Robot Bucket *bucket_;
83*7c3d14c8STreehugger Robot Cell *cell_;
84*7c3d14c8STreehugger Robot uptr addr_;
85*7c3d14c8STreehugger Robot uptr addidx_;
86*7c3d14c8STreehugger Robot bool created_;
87*7c3d14c8STreehugger Robot bool remove_;
88*7c3d14c8STreehugger Robot bool create_;
89*7c3d14c8STreehugger Robot };
90*7c3d14c8STreehugger Robot
91*7c3d14c8STreehugger Robot private:
92*7c3d14c8STreehugger Robot friend class Handle;
93*7c3d14c8STreehugger Robot Bucket *table_;
94*7c3d14c8STreehugger Robot
95*7c3d14c8STreehugger Robot void acquire(Handle *h);
96*7c3d14c8STreehugger Robot void release(Handle *h);
97*7c3d14c8STreehugger Robot uptr calcHash(uptr addr);
98*7c3d14c8STreehugger Robot };
99*7c3d14c8STreehugger Robot
100*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
Handle(AddrHashMap<T,kSize> * map,uptr addr)101*7c3d14c8STreehugger Robot AddrHashMap<T, kSize>::Handle::Handle(AddrHashMap<T, kSize> *map, uptr addr) {
102*7c3d14c8STreehugger Robot map_ = map;
103*7c3d14c8STreehugger Robot addr_ = addr;
104*7c3d14c8STreehugger Robot remove_ = false;
105*7c3d14c8STreehugger Robot create_ = true;
106*7c3d14c8STreehugger Robot map_->acquire(this);
107*7c3d14c8STreehugger Robot }
108*7c3d14c8STreehugger Robot
109*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
Handle(AddrHashMap<T,kSize> * map,uptr addr,bool remove)110*7c3d14c8STreehugger Robot AddrHashMap<T, kSize>::Handle::Handle(AddrHashMap<T, kSize> *map, uptr addr,
111*7c3d14c8STreehugger Robot bool remove) {
112*7c3d14c8STreehugger Robot map_ = map;
113*7c3d14c8STreehugger Robot addr_ = addr;
114*7c3d14c8STreehugger Robot remove_ = remove;
115*7c3d14c8STreehugger Robot create_ = true;
116*7c3d14c8STreehugger Robot map_->acquire(this);
117*7c3d14c8STreehugger Robot }
118*7c3d14c8STreehugger Robot
119*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
Handle(AddrHashMap<T,kSize> * map,uptr addr,bool remove,bool create)120*7c3d14c8STreehugger Robot AddrHashMap<T, kSize>::Handle::Handle(AddrHashMap<T, kSize> *map, uptr addr,
121*7c3d14c8STreehugger Robot bool remove, bool create) {
122*7c3d14c8STreehugger Robot map_ = map;
123*7c3d14c8STreehugger Robot addr_ = addr;
124*7c3d14c8STreehugger Robot remove_ = remove;
125*7c3d14c8STreehugger Robot create_ = create;
126*7c3d14c8STreehugger Robot map_->acquire(this);
127*7c3d14c8STreehugger Robot }
128*7c3d14c8STreehugger Robot
129*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
~Handle()130*7c3d14c8STreehugger Robot AddrHashMap<T, kSize>::Handle::~Handle() {
131*7c3d14c8STreehugger Robot map_->release(this);
132*7c3d14c8STreehugger Robot }
133*7c3d14c8STreehugger Robot
134*7c3d14c8STreehugger Robot template <typename T, uptr kSize>
135*7c3d14c8STreehugger Robot T *AddrHashMap<T, kSize>::Handle::operator->() {
136*7c3d14c8STreehugger Robot return &cell_->val;
137*7c3d14c8STreehugger Robot }
138*7c3d14c8STreehugger Robot
139*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
created()140*7c3d14c8STreehugger Robot bool AddrHashMap<T, kSize>::Handle::created() const {
141*7c3d14c8STreehugger Robot return created_;
142*7c3d14c8STreehugger Robot }
143*7c3d14c8STreehugger Robot
144*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
exists()145*7c3d14c8STreehugger Robot bool AddrHashMap<T, kSize>::Handle::exists() const {
146*7c3d14c8STreehugger Robot return cell_ != nullptr;
147*7c3d14c8STreehugger Robot }
148*7c3d14c8STreehugger Robot
149*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
AddrHashMap()150*7c3d14c8STreehugger Robot AddrHashMap<T, kSize>::AddrHashMap() {
151*7c3d14c8STreehugger Robot table_ = (Bucket*)MmapOrDie(kSize * sizeof(table_[0]), "AddrHashMap");
152*7c3d14c8STreehugger Robot }
153*7c3d14c8STreehugger Robot
154*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
acquire(Handle * h)155*7c3d14c8STreehugger Robot void AddrHashMap<T, kSize>::acquire(Handle *h) {
156*7c3d14c8STreehugger Robot uptr addr = h->addr_;
157*7c3d14c8STreehugger Robot uptr hash = calcHash(addr);
158*7c3d14c8STreehugger Robot Bucket *b = &table_[hash];
159*7c3d14c8STreehugger Robot
160*7c3d14c8STreehugger Robot h->created_ = false;
161*7c3d14c8STreehugger Robot h->addidx_ = -1U;
162*7c3d14c8STreehugger Robot h->bucket_ = b;
163*7c3d14c8STreehugger Robot h->cell_ = nullptr;
164*7c3d14c8STreehugger Robot
165*7c3d14c8STreehugger Robot // If we want to remove the element, we need exclusive access to the bucket,
166*7c3d14c8STreehugger Robot // so skip the lock-free phase.
167*7c3d14c8STreehugger Robot if (h->remove_)
168*7c3d14c8STreehugger Robot goto locked;
169*7c3d14c8STreehugger Robot
170*7c3d14c8STreehugger Robot retry:
171*7c3d14c8STreehugger Robot // First try to find an existing element w/o read mutex.
172*7c3d14c8STreehugger Robot CHECK(!h->remove_);
173*7c3d14c8STreehugger Robot // Check the embed cells.
174*7c3d14c8STreehugger Robot for (uptr i = 0; i < kBucketSize; i++) {
175*7c3d14c8STreehugger Robot Cell *c = &b->cells[i];
176*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c->addr, memory_order_acquire);
177*7c3d14c8STreehugger Robot if (addr1 == addr) {
178*7c3d14c8STreehugger Robot h->cell_ = c;
179*7c3d14c8STreehugger Robot return;
180*7c3d14c8STreehugger Robot }
181*7c3d14c8STreehugger Robot }
182*7c3d14c8STreehugger Robot
183*7c3d14c8STreehugger Robot // Check the add cells with read lock.
184*7c3d14c8STreehugger Robot if (atomic_load(&b->add, memory_order_relaxed)) {
185*7c3d14c8STreehugger Robot b->mtx.ReadLock();
186*7c3d14c8STreehugger Robot AddBucket *add = (AddBucket*)atomic_load(&b->add, memory_order_relaxed);
187*7c3d14c8STreehugger Robot for (uptr i = 0; i < add->size; i++) {
188*7c3d14c8STreehugger Robot Cell *c = &add->cells[i];
189*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c->addr, memory_order_relaxed);
190*7c3d14c8STreehugger Robot if (addr1 == addr) {
191*7c3d14c8STreehugger Robot h->addidx_ = i;
192*7c3d14c8STreehugger Robot h->cell_ = c;
193*7c3d14c8STreehugger Robot return;
194*7c3d14c8STreehugger Robot }
195*7c3d14c8STreehugger Robot }
196*7c3d14c8STreehugger Robot b->mtx.ReadUnlock();
197*7c3d14c8STreehugger Robot }
198*7c3d14c8STreehugger Robot
199*7c3d14c8STreehugger Robot locked:
200*7c3d14c8STreehugger Robot // Re-check existence under write lock.
201*7c3d14c8STreehugger Robot // Embed cells.
202*7c3d14c8STreehugger Robot b->mtx.Lock();
203*7c3d14c8STreehugger Robot for (uptr i = 0; i < kBucketSize; i++) {
204*7c3d14c8STreehugger Robot Cell *c = &b->cells[i];
205*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c->addr, memory_order_relaxed);
206*7c3d14c8STreehugger Robot if (addr1 == addr) {
207*7c3d14c8STreehugger Robot if (h->remove_) {
208*7c3d14c8STreehugger Robot h->cell_ = c;
209*7c3d14c8STreehugger Robot return;
210*7c3d14c8STreehugger Robot }
211*7c3d14c8STreehugger Robot b->mtx.Unlock();
212*7c3d14c8STreehugger Robot goto retry;
213*7c3d14c8STreehugger Robot }
214*7c3d14c8STreehugger Robot }
215*7c3d14c8STreehugger Robot
216*7c3d14c8STreehugger Robot // Add cells.
217*7c3d14c8STreehugger Robot AddBucket *add = (AddBucket*)atomic_load(&b->add, memory_order_relaxed);
218*7c3d14c8STreehugger Robot if (add) {
219*7c3d14c8STreehugger Robot for (uptr i = 0; i < add->size; i++) {
220*7c3d14c8STreehugger Robot Cell *c = &add->cells[i];
221*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c->addr, memory_order_relaxed);
222*7c3d14c8STreehugger Robot if (addr1 == addr) {
223*7c3d14c8STreehugger Robot if (h->remove_) {
224*7c3d14c8STreehugger Robot h->addidx_ = i;
225*7c3d14c8STreehugger Robot h->cell_ = c;
226*7c3d14c8STreehugger Robot return;
227*7c3d14c8STreehugger Robot }
228*7c3d14c8STreehugger Robot b->mtx.Unlock();
229*7c3d14c8STreehugger Robot goto retry;
230*7c3d14c8STreehugger Robot }
231*7c3d14c8STreehugger Robot }
232*7c3d14c8STreehugger Robot }
233*7c3d14c8STreehugger Robot
234*7c3d14c8STreehugger Robot // The element does not exist, no need to create it if we want to remove.
235*7c3d14c8STreehugger Robot if (h->remove_ || !h->create_) {
236*7c3d14c8STreehugger Robot b->mtx.Unlock();
237*7c3d14c8STreehugger Robot return;
238*7c3d14c8STreehugger Robot }
239*7c3d14c8STreehugger Robot
240*7c3d14c8STreehugger Robot // Now try to create it under the mutex.
241*7c3d14c8STreehugger Robot h->created_ = true;
242*7c3d14c8STreehugger Robot // See if we have a free embed cell.
243*7c3d14c8STreehugger Robot for (uptr i = 0; i < kBucketSize; i++) {
244*7c3d14c8STreehugger Robot Cell *c = &b->cells[i];
245*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c->addr, memory_order_relaxed);
246*7c3d14c8STreehugger Robot if (addr1 == 0) {
247*7c3d14c8STreehugger Robot h->cell_ = c;
248*7c3d14c8STreehugger Robot return;
249*7c3d14c8STreehugger Robot }
250*7c3d14c8STreehugger Robot }
251*7c3d14c8STreehugger Robot
252*7c3d14c8STreehugger Robot // Store in the add cells.
253*7c3d14c8STreehugger Robot if (!add) {
254*7c3d14c8STreehugger Robot // Allocate a new add array.
255*7c3d14c8STreehugger Robot const uptr kInitSize = 64;
256*7c3d14c8STreehugger Robot add = (AddBucket*)InternalAlloc(kInitSize);
257*7c3d14c8STreehugger Robot internal_memset(add, 0, kInitSize);
258*7c3d14c8STreehugger Robot add->cap = (kInitSize - sizeof(*add)) / sizeof(add->cells[0]) + 1;
259*7c3d14c8STreehugger Robot add->size = 0;
260*7c3d14c8STreehugger Robot atomic_store(&b->add, (uptr)add, memory_order_relaxed);
261*7c3d14c8STreehugger Robot }
262*7c3d14c8STreehugger Robot if (add->size == add->cap) {
263*7c3d14c8STreehugger Robot // Grow existing add array.
264*7c3d14c8STreehugger Robot uptr oldsize = sizeof(*add) + (add->cap - 1) * sizeof(add->cells[0]);
265*7c3d14c8STreehugger Robot uptr newsize = oldsize * 2;
266*7c3d14c8STreehugger Robot AddBucket *add1 = (AddBucket*)InternalAlloc(newsize);
267*7c3d14c8STreehugger Robot internal_memset(add1, 0, newsize);
268*7c3d14c8STreehugger Robot add1->cap = (newsize - sizeof(*add)) / sizeof(add->cells[0]) + 1;
269*7c3d14c8STreehugger Robot add1->size = add->size;
270*7c3d14c8STreehugger Robot internal_memcpy(add1->cells, add->cells, add->size * sizeof(add->cells[0]));
271*7c3d14c8STreehugger Robot InternalFree(add);
272*7c3d14c8STreehugger Robot atomic_store(&b->add, (uptr)add1, memory_order_relaxed);
273*7c3d14c8STreehugger Robot add = add1;
274*7c3d14c8STreehugger Robot }
275*7c3d14c8STreehugger Robot // Store.
276*7c3d14c8STreehugger Robot uptr i = add->size++;
277*7c3d14c8STreehugger Robot Cell *c = &add->cells[i];
278*7c3d14c8STreehugger Robot CHECK_EQ(atomic_load(&c->addr, memory_order_relaxed), 0);
279*7c3d14c8STreehugger Robot h->addidx_ = i;
280*7c3d14c8STreehugger Robot h->cell_ = c;
281*7c3d14c8STreehugger Robot }
282*7c3d14c8STreehugger Robot
283*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
release(Handle * h)284*7c3d14c8STreehugger Robot void AddrHashMap<T, kSize>::release(Handle *h) {
285*7c3d14c8STreehugger Robot if (!h->cell_)
286*7c3d14c8STreehugger Robot return;
287*7c3d14c8STreehugger Robot Bucket *b = h->bucket_;
288*7c3d14c8STreehugger Robot Cell *c = h->cell_;
289*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c->addr, memory_order_relaxed);
290*7c3d14c8STreehugger Robot if (h->created_) {
291*7c3d14c8STreehugger Robot // Denote completion of insertion.
292*7c3d14c8STreehugger Robot CHECK_EQ(addr1, 0);
293*7c3d14c8STreehugger Robot // After the following store, the element becomes available
294*7c3d14c8STreehugger Robot // for lock-free reads.
295*7c3d14c8STreehugger Robot atomic_store(&c->addr, h->addr_, memory_order_release);
296*7c3d14c8STreehugger Robot b->mtx.Unlock();
297*7c3d14c8STreehugger Robot } else if (h->remove_) {
298*7c3d14c8STreehugger Robot // Denote that the cell is empty now.
299*7c3d14c8STreehugger Robot CHECK_EQ(addr1, h->addr_);
300*7c3d14c8STreehugger Robot atomic_store(&c->addr, 0, memory_order_release);
301*7c3d14c8STreehugger Robot // See if we need to compact the bucket.
302*7c3d14c8STreehugger Robot AddBucket *add = (AddBucket*)atomic_load(&b->add, memory_order_relaxed);
303*7c3d14c8STreehugger Robot if (h->addidx_ == -1U) {
304*7c3d14c8STreehugger Robot // Removed from embed array, move an add element into the freed cell.
305*7c3d14c8STreehugger Robot if (add && add->size != 0) {
306*7c3d14c8STreehugger Robot uptr last = --add->size;
307*7c3d14c8STreehugger Robot Cell *c1 = &add->cells[last];
308*7c3d14c8STreehugger Robot c->val = c1->val;
309*7c3d14c8STreehugger Robot uptr addr1 = atomic_load(&c1->addr, memory_order_relaxed);
310*7c3d14c8STreehugger Robot atomic_store(&c->addr, addr1, memory_order_release);
311*7c3d14c8STreehugger Robot atomic_store(&c1->addr, 0, memory_order_release);
312*7c3d14c8STreehugger Robot }
313*7c3d14c8STreehugger Robot } else {
314*7c3d14c8STreehugger Robot // Removed from add array, compact it.
315*7c3d14c8STreehugger Robot uptr last = --add->size;
316*7c3d14c8STreehugger Robot Cell *c1 = &add->cells[last];
317*7c3d14c8STreehugger Robot if (c != c1) {
318*7c3d14c8STreehugger Robot *c = *c1;
319*7c3d14c8STreehugger Robot atomic_store(&c1->addr, 0, memory_order_relaxed);
320*7c3d14c8STreehugger Robot }
321*7c3d14c8STreehugger Robot }
322*7c3d14c8STreehugger Robot if (add && add->size == 0) {
323*7c3d14c8STreehugger Robot // FIXME(dvyukov): free add?
324*7c3d14c8STreehugger Robot }
325*7c3d14c8STreehugger Robot b->mtx.Unlock();
326*7c3d14c8STreehugger Robot } else {
327*7c3d14c8STreehugger Robot CHECK_EQ(addr1, h->addr_);
328*7c3d14c8STreehugger Robot if (h->addidx_ != -1U)
329*7c3d14c8STreehugger Robot b->mtx.ReadUnlock();
330*7c3d14c8STreehugger Robot }
331*7c3d14c8STreehugger Robot }
332*7c3d14c8STreehugger Robot
333*7c3d14c8STreehugger Robot template<typename T, uptr kSize>
calcHash(uptr addr)334*7c3d14c8STreehugger Robot uptr AddrHashMap<T, kSize>::calcHash(uptr addr) {
335*7c3d14c8STreehugger Robot addr += addr << 10;
336*7c3d14c8STreehugger Robot addr ^= addr >> 6;
337*7c3d14c8STreehugger Robot return addr % kSize;
338*7c3d14c8STreehugger Robot }
339*7c3d14c8STreehugger Robot
340*7c3d14c8STreehugger Robot } // namespace __sanitizer
341*7c3d14c8STreehugger Robot
342*7c3d14c8STreehugger Robot #endif // SANITIZER_ADDRHASHMAP_H
343