1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
|
// Copyright Epic Games, Inc. All Rights Reserved.
#pragma once
#include <zenbase/zenbase.h>
#include <zencore/intmath.h>
#include <zencore/thread.h>
#include <zencore/memory/fmalloc.h>
#include <atomic>
namespace zen {
// Hash table with fast lock free reads, that only supports insertion of items, and no modification of
// values. KeyType must be an integer. EntryType should be a POD with an identifiable "empty" state
// that can't occur in the table, and include the following member functions:
//
// KeyType GetKey() const; // Get the key from EntryType
// ValueType GetValue() const; // Get the value from EntryType
// bool IsEmpty() const; // Query whether EntryType is empty
// void SetKeyValue(KeyType Key, ValueType Value); // Write key and value into EntryType (ATOMICALLY! See below)
// static uint32 KeyHash(KeyType Key); // Convert Key to more well distributed hash
// static void ClearEntries(EntryType* Entries, int32 EntryCount); // Fill an array of entries with empty values
//
// The function "SetKeyValue" must be multi-thread safe when writing new items! This means writing the
// Key last and atomically, or writing the entire EntryType in a single write (say if the key and value
// are packed into a single integer word). Inline is recommended, since these functions are called a
// lot in the inner loop of the algorithm. A simple implementation of "KeyHash" can just return the
// Key (if it's already reasonable as a hash), or mix the bits if better distribution is required. A
// simple implementation of "ClearEntries" can just be a memset, if zero represents an empty entry.
//
// A set can be approximated by making "GetValue" a nop function, and just paying attention to the bool
// result from FindEntry, although you do need to either reserve a certain Key as invalid, or add
// space to store a valid flag as the Value. This class should only be used for small value types, as
// the values are embedded into the hash table, and not stored separately.
//
// Writes are implemented using a lock -- it would be possible to make writes lock free (or lock free
// when resizing doesn't occur), but it adds complexity. If we were to go that route, it would make
// sense to create a fully generic lock free set, which would be much more involved to implement and
// validate than this simple class, and might also offer somewhat worse read perf. Lock free containers
// that support item removal either need additional synchronization overhead on readers, so writers can
// tell if a reader is active and spin, or need graveyard markers and a garbage collection pass called
// periodically, which makes it no longer a simple standalone container.
//
// Lock free reads are accomplished by the reader atomically pulling the hash table pointer from the
// class. The hash table is self contained, with its size stored in the table itself, and hash tables
// are not freed until the class's destruction. So if the table needs to be reallocated due to a write,
// active readers will still have valid memory. This does mean that tables leak, but worst case, you
// end up with half of the memory being wasted. It would be possible to garbage collect the excess
// tables, but you'd need some kind of global synchronization to make sure no readers are active.
//
// Besides cleanup of wasted tables, it might be useful to provide a function to clear a table. This
// would involve clearing the Key for all the elements in the table (but leaving the memory allocated),
// and can be done safely with active readers. It's not possible to safely remove individual items due
// to the need to potentially move other items, which would break an active reader that has already
// searched past a moved item. But in the case of removing all items, we don't care when a reader fails,
// it's expected that eventually all readers will fail, regardless of where they are searching. A clear
// function could be useful if a lot of the data you are caching is no longer used, and you want to
// reset the cache.
//
template<typename EntryType, typename KeyType, typename ValueType>
class TGrowOnlyLockFreeHash
{
public:
	/** @param InMalloc - Allocator used for all table storage; must outlive this container. */
	TGrowOnlyLockFreeHash(FMalloc* InMalloc) : Malloc(InMalloc), HashTable(nullptr) {}

	~TGrowOnlyLockFreeHash()
	{
		// Outgrown tables are retired to a singly linked list rather than freed (lock free
		// readers may still be probing them), so this is the only place table memory is released.
		FHashHeader* HashTableNext;
		for (FHashHeader* HashTableCurrent = HashTable; HashTableCurrent; HashTableCurrent = HashTableNext)
		{
			HashTableNext = HashTableCurrent->Next;
			Malloc->Free(HashTableCurrent);
		}
	}

	/**
	 * Preallocate the hash table to a certain size
	 * @param Count - Number of EntryType elements to allocate (rounded up to a power of two)
	 * @warning Can only be called once, and only before any items have been added!
	 */
	void Reserve(uint32_t Count)
	{
		zen::RwLock::ExclusiveLockScope _(WriteCriticalSection);
		ZEN_ASSERT(HashTable.load(std::memory_order_relaxed) == nullptr);
		// Count is unsigned, so test equality with zero ("<= 0" is a tautological comparison)
		if (Count == 0)
		{
			Count = DEFAULT_INITIAL_SIZE;
		}
		// Table size must be a power of two so "Hash & (TableSize - 1)" can replace modulo
		Count = uint32_t(zen::NextPow2(Count));
		// FHashHeader already contains one EntryType, hence the "Count - 1"
		FHashHeader* HashTableLocal = (FHashHeader*)Malloc->Malloc(sizeof(FHashHeader) + (Count - 1) * sizeof(EntryType));
		HashTableLocal->Next = nullptr;
		HashTableLocal->TableSize = Count;
		HashTableLocal->Used = 0;
		EntryType::ClearEntries(HashTableLocal->Elements, Count);
		// Release pairs with the acquire load in Find(), so readers that see the new pointer
		// also see the cleared entries
		HashTable.store(HashTableLocal, std::memory_order_release);
	}

	/**
	 * Find an entry in the hash table. Lock free; safe to call concurrently with writers.
	 * @param Key - Key to search for
	 * @param OutValue - Memory location to write result value to. Left unmodified if Key isn't found. May be null.
	 * @param bIsAlreadyInTable - Optional result for whether key was found in table.
	 */
	void Find(KeyType Key, ValueType* OutValue, bool* bIsAlreadyInTable = nullptr) const
	{
		// Acquire pairs with the release store used when a table is published, guaranteeing the
		// table contents are visible before the pointer is dereferenced
		FHashHeader* HashTableLocal = HashTable.load(std::memory_order_acquire);
		if (HashTableLocal)
		{
			uint32_t TableMask = HashTableLocal->TableSize - 1;
			// Linear probing -- an empty slot terminates the probe chain, which is valid because
			// items are never removed, so insertion never leaves gaps
			for (uint32_t TableIndex = EntryType::KeyHash(Key) & TableMask; !HashTableLocal->Elements[TableIndex].IsEmpty();
				 TableIndex = (TableIndex + 1) & TableMask)
			{
				if (HashTableLocal->Elements[TableIndex].GetKey() == Key)
				{
					if (OutValue)
					{
						*OutValue = HashTableLocal->Elements[TableIndex].GetValue();
					}
					if (bIsAlreadyInTable)
					{
						*bIsAlreadyInTable = true;
					}
					return;
				}
			}
		}
		if (bIsAlreadyInTable)
		{
			*bIsAlreadyInTable = false;
		}
	}

	/**
	 * Add an entry with the given Key to the hash table, will do nothing if the item already exists
	 * @param Key - Key to add
	 * @param Value - Value to add for key
	 * @param bIsAlreadyInTable - Optional result for whether item was already in table
	 */
	void Emplace(KeyType Key, ValueType Value, bool* bIsAlreadyInTable = nullptr)
	{
		zen::RwLock::ExclusiveLockScope _(WriteCriticalSection);
		// After locking, re-check whether the item is already in the table -- another writer may
		// have added it between a caller's lock free Find and our acquisition of the lock. Pass
		// nullptr for the value so no dummy ValueType needs to be constructed.
		bool bFindResult;
		Find(Key, nullptr, &bFindResult);
		if (bFindResult)
		{
			if (bIsAlreadyInTable)
			{
				*bIsAlreadyInTable = true;
			}
			return;
		}
		// Check if there is space in the hash table for a new item. We resize when the hash
		// table gets half full or more. @todo: allow client to specify max load factor?
		// Relaxed load is sufficient: all stores to HashTable happen under WriteCriticalSection,
		// which we currently hold, so the lock already orders them relative to us.
		FHashHeader* HashTableLocal = HashTable.load(std::memory_order_relaxed);
		if (!HashTableLocal || (HashTableLocal->Used >= HashTableLocal->TableSize / 2))
		{
			int32_t GrowCount = HashTableLocal ? HashTableLocal->TableSize * 2 : DEFAULT_INITIAL_SIZE;
			FHashHeader* HashTableGrow = (FHashHeader*)Malloc->Malloc(sizeof(FHashHeader) + (GrowCount - 1) * sizeof(EntryType));
			// Chain the old table for cleanup in the destructor; it can't be freed yet because
			// lock free readers may still be probing it
			HashTableGrow->Next = HashTableLocal;
			HashTableGrow->TableSize = GrowCount;
			HashTableGrow->Used = 0;
			EntryType::ClearEntries(HashTableGrow->Elements, GrowCount);
			if (HashTableLocal)
			{
				// Rehash existing elements from the old table into the new table
				for (int32_t TableIndex = 0; TableIndex < HashTableLocal->TableSize; TableIndex++)
				{
					EntryType& Entry = HashTableLocal->Elements[TableIndex];
					if (!Entry.IsEmpty())
					{
						HashInsertInternal(HashTableGrow, Entry.GetKey(), Entry.GetValue());
					}
				}
			}
			HashTableLocal = HashTableGrow;
			// Publish the new table; release pairs with the acquire load in Find()
			HashTable.store(HashTableGrow, std::memory_order_release);
		}
		// Then add our new item. Safe with concurrent readers because SetKeyValue is required to
		// make the entry visible atomically (key written last / whole entry in a single write).
		HashInsertInternal(HashTableLocal, Key, Value);
		if (bIsAlreadyInTable)
		{
			*bIsAlreadyInTable = false;
		}
	}

	/**
	 * Find an entry with the given Key, adding it if not present
	 * @param Key - Key to find or add
	 * @param Value - Value to add for key if not found
	 * @param bIsAlreadyInTable - Optional result for whether item was already in table
	 */
	void FindOrAdd(KeyType Key, ValueType Value, bool* bIsAlreadyInTable = nullptr)
	{
		// Attempt to find the item lock free, before calling "Emplace", which locks the container
		bool bFindResult;
		Find(Key, nullptr, &bFindResult);
		if (bFindResult)
		{
			if (bIsAlreadyInTable)
			{
				*bIsAlreadyInTable = true;
			}
			return;
		}
		Emplace(Key, Value, bIsAlreadyInTable);
	}

private:
	// Self contained table: header plus a variable number of entries in one allocation
	struct FHashHeader
	{
		FHashHeader* Next;		  // Old buffers are stored in a linked list for cleanup
		int32_t		 TableSize;	  // Capacity; always a power of two
		int32_t		 Used;		  // Number of occupied entries
		EntryType	 Elements[1]; // Variable sized; storage continues past the header
	};

	FMalloc*				  Malloc;				// Allocator for all tables (not owned)
	std::atomic<FHashHeader*> HashTable;			// Current table; readers load with acquire
	zen::RwLock				  WriteCriticalSection; // Serializes all writers
	static constexpr int32_t  DEFAULT_INITIAL_SIZE = 1024;

	// Insert Key/Value into the given table, which must have at least one free slot. Callers
	// must hold WriteCriticalSection; concurrent lock free readers rely on SetKeyValue making
	// the entry visible atomically.
	static void HashInsertInternal(FHashHeader* HashTableLocal, KeyType Key, ValueType Value)
	{
		uint32_t TableMask = uint32_t(HashTableLocal->TableSize) - 1;
		// Linear probing; terminates because the load factor is capped at 1/2, so an empty
		// slot always exists
		for (uint32_t TableIndex = EntryType::KeyHash(Key) & TableMask;; TableIndex = (TableIndex + 1) & TableMask)
		{
			if (HashTableLocal->Elements[TableIndex].IsEmpty())
			{
				HashTableLocal->Elements[TableIndex].SetKeyValue(Key, Value);
				HashTableLocal->Used++;
				break;
			}
		}
	}
};
} // namespace zen
|