-
-
Notifications
You must be signed in to change notification settings - Fork 7.3k
/
lfu_cache.cpp
304 lines (263 loc) · 8.49 KB
/
lfu_cache.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
/**
* @file
* @brief Implementation for [LFU Cache]
* (https://en.wikipedia.org/wiki/Least_frequently_used)
*
* @details
* LFU discards the least frequently used value. if there are multiple items
* with the same minimum frequency then, the least recently used among them is
* discarded. Data structures used - doubly linked list and unordered_map(hash
* map).
*
* Hashmap maps the key to the address of the node of the linked list and its
* current usage frequency. If the element is accessed the element is removed
* from the linked list of the current frequency and added to the linked list of
* incremented frequency.
*
* When the cache is full, the last element in the minimum frequency linked list
* is popped.
*
* @author [Karan Sharma](https://github.com/deDSeC00720)
*/
#include <cassert> // for assert
#include <iostream> // for std::cout
#include <unordered_map> // for std::unordered_map
/**
* @namespace
* @brief Other algorithms
*/
namespace others {
/**
* @namespace
* @brief Cache algorithm
*/
namespace Cache {
/**
* @class
* @brief Node for a doubly linked list with data, prev and next pointers
* @tparam T type of the data of the node
*/
template <typename T>
class D_Node {
public:
T data; ///< data of the node
D_Node<T> *prev; ///< previous node in the doubly linked list
D_Node<T> *next; ///< next node in the doubly linked list
explicit D_Node(T data) : data(data), prev(nullptr), next(nullptr) {}
};
template <typename K, typename V>
using CacheNode = D_Node<std::pair<K, V>>;
/**
* @class
* @brief LFUCache
* @tparam K type of key in the LFU
* @tparam V type of value in the LFU
*/
template <typename K, typename V>
class LFUCache {
std::unordered_map<K, std::pair<CacheNode<K, V> *, int>>
node_map; ///< maps the key to the node address and frequency
std::unordered_map<int, std::pair<CacheNode<K, V> *, CacheNode<K, V> *>>
freq_map; ///< maps the frequency to doubly linked list
int minFreq; ///< minimum frequency in the cache
int _capacity; ///< maximum capacity of the cache
public:
/**
* @brief Constructor, Initialize with minFreq and _capacity.
* @param _capacity Total capacity of the cache.
*/
explicit LFUCache(int _capacity) : minFreq(0), _capacity(_capacity) {}
private:
/**
* @brief push the node at first position in the linked list of given
* frequency
* @param freq the frequency mapping to the linked list where node should be
* pushed.
* @param node node to be pushed to the linked list.
*/
void push(int freq, CacheNode<K, V> *node) {
// if freq is not present, then make a new list with node as the head as
// well as tail.
if (!freq_map.count(freq)) {
freq_map[freq] = {node, node};
return;
}
std::pair<CacheNode<K, V> *, CacheNode<K, V> *> &p = freq_map[freq];
// insert the node at the beginning of the linked list and update the
// head.
p.first->prev = node;
node->next = p.first;
p.first = node;
}
/**
* @brief increase the frequency of node and push it in the respective list.
* @param p_node the node to be updated
*/
void increase_frequency(std::pair<CacheNode<K, V> *, int> &p_node) {
CacheNode<K, V> *node = p_node.first;
int freq = p_node.second;
std::pair<CacheNode<K, V> *, CacheNode<K, V> *> &p = freq_map[freq];
// if the given node is the only node in the list,
// then erase the frequency from map
// and increase minFreq by 1.
if (p.first == node && p.second == node) {
freq_map.erase(freq);
if (minFreq == freq) {
minFreq = freq + 1;
}
} else {
// remove the given node from current freq linked list
CacheNode<K, V> *prev = node->prev;
CacheNode<K, V> *next = node->next;
node->prev = nullptr;
node->next = nullptr;
if (prev) {
prev->next = next;
} else {
p.first = next;
}
if (next) {
next->prev = prev;
} else {
p.second = prev;
}
}
push(freq + 1, node);
++p_node.second;
}
/**
* @brief pop the last node in the least frequently used linked list
*/
void pop() {
std::pair<CacheNode<K, V> *, CacheNode<K, V> *> &p = freq_map[minFreq];
// if there is only one node
// remove the node and erase
// the frequency from freq_map
if (p.first == p.second) {
delete p.first;
freq_map.erase(minFreq);
return;
}
// remove the last node in the linked list
CacheNode<K, V> *temp = p.second;
p.second = temp->prev;
p.second->next = nullptr;
delete temp;
}
public:
/**
* @brief upsert a key-value pair
* @param key key of the key-value pair
* @param value value of the key-value pair
*/
void put(K key, V value) {
// update the value if key already exists
if (node_map.count(key)) {
node_map[key].first->data.second = value;
increase_frequency(node_map[key]);
return;
}
// if the cache is full
// remove the least frequently used item
if (node_map.size() == _capacity) {
node_map.erase(freq_map[minFreq].second->data.first);
pop();
}
// insert the new node and set minFreq to 1
CacheNode<K, V> *node = new CacheNode<K, V>({key, value});
node_map[key] = {node, 1};
minFreq = 1;
push(1, node);
}
/**
* @brief get the value of the key-value pair if exists
* @param key key of the key-value pair
* @return the value mapped to the given key
* @exception exception is thrown if the key is not present in the cache
*/
V get(K key) {
if (!node_map.count(key)) {
throw std::runtime_error("key is not present in the cache");
}
// increase the frequency and return the value
V value = node_map[key].first->data.second;
increase_frequency(node_map[key]);
return value;
}
/**
* @brief Returns the number of items present in the cache.
* @return number of items in the cache
*/
int size() const { return node_map.size(); }
/**
* @brief Returns the total capacity of the cache
* @return Total capacity of the cache
*/
int capacity() const { return _capacity; }
/**
* @brief returns true if the cache is empty, false otherwise.
* @return true if the cache is empty, false otherwise.
*/
bool empty() const { return node_map.empty(); }
/**
* @brief destructs the cache, iterates on the map and deletes every node
* present in the cache.
*/
~LFUCache() {
auto it = node_map.begin();
while (it != node_map.end()) {
delete it->second.first;
++it;
}
}
};
} // namespace Cache
} // namespace others
/**
* @brief self test implementation
* @return void
*/
static void test() {
others::Cache::LFUCache<int, int> cache(5);
// test the initial state of the cache
assert(cache.size() == 0);
assert(cache.capacity() == 5);
assert(cache.empty());
// test insertion in the cache
cache.put(1, 10);
cache.put(-2, 20);
// test the state of cache after inserting some items
assert(cache.size() == 2);
assert(cache.capacity() == 5);
assert(!cache.empty());
// test getting items from the cache
assert(cache.get(1) == 10);
assert(cache.get(-2) == 20);
cache.put(-3, -30);
cache.put(4, 40);
cache.put(5, -50);
cache.put(6, 60);
// test the state after inserting more items than the capacity
assert(cache.size() == 5);
assert(cache.capacity() == 5);
assert(!cache.empty());
// test retrieval of all items in the cache
assert(cache.get(1) == 10);
assert(cache.get(-2) == 20);
// fetching -3 throws runtime_error
// as -3 was evicted being the least frequently used
// when 6 was added
// assert(cache.get(-3) == -30);
assert(cache.get(4) == 40);
assert(cache.get(5) == -50);
assert(cache.get(6) == 60);
std::cout << "test - passed\n";
}
/**
* @brief main function
* @return 0 on exit
*/
int main() {
test(); // run the self test implementation
return 0;
}