-
Notifications
You must be signed in to change notification settings - Fork 5
/
fptree.h
447 lines (338 loc) · 10.5 KB
/
fptree.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
// Copyright (c) Simon Fraser University. All rights reserved.
// Licensed under the MIT license.
//
// Authors:
// George He <georgeh@sfu.ca>
// Duo Lu <luduol@sfu.ca>
// Tianzheng Wang <tzwang@sfu.ca>
#pragma once
#include <stdio.h>
#include <stdlib.h>
#include <stdint.h>
#include <sys/types.h>
#include <bits/hash_bytes.h>
#include <unistd.h>
#include <time.h>
#include <string.h>
#include <immintrin.h>
#include <tbb/spin_mutex.h>
#include <tbb/spin_rw_mutex.h>
//#include "oneapi/tbb/spin_mutex.h"
//#include "oneapi/tbb/spin_rw_mutex.h"
#include <iostream>
#include <string>
#include <cstdint>
#include <cstring>
#include <cmath>
#include <algorithm>
#include <array>
#include <utility>
#include <tuple>
#include <atomic>
#include <queue>
#include <limits>
#include <chrono>
#include <vector>
#include <random>
#include <climits>
#include <functional>
#include <cassert>
#include <thread>
#include <boost/lockfree/queue.hpp>
#include <sys/stat.h>
#ifdef TEST_MODE
#define MAX_INNER_SIZE 3
#define MAX_LEAF_SIZE 4
#define SIZE_ONE_BYTE_HASH 1
#define SIZE_PMEM_POINTER 16
#else
#define MAX_INNER_SIZE 128
#define MAX_LEAF_SIZE 64
#define SIZE_ONE_BYTE_HASH 1
#define SIZE_PMEM_POINTER 16
#endif
#if MAX_LEAF_SIZE > 64
#error "Number of kv pairs in LeafNode must be <= 64."
#endif
static const uint64_t offset = std::numeric_limits<uint64_t>::max() >> (64 - MAX_LEAF_SIZE);
enum Result { Insert, Update, Split, Abort, Delete, Remove, NotFound };
#ifdef PMEM
#include <libpmemobj.h>
#define PMEMOBJ_POOL_SIZE ((size_t)(1024 * 1024 * 11) * 1000) /* 11 GB */
POBJ_LAYOUT_BEGIN(FPtree);
POBJ_LAYOUT_ROOT(FPtree, struct List);
POBJ_LAYOUT_TOID(FPtree, struct LeafNode);
POBJ_LAYOUT_END(FPtree);
POBJ_LAYOUT_BEGIN(Array);
POBJ_LAYOUT_TOID(Array, struct Log);
POBJ_LAYOUT_END(Array);
inline PMEMobjpool *pop;
#endif
static uint8_t getOneByteHash(uint64_t key);
struct KV
{
uint64_t key;
uint64_t value;
KV() {}
KV(uint64_t key, uint64_t value) { this->key = key; this->value = value; }
};
struct LeafNodeStat
{
uint64_t kv_idx; // bitmap index of key
uint64_t count; // number of kv in leaf
uint64_t min_key; // min key excluding key
};
// This Bitset class implements bitmap of size <= 64
// The bitmap iterates from right to left - starting from least significant bit
// off contains 0 on some significant bits when bitmap size < 64
class Bitset
{
public:
uint64_t bits;
Bitset()
{
bits = 0;
}
~Bitset() {}
Bitset(const Bitset& bts)
{
bits = bts.bits;
}
Bitset& operator=(const Bitset& bts)
{
bits = bts.bits;
return *this;
}
inline void set(const size_t pos)
{
bits |= ((uint64_t)1 << pos);
}
inline void reset(const size_t pos)
{
bits &= ~((uint64_t)1 << pos);
}
inline void clear()
{
bits = 0;
}
inline bool test(const size_t pos) const
{
return bits & ((uint64_t)1 << pos);
}
inline void flip()
{
bits ^= offset;
}
inline bool is_full()
{
return bits == offset;
}
inline size_t count()
{
return __builtin_popcountl(bits);
}
inline size_t first_set()
{
size_t idx = __builtin_ffsl(bits);
return idx ? idx - 1 : MAX_LEAF_SIZE;
}
inline size_t first_zero()
{
size_t idx = __builtin_ffsl(bits ^ offset);
return idx ? idx - 1 : MAX_LEAF_SIZE;
}
void print_bits()
{
for (uint64_t i = 0; i < 64; i++) { std::cout << ((bits >> i) & 1); }
std::cout << std::endl;
}
};
/*******************************************************
Define node struture
********************************************************/
struct BaseNode
{
bool isInnerNode;
friend class FPtree;
public:
BaseNode();
} __attribute__((aligned(64)));
struct InnerNode : BaseNode
{
uint64_t nKey;
uint64_t keys[MAX_INNER_SIZE];
BaseNode* p_children[MAX_INNER_SIZE + 1];
friend class FPtree;
public:
InnerNode();
InnerNode(uint64_t key, BaseNode* left, BaseNode* right);
InnerNode(const InnerNode& inner);
~InnerNode();
// for using mempool only where constructor is not called
void init(uint64_t key, BaseNode* left, BaseNode* right);
// return index of child in p_children when searching key in this innernode
uint64_t findChildIndex(uint64_t key);
// remove key at index, default remove right child (or left child if false)
void removeKey(uint64_t index, bool remove_right_child);
// add key at index pos, default add child to the right
void addKey(uint64_t index, uint64_t key, BaseNode* child, bool add_child_right);
} __attribute__((aligned(64)));
struct LeafNode : BaseNode
{
__attribute__((aligned(64))) uint8_t fingerprints[MAX_LEAF_SIZE];
Bitset bitmap;
KV kv_pairs[MAX_LEAF_SIZE];
#ifdef PMEM
TOID(struct LeafNode) p_next;
#else
LeafNode* p_next;
#endif
std::atomic<uint64_t> lock;
friend class FPtree;
public:
#ifndef PMEM
LeafNode();
LeafNode(const LeafNode& leaf);
LeafNode& operator=(const LeafNode& leaf);
#endif
inline bool isFull() { return this->bitmap.is_full(); }
void addKV(struct KV kv);
// find index of kv that has kv.key = key, return MAX_LEAF_SIZE if key not found
uint64_t findKVIndex(uint64_t key);
// return min key in leaf
uint64_t minKey();
bool Lock()
{
uint64_t expected = 0;
return std::atomic_compare_exchange_strong(&lock, &expected, 1);
}
void Unlock()
{
this->lock = 0;
}
void getStat(uint64_t key, LeafNodeStat& lstat);
} __attribute__((aligned(64)));
#ifdef PMEM
struct argLeafNode
{
size_t size;
bool isInnerNode;
Bitset bitmap;
__attribute__((aligned(64))) uint8_t fingerprints[MAX_LEAF_SIZE];
KV kv_pairs[MAX_LEAF_SIZE];
uint64_t lock;
argLeafNode(LeafNode* leaf)
{
isInnerNode = false;
size = sizeof(struct LeafNode);
memcpy(fingerprints, leaf->fingerprints, sizeof(leaf->fingerprints));
memcpy(kv_pairs, leaf->kv_pairs, sizeof(leaf->kv_pairs));
bitmap = leaf->bitmap;
lock = 1;
}
argLeafNode(struct KV kv)
{
isInnerNode = false;
size = sizeof(struct LeafNode);
kv_pairs[0] = kv;
fingerprints[0] = getOneByteHash(kv.key);
bitmap.set(0);
lock = 0;
}
};
static int constructLeafNode(PMEMobjpool *pop, void *ptr, void *arg);
struct List
{
TOID(struct LeafNode) head;
};
/*
uLog
*/
struct Log
{
TOID(struct LeafNode) PCurrentLeaf;
TOID(struct LeafNode) PLeaf;
};
static const uint64_t sizeLogArray = 128;
static boost::lockfree::queue<Log*> splitLogQueue = boost::lockfree::queue<Log*>(sizeLogArray);
static boost::lockfree::queue<Log*> deleteLogQueue = boost::lockfree::queue<Log*>(sizeLogArray);
#endif
struct Stack //TODO: Get rid of Stack
{
public:
static const uint64_t kMaxNodes = 32;
InnerNode* innerNodes[kMaxNodes];
uint64_t num_nodes;
Stack() : num_nodes(0) {}
~Stack() { num_nodes = 0; }
inline void push(InnerNode* node)
{
assert(num_nodes < kMaxNodes && "Error: exceed max stack size");
this->innerNodes[num_nodes++] = node;
}
InnerNode* pop() { return num_nodes == 0 ? nullptr : this->innerNodes[--num_nodes]; }
inline bool isEmpty() { return num_nodes == 0; }
inline InnerNode* top() { return num_nodes == 0 ? nullptr : this->innerNodes[num_nodes - 1]; }
inline void clear() { num_nodes = 0; }
};
static thread_local Stack stack_innerNodes;
static thread_local InnerNode* inners[32];
static thread_local short ppos[32];
struct FPtree
{
BaseNode *root;
tbb::speculative_spin_rw_mutex speculative_lock;
InnerNode* right_most_innnerNode; // for bulkload
public:
FPtree();
~FPtree();
BaseNode* getRoot () { return this->root; }
void printFPTree(std::string prefix, BaseNode *root);
// return flse if kv.key not found, otherwise set kv.value to value associated with kv.key
uint64_t find(uint64_t key);
// return false if kv.key not found, otherwise update value associated with key
bool update(struct KV kv);
// return false if key already exists, otherwise insert kv
bool insert(struct KV kv);
// delete key from tree
bool deleteKey(uint64_t key);
// TODO: fix/optimize iterator based scan methods
// initialize scan by finding the first kv with kv.key >= key
void scanInitialize(uint64_t key);
KV scanNext();
bool scanComplete();
uint64_t rangeScan(uint64_t key, uint64_t scan_size, char* result);
#ifdef PMEM
bool bulkLoad(float load_factor);
void recoverSplit(Log* uLog);
void recoverDelete(Log* uLog);
void recover();
void pmemInit(const char* path_ptr, long long pool_size);
void showList();
#endif
private:
// return leaf that may contain key, does not push inner nodes
LeafNode* findLeaf(uint64_t key);
// return leaf that may contain key, push all innernodes on traversal path into stack
LeafNode* findLeafAndPushInnerNodes(uint64_t key);
uint64_t findSplitKey(LeafNode* leaf);
uint64_t splitLeaf(LeafNode* leaf);
void updateParents(uint64_t splitKey, InnerNode* parent, BaseNode* leaf);
void splitLeafAndUpdateInnerParents(LeafNode* reachedLeafNode, Result decision, struct KV kv,
bool updateFunc, uint64_t prevPos);
// merge parent with sibling, may incur further merges. Remove key from indexNode after
void removeLeafAndMergeInnerNodes(short i, short indexNode_level);
// try transfer a key from sender to receiver, sender and receiver should be immediate siblings
// If receiver & sender are inner nodes, will assume the only child in receiver is at index 0
// return false if cannot borrow key from sender
bool tryBorrowKey(InnerNode* parent, uint64_t receiver_idx, uint64_t sender_idx);
uint64_t minKey(BaseNode* node);
LeafNode* minLeaf(BaseNode* node);
LeafNode* maxLeaf(BaseNode* node);
void sortKV();
uint64_t size_volatile_kv;
KV volatile_current_kv[MAX_LEAF_SIZE];
LeafNode* current_leaf;
uint64_t bitmap_idx;
friend class Inspector;
};