-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindex.cc
120 lines (105 loc) · 3.97 KB
/
index.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
#include "index.h"
#include <iostream>
#include <filesystem>
#include <chrono>
#include <fstream>
namespace fs = std::filesystem;
/**
 * Looks up `key` in the in-memory index and reports where its value lives.
 *
 * Levels are scanned from 0 upward; within a level, files are visited in the
 * level container's iteration order (the original author notes this is
 * "latest first" -- that depends on how IndexLevel is ordered).
 *
 * @param key       key to look up
 * @param level     out: level of the first file containing the key; it is also
 *                  used as the scan counter, so it equals maxLevel on a miss
 * @param filename  out: identifier of the file that holds the key (hit only)
 * @param offset    out: stored offset of the entry (hit only)
 * @param length    out: stored length of the entry (hit only)
 * @param deleted   out: stored deletion flag of the entry (hit only)
 *
 * If `levels` is empty, no output parameter is written at all.
 */
void Index::get(uint64_t key, int &level, uint64_t &filename, uint64_t &offset, uint64_t &length, bool &deleted) const {
    if (levels.empty()) {
        return;
    }

    level = 0;
    while (level < maxLevel) {
        for (const auto &[fileId, tree]: levels[level]) {
            const auto hit = tree->find(key);
            if (hit == tree->end()) {
                continue; // key is not indexed in this file
            }
            // First match wins: copy the entry out and stop searching.
            const auto &node = hit->second;
            filename = fileId;
            offset = node->offset_;
            length = node->length_;
            deleted = node->deleted_;
            return;
        }
        ++level;
    }
}
bool Index::find(uint64_t key) {
for (auto &level: levels) {
for (auto &pair: level) {
std::shared_ptr<IndexTree> tree = pair.second;
auto iter = tree->find(key);
// if key in disk and not marked as deleted
if (iter != tree->end() && !(iter->second->is_deleted())) {
return true;
}
}
}
return false;
}
/**
 * Records an index entry for `key` under the given level and file.
 *
 * @param key        key being indexed
 * @param level      level the file belongs to; calls with a level outside
 *                   [0, levels.size()) are ignored
 * @param filename   file identifier as a decimal string (parsed with std::stoull)
 * @param offset     offset stored in the new IndexNode
 * @param length     length stored in the new IndexNode
 * @param timestamp  timestamp stored in the new IndexNode
 * @param deleted    deletion flag stored in the new IndexNode
 *
 * @throws std::invalid_argument / std::out_of_range if `filename` is not a
 *         parsable unsigned integer (propagated from std::stoull).
 *
 * NOTE(review): the entry is added with IndexTree::insert; if IndexTree follows
 * std::map semantics an already-present key is left unchanged -- confirm that
 * this is intended.
 */
void
Index::put(uint64_t key, int level, const std::string &filename, uint64_t offset, uint64_t length,
           std::time_t timestamp, bool deleted) {
    // `levels` holds exactly one slot per level, so valid indices end at size() - 1.
    // The previous `level > maxLevel` guard let level == maxLevel (and negative
    // levels) index past the vector.
    if (level < 0 || static_cast<std::size_t>(level) >= levels.size()) {
        return;
    }

    // Parse the file id once instead of on every container access.
    const auto fileId = std::stoull(filename);

    // operator[] creates the slot for a file seen for the first time; give it a tree.
    auto &tree = levels[level][fileId];
    if (!tree) {
        tree = std::make_shared<IndexTree>();
    }
    (void) tree->insert({key, std::make_shared<IndexNode>(offset, length, timestamp, deleted)});
}
/**
 * Creates an empty index rooted at `dir`.
 *
 * @param dir  directory path remembered in dir_ (used later by recover())
 *
 * The level table is sized up front to maxLevel empty levels.
 */
Index::Index(const std::string &dir) : dir_(dir) {
    levels.assign(maxLevel, IndexLevel());
}
// Compiler-generated destructor: no custom teardown is performed here.
Index::~Index() = default;
void Index::reset() {
levels.clear();
levels = std::vector<IndexLevel>(maxLevel, IndexLevel());
}
namespace {

/// Reads one uint64_t (raw bytes, host byte order) that starts `bytesFromEnd`
/// bytes before the end of `file`. Returns false and leaves `out` untouched if
/// the seek or the read fails.
bool readU64FromEnd(std::ifstream &file, std::streamoff bytesFromEnd, uint64_t &out) {
    uint64_t value = 0U;
    if (!file.seekg(-bytesFromEnd, std::ios_base::end)) {
        return false;
    }
    if (!file.read(reinterpret_cast<char *>(&value), sizeof(value))) {
        return false;
    }
    out = value;
    return true;
}

} // namespace

/**
 * Rebuilds the in-memory index (and `filter`) from the files found under dir_.
 *
 * Layout read from each data file, as implied by the seeks below:
 *   - the last 8 bytes hold n, the number of entries;
 *   - entry i (1-based) stores its key 8 * (1 + 2i) bytes before the end and
 *     its offset 8 * 2i bytes before the end;
 *   - the value starts at `offset + 8` from the beginning of the file and runs
 *     up to the next '\0'.
 *
 * Files whose path relative to the first path component is "wal" or "immwal"
 * are skipped. For every other file the remaining path is expected to look
 * like "<level><separator><file id>".
 *
 * NOTE(review): the leading directory is removed by cutting at the FIRST
 * separator of the path string, so this presumably only works when dir_ is a
 * single relative path component -- confirm against callers.
 *
 * A file that cannot be opened, is too short to hold its footer, or declares
 * more entries than fit in it is skipped. Recovery of a file stops at the
 * first entry that cannot be read.
 *
 * @param filter  receives filter.add(key, level, file id) for each recovered entry
 *
 * @throws std::invalid_argument / std::out_of_range if the level directory or
 *         file name is not numeric (propagated from std::stoi / std::stoull).
 */
void Index::recover(Filter &filter) {
    if (!fs::exists(dir_)) {
        return;
    }

    constexpr std::streamoff kWord = static_cast<std::streamoff>(sizeof(uint64_t));

    for (auto &p: fs::recursive_directory_iterator(dir_)) {
        if (fs::is_directory(p)) {
            continue;
        }

        const std::string fullPath = p.path().string();

        // Strip everything up to and including the first separator.
        std::size_t pos = fullPath.find(fs::path::preferred_separator);
        const std::string relPath = fullPath.substr(pos + 1U, fullPath.size());

        // Write-ahead logs are not data files; skip them before touching the disk.
        if (relPath == "wal" || relPath == "immwal") {
            continue;
        }

        std::ifstream file(fullPath, std::ios::in | std::ios::binary);
        (void) file.seekg(0, std::ios_base::end);
        const std::streamoff fileSize = file.tellg();
        if (!file || fileSize < kWord) {
            continue; // unreadable, or too small to contain the entry count
        }

        // The entry count lives in the last 8 bytes of the file.
        uint64_t n = 0U;
        if (!readU64FromEnd(file, kWord, n) || n == 0U) {
            continue;
        }

        // Each entry occupies 16 footer bytes; reject counts the file cannot hold.
        // This also keeps the signed offset arithmetic below from overflowing.
        const auto maxEntries = static_cast<uint64_t>((fileSize - kWord) / (2 * kWord));
        if (n > maxEntries) {
            continue;
        }

        // Level and file id depend only on the path, so parse them once per file.
        pos = relPath.find(fs::path::preferred_separator);
        const int level = std::stoi(relPath.substr(0, pos));
        const std::string filename = relPath.substr(pos + 1, relPath.size());
        const auto fileId = std::stoull(filename);

        for (uint64_t i = 1U; i <= n; ++i) {
            // Distance from the end of the file to this entry's offset field;
            // the key sits one word further back.
            const std::streamoff offsetPos = kWord * static_cast<std::streamoff>(2U * i);

            uint64_t key = 0U;
            uint64_t offset = 0U;
            if (!readU64FromEnd(file, offsetPos + kWord, key) ||
                !readU64FromEnd(file, offsetPos, offset)) {
                break;
            }

            // The value is read only to learn its length.
            std::string value;
            if (!file.seekg(static_cast<std::streamoff>(offset + sizeof(uint64_t))) ||
                !std::getline(file, value, '\0')) {
                break;
            }

            put(key, level, filename, offset, value.size(),
                std::chrono::duration_cast<std::chrono::milliseconds>(
                        std::chrono::system_clock::now().time_since_epoch()
                ).count(), false);
            // sync with filter
            filter.add(key, level, fileId);
        }
        // `file` is closed by its destructor at the end of each iteration.
    }
}