1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
|
/*
*
*/
#include "framework/scheduling/SerialScheduler.h"
#include "framework/util/Configuration.h"
#include "util/types.h"
#define ENABLE_TIMER
#define TS_TEST
#include <thread>
#include "framework/DynamicExtension.h"
#include "framework/scheduling/FIFOScheduler.h"
#include "shard/TrieSpline.h"
#include "query/rangecount.h"
#include "framework/interface/Record.h"
#include "file_util.h"
#include "standard_benchmarks.h"
#include "framework/reconstruction/FixedShardCountPolicy.h"
#include <gsl/gsl_rng.h>
#include "psu-util/timer.h"
typedef de::Record<uint64_t, uint64_t> Rec;
typedef de::TrieSpline<Rec> Shard;
typedef de::rc::Query<Shard> Q;
typedef de::DynamicExtension<Shard, Q, de::DeletePolicy::TOMBSTONE, de::FIFOScheduler> Ext;
typedef Q::Parameters QP;
typedef de::DEConfiguration<Shard, Q, de::DeletePolicy::TOMBSTONE, de::FIFOScheduler> Conf;
void usage(char *progname) {
fprintf(stderr, "%s reccnt datafile queryfile\n", progname);
}
int main(int argc, char **argv) {
if (argc < 4) {
usage(argv[0]);
exit(EXIT_FAILURE);
}
size_t n = atol(argv[1]);
std::string d_fname = std::string(argv[2]);
std::string q_fname = std::string(argv[3]);
auto data = read_sosd_file<Rec>(d_fname, n);
auto queries = read_range_queries<QP>(q_fname, .0001);
std::vector<size_t> sfs = {2, 3, 4, 5, 6, 7, 8}; //, 4, 8, 16, 32, 64, 128, 256, 512, 1024};
size_t buffer_size = 8000;
std::vector<size_t> policies = {1};
for (auto pol: policies) {
for (size_t i=0; i<sfs.size(); i++) {
auto policy = get_policy<Shard, Q>(sfs[i], buffer_size, pol, n);
auto config = Conf(std::move(policy));
config.recon_enable_maint_on_flush = false;
config.recon_maint_disabled = true;
config.buffer_flush_trigger = 4000;
auto extension = new Ext(std::move(config));
/* warmup structure w/ 10% of records */
size_t warmup = .1 * n;
for (size_t j=0; j<warmup; j++) {
while (!extension->insert(data[j])) {
usleep(1);
}
//fprintf(stderr, "%ld\r", j);
}
extension->await_version();
fprintf(stderr, "\n[I] Running Insertion Benchmark\n");
TIMER_INIT();
TIMER_START();
for (size_t j=warmup; j<data.size(); j++) {
while (!extension->insert(data[j])) {
usleep(1);
fprintf(stderr, "insert blocked %ld\r", j);
}
}
TIMER_STOP();
auto total_insert_lat = TIMER_RESULT();
fprintf(stderr, "\n[I] Finished running insertion benchmark\n");
extension->await_version();
fprintf(stderr, "[I] Running query benchmark\n");
size_t total = 0;
/* repeat the queries a bunch of times */
TIMER_START();
for (size_t l=0; l<10; l++) {
for (size_t j=0; j<queries.size(); j++) {
auto q = queries[j];
auto res = extension->query(std::move(q));
total += res.get();
}
}
TIMER_STOP();
auto total_query_lat = TIMER_RESULT();
fprintf(stderr, "[I] Finished running query benchmark\n");
auto query_latency = total_query_lat / (10*queries.size());
auto insert_throughput = (size_t) ((double) (n - warmup) / (double) total_insert_lat *1.0e9);
fprintf(stdout, "%ld\t%ld\t%ld\t%ld\t%ld\n", pol, sfs[i], n, insert_throughput, query_latency);
fprintf(stderr, "%ld\n", total);
fflush(stdout);
extension->print_structure();
delete extension;
}
}
fflush(stderr);
}
|