From aa5832f5e1bf7fcbd0a9507677a650b5e749ef46 Mon Sep 17 00:00:00 2001 From: Douglas Rumbaugh Date: Wed, 7 Jun 2023 10:26:24 -0400 Subject: Sampling benchmark --- benchmarks/bench.h | 206 +++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 206 insertions(+) create mode 100644 benchmarks/bench.h (limited to 'benchmarks/bench.h') diff --git a/benchmarks/bench.h b/benchmarks/bench.h new file mode 100644 index 0000000..8af244a --- /dev/null +++ b/benchmarks/bench.h @@ -0,0 +1,206 @@ +#ifndef H_BENCH +#define H_BENCH +#include "framework/DynamicExtension.h" +#include "shard/WSS.h" + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +typedef uint64_t key_type; +typedef uint32_t value_type; +typedef uint64_t weight_type; + +typedef de::WeightedRecord WRec; +typedef de::DynamicExtension, de::WSSQuery> ExtendedWSS; + +static gsl_rng *g_rng; +static std::set *g_to_delete; +static bool g_osm_data; + +static key_type g_min_key = UINT64_MAX; +static key_type g_max_key = 0; + +static size_t g_max_record_cnt = 0; +static size_t g_reccnt = 0; + +static constexpr unsigned int DEFAULT_SEED = 0; + +static unsigned int get_random_seed() +{ + unsigned int seed = 0; + std::fstream urandom; + urandom.open("/dev/urandom", std::ios::in|std::ios::binary); + urandom.read((char *) &seed, sizeof(seed)); + urandom.close(); + + return seed; +} + +static key_type osm_to_key(const char *key_field) { + double tmp_key = (atof(key_field) + 180) * 10e6; + return (key_type) tmp_key; +} + +static void init_bench_rng(unsigned int seed, const gsl_rng_type *type) +{ + g_rng = gsl_rng_alloc(type); + gsl_rng_set(g_rng, seed); +} + +static void init_bench_env(size_t max_reccnt, bool random_seed, bool osm_correction=true) +{ + unsigned int seed = (random_seed) ? get_random_seed() : DEFAULT_SEED; + init_bench_rng(seed, gsl_rng_mt19937); + g_to_delete = new std::set(); + g_osm_data = osm_correction; + g_max_record_cnt = max_reccnt; + g_reccnt = 0; +} + +static void delete_bench_env() +{ + gsl_rng_free(g_rng); + delete g_to_delete; +} + +static bool next_record(std::fstream *file, WRec *record) +{ + if (g_reccnt >= g_max_record_cnt) return false; + + std::string line; + if (std::getline(*file, line, '\n')) { + std::stringstream line_stream(line); + std::string key_field; + std::string value_field; + std::string weight_field; + + std::getline(line_stream, value_field, '\t'); + std::getline(line_stream, key_field, '\t'); + std::getline(line_stream, weight_field, '\t'); + + record->key = (g_osm_data) ? osm_to_key(key_field.c_str()) : atol(key_field.c_str()); + record->value = atol(value_field.c_str()); + record->weight = atof(weight_field.c_str()); + + if (record->key < g_min_key) g_min_key = record->key; + + if (record->key > g_max_key) g_max_key = record->key; + + g_reccnt++; + + return true; + } + + return false; +} + +static bool build_insert_vec(std::fstream *file, std::vector &vec, size_t n) { + vec.clear(); + for (size_t i=0; i= 1) fprintf(stderr, "\n"); +} + +static bool warmup(std::fstream *file, ExtendedWSS *extended_wss, size_t count, double delete_prop, bool progress=true) +{ + size_t del_buf_size = 10000; + size_t delete_idx = del_buf_size; + + std::vector delbuf; + std::set deleted_keys; + + de::wss_query_parms parms; + parms.rng = g_rng; + parms.sample_size = del_buf_size; + + size_t inserted = 0; + + double last_percent = 0; + for (size_t i=0; iinsert(rec); + + if (i > extended_wss->get_buffer_capacity() && delete_idx >= delbuf.size()) { + extended_wss->query(&parms); + delete_idx = 0; + deleted_keys.clear(); + } + + if (i > extended_wss->get_buffer_capacity() && gsl_rng_uniform(g_rng) < delete_prop) { + auto rec = delbuf[delete_idx]; + delete_idx++; + + if (deleted_keys.find(rec) == deleted_keys.end()) { + extended_wss->erase(rec); + deleted_keys.insert(rec); + } + } + + if (progress && ((double) i / (double) count) - last_percent > .01) { + progress_update((double) i / (double) count, "warming up:"); + last_percent = (double) i / (double) count; + } + } + + if (progress) { + progress_update(1, "warming up:"); + } + + return true; +} + + +static void reset_de_perf_metrics() { + + /* + * rejection counters are zeroed automatically by the + * sampling function itself. + */ + + RESET_IO_CNT(); +} + +#endif // H_BENCH -- cgit v1.2.3