summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorDouglas Rumbaugh <dbr4@psu.edu>2023-06-05 12:45:40 -0400
committerDouglas Rumbaugh <dbr4@psu.edu>2023-06-05 12:45:40 -0400
commit1b332b5766b00df4be21825a4d8cd657e7f13433 (patch)
treecd83045a7adfde1bcd42de256c6ba3211d6d158d
parentf8f3cb6c55b085fa260c7f80644d5ef057d4a070 (diff)
downloaddynamic-extension-1b332b5766b00df4be21825a4d8cd657e7f13433.tar.gz
TrieSpline tests+bugfixes
-rw-r--r--CMakeLists.txt8
-rw-r--r--include/shard/TrieSpline.h29
-rw-r--r--tests/triespline_tests.cpp217
3 files changed, 240 insertions, 14 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 367f2e9..420c19c 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -12,6 +12,8 @@ set(bench True)
set(CMAKE_RUNTIME_OUTPUT_DIRECTORY "${CMAKE_CURRENT_SOURCE_DIR}/bin")
+add_compile_options(-Iinclude -Iexternal/PLEX/include)
+
if (debug)
add_compile_options(-g -O0)
add_compile_options(-fsanitize=address)
@@ -22,12 +24,10 @@ else()
add_compile_options(-O3)
endif()
-
# Test build instructions
if (tests)
set(CMAKE_RUNTIME_OUTPUT_DIRECTORY "${CMAKE_CURRENT_SOURCE_DIR}/bin/tests")
file(MAKE_DIRECTORY "${CMAKE_CURRENT_SOURCE_DIR}/tests/data")
- add_compile_options(-Iinclude)
add_executable(pagedfile_tests ${CMAKE_CURRENT_SOURCE_DIR}/tests/pagedfile_tests.cpp)
target_link_libraries(pagedfile_tests PUBLIC gsl check subunit pthread)
@@ -56,6 +56,10 @@ if (tests)
add_executable(wss_tests ${CMAKE_CURRENT_SOURCE_DIR}/tests/wss_tests.cpp)
target_link_libraries(wss_tests PUBLIC gsl check subunit pthread)
target_include_directories(wss_tests PRIVATE include)
+
+ add_executable(triespline_tests ${CMAKE_CURRENT_SOURCE_DIR}/tests/triespline_tests.cpp)
+ target_link_libraries(triespline_tests PUBLIC gsl check subunit pthread)
+ target_include_directories(triespline_tests PRIVATE include external/PLEX/include)
endif()
# Benchmark build instructions
diff --git a/include/shard/TrieSpline.h b/include/shard/TrieSpline.h
index 5cd01e3..13753a1 100644
--- a/include/shard/TrieSpline.h
+++ b/include/shard/TrieSpline.h
@@ -15,7 +15,7 @@
#include <memory>
#include <concepts>
-#include "PLEX/include/ts/builder.h"
+#include "ts/builder.h"
#include "ds/PriorityQueue.h"
#include "util/Cursor.h"
#include "ds/BloomFilter.h"
@@ -88,7 +88,7 @@ public:
std::sort(base, stop, std::less<Wrapped<R>>());
K min_key = base->rec.key;
- K max_key = stop->rec.key;
+ K max_key = (stop - 1)->rec.key;
auto bldr = ts::Builder<K>(min_key, max_key, g_max_error);
@@ -104,16 +104,16 @@ public:
}
if (m_reccnt == 0) {
- m_max_key = m_min_key = base->key;
- } else if (base->key > m_max_key) {
- m_max_key = base->key;
- } else if (base->key < m_min_key) {
- m_min_key = base->key;
+ m_max_key = m_min_key = base->rec.key;
+ } else if (base->rec.key > m_max_key) {
+ m_max_key = base->rec.key;
+ } else if (base->rec.key < m_min_key) {
+ m_min_key = base->rec.key;
}
base->header &= 1;
m_data[m_reccnt++] = *base;
- bldr.AddKey(base->key);
+ bldr.AddKey(base->rec.key);
if (m_bf && base->is_tombstone()) {
m_tombstone_cnt++;
@@ -258,19 +258,24 @@ private:
return m_reccnt;
}
+ // if the found location _is_ the key, we're done.
+ if (m_data[idx].rec.key == key) {
+ return idx;
+ }
+
// if the found location is larger than the key, we need to
// move backwards towards the beginning of the array
- if (m_data[idx].key > key) {
+ if (m_data[idx].rec.key > key) {
for (ssize_t i=idx; i>=0; i--) {
- if (m_data[i].key < key) {
+ if (m_data[i].rec.key < key) {
return i+1;
}
}
// otherwise, we move forward towards the end
} else {
for (size_t i=idx; i<m_reccnt; i++) {
- if (m_data[i].key >= key) {
- return i-1;
+ if (m_data[i].rec.key >= key) {
+ return i - 1;
}
}
}
diff --git a/tests/triespline_tests.cpp b/tests/triespline_tests.cpp
new file mode 100644
index 0000000..982be79
--- /dev/null
+++ b/tests/triespline_tests.cpp
@@ -0,0 +1,217 @@
+/*
+ * tests/irs_tests.cpp
+ *
+ * Unit tests for TrieSpline (Augmented B+Tree) shard
+ *
+ * Copyright (C) 2023 Douglas Rumbaugh <drumbaugh@psu.edu>
+ * Dong Xie <dongx@psu.edu>
+ *
+ * All rights reserved. Published under the Modified BSD License.
+ *
+ */
+
+#include "shard/TrieSpline.h"
+#include "testing.h"
+
+#include <check.h>
+
+using namespace de;
+
+typedef TrieSpline<Rec> Shard;
+
+START_TEST(t_mbuffer_init)
+{
+ auto buffer = new MutableBuffer<Rec>(1024, true, 1024);
+ for (uint64_t i = 512; i > 0; i--) {
+ uint32_t v = i;
+ buffer->append({i,v, 1});
+ }
+
+ for (uint64_t i = 1; i <= 256; ++i) {
+ uint32_t v = i;
+ buffer->append({i, v, 1}, true);
+ }
+
+ for (uint64_t i = 257; i <= 512; ++i) {
+ uint32_t v = i + 1;
+ buffer->append({i, v, 1});
+ }
+
+ Shard* shard = new Shard(buffer);
+ ck_assert_uint_eq(shard->get_record_count(), 512);
+
+ delete buffer;
+ delete shard;
+}
+
+
+START_TEST(t_irs_init)
+{
+ size_t n = 512;
+ auto mbuffer1 = create_test_mbuffer<Rec>(n);
+ auto mbuffer2 = create_test_mbuffer<Rec>(n);
+ auto mbuffer3 = create_test_mbuffer<Rec>(n);
+
+ auto shard1 = new Shard(mbuffer1);
+ auto shard2 = new Shard(mbuffer2);
+ auto shard3 = new Shard(mbuffer3);
+
+ Shard* shards[3] = {shard1, shard2, shard3};
+ auto shard4 = new Shard(shards, 3);
+
+ ck_assert_int_eq(shard4->get_record_count(), n * 3);
+ ck_assert_int_eq(shard4->get_tombstone_count(), 0);
+
+ size_t total_cnt = 0;
+ size_t shard1_idx = 0;
+ size_t shard2_idx = 0;
+ size_t shard3_idx = 0;
+
+ for (size_t i = 0; i < shard4->get_record_count(); ++i) {
+ auto rec1 = shard1->get_record_at(shard1_idx);
+ auto rec2 = shard2->get_record_at(shard2_idx);
+ auto rec3 = shard3->get_record_at(shard3_idx);
+
+ auto cur_rec = shard4->get_record_at(i);
+
+ if (shard1_idx < n && cur_rec->rec == rec1->rec) {
+ ++shard1_idx;
+ } else if (shard2_idx < n && cur_rec->rec == rec2->rec) {
+ ++shard2_idx;
+ } else if (shard3_idx < n && cur_rec->rec == rec3->rec) {
+ ++shard3_idx;
+ } else {
+ assert(false);
+ }
+ }
+
+ delete mbuffer1;
+ delete mbuffer2;
+ delete mbuffer3;
+
+ delete shard1;
+ delete shard2;
+ delete shard3;
+ delete shard4;
+}
+
+START_TEST(t_point_lookup)
+{
+ size_t n = 10000;
+
+ auto buffer = create_double_seq_mbuffer<Rec>(n, false);
+ auto shard = Shard(buffer);
+
+ for (size_t i=0; i<n; i++) {
+ Rec r;
+ auto rec = (buffer->get_data() + i);
+ r.key = rec->rec.key;
+ r.value = rec->rec.value;
+
+ auto result = shard.point_lookup(r);
+ ck_assert_ptr_nonnull(result);
+ ck_assert_int_eq(result->rec.key, r.key);
+ ck_assert_int_eq(result->rec.value, r.value);
+ }
+
+ delete buffer;
+}
+END_TEST
+
+
+START_TEST(t_point_lookup_miss)
+{
+ size_t n = 10000;
+
+ auto buffer = create_double_seq_mbuffer<Rec>(n, false);
+ auto isam = Shard(buffer);
+
+ for (size_t i=n + 100; i<2*n; i++) {
+ Rec r;
+ r.key = i;
+ r.value = i;
+
+ auto result = isam.point_lookup(r);
+ ck_assert_ptr_null(result);
+ }
+
+ delete buffer;
+}
+
+
+START_TEST(t_full_cancelation)
+{
+ size_t n = 100;
+ auto buffer = create_double_seq_mbuffer<Rec>(n, false);
+ auto buffer_ts = create_double_seq_mbuffer<Rec>(n, true);
+
+ Shard* shard = new Shard(buffer);
+ Shard* shard_ts = new Shard(buffer_ts);
+
+ ck_assert_int_eq(shard->get_record_count(), n);
+ ck_assert_int_eq(shard->get_tombstone_count(), 0);
+ ck_assert_int_eq(shard_ts->get_record_count(), n);
+ ck_assert_int_eq(shard_ts->get_tombstone_count(), n);
+
+ Shard* shards[] = {shard, shard_ts};
+
+ Shard* merged = new Shard(shards, 2);
+
+ ck_assert_int_eq(merged->get_tombstone_count(), 0);
+ ck_assert_int_eq(merged->get_record_count(), 0);
+
+ delete buffer;
+ delete buffer_ts;
+ delete shard;
+ delete shard_ts;
+ delete merged;
+}
+END_TEST
+
+
+Suite *unit_testing()
+{
+ Suite *unit = suite_create("TrieSpline Shard Unit Testing");
+
+ TCase *create = tcase_create("de::TrieSpline constructor Testing");
+ tcase_add_test(create, t_mbuffer_init);
+ tcase_add_test(create, t_irs_init);
+ tcase_set_timeout(create, 100);
+ suite_add_tcase(unit, create);
+
+
+ TCase *tombstone = tcase_create("de:TrieSpline::tombstone cancellation Testing");
+ tcase_add_test(tombstone, t_full_cancelation);
+ suite_add_tcase(unit, tombstone);
+
+
+ TCase *lookup = tcase_create("de:TrieSpline:point_lookup Testing");
+ tcase_add_test(lookup, t_point_lookup);
+ tcase_add_test(lookup, t_point_lookup_miss);
+ suite_add_tcase(unit, lookup);
+
+
+ return unit;
+}
+
+
+int shard_unit_tests()
+{
+ int failed = 0;
+ Suite *unit = unit_testing();
+ SRunner *unit_shardner = srunner_create(unit);
+
+ srunner_run_all(unit_shardner, CK_NORMAL);
+ failed = srunner_ntests_failed(unit_shardner);
+ srunner_free(unit_shardner);
+
+ return failed;
+}
+
+
+int main()
+{
+ int unit_failed = shard_unit_tests();
+
+ return (unit_failed == 0) ? EXIT_SUCCESS : EXIT_FAILURE;
+}