| | | |
|---|---|---|
| author | Douglas B. Rumbaugh <dbr4@psu.edu> | 2024-12-06 13:13:51 -0500 |
| committer | GitHub <noreply@github.com> | 2024-12-06 18:13:51 +0000 |
| commit | 9fe305c7d28e993e55c55427f377ae7e3251ea4f (patch) | |
| tree | 384b687f64b84eb81bde2becac8a5f24916b07b4 /include/framework/structure/InternalLevel.h | |
| parent | 47916da2ba5ed5bee2dda3cbcc58d39e1e931bfc (diff) | |
| download | dynamic-extension-9fe305c7d28e993e55c55427f377ae7e3251ea4f.tar.gz | |
Interface update (#5)
* Query Interface Adjustments/Refactoring
Began the process of adjusting the query interface (and also the shard
interface, to a lesser degree) to better accommodate the user. In
particular, the following changes have been made (a code sketch of the
resulting interfaces follows the commit message):
1. The number of template arguments required by the query type
has been drastically reduced, and the void pointers and manual
delete functions have been removed from the interface.
This was accomplished by requiring many of the sub-types associated
with a query (parameters, etc.) to be nested inside the main query
class, and by forcing the SHARD type to expose its associated
record type.
2. User-defined query return types are now supported.
Queries are no longer restricted to returning sets of records.
Instead, the query now has LocalResultType and ResultType
template parameters (which can be defaulted using a typedef in
the Query type itself), allowing much more flexibility.
Note that, at least for the short term, the LocalResultType must
still expose the same is_deleted/is_tombstone interface as a
Wrapped<R> used to, as this is currently needed for delete
filtering. A better approach to this is, hopefully, forthcoming.
3. Updated the ISAMTree.h shard and rangequery.h query to use the
new interfaces, and adjusted the associated unit tests as well.
4. Dropped the unnecessary "get_data()" function from the ShardInterface
concept.
5. Dropped the need to specify a record type in the ShardInterface
concept. This is now handled using a required Shard::RECORD
member of the Shard class itself, which should expose the name
of the record type.
* Updates to framework to support new Query/Shard interfaces
Pretty extensive adjustments to the framework, particularly to the
templates themselves, along with some type-renaming work, to support
the new query and shard interfaces.
Adjusted the external query interface to take an rvalue reference, rather
than a pointer, to the query parameters (see the call-site sketch after the
commit message).
* Removed framework-level delete filtering
This was causing some issues with the new query interface, and should
probably be reworked anyway, so I'm temporarily (TM) removing the
feature.
* Updated benchmarks + remaining code for new interface
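
To make the shape of the new interfaces concrete, here is a minimal illustrative sketch assembled from the names that appear in this patch (nested `Parameters`/`LocalQuery` types, `local_preproc`, the `LocalResultType`/`ResultType` typedefs, and the `Shard::RECORD` member). The record layout, the `MyShard`/`MyRangeQuery` names, and the exact set of members required by the concepts are assumptions for illustration, not the framework's definitive API.

```cpp
#include <cstdint>
#include <vector>

// Hypothetical record type; the framework only requires that the shard
// expose whatever record type it stores via a RECORD typedef.
struct MyRecord {
  uint64_t key;
  uint64_t value;
};

// Sketch of a shard under the revised ShardInterface: per change (5) above,
// the record type is exposed by the shard itself rather than being a
// separate template argument.
class MyShard {
public:
  typedef MyRecord RECORD;
  // ... construction from a buffer view or from other shards, point_lookup,
  //     get_record_count(), etc., as the ShardInterface concept requires ...
};

// Sketch of a query under the revised QueryInterface: per change (1) above,
// the per-query sub-types are nested in the query class instead of being
// passed around as void pointers.
class MyRangeQuery {
public:
  struct Parameters {
    uint64_t lower_bound;
    uint64_t upper_bound;
  };

  struct LocalQuery {
    Parameters global_parms; // per-shard state derived from the parameters
  };

  // Change (2) above: user-defined result types. The local result type must
  // still expose is_deleted()/is_tombstone() for delete filtering.
  struct LocalResultType {
    MyRecord rec;
    bool deleted = false;
    bool tombstone = false;
    bool is_deleted() const { return deleted; }
    bool is_tombstone() const { return tombstone; }
  };
  typedef std::vector<MyRecord> ResultType;

  // Per-shard preprocessing hook used by InternalLevel::get_local_queries().
  static LocalQuery *local_preproc(MyShard *shard, Parameters *parms) {
    (void)shard; // a real query would derive per-shard state here
    return new LocalQuery{*parms};
  }
  // ... local query execution and result combination as required ...
};
```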
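And a hedged sketch of the caller-side change to the external query interface: the `query` method name and the extension object are assumptions here; the only part taken from the commit is that the parameters are now passed as an rvalue reference rather than by pointer.

```cpp
// Hypothetical caller; `extension.query(...)` is an assumed spelling.
template <typename DE>
auto run_range_query(DE &extension, uint64_t lower, uint64_t upper) {
  // Old style (roughly): build a Parameters object and pass its address.
  //   MyRangeQuery::Parameters parms{lower, upper};
  //   auto result = extension.query(&parms);

  // New style: the parameters are handed over as an rvalue reference.
  return extension.query(MyRangeQuery::Parameters{lower, upper});
}
```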
Diffstat (limited to 'include/framework/structure/InternalLevel.h')
| mode | path | lines changed |
|---|---|---|
| -rw-r--r-- | include/framework/structure/InternalLevel.h | 439 |

1 file changed, 222 insertions, 217 deletions
```diff
diff --git a/include/framework/structure/InternalLevel.h b/include/framework/structure/InternalLevel.h
index b962dcc..a4cf94d 100644
--- a/include/framework/structure/InternalLevel.h
+++ b/include/framework/structure/InternalLevel.h
@@ -1,8 +1,8 @@
 /*
  * include/framework/structure/InternalLevel.h
  *
- * Copyright (C) 2023 Douglas B. Rumbaugh <drumbaugh@psu.edu>
- *                    Dong Xie <dongx@psu.edu>
+ * Copyright (C) 2023-2024 Douglas B. Rumbaugh <drumbaugh@psu.edu>
+ *                         Dong Xie <dongx@psu.edu>
  *
  * Distributed under the Modified BSD License.
  *
@@ -15,276 +15,281 @@
  */
 #pragma once
 
-#include <vector>
 #include <memory>
+#include <vector>
 
-#include "util/types.h"
-#include "framework/interface/Shard.h"
 #include "framework/interface/Query.h"
 #include "framework/interface/Record.h"
+#include "framework/interface/Shard.h"
 #include "framework/structure/BufferView.h"
+#include "util/types.h"
 
 namespace de {
-template <RecordInterface R, ShardInterface<R> S, QueryInterface<R, S> Q>
+template <ShardInterface ShardType, QueryInterface<ShardType> QueryType>
 class InternalLevel;
-
-
-template <RecordInterface R, ShardInterface<R> S, QueryInterface<R, S> Q>
+template <ShardInterface ShardType, QueryInterface<ShardType> QueryType>
 class InternalLevel {
-    typedef S Shard;
-    typedef BufferView<R> BuffView;
-public:
-    InternalLevel(ssize_t level_no, size_t shard_cap)
-    : m_level_no(level_no)
-    , m_shard_cnt(0)
-    , m_shards(shard_cap, nullptr)
-    , m_pending_shard(nullptr)
-    {}
-
-    ~InternalLevel() {
-        delete m_pending_shard;
-    }
+  typedef typename ShardType::RECORD RecordType;
+  typedef BufferView<RecordType> BuffView;
+
+public:
+  InternalLevel(ssize_t level_no, size_t shard_cap)
+      : m_level_no(level_no), m_shard_cnt(0), m_shards(shard_cap, nullptr),
+        m_pending_shard(nullptr) {}
+
+  ~InternalLevel() { delete m_pending_shard; }
 
-    /*
-     * Create a new shard combining the records from base_level and new_level,
-     * and return a shared_ptr to a new level containing this shard. This is used
-     * for reconstructions under the leveling layout policy.
-     *
-     * No changes are made to the levels provided as arguments.
-     */
-    static std::shared_ptr<InternalLevel> reconstruction(InternalLevel* base_level, InternalLevel* new_level) {
-        assert(base_level->m_level_no > new_level->m_level_no || (base_level->m_level_no == 0 && new_level->m_level_no == 0));
-        auto res = new InternalLevel(base_level->m_level_no, 1);
-        res->m_shard_cnt = 1;
-        std::vector<Shard *> shards = {base_level->m_shards[0].get(),
-                                       new_level->m_shards[0].get()};
-        res->m_shards[0] = std::make_shared<S>(shards);
-        return std::shared_ptr<InternalLevel>(res);
-    }
+  /*
+   * Create a new shard combining the records from base_level and new_level,
+   * and return a shared_ptr to a new level containing this shard. This is used
+   * for reconstructions under the leveling layout policy.
+   *
+   * No changes are made to the levels provided as arguments.
+   */
+  static std::shared_ptr<InternalLevel>
+  reconstruction(InternalLevel *base_level, InternalLevel *new_level) {
+    assert(base_level->m_level_no > new_level->m_level_no ||
+           (base_level->m_level_no == 0 && new_level->m_level_no == 0));
+    auto res = new InternalLevel(base_level->m_level_no, 1);
+    res->m_shard_cnt = 1;
+    std::vector<ShardType *> shards = {base_level->m_shards[0].get(),
+                                       new_level->m_shards[0].get()};
+    res->m_shards[0] = std::make_shared<ShardType>(shards);
+    return std::shared_ptr<InternalLevel>(res);
+  }
 
-    static std::shared_ptr<InternalLevel> reconstruction(std::vector<InternalLevel*> levels, size_t level_idx) {
-        std::vector<Shard *> shards;
-        for (auto level : levels) {
-            for (auto shard : level->m_shards) {
-                if (shard) shards.emplace_back(shard.get());
-            }
-        }
-
-        auto res = new InternalLevel(level_idx, 1);
-        res->m_shard_cnt = 1;
-        res->m_shards[0] = std::make_shared<S>(shards);
-
-        return std::shared_ptr<InternalLevel>(res);
-    }
+  static std::shared_ptr<InternalLevel>
+  reconstruction(std::vector<InternalLevel *> levels, size_t level_idx) {
+    std::vector<ShardType *> shards;
+    for (auto level : levels) {
+      for (auto shard : level->m_shards) {
+        if (shard)
+          shards.emplace_back(shard.get());
+      }
+    }
+
+    auto res = new InternalLevel(level_idx, 1);
+    res->m_shard_cnt = 1;
+    res->m_shards[0] = std::make_shared<ShardType>(shards);
+
+    return std::shared_ptr<InternalLevel>(res);
+  }
 
-    /*
-     * Create a new shard combining the records from all of
-     * the shards in level, and append this new shard into
-     * this level. This is used for reconstructions under
-     * the tiering layout policy.
-     *
-     * No changes are made to the level provided as an argument.
-     */
-    void append_level(InternalLevel* level) {
-        // FIXME: that this is happening probably means that
-        // something is going terribly wrong earlier in the
-        // reconstruction logic.
-        if (level->get_shard_count() == 0) {
-            return;
-        }
-
-        std::vector<S*> shards;
-        for (auto shard : level->m_shards) {
-            if (shard) shards.emplace_back(shard.get());
-        }
-
-        if (m_shard_cnt == m_shards.size()) {
-            m_pending_shard = new S(shards);
-            return;
-        }
-
-        auto tmp = new S(shards);
-        m_shards[m_shard_cnt] = std::shared_ptr<S>(tmp);
-
-        ++m_shard_cnt;
-    }
+  /*
+   * Create a new shard combining the records from all of
+   * the shards in level, and append this new shard into
+   * this level. This is used for reconstructions under
+   * the tiering layout policy.
+   *
+   * No changes are made to the level provided as an argument.
+   */
+  void append_level(InternalLevel *level) {
+    // FIXME: that this is happening probably means that
+    // something is going terribly wrong earlier in the
+    // reconstruction logic.
+    if (level->get_shard_count() == 0) {
+      return;
+    }
+
+    std::vector<ShardType *> shards;
+    for (auto shard : level->m_shards) {
+      if (shard)
+        shards.emplace_back(shard.get());
+    }
+
+    if (m_shard_cnt == m_shards.size()) {
+      m_pending_shard = new ShardType(shards);
+      return;
+    }
+
+    auto tmp = new ShardType(shards);
+    m_shards[m_shard_cnt] = std::shared_ptr<ShardType>(tmp);
+
+    ++m_shard_cnt;
+  }
 
-    /*
-     * Create a new shard using the records in the
-     * provided buffer, and append this new shard
-     * into this level. This is used for buffer
-     * flushes under the tiering layout policy.
-     */
-    void append_buffer(BuffView buffer) {
-        if (m_shard_cnt == m_shards.size()) {
-            assert(m_pending_shard == nullptr);
-            m_pending_shard = new S(std::move(buffer));
-            return;
-        }
-
-        m_shards[m_shard_cnt] = std::make_shared<S>(std::move(buffer));
-        ++m_shard_cnt;
-    }
+  /*
+   * Create a new shard using the records in the
+   * provided buffer, and append this new shard
+   * into this level. This is used for buffer
+   * flushes under the tiering layout policy.
+   */
+  void append_buffer(BuffView buffer) {
+    if (m_shard_cnt == m_shards.size()) {
+      assert(m_pending_shard == nullptr);
+      m_pending_shard = new ShardType(std::move(buffer));
+      return;
+    }
+
+    m_shards[m_shard_cnt] = std::make_shared<ShardType>(std::move(buffer));
+    ++m_shard_cnt;
+  }
 
-    void finalize() {
-        if (m_pending_shard) {
-            for (size_t i=0; i<m_shards.size(); i++) {
-                m_shards[i] = nullptr;
-            }
-
-            m_shards[0] = std::shared_ptr<S>(m_pending_shard);
-            m_pending_shard = nullptr;
-            m_shard_cnt = 1;
-        }
-    }
+  void finalize() {
+    if (m_pending_shard) {
+      for (size_t i = 0; i < m_shards.size(); i++) {
+        m_shards[i] = nullptr;
+      }
+
+      m_shards[0] = std::shared_ptr<ShardType>(m_pending_shard);
+      m_pending_shard = nullptr;
+      m_shard_cnt = 1;
+    }
+  }
 
-    /*
-     * Create a new shard containing the combined records
-     * from all shards on this level and return it.
-     *
-     * No changes are made to this level.
-     */
-    Shard *get_combined_shard() {
-        if (m_shard_cnt == 0) {
-            return nullptr;
-        }
-
-        std::vector<Shard *> shards;
-        for (auto shard : m_shards) {
-            if (shard) shards.emplace_back(shard.get());
-        }
-
-        return new S(shards);
-    }
+  /*
+   * Create a new shard containing the combined records
+   * from all shards on this level and return it.
+   *
+   * No changes are made to this level.
+   */
+  ShardType *get_combined_shard() {
+    if (m_shard_cnt == 0) {
+      return nullptr;
+    }
+
+    std::vector<ShardType *> shards;
+    for (auto shard : m_shards) {
+      if (shard)
+        shards.emplace_back(shard.get());
+    }
+
+    return new ShardType(shards);
+  }
 
-    void get_query_states(std::vector<std::pair<ShardID, Shard *>> &shards, std::vector<void*>& shard_states, void *query_parms) {
-        for (size_t i=0; i<m_shard_cnt; i++) {
-            if (m_shards[i]) {
-                auto shard_state = Q::get_query_state(m_shards[i].get(), query_parms);
-                shards.push_back({{m_level_no, (ssize_t) i}, m_shards[i].get()});
-                shard_states.emplace_back(shard_state);
-            }
-        }
-    }
+  void get_local_queries(
+      std::vector<std::pair<ShardID, ShardType *>> &shards,
+      std::vector<typename QueryType::LocalQuery *> &local_queries,
+      typename QueryType::Parameters *query_parms) {
+    for (size_t i = 0; i < m_shard_cnt; i++) {
+      if (m_shards[i]) {
+        auto local_query =
+            QueryType::local_preproc(m_shards[i].get(), query_parms);
+        shards.push_back({{m_level_no, (ssize_t)i}, m_shards[i].get()});
+        local_queries.emplace_back(local_query);
+      }
+    }
+  }
 
-    bool check_tombstone(size_t shard_stop, const R& rec) {
-        if (m_shard_cnt == 0) return false;
-
-        for (int i = m_shard_cnt - 1; i >= (ssize_t) shard_stop; i--) {
-            if (m_shards[i]) {
-                auto res = m_shards[i]->point_lookup(rec, true);
-                if (res && res->is_tombstone()) {
-                    return true;
-                }
-            }
-        }
-        return false;
-    }
+  bool check_tombstone(size_t shard_stop, const RecordType &rec) {
+    if (m_shard_cnt == 0)
+      return false;
+
+    for (int i = m_shard_cnt - 1; i >= (ssize_t)shard_stop; i--) {
+      if (m_shards[i]) {
+        auto res = m_shards[i]->point_lookup(rec, true);
+        if (res && res->is_tombstone()) {
+          return true;
+        }
+      }
+    }
+    return false;
+  }
 
-    bool delete_record(const R &rec) {
-        if (m_shard_cnt == 0) return false;
-
-        for (size_t i = 0; i < m_shards.size(); ++i) {
-            if (m_shards[i]) {
-                auto res = m_shards[i]->point_lookup(rec);
-                if (res) {
-                    res->set_delete();
-                    return true;
-                }
-            }
-        }
-
-        return false;
-    }
+  bool delete_record(const RecordType &rec) {
+    if (m_shard_cnt == 0)
+      return false;
+
+    for (size_t i = 0; i < m_shards.size(); ++i) {
+      if (m_shards[i]) {
+        auto res = m_shards[i]->point_lookup(rec);
+        if (res) {
+          res->set_delete();
+          return true;
+        }
+      }
+    }
+
+    return false;
+  }
 
-    Shard* get_shard(size_t idx) {
-        if (idx >= m_shard_cnt) {
-            return nullptr;
-        }
-
-        return m_shards[idx].get();
-    }
+  ShardType *get_shard(size_t idx) {
+    if (idx >= m_shard_cnt) {
+      return nullptr;
+    }
+
+    return m_shards[idx].get();
+  }
 
-    size_t get_shard_count() {
-        return m_shard_cnt;
-    }
+  size_t get_shard_count() { return m_shard_cnt; }
 
-    size_t get_record_count() {
-        size_t cnt = 0;
-        for (size_t i=0; i<m_shard_cnt; i++) {
-            if (m_shards[i]) {
-                cnt += m_shards[i]->get_record_count();
-            }
-        }
-
-        return cnt;
-    }
+  size_t get_record_count() {
+    size_t cnt = 0;
+    for (size_t i = 0; i < m_shard_cnt; i++) {
+      if (m_shards[i]) {
+        cnt += m_shards[i]->get_record_count();
+      }
+    }
+
+    return cnt;
+  }
 
-    size_t get_tombstone_count() {
-        size_t res = 0;
-        for (size_t i = 0; i < m_shard_cnt; ++i) {
-            if (m_shards[i]) {
-                res += m_shards[i]->get_tombstone_count();
-            }
-        }
-        return res;
-    }
+  size_t get_tombstone_count() {
+    size_t res = 0;
+    for (size_t i = 0; i < m_shard_cnt; ++i) {
+      if (m_shards[i]) {
+        res += m_shards[i]->get_tombstone_count();
+      }
    }
+    return res;
+  }
 
-    size_t get_aux_memory_usage() {
-        size_t cnt = 0;
-        for (size_t i=0; i<m_shard_cnt; i++) {
-            if (m_shards[i]){
-                cnt += m_shards[i]->get_aux_memory_usage();
-            }
-        }
-
-        return cnt;
-    }
+  size_t get_aux_memory_usage() {
+    size_t cnt = 0;
+    for (size_t i = 0; i < m_shard_cnt; i++) {
+      if (m_shards[i]) {
+        cnt += m_shards[i]->get_aux_memory_usage();
+      }
+    }
+
+    return cnt;
+  }
 
-    size_t get_memory_usage() {
-        size_t cnt = 0;
-        for (size_t i=0; i<m_shard_cnt; i++) {
-            if (m_shards[i]) {
-                cnt += m_shards[i]->get_memory_usage();
-            }
-        }
-
-        return cnt;
-    }
+  size_t get_memory_usage() {
+    size_t cnt = 0;
+    for (size_t i = 0; i < m_shard_cnt; i++) {
+      if (m_shards[i]) {
+        cnt += m_shards[i]->get_memory_usage();
+      }
    }
+
+    return cnt;
+  }
 
-    double get_tombstone_prop() {
-        size_t tscnt = 0;
-        size_t reccnt = 0;
-        for (size_t i=0; i<m_shard_cnt; i++) {
-            if (m_shards[i]) {
-                tscnt += m_shards[i]->get_tombstone_count();
-                reccnt += m_shards[i]->get_record_count();
-            }
-        }
-
-        return (double) tscnt / (double) (tscnt + reccnt);
-    }
+  double get_tombstone_prop() {
+    size_t tscnt = 0;
+    size_t reccnt = 0;
+    for (size_t i = 0; i < m_shard_cnt; i++) {
+      if (m_shards[i]) {
+        tscnt += m_shards[i]->get_tombstone_count();
+        reccnt += m_shards[i]->get_record_count();
+      }
+    }
+
+    return (double)tscnt / (double)(tscnt + reccnt);
+  }
 
-    std::shared_ptr<InternalLevel> clone() {
-        auto new_level = std::make_shared<InternalLevel>(m_level_no, m_shards.size());
-        for (size_t i=0; i<m_shard_cnt; i++) {
-            new_level->m_shards[i] = m_shards[i];
-        }
-        new_level->m_shard_cnt = m_shard_cnt;
-
-        return new_level;
-    }
+  std::shared_ptr<InternalLevel> clone() {
+    auto new_level =
+        std::make_shared<InternalLevel>(m_level_no, m_shards.size());
+    for (size_t i = 0; i < m_shard_cnt; i++) {
+      new_level->m_shards[i] = m_shards[i];
+    }
+    new_level->m_shard_cnt = m_shard_cnt;
+
+    return new_level;
+  }
 
 private:
-    ssize_t m_level_no;
-
-    size_t m_shard_cnt;
-    size_t m_shard_size_cap;
+  ssize_t m_level_no;
+
+  size_t m_shard_cnt;
+  size_t m_shard_size_cap;
 
-    std::vector<std::shared_ptr<Shard>> m_shards;
-    Shard *m_pending_shard;
+  std::vector<std::shared_ptr<ShardType>> m_shards;
+  ShardType *m_pending_shard;
 };
-}
+} // namespace de
```
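
For context on the diff above, a rough sketch of how a caller inside the framework might now drive the typed `get_local_queries()` path that replaces the old `get_query_states()`/void* version. The `levels` container and the generic `ShardType`/`QueryType` parameters are illustrative assumptions; only the member-function signature comes from the patch.

```cpp
#include <utility>
#include <vector>

// Hypothetical driver, generic over the shard and query types. de::ShardID is
// assumed to be the shard-identifier type from util/types.h.
template <typename ShardType, typename QueryType, typename LevelContainer>
void collect_local_queries(LevelContainer &levels,
                           typename QueryType::Parameters parms) {
  std::vector<std::pair<de::ShardID, ShardType *>> shards;
  std::vector<typename QueryType::LocalQuery *> local_queries;

  // Each level appends one (shard id, shard) pair and one preprocessed local
  // query per live shard; internally this calls QueryType::local_preproc().
  for (auto &level : levels) {
    level->get_local_queries(shards, local_queries, &parms);
  }

  // ... the local queries would then be executed against their shards and the
  //     per-shard results merged into QueryType::ResultType ...
}
```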