From d6e08e9d8d3ac9b356ac50cee22b41f828160247 Mon Sep 17 00:00:00 2001 From: Douglas Rumbaugh Date: Thu, 27 Jul 2023 18:21:26 -0400 Subject: Expanded query interface Query interface now enables skipping of delete processing and stopping query processing when first match is found. --- include/shard/PGM.h | 128 ++++++++++++++++++++++++++++++++++++++++++++++------ 1 file changed, 115 insertions(+), 13 deletions(-) (limited to 'include/shard/PGM.h') diff --git a/include/shard/PGM.h b/include/shard/PGM.h index 65d548e..aba5227 100644 --- a/include/shard/PGM.h +++ b/include/shard/PGM.h @@ -33,9 +33,17 @@ struct pgm_range_query_parms { decltype(R::key) upper_bound; }; +template +struct PGMPointLookupParms { + decltype(R::key) target_key; +}; + template class PGMRangeQuery; +template +class PGMPointLookup; + template struct PGMState { size_t start_idx; @@ -45,12 +53,6 @@ struct PGMState { template struct PGMBufferState { size_t cutoff; - Alias* alias; - - ~PGMBufferState() { - delete alias; - } - }; template @@ -64,6 +66,7 @@ public: // FIXME: there has to be a better way to do this friend class PGMRangeQuery; + friend class PGMPointLookup; PGM(MutableBuffer* buffer) : m_reccnt(0), m_tombstone_cnt(0) { @@ -274,11 +277,80 @@ private: pgm::PGMIndex m_pgm; BloomFilter *m_bf; }; +template +class PGMPointLookup { +public: + constexpr static bool EARLY_ABORT=false; + constexpr static bool SKIP_DELETE_FILTER=false; + + static void *get_query_state(PGM *ts, void *parms) { + return nullptr; + } + + static void* get_buffer_query_state(MutableBuffer *buffer, void *parms) { + return nullptr; + } + + static void process_query_states(void *query_parms, std::vector &shard_states, void *buff_state) { + return; + } + + static std::vector> query(PGM *ts, void *q_state, void *parms) { + std::vector> records; + auto p = (PGMPointLookupParms *) parms; + auto s = (PGMState *) q_state; + + size_t idx = ts->get_lower_bound(p->target_key); + if (ts->get_record_at(idx)->rec.key == p->target_key) { + records.emplace_back(*ts->get_record_at(idx)); + } + + return records; + } + + static std::vector> buffer_query(MutableBuffer *buffer, void *state, void *parms) { + auto p = (PGMPointLookupParms *) parms; + auto s = (PGMBufferState *) state; + + std::vector> records; + for (size_t i=0; iget_record_count(); i++) { + auto rec = buffer->get_data() + i; + if (rec->rec.key == p->target_key) { + records.emplace_back(*rec); + return records; + } + } + + return records; + } + + static std::vector merge(std::vector>> &results, void *parms) { + std::vector output; + for (size_t i=0 ;i 0) { + output.emplace_back(results[i][0].rec); + return output; + } + } + + return output; + } + + static void delete_query_state(void *state) { + } + + static void delete_buffer_query_state(void *state) { + } +}; + template class PGMRangeQuery { public: + constexpr static bool EARLY_ABORT=false; + constexpr static bool SKIP_DELETE_FILTER=false; + static void *get_query_state(PGM *ts, void *parms) { auto res = new PGMState(); auto p = (pgm_range_query_parms *) parms; @@ -296,7 +368,7 @@ public: return res; } - static void process_query_states(void *query_parms, std::vector shard_states, void *buff_state) { + static void process_query_states(void *query_parms, std::vector &shard_states, void *buff_state) { return; } @@ -343,11 +415,25 @@ public: return records; } - static std::vector merge(std::vector> &results, void *parms) { + static std::vector merge(std::vector>> &results, void *parms) { + std::vector>> cursors; + cursors.reserve(results.size()); + + PriorityQueue> pq(results.size()); size_t total = 0; - for (size_t i=0; i 0){ + auto base = results[i].data(); + cursors.emplace_back(Cursor{base, base + results[i].size(), 0, results[i].size()}); + assert(i == cursors.size() - 1); + total += results[i].size(); + pq.push(cursors[i].ptr, tmp_n - i - 1); + } else { + cursors.emplace_back(Cursor>{nullptr, nullptr, 0, 0}); + } if (total == 0) { return std::vector(); @@ -356,8 +442,24 @@ public: std::vector output; output.reserve(total); - for (size_t i=0; i 1 ? pq.peek(1) : queue_record>{nullptr, 0}; + if (!now.data->is_tombstone() && next.data != nullptr && + now.data->rec == next.data->rec && next.data->is_tombstone()) { + + pq.pop(); pq.pop(); + auto& cursor1 = cursors[tmp_n - now.version - 1]; + auto& cursor2 = cursors[tmp_n - next.version - 1]; + if (advance_cursor>(cursor1)) pq.push(cursor1.ptr, now.version); + if (advance_cursor>(cursor2)) pq.push(cursor2.ptr, next.version); + } else { + auto& cursor = cursors[tmp_n - now.version - 1]; + if (!now.data->is_tombstone()) output.push_back(cursor.ptr->rec); + pq.pop(); + + if (advance_cursor>(cursor)) pq.push(cursor.ptr, now.version); + } } return output; -- cgit v1.2.3