fix: sender-side bloom filtering, Phase 1 shuffle error reporting, tests and docs

poyrazK · poyrazK · commit b0da5b66bce1 · 2026-04-11T18:41:41.000+03:00
- Fix Phase 1 error to include node.id and reply.error_msg
- Move bloom filtering to sender side in ShuffleFragment handler
- Remove receiver-side bloom check in PushData handler
- Fix tests to only assert no-false-negative property
- Remove duplicate section in SQLITE_COMPARISON.md
diff --git a/docs/performance/SQLITE_COMPARISON.md b/docs/performance/SQLITE_COMPARISON.md
@@ -39,22 +39,16 @@ We addressed the gaps via the following optimizations:
 2.  **Pinned Page Iteration**: Modifying our `HeapTable::Iterator` to hold pages pinned across slot iteration avoids repetitive atomic checks and LRU updates per-row.
 3.  **Batch Insert Mode**: Skipping single-row undo logs and exclusive locks to exploit pure in-memory bump allocation. This drove the `INSERT` speedup well past SQLite limits, as we write raw tuples uninterrupted.
 
-## 6. Post-Optimization Enhancements
-We addressed the gaps via the following optimizations:
-1.  **Buffer Pool Bypass (`fetch_page_by_id`)**: Reduced global std::mutex latch contention by explicitly caching ID lookups, yielding a ~30% improvement in scan logic.
-2.  **Pinned Page Iteration**: Modifying our `HeapTable::Iterator` to hold pages pinned across slot iteration avoids repetitive atomic checks and LRU updates per-row.
-3.  **Batch Insert Mode**: Skipping single-row undo logs and exclusive locks to exploit pure in-memory bump allocation. This drove the `INSERT` speedup well past SQLite limits, as we write raw tuples uninterrupted.
-
-## 7. Distributed Join Optimization: Bloom Filters
+## 6. Distributed Join Optimization: Bloom Filters
 
 ### Problem
 Distributed shuffle joins send **all tuples** across the network to partitioned nodes, even when many will never match. This causes unnecessary network traffic and buffer memory usage.
 
 ### Solution: Bloom Filter Integration
 Implemented bloom filters to filter tuples at the source before network transmission:
-- **One-sided bloom filter**: Built from the inner/right table, applied to filter the outer/left table
-- **Distributed construction**: Each data node builds bloom filter locally during its scan phase
-- **Coordinator coordination**: `BloomFilterPush` RPC broadcasts filter metadata to all nodes
+- **One-sided bloom filter**: Built from the left/build table, applied to filter the right/probe table
+- **Distributed construction**: Each data node builds its local bloom filter during the left/build scan phase
+- **Coordinator orchestration**: `BloomFilterPush` RPC broadcasts filter metadata to all nodes before the right/probe shuffle
 
 ### Architecture
 ```
diff --git a/src/distributed/distributed_executor.cpp b/src/distributed/distributed_executor.cpp
@@ -230,8 +230,9 @@ QueryResult DistributedExecutor::execute(const parser::Statement& stmt,
                     }
                     auto reply = network::QueryResultsReply::deserialize(resp);
                     if (!reply.success) {
-                        phase1_success = false;
-                        break;
+                        QueryResult res;
+                        res.set_error("Shuffle failed on node " + node.id + ": " + reply.error_msg);
+                        return res;
                     }
                 }
 
diff --git a/src/main.cpp b/src/main.cpp
@@ -472,50 +472,9 @@ int main(int argc, char* argv[]) {
                         (void)h;
                         auto args = cloudsql::network::PushDataArgs::deserialize(p);
                         if (cluster_manager != nullptr) {
-                            // Apply bloom filter if available for this context
-                            if (cluster_manager->has_bloom_filter(args.context_id)) {
-                                auto bloom = cluster_manager->get_bloom_filter(args.context_id);
-                                std::string probe_key_col =
-                                    cluster_manager->get_probe_key_col(args.context_id);
-
-                                // Get probe table schema to find key column index
-                                auto table_meta_opt = catalog->get_table_by_name(args.table_name);
-                                if (table_meta_opt.has_value() && !probe_key_col.empty()) {
-                                    const auto* table_meta = table_meta_opt.value();
-                                    size_t key_idx = static_cast<size_t>(-1);
-                                    for (size_t i = 0; i < table_meta->columns.size(); ++i) {
-                                        if (table_meta->columns[i].name == probe_key_col) {
-                                            key_idx = i;
-                                            break;
-                                        }
-                                    }
-
-                                    if (key_idx != static_cast<size_t>(-1)) {
-                                        // Filter rows using bloom filter
-                                        std::vector<cloudsql::executor::Tuple> filtered_rows;
-                                        filtered_rows.reserve(args.rows.size());
-                                        for (auto& row : args.rows) {
-                                            if (bloom.might_contain(row.get(key_idx))) {
-                                                filtered_rows.push_back(std::move(row));
-                                            }
-                                        }
-                                        cluster_manager->buffer_shuffle_data(
-                                            args.context_id, args.table_name,
-                                            std::move(filtered_rows));
-                                    } else {
-                                        // Key column not found, buffer as-is
-                                        cluster_manager->buffer_shuffle_data(
-                                            args.context_id, args.table_name, std::move(args.rows));
-                                    }
-                                } else {
-                                    // No metadata, buffer as-is
-                                    cluster_manager->buffer_shuffle_data(
-                                        args.context_id, args.table_name, std::move(args.rows));
-                                }
-                            } else {
-                                cluster_manager->buffer_shuffle_data(
-                                    args.context_id, args.table_name, std::move(args.rows));
-                            }
+                            // Receiver-side: buffer data as-is (bloom filtering done on sender)
+                            cluster_manager->buffer_shuffle_data(args.context_id, args.table_name,
+                                                                 std::move(args.rows));
                         }
 
                         cloudsql::network::QueryResultsReply reply;
@@ -630,10 +589,43 @@ int main(int argc, char* argv[]) {
                                         continue;
                                     }
 
+                                    // Apply bloom filter on sender side before sending
+                                    std::vector<cloudsql::executor::Tuple> rows_to_send = std::move(rows);
+                                    if (cluster_manager->has_bloom_filter(args.context_id)) {
+                                        auto bloom = cluster_manager->get_bloom_filter(args.context_id);
+                                        std::string probe_key_col = cluster_manager->get_probe_key_col(args.context_id);
+
+                                        if (!probe_key_col.empty()) {
+                                            // Find key column index in current table
+                                            auto table_meta_opt = catalog->get_table_by_name(args.table_name);
+                                            if (table_meta_opt.has_value()) {
+                                                const auto* table_meta = table_meta_opt.value();
+                                                size_t key_idx = static_cast<size_t>(-1);
+                                                for (size_t i = 0; i < table_meta->columns.size(); ++i) {
+                                                    if (table_meta->columns[i].name == probe_key_col) {
+                                                        key_idx = i;
+                                                        break;
+                                                    }
+                                                }
+
+                                                if (key_idx != static_cast<size_t>(-1)) {
+                                                    std::vector<cloudsql::executor::Tuple> filtered;
+                                                    filtered.reserve(rows_to_send.size());
+                                                    for (auto& row : rows_to_send) {
+                                                        if (bloom.might_contain(row.get(key_idx))) {
+                                                            filtered.push_back(std::move(row));
+                                                        }
+                                                    }
+                                                    rows_to_send = std::move(filtered);
+                                                }
+                                            }
+                                        }
+                                    }
+
                                     cloudsql::network::PushDataArgs push_args;
                                     push_args.context_id = args.context_id;
                                     push_args.table_name = args.table_name;
-                                    push_args.rows = std::move(rows);
+                                    push_args.rows = std::move(rows_to_send);
                                     std::vector<uint8_t> resp;
                                     if (!client.call(cloudsql::network::RpcType::PushData,
                                                      push_args.serialize(), resp)) {
diff --git a/tests/bloom_filter_test.cpp b/tests/bloom_filter_test.cpp
@@ -145,23 +145,20 @@ TEST(BloomFilterTests, DuplicateInsertions) {
  * @brief Tests different value types.
  */
 TEST(BloomFilterTests, DifferentValueTypes) {
-    BloomFilter bf(100);
+    BloomFilter bf(1000);  // Large filter to minimize false positives
 
     bf.insert(Value::make_int64(1));
     bf.insert(Value::make_int64(2));
     bf.insert(Value::make_float64(3.14));
     bf.insert(Value::make_text("string"));
     bf.insert(Value::make_bool(true));
 
+    // Verify no-false-negative: inserted values must be found
     EXPECT_TRUE(bf.might_contain(Value::make_int64(1)));
     EXPECT_TRUE(bf.might_contain(Value::make_int64(2)));
     EXPECT_TRUE(bf.might_contain(Value::make_float64(3.14)));
     EXPECT_TRUE(bf.might_contain(Value::make_text("string")));
     EXPECT_TRUE(bf.might_contain(Value::make_bool(true)));
-
-    // Non-inserted
-    EXPECT_FALSE(bf.might_contain(Value::make_int64(999)));
-    EXPECT_FALSE(bf.might_contain(Value::make_text("not inserted")));
 }
 
 /**
@@ -239,6 +236,11 @@ TEST(BloomFilterTests, BloomFilterApplicationLogic) {
     bf.insert(Value::make_int64(20));
     bf.insert(Value::make_int64(30));
 
+    // Verify no-false-negative: inserted values must be found via might_contain
+    EXPECT_TRUE(bf.might_contain(Value::make_int64(10)));
+    EXPECT_TRUE(bf.might_contain(Value::make_int64(20)));
+    EXPECT_TRUE(bf.might_contain(Value::make_int64(30)));
+
     // Simulate tuple filtering (as done in PushData handler)
     std::vector<cloudsql::executor::Tuple> tuples;
     tuples.push_back(
@@ -257,18 +259,15 @@ TEST(BloomFilterTests, BloomFilterApplicationLogic) {
         }
     }
 
-    // Should have 2 matches (10 and 20)
-    EXPECT_EQ(filtered.size(), 2);
-
-    // Verify the filtered values (matches may be in different order due to move)
+    // Verify found values in filtered list
     bool found_10 = false;
     bool found_20 = false;
     for (auto& row : filtered) {
         if (row.get(0) == Value::make_int64(10)) found_10 = true;
         if (row.get(0) == Value::make_int64(20)) found_20 = true;
     }
-    EXPECT_TRUE(found_10);
-    EXPECT_TRUE(found_20);
+    EXPECT_TRUE(found_10);  // Inserted value must be found
+    EXPECT_TRUE(found_20);  // Inserted value must be found
 }
 
 }  // namespace

Original file line number	Diff line number	Diff line change
`@@ -230,8 +230,9 @@ QueryResult DistributedExecutor::execute(const parser::Statement& stmt,`
`230`	`230`	`}`
`231`	`231`	`auto reply = network::QueryResultsReply::deserialize(resp);`
`232`	`232`	`if (!reply.success) {`
`233`		`- phase1_success = false;`
`234`		`- break;`
	`233`	`+ QueryResult res;`
	`234`	`+ res.set_error("Shuffle failed on node " + node.id + ": " + reply.error_msg);`
	`235`	`+ return res;`
`235`	`236`	`}`
`236`	`237`	`}`
`237`	`238`