From 55e0617ba75182958fc16579eaad6731b4a54ea2 Mon Sep 17 00:00:00 2001
From: RobinTF <83676088+RobinTF@users.noreply.github.com>
Date: Mon, 18 Nov 2024 18:54:41 +0100
Subject: [PATCH 1/4] Allow block-based join algorithm to work with undef
 values (#1616)

Extend the block-based merge-join algorithm, s.t. it can support undefined inputs. This currently only works for single columns joins where the undefined values are at the beginning of each input and (as there is only one join column) compatible with every other input element.
This is an important precondition for a lazy single-column join for sorted inputs.
---
 src/util/JoinAlgorithms/JoinAlgorithms.h | 299 +++++++++++++++++++++--
 src/util/TransparentFunctors.h           |  10 +
 test/JoinAlgorithmsTest.cpp              | 276 +++++++++++++++++++++
 3 files changed, 559 insertions(+), 26 deletions(-)
diff --git a/src/util/JoinAlgorithms/JoinAlgorithms.h b/src/util/JoinAlgorithms/JoinAlgorithms.h
index 13d52aa2d8..64c27d74c9 100644
--- a/src/util/JoinAlgorithms/JoinAlgorithms.h
+++ b/src/util/JoinAlgorithms/JoinAlgorithms.h
@@ -156,7 +156,7 @@ template <std::ranges::random_access_range Range1,
     if constexpr (isSimilar<FindSmallerUndefRangesLeft, Noop> &&
                   isSimilar<FindSmallerUndefRangesRight, Noop>) {
       return true;
-    } else if constexpr (std::is_same_v<T, Id>) {
+    } else if constexpr (std::is_convertible_v<T, Id>) {
       return row != Id::makeUndefined();
     } else {
       return (std::ranges::none_of(
@@ -664,6 +664,7 @@ struct JoinSide {
   [[no_unique_address]] const End end_;
   const Projection& projection_;
   CurrentBlocks currentBlocks_{};
+  CurrentBlocks undefBlocks_{};
 
   // Type aliases for a single element from a block from the left/right input.
   using value_type = std::ranges::range_value_t<std::iter_value_t<Iterator>>;
@@ -689,6 +690,10 @@ auto makeJoinSide(Blocks& blocks, const auto& projection) {
 template <typename T>
 concept IsJoinSide = ad_utility::isInstantiation<T, JoinSide>;
 
+struct AlwaysFalse {
+  bool operator()(const auto&) const { return false; }
+};
+
 // The class that actually performs the zipper join for blocks without UNDEF.
 // See the public `zipperJoinForBlocksWithoutUndef` function below for details.
 // The general approach of the algorithm is described in the following. Several
@@ -736,7 +741,10 @@ concept IsJoinSide = ad_utility::isInstantiation<T, JoinSide>;
 // `currentEl` (5 in this example). New blocks are added to one of the buffers
 // if they become empty at one point in the algorithm.
 template <IsJoinSide LeftSide, IsJoinSide RightSide, typename LessThan,
-          typename CompatibleRowAction>
+          typename CompatibleRowAction,
+          ad_utility::InvocableWithExactReturnType<
+              bool, typename LeftSide::ProjectedEl>
+              IsUndef = AlwaysFalse>
 struct BlockZipperJoinImpl {
   // The left and right inputs of the join
   LeftSide leftSide_;
@@ -745,11 +753,14 @@ struct BlockZipperJoinImpl {
   const LessThan& lessThan_;
   // The callback that is called for each pair of matching rows.
   CompatibleRowAction& compatibleRowAction_;
+  [[no_unique_address]] IsUndef isUndefined_{};
 
   // Type alias for the result of the projection. Elements from the left and
   // right input must be projected to the same type.
   using ProjectedEl = LeftSide::ProjectedEl;
   static_assert(std::same_as<ProjectedEl, typename RightSide::ProjectedEl>);
+  static constexpr bool potentiallyHasUndef =
+      !std::is_same_v<IsUndef, AlwaysFalse>;
 
   // Create an equality comparison from the `lessThan` predicate.
   bool eq(const auto& el1, const auto& el2) {
@@ -850,12 +861,38 @@ struct BlockZipperJoinImpl {
     return std::tuple{std::ref(first.fullBlock()), first.subrange(), it};
   }
 
-  // Call `compatibleRowAction` for all pairs of elements in the Cartesian
-  // product of the blocks in `blocksLeft` and `blocksRight`.
+  // Check if a side contains undefined values.
+  static bool hasUndef(const auto& side) {
+    if constexpr (potentiallyHasUndef) {
+      return !side.undefBlocks_.empty();
+    }
+    return false;
+  }
+
+  // Combine all elements from all blocks on the left with all elements from all
+  // blocks on the right and add them to the result.
+  void addCartesianProduct(const auto& blocksLeft, const auto& blocksRight) {
+    // TODO<C++23> use `std::views::cartesian_product`.
+    for (const auto& lBlock : blocksLeft) {
+      for (const auto& rBlock : blocksRight) {
+        compatibleRowAction_.setInput(lBlock.fullBlock(), rBlock.fullBlock());
+        for (size_t i : lBlock.getIndexRange()) {
+          for (size_t j : rBlock.getIndexRange()) {
+            compatibleRowAction_.addRow(i, j);
+          }
+        }
+      }
+    }
+  }
+
+  // Handle non-matching rows from the left side for an optional join or a minus
+  // join.
   template <bool DoOptionalJoin>
-  void addAll(const auto& blocksLeft, const auto& blocksRight) {
+  void addNonMatchingRowsFromLeftForOptionalJoin(const auto& blocksLeft,
+                                                 const auto& blocksRight) {
     if constexpr (DoOptionalJoin) {
-      if (std::ranges::all_of(
+      if (!hasUndef(rightSide_) &&
+          std::ranges::all_of(
               blocksRight | std::views::transform(
                                 [](const auto& inp) { return inp.subrange(); }),
               std::ranges::empty)) {
@@ -868,17 +905,15 @@ struct BlockZipperJoinImpl {
         }
       }
     }
-    // TODO<C++23> use `std::views::cartesian_product`.
-    for (const auto& lBlock : blocksLeft) {
-      for (const auto& rBlock : blocksRight) {
-        compatibleRowAction_.setInput(lBlock.fullBlock(), rBlock.fullBlock());
-        for (size_t i : lBlock.getIndexRange()) {
-          for (size_t j : rBlock.getIndexRange()) {
-            compatibleRowAction_.addRow(i, j);
-          }
-        }
-      }
-    }
+  }
+
+  // Call `compatibleRowAction` for all pairs of elements in the Cartesian
+  // product of the blocks in `blocksLeft` and `blocksRight`.
+  template <bool DoOptionalJoin>
+  void addAll(const auto& blocksLeft, const auto& blocksRight) {
+    addNonMatchingRowsFromLeftForOptionalJoin<DoOptionalJoin>(blocksLeft,
+                                                              blocksRight);
+    addCartesianProduct(blocksLeft, blocksRight);
     compatibleRowAction_.flush();
   }
 
@@ -897,6 +932,59 @@ struct BlockZipperJoinImpl {
     return result;
   }
 
+  // Main implementation for `findUndefValues`.
+  template <bool left, typename T>
+  cppcoro::generator<T> findUndefValuesHelper(const auto& fullBlockLeft,
+                                              const auto& fullBlockRight,
+                                              T& begL, T& begR,
+                                              const auto& undefBlocks) {
+    for (const auto& undefBlock : undefBlocks) {
+      // Select proper input table from the stored undef blocks
+      if constexpr (left) {
+        begL = undefBlock.fullBlock().begin();
+        compatibleRowAction_.setInput(undefBlock.fullBlock(),
+                                      fullBlockRight.get());
+      } else {
+        begR = undefBlock.fullBlock().begin();
+        compatibleRowAction_.setInput(fullBlockLeft.get(),
+                                      undefBlock.fullBlock());
+      }
+      const auto& subrange = undefBlock.subrange();
+      // Yield all iterators to the elements within the stored undef blocks.
+      for (auto subIt = subrange.begin(); subIt < subrange.end(); ++subIt) {
+        co_yield subIt;
+      }
+    }
+    // Reset back to original input
+    compatibleRowAction_.setInput(fullBlockLeft.get(), fullBlockRight.get());
+    // No need for further iteration because we know we won't encounter any new
+    // undefined values at this point.
+  }
+
+  // Create a generator that yields iterators to all undefined values that
+  // have been found so far. Note that because of limitations of the
+  // `zipperJoinWithUndef` interface we need to set `begL` and `begR` to the
+  // beginning of the full blocks of the left and right side respectively so
+  // that they can be used within `zipperJoinWithUndef` to compute the
+  // distance from the yielded iterator to the beginning of the block.
+  template <bool left, typename T>
+  auto findUndefValues(const auto& fullBlockLeft, const auto& fullBlockRight,
+                       T& begL, T& begR) {
+    return [this, &fullBlockLeft, &fullBlockRight, &begL, &begR](
+               const auto&, auto, auto, bool) {
+      auto currentSide = [this]() {
+        if constexpr (left) {
+          return std::cref(leftSide_);
+        } else {
+          return std::cref(rightSide_);
+        }
+      }();
+      return findUndefValuesHelper<left, T>(fullBlockLeft, fullBlockRight, begL,
+                                            begR,
+                                            currentSide.get().undefBlocks_);
+    };
+  }
+
   // Join the first block in `currentBlocksLeft` with the first block in
   // `currentBlocksRight`, but ignore all elements that are `>= currentEl`
   // The fully joined parts of the block are then removed from
@@ -912,15 +1000,16 @@ struct BlockZipperJoinImpl {
         getFirstBlock(currentBlocksRight, currentEl);
 
     compatibleRowAction_.setInput(fullBlockLeft.get(), fullBlockRight.get());
-    auto addRowIndex = [begL = fullBlockLeft.get().begin(),
-                        begR = fullBlockRight.get().begin(),
-                        this](auto itFromL, auto itFromR) {
+    auto begL = fullBlockLeft.get().begin();
+    auto begR = fullBlockRight.get().begin();
+    auto addRowIndex = [&begL, &begR, this](auto itFromL, auto itFromR) {
       compatibleRowAction_.addRow(itFromL - begL, itFromR - begR);
     };
 
     auto addNotFoundRowIndex = [&]() {
       if constexpr (DoOptionalJoin) {
-        return [begL = fullBlockLeft.get().begin(), this](auto itFromL) {
+        return [this, begL = fullBlockLeft.get().begin()](auto itFromL) {
+          AD_CORRECTNESS_CHECK(!hasUndef(rightSide_));
           compatibleRowAction_.addOptionalRow(itFromL - begL);
         };
 
@@ -928,10 +1017,25 @@ struct BlockZipperJoinImpl {
         return ad_utility::noop;
       }
     }();
-    [[maybe_unused]] auto res = zipperJoinWithUndef(
-        std::ranges::subrange{subrangeLeft.begin(), currentElItL},
-        std::ranges::subrange{subrangeRight.begin(), currentElItR}, lessThan_,
-        addRowIndex, noop, noop, addNotFoundRowIndex);
+    // All undefined values should already be processed at this point.
+    AD_CORRECTNESS_CHECK(!isUndefined_(subrangeLeft.front()));
+    AD_CORRECTNESS_CHECK(!isUndefined_(subrangeRight.front()));
+    // If we have undefined values stored, we need to provide a generator that
+    // yields iterators to the individual undefined values.
+    if constexpr (potentiallyHasUndef) {
+      [[maybe_unused]] auto res = zipperJoinWithUndef(
+          std::ranges::subrange{subrangeLeft.begin(), currentElItL},
+          std::ranges::subrange{subrangeRight.begin(), currentElItR}, lessThan_,
+          addRowIndex,
+          findUndefValues<true>(fullBlockLeft, fullBlockRight, begL, begR),
+          findUndefValues<false>(fullBlockLeft, fullBlockRight, begL, begR),
+          addNotFoundRowIndex);
+    } else {
+      [[maybe_unused]] auto res = zipperJoinWithUndef(
+          std::ranges::subrange{subrangeLeft.begin(), currentElItL},
+          std::ranges::subrange{subrangeRight.begin(), currentElItR}, lessThan_,
+          addRowIndex, noop, noop, addNotFoundRowIndex);
+    }
     compatibleRowAction_.flush();
 
     // Remove the joined elements.
@@ -979,6 +1083,21 @@ struct BlockZipperJoinImpl {
     return fillEqualToCurrentElBothSides(getCurrentEl());
   }
 
+  // Based on `blockStatus` add the Cartesian product of the blocks in
+  // `leftBlocks` and/or `rightBlocks` with their respective counterpart in
+  // `undefBlocks_`.
+  void joinWithUndefBlocks(BlockStatus blockStatus, const auto& leftBlocks,
+                           const auto& rightBlocks) {
+    if (blockStatus == BlockStatus::allFilled ||
+        blockStatus == BlockStatus::leftMissing) {
+      addCartesianProduct(leftBlocks, rightSide_.undefBlocks_);
+    }
+    if (blockStatus == BlockStatus::allFilled ||
+        blockStatus == BlockStatus::rightMissing) {
+      addCartesianProduct(leftSide_.undefBlocks_, rightBlocks);
+    }
+  }
+
   // Combine the above functionality and perform one round of joining.
   // Has to be called alternately with `fillBuffer`.
   template <bool DoOptionalJoin, typename ProjectedEl>
@@ -1010,9 +1129,12 @@ struct BlockZipperJoinImpl {
         blockStatus = BlockStatus::allFilled;
       }
     };
+
     // We are only guaranteed to have all relevant blocks from one side, so we
     // also need to pass through the remaining blocks from the other side.
     while (!equalToCurrentElLeft.empty() && !equalToCurrentElRight.empty()) {
+      joinWithUndefBlocks(blockStatus, equalToCurrentElLeft,
+                          equalToCurrentElRight);
       addAll<DoOptionalJoin>(equalToCurrentElLeft, equalToCurrentElRight);
       switch (blockStatus) {
         case BlockStatus::allFilled:
@@ -1059,15 +1181,112 @@ struct BlockZipperJoinImpl {
     compatibleRowAction_.flush();
   }
 
+  // Consume all remaining blocks from one side and add the Cartesian product of
+  // those blocks with the undef blocks from the other side.
+  // `reverse` is used to determine if the left or right side is consumed.
+  template <bool reversed>
+  void consumeRemainingBlocks(auto& side, const auto& undefBlocks) {
+    while (side.it_ != side.end_) {
+      const auto& lBlock = *side.it_;
+      for (const auto& rBlock : undefBlocks) {
+        if constexpr (reversed) {
+          compatibleRowAction_.setInput(rBlock.fullBlock(), lBlock);
+        } else {
+          compatibleRowAction_.setInput(lBlock, rBlock.fullBlock());
+        }
+        for (size_t i : ad_utility::integerRange(lBlock.size())) {
+          for (size_t j : rBlock.getIndexRange()) {
+            if constexpr (reversed) {
+              compatibleRowAction_.addRow(j, i);
+            } else {
+              compatibleRowAction_.addRow(i, j);
+            }
+          }
+        }
+      }
+      ++side.it_;
+    }
+  }
+
+  // If one of the sides is exhausted and has no values to match the pairs
+  // left, we need to pair the remaining values with the undef values we have
+  // left.
+  void addRemainingUndefPairs() {
+    if constexpr (potentiallyHasUndef) {
+      addCartesianProduct(leftSide_.currentBlocks_, rightSide_.undefBlocks_);
+      consumeRemainingBlocks<false>(leftSide_, rightSide_.undefBlocks_);
+
+      addCartesianProduct(leftSide_.undefBlocks_, rightSide_.currentBlocks_);
+      consumeRemainingBlocks<true>(rightSide_, leftSide_.undefBlocks_);
+
+      compatibleRowAction_.flush();
+    }
+  }
+
+  // Consume the blocks until the first block is found that does contain a
+  // defined value. All blocks up until that point are stored in
+  // `side.undefBlocks_` and skipped for subsequent processing. The first block
+  // containing defined values is split and the defined part is stored in
+  // `side.currentBlocks_`.
+  void findFirstBlockWithoutUndef(auto& side) {
+    // The reference of `it` is there on purpose.
+    for (auto& it = side.it_; it != side.end_; ++it) {
+      auto& el = *it;
+      if (std::ranges::empty(el) || !isUndefined_(el.front())) {
+        return;
+      }
+      bool endIsUndefined = isUndefined_(el.back());
+      side.undefBlocks_.emplace_back(std::move(el));
+      if (!endIsUndefined) {
+        auto& lastUndefinedBlock = side.undefBlocks_.back();
+        side.currentBlocks_.push_back(lastUndefinedBlock);
+        auto subrange = std::ranges::equal_range(
+            lastUndefinedBlock.subrange(),
+            lastUndefinedBlock.subrange().front(), lessThan_);
+        size_t undefCount = std::ranges::size(subrange);
+        lastUndefinedBlock.setSubrange(std::move(subrange));
+        auto& firstDefinedBlock = side.currentBlocks_.back();
+        firstDefinedBlock.setSubrange(
+            firstDefinedBlock.fullBlock().begin() + undefCount,
+            firstDefinedBlock.fullBlock().end());
+        // Make sure this block is not accessed with moved-out value.
+        ++it;
+        return;
+      }
+    }
+  }
+
+  // Find and process all leading undefined values from the blocks.
+  void fetchAndProcessUndefinedBlocks() {
+    if constexpr (potentiallyHasUndef) {
+      findFirstBlockWithoutUndef(leftSide_);
+      findFirstBlockWithoutUndef(rightSide_);
+      addCartesianProduct(leftSide_.undefBlocks_, rightSide_.undefBlocks_);
+    }
+  }
+
   // The actual join routine that combines all the previous functions.
   template <bool DoOptionalJoin>
   void runJoin() {
+    fetchAndProcessUndefinedBlocks();
+    if (potentiallyHasUndef && !hasUndef(leftSide_) && !hasUndef(rightSide_)) {
+      // Run the join without UNDEF values if there are none. No need to move
+      // since LeftSide and RightSide are references.
+      BlockZipperJoinImpl<LeftSide, RightSide, LessThan, CompatibleRowAction,
+                          AlwaysFalse>{leftSide_, rightSide_, lessThan_,
+                                       compatibleRowAction_, AlwaysFalse{}}
+          .template runJoin<DoOptionalJoin>();
+      return;
+    }
     while (true) {
       BlockStatus blockStatus = fillBuffer();
       if (leftSide_.currentBlocks_.empty() ||
           rightSide_.currentBlocks_.empty()) {
+        addRemainingUndefPairs();
         if constexpr (DoOptionalJoin) {
-          fillWithAllFromLeft();
+          if (!hasUndef(rightSide_)) {
+            fillWithAllFromLeft();
+          }
         }
         return;
       }
@@ -1081,6 +1300,10 @@ template <typename LHS, typename RHS, typename LessThan,
           typename CompatibleRowAction>
 BlockZipperJoinImpl(LHS&, RHS&, const LessThan&, CompatibleRowAction&)
     -> BlockZipperJoinImpl<LHS, RHS, LessThan, CompatibleRowAction>;
+template <typename LHS, typename RHS, typename LessThan,
+          typename CompatibleRowAction, typename IsUndef>
+BlockZipperJoinImpl(LHS&, RHS&, const LessThan&, CompatibleRowAction&, IsUndef)
+    -> BlockZipperJoinImpl<LHS, RHS, LessThan, CompatibleRowAction, IsUndef>;
 
 }  // namespace detail
 
@@ -1133,4 +1356,28 @@ void zipperJoinForBlocksWithoutUndef(LeftBlocks&& leftBlocks,
   impl.template runJoin<DoOptionalJoin>();
 }
 
+// Similar to `zipperJoinForBlocksWithoutUndef`, but allows for UNDEF values in
+// a single column join scenario.
+template <typename LeftBlocks, typename RightBlocks, typename LessThan,
+          typename LeftProjection = std::identity,
+          typename RightProjection = std::identity,
+          typename DoOptionalJoinTag = std::false_type>
+void zipperJoinForBlocksWithPotentialUndef(LeftBlocks&& leftBlocks,
+                                           RightBlocks&& rightBlocks,
+                                           const LessThan& lessThan,
+                                           auto& compatibleRowAction,
+                                           LeftProjection leftProjection = {},
+                                           RightProjection rightProjection = {},
+                                           DoOptionalJoinTag = {}) {
+  static constexpr bool DoOptionalJoin = DoOptionalJoinTag::value;
+
+  auto leftSide = detail::makeJoinSide(leftBlocks, leftProjection);
+  auto rightSide = detail::makeJoinSide(rightBlocks, rightProjection);
+
+  detail::BlockZipperJoinImpl impl{
+      leftSide, rightSide, lessThan, compatibleRowAction,
+      [](const Id& id) { return id.isUndefined(); }};
+  impl.template runJoin<DoOptionalJoin>();
+}
+
 }  // namespace ad_utility
diff --git a/src/util/TransparentFunctors.h b/src/util/TransparentFunctors.h
index e00d3b7a53..6e2bd9fca3 100644
--- a/src/util/TransparentFunctors.h
+++ b/src/util/TransparentFunctors.h
@@ -118,6 +118,16 @@ struct Noop {
 };
 [[maybe_unused]] static constexpr Noop noop{};
 
+template <typename T>
+struct StaticCast {
+  constexpr decltype(auto) operator()(auto&& x) const {
+    return static_cast<T>(AD_FWD(x));
+  }
+};
+
+template <typename T>
+static constexpr StaticCast<T> staticCast{};
+
 }  // namespace ad_utility
 
 #endif  // QLEVER_TRANSPARENTFUNCTORS_H
diff --git a/test/JoinAlgorithmsTest.cpp b/test/JoinAlgorithmsTest.cpp
index f9397eaf46..1829de1519 100644
--- a/test/JoinAlgorithmsTest.cpp
+++ b/test/JoinAlgorithmsTest.cpp
@@ -195,3 +195,279 @@ TEST(JoinAlgorithms, JoinWithBlocksMultipleBlocksPerElementBothSides) {
   // the optional join stays the same.
   testOptionalJoin(a, b, expectedResult);
 }
+
+namespace {
+
+// Replacement for `Id`, but with an additional tag to distinguish between ids
+// with the same value for testing.
+struct FakeId {
+  Id value_;
+  std::string_view tag_;
+
+  operator Id() const { return value_; }
+  auto operator==(const FakeId& other) const {
+    return value_.getBits() == other.value_.getBits() && tag_ == other.tag_;
+  }
+
+  friend std::ostream& operator<<(std::ostream& os, const FakeId& id) {
+    return os << "FakeId{" << id.value_ << ", " << id.tag_ << "}";
+  }
+};
+
+// RowAdder implementation that works with FakeIds and allows to tell undefined
+// ids apart from each other.
+struct RowAdderWithUndef {
+  const std::vector<FakeId>* left_ = nullptr;
+  const std::vector<FakeId>* right_ = nullptr;
+  std::vector<std::array<FakeId, 2>> output_{};
+
+  void setInput(const std::vector<FakeId>& left,
+                const std::vector<FakeId>& right) {
+    left_ = &left;
+    right_ = &right;
+  }
+
+  void setOnlyLeftInputForOptionalJoin(const std::vector<FakeId>& left) {
+    left_ = &left;
+  }
+
+  void addRow(size_t leftIndex, size_t rightIndex) {
+    auto id1 = (*left_)[leftIndex];
+    auto id2 = (*right_)[rightIndex];
+    output_.push_back({id1, id2});
+  }
+
+  void addOptionalRow(size_t leftIndex) {
+    auto id = (*left_)[leftIndex];
+    output_.push_back({id, FakeId{Id::makeUndefined(), "OPTIONAL"}});
+  }
+
+  void flush() const {
+    // Does nothing, but is required for the interface.
+  }
+
+  const auto& getOutput() const { return output_; }
+};
+
+// Join both vectors `a` and `b` and assert that the result is equal to the
+// given `expected` result. Joins are performed 2 times, the second time with
+// `a` and `b` swapped.
+void testDynamicJoinWithUndef(const std::vector<std::vector<FakeId>>& a,
+                              const std::vector<std::vector<FakeId>>& b,
+                              std::vector<std::array<FakeId, 2>> expected,
+                              source_location l = source_location::current()) {
+  using namespace std::placeholders;
+  using namespace std::ranges;
+  auto trace = generateLocationTrace(l);
+  auto compare = [](FakeId l, FakeId r) {
+    return static_cast<Id>(l) < static_cast<Id>(r);
+  };
+  AD_CONTRACT_CHECK(is_sorted(a | views::join, {}, ad_utility::staticCast<Id>));
+  AD_CONTRACT_CHECK(is_sorted(b | views::join, {}, ad_utility::staticCast<Id>));
+  auto validationProjection = [](const std::array<FakeId, 2>& fakeIds) -> Id {
+    const auto& [x, y] = fakeIds;
+    return x == Id::makeUndefined() ? y : x;
+  };
+  {
+    RowAdderWithUndef adder{};
+    zipperJoinForBlocksWithPotentialUndef(a, b, compare, adder);
+    const auto& result = adder.getOutput();
+    // The result must be sorted on the first column
+    EXPECT_TRUE(is_sorted(result, std::less<>{}, validationProjection));
+    // The exact order of the elements with the same first column is not
+    // important and depends on implementation details. We therefore do not
+    // enforce it here.
+    EXPECT_THAT(result, ::testing::UnorderedElementsAreArray(expected));
+  }
+
+  for (auto& [x, y] : expected) {
+    std::swap(x, y);
+  }
+
+  {
+    RowAdderWithUndef adder{};
+    zipperJoinForBlocksWithPotentialUndef(b, a, compare, adder);
+    const auto& result = adder.getOutput();
+    EXPECT_TRUE(is_sorted(result, std::less<>{}, validationProjection));
+    EXPECT_THAT(result, ::testing::UnorderedElementsAreArray(expected));
+  }
+}
+using F = FakeId;
+auto I = Id::makeFromInt;
+}  // namespace
+
+// ________________________________________________________________________________________
+TEST(JoinAlgorithms, JoinWithBlocksWithUndefOnOneSide) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{{{U, "a0"}},
+                                     {{I(42), "a1"}, {I(42), "a2"}},
+                                     {{I(42), "a3"}, {I(67), "a4"}},
+                                     {{I(67), "a5"}},
+                                     {{I(67), "a6"}},
+                                     {{I(67), "a7"}},
+                                     {{I(67), "a8"}},
+                                     {{I(67), "a9"}},
+                                     {{I(67), "a10"}},
+                                     {{I(68), "a11"}},
+                                     {{I(68), "a12"}},
+                                     {{I(68), "a13"}},
+                                     {{I(68), "a14"}},
+                                     {{I(68), "a15"}},
+                                     {{I(68), "a16"}},
+                                     {{I(68), "a17"}}};
+  std::vector<std::vector<FakeId>> b{{{I(2), "b0"}, {I(42), "b1"}},
+                                     {{I(42), "b2"}, {I(67), "b3"}}};
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{I(2), "b0"}},       {F{U, "a0"}, F{I(42), "b1"}},
+      {F{U, "a0"}, F{I(42), "b2"}},      {F{I(42), "a1"}, F{I(42), "b1"}},
+      {F{I(42), "a1"}, F{I(42), "b2"}},  {F{I(42), "a2"}, F{I(42), "b1"}},
+      {F{I(42), "a2"}, F{I(42), "b2"}},  {F{I(42), "a3"}, F{I(42), "b1"}},
+      {F{I(42), "a3"}, F{I(42), "b2"}},  {F{U, "a0"}, F{I(67), "b3"}},
+      {F{I(67), "a4"}, F{I(67), "b3"}},  {F{I(67), "a5"}, F{I(67), "b3"}},
+      {F{I(67), "a6"}, F{I(67), "b3"}},  {F{I(67), "a7"}, F{I(67), "b3"}},
+      {F{I(67), "a8"}, F{I(67), "b3"}},  {F{I(67), "a9"}, F{I(67), "b3"}},
+      {F{I(67), "a10"}, F{I(67), "b3"}},
+  };
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// ________________________________________________________________________________________
+TEST(JoinAlgorithms, JoinWithBlocksWithUndefOnBothSides) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{{{U, "a0"}},
+                                     {{I(42), "a1"}, {I(42), "a2"}},
+                                     {{I(42), "a3"}, {I(67), "a4"}},
+                                     {{I(67), "a5"}},
+                                     {{I(67), "a6"}},
+                                     {{I(67), "a7"}},
+                                     {{I(67), "a8"}},
+                                     {{I(68), "a9"}},
+                                     {{I(68), "a10"}},
+                                     {{I(68), "a11"}},
+                                     {{I(68), "a12"}}};
+  std::vector<std::vector<FakeId>> b{{{U, "b0"}},
+                                     {{U, "b1"}, {I(2), "b2"}, {I(42), "b3"}},
+                                     {{I(42), "b4"}, {I(67), "b5"}}};
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{U, "b0"}},         {F{U, "a0"}, F{U, "b1"}},
+      {F{U, "a0"}, F{I(2), "b2"}},      {F{U, "a0"}, F{I(42), "b3"}},
+      {F{U, "a0"}, F{I(42), "b4"}},     {F{I(42), "a1"}, F{U, "b0"}},
+      {F{I(42), "a1"}, F{U, "b1"}},     {F{I(42), "a2"}, F{U, "b0"}},
+      {F{I(42), "a2"}, F{U, "b1"}},     {F{I(42), "a3"}, F{U, "b0"}},
+      {F{I(42), "a3"}, F{U, "b1"}},     {F{I(42), "a1"}, F{I(42), "b3"}},
+      {F{I(42), "a2"}, F{I(42), "b3"}}, {F{I(42), "a3"}, F{I(42), "b3"}},
+      {F{I(42), "a1"}, F{I(42), "b4"}}, {F{I(42), "a2"}, F{I(42), "b4"}},
+      {F{I(42), "a3"}, F{I(42), "b4"}}, {F{U, "a0"}, F{I(67), "b5"}},
+      {F{I(67), "a4"}, F{U, "b0"}},     {F{I(67), "a4"}, F{U, "b1"}},
+      {F{I(67), "a5"}, F{U, "b0"}},     {F{I(67), "a5"}, F{U, "b1"}},
+      {F{I(67), "a6"}, F{U, "b0"}},     {F{I(67), "a6"}, F{U, "b1"}},
+      {F{I(67), "a7"}, F{U, "b0"}},     {F{I(67), "a7"}, F{U, "b1"}},
+      {F{I(67), "a8"}, F{U, "b0"}},     {F{I(67), "a8"}, F{U, "b1"}},
+      {F{I(67), "a4"}, F{I(67), "b5"}}, {F{I(67), "a5"}, F{I(67), "b5"}},
+      {F{I(67), "a6"}, F{I(67), "b5"}}, {F{I(67), "a7"}, F{I(67), "b5"}},
+      {F{I(67), "a8"}, F{I(67), "b5"}}, {F{I(68), "a9"}, F{U, "b0"}},
+      {F{I(68), "a9"}, F{U, "b1"}},     {F{I(68), "a10"}, F{U, "b0"}},
+      {F{I(68), "a10"}, F{U, "b1"}},    {F{I(68), "a11"}, F{U, "b0"}},
+      {F{I(68), "a11"}, F{U, "b1"}},    {F{I(68), "a12"}, F{U, "b0"}},
+      {F{I(68), "a12"}, F{U, "b1"}},
+  };
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithms, JoinWithBlocksOneSideSingleUndef) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{{{U, "a0"}}};
+  std::vector<std::vector<FakeId>> b{{{I(1), "b0"}, {I(2), "b1"}}};
+
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{I(1), "b0"}},
+      {F{U, "a0"}, F{I(2), "b1"}},
+  };
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithms, JoinWithBlocksOneUndefinedValueMixedWithOtherValues) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{{{U, "a0"}, {I(1), "a1"}, {I(2), "a2"}}};
+  std::vector<std::vector<FakeId>> b{{{U, "b0"}, {I(2), "b1"}, {I(3), "b2"}}};
+
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{U, "b0"}},       {F{I(1), "a1"}, F{U, "b0"}},
+      {F{U, "a0"}, F{I(2), "b1"}},    {F{I(2), "a2"}, F{U, "b0"}},
+      {F{I(2), "a2"}, F{I(2), "b1"}}, {F{U, "a0"}, F{I(3), "b2"}},
+  };
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithms, UndefinedJoinWorksWithoutUndefinedValues) {
+  std::vector<std::vector<FakeId>> a{{{I(1), "a1"}, {I(2), "a2"}}};
+  std::vector<std::vector<FakeId>> b{{{I(2), "b1"}, {I(3), "b2"}}};
+
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{I(2), "a2"}, F{I(2), "b1"}}};
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithms, JoinWithBlocksMultipleGroupsAfterUndefined) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{
+      {{U, "a0"}, {I(1), "a1"}, {I(2), "a2"}, {I(3), "a3"}}};
+  std::vector<std::vector<FakeId>> b{
+      {{U, "b0"}, {I(1), "b1"}, {I(2), "b2"}, {I(3), "b3"}}};
+
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{U, "b0"}},       {F{I(1), "a1"}, F{U, "b0"}},
+      {F{U, "a0"}, F{I(1), "b1"}},    {F{I(1), "a1"}, F{I(1), "b1"}},
+      {F{U, "a0"}, F{I(2), "b2"}},    {F{I(2), "a2"}, F{U, "b0"}},
+      {F{I(2), "a2"}, F{I(2), "b2"}}, {F{U, "a0"}, F{I(3), "b3"}},
+      {F{I(3), "a3"}, F{U, "b0"}},    {F{I(3), "a3"}, F{I(3), "b3"}},
+  };
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithms, TrailingEmptyBlocksAreHandledWell) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{
+      {{U, "a0"}}, {{I(1), "a1"}}, {{I(2), "a2"}}, {{I(3), "a3"}}};
+  std::vector<std::vector<FakeId>> b{{{I(3), "b0"}}, {}, {}, {}, {}};
+
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{I(3), "b0"}}, {F{I(3), "a3"}, F{I(3), "b0"}}};
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithms, EmptyBlocksInTheMiddleAreHandledWell) {
+  auto U = Id::makeUndefined();
+  std::vector<std::vector<FakeId>> a{
+      {{U, "a0"}}, {{I(1), "a1"}}, {{I(2), "a2"}}, {{I(3), "a3"}}};
+  std::vector<std::vector<FakeId>> b{{{I(1), "b0"}}, {}, {{I(1), "b1"}}, {}, {},
+                                     {{I(3), "b2"}}};
+
+  std::vector<std::array<FakeId, 2>> expectedResult{
+      {F{U, "a0"}, F{I(1), "b0"}},    {F{U, "a0"}, F{I(1), "b1"}},
+      {F{I(1), "a1"}, F{I(1), "b0"}}, {F{I(1), "a1"}, F{I(1), "b1"}},
+      {F{U, "a0"}, F{I(3), "b2"}},    {F{I(3), "a3"}, F{I(3), "b2"}}};
+  testDynamicJoinWithUndef(a, b, expectedResult);
+}
+
+// _____________________________________________________________________________
+TEST(JoinAlgorithm, DefaultIsUndefinedFunctionAlwaysReturnsFalse) {
+  // This test is mostly for coverage purposes.
+  RowAdderWithUndef adder{};
+  std::vector<std::vector<FakeId>> dummyBlocks{};
+  auto compare = [](auto l, auto r) { return static_cast<Id>(l) < r; };
+  auto joinSide =
+      ad_utility::detail::makeJoinSide(dummyBlocks, std::identity{});
+  ad_utility::detail::BlockZipperJoinImpl impl{joinSide, joinSide, compare,
+                                               adder};
+  EXPECT_FALSE(impl.isUndefined_("Something"));
+  EXPECT_FALSE(impl.isUndefined_(1));
+  EXPECT_FALSE(impl.isUndefined_(I(1)));
+  EXPECT_FALSE(impl.isUndefined_(Id::makeUndefined()));
+}

From 92d906f198cfbf56347362aaa3a50bb0b45f9946 Mon Sep 17 00:00:00 2001
From: RobinTF <83676088+RobinTF@users.noreply.github.com>
Date: Tue, 19 Nov 2024 18:54:24 +0100
Subject: [PATCH 2/4] Fix out-of-memory issue with transitive paths (#1627)

The introduction of lazy transitive paths via #1595 caused transitive
path operations with lazy inputs and a fully materialized result to
store the same local vocab once per input row. This led to OOM errors
even if that local vocab was empty. This is not fixed by (1) skipping
empty local vocabs when merging, and (2) only storing one local vocab
per input block instead of repeating it for each row.

There can still be duplicates between the local vocabs of different
blocks. Deduplicating those is work for a separate PR.
---
 src/engine/LocalVocab.cpp         |  8 +++-----
 src/engine/LocalVocab.h           |  3 ++-
 src/engine/TransitivePathBase.cpp |  6 ++----
 src/engine/TransitivePathImpl.h   | 16 +++++++++++++---
 4 files changed, 20 insertions(+), 13 deletions(-)

diff --git a/src/engine/LocalVocab.cpp b/src/engine/LocalVocab.cpp
index 1dbc8e7c68..80c97de87a 100644
--- a/src/engine/LocalVocab.cpp
+++ b/src/engine/LocalVocab.cpp
@@ -10,11 +10,9 @@
 
 // _____________________________________________________________________________
 LocalVocab LocalVocab::clone() const {
-  LocalVocab localVocabClone;
-  localVocabClone.otherWordSets_ = otherWordSets_;
-  localVocabClone.otherWordSets_.push_back(primaryWordSet_);
-  // Return the clone.
-  return localVocabClone;
+  LocalVocab clone;
+  clone.mergeWith(std::span{this, 1});
+  return clone;
 }
 
 // _____________________________________________________________________________
diff --git a/src/engine/LocalVocab.h b/src/engine/LocalVocab.h
index 3055c400a6..ff30b824f1 100644
--- a/src/engine/LocalVocab.h
+++ b/src/engine/LocalVocab.h
@@ -96,7 +96,8 @@ class LocalVocab {
   template <std::ranges::range R>
   void mergeWith(const R& vocabs) {
     auto inserter = std::back_inserter(otherWordSets_);
-    for (const auto& vocab : vocabs) {
+    using std::views::filter;
+    for (const auto& vocab : vocabs | filter(std::not_fn(&LocalVocab::empty))) {
       std::ranges::copy(vocab.otherWordSets_, inserter);
       *inserter = vocab.primaryWordSet_;
     }
diff --git a/src/engine/TransitivePathBase.cpp b/src/engine/TransitivePathBase.cpp
index a833bfdfbd..1db8a7eb0d 100644
--- a/src/engine/TransitivePathBase.cpp
+++ b/src/engine/TransitivePathBase.cpp
@@ -93,7 +93,7 @@ Result::Generator TransitivePathBase::fillTableWithHullImpl(
   ad_utility::Timer timer{ad_utility::Timer::Stopped};
   size_t outputRow = 0;
   IdTableStatic<OUTPUT_WIDTH> table{getResultWidth(), allocator()};
-  std::vector<LocalVocab> storedLocalVocabs;
+  LocalVocab mergedVocab{};
   for (auto& [node, linkedNodes, localVocab, idTable, inputRow] : hull) {
     timer.cont();
     // As an optimization nodes without any linked nodes should not get yielded
@@ -120,7 +120,7 @@ Result::Generator TransitivePathBase::fillTableWithHullImpl(
     }
 
     if (yieldOnce) {
-      storedLocalVocabs.emplace_back(std::move(localVocab));
+      mergedVocab.mergeWith(std::span{&localVocab, 1});
     } else {
       timer.stop();
       runtimeInfo().addDetail("IdTable fill time", timer.msecs());
@@ -132,8 +132,6 @@ Result::Generator TransitivePathBase::fillTableWithHullImpl(
   }
   if (yieldOnce) {
     timer.start();
-    LocalVocab mergedVocab{};
-    mergedVocab.mergeWith(storedLocalVocabs);
     runtimeInfo().addDetail("IdTable fill time", timer.msecs());
     co_yield {std::move(table).toDynamic(), std::move(mergedVocab)};
   }
diff --git a/src/engine/TransitivePathImpl.h b/src/engine/TransitivePathImpl.h
index 407b63a298..3e15141114 100644
--- a/src/engine/TransitivePathImpl.h
+++ b/src/engine/TransitivePathImpl.h
@@ -82,7 +82,8 @@ class TransitivePathImpl : public TransitivePathBase {
         transitiveHull(edges, sub->getCopyOfLocalVocab(), std::move(nodes),
                        targetSide.isVariable()
                            ? std::nullopt
-                           : std::optional{std::get<Id>(targetSide.value_)});
+                           : std::optional{std::get<Id>(targetSide.value_)},
+                       yieldOnce);
 
     auto result = fillTableWithHull(
         std::move(hull), startSide.outputCol_, targetSide.outputCol_,
@@ -131,7 +132,8 @@ class TransitivePathImpl : public TransitivePathBase {
         edges, sub->getCopyOfLocalVocab(), std::span{&tableInfo, 1},
         targetSide.isVariable()
             ? std::nullopt
-            : std::optional{std::get<Id>(targetSide.value_)});
+            : std::optional{std::get<Id>(targetSide.value_)},
+        yieldOnce);
 
     auto result = fillTableWithHull(std::move(hull), startSide.outputCol_,
                                     targetSide.outputCol_, yieldOnce);
@@ -240,11 +242,15 @@ class TransitivePathImpl : public TransitivePathBase {
    * `TableColumnWithVocab` that can be consumed to create a transitive hull.
    * @param target Optional target Id. If supplied, only paths which end
    * in this Id are added to the hull.
+   * @param yieldOnce This has to be set to the same value as the consuming
+   * code. When set to true, this will prevent yielding the same LocalVocab over
+   * and over again to make merging faster (because merging with an empty
+   * LocalVocab is a no-op).
    * @return Map Maps each Id to its connected Ids in the transitive hull
    */
   NodeGenerator transitiveHull(const T& edges, LocalVocab edgesVocab,
                                std::ranges::range auto startNodes,
-                               std::optional<Id> target) const {
+                               std::optional<Id> target, bool yieldOnce) const {
     ad_utility::Timer timer{ad_utility::Timer::Stopped};
     for (auto&& tableColumn : startNodes) {
       timer.cont();
@@ -260,6 +266,10 @@ class TransitivePathImpl : public TransitivePathBase {
                                    mergedVocab.clone(), tableColumn.table_,
                                    currentRow};
           timer.cont();
+          // Reset vocab to prevent merging the same vocab over and over again.
+          if (yieldOnce) {
+            mergedVocab = LocalVocab{};
+          }
         }
         currentRow++;
       }

From 774ea834f5bb496eb96a0120ac8a2062cd6318d9 Mon Sep 17 00:00:00 2001
From: Hannah Bast <bast@informatik.uni-freiburg.de>
Date: Wed, 20 Nov 2024 10:50:51 +0100
Subject: [PATCH 3/4] Improve `LocalVocab` comments and code (#1626)

Major revision of comments, many of which were completely outdated. Also improve variable names and make some minor changes to the code. In particular, the the methods `size()` and `empty()` now run in constant time.
---
 src/engine/LocalVocab.cpp      |  38 +++++------
 src/engine/LocalVocab.h        | 120 ++++++++++++++++++++-------------
 src/index/LocalVocabEntry.h    |   2 +-
 src/util/TransparentFunctors.h |  91 ++++++++++++++-----------
 4 files changed, 142 insertions(+), 109 deletions(-)

diff --git a/src/engine/LocalVocab.cpp b/src/engine/LocalVocab.cpp
index 80c97de87a..240780261a 100644
--- a/src/engine/LocalVocab.cpp
+++ b/src/engine/LocalVocab.cpp
@@ -1,35 +1,35 @@
-// Copyright 2022, University of Freiburg
+// Copyright 2022 - 2024, University of Freiburg
 // Chair of Algorithms and Data Structures
-// Author: Hannah Bast <bast@cs.uni-freiburg.de>
+// Authors: Hannah Bast <bast@cs.uni-freiburg.de>
+//          Johannes Kalmbach <kalmbach@cs.uni-freiburg.de>
 
 #include "engine/LocalVocab.h"
 
 #include "absl/strings/str_cat.h"
 #include "global/Id.h"
 #include "global/ValueId.h"
+#include "util/TransparentFunctors.h"
 
 // _____________________________________________________________________________
 LocalVocab LocalVocab::clone() const {
-  LocalVocab clone;
-  clone.mergeWith(std::span{this, 1});
-  return clone;
+  LocalVocab result;
+  result.mergeWith(std::span{this, 1});
+  AD_CORRECTNESS_CHECK(result.size_ == size_);
+  return result;
 }
 
 // _____________________________________________________________________________
 LocalVocab LocalVocab::merge(std::span<const LocalVocab*> vocabs) {
-  LocalVocab res;
-  res.mergeWith(vocabs |
-                std::views::transform(
-                    [](const LocalVocab* localVocab) -> const LocalVocab& {
-                      return *localVocab;
-                    }));
-  return res;
+  LocalVocab result;
+  result.mergeWith(vocabs | std::views::transform(ad_utility::dereference));
+  return result;
 }
 
 // _____________________________________________________________________________
 template <typename WordT>
 LocalVocabIndex LocalVocab::getIndexAndAddIfNotContainedImpl(WordT&& word) {
   auto [wordIterator, isNewWord] = primaryWordSet().insert(AD_FWD(word));
+  size_ += static_cast<size_t>(isNewWord);
   // TODO<Libc++18> Use std::to_address (more idiomatic, but currently breaks
   // the MacOS build.
   return &(*wordIterator);
@@ -37,18 +37,19 @@ LocalVocabIndex LocalVocab::getIndexAndAddIfNotContainedImpl(WordT&& word) {
 
 // _____________________________________________________________________________
 LocalVocabIndex LocalVocab::getIndexAndAddIfNotContained(
-    const LiteralOrIri& word) {
+    const LocalVocabEntry& word) {
   return getIndexAndAddIfNotContainedImpl(word);
 }
 
 // _____________________________________________________________________________
-LocalVocabIndex LocalVocab::getIndexAndAddIfNotContained(LiteralOrIri&& word) {
+LocalVocabIndex LocalVocab::getIndexAndAddIfNotContained(
+    LocalVocabEntry&& word) {
   return getIndexAndAddIfNotContainedImpl(std::move(word));
 }
 
 // _____________________________________________________________________________
 std::optional<LocalVocabIndex> LocalVocab::getIndexOrNullopt(
-    const LiteralOrIri& word) const {
+    const LocalVocabEntry& word) const {
   auto localVocabIndex = primaryWordSet().find(word);
   if (localVocabIndex != primaryWordSet().end()) {
     // TODO<Libc++18> Use std::to_address (more idiomatic, but currently breaks
@@ -60,15 +61,14 @@ std::optional<LocalVocabIndex> LocalVocab::getIndexOrNullopt(
 }
 
 // _____________________________________________________________________________
-const LocalVocab::LiteralOrIri& LocalVocab::getWord(
+const LocalVocabEntry& LocalVocab::getWord(
     LocalVocabIndex localVocabIndex) const {
   return *localVocabIndex;
 }
 
 // _____________________________________________________________________________
-std::vector<LocalVocab::LiteralOrIri> LocalVocab::getAllWordsForTesting()
-    const {
-  std::vector<LiteralOrIri> result;
+std::vector<LocalVocabEntry> LocalVocab::getAllWordsForTesting() const {
+  std::vector<LocalVocabEntry> result;
   std::ranges::copy(primaryWordSet(), std::back_inserter(result));
   for (const auto& previous : otherWordSets_) {
     std::ranges::copy(*previous, std::back_inserter(result));
diff --git a/src/engine/LocalVocab.h b/src/engine/LocalVocab.h
index ff30b824f1..72745746b9 100644
--- a/src/engine/LocalVocab.h
+++ b/src/engine/LocalVocab.h
@@ -1,6 +1,7 @@
-// Copyright 2022, University of Freiburg
+// Copyright 2022 - 2024, University of Freiburg
 // Chair of Algorithms and Data Structures
-// Author: Hannah Bast <bast@cs.uni-freiburg.de>
+// Authors: Hannah Bast <bast@cs.uni-freiburg.de>
+//          Johannes Kalmbach <kalmbach@cs.uni-freiburg.de>
 
 #pragma once
 
@@ -14,31 +15,39 @@
 #include "global/Id.h"
 #include "parser/LiteralOrIri.h"
 #include "util/BlankNodeManager.h"
+#include "util/Exception.h"
 
-// A class for maintaining a local vocabulary with contiguous (local) IDs. This
-// is meant for words that are not part of the normal vocabulary (constructed
-// from the input data at indexing time).
+// A class for maintaining a local vocabulary, which conceptually is a set of
+// `LiteralOrIri`s that are not part of the original vocabulary (which stems
+// from the input data). The implementation is subtle and quite clever:
 //
-
+// The entries of the local vocabulary are `LocalVocabEntry`s, each of which
+// holds a `LiteralOrIri` and remembers its position in the original vocabulary
+// after it has been computed once.
+//
+// A `LocalVocab` has a primary set of `LocalVocabEntry`s, which can grow
+// dynamically, and a collection of other sets of `LocalVocabEntry`s, which
+// cannot be modified by this class. A `LocalVocabEntry` lives exactly as long
+// as it is contained in at least one of the (primary or other) sets of a
+// `LocalVocab`.
 class LocalVocab {
  private:
-  using Entry = LocalVocabEntry;
-  using LiteralOrIri = LocalVocabEntry;
-  // A map of the words in the local vocabulary to their local IDs. This is a
-  // node hash map because we need the addresses of the words (which are of type
-  // `LiteralOrIri`) to remain stable over their lifetime in the hash map
-  // because we hand out pointers to them.
-  using Set = absl::node_hash_set<LiteralOrIri>;
+  // The primary set of `LocalVocabEntry`s, which can grow dynamically.
+  //
+  // NOTE: This is a `absl::node_hash_set` because we hand out pointers to
+  // the `LocalVocabEntry`s and it is hence essential that their addresses
+  // remain stable over their lifetime in the hash set.
+  using Set = absl::node_hash_set<LocalVocabEntry>;
   std::shared_ptr<Set> primaryWordSet_ = std::make_shared<Set>();
 
-  // Local vocabularies from child operations that were merged into this
-  // vocabulary s.t. the pointers are kept alive. They have to be `const`
-  // because they are possibly shared concurrently (for example via the cache).
+  // The other sets of `LocalVocabEntry`s, which are static.
   std::vector<std::shared_ptr<const Set>> otherWordSets_;
 
-  auto& primaryWordSet() { return *primaryWordSet_; }
-  const auto& primaryWordSet() const { return *primaryWordSet_; }
+  // The number of words (so that we can compute `size()` in constant time).
+  size_t size_ = 0;
 
+  // Each `LocalVocab` has its own `LocalBlankNodeManager` to generate blank
+  // nodes when needed (e.g., when parsing the result of a SERVICE query).
   std::optional<ad_utility::BlankNodeManager::LocalBlankNodeManager>
       localBlankNodeManager_;
 
@@ -50,49 +59,54 @@ class LocalVocab {
   LocalVocab(const LocalVocab&) = delete;
   LocalVocab& operator=(const LocalVocab&) = delete;
 
-  // Make a logical copy. The clone will have an empty primary set so it can
-  // safely be modified. The contents are copied as shared pointers to const, so
-  // the function runs in linear time in the number of word sets.
+  // Make a logical copy, where all sets of `LocalVocabEntry`s become "other"
+  // sets, that is, they cannot be modified by the copy. The primary set becomes
+  // empty. This only copies shared pointers and takes time linear in the number
+  // of sets.
   LocalVocab clone() const;
 
   // Moving a local vocabulary is not problematic (though the typical use case
-  // in our code is to copy shared pointers to local vocabularies).
+  // in our code is to copy shared pointers from one `LocalVocab` to another).
   LocalVocab(LocalVocab&&) = default;
   LocalVocab& operator=(LocalVocab&&) = default;
 
-  // Get the index of a word in the local vocabulary. If the word was already
-  // contained, return the already existing index. If the word was not yet
-  // contained, add it, and return the new index.
-  LocalVocabIndex getIndexAndAddIfNotContained(const LiteralOrIri& word);
-  LocalVocabIndex getIndexAndAddIfNotContained(LiteralOrIri&& word);
+  // For a given `LocalVocabEntry`, return the corresponding `LocalVocabIndex`
+  // (which is just the address of the `LocalVocabEntry`). If the
+  // `LocalVocabEntry` is not contained in any of the sets, add it to the
+  // primary.
+  LocalVocabIndex getIndexAndAddIfNotContained(const LocalVocabEntry& word);
+  LocalVocabIndex getIndexAndAddIfNotContained(LocalVocabEntry&& word);
 
-  // Get the index of a word in the local vocabulary, or std::nullopt if it is
-  // not contained. This is useful for testing.
+  // Like `getIndexAndAddIfNotContained`, but if the `LocalVocabEntry` is not
+  // contained in any of the sets, do not add it and return `std::nullopt`.
   std::optional<LocalVocabIndex> getIndexOrNullopt(
-      const LiteralOrIri& word) const;
+      const LocalVocabEntry& word) const;
 
-  // The number of words in the vocabulary.
-  // Note: This is not constant time, but linear in the number of word sets.
+  // The number of words in this local vocabulary.
   size_t size() const {
-    auto result = primaryWordSet().size();
-    for (const auto& previous : otherWordSets_) {
-      result += previous->size();
+    if constexpr (ad_utility::areExpensiveChecksEnabled) {
+      auto size = primaryWordSet().size();
+      for (const auto& previous : otherWordSets_) {
+        size += previous->size();
+      }
+      AD_CORRECTNESS_CHECK(size == size_);
     }
-    return result;
+    return size_;
   }
 
   // Return true if and only if the local vocabulary is empty.
   bool empty() const { return size() == 0; }
 
-  // Return a const reference to the word.
-  const LiteralOrIri& getWord(LocalVocabIndex localVocabIndex) const;
-
-  // Create a local vocab that contains and keeps alive all the words from each
-  // of the `vocabs`. The primary word set of the newly created vocab is empty.
-  static LocalVocab merge(std::span<const LocalVocab*> vocabs);
+  // Get the `LocalVocabEntry` corresponding to the given `LocalVocabIndex`.
+  //
+  // NOTE: This used to be a more complex function but is now a simple
+  // dereference. It could be thrown out in the future.
+  const LocalVocabEntry& getWord(LocalVocabIndex localVocabIndex) const;
 
-  // Merge all passed local vocabs to keep alive all the words from each of the
-  // `vocabs`.
+  // Add all sets (primary and other) of the given local vocabs as other sets
+  // to this local vocab. The purpose is to keep all the contained
+  // `LocalVocabEntry`s alive as long as this `LocalVocab` is alive. The
+  // primary set of this `LocalVocab` remains unchanged.
   template <std::ranges::range R>
   void mergeWith(const R& vocabs) {
     auto inserter = std::back_inserter(otherWordSets_);
@@ -100,11 +114,17 @@ class LocalVocab {
     for (const auto& vocab : vocabs | filter(std::not_fn(&LocalVocab::empty))) {
       std::ranges::copy(vocab.otherWordSets_, inserter);
       *inserter = vocab.primaryWordSet_;
+      size_ += vocab.size_;
     }
   }
 
-  // Return all the words from all the word sets as a vector.
-  std::vector<LiteralOrIri> getAllWordsForTesting() const;
+  // Create a new local vocab with empty set and other sets that are the union
+  // of all sets (primary and other) of the given local vocabs.
+  static LocalVocab merge(std::span<const LocalVocab*> vocabs);
+
+  // Return all the words from all the word sets as a vector. This is useful
+  // for testing.
+  std::vector<LocalVocabEntry> getAllWordsForTesting() const;
 
   // Get a new BlankNodeIndex using the LocalBlankNodeManager.
   [[nodiscard]] BlankNodeIndex getBlankNodeIndex(
@@ -115,8 +135,12 @@ class LocalVocab {
   bool isBlankNodeIndexContained(BlankNodeIndex blankNodeIndex) const;
 
  private:
-  // Common implementation for the two variants of
-  // `getIndexAndAddIfNotContainedImpl` above.
+  // Accessors for the primary set.
+  Set& primaryWordSet() { return *primaryWordSet_; }
+  const Set& primaryWordSet() const { return *primaryWordSet_; }
+
+  // Common implementation for the two methods `getIndexAndAddIfNotContained`
+  // and `getIndexOrNullopt` above.
   template <typename WordT>
   LocalVocabIndex getIndexAndAddIfNotContainedImpl(WordT&& word);
 };
diff --git a/src/index/LocalVocabEntry.h b/src/index/LocalVocabEntry.h
index 545d8a8350..e591ad64ff 100644
--- a/src/index/LocalVocabEntry.h
+++ b/src/index/LocalVocabEntry.h
@@ -27,7 +27,7 @@ class alignas(16) LocalVocabEntry
   // the first *larger* word in the vocabulary. Note: we store the cache as
   // three separate atomics to avoid mutexes. The downside is, that in parallel
   // code multiple threads might look up the position concurrently, which wastes
-  // a bit of resources. We however don't consider this case to be likely.
+  // a bit of resources. However, we don't consider this case to be likely.
   mutable ad_utility::CopyableAtomic<VocabIndex> lowerBoundInVocab_;
   mutable ad_utility::CopyableAtomic<VocabIndex> upperBoundInVocab_;
   mutable ad_utility::CopyableAtomic<bool> positionInVocabKnown_ = false;
diff --git a/src/util/TransparentFunctors.h b/src/util/TransparentFunctors.h
index 6e2bd9fca3..1b889a0796 100644
--- a/src/util/TransparentFunctors.h
+++ b/src/util/TransparentFunctors.h
@@ -1,25 +1,23 @@
-//  Copyright 2022, University of Freiburg,
-//  Chair of Algorithms and Data Structures.
-//  Author:
-//   2022 -    Johannes Kalmbach <kalmbach@cs.uni-freiburg.de>
+// Copyright 2022 - 2024, University of Freiburg
+// Chair of Algorithms and Data Structures
+// Author: Johannes Kalmbach <kalmbach@cs.uni-freiburg.de>
 
-#ifndef QLEVER_TRANSPARENTFUNCTORS_H
-#define QLEVER_TRANSPARENTFUNCTORS_H
+#pragma once
 
 #include <util/Forward.h>
 #include <util/TypeTraits.h>
 
 #include <utility>
 
-/// Contains several function object types with templated operator() that wrap
-/// overloaded functions from the standard library. This enables passing them as
-/// function parameters.
-
-/// Note that in theory all of them could be implemented shorter as captureless
-/// lambda expressions. We have chosen not to do this because the STL also does
-/// not choose this approach (see e.g. `std::less`, `std::plus`, etc.) and
-/// because global inline lambdas in header files might in theory cause ODR (one
-/// definition rule) problems, especially  when using different compilers.
+// Contains several function object types with templated operator() that wrap
+// overloaded functions from the standard library. This enables passing them as
+// function parameters.
+//
+// NOTE: in theory all of them could be implemented shorter as captureless
+// lambda expressions. We have chosen not to do this because the STL also does
+// not choose this approach (see e.g. `std::less`, `std::plus`, etc.) and
+// because global inline lambdas in header files might in theory cause ODR (one
+// definition rule) problems, especially  when using different compilers.
 
 namespace ad_utility {
 
@@ -79,37 +77,60 @@ struct ToBoolImpl {
   }
 };
 
+// Implementation of `staticCast` (see below).
+template <typename T>
+struct StaticCastImpl {
+  constexpr decltype(auto) operator()(auto&& x) const {
+    return static_cast<T>(AD_FWD(x));
+  }
+};
+
+// Implementation of `dereference` (see below).
+struct DereferenceImpl {
+  constexpr decltype(auto) operator()(auto&& x) const { return *AD_FWD(x); }
+};
+
 }  // namespace detail
 
-/// Return the first element via perfect forwarding of any type for which
-/// `std::get<0>(x)` is valid. This holds e.g. for `std::pair`, `std::tuple`,
-/// and `std::array`.
+// Return the first element via perfect forwarding of any type for which
+// `std::get<0>(x)` is valid. This holds e.g. for `std::pair`, `std::tuple`,
+// and `std::array`.
 static constexpr detail::FirstImpl first;
 
-/// Return the second element via perfect forwarding of any type for which
-/// `std::get<1>(x)` is valid. This holds e.g. for `std::pair`, `std::tuple`,
-/// and `std::array`.
+// Return the second element via perfect forwarding of any type for which
+// `std::get<1>(x)` is valid. This holds e.g. for `std::pair`, `std::tuple`,
+// and `std::array`.
 static constexpr detail::SecondImpl second;
 
-/// Transparent functor for `std::holds_alternative`
+// Transparent functor for `std::holds_alternative`
 template <typename T>
 static constexpr detail::HoldsAlternativeImpl<T> holdsAlternative;
 
-/// Transparent functor for `std::get`. Currently only works for `std::variant`
-/// and not for `std::array` or `std::tuple`.
+// Transparent functor for `std::get`. Currently only works for `std::variant`
+// and not for `std::array` or `std::tuple`.
 template <typename T>
 static constexpr detail::GetImpl<T> get;
 
-/// Transparent functor for `std::get_if`. As an extension to `std::get_if`,
-/// `ad_utility::getIf` may also be called with a `variant` object or reference,
-/// not only with a pointer.
+// Transparent functor for `std::get_if`. As an extension to `std::get_if`,
+// `ad_utility::getIf` may also be called with a `variant` object or reference,
+// not only with a pointer.
 template <typename T>
 static constexpr detail::GetIfImpl<T> getIf;
 
+// Transparent functor that converts any type to `bool` via
+// `static_cast<bool>`.
 static constexpr detail::ToBoolImpl toBool;
 
-/// A functor that takes an arbitrary number of arguments by reference and does
-/// nothing.
+// Transparent functor that casts any type to `T` via `static_cast<T>`.
+template <typename T>
+static constexpr detail::StaticCastImpl<T> staticCast{};
+
+// Transparent functor that dereferences a pointer or smart pointer.
+static constexpr detail::DereferenceImpl dereference;
+
+// Transparent functor that takes an arbitrary number of arguments by reference
+// and does nothing. We also use the type `Noop`, hence it is defined here and
+// not in the `detail` namespace above.
 struct Noop {
   void operator()(const auto&...) const {
     // This function deliberately does nothing (static analysis expects a
@@ -118,16 +139,4 @@ struct Noop {
 };
 [[maybe_unused]] static constexpr Noop noop{};
 
-template <typename T>
-struct StaticCast {
-  constexpr decltype(auto) operator()(auto&& x) const {
-    return static_cast<T>(AD_FWD(x));
-  }
-};
-
-template <typename T>
-static constexpr StaticCast<T> staticCast{};
-
 }  // namespace ad_utility
-
-#endif  // QLEVER_TRANSPARENTFUNCTORS_H

From d53d4f9fd91fd03463382e2b6f476d4ee345d6d9 Mon Sep 17 00:00:00 2001
From: unex <63149623+UNEXENU@users.noreply.github.com>
Date: Thu, 21 Nov 2024 10:45:10 +0100
Subject: [PATCH 4/4] Also merge the `LocalBlankNodeManager`s when a
 `LocalVocab` is merged. (#1617)

This resolves a bug that was introduced in #1504, where the `LocalBlankNodeManager` of a `LocalVocab` was not accounted for in the merge functions of the `LocalVocab`.
---
 src/engine/LocalVocab.cpp     |  4 +++-
 src/engine/LocalVocab.h       | 24 ++++++++++++++++++++-
 src/util/BlankNodeManager.cpp | 30 +++++++++++++--------------
 src/util/BlankNodeManager.h   | 39 +++++++++++++++++++++++++++++++----
 test/BlankNodeManagerTest.cpp | 30 +++++++++++++++++----------
 test/LocalVocabTest.cpp       | 32 ++++++++++++++++++++++++++++
 6 files changed, 127 insertions(+), 32 deletions(-)

diff --git a/src/engine/LocalVocab.cpp b/src/engine/LocalVocab.cpp
index 240780261a..2170d20d5d 100644
--- a/src/engine/LocalVocab.cpp
+++ b/src/engine/LocalVocab.cpp
@@ -82,7 +82,9 @@ BlankNodeIndex LocalVocab::getBlankNodeIndex(
   AD_CONTRACT_CHECK(blankNodeManager);
   // Initialize the `localBlankNodeManager_` if it doesn't exist yet.
   if (!localBlankNodeManager_) [[unlikely]] {
-    localBlankNodeManager_.emplace(blankNodeManager);
+    localBlankNodeManager_ =
+        std::make_shared<ad_utility::BlankNodeManager::LocalBlankNodeManager>(
+            blankNodeManager);
   }
   return BlankNodeIndex::make(localBlankNodeManager_->getId());
 }
diff --git a/src/engine/LocalVocab.h b/src/engine/LocalVocab.h
index 72745746b9..f61982400d 100644
--- a/src/engine/LocalVocab.h
+++ b/src/engine/LocalVocab.h
@@ -5,8 +5,10 @@
 
 #pragma once
 
+#include <algorithm>
 #include <cstdlib>
 #include <memory>
+#include <ranges>
 #include <span>
 #include <string>
 #include <vector>
@@ -48,7 +50,7 @@ class LocalVocab {
 
   // Each `LocalVocab` has its own `LocalBlankNodeManager` to generate blank
   // nodes when needed (e.g., when parsing the result of a SERVICE query).
-  std::optional<ad_utility::BlankNodeManager::LocalBlankNodeManager>
+  std::shared_ptr<ad_utility::BlankNodeManager::LocalBlankNodeManager>
       localBlankNodeManager_;
 
  public:
@@ -116,6 +118,26 @@ class LocalVocab {
       *inserter = vocab.primaryWordSet_;
       size_ += vocab.size_;
     }
+
+    // Also merge the `vocabs` `LocalBlankNodeManager`s, if they exist.
+    using LocalBlankNodeManager =
+        ad_utility::BlankNodeManager::LocalBlankNodeManager;
+    auto localManagersView =
+        vocabs |
+        std::views::transform([](const LocalVocab& vocab) -> const auto& {
+          return vocab.localBlankNodeManager_;
+        });
+
+    auto it = std::ranges::find_if(localManagersView,
+                                   [](const auto& l) { return l != nullptr; });
+    if (it == localManagersView.end()) {
+      return;
+    }
+    if (!localBlankNodeManager_) {
+      localBlankNodeManager_ =
+          std::make_shared<LocalBlankNodeManager>((*it)->blankNodeManager());
+    }
+    localBlankNodeManager_->mergeWith(localManagersView);
   }
 
   // Create a new local vocab with empty set and other sets that are the union
diff --git a/src/util/BlankNodeManager.cpp b/src/util/BlankNodeManager.cpp
index 6b367118d5..44295b3aeb 100644
--- a/src/util/BlankNodeManager.cpp
+++ b/src/util/BlankNodeManager.cpp
@@ -4,6 +4,8 @@
 
 #include "util/BlankNodeManager.h"
 
+#include "util/Exception.h"
+
 namespace ad_utility {
 
 // _____________________________________________________________________________
@@ -41,30 +43,28 @@ BlankNodeManager::LocalBlankNodeManager::LocalBlankNodeManager(
     BlankNodeManager* blankNodeManager)
     : blankNodeManager_(blankNodeManager) {}
 
-// _____________________________________________________________________________
-BlankNodeManager::LocalBlankNodeManager::~LocalBlankNodeManager() {
-  auto ptr = blankNodeManager_->usedBlocksSet_.wlock();
-  for (const auto& block : blocks_) {
-    AD_CONTRACT_CHECK(ptr->contains(block.blockIdx_));
-    ptr->erase(block.blockIdx_);
-  }
-}
-
 // _____________________________________________________________________________
 uint64_t BlankNodeManager::LocalBlankNodeManager::getId() {
-  if (blocks_.empty() || blocks_.back().nextIdx_ == idxAfterCurrentBlock_) {
-    blocks_.emplace_back(blankNodeManager_->allocateBlock());
-    idxAfterCurrentBlock_ = blocks_.back().nextIdx_ + blockSize_;
+  if (blocks_->empty() || blocks_->back().nextIdx_ == idxAfterCurrentBlock_) {
+    blocks_->emplace_back(blankNodeManager_->allocateBlock());
+    idxAfterCurrentBlock_ = blocks_->back().nextIdx_ + blockSize_;
   }
-  return blocks_.back().nextIdx_++;
+  return blocks_->back().nextIdx_++;
 }
 
 // _____________________________________________________________________________
 bool BlankNodeManager::LocalBlankNodeManager::containsBlankNodeIndex(
     uint64_t index) const {
-  return std::ranges::any_of(blocks_, [index](const Block& block) {
+  auto containsIndex = [index](const Block& block) {
     return index >= block.startIdx_ && index < block.nextIdx_;
-  });
+  };
+
+  return std::ranges::any_of(*blocks_, containsIndex) ||
+         std::ranges::any_of(
+             otherBlocks_,
+             [&](const std::shared_ptr<const std::vector<Block>>& blocks) {
+               return std::ranges::any_of(*blocks, containsIndex);
+             });
 }
 
 }  // namespace ad_utility
diff --git a/src/util/BlankNodeManager.h b/src/util/BlankNodeManager.h
index 7fd5416294..afdc748281 100644
--- a/src/util/BlankNodeManager.h
+++ b/src/util/BlankNodeManager.h
@@ -58,6 +58,7 @@ class BlankNodeManager {
 
    public:
     ~Block() = default;
+
     // The index of this block.
     const uint64_t blockIdx_;
 
@@ -71,7 +72,7 @@ class BlankNodeManager {
   class LocalBlankNodeManager {
    public:
     explicit LocalBlankNodeManager(BlankNodeManager* blankNodeManager);
-    ~LocalBlankNodeManager();
+    ~LocalBlankNodeManager() = default;
 
     // No copy, as the managed blocks should not be duplicated.
     LocalBlankNodeManager(const LocalBlankNodeManager&) = delete;
@@ -87,16 +88,46 @@ class BlankNodeManager {
     // Return true iff the `index` was returned by a previous call to `getId()`.
     bool containsBlankNodeIndex(uint64_t index) const;
 
-   private:
-    // Reserved blocks.
-    std::vector<BlankNodeManager::Block> blocks_;
+    // Merge passed `LocalBlankNodeManager`s to keep alive their reserved
+    // BlankNodeIndex blocks.
+    template <std::ranges::range R>
+    void mergeWith(const R& localBlankNodeManagers) {
+      auto inserter = std::back_inserter(otherBlocks_);
+      for (const auto& l : localBlankNodeManagers) {
+        if (l == nullptr) {
+          continue;
+        }
+        std::ranges::copy(l->otherBlocks_, inserter);
+        *inserter = l->blocks_;
+      }
+    }
+
+    // Getter for the `blankNodeManager_` pointer required in
+    // `LocalVocab::mergeWith`.
+    BlankNodeManager* blankNodeManager() const { return blankNodeManager_; }
 
+   private:
     // Reference to the BlankNodeManager, used to free the reserved blocks.
     BlankNodeManager* blankNodeManager_;
 
+    // Reserved blocks.
+    using Blocks = std::vector<BlankNodeManager::Block>;
+    std::shared_ptr<Blocks> blocks_{
+        new Blocks(), [blankNodeManager = blankNodeManager()](auto blocksPtr) {
+          auto ptr = blankNodeManager->usedBlocksSet_.wlock();
+          for (const auto& block : *blocksPtr) {
+            AD_CONTRACT_CHECK(ptr->contains(block.blockIdx_));
+            ptr->erase(block.blockIdx_);
+          }
+          delete blocksPtr;
+        }};
+
     // The first index after the current Block.
     uint64_t idxAfterCurrentBlock_{0};
 
+    // Blocks merged from other `LocalBlankNodeManager`s.
+    std::vector<std::shared_ptr<const Blocks>> otherBlocks_;
+
     FRIEND_TEST(BlankNodeManager, LocalBlankNodeManagerGetID);
   };
 
diff --git a/test/BlankNodeManagerTest.cpp b/test/BlankNodeManagerTest.cpp
index 70803bd3f0..9d1969c80c 100644
--- a/test/BlankNodeManagerTest.cpp
+++ b/test/BlankNodeManagerTest.cpp
@@ -37,24 +37,32 @@ TEST(BlankNodeManager, blockAllocationAndFree) {
 // _____________________________________________________________________________
 TEST(BlankNodeManager, LocalBlankNodeManagerGetID) {
   BlankNodeManager bnm(0);
-  BlankNodeManager::LocalBlankNodeManager l(&bnm);
+  auto l = std::make_shared<BlankNodeManager::LocalBlankNodeManager>(&bnm);
 
   // initially the LocalBlankNodeManager doesn't have any blocks
-  EXPECT_EQ(l.blocks_.size(), 0);
+  EXPECT_EQ(l->blocks_->size(), 0);
 
   // A new Block is allocated, if
   // no blocks are allocated yet
-  uint64_t id = l.getId();
-  EXPECT_EQ(l.blocks_.size(), 1);
-  EXPECT_TRUE(l.containsBlankNodeIndex(id));
-  EXPECT_FALSE(l.containsBlankNodeIndex(id + 1));
-  EXPECT_FALSE(l.containsBlankNodeIndex(id - 1));
+  uint64_t id = l->getId();
+  EXPECT_EQ(l->blocks_->size(), 1);
+  EXPECT_TRUE(l->containsBlankNodeIndex(id));
+  EXPECT_FALSE(l->containsBlankNodeIndex(id + 1));
+  EXPECT_FALSE(l->containsBlankNodeIndex(id - 1));
 
   // or the ids of the last block are all used
-  l.blocks_.back().nextIdx_ = id + BlankNodeManager::blockSize_;
-  id = l.getId();
-  EXPECT_TRUE(l.containsBlankNodeIndex(id));
-  EXPECT_EQ(l.blocks_.size(), 2);
+  l->blocks_->back().nextIdx_ = id + BlankNodeManager::blockSize_;
+  id = l->getId();
+  EXPECT_TRUE(l->containsBlankNodeIndex(id));
+  EXPECT_EQ(l->blocks_->size(), 2);
+
+  // The `LocalBlankNodeManager` still works when recursively merged.
+  std::vector itSelf{l};
+  l->mergeWith(itSelf);
+
+  EXPECT_TRUE(l->containsBlankNodeIndex(id));
+  EXPECT_TRUE(l->containsBlankNodeIndex(l->getId()));
+  EXPECT_EQ(l->blocks_, l->otherBlocks_[0]);
 }
 
 // _____________________________________________________________________________
diff --git a/test/LocalVocabTest.cpp b/test/LocalVocabTest.cpp
index a9058d3a68..38728a3c92 100644
--- a/test/LocalVocabTest.cpp
+++ b/test/LocalVocabTest.cpp
@@ -134,6 +134,14 @@ TEST(LocalVocab, clone) {
   for (size_t i = 0; i < inputWords.size(); ++i) {
     EXPECT_EQ(*indices[i], inputWords[i]);
   }
+
+  // Test that a BlankNodeIndex obtained by a `LocalVocab` is also contained
+  // in the clone.
+  ad_utility::BlankNodeManager bnm;
+  LocalVocab v;
+  auto id = v.getBlankNodeIndex(&bnm);
+  LocalVocab vClone = v.clone();
+  EXPECT_TRUE(vClone.isBlankNodeIndexContained(id));
 }
 // _____________________________________________________________________________
 TEST(LocalVocab, merge) {
@@ -162,6 +170,30 @@ TEST(LocalVocab, merge) {
   EXPECT_EQ(*indices[1], lit("twoA"));
   EXPECT_EQ(*indices[2], lit("oneB"));
   EXPECT_EQ(*indices[3], lit("twoB"));
+
+  // Test that the `LocalBlankNodeManager` of vocabs is merged correctly.
+  ad_utility::BlankNodeManager bnm;
+  LocalVocab localVocabMerged2;
+  BlankNodeIndex id;
+  {
+    LocalVocab vocC, vocD;
+    id = vocC.getBlankNodeIndex(&bnm);
+    auto vocabs2 = std::vector{&std::as_const(vocC), &std::as_const(vocD)};
+    localVocabMerged2 = LocalVocab::merge(vocabs2);
+  }
+  EXPECT_TRUE(localVocabMerged2.isBlankNodeIndexContained(id));
+
+  LocalVocab vocE, vocF;
+  auto id2 = vocE.getBlankNodeIndex(&bnm);
+  auto vocabs3 =
+      std::vector{&std::as_const(localVocabMerged2), &std::as_const(vocF)};
+  vocE.mergeWith(vocabs3 | std::views::transform(
+                               [](const LocalVocab* l) -> const LocalVocab& {
+                                 return *l;
+                               }));
+  EXPECT_TRUE(vocE.isBlankNodeIndexContained(id));
+  EXPECT_TRUE(localVocabMerged2.isBlankNodeIndexContained(id));
+  EXPECT_TRUE(vocE.isBlankNodeIndexContained(id2));
 }
 
 // _____________________________________________________________________________