Skip to content

Commit

Permalink
feat(fuzzer): Update "tryFlipJoinSides" functions to handle multi-joi…
Browse files Browse the repository at this point in the history
…ns (#11938)

Summary:
Pull Request resolved: #11938

The function should traverse the plan tree and recursively flip the sides of all join nodes that are eligible to be flipped. This is in preparation to make the Join Fuzzer produce plans with multiple joins. Flipping join sides help make alternate plans that should be logically equivalent.

Reviewed By: kgpai

Differential Revision: D67606686

fbshipit-source-id: 6ef6f351d99ba99805caacf47ed600524dd1f23d
  • Loading branch information
Daniel Hunte authored and facebook-github-bot committed Jan 24, 2025
1 parent 276c1db commit 9002fc9
Showing 1 changed file with 60 additions and 17 deletions.
77 changes: 60 additions & 17 deletions velox/exec/fuzzer/JoinFuzzer.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -110,6 +110,12 @@ class JoinFuzzer {
numGroups(_numGroups) {}
};

static core::PlanNodePtr tryFlipJoinSides(const core::HashJoinNode& joinNode);
static core::PlanNodePtr tryFlipJoinSides(
const core::MergeJoinNode& joinNode);
static core::PlanNodePtr tryFlipJoinSides(
const core::NestedLoopJoinNode& joinNode);

private:
static VectorFuzzer::Options getFuzzerOptions() {
VectorFuzzer::Options opts;
Expand All @@ -135,6 +141,10 @@ class JoinFuzzer {
// Randomly pick a join type to test.
core::JoinType pickJoinType();

template <typename TNode>
static std::pair<core::PlanNodePtr, core::PlanNodePtr> tryFlipJoinSidesHelper(
const TNode& joinNode);

// Makes the query plan with default settings in JoinFuzzer and value inputs
// for both probe and build sides.
//
Expand Down Expand Up @@ -605,67 +615,100 @@ std::optional<core::JoinType> tryFlipJoinType(core::JoinType joinType) {
}
}

template <typename TNode>
std::pair<core::PlanNodePtr, core::PlanNodePtr>
JoinFuzzer::tryFlipJoinSidesHelper(const TNode& joinNode) {
core::PlanNodePtr left = joinNode.sources()[0];
core::PlanNodePtr right = joinNode.sources()[1];
if (auto leftJoinInput =
std::dynamic_pointer_cast<const TNode>(joinNode.sources()[0])) {
left = JoinFuzzer::tryFlipJoinSides(*leftJoinInput);
}
if (auto rightJoinInput =
std::dynamic_pointer_cast<const TNode>(joinNode.sources()[1])) {
right = JoinFuzzer::tryFlipJoinSides(*rightJoinInput);
}
return make_pair(left, right);
}

// Returns a plan with flipped join sides of the input hash join node. If the
// join type doesn't allow flipping, returns a nullptr.
core::PlanNodePtr tryFlipJoinSides(const core::HashJoinNode& joinNode) {
// inputs of the join node are other hash join nodes, recursively flip the join
// sides of those join nodes as well. If the join type doesn't allow flipping,
// returns a nullptr.
core::PlanNodePtr JoinFuzzer::tryFlipJoinSides(
const core::HashJoinNode& joinNode) {
// Null-aware right semi project join doesn't support filter.
if (joinNode.filter() &&
joinNode.joinType() == core::JoinType::kLeftSemiProject &&
joinNode.isNullAware()) {
return nullptr;
}

auto flippedJoinType = tryFlipJoinType(joinNode.joinType());
if (!flippedJoinType.has_value()) {
if (!flippedJoinType) {
return nullptr;
}
auto [left, right] =
JoinFuzzer::tryFlipJoinSidesHelper<core::HashJoinNode>(joinNode);

return std::make_shared<core::HashJoinNode>(
joinNode.id(),
flippedJoinType.value(),
*flippedJoinType,
joinNode.isNullAware(),
joinNode.rightKeys(),
joinNode.leftKeys(),
joinNode.filter(),
joinNode.sources()[1],
joinNode.sources()[0],
right,
left,
joinNode.outputType());
}

// Returns a plan with flipped join sides of the input merge join node. If the
// inputs of the join node are other merge join nodes, recursively flip the join
// sides of those join nodes as well. If the
// join type doesn't allow flipping, returns a nullptr.
core::PlanNodePtr tryFlipJoinSides(const core::MergeJoinNode& joinNode) {
core::PlanNodePtr JoinFuzzer::tryFlipJoinSides(
const core::MergeJoinNode& joinNode) {
// Merge join only supports inner and left join, so only inner join can be
// flipped.
if (joinNode.joinType() != core::JoinType::kInner) {
return nullptr;
}
auto flippedJoinType = core::JoinType::kInner;

auto [left, right] =
JoinFuzzer::tryFlipJoinSidesHelper<core::MergeJoinNode>(joinNode);

return std::make_shared<core::MergeJoinNode>(
joinNode.id(),
flippedJoinType,
core::JoinType::kInner,
joinNode.rightKeys(),
joinNode.leftKeys(),
joinNode.filter(),
joinNode.sources()[1],
joinNode.sources()[0],
right,
left,
joinNode.outputType());
}

// Returns a plan with flipped join sides of the input nested loop join node. If
// the join type doesn't allow flipping, returns a nullptr.
core::PlanNodePtr tryFlipJoinSides(const core::NestedLoopJoinNode& joinNode) {
// the inputs of the join node are other nested loop join nodes, recursively
// flip the join sides of those join nodes as well. If the join type doesn't
// allow flipping, returns a nullptr.
core::PlanNodePtr JoinFuzzer::tryFlipJoinSides(
const core::NestedLoopJoinNode& joinNode) {
auto flippedJoinType = tryFlipJoinType(joinNode.joinType());
if (!flippedJoinType.has_value()) {
if (!flippedJoinType) {
return nullptr;
}

auto [left, right] =
JoinFuzzer::tryFlipJoinSidesHelper<core::NestedLoopJoinNode>(joinNode);

return std::make_shared<core::NestedLoopJoinNode>(
joinNode.id(),
flippedJoinType.value(),
joinNode.joinCondition(),
joinNode.sources()[1],
joinNode.sources()[0],
right,
left,
joinNode.outputType());
}

Expand Down Expand Up @@ -817,7 +860,7 @@ void addFlippedJoinPlan(
int32_t numGroups = 0) {
auto joinNode = std::dynamic_pointer_cast<const TNode>(plan);
VELOX_CHECK_NOT_NULL(joinNode);
if (auto flippedPlan = tryFlipJoinSides(*joinNode)) {
if (auto flippedPlan = JoinFuzzer::tryFlipJoinSides(*joinNode)) {
plans.push_back(JoinFuzzer::PlanWithSplits{
flippedPlan,
probeScanId,
Expand Down

0 comments on commit 9002fc9

Please sign in to comment.