blob: 7ce80e8f6d535b6ee082fddcfc0abfa3a5ba3df5 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
**/
#include "query_optimizer/physical/HashJoin.hpp"
#include <string>
#include <vector>
#include "query_optimizer/OptimizerTree.hpp"
#include "query_optimizer/expressions/AttributeReference.hpp"
#include "query_optimizer/expressions/ExpressionUtil.hpp"
#include "query_optimizer/expressions/NamedExpression.hpp"
#include "query_optimizer/expressions/Predicate.hpp"
#include "query_optimizer/physical/Physical.hpp"
#include "utility/Cast.hpp"
namespace quickstep {
namespace optimizer {
namespace physical {
namespace E = ::quickstep::optimizer::expressions;
std::vector<expressions::AttributeReferencePtr> HashJoin::getReferencedAttributes() const {
std::vector<expressions::AttributeReferencePtr> referenced_attributes;
for (const expressions::NamedExpressionPtr &project_expression :
project_expressions()) {
const std::vector<expressions::AttributeReferencePtr> referenced_attributes_in_expression =
project_expression->getReferencedAttributes();
referenced_attributes.insert(referenced_attributes.end(),
referenced_attributes_in_expression.begin(),
referenced_attributes_in_expression.end());
}
referenced_attributes.insert(referenced_attributes.end(),
left_join_attributes_.begin(),
left_join_attributes_.end());
referenced_attributes.insert(referenced_attributes.end(),
right_join_attributes_.begin(),
right_join_attributes_.end());
if (residual_predicate_ != nullptr) {
const std::vector<expressions::AttributeReferencePtr> referenced_attributes_in_residual =
residual_predicate_->getReferencedAttributes();
referenced_attributes.insert(referenced_attributes.end(),
referenced_attributes_in_residual.begin(),
referenced_attributes_in_residual.end());
}
if (build_predicate_ != nullptr) {
const std::vector<expressions::AttributeReferencePtr> referenced_attributes_in_build =
build_predicate_->getReferencedAttributes();
referenced_attributes.insert(referenced_attributes.end(),
referenced_attributes_in_build.begin(),
referenced_attributes_in_build.end());
}
return referenced_attributes;
}
// Returns a HashJoin built by Create() from this node's children, join
// attributes, residual/build predicates and join type, with
// 'output_expressions' used as the project expressions.
//
// 'output_expressions' must contain as many entries as the current project
// expression list; this is verified with DCHECK_EQ.
//
// NOTE(review): unlike maybeCopyWithPrunedExpressions(), this call does not
// pass has_repartition_ or cloneOutputPartitionSchemeHeader() to Create().
// Confirm that omitting them here is intended.
PhysicalPtr HashJoin::copyWithNewProjectExpressions(
    const std::vector<E::NamedExpressionPtr> &output_expressions) const {
  DCHECK_EQ(project_expressions().size(), output_expressions.size());

  return Create(left(),
                right(),
                left_join_attributes_,
                right_join_attributes_,
                residual_predicate_,
                build_predicate_,
                output_expressions,
                join_type_);
}
// Keeps only the project expressions that are found in
// 'referenced_expressions'. If at least one expression is dropped, stores in
// '*output' a HashJoin created with the surviving expressions (all other
// fields taken from this node) and returns true. Otherwise returns false and
// leaves '*output' unmodified.
bool HashJoin::maybeCopyWithPrunedExpressions(
    const expressions::UnorderedNamedExpressionSet &referenced_expressions,
    PhysicalPtr *output) const {
  const std::vector<expressions::NamedExpressionPtr> &existing_expressions =
      project_expressions();

  // Retain the referenced expressions, preserving their original order.
  std::vector<expressions::NamedExpressionPtr> kept_expressions;
  for (const expressions::NamedExpressionPtr &candidate : existing_expressions) {
    const bool is_referenced =
        referenced_expressions.find(candidate) != referenced_expressions.end();
    if (is_referenced) {
      kept_expressions.emplace_back(candidate);
    }
  }

  // Nothing was pruned, so no new node is needed.
  if (kept_expressions.size() == existing_expressions.size()) {
    return false;
  }

  *output = Create(left(),
                   right(),
                   left_join_attributes_,
                   right_join_attributes_,
                   residual_predicate_,
                   build_predicate_,
                   kept_expressions,
                   join_type_,
                   has_repartition_,
                   cloneOutputPartitionSchemeHeader());
  return true;
}
void HashJoin::getFieldStringItems(
std::vector<std::string> *inline_field_names,
std::vector<std::string> *inline_field_values,
std::vector<std::string> *non_container_child_field_names,
std::vector<OptimizerTreeBaseNodePtr> *non_container_child_fields,
std::vector<std::string> *container_child_field_names,
std::vector<std::vector<OptimizerTreeBaseNodePtr>> *container_child_fields) const {
BinaryJoin::getFieldStringItems(inline_field_names,
inline_field_values,
non_container_child_field_names,
non_container_child_fields,
container_child_field_names,
container_child_fields);
if (residual_predicate_ != nullptr) {
non_container_child_field_names->push_back("residual_predicate");
non_container_child_fields->push_back(residual_predicate_);
}
if (build_predicate_ != nullptr) {
non_container_child_field_names->push_back("build_predicate");
non_container_child_fields->push_back(build_predicate_);
}
container_child_field_names->push_back("left_join_attributes");
container_child_fields->push_back(CastSharedPtrVector<OptimizerTreeBase>(left_join_attributes_));
container_child_field_names->push_back("right_join_attributes");
container_child_fields->push_back(CastSharedPtrVector<OptimizerTreeBase>(right_join_attributes_));
}
} // namespace physical
} // namespace optimizer
} // namespace quickstep