Skip to content

Commit

Permalink
[Chore](inverted index) remove useless code in scan operator for norm…
Browse files Browse the repository at this point in the history
…alize compound and match predicate (apache#40232)

## Proposed changes
Remove unused code in scan operator for normalizing compound and match
predicate
  • Loading branch information
airborne12 authored Sep 2, 2024
1 parent 4c16768 commit 00f3f4c
Show file tree
Hide file tree
Showing 2 changed files with 0 additions and 254 deletions.
219 changes: 0 additions & 219 deletions be/src/pipeline/exec/scan_operator.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -967,225 +967,6 @@ Status ScanLocalState<Derived>::_normalize_noneq_binary_predicate(
return Status::OK();
}

/// Walks a COMPOUND_PRED expression and collects a value range for each of its
/// pushable leaf predicates.
///
/// For every direct child that is a BINARY_PRED, IN_PRED or MATCH_PRED and that
/// acts on a slot (as decided by `in_predicate_checker` or, failing that,
/// `eq_predicate_checker`), a copy of the slot's current range is normalized by
/// the matching `_normalize_*_compound_predicate` helper and appended to
/// `_compound_value_ranges`. Children that are themselves COMPOUND_PRED are
/// processed recursively. If `expr` is not a COMPOUND_PRED nothing happens.
///
/// @param expr                          expression to inspect
/// @param expr_ctx                      context forwarded to the helpers
/// @param pdt                           out-parameter forwarded to the helpers
/// @param _is_runtime_filter_predicate  flag recorded on every produced range
/// @param in_predicate_checker          first checker tried for slot binding
/// @param eq_predicate_checker          fallback checker for slot binding
template <typename Derived>
void ScanLocalState<Derived>::_normalize_compound_predicate(
        vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx, PushDownType* pdt,
        bool _is_runtime_filter_predicate,
        const std::function<bool(const vectorized::VExprSPtrs&,
                                 std::shared_ptr<vectorized::VSlotRef>&, vectorized::VExprSPtr&)>&
                in_predicate_checker,
        const std::function<bool(const vectorized::VExprSPtrs&,
                                 std::shared_ptr<vectorized::VSlotRef>&, vectorized::VExprSPtr&)>&
                eq_predicate_checker) {
    if (TExprNodeType::COMPOUND_PRED != expr->node_type()) {
        return;
    }

    for (const auto& child : expr->children()) {
        auto* child_expr = child.get();
        const auto child_type = child_expr->node_type();

        if (TExprNodeType::COMPOUND_PRED == child_type) {
            // Nested AND/OR/NOT: descend with the same arguments.
            _normalize_compound_predicate(child_expr, expr_ctx, pdt,
                                          _is_runtime_filter_predicate, in_predicate_checker,
                                          eq_predicate_checker);
            continue;
        }

        if (TExprNodeType::BINARY_PRED != child_type && TExprNodeType::IN_PRED != child_type &&
            TExprNodeType::MATCH_PRED != child_type) {
            continue;
        }

        SlotDescriptor* slot = nullptr;
        ColumnValueRangeType* range_on_slot = nullptr;
        if (!(_is_predicate_acting_on_slot(child_expr, in_predicate_checker, &slot,
                                           &range_on_slot) ||
              _is_predicate_acting_on_slot(child_expr, eq_predicate_checker, &slot,
                                           &range_on_slot))) {
            continue;
        }

        // copy, in order not to affect the range in the _colname_to_value_range
        ColumnValueRangeType active_range = *range_on_slot;
        std::visit(
                [&](auto& value_range) {
                    // Set the runtime-filter flag when the lambda exits, i.e. after
                    // the helper below has finished with the range.
                    Defer mark_runtime_filter_flag {[&]() {
                        value_range.mark_runtime_filter_predicate(_is_runtime_filter_predicate);
                    }};
                    // This function returns void, so the helper's Status is
                    // explicitly discarded.
                    if (TExprNodeType::BINARY_PRED == child_type) {
                        static_cast<void>(_normalize_binary_compound_predicate(
                                child_expr, expr_ctx, slot, value_range, pdt));
                    } else if (TExprNodeType::IN_PRED == child_type) {
                        static_cast<void>(_normalize_in_and_not_in_compound_predicate(
                                child_expr, expr_ctx, slot, value_range, pdt));
                    } else {
                        static_cast<void>(_normalize_match_compound_predicate(
                                child_expr, expr_ctx, slot, value_range, pdt));
                    }
                },
                active_range);

        _compound_value_ranges.emplace_back(active_range);
    }
}

/// Normalizes a binary predicate that appears inside a compound predicate.
///
/// The expression is probed three times with `_should_push_down_binary_predicate`
/// ("eq", "ne", and everything that is not "eq"/"ne"/"eq_for_null"). If none of
/// the probes accepts it the function returns without touching `range` or `pdt`.
/// If at least one probe is ACCEPTABLE, the extracted constant (when present) is
/// fed into `range` through `ColumnValueRange<T>::add_compound_value_range` and
/// `*pdt` is set to ACCEPTABLE.
///
/// @param expr      expression to normalize; ignored unless it is a BINARY_PRED
/// @param expr_ctx  context forwarded to the push-down probes
/// @param slot      not used by this function
/// @param range     value range updated in place
/// @param pdt       out: set to ACCEPTABLE when the predicate is accepted
/// @return the first error from a probe or from `_change_value_range`, else OK
template <typename Derived>
template <PrimitiveType T>
Status ScanLocalState<Derived>::_normalize_binary_compound_predicate(
        vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx, SlotDescriptor* slot,
        ColumnValueRange<T>& range, PushDownType* pdt) {
    DCHECK(expr->children().size() == 2);
    if (TExprNodeType::BINARY_PRED != expr->node_type()) {
        return Status::OK();
    }

    auto eq_checker = [](const std::string& fn_name) { return fn_name == "eq"; };
    auto ne_checker = [](const std::string& fn_name) { return fn_name == "ne"; };
    auto noneq_checker = [](const std::string& fn_name) {
        return fn_name != "ne" && fn_name != "eq" && fn_name != "eq_for_null";
    };

    auto* fn_call = reinterpret_cast<vectorized::VectorizedFnCall*>(expr);

    StringRef value;
    int slot_ref_child = -1;
    // Start from UNACCEPTABLE so the comparisons below never read an
    // indeterminate value, whatever the probes do with their out-parameter.
    PushDownType eq_pdt = PushDownType::UNACCEPTABLE;
    PushDownType ne_pdt = PushDownType::UNACCEPTABLE;
    PushDownType noneq_pdt = PushDownType::UNACCEPTABLE;
    RETURN_IF_ERROR(_should_push_down_binary_predicate(fn_call, expr_ctx, &value,
                                                       &slot_ref_child, eq_checker, eq_pdt));
    RETURN_IF_ERROR(_should_push_down_binary_predicate(fn_call, expr_ctx, &value,
                                                       &slot_ref_child, ne_checker, ne_pdt));
    RETURN_IF_ERROR(_should_push_down_binary_predicate(
            fn_call, expr_ctx, &value, &slot_ref_child, noneq_checker, noneq_pdt));

    if (eq_pdt == PushDownType::UNACCEPTABLE && ne_pdt == PushDownType::UNACCEPTABLE &&
        noneq_pdt == PushDownType::UNACCEPTABLE) {
        return Status::OK();
    }
    DCHECK(slot_ref_child >= 0);

    const bool any_acceptable = eq_pdt == PushDownType::ACCEPTABLE ||
                                ne_pdt == PushDownType::ACCEPTABLE ||
                                noneq_pdt == PushDownType::ACCEPTABLE;
    if (!any_acceptable) {
        return Status::OK();
    }

    if (value.data != nullptr) {
        const std::string& fn_name = fn_call->fn().name.function_name;
        if constexpr (T == TYPE_CHAR || T == TYPE_VARCHAR || T == TYPE_STRING ||
                      T == TYPE_HLL) {
            // String-like types are passed as a pointer to a StringRef.
            StringRef val(value.data, value.size);
            RETURN_IF_ERROR(_change_value_range<false>(
                    range, static_cast<void*>(&val),
                    ColumnValueRange<T>::add_compound_value_range, fn_name, slot_ref_child));
        } else {
            // Other types are passed as a pointer to the raw value bytes.
            RETURN_IF_ERROR(_change_value_range<false>(
                    range, static_cast<void*>(const_cast<char*>(value.data)),
                    ColumnValueRange<T>::add_compound_value_range, fn_name, slot_ref_child));
        }
    }
    *pdt = PushDownType::ACCEPTABLE;
    return Status::OK();
}

/// Normalizes an IN / NOT IN predicate that appears inside a compound predicate.
///
/// Expressions that are not IN_PRED are ignored. When the expression exposes a
/// set through `get_set_func()`, or when the predicate's hybrid set contains
/// NULL, `*pdt` becomes UNACCEPTABLE. When the predicate state does not use a
/// set the function returns OK and leaves `*pdt` untouched. Otherwise every
/// non-null element of the hybrid set is added to `range` under the function
/// name "in" or "not_in", and `*pdt` becomes ACCEPTABLE.
///
/// @param expr      expression to normalize
/// @param expr_ctx  context used to look up the predicate's function state
/// @param slot      not used by this function
/// @param range     value range updated in place
/// @param pdt       out: push-down decision (see above)
/// @return the first error from `_change_value_range`, else OK
template <typename Derived>
template <PrimitiveType T>
Status ScanLocalState<Derived>::_normalize_in_and_not_in_compound_predicate(
        vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx, SlotDescriptor* slot,
        ColumnValueRange<T>& range, PushDownType* pdt) {
    if (TExprNodeType::IN_PRED != expr->node_type()) {
        return Status::OK();
    }

    const bool is_filter_in = expr->op() == TExprOpcode::type::FILTER_IN;
    std::string fn_name = is_filter_in ? "in" : "not_in";

    if (expr->get_set_func() != nullptr) {
        *pdt = PushDownType::UNACCEPTABLE;
        return Status::OK();
    }

    auto* in_pred = static_cast<vectorized::VInPredicate*>(expr);
    auto* in_state = reinterpret_cast<vectorized::InState*>(
            expr_ctx->fn_context(in_pred->fn_context_index())
                    ->get_function_state(FunctionContext::FRAGMENT_LOCAL));
    if (!in_state->use_set) {
        return Status::OK();
    }

    // Obtain the iterator before the NULL check, in the same order as before.
    HybridSetBase::IteratorBase* set_iter = in_state->hybrid_set->begin();
    if (in_state->hybrid_set->contain_null()) {
        *pdt = PushDownType::UNACCEPTABLE;
        return Status::OK();
    }

    for (; set_iter->has_next(); set_iter->next()) {
        const void* element = set_iter->get_value();
        if (element == nullptr) {
            continue;
        }
        RETURN_IF_ERROR(_change_value_range<false>(range, const_cast<void*>(element),
                                                   ColumnValueRange<T>::add_compound_value_range,
                                                   fn_name, 0));
    }

    *pdt = PushDownType::ACCEPTABLE;
    return Status::OK();
}

/// Compound-predicate entry point for MATCH predicates.
///
/// Forwards to `_normalize_match_predicate` when `expr` is a MATCH_PRED and is a
/// no-op returning OK otherwise.
///
/// @return the error from `_normalize_match_predicate`, if any, else OK
template <typename Derived>
template <PrimitiveType T>
Status ScanLocalState<Derived>::_normalize_match_compound_predicate(
        vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx, SlotDescriptor* slot,
        ColumnValueRange<T>& range, PushDownType* pdt) {
    DCHECK(expr->children().size() == 2);

    const bool is_match_pred = TExprNodeType::MATCH_PRED == expr->node_type();
    if (!is_match_pred) {
        return Status::OK();
    }

    RETURN_IF_ERROR(_normalize_match_predicate(expr, expr_ctx, slot, range, pdt));
    return Status::OK();
}

/// Normalizes match conjuncts like 'where col match value'.
///
/// Expressions that are not MATCH_PRED are ignored. Otherwise the expression is
/// probed with `_should_push_down_binary_predicate` using `is_match_condition`
/// as the function-name check. If the probe result is not UNACCEPTABLE, the
/// extracted constant (when present) is added to an empty temporary range as a
/// match value, `range` is intersected with that temporary range, and `*pdt`
/// receives the probe result.
///
/// @param expr      expression to normalize
/// @param expr_ctx  context forwarded to the push-down probe
/// @param slot      slot descriptor; its nullability seeds the temporary range
/// @param range     value range updated in place
/// @param pdt       out: written only when the probe is not UNACCEPTABLE
/// @return the error from the probe, if any, else OK
template <typename Derived>
template <PrimitiveType T>
Status ScanLocalState<Derived>::_normalize_match_predicate(vectorized::VExpr* expr,
                                                           vectorized::VExprContext* expr_ctx,
                                                           SlotDescriptor* slot,
                                                           ColumnValueRange<T>& range,
                                                           PushDownType* pdt) {
    if (TExprNodeType::MATCH_PRED != expr->node_type()) {
        return Status::OK();
    }
    DCHECK(expr->children().size() == 2);

    // create empty range as temp range, temp range should do intersection on range
    auto temp_range = ColumnValueRange<T>::create_empty_column_value_range(
            slot->is_nullable(), range.precision(), range.scale());

    auto match_checker = [](const std::string& fn_name) { return is_match_condition(fn_name); };
    StringRef value;
    int slot_ref_child = -1;
    // Start from UNACCEPTABLE so the check below never reads an indeterminate
    // value, whatever the probe does with its out-parameter.
    PushDownType temp_pdt = PushDownType::UNACCEPTABLE;
    RETURN_IF_ERROR(_should_push_down_binary_predicate(
            reinterpret_cast<vectorized::VectorizedFnCall*>(expr), expr_ctx, &value,
            &slot_ref_child, match_checker, temp_pdt));
    if (temp_pdt == PushDownType::UNACCEPTABLE) {
        return Status::OK();
    }
    DCHECK(slot_ref_child >= 0);

    if (value.data != nullptr) {
        using CppType = typename PrimitiveTypeTraits<T>::CppType;
        if constexpr (T == TYPE_CHAR || T == TYPE_VARCHAR || T == TYPE_STRING ||
                      T == TYPE_HLL) {
            // String-like types are passed as a pointer to a StringRef.
            StringRef val(value.data, value.size);
            ColumnValueRange<T>::add_match_value_range(temp_range, to_match_type(expr->op()),
                                                       reinterpret_cast<CppType*>(&val));
        } else {
            // Other types are passed as a pointer to the raw value bytes.
            ColumnValueRange<T>::add_match_value_range(
                    temp_range, to_match_type(expr->op()),
                    reinterpret_cast<CppType*>(const_cast<char*>(value.data)));
        }
        range.intersection(temp_range);
    }
    *pdt = temp_pdt;
    return Status::OK();
}

template <typename Derived>
Status ScanLocalState<Derived>::_prepare_scanners() {
std::list<vectorized::VScannerSPtr> scanners;
Expand Down
35 changes: 0 additions & 35 deletions be/src/pipeline/exec/scan_operator.h
Original file line number Diff line number Diff line change
Expand Up @@ -283,46 +283,11 @@ class ScanLocalState : public ScanLocalStateBase {
vectorized::VExprContext* expr_ctx,
SlotDescriptor* slot, ColumnValueRange<T>& range,
PushDownType* pdt);

// Walks a COMPOUND_PRED expression (recursing into nested compound predicates)
// and appends one value range to _compound_value_ranges for each BINARY_PRED /
// IN_PRED / MATCH_PRED child that acts on a slot according to either checker.
// `is_runtime_filter_predicate` is recorded on every range produced.
void _normalize_compound_predicate(
        vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx, PushDownType* pdt,
        bool is_runtime_filter_predicate,
        const std::function<bool(const vectorized::VExprSPtrs&,
                                 std::shared_ptr<vectorized::VSlotRef>&,
                                 vectorized::VExprSPtr&)>& in_predicate_checker,
        const std::function<bool(const vectorized::VExprSPtrs&,
                                 std::shared_ptr<vectorized::VSlotRef>&,
                                 vectorized::VExprSPtr&)>& eq_predicate_checker);

// Normalizes a BINARY_PRED found inside a compound predicate: when the predicate
// is accepted for push-down, its constant is added to `range` via
// ColumnValueRange<T>::add_compound_value_range and *pdt is set to ACCEPTABLE.
// Expressions of any other node type are ignored.
template <PrimitiveType T>
Status _normalize_binary_compound_predicate(vectorized::VExpr* expr,
vectorized::VExprContext* expr_ctx,
SlotDescriptor* slot, ColumnValueRange<T>& range,
PushDownType* pdt);

// Normalizes an IN_PRED found inside a compound predicate: adds every non-null
// element of the predicate's hybrid set to `range` under "in" or "not_in" and
// sets *pdt to ACCEPTABLE. *pdt becomes UNACCEPTABLE when the expression exposes
// a set via get_set_func() or when the hybrid set contains NULL.
template <PrimitiveType T>
Status _normalize_in_and_not_in_compound_predicate(vectorized::VExpr* expr,
vectorized::VExprContext* expr_ctx,
SlotDescriptor* slot,
ColumnValueRange<T>& range,
PushDownType* pdt);

// Compound-predicate entry point for MATCH_PRED: forwards to
// _normalize_match_predicate when `expr` is a MATCH_PRED, otherwise does nothing.
template <PrimitiveType T>
Status _normalize_match_compound_predicate(vectorized::VExpr* expr,
vectorized::VExprContext* expr_ctx,
SlotDescriptor* slot, ColumnValueRange<T>& range,
PushDownType* pdt);

// NOTE(review): definition is not visible in this excerpt. Judging by the name
// and the shared signature, this presumably normalizes IS NULL / IS NOT NULL
// predicates on `slot` into `range` and reports the decision through `pdt` --
// confirm against the definition.
template <PrimitiveType T>
Status _normalize_is_null_predicate(vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx,
SlotDescriptor* slot, ColumnValueRange<T>& range,
PushDownType* pdt);

// Normalizes match conjuncts like 'where col match value': when the predicate is
// accepted for push-down, the constant is added as a match value to an empty
// temporary range, `range` is intersected with it, and *pdt receives the
// push-down decision. Expressions that are not MATCH_PRED are ignored.
template <PrimitiveType T>
Status _normalize_match_predicate(vectorized::VExpr* expr, vectorized::VExprContext* expr_ctx,
SlotDescriptor* slot, ColumnValueRange<T>& range,
PushDownType* pdt);

// NOTE(review): definition is not visible in this excerpt. Presumably reports
// whether a cast in `expr` can be disregarded for `slot` -- confirm against the
// definition.
bool _ignore_cast(SlotDescriptor* slot, vectorized::VExpr* expr);

template <bool IsFixed, PrimitiveType PrimitiveType, typename ChangeFixedValueRangeFunc>
Expand Down

0 comments on commit 00f3f4c

Please sign in to comment.