// Copyright (C) 2019-2020 Zilliz. All rights reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software distributed under the License // is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express // or implied. See the License for the specific language governing permissions and limitations under the License #include #include "ExprImpl.h" #include "PlanProto.h" #include "generated/ExtractInfoExprVisitor.h" #include "generated/ExtractInfoPlanNodeVisitor.h" namespace milvus::query { namespace planpb = milvus::proto::plan; template std::unique_ptr> ExtractTermExprImpl(FieldOffset field_offset, DataType data_type, const planpb::TermExpr& expr_proto) { static_assert(std::is_fundamental_v); auto size = expr_proto.values_size(); std::vector terms(size); for (int i = 0; i < size; ++i) { auto& value_proto = expr_proto.values(i); if constexpr (std::is_same_v) { Assert(value_proto.val_case() == planpb::GenericValue::kBoolVal); terms[i] = static_cast(value_proto.bool_val()); } else if constexpr (std::is_integral_v) { Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val); terms[i] = static_cast(value_proto.int64_val()); } else if constexpr (std::is_floating_point_v) { Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal); terms[i] = static_cast(value_proto.float_val()); } else { static_assert(always_false); } } std::sort(terms.begin(), terms.end()); return std::make_unique>(field_offset, data_type, terms); } template std::unique_ptr> ExtractUnaryRangeExprImpl(FieldOffset field_offset, DataType data_type, const planpb::UnaryRangeExpr& expr_proto) { static_assert(std::is_fundamental_v); auto getValue = [&](const auto& value_proto) -> T { if constexpr (std::is_same_v) { Assert(value_proto.val_case() == planpb::GenericValue::kBoolVal); return static_cast(value_proto.bool_val()); } else if constexpr (std::is_integral_v) { Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val); return static_cast(value_proto.int64_val()); } else if constexpr (std::is_floating_point_v) { Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal); return static_cast(value_proto.float_val()); } else { static_assert(always_false); } }; return std::make_unique>(field_offset, data_type, static_cast(expr_proto.op()), getValue(expr_proto.value())); } template std::unique_ptr> ExtractBinaryRangeExprImpl(FieldOffset field_offset, DataType data_type, const planpb::BinaryRangeExpr& expr_proto) { static_assert(std::is_fundamental_v); auto getValue = [&](const auto& value_proto) -> T { if constexpr (std::is_same_v) { Assert(value_proto.val_case() == planpb::GenericValue::kBoolVal); return static_cast(value_proto.bool_val()); } else if constexpr (std::is_integral_v) { Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val); return static_cast(value_proto.int64_val()); } else if constexpr (std::is_floating_point_v) { Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal); return static_cast(value_proto.float_val()); } else { static_assert(always_false); } }; return std::make_unique>(field_offset, data_type, expr_proto.lower_inclusive(), expr_proto.upper_inclusive(), getValue(expr_proto.lower_value()), getValue(expr_proto.upper_value())); } std::unique_ptr ProtoParser::PlanNodeFromProto(const planpb::PlanNode& plan_node_proto) { // TODO: add more buffs Assert(plan_node_proto.has_vector_anns()); auto& anns_proto = plan_node_proto.vector_anns(); auto expr_opt = [&]() -> std::optional { if (!anns_proto.has_predicates()) { return std::nullopt; } else { return ParseExpr(anns_proto.predicates()); } }(); auto& query_info_proto = anns_proto.query_info(); SearchInfo search_info; auto field_id = FieldId(anns_proto.field_id()); auto field_offset = schema.get_offset(field_id); search_info.field_offset_ = field_offset; search_info.metric_type_ = GetMetricType(query_info_proto.metric_type()); search_info.topk_ = query_info_proto.topk(); search_info.round_decimal_ = query_info_proto.round_decimal(); search_info.search_params_ = json::parse(query_info_proto.search_params()); auto plan_node = [&]() -> std::unique_ptr { if (anns_proto.is_binary()) { return std::make_unique(); } else { return std::make_unique(); } }(); plan_node->placeholder_tag_ = anns_proto.placeholder_tag(); plan_node->predicate_ = std::move(expr_opt); plan_node->search_info_ = std::move(search_info); return plan_node; } std::unique_ptr ProtoParser::RetrievePlanNodeFromProto(const planpb::PlanNode& plan_node_proto) { Assert(plan_node_proto.has_predicates()); auto& predicate_proto = plan_node_proto.predicates(); auto expr_opt = [&]() -> ExprPtr { return ParseExpr(predicate_proto); }(); auto plan_node = [&]() -> std::unique_ptr { return std::make_unique(); }(); plan_node->predicate_ = std::move(expr_opt); return plan_node; } std::unique_ptr ProtoParser::CreatePlan(const proto::plan::PlanNode& plan_node_proto) { auto plan = std::make_unique(schema); auto plan_node = PlanNodeFromProto(plan_node_proto); ExtractedPlanInfo plan_info(schema.size()); ExtractInfoPlanNodeVisitor extractor(plan_info); plan_node->accept(extractor); plan->tag2field_["$0"] = plan_node->search_info_.field_offset_; plan->plan_node_ = std::move(plan_node); plan->extra_info_opt_ = std::move(plan_info); for (auto field_id_raw : plan_node_proto.output_field_ids()) { auto field_id = FieldId(field_id_raw); auto offset = schema.get_offset(field_id); plan->target_entries_.push_back(offset); } return plan; } std::unique_ptr ProtoParser::CreateRetrievePlan(const proto::plan::PlanNode& plan_node_proto) { auto retrieve_plan = std::make_unique(schema); auto plan_node = RetrievePlanNodeFromProto(plan_node_proto); ExtractedPlanInfo plan_info(schema.size()); ExtractInfoPlanNodeVisitor extractor(plan_info); plan_node->accept(extractor); retrieve_plan->plan_node_ = std::move(plan_node); for (auto field_id_raw : plan_node_proto.output_field_ids()) { auto field_id = FieldId(field_id_raw); auto offset = schema.get_offset(field_id); retrieve_plan->field_offsets_.push_back(offset); } return retrieve_plan; } ExprPtr ProtoParser::ParseUnaryRangeExpr(const proto::plan::UnaryRangeExpr& expr_pb) { auto& column_info = expr_pb.column_info(); auto field_id = FieldId(column_info.field_id()); auto field_offset = schema.get_offset(field_id); auto data_type = schema[field_offset].get_data_type(); Assert(data_type == static_cast(column_info.data_type())); auto result = [&]() -> ExprPtr { switch (data_type) { case DataType::BOOL: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT8: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT16: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT32: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT64: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::FLOAT: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::DOUBLE: { return ExtractUnaryRangeExprImpl(field_offset, data_type, expr_pb); } default: { PanicInfo("unsupported data type"); } } }(); return result; } ExprPtr ProtoParser::ParseBinaryRangeExpr(const proto::plan::BinaryRangeExpr& expr_pb) { auto& columnInfo = expr_pb.column_info(); auto field_id = FieldId(columnInfo.field_id()); auto field_offset = schema.get_offset(field_id); auto data_type = schema[field_offset].get_data_type(); Assert(data_type == (DataType)columnInfo.data_type()); auto result = [&]() -> ExprPtr { switch (data_type) { case DataType::BOOL: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT8: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT16: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT32: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::INT64: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::FLOAT: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } case DataType::DOUBLE: { return ExtractBinaryRangeExprImpl(field_offset, data_type, expr_pb); } default: { PanicInfo("unsupported data type"); } } }(); return result; } ExprPtr ProtoParser::ParseCompareExpr(const proto::plan::CompareExpr& expr_pb) { auto& left_column_info = expr_pb.left_column_info(); auto left_field_id = FieldId(left_column_info.field_id()); auto left_field_offset = schema.get_offset(left_field_id); auto left_data_type = schema[left_field_offset].get_data_type(); Assert(left_data_type == static_cast(left_column_info.data_type())); auto& right_column_info = expr_pb.right_column_info(); auto right_field_id = FieldId(right_column_info.field_id()); auto right_field_offset = schema.get_offset(right_field_id); auto right_data_type = schema[right_field_offset].get_data_type(); Assert(right_data_type == static_cast(right_column_info.data_type())); return [&]() -> ExprPtr { auto result = std::make_unique(); result->left_field_offset_ = left_field_offset; result->left_data_type_ = left_data_type; result->right_field_offset_ = right_field_offset; result->right_data_type_ = right_data_type; result->op_type_ = static_cast(expr_pb.op()); return result; }(); } ExprPtr ProtoParser::ParseTermExpr(const proto::plan::TermExpr& expr_pb) { auto& columnInfo = expr_pb.column_info(); auto field_id = FieldId(columnInfo.field_id()); auto field_offset = schema.get_offset(field_id); auto data_type = schema[field_offset].get_data_type(); Assert(data_type == (DataType)columnInfo.data_type()); // auto& field_meta = schema[field_offset]; auto result = [&]() -> ExprPtr { switch (data_type) { case DataType::BOOL: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } case DataType::INT8: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } case DataType::INT16: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } case DataType::INT32: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } case DataType::INT64: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } case DataType::FLOAT: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } case DataType::DOUBLE: { return ExtractTermExprImpl(field_offset, data_type, expr_pb); } default: { PanicInfo("unsupported data type"); } } }(); return result; } ExprPtr ProtoParser::ParseUnaryExpr(const proto::plan::UnaryExpr& expr_pb) { auto op = static_cast(expr_pb.op()); Assert(op == LogicalUnaryExpr::OpType::LogicalNot); auto expr = this->ParseExpr(expr_pb.child()); return std::make_unique(op, expr); } ExprPtr ProtoParser::ParseBinaryExpr(const proto::plan::BinaryExpr& expr_pb) { auto op = static_cast(expr_pb.op()); auto left_expr = this->ParseExpr(expr_pb.left()); auto right_expr = this->ParseExpr(expr_pb.right()); return std::make_unique(op, left_expr, right_expr); } ExprPtr ProtoParser::ParseExpr(const proto::plan::Expr& expr_pb) { using ppe = proto::plan::Expr; switch (expr_pb.expr_case()) { case ppe::kBinaryExpr: { return ParseBinaryExpr(expr_pb.binary_expr()); } case ppe::kUnaryExpr: { return ParseUnaryExpr(expr_pb.unary_expr()); } case ppe::kTermExpr: { return ParseTermExpr(expr_pb.term_expr()); } case ppe::kUnaryRangeExpr: { return ParseUnaryRangeExpr(expr_pb.unary_range_expr()); } case ppe::kBinaryRangeExpr: { return ParseBinaryRangeExpr(expr_pb.binary_range_expr()); } case ppe::kCompareExpr: { return ParseCompareExpr(expr_pb.compare_expr()); } default: PanicInfo("unsupported expr proto node"); } } } // namespace milvus::query