mirror of
https://gitee.com/milvus-io/milvus.git
synced 2026-01-01 16:35:29 +08:00
445 lines
18 KiB
C++
445 lines
18 KiB
C++
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License
|
|
|
|
#include <google/protobuf/text_format.h>
|
|
|
|
#include <string>
|
|
|
|
#include "ExprImpl.h"
|
|
#include "PlanProto.h"
|
|
#include "generated/ExtractInfoExprVisitor.h"
|
|
#include "generated/ExtractInfoPlanNodeVisitor.h"
|
|
#include "common/VectorTrait.h"
|
|
|
|
namespace milvus::query {
|
|
namespace planpb = milvus::proto::plan;
|
|
|
|
template <typename T>
|
|
std::unique_ptr<TermExprImpl<T>>
|
|
ExtractTermExprImpl(FieldId field_id, DataType data_type, const planpb::TermExpr& expr_proto) {
|
|
static_assert(IsScalar<T>);
|
|
auto size = expr_proto.values_size();
|
|
std::vector<T> terms(size);
|
|
for (int i = 0; i < size; ++i) {
|
|
auto& value_proto = expr_proto.values(i);
|
|
if constexpr (std::is_same_v<T, bool>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kBoolVal);
|
|
terms[i] = static_cast<T>(value_proto.bool_val());
|
|
} else if constexpr (std::is_integral_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val);
|
|
terms[i] = static_cast<T>(value_proto.int64_val());
|
|
} else if constexpr (std::is_floating_point_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal);
|
|
terms[i] = static_cast<T>(value_proto.float_val());
|
|
} else if constexpr (std::is_same_v<T, std::string>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kStringVal);
|
|
terms[i] = static_cast<T>(value_proto.string_val());
|
|
} else {
|
|
static_assert(always_false<T>);
|
|
}
|
|
}
|
|
std::sort(terms.begin(), terms.end());
|
|
return std::make_unique<TermExprImpl<T>>(field_id, data_type, terms);
|
|
}
|
|
|
|
template <typename T>
|
|
std::unique_ptr<UnaryRangeExprImpl<T>>
|
|
ExtractUnaryRangeExprImpl(FieldId field_id, DataType data_type, const planpb::UnaryRangeExpr& expr_proto) {
|
|
static_assert(IsScalar<T>);
|
|
auto getValue = [&](const auto& value_proto) -> T {
|
|
if constexpr (std::is_same_v<T, bool>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kBoolVal);
|
|
return static_cast<T>(value_proto.bool_val());
|
|
} else if constexpr (std::is_integral_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val);
|
|
return static_cast<T>(value_proto.int64_val());
|
|
} else if constexpr (std::is_floating_point_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal);
|
|
return static_cast<T>(value_proto.float_val());
|
|
} else if constexpr (std::is_same_v<T, std::string>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kStringVal);
|
|
return static_cast<T>(value_proto.string_val());
|
|
} else {
|
|
static_assert(always_false<T>);
|
|
}
|
|
};
|
|
return std::make_unique<UnaryRangeExprImpl<T>>(field_id, data_type, static_cast<OpType>(expr_proto.op()),
|
|
getValue(expr_proto.value()));
|
|
}
|
|
|
|
template <typename T>
|
|
std::unique_ptr<BinaryRangeExprImpl<T>>
|
|
ExtractBinaryRangeExprImpl(FieldId field_id, DataType data_type, const planpb::BinaryRangeExpr& expr_proto) {
|
|
static_assert(IsScalar<T>);
|
|
auto getValue = [&](const auto& value_proto) -> T {
|
|
if constexpr (std::is_same_v<T, bool>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kBoolVal);
|
|
return static_cast<T>(value_proto.bool_val());
|
|
} else if constexpr (std::is_integral_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val);
|
|
return static_cast<T>(value_proto.int64_val());
|
|
} else if constexpr (std::is_floating_point_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal);
|
|
return static_cast<T>(value_proto.float_val());
|
|
} else if constexpr (std::is_same_v<T, std::string>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kStringVal);
|
|
return static_cast<T>(value_proto.string_val());
|
|
} else {
|
|
static_assert(always_false<T>);
|
|
}
|
|
};
|
|
return std::make_unique<BinaryRangeExprImpl<T>>(field_id, data_type, expr_proto.lower_inclusive(),
|
|
expr_proto.upper_inclusive(), getValue(expr_proto.lower_value()),
|
|
getValue(expr_proto.upper_value()));
|
|
}
|
|
|
|
template <typename T>
|
|
std::unique_ptr<BinaryArithOpEvalRangeExprImpl<T>>
|
|
ExtractBinaryArithOpEvalRangeExprImpl(FieldId field_id,
|
|
DataType data_type,
|
|
const planpb::BinaryArithOpEvalRangeExpr& expr_proto) {
|
|
static_assert(std::is_fundamental_v<T>);
|
|
auto getValue = [&](const auto& value_proto) -> T {
|
|
if constexpr (std::is_same_v<T, bool>) {
|
|
// Handle bool here. Otherwise, it can go in `is_integral_v<T>`
|
|
static_assert(always_false<T>);
|
|
} else if constexpr (std::is_integral_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kInt64Val);
|
|
return static_cast<T>(value_proto.int64_val());
|
|
} else if constexpr (std::is_floating_point_v<T>) {
|
|
Assert(value_proto.val_case() == planpb::GenericValue::kFloatVal);
|
|
return static_cast<T>(value_proto.float_val());
|
|
} else {
|
|
static_assert(always_false<T>);
|
|
}
|
|
};
|
|
return std::make_unique<BinaryArithOpEvalRangeExprImpl<T>>(
|
|
field_id, data_type, static_cast<ArithOpType>(expr_proto.arith_op()), getValue(expr_proto.right_operand()),
|
|
static_cast<OpType>(expr_proto.op()), getValue(expr_proto.value()));
|
|
}
|
|
|
|
std::unique_ptr<VectorPlanNode>
|
|
ProtoParser::PlanNodeFromProto(const planpb::PlanNode& plan_node_proto) {
|
|
// TODO: add more buffs
|
|
Assert(plan_node_proto.has_vector_anns());
|
|
auto& anns_proto = plan_node_proto.vector_anns();
|
|
auto expr_opt = [&]() -> std::optional<ExprPtr> {
|
|
if (!anns_proto.has_predicates()) {
|
|
return std::nullopt;
|
|
} else {
|
|
return ParseExpr(anns_proto.predicates());
|
|
}
|
|
}();
|
|
|
|
auto& query_info_proto = anns_proto.query_info();
|
|
|
|
SearchInfo search_info;
|
|
auto field_id = FieldId(anns_proto.field_id());
|
|
search_info.field_id_ = field_id;
|
|
|
|
search_info.metric_type_ = query_info_proto.metric_type();
|
|
search_info.topk_ = query_info_proto.topk();
|
|
search_info.round_decimal_ = query_info_proto.round_decimal();
|
|
search_info.search_params_ = json::parse(query_info_proto.search_params());
|
|
|
|
auto plan_node = [&]() -> std::unique_ptr<VectorPlanNode> {
|
|
if (anns_proto.is_binary()) {
|
|
return std::make_unique<BinaryVectorANNS>();
|
|
} else {
|
|
return std::make_unique<FloatVectorANNS>();
|
|
}
|
|
}();
|
|
plan_node->placeholder_tag_ = anns_proto.placeholder_tag();
|
|
plan_node->predicate_ = std::move(expr_opt);
|
|
plan_node->search_info_ = std::move(search_info);
|
|
return plan_node;
|
|
}
|
|
|
|
std::unique_ptr<RetrievePlanNode>
|
|
ProtoParser::RetrievePlanNodeFromProto(const planpb::PlanNode& plan_node_proto) {
|
|
Assert(plan_node_proto.has_predicates());
|
|
auto& predicate_proto = plan_node_proto.predicates();
|
|
auto expr_opt = [&]() -> ExprPtr { return ParseExpr(predicate_proto); }();
|
|
|
|
auto plan_node = [&]() -> std::unique_ptr<RetrievePlanNode> { return std::make_unique<RetrievePlanNode>(); }();
|
|
plan_node->predicate_ = std::move(expr_opt);
|
|
return plan_node;
|
|
}
|
|
|
|
std::unique_ptr<Plan>
|
|
ProtoParser::CreatePlan(const proto::plan::PlanNode& plan_node_proto) {
|
|
// std::cout << plan_node_proto.DebugString() << std::endl;
|
|
auto plan = std::make_unique<Plan>(schema);
|
|
|
|
auto plan_node = PlanNodeFromProto(plan_node_proto);
|
|
ExtractedPlanInfo plan_info(schema.size());
|
|
ExtractInfoPlanNodeVisitor extractor(plan_info);
|
|
plan_node->accept(extractor);
|
|
|
|
plan->tag2field_["$0"] = plan_node->search_info_.field_id_;
|
|
plan->plan_node_ = std::move(plan_node);
|
|
plan->extra_info_opt_ = std::move(plan_info);
|
|
|
|
for (auto field_id_raw : plan_node_proto.output_field_ids()) {
|
|
auto field_id = FieldId(field_id_raw);
|
|
plan->target_entries_.push_back(field_id);
|
|
}
|
|
|
|
return plan;
|
|
}
|
|
|
|
std::unique_ptr<RetrievePlan>
|
|
ProtoParser::CreateRetrievePlan(const proto::plan::PlanNode& plan_node_proto) {
|
|
auto retrieve_plan = std::make_unique<RetrievePlan>(schema);
|
|
|
|
auto plan_node = RetrievePlanNodeFromProto(plan_node_proto);
|
|
ExtractedPlanInfo plan_info(schema.size());
|
|
ExtractInfoPlanNodeVisitor extractor(plan_info);
|
|
plan_node->accept(extractor);
|
|
|
|
retrieve_plan->plan_node_ = std::move(plan_node);
|
|
for (auto field_id_raw : plan_node_proto.output_field_ids()) {
|
|
auto field_id = FieldId(field_id_raw);
|
|
retrieve_plan->field_ids_.push_back(field_id);
|
|
}
|
|
return retrieve_plan;
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseUnaryRangeExpr(const proto::plan::UnaryRangeExpr& expr_pb) {
|
|
auto& column_info = expr_pb.column_info();
|
|
auto field_id = FieldId(column_info.field_id());
|
|
auto data_type = schema[field_id].get_data_type();
|
|
Assert(data_type == static_cast<DataType>(column_info.data_type()));
|
|
|
|
auto result = [&]() -> ExprPtr {
|
|
switch (data_type) {
|
|
case DataType::BOOL: {
|
|
return ExtractUnaryRangeExprImpl<bool>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT8: {
|
|
return ExtractUnaryRangeExprImpl<int8_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT16: {
|
|
return ExtractUnaryRangeExprImpl<int16_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT32: {
|
|
return ExtractUnaryRangeExprImpl<int32_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT64: {
|
|
return ExtractUnaryRangeExprImpl<int64_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::FLOAT: {
|
|
return ExtractUnaryRangeExprImpl<float>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::DOUBLE: {
|
|
return ExtractUnaryRangeExprImpl<double>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::VARCHAR: {
|
|
return ExtractUnaryRangeExprImpl<std::string>(field_id, data_type, expr_pb);
|
|
}
|
|
default: {
|
|
PanicInfo("unsupported data type");
|
|
}
|
|
}
|
|
}();
|
|
return result;
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseBinaryRangeExpr(const proto::plan::BinaryRangeExpr& expr_pb) {
|
|
auto& columnInfo = expr_pb.column_info();
|
|
auto field_id = FieldId(columnInfo.field_id());
|
|
auto data_type = schema[field_id].get_data_type();
|
|
Assert(data_type == (DataType)columnInfo.data_type());
|
|
|
|
auto result = [&]() -> ExprPtr {
|
|
switch (data_type) {
|
|
case DataType::BOOL: {
|
|
return ExtractBinaryRangeExprImpl<bool>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT8: {
|
|
return ExtractBinaryRangeExprImpl<int8_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT16: {
|
|
return ExtractBinaryRangeExprImpl<int16_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT32: {
|
|
return ExtractBinaryRangeExprImpl<int32_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT64: {
|
|
return ExtractBinaryRangeExprImpl<int64_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::FLOAT: {
|
|
return ExtractBinaryRangeExprImpl<float>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::DOUBLE: {
|
|
return ExtractBinaryRangeExprImpl<double>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::VARCHAR: {
|
|
return ExtractBinaryRangeExprImpl<std::string>(field_id, data_type, expr_pb);
|
|
}
|
|
default: {
|
|
PanicInfo("unsupported data type");
|
|
}
|
|
}
|
|
}();
|
|
return result;
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseCompareExpr(const proto::plan::CompareExpr& expr_pb) {
|
|
auto& left_column_info = expr_pb.left_column_info();
|
|
auto left_field_id = FieldId(left_column_info.field_id());
|
|
auto left_data_type = schema[left_field_id].get_data_type();
|
|
Assert(left_data_type == static_cast<DataType>(left_column_info.data_type()));
|
|
|
|
auto& right_column_info = expr_pb.right_column_info();
|
|
auto right_field_id = FieldId(right_column_info.field_id());
|
|
auto right_data_type = schema[right_field_id].get_data_type();
|
|
Assert(right_data_type == static_cast<DataType>(right_column_info.data_type()));
|
|
|
|
return [&]() -> ExprPtr {
|
|
auto result = std::make_unique<CompareExpr>();
|
|
result->left_field_id_ = left_field_id;
|
|
result->left_data_type_ = left_data_type;
|
|
result->right_field_id_ = right_field_id;
|
|
result->right_data_type_ = right_data_type;
|
|
result->op_type_ = static_cast<OpType>(expr_pb.op());
|
|
return result;
|
|
}();
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseTermExpr(const proto::plan::TermExpr& expr_pb) {
|
|
auto& columnInfo = expr_pb.column_info();
|
|
auto field_id = FieldId(columnInfo.field_id());
|
|
auto data_type = schema[field_id].get_data_type();
|
|
Assert(data_type == (DataType)columnInfo.data_type());
|
|
|
|
// auto& field_meta = schema[field_offset];
|
|
auto result = [&]() -> ExprPtr {
|
|
switch (data_type) {
|
|
case DataType::BOOL: {
|
|
return ExtractTermExprImpl<bool>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT8: {
|
|
return ExtractTermExprImpl<int8_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT16: {
|
|
return ExtractTermExprImpl<int16_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT32: {
|
|
return ExtractTermExprImpl<int32_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT64: {
|
|
return ExtractTermExprImpl<int64_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::FLOAT: {
|
|
return ExtractTermExprImpl<float>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::DOUBLE: {
|
|
return ExtractTermExprImpl<double>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::VARCHAR: {
|
|
return ExtractTermExprImpl<std::string>(field_id, data_type, expr_pb);
|
|
}
|
|
default: {
|
|
PanicInfo("unsupported data type");
|
|
}
|
|
}
|
|
}();
|
|
return result;
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseUnaryExpr(const proto::plan::UnaryExpr& expr_pb) {
|
|
auto op = static_cast<LogicalUnaryExpr::OpType>(expr_pb.op());
|
|
Assert(op == LogicalUnaryExpr::OpType::LogicalNot);
|
|
auto expr = this->ParseExpr(expr_pb.child());
|
|
return std::make_unique<LogicalUnaryExpr>(op, expr);
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseBinaryExpr(const proto::plan::BinaryExpr& expr_pb) {
|
|
auto op = static_cast<LogicalBinaryExpr::OpType>(expr_pb.op());
|
|
auto left_expr = this->ParseExpr(expr_pb.left());
|
|
auto right_expr = this->ParseExpr(expr_pb.right());
|
|
return std::make_unique<LogicalBinaryExpr>(op, left_expr, right_expr);
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseBinaryArithOpEvalRangeExpr(const proto::plan::BinaryArithOpEvalRangeExpr& expr_pb) {
|
|
auto& column_info = expr_pb.column_info();
|
|
auto field_id = FieldId(column_info.field_id());
|
|
auto data_type = schema[field_id].get_data_type();
|
|
Assert(data_type == static_cast<DataType>(column_info.data_type()));
|
|
|
|
auto result = [&]() -> ExprPtr {
|
|
switch (data_type) {
|
|
case DataType::INT8: {
|
|
return ExtractBinaryArithOpEvalRangeExprImpl<int8_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT16: {
|
|
return ExtractBinaryArithOpEvalRangeExprImpl<int16_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT32: {
|
|
return ExtractBinaryArithOpEvalRangeExprImpl<int32_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::INT64: {
|
|
return ExtractBinaryArithOpEvalRangeExprImpl<int64_t>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::FLOAT: {
|
|
return ExtractBinaryArithOpEvalRangeExprImpl<float>(field_id, data_type, expr_pb);
|
|
}
|
|
case DataType::DOUBLE: {
|
|
return ExtractBinaryArithOpEvalRangeExprImpl<double>(field_id, data_type, expr_pb);
|
|
}
|
|
default: {
|
|
PanicInfo("unsupported data type");
|
|
}
|
|
}
|
|
}();
|
|
return result;
|
|
}
|
|
|
|
ExprPtr
|
|
ProtoParser::ParseExpr(const proto::plan::Expr& expr_pb) {
|
|
using ppe = proto::plan::Expr;
|
|
switch (expr_pb.expr_case()) {
|
|
case ppe::kBinaryExpr: {
|
|
return ParseBinaryExpr(expr_pb.binary_expr());
|
|
}
|
|
case ppe::kUnaryExpr: {
|
|
return ParseUnaryExpr(expr_pb.unary_expr());
|
|
}
|
|
case ppe::kTermExpr: {
|
|
return ParseTermExpr(expr_pb.term_expr());
|
|
}
|
|
case ppe::kUnaryRangeExpr: {
|
|
return ParseUnaryRangeExpr(expr_pb.unary_range_expr());
|
|
}
|
|
case ppe::kBinaryRangeExpr: {
|
|
return ParseBinaryRangeExpr(expr_pb.binary_range_expr());
|
|
}
|
|
case ppe::kCompareExpr: {
|
|
return ParseCompareExpr(expr_pb.compare_expr());
|
|
}
|
|
case ppe::kBinaryArithOpEvalRangeExpr: {
|
|
return ParseBinaryArithOpEvalRangeExpr(expr_pb.binary_arith_op_eval_range_expr());
|
|
}
|
|
default:
|
|
PanicInfo("unsupported expr proto node");
|
|
}
|
|
}
|
|
|
|
} // namespace milvus::query
|