enhance: optimize term expr performance (#45671)

issue: https://github.com/milvus-io/milvus/issues/45641
pr: https://github.com/milvus-io/milvus/pull/45491
Signed-off-by: sunby <sunbingyi1992@gmail.com>
2025-12-07 17:48:29 +08:00 · 2025-11-19 19:43:06 +08:00 · 2025-11-19 19:43:06 +08:00 · e4a85ab92e
commit e4a85ab92e
parent 08ae6b5fcc
3 changed files with 24 additions and 17 deletions
--- a/internal/core/src/exec/expression/Element.h
+++ b/internal/core/src/exec/expression/Element.h
@@ -216,7 +216,7 @@ class FlatVectorElement : public MultiElement {
    In(const ValueType& value) const override {
        if (std::holds_alternative<T>(value)) {
            for (const auto& v : values_) {
-                if (v == value)
+                if (v == std::get<T>(value))
                    return true;
            }
        }
--- a/internal/core/src/exec/expression/Expr.h
+++ b/internal/core/src/exec/expression/Expr.h
@@ -982,7 +982,7 @@ class SegmentExpr : public Expr {

    template <typename T, typename FUNC, typename... ValTypes>
    VectorPtr
-    ProcessIndexChunks(FUNC func, ValTypes... values) {
+    ProcessIndexChunks(FUNC func, const ValTypes&... values) {
        typedef std::
            conditional_t<std::is_same_v<T, std::string_view>, std::string, T>
                IndexInnerType;
--- a/internal/core/src/exec/expression/TermExpr.cpp
+++ b/internal/core/src/exec/expression/TermExpr.cpp
@@ -837,29 +837,36 @@ PhyTermFilterExpr::ExecVisitorImplForIndex() {
        return nullptr;
    }

-    std::vector<IndexInnerType> vals;
-    for (auto& val : expr_->vals_) {
-        if constexpr (std::is_same_v<T, double>) {
-            if (val.has_int64_val()) {
-                // only json field will cast int to double because other fields are casted in proxy
-                vals.emplace_back(static_cast<double>(val.int64_val()));
-                continue;
+    if (!arg_inited_) {
+        std::vector<IndexInnerType> vals;
+        for (auto& val : expr_->vals_) {
+            if constexpr (std::is_same_v<T, double>) {
+                if (val.has_int64_val()) {
+                    // only json field will cast int to double because other fields are casted in proxy
+                    vals.emplace_back(static_cast<double>(val.int64_val()));
+                    continue;
+                }
+            }
+
+            // Generic overflow handling for all types
+            bool overflowed = false;
+            auto converted_val =
+                GetValueFromProtoWithOverflow<T>(val, overflowed);
+            if (!overflowed) {
+                vals.emplace_back(converted_val);
            }
        }
-
-        // Generic overflow handling for all types
-        bool overflowed = false;
-        auto converted_val = GetValueFromProtoWithOverflow<T>(val, overflowed);
-        if (!overflowed) {
-            vals.emplace_back(converted_val);
-        }
+        arg_set_ = std::make_shared<FlatVectorElement<IndexInnerType>>(vals);
+        arg_inited_ = true;
    }
    auto execute_sub_batch = [](Index* index_ptr,
                                const std::vector<IndexInnerType>& vals) {
        TermIndexFunc<T> func;
        return func(index_ptr, vals.size(), vals.data());
    };
-    auto res = ProcessIndexChunks<T>(execute_sub_batch, vals);
+    auto args =
+        std::dynamic_pointer_cast<FlatVectorElement<IndexInnerType>>(arg_set_);
+    auto res = ProcessIndexChunks<T>(execute_sub_batch, args->values_);
    AssertInfo(res->size() == real_batch_size,
               "internal error: expr processed rows {} not equal "
               "expect batch size {}",