enhance: optimize term expr performance (#45491)

issue: https://github.com/milvus-io/milvus/issues/45641 --------- Signed-off-by: sunby <sunbingyi1992@gmail.com>
2025-12-06 17:18:35 +08:00 · 2025-11-21 11:01:05 +08:00 · 2025-11-21 11:01:05 +08:00 · 275a5b9afc
commit 275a5b9afc
parent 3202847092
1 changed files with 22 additions and 15 deletions
--- a/internal/core/src/exec/expression/TermExpr.cpp
+++ b/internal/core/src/exec/expression/TermExpr.cpp
@ -838,29 +838,36 @@ PhyTermFilterExpr::ExecVisitorImplForIndex() {
        return nullptr;
    }
-    std::vector<IndexInnerType> vals;
+    if (!arg_inited_) {
-    for (auto& val : expr_->vals_) {
+        std::vector<IndexInnerType> vals;
-        if constexpr (std::is_same_v<T, double>) {
+        for (auto& val : expr_->vals_) {
-            if (val.has_int64_val()) {
+            if constexpr (std::is_same_v<T, double>) {
-                // only json field will cast int to double because other fields are casted in proxy
+                if (val.has_int64_val()) {
-                vals.emplace_back(static_cast<double>(val.int64_val()));
+                    // only json field will cast int to double because other fields are casted in proxy
-                continue;
+                    vals.emplace_back(static_cast<double>(val.int64_val()));
                    continue;
                }
            }
            // Generic overflow handling for all types
            bool overflowed = false;
            auto converted_val =
                GetValueFromProtoWithOverflow<T>(val, overflowed);
            if (!overflowed) {
                vals.emplace_back(converted_val);
            }
        }
-
+        arg_set_ = std::make_shared<FlatVectorElement<IndexInnerType>>(vals);
-        // Generic overflow handling for all types
+        arg_inited_ = true;
        bool overflowed = false;
        auto converted_val = GetValueFromProtoWithOverflow<T>(val, overflowed);
        if (!overflowed) {
            vals.emplace_back(converted_val);
        }
    }
    auto execute_sub_batch = [](Index* index_ptr,
                                const std::vector<IndexInnerType>& vals) {
        TermIndexFunc<T> func;
        return func(index_ptr, vals.size(), vals.data());
    };
-    auto res = ProcessIndexChunks<T>(execute_sub_batch, vals);
+    auto args =
        std::dynamic_pointer_cast<FlatVectorElement<IndexInnerType>>(arg_set_);
    auto res = ProcessIndexChunks<T>(execute_sub_batch, args->values_);
    AssertInfo(res->size() == real_batch_size,
               "internal error: expr processed rows {} not equal "
               "expect batch size {}",