milvus/pkg/util/paramtable/function_param.go
junjiejiangjjj d3164e8030
feat: add configurable batch factor and runtime check bypass for embedding functions (#45592)
https://github.com/milvus-io/milvus/issues/45544
- Add batch_factor configuration parameter (default: 5) to control
embedding provider batch sizes
- Add disable_func_runtime_check property to bypass function validation
during collection creation
- Add database interceptor support for AddCollectionFunction,
AlterCollectionFunction, and DropCollectionFunction requests

Signed-off-by: junjie.jiang <junjie.jiang@zilliz.com>
2025-11-20 19:55:04 +08:00

200 lines
6.6 KiB
Go

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package paramtable
import (
"strings"
)
type functionConfig struct {
BatchFactor ParamItem `refreshable:"true"`
TextEmbeddingProviders ParamGroup `refreshable:"true"`
RerankModelProviders ParamGroup `refreshable:"true"`
LocalResourcePath ParamItem `refreshable:"true"`
LinderaDownloadUrls ParamGroup `refreshable:"true"`
ZillizProviders ParamGroup `refreshable:"true"`
}
func (p *functionConfig) init(base *BaseTable) {
p.BatchFactor = ParamItem{
Key: "function.batch_factor.",
Version: "2.6.7",
DefaultValue: "5",
}
p.BatchFactor.Init(base.mgr)
p.TextEmbeddingProviders = ParamGroup{
KeyPrefix: "function.textEmbedding.providers.",
Version: "2.6.0",
Export: true,
DocFunc: func(key string) string {
switch key {
case "tei.enable":
return "Whether to enable TEI model service"
case "tei.credential":
return "The name in the crendential configuration item"
case "azure_openai.credential":
return "The name in the crendential configuration item"
case "azure_openai.url":
return "Your azure openai embedding url, Default is the official embedding url"
case "azure_openai.resource_name":
return "Your azure openai resource name"
case "azure_openai.enable":
return "Whether to enable azure openai model service"
case "openai.credential":
return "The name in the crendential configuration item"
case "openai.url":
return "Your openai embedding url, Default is the official embedding url"
case "openai.enable":
return "Whether to enable openai model service"
case "dashscope.credential":
return "The name in the crendential configuration item"
case "dashscope.url":
return "Your dashscope embedding url, Default is the official embedding url"
case "dashscope.enable":
return "Whether to enable dashscope model service"
case "cohere.credential":
return "The name in the crendential configuration item"
case "cohere.url":
return "Your cohere embedding url, Default is the official embedding url"
case "cohere.enable":
return "Whether to enable cohere model service"
case "voyageai.credential":
return "The name in the crendential configuration item"
case "voyageai.url":
return "Your voyageai embedding url, Default is the official embedding url"
case "voyageai.enable":
return "Whether to enable voyageai model service"
case "siliconflow.url":
return "Your siliconflow embedding url, Default is the official embedding url"
case "siliconflow.credential":
return "The name in the crendential configuration item"
case "siliconflow.enable":
return "Whether to enable siliconflow model service"
case "bedrock.credential":
return "The name in the crendential configuration item"
case "bedrock.enable":
return "Whether to enable bedrock model service"
case "vertexai.url":
return "Your VertexAI embedding url"
case "vertexai.credential":
return "The name in the crendential configuration item"
case "vertexai.enable":
return "Whether to enable vertexai model service"
default:
return ""
}
},
}
p.TextEmbeddingProviders.Init(base.mgr)
p.RerankModelProviders = ParamGroup{
KeyPrefix: "function.rerank.model.providers.",
Version: "2.6.0",
Export: true,
DocFunc: func(key string) string {
switch key {
case "tei.credential":
return "The name in the crendential configuration item"
case "tei.enable":
return "Whether to enable TEI rerank service"
case "vllm.credential":
return "The name in the crendential configuration item"
case "vllm.enable":
return "Whether to enable vllm rerank service"
case "siliconflow.credential":
return "The name in the crendential configuration item"
case "siliconflow.url":
return "Your siliconflow rerank url, Default is the official rerank url"
case "siliconflow.enable":
return "Whether to enable siliconflow model service"
case "voyageai.credential":
return "The name in the crendential configuration item"
case "voyageai.url":
return "Your voyageai rerank url, Default is the official rerank url"
case "voyageai.enable":
return "Whether to enable voyageai model service"
case "cohere.credential":
return "The name in the crendential configuration item"
case "cohere.url":
return "Your cohere rerank url, Default is the official rerank url"
case "cohere.enable":
return "Whether to enable cohere model service"
default:
return ""
}
},
}
p.RerankModelProviders.Init(base.mgr)
p.LocalResourcePath = ParamItem{
Key: "function.analyzer.local_resource_path",
Version: "2.5.16",
Export: true,
DefaultValue: "/var/lib/milvus/analyzer",
}
p.LocalResourcePath.Init(base.mgr)
p.LinderaDownloadUrls = ParamGroup{
KeyPrefix: "function.analyzer.lindera.download_urls.",
Version: "2.5.16",
}
p.LinderaDownloadUrls.Init(base.mgr)
p.ZillizProviders = ParamGroup{
KeyPrefix: "function.models.zilliz.",
Version: "2.6.5",
}
p.ZillizProviders.Init(base.mgr)
}
func (p *functionConfig) GetTextEmbeddingProviderConfig(providerName string) map[string]string {
matchedParam := make(map[string]string)
params := p.TextEmbeddingProviders.GetValue()
prefix := providerName + "."
for k, v := range params {
if strings.HasPrefix(k, prefix) {
matchedParam[strings.TrimPrefix(k, prefix)] = v
}
}
return matchedParam
}
func (p *functionConfig) GetBatchFactor() int {
factor := p.BatchFactor.GetAsInt()
if factor <= 0 {
factor = 1
}
return factor
}
func (p *functionConfig) GetRerankModelProviders(providerName string) map[string]string {
matchedParam := make(map[string]string)
params := p.RerankModelProviders.GetValue()
prefix := providerName + "."
for k, v := range params {
if strings.HasPrefix(k, prefix) {
matchedParam[strings.TrimPrefix(k, prefix)] = v
}
}
return matchedParam
}