mirror of
https://gitee.com/milvus-io/milvus.git
synced 2025-12-07 01:28:27 +08:00
issue: #36672 The expression supports filling elements through templates, which helps to reduce the overhead of parsing the elements. --------- Signed-off-by: Cai Zhang <cai.zhang@zilliz.com>
159 lines
5.4 KiB
Go
159 lines
5.4 KiB
Go
package common
|
|
|
|
import (
|
|
"encoding/binary"
|
|
"fmt"
|
|
"math"
|
|
"math/rand"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/x448/float16"
|
|
"go.uber.org/zap"
|
|
|
|
"github.com/milvus-io/milvus/client/v2/entity"
|
|
"github.com/milvus-io/milvus/pkg/log"
|
|
)
|
|
|
|
var (
|
|
letterRunes = []rune("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ")
|
|
r *rand.Rand
|
|
)
|
|
|
|
func init() {
|
|
r = rand.New(rand.NewSource(time.Now().UnixNano()))
|
|
}
|
|
|
|
func GenRandomString(prefix string, n int) string {
|
|
b := make([]rune, n)
|
|
for i := range b {
|
|
b[i] = letterRunes[r.Intn(len(letterRunes))]
|
|
}
|
|
str := fmt.Sprintf("%s_%s", prefix, string(b))
|
|
return str
|
|
}
|
|
|
|
// GenLongString gen invalid long string
|
|
func GenLongString(n int) string {
|
|
var builder strings.Builder
|
|
longString := "a"
|
|
for i := 0; i < n; i++ {
|
|
builder.WriteString(longString)
|
|
}
|
|
return builder.String()
|
|
}
|
|
|
|
func GenValidNames() []string {
|
|
return []string{
|
|
"a",
|
|
"_",
|
|
"_name",
|
|
"_123",
|
|
"name_",
|
|
"_coll_123_",
|
|
}
|
|
}
|
|
|
|
func GenInvalidNames() []string {
|
|
invalidNames := []string{
|
|
"",
|
|
" ",
|
|
"12-s",
|
|
"(mn)",
|
|
"中文",
|
|
"%$#",
|
|
"1",
|
|
"[10]",
|
|
"a b",
|
|
DefaultDynamicFieldName,
|
|
GenLongString(MaxCollectionNameLen + 1),
|
|
}
|
|
return invalidNames
|
|
}
|
|
|
|
func GenFloatVector(dim int) []float32 {
|
|
vector := make([]float32, 0, dim)
|
|
for j := 0; j < dim; j++ {
|
|
vector = append(vector, rand.Float32())
|
|
}
|
|
return vector
|
|
}
|
|
|
|
func GenFloat16Vector(dim int) []byte {
|
|
ret := make([]byte, dim*2)
|
|
for i := 0; i < dim; i++ {
|
|
v := float16.Fromfloat32(rand.Float32()).Bits()
|
|
binary.LittleEndian.PutUint16(ret[i*2:], v)
|
|
}
|
|
return ret
|
|
}
|
|
|
|
func GenBFloat16Vector(dim int) []byte {
|
|
ret16 := make([]uint16, 0, dim)
|
|
for i := 0; i < dim; i++ {
|
|
f := rand.Float32()
|
|
bits := math.Float32bits(f)
|
|
bits >>= 16
|
|
bits &= 0x7FFF
|
|
ret16 = append(ret16, uint16(bits))
|
|
}
|
|
ret := make([]byte, len(ret16)*2)
|
|
for i, value := range ret16 {
|
|
binary.LittleEndian.PutUint16(ret[i*2:], value)
|
|
}
|
|
return ret
|
|
}
|
|
|
|
func GenBinaryVector(dim int) []byte {
|
|
vector := make([]byte, dim/8)
|
|
rand.Read(vector)
|
|
return vector
|
|
}
|
|
|
|
func GenSparseVector(maxLen int) entity.SparseEmbedding {
|
|
length := 1 + rand.Intn(1+maxLen)
|
|
positions := make([]uint32, length)
|
|
values := make([]float32, length)
|
|
for i := 0; i < length; i++ {
|
|
positions[i] = uint32(2*i + 1)
|
|
values[i] = rand.Float32()
|
|
}
|
|
vector, err := entity.NewSliceSparseEmbedding(positions, values)
|
|
if err != nil {
|
|
log.Fatal("Generate vector failed %s", zap.Error(err))
|
|
}
|
|
return vector
|
|
}
|
|
|
|
// InvalidExprStruct invalid expr
|
|
type InvalidExprStruct struct {
|
|
Expr string
|
|
ErrNil bool
|
|
ErrMsg string
|
|
}
|
|
|
|
var InvalidExpressions = []InvalidExprStruct{
|
|
{Expr: "id in [0]", ErrNil: true, ErrMsg: "fieldName(id) not found"}, // not exist field but no error
|
|
{Expr: "int64 in not [0]", ErrNil: false, ErrMsg: "cannot parse expression"}, // wrong term expr keyword
|
|
{Expr: "int64 > 10 AND int64 < 100", ErrNil: false, ErrMsg: "cannot parse expression"}, // AND isn't supported
|
|
{Expr: "int64 < 10 OR int64 > 100", ErrNil: false, ErrMsg: "cannot parse expression"}, // OR isn't supported
|
|
{Expr: "int64 < floatVec", ErrNil: false, ErrMsg: "not supported"}, // unsupported compare field
|
|
{Expr: "floatVec in [0]", ErrNil: false, ErrMsg: "cannot be casted to FloatVector"}, // value and field type mismatch
|
|
{Expr: fmt.Sprintf("%s == 1", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""}, // hist empty
|
|
{Expr: fmt.Sprintf("%s like 'a%%' ", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""}, // hist empty
|
|
{Expr: fmt.Sprintf("%s like `a%%` ", DefaultJSONFieldName), ErrNil: false, ErrMsg: "cannot parse expression"}, // ``
|
|
{Expr: fmt.Sprintf("%s > 1", DefaultDynamicFieldName), ErrNil: true, ErrMsg: ""}, // hits empty
|
|
{Expr: fmt.Sprintf("%s[\"dynamicList\"] == [2, 3]", DefaultDynamicFieldName), ErrNil: true, ErrMsg: ""},
|
|
{Expr: fmt.Sprintf("%s['a'] == [2, 3]", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""}, // json field not exist
|
|
{Expr: fmt.Sprintf("%s['number'] == [2, 3]", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""}, // field exist but type not match
|
|
{Expr: fmt.Sprintf("%s[0] == [2, 3]", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""}, // field exist but type not match
|
|
{Expr: fmt.Sprintf("json_contains (%s['number'], 2)", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""},
|
|
{Expr: fmt.Sprintf("json_contains (%s['list'], [2])", DefaultJSONFieldName), ErrNil: true, ErrMsg: ""},
|
|
{Expr: fmt.Sprintf("json_contains_all (%s['list'], 2)", DefaultJSONFieldName), ErrNil: false, ErrMsg: "operation element must be an array"},
|
|
{Expr: fmt.Sprintf("JSON_CONTAINS_ANY (%s['list'], 2)", DefaultJSONFieldName), ErrNil: false, ErrMsg: "operation element must be an array"},
|
|
{Expr: fmt.Sprintf("json_contains_aby (%s['list'], 2)", DefaultJSONFieldName), ErrNil: false, ErrMsg: "function json_contains_aby(json, int64_t) not found."},
|
|
{Expr: fmt.Sprintf("json_contains_aby (%s['list'], 2)", DefaultJSONFieldName), ErrNil: false, ErrMsg: "function json_contains_aby(json, int64_t) not found."},
|
|
{Expr: fmt.Sprintf("%s[-1] > %d", DefaultInt8ArrayField, TestCapacity), ErrNil: false, ErrMsg: "cannot parse expression"}, // array[-1] >
|
|
{Expr: fmt.Sprintf("%s[-1] > 1", DefaultJSONFieldName), ErrNil: false, ErrMsg: "invalid expression"}, // json[-1] >
|
|
}
|