mirror of
https://gitee.com/milvus-io/milvus.git
synced 2025-12-28 22:45:26 +08:00
related: #45993 This commit extends nullable vector support to the proxy layer, querynode, and adds comprehensive validation, search reduce, and field data handling for nullable vectors with sparse storage. Proxy layer changes: - Update validate_util.go checkAligned() with getExpectedVectorRows() helper to validate nullable vector field alignment using valid data count - Update checkFloatVectorFieldData/checkSparseFloatVectorFieldData for nullable vector validation with proper row count expectations - Add FieldDataIdxComputer in typeutil/schema.go for logical-to-physical index translation during search reduce operations - Update search_reduce_util.go reduceSearchResultData to use idxComputers for correct field data indexing with nullable vectors - Update task.go, task_query.go, task_upsert.go for nullable vector handling - Update msg_pack.go with nullable vector field data processing QueryNode layer changes: - Update segments/result.go for nullable vector result handling - Update segments/search_reduce.go with nullable vector offset translation Storage and index changes: - Update data_codec.go and utils.go for nullable vector serialization - Update indexcgowrapper/dataset.go and index.go for nullable vector indexing Utility changes: - Add FieldDataIdxComputer struct with Compute() method for efficient logical-to-physical index mapping across multiple field data - Update EstimateEntitySize() and AppendFieldData() with fieldIdxs parameter - Update funcutil.go with nullable vector support functions <!-- This is an auto-generated comment: release notes by coderabbit.ai --> ## Summary by CodeRabbit * **New Features** * Full support for nullable vector fields (float, binary, float16, bfloat16, int8, sparse) across ingest, storage, indexing, search and retrieval; logical↔physical offset mapping preserves row semantics. * Client: compaction control and compaction-state APIs. * **Bug Fixes** * Improved validation for adding vector fields (nullable + dimension checks) and corrected search/query behavior for nullable vectors. * **Chores** * Persisted validity maps with indexes and on-disk formats. * **Tests** * Extensive new and updated end-to-end nullable-vector tests. <sub>✏️ Tip: You can customize this high-level summary in your review settings.</sub> <!-- end of auto-generated comment: release notes by coderabbit.ai --> --------- Signed-off-by: marcelo-cjl <marcelo.chen@zilliz.com>
3097 lines
88 KiB
Go
3097 lines
88 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package storage
|
|
|
|
import (
|
|
"math"
|
|
"math/rand"
|
|
"testing"
|
|
|
|
"github.com/apache/arrow/go/v17/arrow/array"
|
|
"github.com/stretchr/testify/assert"
|
|
"github.com/stretchr/testify/require"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
|
|
"github.com/milvus-io/milvus/pkg/v2/util/merr"
|
|
"github.com/milvus-io/milvus/pkg/v2/util/typeutil"
|
|
)
|
|
|
|
func TestPayload_ReaderAndWriter(t *testing.T) {
|
|
t.Run("TestBool", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, false, false, false}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]bool{false, false, false, false}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 8, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 8)
|
|
bools, valids, err := r.GetBoolFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []bool{false, false, false, false, false, false, false, false}, bools)
|
|
assert.Nil(t, valids)
|
|
ibools, valids, _, err := r.GetDataFromPayload()
|
|
bools = ibools.([]bool)
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.Equal(t, []bool{false, false, false, false, false, false, false, false}, bools)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt8", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt8ToPayload([]int8{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int8{4, 5, 6}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
int8s, valids, err := r.GetInt8FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.Equal(t, []int8{1, 2, 3, 4, 5, 6}, int8s)
|
|
|
|
iint8s, valids, _, err := r.GetDataFromPayload()
|
|
int8s = iint8s.([]int8)
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
|
|
assert.Equal(t, []int8{1, 2, 3, 4, 5, 6}, int8s)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt16", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int16)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt16ToPayload([]int16{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int16{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
int16s, valids, err := r.GetInt16FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.Equal(t, []int16{1, 2, 3, 1, 2, 3}, int16s)
|
|
|
|
iint16s, valids, _, err := r.GetDataFromPayload()
|
|
int16s = iint16s.([]int16)
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.Equal(t, []int16{1, 2, 3, 1, 2, 3}, int16s)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt32", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int32)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt32ToPayload([]int32{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int32{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
int32s, valids, err := r.GetInt32FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int32{1, 2, 3, 1, 2, 3}, int32s)
|
|
assert.Nil(t, valids)
|
|
|
|
iint32s, valids, _, err := r.GetDataFromPayload()
|
|
int32s = iint32s.([]int32)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int32{1, 2, 3, 1, 2, 3}, int32s)
|
|
assert.Nil(t, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt64", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int64)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt64ToPayload([]int64{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int64{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
int64s, valids, err := r.GetInt64FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int64{1, 2, 3, 1, 2, 3}, int64s)
|
|
assert.Nil(t, valids)
|
|
|
|
iint64s, valids, _, err := r.GetDataFromPayload()
|
|
int64s = iint64s.([]int64)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int64{1, 2, 3, 1, 2, 3}, int64s)
|
|
assert.Nil(t, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestFloat32", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatToPayload([]float32{1.0, 2.0, 3.0}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]float32{1.0, 2.0, 3.0}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
float32s, valids, err := r.GetFloatFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float32{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float32s)
|
|
assert.Nil(t, valids)
|
|
|
|
ifloat32s, valids, _, err := r.GetDataFromPayload()
|
|
float32s = ifloat32s.([]float32)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float32{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float32s)
|
|
assert.Nil(t, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestDouble", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Double)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddDoubleToPayload([]float64{1.0, 2.0, 3.0}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]float64{1.0, 2.0, 3.0}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
float64s, valids, err := r.GetDoubleFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float64{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float64s)
|
|
assert.Nil(t, valids)
|
|
|
|
ifloat64s, valids, _, err := r.GetDataFromPayload()
|
|
float64s = ifloat64s.([]float64)
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.Equal(t, []float64{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float64s)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestAddString", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneStringToPayload("hello0", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello1", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello2", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT("hello3", nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
str, valids, err := r.GetStringFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
|
|
assert.Equal(t, str[0], "hello0")
|
|
assert.Equal(t, str[1], "hello1")
|
|
assert.Equal(t, str[2], "hello2")
|
|
assert.Equal(t, str[3], "hello3")
|
|
|
|
istr, valids, _, err := r.GetDataFromPayload()
|
|
strArray := istr.([]string)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, strArray[0], "hello0")
|
|
assert.Equal(t, strArray[1], "hello1")
|
|
assert.Equal(t, strArray[2], "hello2")
|
|
assert.Equal(t, strArray[3], "hello3")
|
|
assert.Nil(t, valids)
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestAddArray", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Array)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{3, 4},
|
|
},
|
|
},
|
|
}, true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{5, 6},
|
|
},
|
|
},
|
|
}, true)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{7, 8},
|
|
},
|
|
},
|
|
}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Array, buffer, false)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
arrayList, valids, err := r.GetArrayFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
|
|
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{3, 4}, arrayList[1].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{7, 8}, arrayList[3].GetIntData().GetData())
|
|
|
|
iArrayList, valids, _, err := r.GetDataFromPayload()
|
|
arrayList = iArrayList.([]*schemapb.ScalarField)
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{3, 4}, arrayList[1].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{7, 8}, arrayList[3].GetIntData().GetData())
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestAddJSON", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_JSON)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneJSONToPayload([]byte(`{"1":"1"}`), true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneJSONToPayload([]byte(`{"2":"2"}`), true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneJSONToPayload([]byte(`{"3":"3"}`), true)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]byte(`{"4":"4"}`), nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_JSON, buffer, false)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
json, valids, err := r.GetJSONFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
|
|
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
|
|
assert.EqualValues(t, []byte(`{"2":"2"}`), json[1])
|
|
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
|
|
assert.EqualValues(t, []byte(`{"4":"4"}`), json[3])
|
|
|
|
iJSON, valids, _, err := r.GetDataFromPayload()
|
|
json = iJSON.([][]byte)
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
|
|
assert.EqualValues(t, []byte(`{"2":"2"}`), json[1])
|
|
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
|
|
assert.EqualValues(t, []byte(`{"4":"4"}`), json[3])
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestBinaryVector", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
in := make([]byte, 16)
|
|
for i := 0; i < 16; i++ {
|
|
in[i] = 1
|
|
}
|
|
in2 := make([]byte, 8)
|
|
for i := 0; i < 8; i++ {
|
|
in2[i] = 1
|
|
}
|
|
|
|
err = w.AddBinaryVectorToPayload(in, 8, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT(in2, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 24, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 24)
|
|
|
|
binVecs, dim, _, _, err := r.GetBinaryVectorFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 8, dim)
|
|
assert.Equal(t, 24, len(binVecs))
|
|
|
|
ibinVecs, valids, dim, err := r.GetDataFromPayload()
|
|
assert.Nil(t, valids)
|
|
assert.NoError(t, err)
|
|
binVecs = ibinVecs.([]byte)
|
|
assert.Equal(t, 8, dim)
|
|
assert.Equal(t, 24, len(binVecs))
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestFloatVector", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(1))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatVectorToPayload([]float32{1.0, 2.0}, 1, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]float32{3.0, 4.0}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 4, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
floatVecs, dim, _, _, err := r.GetFloatVectorFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 1, dim)
|
|
assert.Equal(t, 4, len(floatVecs))
|
|
assert.Equal(t, []float32{1.0, 2.0, 3.0, 4.0}, floatVecs)
|
|
|
|
ifloatVecs, valids, dim, err := r.GetDataFromPayload()
|
|
assert.Nil(t, valids)
|
|
assert.NoError(t, err)
|
|
floatVecs = ifloatVecs.([]float32)
|
|
assert.Equal(t, 1, dim)
|
|
assert.Equal(t, 4, len(floatVecs))
|
|
assert.Equal(t, []float32{1.0, 2.0, 3.0, 4.0}, floatVecs)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestFloat16Vector", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float16Vector, WithDim(1))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloat16VectorToPayload([]byte{1, 2}, 1, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]byte{3, 4}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 2, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Float16Vector, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 2)
|
|
|
|
float16Vecs, dim, _, _, err := r.GetFloat16VectorFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 1, dim)
|
|
assert.Equal(t, 4, len(float16Vecs))
|
|
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, float16Vecs)
|
|
|
|
ifloat16Vecs, valids, dim, err := r.GetDataFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
float16Vecs = ifloat16Vecs.([]byte)
|
|
assert.Equal(t, 1, dim)
|
|
assert.Equal(t, 4, len(float16Vecs))
|
|
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, float16Vecs)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestBFloat16Vector", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BFloat16Vector, WithDim(1))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBFloat16VectorToPayload([]byte{1, 2}, 1, nil)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]byte{3, 4}, nil)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 2, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_BFloat16Vector, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 2)
|
|
|
|
bfloat16Vecs, dim, _, _, err := r.GetBFloat16VectorFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 1, dim)
|
|
assert.Equal(t, 4, len(bfloat16Vecs))
|
|
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, bfloat16Vecs)
|
|
|
|
ibfloat16Vecs, valids, dim, err := r.GetDataFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
bfloat16Vecs = ibfloat16Vecs.([]byte)
|
|
assert.Equal(t, 1, dim)
|
|
assert.Equal(t, 4, len(bfloat16Vecs))
|
|
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, bfloat16Vecs)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestSparseFloatVector", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
|
|
SparseFloatArray: schemapb.SparseFloatArray{
|
|
Dim: 600,
|
|
Contents: [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{0, 1, 2}, []float32{1.1, 1.2, 1.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, 3.2, 3.3}),
|
|
},
|
|
},
|
|
})
|
|
assert.NoError(t, err)
|
|
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
|
|
SparseFloatArray: schemapb.SparseFloatArray{
|
|
Dim: 600,
|
|
Contents: [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{60, 80, 230}, []float32{2.1, 2.2, 2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{170, 300, 579}, []float32{3.1, 3.2, 3.3}),
|
|
},
|
|
},
|
|
})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_SparseFloatVector, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
floatVecs, dim, _, err := r.GetSparseFloatVectorFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 600, dim)
|
|
assert.Equal(t, 6, len(floatVecs.Contents))
|
|
assert.EqualExportedValues(t, &schemapb.SparseFloatArray{
|
|
// merged dim should be max of all dims
|
|
Dim: 600,
|
|
Contents: [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{0, 1, 2}, []float32{1.1, 1.2, 1.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, 3.2, 3.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{60, 80, 230}, []float32{2.1, 2.2, 2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{170, 300, 579}, []float32{3.1, 3.2, 3.3}),
|
|
},
|
|
}, &floatVecs.SparseFloatArray)
|
|
|
|
ifloatVecs, valids, dim, err := r.GetDataFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Nil(t, valids)
|
|
assert.Equal(t, floatVecs, ifloatVecs.(*SparseFloatVectorFieldData))
|
|
assert.Equal(t, 600, dim)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
testSparseOneBatch := func(t *testing.T, rows [][]byte, actualDim int) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
|
|
SparseFloatArray: schemapb.SparseFloatArray{
|
|
Dim: int64(actualDim),
|
|
Contents: rows,
|
|
},
|
|
})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 3, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_SparseFloatVector, buffer, false)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 3)
|
|
|
|
floatVecs, dim, _, err := r.GetSparseFloatVectorFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, actualDim, dim)
|
|
assert.Equal(t, 3, len(floatVecs.Contents))
|
|
assert.EqualExportedValues(t, &schemapb.SparseFloatArray{
|
|
Dim: int64(dim),
|
|
Contents: rows,
|
|
}, &floatVecs.SparseFloatArray)
|
|
|
|
ifloatVecs, valids, dim, err := r.GetDataFromPayload()
|
|
assert.Nil(t, valids)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, floatVecs, ifloatVecs.(*SparseFloatVectorFieldData))
|
|
assert.Equal(t, actualDim, dim)
|
|
defer r.ReleasePayloadReader()
|
|
}
|
|
|
|
t.Run("TestSparseFloatVector_emptyRow", func(t *testing.T) {
|
|
testSparseOneBatch(t, [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, 3.2, 3.3}),
|
|
}, 600)
|
|
testSparseOneBatch(t, [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
}, 0)
|
|
})
|
|
|
|
t.Run("TestSparseFloatVector_largeRow", func(t *testing.T) {
|
|
nnz := 100000
|
|
// generate an int slice with nnz random sorted elements
|
|
indices := make([]uint32, nnz)
|
|
values := make([]float32, nnz)
|
|
for i := 0; i < nnz; i++ {
|
|
indices[i] = uint32(i * 6)
|
|
values[i] = float32(i)
|
|
}
|
|
dim := int(indices[nnz-1]) + 1
|
|
testSparseOneBatch(t, [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
|
|
typeutil.CreateSparseFloatRow(indices, values),
|
|
}, dim)
|
|
})
|
|
|
|
t.Run("TestSparseFloatVector_negativeValues", func(t *testing.T) {
|
|
testSparseOneBatch(t, [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{-2.1, 2.2, -2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, -3.2, 3.3}),
|
|
}, 600)
|
|
})
|
|
|
|
// even though SPARSE_INVERTED_INDEX and SPARSE_WAND index do not support
|
|
// arbitrarily large dimensions, HNSW does, so we still need to test it.
|
|
// Dimension range we support is 0 to positive int32 max - 1(to leave room
|
|
// for dim).
|
|
t.Run("TestSparseFloatVector_largeIndex", func(t *testing.T) {
|
|
int32Max := uint32(math.MaxInt32)
|
|
testSparseOneBatch(t, [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
|
|
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{-2.1, 2.2, -2.3}),
|
|
typeutil.CreateSparseFloatRow([]uint32{100, int32Max / 2, int32Max - 1}, []float32{3.1, -3.2, 3.3}),
|
|
}, int(int32Max))
|
|
})
|
|
|
|
t.Run("TestAddBoolAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddBoolToPayload([]bool{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddBoolToPayload([]bool{false}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
|
|
t.Run("TestAddInt8AfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddInt8ToPayload([]int8{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddInt8ToPayload([]int8{0}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddInt16AfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int16)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddInt16ToPayload([]int16{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddInt16ToPayload([]int16{0}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddInt32AfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int32)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddInt32ToPayload([]int32{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddInt32ToPayload([]int32{0}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddInt64AfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int64)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddInt64ToPayload([]int64{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddInt64ToPayload([]int64{0}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddFloatAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddFloatToPayload([]float32{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddFloatToPayload([]float32{0.0}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddDoubleAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Double)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddDoubleToPayload([]float64{}, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddDoubleToPayload([]float64{0.0}, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddOneStringAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddOneStringToPayload("", true)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("c", true)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddBinVectorAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.Error(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
err = w.AddBinaryVectorToPayload([]byte{}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.AddBinaryVectorToPayload([]byte{1}, 0, nil)
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddBinaryVectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.Error(t, err)
|
|
err = w.AddBinaryVectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddFloatVectorAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
err = w.AddFloatVectorToPayload([]float32{}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.AddFloatVectorToPayload([]float32{1.0}, 0, nil)
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddFloatVectorToPayload([]float32{1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.Error(t, err)
|
|
err = w.AddFloatVectorToPayload([]float32{1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0}, 8, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddFloat16VectorAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float16Vector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
err = w.AddFloat16VectorToPayload([]byte{}, 8, nil)
|
|
assert.Error(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
err = w.AddFloat16VectorToPayload([]byte{}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.AddFloat16VectorToPayload([]byte{1}, 0, nil)
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.Error(t, err)
|
|
err = w.AddFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddBFloat16VectorAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BFloat16Vector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
err = w.AddBFloat16VectorToPayload([]byte{}, 8, nil)
|
|
assert.Error(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
err = w.AddBFloat16VectorToPayload([]byte{}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.AddBFloat16VectorToPayload([]byte{1}, 0, nil)
|
|
assert.Error(t, err)
|
|
|
|
err = w.AddBFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.Error(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.Error(t, err)
|
|
err = w.AddBFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestAddSparseFloatVectorAfterFinish", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
defer w.Close()
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
|
|
SparseFloatArray: schemapb.SparseFloatArray{
|
|
Dim: 53,
|
|
Contents: [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
|
|
},
|
|
},
|
|
})
|
|
assert.Error(t, err)
|
|
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
|
|
SparseFloatArray: schemapb.SparseFloatArray{
|
|
Dim: 600,
|
|
Contents: [][]byte{
|
|
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
|
|
},
|
|
},
|
|
})
|
|
assert.Error(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestNewReadError", func(t *testing.T) {
|
|
buffer := []byte{0}
|
|
r, err := NewPayloadReader(999, buffer, false)
|
|
assert.Error(t, err)
|
|
assert.Nil(t, r)
|
|
})
|
|
t.Run("TestGetDataError", func(t *testing.T) {
|
|
r := PayloadReader{}
|
|
r.colType = 999
|
|
|
|
_, _, _, err := r.GetDataFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetBoolError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt8ToPayload([]int8{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetBoolFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetBoolFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetBoolError2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{true, false, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetBoolFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt8Error", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetInt8FromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetInt8FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt8Error2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt8ToPayload([]int8{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetInt8FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt16Error", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetInt16FromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetInt16FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt16Error2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int16)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt16ToPayload([]int16{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetInt16FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt32Error", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetInt32FromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetInt32FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt32Error2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int32)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt32ToPayload([]int32{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetInt32FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt64Error", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetInt64FromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetInt64FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetInt64Error2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int64)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt64ToPayload([]int64{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetInt64FromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetFloatError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetFloatFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetFloatFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetFloatError2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatToPayload([]float32{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetFloatFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetDoubleError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetDoubleFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetDoubleFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetDoubleError2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Double)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddDoubleToPayload([]float64{1, 2, 3}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetDoubleFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetStringError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetStringFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetStringFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetStringError2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneStringToPayload("hello0", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello1", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello2", true)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, err = r.GetStringFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetArrayError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Array, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, err = r.GetArrayFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, err = r.GetArrayFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetBinaryVectorError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, _, _, err = r.GetBinaryVectorFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, _, _, err = r.GetBinaryVectorFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetBinaryVectorError2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBinaryVectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, _, _, err = r.GetBinaryVectorFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetFloatVectorError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
_, _, _, _, err = r.GetFloatVectorFromPayload()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = 999
|
|
_, _, _, _, err = r.GetFloatVectorFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
t.Run("TestGetFloatVectorError2", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(8))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatVectorToPayload([]float32{1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0}, 8, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.numRows = 99
|
|
_, _, _, _, err = r.GetFloatVectorFromPayload()
|
|
assert.Error(t, err)
|
|
})
|
|
|
|
t.Run("TestByteArrayDatasetError", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneStringToPayload("hello0", true)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
r.colType = 99
|
|
_, err = r.GetByteArrayDataSet()
|
|
assert.Error(t, err)
|
|
|
|
r.colType = schemapb.DataType_String
|
|
dataset, err := r.GetByteArrayDataSet()
|
|
assert.NoError(t, err)
|
|
|
|
dataset.columnIdx = math.MaxInt
|
|
_, err = dataset.NextBatch(100)
|
|
assert.Error(t, err)
|
|
|
|
dataset.groupID = math.MaxInt
|
|
assert.Error(t, err)
|
|
})
|
|
|
|
t.Run("TestWriteLargeSizeData", func(t *testing.T) {
|
|
t.Skip("Large data skip for online ut")
|
|
size := 1 << 29 // 512M
|
|
var vec []float32
|
|
for i := 0; i < size/4; i++ {
|
|
vec = append(vec, 1)
|
|
}
|
|
|
|
w, err := NewPayloadWriter(schemapb.DataType_FloatVector)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.AddFloatVectorToPayload(vec, 128, nil)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
_, err = w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestAddBool with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt8 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt8ToPayload([]int8{1}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt16 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int16)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt16ToPayload([]int16{1}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt32 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int32)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt32ToPayload([]int32{1}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt64 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int64)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt64ToPayload([]int64{1}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddFloat32 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatToPayload([]float32{1.0}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddDouble with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Double)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddDoubleToPayload([]float64{1.0}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddAddString with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneStringToPayload("hello0", false)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddArray with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Array)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, false)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddJSON with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_JSON)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneJSONToPayload([]byte(`{"1":"1"}`), false)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestVectorArray", func(t *testing.T) {
|
|
dim := 4
|
|
w, err := NewPayloadWriter(
|
|
schemapb.DataType_ArrayOfVector,
|
|
WithDim(dim),
|
|
WithElementType(schemapb.DataType_FloatVector),
|
|
)
|
|
require.NoError(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
// Create VectorArrayFieldData with 3 rows
|
|
vectorArrayData := &VectorArrayFieldData{
|
|
Dim: int64(dim),
|
|
Data: []*schemapb.VectorField{
|
|
{
|
|
Dim: int64(dim),
|
|
Data: &schemapb.VectorField_FloatVector{
|
|
FloatVector: &schemapb.FloatArray{
|
|
Data: []float32{1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0},
|
|
},
|
|
},
|
|
},
|
|
{
|
|
Dim: int64(dim),
|
|
Data: &schemapb.VectorField_FloatVector{
|
|
FloatVector: &schemapb.FloatArray{
|
|
Data: []float32{11.0, 22.0, 33.0, 44.0},
|
|
},
|
|
},
|
|
},
|
|
{
|
|
Dim: int64(dim),
|
|
Data: &schemapb.VectorField_FloatVector{
|
|
FloatVector: &schemapb.FloatArray{
|
|
Data: []float32{111.0, 222.0, 333.0, 444.0, 555.0, 666.0, 777.0, 888.0, 999.0, 1000.0, 1111.0, 1212.0, 1313.0, 1414.0, 1515.0, 1616.0, 1717.0, 1818.0, 1919.0, 2020.0},
|
|
},
|
|
},
|
|
},
|
|
},
|
|
ElementType: schemapb.DataType_FloatVector,
|
|
}
|
|
|
|
err = w.AddVectorArrayFieldDataToPayload(vectorArrayData)
|
|
assert.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 3, length)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_ArrayOfVector, buffer, false)
|
|
assert.NoError(t, err)
|
|
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 3, length)
|
|
|
|
vectorArrays, err := r.GetVectorArrayFromPayload()
|
|
assert.NoError(t, err)
|
|
|
|
assert.EqualValues(t, []float32{1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0}, vectorArrays[0].GetFloatVector().GetData())
|
|
assert.EqualValues(t, []float32{11.0, 22.0, 33.0, 44.0}, vectorArrays[1].GetFloatVector().GetData())
|
|
assert.EqualValues(t, []float32{111.0, 222.0, 333.0, 444.0, 555.0, 666.0, 777.0, 888.0, 999.0, 1000.0, 1111.0, 1212.0, 1313.0, 1414.0, 1515.0, 1616.0, 1717.0, 1818.0, 1919.0, 2020.0}, vectorArrays[2].GetFloatVector().GetData())
|
|
for _, v := range vectorArrays {
|
|
assert.Equal(t, int64(dim), v.GetDim())
|
|
}
|
|
|
|
iArrayList, _, _, err := r.GetDataFromPayload()
|
|
vectorArrays = iArrayList.([]*schemapb.VectorField)
|
|
assert.NoError(t, err)
|
|
assert.EqualValues(t, []float32{1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0}, vectorArrays[0].GetFloatVector().GetData())
|
|
assert.EqualValues(t, []float32{11.0, 22.0, 33.0, 44.0}, vectorArrays[1].GetFloatVector().GetData())
|
|
assert.EqualValues(t, []float32{111.0, 222.0, 333.0, 444.0, 555.0, 666.0, 777.0, 888.0, 999.0, 1000.0, 1111.0, 1212.0, 1313.0, 1414.0, 1515.0, 1616.0, 1717.0, 1818.0, 1919.0, 2020.0}, vectorArrays[2].GetFloatVector().GetData())
|
|
for _, v := range vectorArrays {
|
|
assert.Equal(t, int64(dim), v.GetDim())
|
|
}
|
|
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
}
|
|
|
|
func TestPayload_NullableReaderAndWriter(t *testing.T) {
|
|
t.Run("TestBool", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{true, false, false, false}, []bool{true, false, true, false})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]bool{true, false, false, false}, []bool{true, false, true, false})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 8, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 8)
|
|
bools, valids, err := r.GetBoolFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []bool{true, false, false, false, true, false, false, false}, bools)
|
|
assert.Equal(t, []bool{true, false, true, false, true, false, true, false}, valids)
|
|
ibools, valids, _, err := r.GetDataFromPayload()
|
|
bools = ibools.([]bool)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []bool{true, false, false, false, true, false, false, false}, bools)
|
|
assert.Equal(t, []bool{true, false, true, false, true, false, true, false}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt8", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt8ToPayload([]int8{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int8{4, 5, 6}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
int8s, valids, err := r.GetInt8FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int8{1, 0, 3, 4, 0, 6}, int8s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
|
|
iint8s, valids, _, err := r.GetDataFromPayload()
|
|
int8s = iint8s.([]int8)
|
|
assert.NoError(t, err)
|
|
|
|
assert.Equal(t, []int8{1, 0, 3, 4, 0, 6}, int8s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt16", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int16, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt16ToPayload([]int16{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int16{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
int16s, valids, err := r.GetInt16FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int16{1, 0, 3, 1, 0, 3}, int16s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
|
|
iint16s, valids, _, err := r.GetDataFromPayload()
|
|
int16s = iint16s.([]int16)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int16{1, 0, 3, 1, 0, 3}, int16s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt32", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int32, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt32ToPayload([]int32{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int32{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
int32s, valids, err := r.GetInt32FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int32{1, 0, 3, 1, 0, 3}, int32s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
|
|
iint32s, valids, _, err := r.GetDataFromPayload()
|
|
int32s = iint32s.([]int32)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int32{1, 0, 3, 1, 0, 3}, int32s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestInt64", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int64, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt64ToPayload([]int64{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]int64{1, 2, 3}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
int64s, valids, err := r.GetInt64FromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int64{1, 0, 3, 1, 0, 3}, int64s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
|
|
iint64s, valids, _, err := r.GetDataFromPayload()
|
|
int64s = iint64s.([]int64)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []int64{1, 0, 3, 1, 0, 3}, int64s)
|
|
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestFloat32", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatToPayload([]float32{1.0, 2.0, 3.0}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]float32{1.0, 2.0, 3.0}, []bool{false, true, false})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
float32s, valids, err := r.GetFloatFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float32{1.0, 0, 3.0, 0, 2.0, 0}, float32s)
|
|
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
|
|
|
|
ifloat32s, valids, _, err := r.GetDataFromPayload()
|
|
float32s = ifloat32s.([]float32)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float32{1.0, 0, 3.0, 0, 2.0, 0}, float32s)
|
|
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestDouble", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Double, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddDoubleToPayload([]float64{1.0, 2.0, 3.0}, []bool{true, false, true})
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]float64{1.0, 2.0, 3.0}, []bool{false, true, false})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 6, length)
|
|
defer w.ReleasePayloadWriter()
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, true)
|
|
require.Nil(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 6)
|
|
|
|
float64s, valids, err := r.GetDoubleFromPayload()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float64{1.0, 0, 3.0, 0, 2.0, 0}, float64s)
|
|
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
|
|
|
|
ifloat64s, valids, _, err := r.GetDataFromPayload()
|
|
float64s = ifloat64s.([]float64)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, []float64{1.0, 0, 3.0, 0, 2.0, 0}, float64s)
|
|
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
|
|
defer r.ReleasePayloadReader()
|
|
})
|
|
|
|
t.Run("TestAddString", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneStringToPayload("hello0", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello1", false)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello2", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT("hello3", []bool{false})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, true)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
str, valids, err := r.GetStringFromPayload()
|
|
assert.NoError(t, err)
|
|
|
|
assert.Equal(t, str[0], "hello0")
|
|
assert.Equal(t, str[1], "")
|
|
assert.Equal(t, str[2], "hello2")
|
|
assert.Equal(t, str[3], "")
|
|
assert.Equal(t, []bool{true, false, true, false}, valids)
|
|
|
|
istr, valids, _, err := r.GetDataFromPayload()
|
|
strArray := istr.([]string)
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, strArray[0], "hello0")
|
|
assert.Equal(t, strArray[1], "")
|
|
assert.Equal(t, strArray[2], "hello2")
|
|
assert.Equal(t, strArray[3], "")
|
|
assert.Equal(t, []bool{true, false, true, false}, valids)
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestAddArray", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Array, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{3, 4},
|
|
},
|
|
},
|
|
}, false)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{5, 6},
|
|
},
|
|
},
|
|
}, true)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{7, 8},
|
|
},
|
|
},
|
|
}, []bool{false})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Array, buffer, true)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
arrayList, valids, err := r.GetArrayFromPayload()
|
|
assert.NoError(t, err)
|
|
|
|
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32(nil), arrayList[1].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32(nil), arrayList[3].GetIntData().GetData())
|
|
assert.Equal(t, []bool{true, false, true, false}, valids)
|
|
|
|
iArrayList, valids, _, err := r.GetDataFromPayload()
|
|
arrayList = iArrayList.([]*schemapb.ScalarField)
|
|
assert.NoError(t, err)
|
|
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32(nil), arrayList[1].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
|
|
assert.EqualValues(t, []int32(nil), arrayList[3].GetIntData().GetData())
|
|
assert.Equal(t, []bool{true, false, true, false}, valids)
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestAddJSON", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_JSON, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddOneJSONToPayload([]byte(`{"1":"1"}`), true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneJSONToPayload([]byte(`{"2":"2"}`), false)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneJSONToPayload([]byte(`{"3":"3"}`), true)
|
|
assert.NoError(t, err)
|
|
err = w.AddDataToPayloadForUT([]byte(`{"4":"4"}`), []bool{false})
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_JSON, buffer, true)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, length, 4)
|
|
|
|
json, valids, err := r.GetJSONFromPayload()
|
|
assert.NoError(t, err)
|
|
|
|
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
|
|
assert.EqualValues(t, []byte(``), json[1])
|
|
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
|
|
assert.EqualValues(t, []byte(``), json[3])
|
|
assert.Equal(t, []bool{true, false, true, false}, valids)
|
|
|
|
iJSON, valids, _, err := r.GetDataFromPayload()
|
|
json = iJSON.([][]byte)
|
|
assert.NoError(t, err)
|
|
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
|
|
assert.EqualValues(t, []byte(``), json[1])
|
|
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
|
|
assert.EqualValues(t, []byte(``), json[3])
|
|
assert.Equal(t, []bool{true, false, true, false}, valids)
|
|
r.ReleasePayloadReader()
|
|
w.ReleasePayloadWriter()
|
|
})
|
|
|
|
t.Run("TestFloatVector", func(t *testing.T) {
|
|
dim := 128
|
|
numRows := 100
|
|
|
|
type testCase struct {
|
|
name string
|
|
validDataSetup func([]bool) int
|
|
}
|
|
|
|
testCases := []testCase{
|
|
{
|
|
name: "half null",
|
|
validDataSetup: func(validData []bool) int {
|
|
validCount := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if i%2 == 0 {
|
|
validData[i] = true
|
|
validCount++
|
|
}
|
|
}
|
|
return validCount
|
|
},
|
|
},
|
|
{
|
|
name: "all valid",
|
|
validDataSetup: func(validData []bool) int {
|
|
for i := 0; i < numRows; i++ {
|
|
validData[i] = true
|
|
}
|
|
return numRows
|
|
},
|
|
},
|
|
{
|
|
name: "all null",
|
|
validDataSetup: func(validData []bool) int {
|
|
return 0
|
|
},
|
|
},
|
|
}
|
|
|
|
for _, tc := range testCases {
|
|
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(dim), WithNullable(true))
|
|
require.NoError(t, err)
|
|
|
|
validData := make([]bool, numRows)
|
|
validCount := tc.validDataSetup(validData)
|
|
|
|
data := make([]float32, validCount*dim)
|
|
dataIdx := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if validData[i] {
|
|
for j := 0; j < dim; j++ {
|
|
data[dataIdx*dim+j] = float32(i*100 + j)
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
|
|
err = w.AddFloatVectorToPayload(data, dim, validData)
|
|
require.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
require.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
require.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, true)
|
|
require.NoError(t, err)
|
|
|
|
readData, readDim, readValid, readNumRows, err := r.GetFloatVectorFromPayload()
|
|
require.NoError(t, err)
|
|
require.Equal(t, dim, readDim)
|
|
require.Equal(t, numRows, readNumRows)
|
|
require.Equal(t, numRows, len(readValid))
|
|
|
|
dataIdx = 0
|
|
for i := 0; i < numRows; i++ {
|
|
require.Equal(t, validData[i], readValid[i])
|
|
if validData[i] {
|
|
pos := dataIdx
|
|
for j := 0; j < dim; j++ {
|
|
require.Equal(t, data[dataIdx*dim+j], readData[pos*dim+j])
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
}
|
|
})
|
|
|
|
t.Run("TestBinaryVector", func(t *testing.T) {
|
|
dim := 128
|
|
numRows := 100
|
|
|
|
type testCase struct {
|
|
name string
|
|
validDataSetup func([]bool) int
|
|
}
|
|
|
|
testCases := []testCase{
|
|
{
|
|
name: "partial null",
|
|
validDataSetup: func(validData []bool) int {
|
|
validCount := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if i%3 == 0 {
|
|
validData[i] = true
|
|
validCount++
|
|
}
|
|
}
|
|
return validCount
|
|
},
|
|
},
|
|
{
|
|
name: "all valid",
|
|
validDataSetup: func(validData []bool) int {
|
|
for i := 0; i < numRows; i++ {
|
|
validData[i] = true
|
|
}
|
|
return numRows
|
|
},
|
|
},
|
|
{
|
|
name: "all null",
|
|
validDataSetup: func(validData []bool) int {
|
|
return 0
|
|
},
|
|
},
|
|
}
|
|
|
|
for _, tc := range testCases {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(dim), WithNullable(true))
|
|
require.NoError(t, err)
|
|
|
|
validData := make([]bool, numRows)
|
|
validCount := tc.validDataSetup(validData)
|
|
|
|
data := make([]byte, validCount*dim/8)
|
|
dataIdx := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if validData[i] {
|
|
for j := 0; j < dim/8; j++ {
|
|
data[dataIdx*dim/8+j] = byte(i + j)
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
|
|
err = w.AddBinaryVectorToPayload(data, dim, validData)
|
|
require.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
require.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
require.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, true)
|
|
require.NoError(t, err)
|
|
|
|
readData, readDim, readValid, readNumRows, err := r.GetBinaryVectorFromPayload()
|
|
require.NoError(t, err)
|
|
require.Equal(t, dim, readDim)
|
|
require.Equal(t, numRows, readNumRows)
|
|
require.Equal(t, numRows, len(readValid))
|
|
|
|
dataIdx = 0
|
|
for i := 0; i < numRows; i++ {
|
|
require.Equal(t, validData[i], readValid[i])
|
|
if validData[i] {
|
|
pos := dataIdx
|
|
for j := 0; j < dim/8; j++ {
|
|
require.Equal(t, data[dataIdx*dim/8+j], readData[pos*dim/8+j])
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
}
|
|
})
|
|
|
|
t.Run("TestFloat16Vector", func(t *testing.T) {
|
|
dim := 128
|
|
numRows := 100
|
|
|
|
type testCase struct {
|
|
name string
|
|
validDataSetup func([]bool) int
|
|
}
|
|
|
|
testCases := []testCase{
|
|
{
|
|
name: "partial null",
|
|
validDataSetup: func(validData []bool) int {
|
|
validCount := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if i%2 == 1 {
|
|
validData[i] = true
|
|
validCount++
|
|
}
|
|
}
|
|
return validCount
|
|
},
|
|
},
|
|
{
|
|
name: "all valid",
|
|
validDataSetup: func(validData []bool) int {
|
|
for i := 0; i < numRows; i++ {
|
|
validData[i] = true
|
|
}
|
|
return numRows
|
|
},
|
|
},
|
|
{
|
|
name: "all null",
|
|
validDataSetup: func(validData []bool) int {
|
|
return 0
|
|
},
|
|
},
|
|
}
|
|
|
|
for _, tc := range testCases {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float16Vector, WithDim(dim), WithNullable(true))
|
|
require.NoError(t, err)
|
|
|
|
validData := make([]bool, numRows)
|
|
validCount := tc.validDataSetup(validData)
|
|
|
|
data := make([]byte, validCount*dim*2)
|
|
dataIdx := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if validData[i] {
|
|
for j := 0; j < dim*2; j++ {
|
|
data[dataIdx*dim*2+j] = byte((i*10 + j) % 256)
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
|
|
err = w.AddFloat16VectorToPayload(data, dim, validData)
|
|
require.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
require.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
require.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Float16Vector, buffer, true)
|
|
require.NoError(t, err)
|
|
|
|
readData, readDim, readValid, readNumRows, err := r.GetFloat16VectorFromPayload()
|
|
require.NoError(t, err)
|
|
require.Equal(t, dim, readDim)
|
|
require.Equal(t, numRows, readNumRows)
|
|
require.Equal(t, numRows, len(readValid))
|
|
|
|
dataIdx = 0
|
|
for i := 0; i < numRows; i++ {
|
|
require.Equal(t, validData[i], readValid[i])
|
|
if validData[i] {
|
|
pos := dataIdx
|
|
for j := 0; j < dim*2; j++ {
|
|
require.Equal(t, data[dataIdx*dim*2+j], readData[pos*dim*2+j])
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
}
|
|
})
|
|
|
|
t.Run("TestBFloat16Vector", func(t *testing.T) {
|
|
dim := 128
|
|
numRows := 100
|
|
|
|
type testCase struct {
|
|
name string
|
|
validDataSetup func([]bool) int
|
|
}
|
|
|
|
testCases := []testCase{
|
|
{
|
|
name: "partial null",
|
|
validDataSetup: func(validData []bool) int {
|
|
validCount := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if (i+1)%3 != 0 {
|
|
validData[i] = true
|
|
validCount++
|
|
}
|
|
}
|
|
return validCount
|
|
},
|
|
},
|
|
{
|
|
name: "all valid",
|
|
validDataSetup: func(validData []bool) int {
|
|
for i := 0; i < numRows; i++ {
|
|
validData[i] = true
|
|
}
|
|
return numRows
|
|
},
|
|
},
|
|
{
|
|
name: "all null",
|
|
validDataSetup: func(validData []bool) int {
|
|
return 0
|
|
},
|
|
},
|
|
}
|
|
|
|
for _, tc := range testCases {
|
|
w, err := NewPayloadWriter(schemapb.DataType_BFloat16Vector, WithDim(dim), WithNullable(true))
|
|
require.NoError(t, err)
|
|
|
|
validData := make([]bool, numRows)
|
|
validCount := tc.validDataSetup(validData)
|
|
|
|
data := make([]byte, validCount*dim*2)
|
|
dataIdx := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if validData[i] {
|
|
for j := 0; j < dim*2; j++ {
|
|
data[dataIdx*dim*2+j] = byte((i*20 + j) % 256)
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
|
|
err = w.AddBFloat16VectorToPayload(data, dim, validData)
|
|
require.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
require.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
require.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_BFloat16Vector, buffer, true)
|
|
require.NoError(t, err)
|
|
|
|
readData, readDim, readValid, readNumRows, err := r.GetBFloat16VectorFromPayload()
|
|
require.NoError(t, err)
|
|
require.Equal(t, dim, readDim)
|
|
require.Equal(t, numRows, readNumRows)
|
|
require.Equal(t, numRows, len(readValid))
|
|
|
|
dataIdx = 0
|
|
for i := 0; i < numRows; i++ {
|
|
require.Equal(t, validData[i], readValid[i])
|
|
if validData[i] {
|
|
pos := dataIdx
|
|
for j := 0; j < dim*2; j++ {
|
|
require.Equal(t, data[dataIdx*dim*2+j], readData[pos*dim*2+j])
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
}
|
|
})
|
|
|
|
t.Run("TestInt8Vector", func(t *testing.T) {
|
|
dim := 128
|
|
numRows := 100
|
|
|
|
type testCase struct {
|
|
name string
|
|
validDataSetup func([]bool) int
|
|
}
|
|
|
|
testCases := []testCase{
|
|
{
|
|
name: "partial null",
|
|
validDataSetup: func(validData []bool) int {
|
|
validCount := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if i < numRows/2 {
|
|
validData[i] = true
|
|
validCount++
|
|
}
|
|
}
|
|
return validCount
|
|
},
|
|
},
|
|
{
|
|
name: "all valid",
|
|
validDataSetup: func(validData []bool) int {
|
|
for i := 0; i < numRows; i++ {
|
|
validData[i] = true
|
|
}
|
|
return numRows
|
|
},
|
|
},
|
|
{
|
|
name: "all null",
|
|
validDataSetup: func(validData []bool) int {
|
|
return 0
|
|
},
|
|
},
|
|
}
|
|
|
|
for _, tc := range testCases {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8Vector, WithDim(dim), WithNullable(true))
|
|
require.NoError(t, err)
|
|
|
|
validData := make([]bool, numRows)
|
|
validCount := tc.validDataSetup(validData)
|
|
|
|
data := make([]int8, validCount*dim)
|
|
dataIdx := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if validData[i] {
|
|
for j := 0; j < dim; j++ {
|
|
data[dataIdx*dim+j] = int8((i*10 + j) % 128)
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
|
|
err = w.AddInt8VectorToPayload(data, dim, validData)
|
|
require.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
require.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
require.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_Int8Vector, buffer, true)
|
|
require.NoError(t, err)
|
|
|
|
readData, readDim, readValid, readNumRows, err := r.GetInt8VectorFromPayload()
|
|
require.NoError(t, err)
|
|
require.Equal(t, dim, readDim)
|
|
require.Equal(t, numRows, readNumRows)
|
|
require.Equal(t, numRows, len(readValid))
|
|
|
|
dataIdx = 0
|
|
for i := 0; i < numRows; i++ {
|
|
require.Equal(t, validData[i], readValid[i])
|
|
if validData[i] {
|
|
pos := dataIdx
|
|
for j := 0; j < dim; j++ {
|
|
require.Equal(t, data[dataIdx*dim+j], readData[pos*dim+j])
|
|
}
|
|
dataIdx++
|
|
}
|
|
}
|
|
}
|
|
})
|
|
|
|
t.Run("TestSparseFloatVector", func(t *testing.T) {
|
|
numRows := 100
|
|
|
|
type testCase struct {
|
|
name string
|
|
validDataSetup func([]bool) int
|
|
}
|
|
|
|
testCases := []testCase{
|
|
{
|
|
name: "half null",
|
|
validDataSetup: func(validData []bool) int {
|
|
validCount := 0
|
|
for i := 0; i < numRows; i++ {
|
|
if i%2 == 0 {
|
|
validData[i] = true
|
|
validCount++
|
|
}
|
|
}
|
|
return validCount
|
|
},
|
|
},
|
|
{
|
|
name: "all valid",
|
|
validDataSetup: func(validData []bool) int {
|
|
for i := 0; i < numRows; i++ {
|
|
validData[i] = true
|
|
}
|
|
return numRows
|
|
},
|
|
},
|
|
{
|
|
name: "all null",
|
|
validDataSetup: func(validData []bool) int {
|
|
return 0
|
|
},
|
|
},
|
|
}
|
|
|
|
for _, tc := range testCases {
|
|
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector, WithNullable(true))
|
|
require.NoError(t, err)
|
|
|
|
validData := make([]bool, numRows)
|
|
tc.validDataSetup(validData)
|
|
|
|
data := &SparseFloatVectorFieldData{
|
|
SparseFloatArray: schemapb.SparseFloatArray{
|
|
Dim: 100,
|
|
},
|
|
ValidData: validData,
|
|
}
|
|
for i := 0; i < numRows; i++ {
|
|
if validData[i] {
|
|
sparseVec := make([]byte, 16)
|
|
for j := 0; j < 16; j++ {
|
|
sparseVec[j] = byte((i*10 + j) % 256)
|
|
}
|
|
data.SparseFloatArray.Contents = append(data.SparseFloatArray.Contents, sparseVec)
|
|
}
|
|
}
|
|
|
|
err = w.AddSparseFloatVectorToPayload(data)
|
|
require.NoError(t, err)
|
|
|
|
err = w.FinishPayloadWriter()
|
|
require.NoError(t, err)
|
|
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
require.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_SparseFloatVector, buffer, true)
|
|
require.NoError(t, err)
|
|
|
|
readData, _, readValid, err := r.GetSparseFloatVectorFromPayload()
|
|
require.NoError(t, err)
|
|
require.Equal(t, numRows, len(readValid))
|
|
require.Equal(t, numRows, len(readData.Contents))
|
|
|
|
for i := 0; i < numRows; i++ {
|
|
require.Equal(t, validData[i], readValid[i])
|
|
if validData[i] {
|
|
require.NotNil(t, readData.Contents[i])
|
|
require.Equal(t, 16, len(readData.Contents[i]))
|
|
for j := 0; j < 16; j++ {
|
|
require.Equal(t, byte((i*10+j)%256), readData.Contents[i][j])
|
|
}
|
|
} else {
|
|
require.Nil(t, readData.Contents[i])
|
|
}
|
|
}
|
|
}
|
|
})
|
|
|
|
t.Run("TestAddBool with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Bool, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddBoolToPayload([]bool{false}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt8 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int8, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt8ToPayload([]int8{1}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt16 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int16, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt16ToPayload([]int16{1}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt32 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int32, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt32ToPayload([]int32{1}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddInt64 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Int64, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddInt64ToPayload([]int64{1}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddFloat32 with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Float, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddFloatToPayload([]float32{1.0}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddDouble with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Double, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddDoubleToPayload([]float64{1.0}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddAddString with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT("hello0", nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_String, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT("hello0", []bool{false, false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT("hello0", []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_String)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT("hello0", []bool{true})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddArray with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_Array, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_Array, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
|
|
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, []bool{false, false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_Array)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_Array)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
|
|
Data: &schemapb.ScalarField_IntData{
|
|
IntData: &schemapb.IntArray{
|
|
Data: []int32{1, 2},
|
|
},
|
|
},
|
|
}, []bool{true})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
|
|
t.Run("TestAddJSON with wrong valids", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_JSON, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), nil)
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_JSON, WithNullable(true))
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), []bool{false, false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_JSON)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), []bool{false})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
|
|
w, err = NewPayloadWriter(schemapb.DataType_JSON)
|
|
require.Nil(t, err)
|
|
require.NotNil(t, w)
|
|
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), []bool{true})
|
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
|
})
|
|
}
|
|
|
|
func TestArrowRecordReader(t *testing.T) {
|
|
t.Run("TestArrowRecordReader", func(t *testing.T) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
assert.NoError(t, err)
|
|
defer w.Close()
|
|
|
|
err = w.AddOneStringToPayload("hello0", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello1", true)
|
|
assert.NoError(t, err)
|
|
err = w.AddOneStringToPayload("hello2", true)
|
|
assert.NoError(t, err)
|
|
err = w.FinishPayloadWriter()
|
|
assert.NoError(t, err)
|
|
length, err := w.GetPayloadLengthFromWriter()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 3, length)
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
assert.NoError(t, err)
|
|
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
assert.NoError(t, err)
|
|
length, err = r.GetPayloadLengthFromReader()
|
|
assert.NoError(t, err)
|
|
assert.Equal(t, 3, length)
|
|
|
|
rr, err := r.GetArrowRecordReader()
|
|
assert.NoError(t, err)
|
|
|
|
for rr.Next() {
|
|
rec := rr.Record()
|
|
arr := rec.Column(0).(*array.String)
|
|
defer rec.Release()
|
|
|
|
assert.Equal(t, "hello0", arr.Value(0))
|
|
assert.Equal(t, "hello1", arr.Value(1))
|
|
assert.Equal(t, "hello2", arr.Value(2))
|
|
}
|
|
})
|
|
}
|
|
|
|
func dataGen(size int) ([]byte, error) {
|
|
w, err := NewPayloadWriter(schemapb.DataType_String)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
defer w.Close()
|
|
|
|
letterRunes := []rune("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ")
|
|
|
|
for i := 0; i < size; i++ {
|
|
b := make([]rune, 20)
|
|
for i := range b {
|
|
b[i] = letterRunes[rand.Intn(len(letterRunes))]
|
|
}
|
|
w.AddOneStringToPayload(string(b), true)
|
|
}
|
|
err = w.FinishPayloadWriter()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
buffer, err := w.GetPayloadBufferFromWriter()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return buffer, err
|
|
}
|
|
|
|
func BenchmarkDefaultReader(b *testing.B) {
|
|
size := 10
|
|
buffer, err := dataGen(size)
|
|
assert.NoError(b, err)
|
|
|
|
b.ResetTimer()
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
require.Nil(b, err)
|
|
defer r.ReleasePayloadReader()
|
|
|
|
length, err := r.GetPayloadLengthFromReader()
|
|
assert.NoError(b, err)
|
|
assert.Equal(b, length, size)
|
|
|
|
d, v, err := r.GetStringFromPayload()
|
|
assert.NoError(b, err)
|
|
assert.Nil(b, v)
|
|
for i := 0; i < 100; i++ {
|
|
for _, de := range d {
|
|
assert.Equal(b, 20, len(de))
|
|
}
|
|
}
|
|
}
|
|
|
|
func BenchmarkDataSetReader(b *testing.B) {
|
|
size := 10
|
|
buffer, err := dataGen(size)
|
|
assert.NoError(b, err)
|
|
|
|
b.ResetTimer()
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
require.Nil(b, err)
|
|
defer r.ReleasePayloadReader()
|
|
|
|
length, err := r.GetPayloadLengthFromReader()
|
|
assert.NoError(b, err)
|
|
assert.Equal(b, length, size)
|
|
|
|
ds, err := r.GetByteArrayDataSet()
|
|
assert.NoError(b, err)
|
|
|
|
for i := 0; i < 100; i++ {
|
|
for ds.HasNext() {
|
|
stringArray, err := ds.NextBatch(1024)
|
|
assert.NoError(b, err)
|
|
for _, de := range stringArray {
|
|
assert.Equal(b, 20, len(string(de)))
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
func BenchmarkArrowRecordReader(b *testing.B) {
|
|
size := 10
|
|
buffer, err := dataGen(size)
|
|
assert.NoError(b, err)
|
|
|
|
b.ResetTimer()
|
|
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
|
|
require.Nil(b, err)
|
|
defer r.ReleasePayloadReader()
|
|
|
|
length, err := r.GetPayloadLengthFromReader()
|
|
assert.NoError(b, err)
|
|
assert.Equal(b, length, size)
|
|
|
|
rr, err := r.GetArrowRecordReader()
|
|
assert.NoError(b, err)
|
|
defer rr.Release()
|
|
|
|
for i := 0; i < 100; i++ {
|
|
for rr.Next() {
|
|
rec := rr.Record()
|
|
arr := rec.Column(0).(*array.String)
|
|
defer rec.Release()
|
|
for i := 0; i < arr.Len(); i++ {
|
|
assert.Equal(b, 20, len(arr.Value(i)))
|
|
}
|
|
}
|
|
}
|
|
}
|