milvus/internal/storage/payload_test.go
marcelo-cjl 3b599441fd
feat: Add nullable vector support for proxy and querynode (#46305)
related: #45993 

This commit extends nullable vector support to the proxy layer,
querynode,
and adds comprehensive validation, search reduce, and field data
handling
    for nullable vectors with sparse storage.
    
    Proxy layer changes:
- Update validate_util.go checkAligned() with getExpectedVectorRows()
helper
      to validate nullable vector field alignment using valid data count
- Update checkFloatVectorFieldData/checkSparseFloatVectorFieldData for
      nullable vector validation with proper row count expectations
- Add FieldDataIdxComputer in typeutil/schema.go for logical-to-physical
      index translation during search reduce operations
- Update search_reduce_util.go reduceSearchResultData to use
idxComputers
      for correct field data indexing with nullable vectors
- Update task.go, task_query.go, task_upsert.go for nullable vector
handling
    - Update msg_pack.go with nullable vector field data processing
    
    QueryNode layer changes:
    - Update segments/result.go for nullable vector result handling
- Update segments/search_reduce.go with nullable vector offset
translation
    
    Storage and index changes:
- Update data_codec.go and utils.go for nullable vector serialization
- Update indexcgowrapper/dataset.go and index.go for nullable vector
indexing
    
    Utility changes:
- Add FieldDataIdxComputer struct with Compute() method for efficient
      logical-to-physical index mapping across multiple field data
- Update EstimateEntitySize() and AppendFieldData() with fieldIdxs
parameter
    - Update funcutil.go with nullable vector support functions

<!-- This is an auto-generated comment: release notes by coderabbit.ai
-->
## Summary by CodeRabbit

* **New Features**
* Full support for nullable vector fields (float, binary, float16,
bfloat16, int8, sparse) across ingest, storage, indexing, search and
retrieval; logical↔physical offset mapping preserves row semantics.
  * Client: compaction control and compaction-state APIs.

* **Bug Fixes**
* Improved validation for adding vector fields (nullable + dimension
checks) and corrected search/query behavior for nullable vectors.

* **Chores**
  * Persisted validity maps with indexes and on-disk formats.

* **Tests**
  * Extensive new and updated end-to-end nullable-vector tests.

<sub>✏️ Tip: You can customize this high-level summary in your review
settings.</sub>
<!-- end of auto-generated comment: release notes by coderabbit.ai -->

---------

Signed-off-by: marcelo-cjl <marcelo.chen@zilliz.com>
2025-12-24 10:13:19 +08:00

3097 lines
88 KiB
Go

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package storage
import (
"math"
"math/rand"
"testing"
"github.com/apache/arrow/go/v17/arrow/array"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
"github.com/milvus-io/milvus/pkg/v2/util/merr"
"github.com/milvus-io/milvus/pkg/v2/util/typeutil"
)
func TestPayload_ReaderAndWriter(t *testing.T) {
t.Run("TestBool", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, false, false, false}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]bool{false, false, false, false}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 8, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 8)
bools, valids, err := r.GetBoolFromPayload()
assert.NoError(t, err)
assert.Equal(t, []bool{false, false, false, false, false, false, false, false}, bools)
assert.Nil(t, valids)
ibools, valids, _, err := r.GetDataFromPayload()
bools = ibools.([]bool)
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, []bool{false, false, false, false, false, false, false, false}, bools)
defer r.ReleasePayloadReader()
})
t.Run("TestInt8", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt8ToPayload([]int8{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int8{4, 5, 6}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int8s, valids, err := r.GetInt8FromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, []int8{1, 2, 3, 4, 5, 6}, int8s)
iint8s, valids, _, err := r.GetDataFromPayload()
int8s = iint8s.([]int8)
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, []int8{1, 2, 3, 4, 5, 6}, int8s)
defer r.ReleasePayloadReader()
})
t.Run("TestInt16", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int16)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt16ToPayload([]int16{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int16{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int16s, valids, err := r.GetInt16FromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, []int16{1, 2, 3, 1, 2, 3}, int16s)
iint16s, valids, _, err := r.GetDataFromPayload()
int16s = iint16s.([]int16)
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, []int16{1, 2, 3, 1, 2, 3}, int16s)
defer r.ReleasePayloadReader()
})
t.Run("TestInt32", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int32)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt32ToPayload([]int32{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int32{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int32s, valids, err := r.GetInt32FromPayload()
assert.NoError(t, err)
assert.Equal(t, []int32{1, 2, 3, 1, 2, 3}, int32s)
assert.Nil(t, valids)
iint32s, valids, _, err := r.GetDataFromPayload()
int32s = iint32s.([]int32)
assert.NoError(t, err)
assert.Equal(t, []int32{1, 2, 3, 1, 2, 3}, int32s)
assert.Nil(t, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestInt64", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int64)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt64ToPayload([]int64{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int64{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int64s, valids, err := r.GetInt64FromPayload()
assert.NoError(t, err)
assert.Equal(t, []int64{1, 2, 3, 1, 2, 3}, int64s)
assert.Nil(t, valids)
iint64s, valids, _, err := r.GetDataFromPayload()
int64s = iint64s.([]int64)
assert.NoError(t, err)
assert.Equal(t, []int64{1, 2, 3, 1, 2, 3}, int64s)
assert.Nil(t, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestFloat32", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatToPayload([]float32{1.0, 2.0, 3.0}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]float32{1.0, 2.0, 3.0}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
float32s, valids, err := r.GetFloatFromPayload()
assert.NoError(t, err)
assert.Equal(t, []float32{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float32s)
assert.Nil(t, valids)
ifloat32s, valids, _, err := r.GetDataFromPayload()
float32s = ifloat32s.([]float32)
assert.NoError(t, err)
assert.Equal(t, []float32{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float32s)
assert.Nil(t, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestDouble", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Double)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDoubleToPayload([]float64{1.0, 2.0, 3.0}, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]float64{1.0, 2.0, 3.0}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
float64s, valids, err := r.GetDoubleFromPayload()
assert.NoError(t, err)
assert.Equal(t, []float64{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float64s)
assert.Nil(t, valids)
ifloat64s, valids, _, err := r.GetDataFromPayload()
float64s = ifloat64s.([]float64)
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, []float64{1.0, 2.0, 3.0, 1.0, 2.0, 3.0}, float64s)
defer r.ReleasePayloadReader()
})
t.Run("TestAddString", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneStringToPayload("hello0", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello1", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello2", true)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT("hello3", nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, length, 4)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
str, valids, err := r.GetStringFromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, str[0], "hello0")
assert.Equal(t, str[1], "hello1")
assert.Equal(t, str[2], "hello2")
assert.Equal(t, str[3], "hello3")
istr, valids, _, err := r.GetDataFromPayload()
strArray := istr.([]string)
assert.NoError(t, err)
assert.Equal(t, strArray[0], "hello0")
assert.Equal(t, strArray[1], "hello1")
assert.Equal(t, strArray[2], "hello2")
assert.Equal(t, strArray[3], "hello3")
assert.Nil(t, valids)
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
t.Run("TestAddArray", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Array)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, true)
assert.NoError(t, err)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{3, 4},
},
},
}, true)
assert.NoError(t, err)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{5, 6},
},
},
}, true)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{7, 8},
},
},
}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, length, 4)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Array, buffer, false)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
arrayList, valids, err := r.GetArrayFromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
assert.EqualValues(t, []int32{3, 4}, arrayList[1].GetIntData().GetData())
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
assert.EqualValues(t, []int32{7, 8}, arrayList[3].GetIntData().GetData())
iArrayList, valids, _, err := r.GetDataFromPayload()
arrayList = iArrayList.([]*schemapb.ScalarField)
assert.NoError(t, err)
assert.Nil(t, valids)
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
assert.EqualValues(t, []int32{3, 4}, arrayList[1].GetIntData().GetData())
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
assert.EqualValues(t, []int32{7, 8}, arrayList[3].GetIntData().GetData())
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
t.Run("TestAddJSON", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_JSON)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneJSONToPayload([]byte(`{"1":"1"}`), true)
assert.NoError(t, err)
err = w.AddOneJSONToPayload([]byte(`{"2":"2"}`), true)
assert.NoError(t, err)
err = w.AddOneJSONToPayload([]byte(`{"3":"3"}`), true)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]byte(`{"4":"4"}`), nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, length, 4)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_JSON, buffer, false)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
json, valids, err := r.GetJSONFromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
assert.EqualValues(t, []byte(`{"2":"2"}`), json[1])
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
assert.EqualValues(t, []byte(`{"4":"4"}`), json[3])
iJSON, valids, _, err := r.GetDataFromPayload()
json = iJSON.([][]byte)
assert.NoError(t, err)
assert.Nil(t, valids)
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
assert.EqualValues(t, []byte(`{"2":"2"}`), json[1])
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
assert.EqualValues(t, []byte(`{"4":"4"}`), json[3])
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
t.Run("TestBinaryVector", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
in := make([]byte, 16)
for i := 0; i < 16; i++ {
in[i] = 1
}
in2 := make([]byte, 8)
for i := 0; i < 8; i++ {
in2[i] = 1
}
err = w.AddBinaryVectorToPayload(in, 8, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT(in2, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 24, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 24)
binVecs, dim, _, _, err := r.GetBinaryVectorFromPayload()
assert.NoError(t, err)
assert.Equal(t, 8, dim)
assert.Equal(t, 24, len(binVecs))
ibinVecs, valids, dim, err := r.GetDataFromPayload()
assert.Nil(t, valids)
assert.NoError(t, err)
binVecs = ibinVecs.([]byte)
assert.Equal(t, 8, dim)
assert.Equal(t, 24, len(binVecs))
defer r.ReleasePayloadReader()
})
t.Run("TestFloatVector", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(1))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatVectorToPayload([]float32{1.0, 2.0}, 1, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]float32{3.0, 4.0}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 4, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
floatVecs, dim, _, _, err := r.GetFloatVectorFromPayload()
assert.NoError(t, err)
assert.Equal(t, 1, dim)
assert.Equal(t, 4, len(floatVecs))
assert.Equal(t, []float32{1.0, 2.0, 3.0, 4.0}, floatVecs)
ifloatVecs, valids, dim, err := r.GetDataFromPayload()
assert.Nil(t, valids)
assert.NoError(t, err)
floatVecs = ifloatVecs.([]float32)
assert.Equal(t, 1, dim)
assert.Equal(t, 4, len(floatVecs))
assert.Equal(t, []float32{1.0, 2.0, 3.0, 4.0}, floatVecs)
defer r.ReleasePayloadReader()
})
t.Run("TestFloat16Vector", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float16Vector, WithDim(1))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloat16VectorToPayload([]byte{1, 2}, 1, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]byte{3, 4}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 2, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Float16Vector, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 2)
float16Vecs, dim, _, _, err := r.GetFloat16VectorFromPayload()
assert.NoError(t, err)
assert.Equal(t, 1, dim)
assert.Equal(t, 4, len(float16Vecs))
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, float16Vecs)
ifloat16Vecs, valids, dim, err := r.GetDataFromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
float16Vecs = ifloat16Vecs.([]byte)
assert.Equal(t, 1, dim)
assert.Equal(t, 4, len(float16Vecs))
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, float16Vecs)
defer r.ReleasePayloadReader()
})
t.Run("TestBFloat16Vector", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_BFloat16Vector, WithDim(1))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBFloat16VectorToPayload([]byte{1, 2}, 1, nil)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]byte{3, 4}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 2, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_BFloat16Vector, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 2)
bfloat16Vecs, dim, _, _, err := r.GetBFloat16VectorFromPayload()
assert.NoError(t, err)
assert.Equal(t, 1, dim)
assert.Equal(t, 4, len(bfloat16Vecs))
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, bfloat16Vecs)
ibfloat16Vecs, valids, dim, err := r.GetDataFromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
bfloat16Vecs = ibfloat16Vecs.([]byte)
assert.Equal(t, 1, dim)
assert.Equal(t, 4, len(bfloat16Vecs))
assert.ElementsMatch(t, []byte{1, 2, 3, 4}, bfloat16Vecs)
defer r.ReleasePayloadReader()
})
t.Run("TestSparseFloatVector", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
SparseFloatArray: schemapb.SparseFloatArray{
Dim: 600,
Contents: [][]byte{
typeutil.CreateSparseFloatRow([]uint32{0, 1, 2}, []float32{1.1, 1.2, 1.3}),
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, 3.2, 3.3}),
},
},
})
assert.NoError(t, err)
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
SparseFloatArray: schemapb.SparseFloatArray{
Dim: 600,
Contents: [][]byte{
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
typeutil.CreateSparseFloatRow([]uint32{60, 80, 230}, []float32{2.1, 2.2, 2.3}),
typeutil.CreateSparseFloatRow([]uint32{170, 300, 579}, []float32{3.1, 3.2, 3.3}),
},
},
})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_SparseFloatVector, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
floatVecs, dim, _, err := r.GetSparseFloatVectorFromPayload()
assert.NoError(t, err)
assert.Equal(t, 600, dim)
assert.Equal(t, 6, len(floatVecs.Contents))
assert.EqualExportedValues(t, &schemapb.SparseFloatArray{
// merged dim should be max of all dims
Dim: 600,
Contents: [][]byte{
typeutil.CreateSparseFloatRow([]uint32{0, 1, 2}, []float32{1.1, 1.2, 1.3}),
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, 3.2, 3.3}),
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
typeutil.CreateSparseFloatRow([]uint32{60, 80, 230}, []float32{2.1, 2.2, 2.3}),
typeutil.CreateSparseFloatRow([]uint32{170, 300, 579}, []float32{3.1, 3.2, 3.3}),
},
}, &floatVecs.SparseFloatArray)
ifloatVecs, valids, dim, err := r.GetDataFromPayload()
assert.NoError(t, err)
assert.Nil(t, valids)
assert.Equal(t, floatVecs, ifloatVecs.(*SparseFloatVectorFieldData))
assert.Equal(t, 600, dim)
defer r.ReleasePayloadReader()
})
testSparseOneBatch := func(t *testing.T, rows [][]byte, actualDim int) {
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
SparseFloatArray: schemapb.SparseFloatArray{
Dim: int64(actualDim),
Contents: rows,
},
})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 3, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_SparseFloatVector, buffer, false)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 3)
floatVecs, dim, _, err := r.GetSparseFloatVectorFromPayload()
assert.NoError(t, err)
assert.Equal(t, actualDim, dim)
assert.Equal(t, 3, len(floatVecs.Contents))
assert.EqualExportedValues(t, &schemapb.SparseFloatArray{
Dim: int64(dim),
Contents: rows,
}, &floatVecs.SparseFloatArray)
ifloatVecs, valids, dim, err := r.GetDataFromPayload()
assert.Nil(t, valids)
assert.NoError(t, err)
assert.Equal(t, floatVecs, ifloatVecs.(*SparseFloatVectorFieldData))
assert.Equal(t, actualDim, dim)
defer r.ReleasePayloadReader()
}
t.Run("TestSparseFloatVector_emptyRow", func(t *testing.T) {
testSparseOneBatch(t, [][]byte{
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, 3.2, 3.3}),
}, 600)
testSparseOneBatch(t, [][]byte{
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
}, 0)
})
t.Run("TestSparseFloatVector_largeRow", func(t *testing.T) {
nnz := 100000
// generate an int slice with nnz random sorted elements
indices := make([]uint32, nnz)
values := make([]float32, nnz)
for i := 0; i < nnz; i++ {
indices[i] = uint32(i * 6)
values[i] = float32(i)
}
dim := int(indices[nnz-1]) + 1
testSparseOneBatch(t, [][]byte{
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{2.1, 2.2, 2.3}),
typeutil.CreateSparseFloatRow(indices, values),
}, dim)
})
t.Run("TestSparseFloatVector_negativeValues", func(t *testing.T) {
testSparseOneBatch(t, [][]byte{
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{-2.1, 2.2, -2.3}),
typeutil.CreateSparseFloatRow([]uint32{100, 200, 599}, []float32{3.1, -3.2, 3.3}),
}, 600)
})
// even though SPARSE_INVERTED_INDEX and SPARSE_WAND index do not support
// arbitrarily large dimensions, HNSW does, so we still need to test it.
// Dimension range we support is 0 to positive int32 max - 1(to leave room
// for dim).
t.Run("TestSparseFloatVector_largeIndex", func(t *testing.T) {
int32Max := uint32(math.MaxInt32)
testSparseOneBatch(t, [][]byte{
typeutil.CreateSparseFloatRow([]uint32{}, []float32{}),
typeutil.CreateSparseFloatRow([]uint32{10, 20, 30}, []float32{-2.1, 2.2, -2.3}),
typeutil.CreateSparseFloatRow([]uint32{100, int32Max / 2, int32Max - 1}, []float32{3.1, -3.2, 3.3}),
}, int(int32Max))
})
t.Run("TestAddBoolAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddBoolToPayload([]bool{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddBoolToPayload([]bool{false}, nil)
assert.Error(t, err)
})
t.Run("TestAddInt8AfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddInt8ToPayload([]int8{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddInt8ToPayload([]int8{0}, nil)
assert.Error(t, err)
})
t.Run("TestAddInt16AfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int16)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddInt16ToPayload([]int16{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddInt16ToPayload([]int16{0}, nil)
assert.Error(t, err)
})
t.Run("TestAddInt32AfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int32)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddInt32ToPayload([]int32{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddInt32ToPayload([]int32{0}, nil)
assert.Error(t, err)
})
t.Run("TestAddInt64AfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int64)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddInt64ToPayload([]int64{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddInt64ToPayload([]int64{0}, nil)
assert.Error(t, err)
})
t.Run("TestAddFloatAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddFloatToPayload([]float32{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddFloatToPayload([]float32{0.0}, nil)
assert.Error(t, err)
})
t.Run("TestAddDoubleAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Double)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddDoubleToPayload([]float64{}, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddDoubleToPayload([]float64{0.0}, nil)
assert.Error(t, err)
})
t.Run("TestAddOneStringAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.AddOneStringToPayload("", true)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddOneStringToPayload("c", true)
assert.Error(t, err)
})
t.Run("TestAddBinVectorAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
_, err = w.GetPayloadBufferFromWriter()
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddBinaryVectorToPayload([]byte{}, 8, nil)
assert.Error(t, err)
err = w.AddBinaryVectorToPayload([]byte{1}, 0, nil)
assert.Error(t, err)
err = w.AddBinaryVectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.Error(t, err)
err = w.AddBinaryVectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.Error(t, err)
})
t.Run("TestAddFloatVectorAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddFloatVectorToPayload([]float32{}, 8, nil)
assert.Error(t, err)
err = w.AddFloatVectorToPayload([]float32{1.0}, 0, nil)
assert.Error(t, err)
err = w.AddFloatVectorToPayload([]float32{1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0}, 8, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.Error(t, err)
err = w.AddFloatVectorToPayload([]float32{1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0}, 8, nil)
assert.Error(t, err)
})
t.Run("TestAddFloat16VectorAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float16Vector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
err = w.AddFloat16VectorToPayload([]byte{}, 8, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddFloat16VectorToPayload([]byte{}, 8, nil)
assert.Error(t, err)
err = w.AddFloat16VectorToPayload([]byte{1}, 0, nil)
assert.Error(t, err)
err = w.AddFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.Error(t, err)
err = w.AddFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.Error(t, err)
})
t.Run("TestAddBFloat16VectorAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_BFloat16Vector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
err = w.AddBFloat16VectorToPayload([]byte{}, 8, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddBFloat16VectorToPayload([]byte{}, 8, nil)
assert.Error(t, err)
err = w.AddBFloat16VectorToPayload([]byte{1}, 0, nil)
assert.Error(t, err)
err = w.AddBFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.Error(t, err)
err = w.AddBFloat16VectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.Error(t, err)
})
t.Run("TestAddSparseFloatVectorAfterFinish", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector)
require.Nil(t, err)
require.NotNil(t, w)
defer w.Close()
err = w.FinishPayloadWriter()
assert.NoError(t, err)
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
SparseFloatArray: schemapb.SparseFloatArray{
Dim: 53,
Contents: [][]byte{
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
},
},
})
assert.Error(t, err)
err = w.AddSparseFloatVectorToPayload(&SparseFloatVectorFieldData{
SparseFloatArray: schemapb.SparseFloatArray{
Dim: 600,
Contents: [][]byte{
typeutil.CreateSparseFloatRow([]uint32{30, 41, 52}, []float32{1.1, 1.2, 1.3}),
},
},
})
assert.Error(t, err)
err = w.FinishPayloadWriter()
assert.Error(t, err)
})
t.Run("TestNewReadError", func(t *testing.T) {
buffer := []byte{0}
r, err := NewPayloadReader(999, buffer, false)
assert.Error(t, err)
assert.Nil(t, r)
})
t.Run("TestGetDataError", func(t *testing.T) {
r := PayloadReader{}
r.colType = 999
_, _, _, err := r.GetDataFromPayload()
assert.Error(t, err)
})
t.Run("TestGetBoolError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt8ToPayload([]int8{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetBoolFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetBoolFromPayload()
assert.Error(t, err)
})
t.Run("TestGetBoolError2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{true, false, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetBoolFromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt8Error", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetInt8FromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetInt8FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt8Error2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt8ToPayload([]int8{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetInt8FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt16Error", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetInt16FromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetInt16FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt16Error2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int16)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt16ToPayload([]int16{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetInt16FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt32Error", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetInt32FromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetInt32FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt32Error2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int32)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt32ToPayload([]int32{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetInt32FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt64Error", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetInt64FromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetInt64FromPayload()
assert.Error(t, err)
})
t.Run("TestGetInt64Error2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int64)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt64ToPayload([]int64{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetInt64FromPayload()
assert.Error(t, err)
})
t.Run("TestGetFloatError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetFloatFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetFloatFromPayload()
assert.Error(t, err)
})
t.Run("TestGetFloatError2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatToPayload([]float32{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetFloatFromPayload()
assert.Error(t, err)
})
t.Run("TestGetDoubleError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetDoubleFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetDoubleFromPayload()
assert.Error(t, err)
})
t.Run("TestGetDoubleError2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Double)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDoubleToPayload([]float64{1, 2, 3}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetDoubleFromPayload()
assert.Error(t, err)
})
t.Run("TestGetStringError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetStringFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetStringFromPayload()
assert.Error(t, err)
})
t.Run("TestGetStringError2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneStringToPayload("hello0", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello1", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello2", true)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, err = r.GetStringFromPayload()
assert.Error(t, err)
})
t.Run("TestGetArrayError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Array, buffer, false)
assert.NoError(t, err)
_, _, err = r.GetArrayFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, err = r.GetArrayFromPayload()
assert.Error(t, err)
})
t.Run("TestGetBinaryVectorError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, false)
assert.NoError(t, err)
_, _, _, _, err = r.GetBinaryVectorFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, _, _, err = r.GetBinaryVectorFromPayload()
assert.Error(t, err)
})
t.Run("TestGetBinaryVectorError2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBinaryVectorToPayload([]byte{1, 0, 0, 0, 0, 0, 0, 0}, 8, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, _, _, err = r.GetBinaryVectorFromPayload()
assert.Error(t, err)
})
t.Run("TestGetFloatVectorError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false, true, true}, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
assert.NoError(t, err)
_, _, _, _, err = r.GetFloatVectorFromPayload()
assert.Error(t, err)
r.colType = 999
_, _, _, _, err = r.GetFloatVectorFromPayload()
assert.Error(t, err)
})
t.Run("TestGetFloatVectorError2", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(8))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatVectorToPayload([]float32{1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0}, 8, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
assert.NoError(t, err)
r.numRows = 99
_, _, _, _, err = r.GetFloatVectorFromPayload()
assert.Error(t, err)
})
t.Run("TestByteArrayDatasetError", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneStringToPayload("hello0", true)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, false)
assert.NoError(t, err)
r.colType = 99
_, err = r.GetByteArrayDataSet()
assert.Error(t, err)
r.colType = schemapb.DataType_String
dataset, err := r.GetByteArrayDataSet()
assert.NoError(t, err)
dataset.columnIdx = math.MaxInt
_, err = dataset.NextBatch(100)
assert.Error(t, err)
dataset.groupID = math.MaxInt
assert.Error(t, err)
})
t.Run("TestWriteLargeSizeData", func(t *testing.T) {
t.Skip("Large data skip for online ut")
size := 1 << 29 // 512M
var vec []float32
for i := 0; i < size/4; i++ {
vec = append(vec, 1)
}
w, err := NewPayloadWriter(schemapb.DataType_FloatVector)
assert.NoError(t, err)
err = w.AddFloatVectorToPayload(vec, 128, nil)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
_, err = w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
w.ReleasePayloadWriter()
})
t.Run("TestAddBool with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt8 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt8ToPayload([]int8{1}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt16 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int16)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt16ToPayload([]int16{1}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt32 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int32)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt32ToPayload([]int32{1}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt64 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int64)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt64ToPayload([]int64{1}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddFloat32 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatToPayload([]float32{1.0}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddDouble with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Double)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDoubleToPayload([]float64{1.0}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddAddString with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneStringToPayload("hello0", false)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddArray with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Array)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, false)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddJSON with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_JSON)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneJSONToPayload([]byte(`{"1":"1"}`), false)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestVectorArray", func(t *testing.T) {
dim := 4
w, err := NewPayloadWriter(
schemapb.DataType_ArrayOfVector,
WithDim(dim),
WithElementType(schemapb.DataType_FloatVector),
)
require.NoError(t, err)
require.NotNil(t, w)
// Create VectorArrayFieldData with 3 rows
vectorArrayData := &VectorArrayFieldData{
Dim: int64(dim),
Data: []*schemapb.VectorField{
{
Dim: int64(dim),
Data: &schemapb.VectorField_FloatVector{
FloatVector: &schemapb.FloatArray{
Data: []float32{1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0},
},
},
},
{
Dim: int64(dim),
Data: &schemapb.VectorField_FloatVector{
FloatVector: &schemapb.FloatArray{
Data: []float32{11.0, 22.0, 33.0, 44.0},
},
},
},
{
Dim: int64(dim),
Data: &schemapb.VectorField_FloatVector{
FloatVector: &schemapb.FloatArray{
Data: []float32{111.0, 222.0, 333.0, 444.0, 555.0, 666.0, 777.0, 888.0, 999.0, 1000.0, 1111.0, 1212.0, 1313.0, 1414.0, 1515.0, 1616.0, 1717.0, 1818.0, 1919.0, 2020.0},
},
},
},
},
ElementType: schemapb.DataType_FloatVector,
}
err = w.AddVectorArrayFieldDataToPayload(vectorArrayData)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 3, length)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_ArrayOfVector, buffer, false)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, 3, length)
vectorArrays, err := r.GetVectorArrayFromPayload()
assert.NoError(t, err)
assert.EqualValues(t, []float32{1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0}, vectorArrays[0].GetFloatVector().GetData())
assert.EqualValues(t, []float32{11.0, 22.0, 33.0, 44.0}, vectorArrays[1].GetFloatVector().GetData())
assert.EqualValues(t, []float32{111.0, 222.0, 333.0, 444.0, 555.0, 666.0, 777.0, 888.0, 999.0, 1000.0, 1111.0, 1212.0, 1313.0, 1414.0, 1515.0, 1616.0, 1717.0, 1818.0, 1919.0, 2020.0}, vectorArrays[2].GetFloatVector().GetData())
for _, v := range vectorArrays {
assert.Equal(t, int64(dim), v.GetDim())
}
iArrayList, _, _, err := r.GetDataFromPayload()
vectorArrays = iArrayList.([]*schemapb.VectorField)
assert.NoError(t, err)
assert.EqualValues(t, []float32{1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0}, vectorArrays[0].GetFloatVector().GetData())
assert.EqualValues(t, []float32{11.0, 22.0, 33.0, 44.0}, vectorArrays[1].GetFloatVector().GetData())
assert.EqualValues(t, []float32{111.0, 222.0, 333.0, 444.0, 555.0, 666.0, 777.0, 888.0, 999.0, 1000.0, 1111.0, 1212.0, 1313.0, 1414.0, 1515.0, 1616.0, 1717.0, 1818.0, 1919.0, 2020.0}, vectorArrays[2].GetFloatVector().GetData())
for _, v := range vectorArrays {
assert.Equal(t, int64(dim), v.GetDim())
}
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
}
func TestPayload_NullableReaderAndWriter(t *testing.T) {
t.Run("TestBool", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{true, false, false, false}, []bool{true, false, true, false})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]bool{true, false, false, false}, []bool{true, false, true, false})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 8, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Bool, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 8)
bools, valids, err := r.GetBoolFromPayload()
assert.NoError(t, err)
assert.Equal(t, []bool{true, false, false, false, true, false, false, false}, bools)
assert.Equal(t, []bool{true, false, true, false, true, false, true, false}, valids)
ibools, valids, _, err := r.GetDataFromPayload()
bools = ibools.([]bool)
assert.NoError(t, err)
assert.Equal(t, []bool{true, false, false, false, true, false, false, false}, bools)
assert.Equal(t, []bool{true, false, true, false, true, false, true, false}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestInt8", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt8ToPayload([]int8{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int8{4, 5, 6}, []bool{true, false, true})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int8, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int8s, valids, err := r.GetInt8FromPayload()
assert.NoError(t, err)
assert.Equal(t, []int8{1, 0, 3, 4, 0, 6}, int8s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
iint8s, valids, _, err := r.GetDataFromPayload()
int8s = iint8s.([]int8)
assert.NoError(t, err)
assert.Equal(t, []int8{1, 0, 3, 4, 0, 6}, int8s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestInt16", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int16, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt16ToPayload([]int16{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int16{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int16, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int16s, valids, err := r.GetInt16FromPayload()
assert.NoError(t, err)
assert.Equal(t, []int16{1, 0, 3, 1, 0, 3}, int16s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
iint16s, valids, _, err := r.GetDataFromPayload()
int16s = iint16s.([]int16)
assert.NoError(t, err)
assert.Equal(t, []int16{1, 0, 3, 1, 0, 3}, int16s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestInt32", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int32, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt32ToPayload([]int32{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int32{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int32, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int32s, valids, err := r.GetInt32FromPayload()
assert.NoError(t, err)
assert.Equal(t, []int32{1, 0, 3, 1, 0, 3}, int32s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
iint32s, valids, _, err := r.GetDataFromPayload()
int32s = iint32s.([]int32)
assert.NoError(t, err)
assert.Equal(t, []int32{1, 0, 3, 1, 0, 3}, int32s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestInt64", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int64, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt64ToPayload([]int64{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]int64{1, 2, 3}, []bool{true, false, true})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int64, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
int64s, valids, err := r.GetInt64FromPayload()
assert.NoError(t, err)
assert.Equal(t, []int64{1, 0, 3, 1, 0, 3}, int64s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
iint64s, valids, _, err := r.GetDataFromPayload()
int64s = iint64s.([]int64)
assert.NoError(t, err)
assert.Equal(t, []int64{1, 0, 3, 1, 0, 3}, int64s)
assert.Equal(t, []bool{true, false, true, true, false, true}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestFloat32", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatToPayload([]float32{1.0, 2.0, 3.0}, []bool{true, false, true})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]float32{1.0, 2.0, 3.0}, []bool{false, true, false})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Float, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
float32s, valids, err := r.GetFloatFromPayload()
assert.NoError(t, err)
assert.Equal(t, []float32{1.0, 0, 3.0, 0, 2.0, 0}, float32s)
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
ifloat32s, valids, _, err := r.GetDataFromPayload()
float32s = ifloat32s.([]float32)
assert.NoError(t, err)
assert.Equal(t, []float32{1.0, 0, 3.0, 0, 2.0, 0}, float32s)
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestDouble", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Double, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDoubleToPayload([]float64{1.0, 2.0, 3.0}, []bool{true, false, true})
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]float64{1.0, 2.0, 3.0}, []bool{false, true, false})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 6, length)
defer w.ReleasePayloadWriter()
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Double, buffer, true)
require.Nil(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 6)
float64s, valids, err := r.GetDoubleFromPayload()
assert.NoError(t, err)
assert.Equal(t, []float64{1.0, 0, 3.0, 0, 2.0, 0}, float64s)
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
ifloat64s, valids, _, err := r.GetDataFromPayload()
float64s = ifloat64s.([]float64)
assert.NoError(t, err)
assert.Equal(t, []float64{1.0, 0, 3.0, 0, 2.0, 0}, float64s)
assert.Equal(t, []bool{true, false, true, false, true, false}, valids)
defer r.ReleasePayloadReader()
})
t.Run("TestAddString", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneStringToPayload("hello0", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello1", false)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello2", true)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT("hello3", []bool{false})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, length, 4)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_String, buffer, true)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
str, valids, err := r.GetStringFromPayload()
assert.NoError(t, err)
assert.Equal(t, str[0], "hello0")
assert.Equal(t, str[1], "")
assert.Equal(t, str[2], "hello2")
assert.Equal(t, str[3], "")
assert.Equal(t, []bool{true, false, true, false}, valids)
istr, valids, _, err := r.GetDataFromPayload()
strArray := istr.([]string)
assert.NoError(t, err)
assert.Equal(t, strArray[0], "hello0")
assert.Equal(t, strArray[1], "")
assert.Equal(t, strArray[2], "hello2")
assert.Equal(t, strArray[3], "")
assert.Equal(t, []bool{true, false, true, false}, valids)
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
t.Run("TestAddArray", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Array, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, true)
assert.NoError(t, err)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{3, 4},
},
},
}, false)
assert.NoError(t, err)
err = w.AddOneArrayToPayload(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{5, 6},
},
},
}, true)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{7, 8},
},
},
}, []bool{false})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, length, 4)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Array, buffer, true)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
arrayList, valids, err := r.GetArrayFromPayload()
assert.NoError(t, err)
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
assert.EqualValues(t, []int32(nil), arrayList[1].GetIntData().GetData())
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
assert.EqualValues(t, []int32(nil), arrayList[3].GetIntData().GetData())
assert.Equal(t, []bool{true, false, true, false}, valids)
iArrayList, valids, _, err := r.GetDataFromPayload()
arrayList = iArrayList.([]*schemapb.ScalarField)
assert.NoError(t, err)
assert.EqualValues(t, []int32{1, 2}, arrayList[0].GetIntData().GetData())
assert.EqualValues(t, []int32(nil), arrayList[1].GetIntData().GetData())
assert.EqualValues(t, []int32{5, 6}, arrayList[2].GetIntData().GetData())
assert.EqualValues(t, []int32(nil), arrayList[3].GetIntData().GetData())
assert.Equal(t, []bool{true, false, true, false}, valids)
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
t.Run("TestAddJSON", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_JSON, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddOneJSONToPayload([]byte(`{"1":"1"}`), true)
assert.NoError(t, err)
err = w.AddOneJSONToPayload([]byte(`{"2":"2"}`), false)
assert.NoError(t, err)
err = w.AddOneJSONToPayload([]byte(`{"3":"3"}`), true)
assert.NoError(t, err)
err = w.AddDataToPayloadForUT([]byte(`{"4":"4"}`), []bool{false})
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, length, 4)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_JSON, buffer, true)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, length, 4)
json, valids, err := r.GetJSONFromPayload()
assert.NoError(t, err)
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
assert.EqualValues(t, []byte(``), json[1])
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
assert.EqualValues(t, []byte(``), json[3])
assert.Equal(t, []bool{true, false, true, false}, valids)
iJSON, valids, _, err := r.GetDataFromPayload()
json = iJSON.([][]byte)
assert.NoError(t, err)
assert.EqualValues(t, []byte(`{"1":"1"}`), json[0])
assert.EqualValues(t, []byte(``), json[1])
assert.EqualValues(t, []byte(`{"3":"3"}`), json[2])
assert.EqualValues(t, []byte(``), json[3])
assert.Equal(t, []bool{true, false, true, false}, valids)
r.ReleasePayloadReader()
w.ReleasePayloadWriter()
})
t.Run("TestFloatVector", func(t *testing.T) {
dim := 128
numRows := 100
type testCase struct {
name string
validDataSetup func([]bool) int
}
testCases := []testCase{
{
name: "half null",
validDataSetup: func(validData []bool) int {
validCount := 0
for i := 0; i < numRows; i++ {
if i%2 == 0 {
validData[i] = true
validCount++
}
}
return validCount
},
},
{
name: "all valid",
validDataSetup: func(validData []bool) int {
for i := 0; i < numRows; i++ {
validData[i] = true
}
return numRows
},
},
{
name: "all null",
validDataSetup: func(validData []bool) int {
return 0
},
},
}
for _, tc := range testCases {
w, err := NewPayloadWriter(schemapb.DataType_FloatVector, WithDim(dim), WithNullable(true))
require.NoError(t, err)
validData := make([]bool, numRows)
validCount := tc.validDataSetup(validData)
data := make([]float32, validCount*dim)
dataIdx := 0
for i := 0; i < numRows; i++ {
if validData[i] {
for j := 0; j < dim; j++ {
data[dataIdx*dim+j] = float32(i*100 + j)
}
dataIdx++
}
}
err = w.AddFloatVectorToPayload(data, dim, validData)
require.NoError(t, err)
err = w.FinishPayloadWriter()
require.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
require.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_FloatVector, buffer, true)
require.NoError(t, err)
readData, readDim, readValid, readNumRows, err := r.GetFloatVectorFromPayload()
require.NoError(t, err)
require.Equal(t, dim, readDim)
require.Equal(t, numRows, readNumRows)
require.Equal(t, numRows, len(readValid))
dataIdx = 0
for i := 0; i < numRows; i++ {
require.Equal(t, validData[i], readValid[i])
if validData[i] {
pos := dataIdx
for j := 0; j < dim; j++ {
require.Equal(t, data[dataIdx*dim+j], readData[pos*dim+j])
}
dataIdx++
}
}
}
})
t.Run("TestBinaryVector", func(t *testing.T) {
dim := 128
numRows := 100
type testCase struct {
name string
validDataSetup func([]bool) int
}
testCases := []testCase{
{
name: "partial null",
validDataSetup: func(validData []bool) int {
validCount := 0
for i := 0; i < numRows; i++ {
if i%3 == 0 {
validData[i] = true
validCount++
}
}
return validCount
},
},
{
name: "all valid",
validDataSetup: func(validData []bool) int {
for i := 0; i < numRows; i++ {
validData[i] = true
}
return numRows
},
},
{
name: "all null",
validDataSetup: func(validData []bool) int {
return 0
},
},
}
for _, tc := range testCases {
w, err := NewPayloadWriter(schemapb.DataType_BinaryVector, WithDim(dim), WithNullable(true))
require.NoError(t, err)
validData := make([]bool, numRows)
validCount := tc.validDataSetup(validData)
data := make([]byte, validCount*dim/8)
dataIdx := 0
for i := 0; i < numRows; i++ {
if validData[i] {
for j := 0; j < dim/8; j++ {
data[dataIdx*dim/8+j] = byte(i + j)
}
dataIdx++
}
}
err = w.AddBinaryVectorToPayload(data, dim, validData)
require.NoError(t, err)
err = w.FinishPayloadWriter()
require.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
require.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_BinaryVector, buffer, true)
require.NoError(t, err)
readData, readDim, readValid, readNumRows, err := r.GetBinaryVectorFromPayload()
require.NoError(t, err)
require.Equal(t, dim, readDim)
require.Equal(t, numRows, readNumRows)
require.Equal(t, numRows, len(readValid))
dataIdx = 0
for i := 0; i < numRows; i++ {
require.Equal(t, validData[i], readValid[i])
if validData[i] {
pos := dataIdx
for j := 0; j < dim/8; j++ {
require.Equal(t, data[dataIdx*dim/8+j], readData[pos*dim/8+j])
}
dataIdx++
}
}
}
})
t.Run("TestFloat16Vector", func(t *testing.T) {
dim := 128
numRows := 100
type testCase struct {
name string
validDataSetup func([]bool) int
}
testCases := []testCase{
{
name: "partial null",
validDataSetup: func(validData []bool) int {
validCount := 0
for i := 0; i < numRows; i++ {
if i%2 == 1 {
validData[i] = true
validCount++
}
}
return validCount
},
},
{
name: "all valid",
validDataSetup: func(validData []bool) int {
for i := 0; i < numRows; i++ {
validData[i] = true
}
return numRows
},
},
{
name: "all null",
validDataSetup: func(validData []bool) int {
return 0
},
},
}
for _, tc := range testCases {
w, err := NewPayloadWriter(schemapb.DataType_Float16Vector, WithDim(dim), WithNullable(true))
require.NoError(t, err)
validData := make([]bool, numRows)
validCount := tc.validDataSetup(validData)
data := make([]byte, validCount*dim*2)
dataIdx := 0
for i := 0; i < numRows; i++ {
if validData[i] {
for j := 0; j < dim*2; j++ {
data[dataIdx*dim*2+j] = byte((i*10 + j) % 256)
}
dataIdx++
}
}
err = w.AddFloat16VectorToPayload(data, dim, validData)
require.NoError(t, err)
err = w.FinishPayloadWriter()
require.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
require.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Float16Vector, buffer, true)
require.NoError(t, err)
readData, readDim, readValid, readNumRows, err := r.GetFloat16VectorFromPayload()
require.NoError(t, err)
require.Equal(t, dim, readDim)
require.Equal(t, numRows, readNumRows)
require.Equal(t, numRows, len(readValid))
dataIdx = 0
for i := 0; i < numRows; i++ {
require.Equal(t, validData[i], readValid[i])
if validData[i] {
pos := dataIdx
for j := 0; j < dim*2; j++ {
require.Equal(t, data[dataIdx*dim*2+j], readData[pos*dim*2+j])
}
dataIdx++
}
}
}
})
t.Run("TestBFloat16Vector", func(t *testing.T) {
dim := 128
numRows := 100
type testCase struct {
name string
validDataSetup func([]bool) int
}
testCases := []testCase{
{
name: "partial null",
validDataSetup: func(validData []bool) int {
validCount := 0
for i := 0; i < numRows; i++ {
if (i+1)%3 != 0 {
validData[i] = true
validCount++
}
}
return validCount
},
},
{
name: "all valid",
validDataSetup: func(validData []bool) int {
for i := 0; i < numRows; i++ {
validData[i] = true
}
return numRows
},
},
{
name: "all null",
validDataSetup: func(validData []bool) int {
return 0
},
},
}
for _, tc := range testCases {
w, err := NewPayloadWriter(schemapb.DataType_BFloat16Vector, WithDim(dim), WithNullable(true))
require.NoError(t, err)
validData := make([]bool, numRows)
validCount := tc.validDataSetup(validData)
data := make([]byte, validCount*dim*2)
dataIdx := 0
for i := 0; i < numRows; i++ {
if validData[i] {
for j := 0; j < dim*2; j++ {
data[dataIdx*dim*2+j] = byte((i*20 + j) % 256)
}
dataIdx++
}
}
err = w.AddBFloat16VectorToPayload(data, dim, validData)
require.NoError(t, err)
err = w.FinishPayloadWriter()
require.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
require.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_BFloat16Vector, buffer, true)
require.NoError(t, err)
readData, readDim, readValid, readNumRows, err := r.GetBFloat16VectorFromPayload()
require.NoError(t, err)
require.Equal(t, dim, readDim)
require.Equal(t, numRows, readNumRows)
require.Equal(t, numRows, len(readValid))
dataIdx = 0
for i := 0; i < numRows; i++ {
require.Equal(t, validData[i], readValid[i])
if validData[i] {
pos := dataIdx
for j := 0; j < dim*2; j++ {
require.Equal(t, data[dataIdx*dim*2+j], readData[pos*dim*2+j])
}
dataIdx++
}
}
}
})
t.Run("TestInt8Vector", func(t *testing.T) {
dim := 128
numRows := 100
type testCase struct {
name string
validDataSetup func([]bool) int
}
testCases := []testCase{
{
name: "partial null",
validDataSetup: func(validData []bool) int {
validCount := 0
for i := 0; i < numRows; i++ {
if i < numRows/2 {
validData[i] = true
validCount++
}
}
return validCount
},
},
{
name: "all valid",
validDataSetup: func(validData []bool) int {
for i := 0; i < numRows; i++ {
validData[i] = true
}
return numRows
},
},
{
name: "all null",
validDataSetup: func(validData []bool) int {
return 0
},
},
}
for _, tc := range testCases {
w, err := NewPayloadWriter(schemapb.DataType_Int8Vector, WithDim(dim), WithNullable(true))
require.NoError(t, err)
validData := make([]bool, numRows)
validCount := tc.validDataSetup(validData)
data := make([]int8, validCount*dim)
dataIdx := 0
for i := 0; i < numRows; i++ {
if validData[i] {
for j := 0; j < dim; j++ {
data[dataIdx*dim+j] = int8((i*10 + j) % 128)
}
dataIdx++
}
}
err = w.AddInt8VectorToPayload(data, dim, validData)
require.NoError(t, err)
err = w.FinishPayloadWriter()
require.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
require.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_Int8Vector, buffer, true)
require.NoError(t, err)
readData, readDim, readValid, readNumRows, err := r.GetInt8VectorFromPayload()
require.NoError(t, err)
require.Equal(t, dim, readDim)
require.Equal(t, numRows, readNumRows)
require.Equal(t, numRows, len(readValid))
dataIdx = 0
for i := 0; i < numRows; i++ {
require.Equal(t, validData[i], readValid[i])
if validData[i] {
pos := dataIdx
for j := 0; j < dim; j++ {
require.Equal(t, data[dataIdx*dim+j], readData[pos*dim+j])
}
dataIdx++
}
}
}
})
t.Run("TestSparseFloatVector", func(t *testing.T) {
numRows := 100
type testCase struct {
name string
validDataSetup func([]bool) int
}
testCases := []testCase{
{
name: "half null",
validDataSetup: func(validData []bool) int {
validCount := 0
for i := 0; i < numRows; i++ {
if i%2 == 0 {
validData[i] = true
validCount++
}
}
return validCount
},
},
{
name: "all valid",
validDataSetup: func(validData []bool) int {
for i := 0; i < numRows; i++ {
validData[i] = true
}
return numRows
},
},
{
name: "all null",
validDataSetup: func(validData []bool) int {
return 0
},
},
}
for _, tc := range testCases {
w, err := NewPayloadWriter(schemapb.DataType_SparseFloatVector, WithNullable(true))
require.NoError(t, err)
validData := make([]bool, numRows)
tc.validDataSetup(validData)
data := &SparseFloatVectorFieldData{
SparseFloatArray: schemapb.SparseFloatArray{
Dim: 100,
},
ValidData: validData,
}
for i := 0; i < numRows; i++ {
if validData[i] {
sparseVec := make([]byte, 16)
for j := 0; j < 16; j++ {
sparseVec[j] = byte((i*10 + j) % 256)
}
data.SparseFloatArray.Contents = append(data.SparseFloatArray.Contents, sparseVec)
}
}
err = w.AddSparseFloatVectorToPayload(data)
require.NoError(t, err)
err = w.FinishPayloadWriter()
require.NoError(t, err)
buffer, err := w.GetPayloadBufferFromWriter()
require.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_SparseFloatVector, buffer, true)
require.NoError(t, err)
readData, _, readValid, err := r.GetSparseFloatVectorFromPayload()
require.NoError(t, err)
require.Equal(t, numRows, len(readValid))
require.Equal(t, numRows, len(readData.Contents))
for i := 0; i < numRows; i++ {
require.Equal(t, validData[i], readValid[i])
if validData[i] {
require.NotNil(t, readData.Contents[i])
require.Equal(t, 16, len(readData.Contents[i]))
for j := 0; j < 16; j++ {
require.Equal(t, byte((i*10+j)%256), readData.Contents[i][j])
}
} else {
require.Nil(t, readData.Contents[i])
}
}
}
})
t.Run("TestAddBool with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Bool, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddBoolToPayload([]bool{false}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt8 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int8, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt8ToPayload([]int8{1}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt16 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int16, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt16ToPayload([]int16{1}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt32 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int32, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt32ToPayload([]int32{1}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddInt64 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Int64, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddInt64ToPayload([]int64{1}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddFloat32 with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Float, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddFloatToPayload([]float32{1.0}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddDouble with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Double, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDoubleToPayload([]float64{1.0}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddAddString with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT("hello0", nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_String, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT("hello0", []bool{false, false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT("hello0", []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_String)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT("hello0", []bool{true})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddArray with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_Array, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_Array, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, []bool{false, false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_Array)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_Array)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT(&schemapb.ScalarField{
Data: &schemapb.ScalarField_IntData{
IntData: &schemapb.IntArray{
Data: []int32{1, 2},
},
},
}, []bool{true})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
t.Run("TestAddJSON with wrong valids", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_JSON, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), nil)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_JSON, WithNullable(true))
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), []bool{false, false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_JSON)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), []bool{false})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
w, err = NewPayloadWriter(schemapb.DataType_JSON)
require.Nil(t, err)
require.NotNil(t, w)
err = w.AddDataToPayloadForUT([]byte(`{"1":"1"}`), []bool{true})
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
})
}
func TestArrowRecordReader(t *testing.T) {
t.Run("TestArrowRecordReader", func(t *testing.T) {
w, err := NewPayloadWriter(schemapb.DataType_String)
assert.NoError(t, err)
defer w.Close()
err = w.AddOneStringToPayload("hello0", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello1", true)
assert.NoError(t, err)
err = w.AddOneStringToPayload("hello2", true)
assert.NoError(t, err)
err = w.FinishPayloadWriter()
assert.NoError(t, err)
length, err := w.GetPayloadLengthFromWriter()
assert.NoError(t, err)
assert.Equal(t, 3, length)
buffer, err := w.GetPayloadBufferFromWriter()
assert.NoError(t, err)
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
assert.NoError(t, err)
length, err = r.GetPayloadLengthFromReader()
assert.NoError(t, err)
assert.Equal(t, 3, length)
rr, err := r.GetArrowRecordReader()
assert.NoError(t, err)
for rr.Next() {
rec := rr.Record()
arr := rec.Column(0).(*array.String)
defer rec.Release()
assert.Equal(t, "hello0", arr.Value(0))
assert.Equal(t, "hello1", arr.Value(1))
assert.Equal(t, "hello2", arr.Value(2))
}
})
}
func dataGen(size int) ([]byte, error) {
w, err := NewPayloadWriter(schemapb.DataType_String)
if err != nil {
return nil, err
}
defer w.Close()
letterRunes := []rune("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ")
for i := 0; i < size; i++ {
b := make([]rune, 20)
for i := range b {
b[i] = letterRunes[rand.Intn(len(letterRunes))]
}
w.AddOneStringToPayload(string(b), true)
}
err = w.FinishPayloadWriter()
if err != nil {
return nil, err
}
buffer, err := w.GetPayloadBufferFromWriter()
if err != nil {
return nil, err
}
return buffer, err
}
func BenchmarkDefaultReader(b *testing.B) {
size := 10
buffer, err := dataGen(size)
assert.NoError(b, err)
b.ResetTimer()
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
require.Nil(b, err)
defer r.ReleasePayloadReader()
length, err := r.GetPayloadLengthFromReader()
assert.NoError(b, err)
assert.Equal(b, length, size)
d, v, err := r.GetStringFromPayload()
assert.NoError(b, err)
assert.Nil(b, v)
for i := 0; i < 100; i++ {
for _, de := range d {
assert.Equal(b, 20, len(de))
}
}
}
func BenchmarkDataSetReader(b *testing.B) {
size := 10
buffer, err := dataGen(size)
assert.NoError(b, err)
b.ResetTimer()
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
require.Nil(b, err)
defer r.ReleasePayloadReader()
length, err := r.GetPayloadLengthFromReader()
assert.NoError(b, err)
assert.Equal(b, length, size)
ds, err := r.GetByteArrayDataSet()
assert.NoError(b, err)
for i := 0; i < 100; i++ {
for ds.HasNext() {
stringArray, err := ds.NextBatch(1024)
assert.NoError(b, err)
for _, de := range stringArray {
assert.Equal(b, 20, len(string(de)))
}
}
}
}
func BenchmarkArrowRecordReader(b *testing.B) {
size := 10
buffer, err := dataGen(size)
assert.NoError(b, err)
b.ResetTimer()
r, err := NewPayloadReader(schemapb.DataType_String, buffer, false)
require.Nil(b, err)
defer r.ReleasePayloadReader()
length, err := r.GetPayloadLengthFromReader()
assert.NoError(b, err)
assert.Equal(b, length, size)
rr, err := r.GetArrowRecordReader()
assert.NoError(b, err)
defer rr.Release()
for i := 0; i < 100; i++ {
for rr.Next() {
rec := rr.Record()
arr := rec.Column(0).(*array.String)
defer rec.Release()
for i := 0; i < arr.Len(); i++ {
assert.Equal(b, 20, len(arr.Value(i)))
}
}
}
}