mirror of
https://gitee.com/milvus-io/milvus.git
synced 2025-12-07 01:28:27 +08:00
enhance: [GoSDK] support unmarshal result set into orm receiver (#36789)
Related to milvus-io/milvus-sdk-go#800 Signed-off-by: Congqi Xia <congqi.xia@zilliz.com>
This commit is contained in:
parent
0ec92513a5
commit
744a36c287
@ -29,30 +29,6 @@ import (
|
|||||||
"github.com/milvus-io/milvus/pkg/util/merr"
|
"github.com/milvus-io/milvus/pkg/util/merr"
|
||||||
)
|
)
|
||||||
|
|
||||||
type ResultSets struct{}
|
|
||||||
|
|
||||||
type ResultSet struct {
|
|
||||||
ResultCount int // the returning entry count
|
|
||||||
GroupByValue column.Column
|
|
||||||
IDs column.Column // auto generated id, can be mapped to the columns from `Insert` API
|
|
||||||
Fields DataSet // output field data
|
|
||||||
Scores []float32 // distance to the target vector
|
|
||||||
Err error // search error if any
|
|
||||||
}
|
|
||||||
|
|
||||||
// DataSet is an alias type for column slice.
|
|
||||||
type DataSet []column.Column
|
|
||||||
|
|
||||||
// GetColumn returns column with provided field name.
|
|
||||||
func (rs ResultSet) GetColumn(fieldName string) column.Column {
|
|
||||||
for _, column := range rs.Fields {
|
|
||||||
if column.Name() == fieldName {
|
|
||||||
return column
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return nil
|
|
||||||
}
|
|
||||||
|
|
||||||
func (c *Client) Search(ctx context.Context, option SearchOption, callOptions ...grpc.CallOption) ([]ResultSet, error) {
|
func (c *Client) Search(ctx context.Context, option SearchOption, callOptions ...grpc.CallOption) ([]ResultSet, error) {
|
||||||
req := option.Request()
|
req := option.Request()
|
||||||
collection, err := c.getCollection(ctx, req.GetCollectionName())
|
collection, err := c.getCollection(ctx, req.GetCollectionName())
|
||||||
|
|||||||
194
client/results.go
Normal file
194
client/results.go
Normal file
@ -0,0 +1,194 @@
|
|||||||
|
// Licensed to the LF AI & Data foundation under one
|
||||||
|
// or more contributor license agreements. See the NOTICE file
|
||||||
|
// distributed with this work for additional information
|
||||||
|
// regarding copyright ownership. The ASF licenses this file
|
||||||
|
// to you under the Apache License, Version 2.0 (the
|
||||||
|
// "License"); you may not use this file except in compliance
|
||||||
|
// with the License. You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
package client
|
||||||
|
|
||||||
|
import (
|
||||||
|
"reflect"
|
||||||
|
|
||||||
|
"github.com/cockroachdb/errors"
|
||||||
|
|
||||||
|
"github.com/milvus-io/milvus/client/v2/column"
|
||||||
|
"github.com/milvus-io/milvus/client/v2/entity"
|
||||||
|
"github.com/milvus-io/milvus/client/v2/row"
|
||||||
|
)
|
||||||
|
|
||||||
|
// ResultSet is struct for search result set.
|
||||||
|
type ResultSet struct {
|
||||||
|
// internal schema for unmarshaling
|
||||||
|
sch *entity.Schema
|
||||||
|
|
||||||
|
ResultCount int // the returning entry count
|
||||||
|
GroupByValue column.Column
|
||||||
|
IDs column.Column // auto generated id, can be mapped to the columns from `Insert` API
|
||||||
|
Fields DataSet // output field data
|
||||||
|
Scores []float32 // distance to the target vector
|
||||||
|
Err error // search error if any
|
||||||
|
}
|
||||||
|
|
||||||
|
// GetColumn returns column with provided field name.
|
||||||
|
func (rs *ResultSet) GetColumn(fieldName string) column.Column {
|
||||||
|
for _, column := range rs.Fields {
|
||||||
|
if column.Name() == fieldName {
|
||||||
|
return column
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// Unmarshal puts dataset into receiver in row based way.
|
||||||
|
// `receiver` shall be a slice of pointer of model struct
|
||||||
|
// eg, []*Records, in which type `Record` defines the row data.
|
||||||
|
// note that distance/score is not unmarshaled here.
|
||||||
|
func (sr *ResultSet) Unmarshal(receiver any) (err error) {
|
||||||
|
err = sr.Fields.Unmarshal(receiver)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
return sr.fillPKEntry(receiver)
|
||||||
|
}
|
||||||
|
|
||||||
|
func (sr *ResultSet) fillPKEntry(receiver any) (err error) {
|
||||||
|
defer func() {
|
||||||
|
if x := recover(); x != nil {
|
||||||
|
err = errors.Newf("failed to unmarshal result set: %v", x)
|
||||||
|
}
|
||||||
|
}()
|
||||||
|
rr := reflect.ValueOf(receiver)
|
||||||
|
|
||||||
|
if rr.Kind() == reflect.Ptr {
|
||||||
|
if rr.IsNil() && rr.CanAddr() {
|
||||||
|
rr.Set(reflect.New(rr.Type().Elem()))
|
||||||
|
}
|
||||||
|
rr = rr.Elem()
|
||||||
|
}
|
||||||
|
|
||||||
|
rt := rr.Type()
|
||||||
|
rv := rr
|
||||||
|
|
||||||
|
switch rt.Kind() {
|
||||||
|
case reflect.Slice:
|
||||||
|
pkField := sr.sch.PKField()
|
||||||
|
|
||||||
|
et := rt.Elem()
|
||||||
|
for et.Kind() == reflect.Ptr {
|
||||||
|
et = et.Elem()
|
||||||
|
}
|
||||||
|
|
||||||
|
candidates := row.ParseCandidate(et)
|
||||||
|
candi, ok := candidates[pkField.Name]
|
||||||
|
if !ok {
|
||||||
|
// pk field not found in struct, skip
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
for i := 0; i < sr.IDs.Len(); i++ {
|
||||||
|
row := rv.Index(i)
|
||||||
|
for row.Kind() == reflect.Ptr {
|
||||||
|
row = row.Elem()
|
||||||
|
}
|
||||||
|
|
||||||
|
val, err := sr.IDs.Get(i)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
row.Field(candi).Set(reflect.ValueOf(val))
|
||||||
|
}
|
||||||
|
rr.Set(rv)
|
||||||
|
default:
|
||||||
|
return errors.Newf("receiver need to be slice or array but get %v", rt.Kind())
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// DataSet is an alias type for column slice.
|
||||||
|
// Returned by query API.
|
||||||
|
type DataSet []column.Column
|
||||||
|
|
||||||
|
// Len returns the row count of dataset.
|
||||||
|
// if there is no column, it shall return 0.
|
||||||
|
func (ds DataSet) Len() int {
|
||||||
|
if len(ds) == 0 {
|
||||||
|
return 0
|
||||||
|
}
|
||||||
|
return ds[0].Len()
|
||||||
|
}
|
||||||
|
|
||||||
|
// Unmarshal puts dataset into receiver in row based way.
|
||||||
|
// `receiver` shall be a slice of pointer of model struct
|
||||||
|
// eg, []*Records, in which type `Record` defines the row data.
|
||||||
|
func (ds DataSet) Unmarshal(receiver any) (err error) {
|
||||||
|
defer func() {
|
||||||
|
if x := recover(); x != nil {
|
||||||
|
err = errors.Newf("failed to unmarshal result set: %v", x)
|
||||||
|
}
|
||||||
|
}()
|
||||||
|
rr := reflect.ValueOf(receiver)
|
||||||
|
|
||||||
|
if rr.Kind() == reflect.Ptr {
|
||||||
|
if rr.IsNil() && rr.CanAddr() {
|
||||||
|
rr.Set(reflect.New(rr.Type().Elem()))
|
||||||
|
}
|
||||||
|
rr = rr.Elem()
|
||||||
|
}
|
||||||
|
|
||||||
|
rt := rr.Type()
|
||||||
|
rv := rr
|
||||||
|
|
||||||
|
switch rt.Kind() {
|
||||||
|
// TODO maybe support Array and just fill data
|
||||||
|
// case reflect.Array:
|
||||||
|
case reflect.Slice:
|
||||||
|
et := rt.Elem()
|
||||||
|
if et.Kind() != reflect.Ptr {
|
||||||
|
return errors.Newf("receiver must be slice of pointers but get: %v", et.Kind())
|
||||||
|
}
|
||||||
|
for et.Kind() == reflect.Ptr {
|
||||||
|
et = et.Elem()
|
||||||
|
}
|
||||||
|
for i := 0; i < ds.Len(); i++ {
|
||||||
|
data := reflect.New(et)
|
||||||
|
err := ds.fillData(data.Elem(), et, i)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
rv = reflect.Append(rv, data)
|
||||||
|
}
|
||||||
|
rr.Set(rv)
|
||||||
|
default:
|
||||||
|
return errors.Newf("receiver need to be slice or array but get %v", rt.Kind())
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (ds DataSet) fillData(data reflect.Value, dataType reflect.Type, idx int) error {
|
||||||
|
m := row.ParseCandidate(dataType)
|
||||||
|
for i := 0; i < len(ds); i++ {
|
||||||
|
name := ds[i].Name()
|
||||||
|
fidx, ok := m[name]
|
||||||
|
if !ok {
|
||||||
|
// if target is not found, the behavior here is to ignore the column
|
||||||
|
// `strict` mode could be added in the future to return error if any column missing
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
val, err := ds[i].Get(idx)
|
||||||
|
if err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
// TODO check datatype, return error here instead of reflect panicking & recover
|
||||||
|
data.Field(fidx).Set(reflect.ValueOf(val))
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}
|
||||||
127
client/results_test.go
Normal file
127
client/results_test.go
Normal file
@ -0,0 +1,127 @@
|
|||||||
|
// Licensed to the LF AI & Data foundation under one
|
||||||
|
// or more contributor license agreements. See the NOTICE file
|
||||||
|
// distributed with this work for additional information
|
||||||
|
// regarding copyright ownership. The ASF licenses this file
|
||||||
|
// to you under the Apache License, Version 2.0 (the
|
||||||
|
// "License"); you may not use this file except in compliance
|
||||||
|
// with the License. You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
package client
|
||||||
|
|
||||||
|
import (
|
||||||
|
"testing"
|
||||||
|
|
||||||
|
"github.com/stretchr/testify/suite"
|
||||||
|
|
||||||
|
"github.com/milvus-io/milvus/client/v2/column"
|
||||||
|
"github.com/milvus-io/milvus/client/v2/entity"
|
||||||
|
)
|
||||||
|
|
||||||
|
type ResultSetSuite struct {
|
||||||
|
suite.Suite
|
||||||
|
}
|
||||||
|
|
||||||
|
func (s *ResultSetSuite) TestResultsetUnmarshal() {
|
||||||
|
type MyData struct {
|
||||||
|
A int64 `milvus:"name:id"`
|
||||||
|
V []float32 `milvus:"name:vector"`
|
||||||
|
}
|
||||||
|
type OtherData struct {
|
||||||
|
A string `milvus:"name:id"`
|
||||||
|
V []float32 `milvus:"name:vector"`
|
||||||
|
}
|
||||||
|
|
||||||
|
var (
|
||||||
|
idData = []int64{1, 2, 3}
|
||||||
|
vectorData = [][]float32{
|
||||||
|
{0.1, 0.2},
|
||||||
|
{0.1, 0.2},
|
||||||
|
{0.1, 0.2},
|
||||||
|
}
|
||||||
|
)
|
||||||
|
|
||||||
|
rs := DataSet([]column.Column{
|
||||||
|
column.NewColumnInt64("id", idData),
|
||||||
|
column.NewColumnFloatVector("vector", 2, vectorData),
|
||||||
|
})
|
||||||
|
err := rs.Unmarshal([]MyData{})
|
||||||
|
s.Error(err)
|
||||||
|
|
||||||
|
receiver := []MyData{}
|
||||||
|
err = rs.Unmarshal(&receiver)
|
||||||
|
s.Error(err)
|
||||||
|
|
||||||
|
var ptrReceiver []*MyData
|
||||||
|
err = rs.Unmarshal(&ptrReceiver)
|
||||||
|
s.NoError(err)
|
||||||
|
|
||||||
|
for idx, row := range ptrReceiver {
|
||||||
|
s.Equal(row.A, idData[idx])
|
||||||
|
s.Equal(row.V, vectorData[idx])
|
||||||
|
}
|
||||||
|
|
||||||
|
var otherReceiver []*OtherData
|
||||||
|
err = rs.Unmarshal(&otherReceiver)
|
||||||
|
s.Error(err)
|
||||||
|
}
|
||||||
|
|
||||||
|
func (s *ResultSetSuite) TestSearchResultUnmarshal() {
|
||||||
|
type MyData struct {
|
||||||
|
A int64 `milvus:"name:id"`
|
||||||
|
V []float32 `milvus:"name:vector"`
|
||||||
|
}
|
||||||
|
type OtherData struct {
|
||||||
|
A string `milvus:"name:id"`
|
||||||
|
V []float32 `milvus:"name:vector"`
|
||||||
|
}
|
||||||
|
|
||||||
|
var (
|
||||||
|
idData = []int64{1, 2, 3}
|
||||||
|
vectorData = [][]float32{
|
||||||
|
{0.1, 0.2},
|
||||||
|
{0.1, 0.2},
|
||||||
|
{0.1, 0.2},
|
||||||
|
}
|
||||||
|
)
|
||||||
|
|
||||||
|
sr := ResultSet{
|
||||||
|
sch: entity.NewSchema().
|
||||||
|
WithField(entity.NewField().WithName("id").WithIsPrimaryKey(true).WithDataType(entity.FieldTypeInt64)).
|
||||||
|
WithField(entity.NewField().WithName("vector").WithDim(2).WithDataType(entity.FieldTypeFloatVector)),
|
||||||
|
IDs: column.NewColumnInt64("id", idData),
|
||||||
|
Fields: DataSet([]column.Column{
|
||||||
|
column.NewColumnFloatVector("vector", 2, vectorData),
|
||||||
|
}),
|
||||||
|
}
|
||||||
|
err := sr.Unmarshal([]MyData{})
|
||||||
|
s.Error(err)
|
||||||
|
|
||||||
|
receiver := []MyData{}
|
||||||
|
err = sr.Unmarshal(&receiver)
|
||||||
|
s.Error(err)
|
||||||
|
|
||||||
|
var ptrReceiver []*MyData
|
||||||
|
err = sr.Unmarshal(&ptrReceiver)
|
||||||
|
s.NoError(err)
|
||||||
|
|
||||||
|
for idx, row := range ptrReceiver {
|
||||||
|
s.Equal(row.A, idData[idx])
|
||||||
|
s.Equal(row.V, vectorData[idx])
|
||||||
|
}
|
||||||
|
|
||||||
|
var otherReceiver []*OtherData
|
||||||
|
err = sr.Unmarshal(&otherReceiver)
|
||||||
|
s.Error(err)
|
||||||
|
}
|
||||||
|
|
||||||
|
func TestResults(t *testing.T) {
|
||||||
|
suite.Run(t, new(ResultSetSuite))
|
||||||
|
}
|
||||||
43
client/row/type.go
Normal file
43
client/row/type.go
Normal file
@ -0,0 +1,43 @@
|
|||||||
|
// Licensed to the LF AI & Data foundation under one
|
||||||
|
// or more contributor license agreements. See the NOTICE file
|
||||||
|
// distributed with this work for additional information
|
||||||
|
// regarding copyright ownership. The ASF licenses this file
|
||||||
|
// to you under the Apache License, Version 2.0 (the
|
||||||
|
// "License"); you may not use this file except in compliance
|
||||||
|
// with the License. You may obtain a copy of the License at
|
||||||
|
//
|
||||||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
//
|
||||||
|
// Unless required by applicable law or agreed to in writing, software
|
||||||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
// See the License for the specific language governing permissions and
|
||||||
|
// limitations under the License.
|
||||||
|
|
||||||
|
package row
|
||||||
|
|
||||||
|
import (
|
||||||
|
"go/ast"
|
||||||
|
"reflect"
|
||||||
|
)
|
||||||
|
|
||||||
|
func ParseCandidate(dataType reflect.Type) map[string]int {
|
||||||
|
result := make(map[string]int)
|
||||||
|
for i := 0; i < dataType.NumField(); i++ {
|
||||||
|
f := dataType.Field(i)
|
||||||
|
// ignore anonymous field for now
|
||||||
|
if f.Anonymous || !ast.IsExported(f.Name) {
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
|
||||||
|
name := f.Name
|
||||||
|
tag := f.Tag.Get(MilvusTag)
|
||||||
|
tagSettings := ParseTagSetting(tag, MilvusTagSep)
|
||||||
|
if tagName, has := tagSettings[MilvusTagName]; has {
|
||||||
|
name = tagName
|
||||||
|
}
|
||||||
|
|
||||||
|
result[name] = i
|
||||||
|
}
|
||||||
|
return result
|
||||||
|
}
|
||||||
Loading…
x
Reference in New Issue
Block a user