/* * # Licensed to the LF AI & Data foundation under one * # or more contributor license agreements. See the NOTICE file * # distributed with this work for additional information * # regarding copyright ownership. The ASF licenses this file * # to you under the Apache License, Version 2.0 (the * # "License"); you may not use this file except in compliance * # with the License. You may obtain a copy of the License at * # * # http://www.apache.org/licenses/LICENSE-2.0 * # * # Unless required by applicable law or agreed to in writing, software * # distributed under the License is distributed on an "AS IS" BASIS, * # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * # See the License for the specific language governing permissions and * # limitations under the License. */ package embedding import ( "os" "testing" "github.com/cockroachdb/errors" "github.com/stretchr/testify/suite" "github.com/milvus-io/milvus-proto/go-api/v2/commonpb" "github.com/milvus-io/milvus-proto/go-api/v2/schemapb" "github.com/milvus-io/milvus/internal/util/credentials" "github.com/milvus-io/milvus/internal/util/function/models" ) func TestBedrockTextEmbeddingProvider(t *testing.T) { suite.Run(t, new(BedrockTextEmbeddingProviderSuite)) } type BedrockTextEmbeddingProviderSuite struct { suite.Suite schema *schemapb.CollectionSchema providers []string } func (s *BedrockTextEmbeddingProviderSuite) SetupTest() { s.schema = &schemapb.CollectionSchema{ Name: "test", Fields: []*schemapb.FieldSchema{ {FieldID: 100, Name: "int64", DataType: schemapb.DataType_Int64}, {FieldID: 101, Name: "text", DataType: schemapb.DataType_VarChar}, { FieldID: 102, Name: "vector", DataType: schemapb.DataType_FloatVector, TypeParams: []*commonpb.KeyValuePair{ {Key: "dim", Value: "4"}, }, }, }, } s.providers = []string{bedrockProvider} } func createBedrockProvider(schema *schemapb.FieldSchema, providerName string, dim int) (textEmbeddingProvider, error) { functionSchema := &schemapb.FunctionSchema{ Name: "test", Type: schemapb.FunctionType_Unknown, InputFieldNames: []string{"text"}, OutputFieldNames: []string{"vector"}, InputFieldIds: []int64{101}, OutputFieldIds: []int64{102}, Params: []*commonpb.KeyValuePair{ {Key: models.ModelNameParamKey, Value: TestModel}, {Key: models.DimParamKey, Value: "4"}, }, } switch providerName { case bedrockProvider: return NewBedrockEmbeddingProvider(schema, functionSchema, &MockBedrockClient{dim: dim}, map[string]string{}, credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"})) default: return nil, errors.New("Unknow provider") } } func (s *BedrockTextEmbeddingProviderSuite) TestEmbedding() { for _, provderName := range s.providers { provder, err := createBedrockProvider(s.schema.Fields[2], provderName, 4) s.NoError(err) { data := []string{"sentence"} r, err2 := provder.CallEmbedding(data, models.InsertMode) ret := r.([][]float32) s.NoError(err2) s.Equal(1, len(ret)) s.Equal(4, len(ret[0])) s.Equal([]float32{0.0, 1.0, 2.0, 3.0}, ret[0]) } { data := []string{"sentence 1", "sentence 2", "sentence 3"} ret, _ := provder.CallEmbedding(data, models.SearchMode) s.Equal([][]float32{{0.0, 1.0, 2.0, 3.0}, {0.0, 1.0, 2.0, 3.0}, {0.0, 1.0, 2.0, 3.0}}, ret) } } } func (s *BedrockTextEmbeddingProviderSuite) TestEmbeddingDimNotMatch() { for _, provderName := range s.providers { provder, err := createBedrockProvider(s.schema.Fields[2], provderName, 2) s.NoError(err) // embedding dim not match data := []string{"sentence", "sentence"} _, err2 := provder.CallEmbedding(data, models.InsertMode) s.Error(err2) } } func (s *BedrockTextEmbeddingProviderSuite) TestParseCredentail() { { cred := credentials.NewCredentials(map[string]string{}) ak, sk, err := parseAKSKInfo(cred, []*commonpb.KeyValuePair{}, map[string]string{}) s.Equal(ak, "") s.Equal(sk, "") s.NoError(err) } { cred := credentials.NewCredentials(map[string]string{}) _, _, err := parseAKSKInfo(cred, []*commonpb.KeyValuePair{}, map[string]string{"credential": "NotExist"}) s.ErrorContains(err, "is not a aksk crediential, can not find key") } { cred := credentials.NewCredentials(map[string]string{"mock.apikey": "mock"}) _, _, err := parseAKSKInfo(cred, []*commonpb.KeyValuePair{}, map[string]string{"credential": "mock"}) s.ErrorContains(err, "is not a aksk crediential, can not find key") } { cred := credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"}) _, _, err := parseAKSKInfo(cred, []*commonpb.KeyValuePair{}, map[string]string{"credential": "mock"}) s.NoError(err) } { os.Setenv(models.BedrockAccessKeyId, "mock") os.Setenv(models.BedrockSAKEnvStr, "mock") cred := credentials.NewCredentials(map[string]string{}) _, _, err := parseAKSKInfo(cred, []*commonpb.KeyValuePair{}, map[string]string{}) s.NoError(err) } } func (s *BedrockTextEmbeddingProviderSuite) TestCreateBedrockClient() { _, err := createBedRockEmbeddingClient("", "", "") s.Error(err) _, err = createBedRockEmbeddingClient("mock_id", "", "") s.Error(err) _, err = createBedRockEmbeddingClient("", "mock_key", "") s.Error(err) _, err = createBedRockEmbeddingClient("mock_id", "mock_key", "") s.Error(err) _, err = createBedRockEmbeddingClient("mock_id", "mock_key", "mock_region") s.NoError(err) } func (s *BedrockTextEmbeddingProviderSuite) TestNewBedrockEmbeddingProvider() { fieldSchema := &schemapb.FieldSchema{ FieldID: 102, Name: "vector", DataType: schemapb.DataType_FloatVector, TypeParams: []*commonpb.KeyValuePair{ {Key: "dim", Value: "4"}, }, } functionSchema := &schemapb.FunctionSchema{ Name: "test", Type: schemapb.FunctionType_Unknown, InputFieldNames: []string{"text"}, OutputFieldNames: []string{"vector"}, InputFieldIds: []int64{101}, OutputFieldIds: []int64{102}, Params: []*commonpb.KeyValuePair{ {Key: models.ModelNameParamKey, Value: TestModel}, {Key: models.CredentialParamKey, Value: "mock"}, {Key: models.RegionParamKey, Value: "mock"}, {Key: models.DimParamKey, Value: "4"}, {Key: models.NormalizeParamKey, Value: "false"}, }, } provider, err := NewBedrockEmbeddingProvider(fieldSchema, functionSchema, nil, map[string]string{}, credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"})) s.NoError(err) s.True(provider.MaxBatch() > 0) s.Equal(provider.FieldDim(), int64(4)) _, err = NewBedrockEmbeddingProvider(fieldSchema, functionSchema, nil, map[string]string{models.CredentialParamKey: "mock"}, credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"})) s.NoError(err) functionSchema.Params[4] = &commonpb.KeyValuePair{Key: models.NormalizeParamKey, Value: "true"} _, err = NewBedrockEmbeddingProvider(fieldSchema, functionSchema, nil, map[string]string{}, credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"})) s.NoError(err) functionSchema.Params[4] = &commonpb.KeyValuePair{Key: models.NormalizeParamKey, Value: "invalid"} _, err = NewBedrockEmbeddingProvider(fieldSchema, functionSchema, nil, map[string]string{}, credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"})) s.Error(err) // invalid dim functionSchema.Params[0] = &commonpb.KeyValuePair{Key: models.ModelNameParamKey, Value: TestModel} functionSchema.Params[0] = &commonpb.KeyValuePair{Key: models.DimParamKey, Value: "Invalid"} _, err = NewBedrockEmbeddingProvider(fieldSchema, functionSchema, nil, map[string]string{}, credentials.NewCredentials(map[string]string{"mock.access_key_id": "mock", "mock.secret_access_key": "mock"})) s.Error(err) }