milvus/tests/integration/ops/suspend_node_test.go
Zhen Ye ecb24e7232
enhance: use multi-process framework in integration test (#42976)
issue: #41609

- add env `MILVUS_NODE_ID_FOR_TESTING` to set up a node id for milvus
process.
- add env `MILVUS_CONFIG_REFRESH_INTERVAL` to set up the refresh
interval of paramtable.
- Init paramtable when calling `paramtable.Get()`.
- add new multi process framework for integration test.
- change all integration test into multi process.
- merge some test case into one suite to speed up it.
- modify some test, which need to wait for issue #42966, #42685.
- remove the waittssync for delete collection to fix issue: #42989

---------

Signed-off-by: chyezh <chyezh@outlook.com>
2025-06-30 14:22:43 +08:00

150 lines
4.7 KiB
Go

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package ops
import (
"context"
"testing"
"github.com/stretchr/testify/suite"
"github.com/milvus-io/milvus-proto/go-api/v2/milvuspb"
"github.com/milvus-io/milvus/internal/querycoordv2/meta"
"github.com/milvus-io/milvus/internal/querycoordv2/session"
"github.com/milvus-io/milvus/pkg/v2/proto/querypb"
"github.com/milvus-io/milvus/pkg/v2/util/merr"
"github.com/milvus-io/milvus/pkg/v2/util/paramtable"
"github.com/milvus-io/milvus/tests/integration"
"github.com/milvus-io/milvus/tests/integration/cluster/process"
)
const (
dim = 128
dbName = ""
collectionName = "test_suspend_node"
)
type SuspendNodeTestSuite struct {
integration.MiniClusterSuite
}
func (s *SuspendNodeTestSuite) SetupSuite() {
s.WithMilvusConfig(paramtable.Get().QueryCoordCfg.BalanceCheckInterval.Key, "1000")
s.WithMilvusConfig(paramtable.Get().QueryNodeCfg.GracefulStopTimeout.Key, "1")
s.MiniClusterSuite.SetupSuite()
}
func (s *SuspendNodeTestSuite) loadCollection(collectionName string, db string, replica int, rgs []string) {
ctx, cancel := context.WithCancel(context.Background())
defer cancel()
// load
loadStatus, err := s.Cluster.MilvusClient.LoadCollection(ctx, &milvuspb.LoadCollectionRequest{
DbName: db,
CollectionName: collectionName,
ReplicaNumber: int32(replica),
ResourceGroups: rgs,
})
s.NoError(err)
s.True(merr.Ok(loadStatus))
s.WaitForLoadWithDB(ctx, db, collectionName)
}
func (s *SuspendNodeTestSuite) releaseCollection(db, collectionName string) {
ctx, cancel := context.WithCancel(context.Background())
defer cancel()
// load
status, err := s.Cluster.MilvusClient.ReleaseCollection(ctx, &milvuspb.ReleaseCollectionRequest{
DbName: db,
CollectionName: collectionName,
})
s.NoError(err)
s.True(merr.Ok(status))
}
func (s *SuspendNodeTestSuite) TestSuspendNode() {
ctx := context.Background()
s.CreateCollectionWithConfiguration(ctx, &integration.CreateCollectionConfig{
DBName: dbName,
Dim: dim,
CollectionName: collectionName,
ChannelNum: 1,
SegmentNum: 3,
RowNumPerSegment: 2000,
})
qns := make([]*process.QueryNodeProcess, 0)
for i := 1; i < 3; i++ {
qn := s.Cluster.AddQueryNode()
qns = append(qns, qn)
}
// load collection without specified replica and rgs
s.loadCollection(collectionName, dbName, 1, nil)
resp2, err := s.Cluster.MilvusClient.GetReplicas(ctx, &milvuspb.GetReplicasRequest{
DbName: dbName,
CollectionName: collectionName,
})
s.NoError(err)
s.True(merr.Ok(resp2.Status))
s.Len(resp2.GetReplicas(), 1)
defer s.releaseCollection(dbName, collectionName)
resp3, err := s.Cluster.MixCoordClient.SuspendNode(ctx, &querypb.SuspendNodeRequest{
NodeID: qns[0].GetNodeID(),
})
s.NoError(err)
s.True(merr.Ok(resp3))
// expect suspend node to be removed from resource group
resp5, err := s.Cluster.MixCoordClient.DescribeResourceGroup(ctx, &querypb.DescribeResourceGroupRequest{
ResourceGroup: meta.DefaultResourceGroupName,
})
s.NoError(err)
s.True(merr.Ok(resp5.GetStatus()))
s.Equal(2, len(resp5.GetResourceGroup().GetNodes()))
resp6, err := s.Cluster.MixCoordClient.ResumeNode(ctx, &querypb.ResumeNodeRequest{
NodeID: qns[0].GetNodeID(),
})
s.NoError(err)
s.True(merr.Ok(resp6))
// expect node state to be resume
resp7, err := s.Cluster.MixCoordClient.ListQueryNode(ctx, &querypb.ListQueryNodeRequest{})
s.NoError(err)
s.True(merr.Ok(resp7.GetStatus()))
for _, node := range resp7.GetNodeInfos() {
if node.GetID() == qns[0].GetNodeID() {
s.Equal(session.NodeStateNormal.String(), node.GetState())
}
}
// expect suspend node to be added to resource group
resp8, err := s.Cluster.MixCoordClient.DescribeResourceGroup(ctx, &querypb.DescribeResourceGroupRequest{
ResourceGroup: meta.DefaultResourceGroupName,
})
s.NoError(err)
s.True(merr.Ok(resp8.GetStatus()))
s.Equal(3, len(resp8.GetResourceGroup().GetNodes()))
}
func TestSuspendNode(t *testing.T) {
suite.Run(t, new(SuspendNodeTestSuite))
}