Minio Error is not Handled gracefully (#17003)

Signed-off-by: xiaofan-luan <xiaofan.luan@zilliz.com>
This commit is contained in:
Xiaofan 2022-05-16 19:25:55 +08:00 committed by GitHub
parent 327bd6abbe
commit 5355153805
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
8 changed files with 187 additions and 57 deletions

View File

@ -51,7 +51,12 @@ func NewLocalChunkManager(opts ...Option) *LocalChunkManager {
// Path returns the path of local data if exists. // Path returns the path of local data if exists.
func (lcm *LocalChunkManager) Path(filePath string) (string, error) { func (lcm *LocalChunkManager) Path(filePath string) (string, error) {
if !lcm.Exist(filePath) { exist, err := lcm.Exist(filePath)
if err != nil {
return "", err
}
if !exist {
return "", fmt.Errorf("local file cannot be found with filePath: %s", filePath) return "", fmt.Errorf("local file cannot be found with filePath: %s", filePath)
} }
absPath := path.Join(lcm.localPath, filePath) absPath := path.Join(lcm.localPath, filePath)
@ -59,7 +64,11 @@ func (lcm *LocalChunkManager) Path(filePath string) (string, error) {
} }
func (lcm *LocalChunkManager) Reader(filePath string) (FileReader, error) { func (lcm *LocalChunkManager) Reader(filePath string) (FileReader, error) {
if !lcm.Exist(filePath) { exist, err := lcm.Exist(filePath)
if err != nil {
return nil, err
}
if !exist {
return nil, errors.New("local file cannot be found with filePath:" + filePath) return nil, errors.New("local file cannot be found with filePath:" + filePath)
} }
absPath := path.Join(lcm.localPath, filePath) absPath := path.Join(lcm.localPath, filePath)
@ -70,17 +79,17 @@ func (lcm *LocalChunkManager) Reader(filePath string) (FileReader, error) {
func (lcm *LocalChunkManager) Write(filePath string, content []byte) error { func (lcm *LocalChunkManager) Write(filePath string, content []byte) error {
absPath := path.Join(lcm.localPath, filePath) absPath := path.Join(lcm.localPath, filePath)
dir := path.Dir(absPath) dir := path.Dir(absPath)
if _, err := os.Stat(dir); os.IsNotExist(err) { exist, err := lcm.Exist(dir)
if err != nil {
return err
}
if !exist {
err := os.MkdirAll(dir, os.ModePerm) err := os.MkdirAll(dir, os.ModePerm)
if err != nil { if err != nil {
return err return err
} }
} }
err := ioutil.WriteFile(absPath, content, os.ModePerm) return ioutil.WriteFile(absPath, content, os.ModePerm)
if err != nil {
return err
}
return nil
} }
// MultiWrite writes the data to local storage. // MultiWrite writes the data to local storage.
@ -99,17 +108,25 @@ func (lcm *LocalChunkManager) MultiWrite(contents map[string][]byte) error {
} }
// Exist checks whether chunk is saved to local storage. // Exist checks whether chunk is saved to local storage.
func (lcm *LocalChunkManager) Exist(filePath string) bool { func (lcm *LocalChunkManager) Exist(filePath string) (bool, error) {
absPath := path.Join(lcm.localPath, filePath) absPath := path.Join(lcm.localPath, filePath)
if _, err := os.Stat(absPath); errors.Is(err, os.ErrNotExist) { _, err := os.Stat(absPath)
return false if err != nil {
if os.IsNotExist(err) {
return false, nil
} }
return true return false, err
}
return true, nil
} }
// Read reads the local storage data if exists. // Read reads the local storage data if exists.
func (lcm *LocalChunkManager) Read(filePath string) ([]byte, error) { func (lcm *LocalChunkManager) Read(filePath string) ([]byte, error) {
if !lcm.Exist(filePath) { exist, err := lcm.Exist(filePath)
if err != nil {
return nil, err
}
if !exist {
return nil, fmt.Errorf("file not exist: %s", filePath) return nil, fmt.Errorf("file not exist: %s", filePath)
} }
absPath := path.Join(lcm.localPath, filePath) absPath := path.Join(lcm.localPath, filePath)
@ -202,7 +219,11 @@ func (lcm *LocalChunkManager) Size(filePath string) (int64, error) {
} }
func (lcm *LocalChunkManager) Remove(filePath string) error { func (lcm *LocalChunkManager) Remove(filePath string) error {
if lcm.Exist(filePath) { exist, err := lcm.Exist(filePath)
if err != nil {
return err
}
if exist {
absPath := path.Join(lcm.localPath, filePath) absPath := path.Join(lcm.localPath, filePath)
err := os.RemoveAll(absPath) err := os.RemoveAll(absPath)
if err != nil { if err != nil {

View File

@ -370,4 +370,34 @@ func TestLocalCM(t *testing.T) {
assert.Error(t, err) assert.Error(t, err)
assert.Equal(t, p, "") assert.Equal(t, p, "")
}) })
t.Run("test Prefix", func(t *testing.T) {
testPrefix := "prefix"
testCM := NewLocalChunkManager(RootPath(localPath))
defer testCM.RemoveWithPrefix(testPrefix)
pathB := path.Join("a", "b")
key := path.Join(testPrefix, pathB)
value := []byte("a")
err := testCM.Write(key, value)
assert.NoError(t, err)
pathC := path.Join("a", "c")
key = path.Join(testPrefix, pathC)
err = testCM.Write(key, value)
assert.NoError(t, err)
pathPrefix := path.Join(testPrefix, "a")
r, err := testCM.ListWithPrefix(pathPrefix)
assert.NoError(t, err)
assert.Equal(t, len(r), 2)
testCM.RemoveWithPrefix(testPrefix)
r, err = testCM.ListWithPrefix(pathPrefix)
assert.NoError(t, err)
assert.Equal(t, len(r), 0)
})
} }

View File

@ -69,19 +69,24 @@ func newMinioChunkManagerWithConfig(ctx context.Context, c *config) (*MinioChunk
checkBucketFn := func() error { checkBucketFn := func() error {
bucketExists, err = minIOClient.BucketExists(ctx, c.bucketName) bucketExists, err = minIOClient.BucketExists(ctx, c.bucketName)
if err != nil { if err != nil {
log.Warn("failed to check blob bucket exist", zap.String("bucket", c.bucketName), zap.Error(err))
return err return err
} }
if !bucketExists { if !bucketExists {
log.Debug("minio chunk manager new minio client", zap.Any("Check bucket", "bucket not exist"))
if c.createBucket { if c.createBucket {
log.Debug("minio chunk manager create minio bucket.", zap.Any("bucket name", c.bucketName)) log.Info("blob bucket not exist, create bucket.", zap.Any("bucket name", c.bucketName))
return minIOClient.MakeBucket(ctx, c.bucketName, minio.MakeBucketOptions{}) err := minIOClient.MakeBucket(ctx, c.bucketName, minio.MakeBucketOptions{})
if err != nil {
log.Warn("failed to create blob bucket", zap.String("bucket", c.bucketName), zap.Error(err))
return err
} }
} else {
return fmt.Errorf("bucket %s not Existed", c.bucketName) return fmt.Errorf("bucket %s not Existed", c.bucketName)
} }
}
return nil return nil
} }
err = retry.Do(ctx, checkBucketFn, retry.Attempts(100)) err = retry.Do(ctx, checkBucketFn, retry.Attempts(20))
if err != nil { if err != nil {
return nil, err return nil, err
} }
@ -91,14 +96,17 @@ func newMinioChunkManagerWithConfig(ctx context.Context, c *config) (*MinioChunk
Client: minIOClient, Client: minIOClient,
bucketName: c.bucketName, bucketName: c.bucketName,
} }
log.Debug("minio chunk manager new minio client success.") log.Info("minio chunk manager init success.", zap.String("bucketname", c.bucketName), zap.String("root", c.rootPath))
return mcm, nil return mcm, nil
} }
// Path returns the path of minio data if exists. // Path returns the path of minio data if exists.
func (mcm *MinioChunkManager) Path(filePath string) (string, error) { func (mcm *MinioChunkManager) Path(filePath string) (string, error) {
if !mcm.Exist(filePath) { exist, err := mcm.Exist(filePath)
if err != nil {
return "", err
}
if !exist {
return "", errors.New("minio file manage cannot be found with filePath:" + filePath) return "", errors.New("minio file manage cannot be found with filePath:" + filePath)
} }
return filePath, nil return filePath, nil
@ -106,15 +114,18 @@ func (mcm *MinioChunkManager) Path(filePath string) (string, error) {
// Reader returns the path of minio data if exists. // Reader returns the path of minio data if exists.
func (mcm *MinioChunkManager) Reader(filePath string) (FileReader, error) { func (mcm *MinioChunkManager) Reader(filePath string) (FileReader, error) {
if !mcm.Exist(filePath) { reader, err := mcm.Client.GetObject(mcm.ctx, mcm.bucketName, filePath, minio.GetObjectOptions{})
return nil, errors.New("minio file manage cannot be found with filePath:" + filePath) if err != nil {
log.Warn("failed to get object", zap.String("path", filePath), zap.Error(err))
return nil, err
} }
return mcm.Client.GetObject(mcm.ctx, mcm.bucketName, filePath, minio.GetObjectOptions{}) return reader, nil
} }
func (mcm *MinioChunkManager) Size(filePath string) (int64, error) { func (mcm *MinioChunkManager) Size(filePath string) (int64, error) {
objectInfo, err := mcm.Client.StatObject(mcm.ctx, mcm.bucketName, filePath, minio.StatObjectOptions{}) objectInfo, err := mcm.Client.StatObject(mcm.ctx, mcm.bucketName, filePath, minio.StatObjectOptions{})
if err != nil { if err != nil {
log.Warn("failed to stat object", zap.String("path", filePath), zap.Error(err))
return 0, err return 0, err
} }
@ -126,6 +137,7 @@ func (mcm *MinioChunkManager) Write(filePath string, content []byte) error {
_, err := mcm.Client.PutObject(mcm.ctx, mcm.bucketName, filePath, bytes.NewReader(content), int64(len(content)), minio.PutObjectOptions{}) _, err := mcm.Client.PutObject(mcm.ctx, mcm.bucketName, filePath, bytes.NewReader(content), int64(len(content)), minio.PutObjectOptions{})
if err != nil { if err != nil {
log.Warn("failed to put object", zap.String("path", filePath), zap.Error(err))
return err return err
} }
@ -149,20 +161,34 @@ func (mcm *MinioChunkManager) MultiWrite(kvs map[string][]byte) error {
} }
// Exist checks whether chunk is saved to minio storage. // Exist checks whether chunk is saved to minio storage.
func (mcm *MinioChunkManager) Exist(filePath string) bool { func (mcm *MinioChunkManager) Exist(filePath string) (bool, error) {
_, err := mcm.Client.StatObject(mcm.ctx, mcm.bucketName, filePath, minio.StatObjectOptions{}) _, err := mcm.Client.StatObject(mcm.ctx, mcm.bucketName, filePath, minio.StatObjectOptions{})
return err == nil if err != nil {
errResponse := minio.ToErrorResponse(err)
if errResponse.Code == "NoSuchKey" {
return false, nil
}
log.Warn("failed to stat object", zap.String("path", filePath), zap.Error(err))
return false, err
}
return true, nil
} }
// Read reads the minio storage data if exists. // Read reads the minio storage data if exists.
func (mcm *MinioChunkManager) Read(filePath string) ([]byte, error) { func (mcm *MinioChunkManager) Read(filePath string) ([]byte, error) {
object, err := mcm.Client.GetObject(mcm.ctx, mcm.bucketName, filePath, minio.GetObjectOptions{}) object, err := mcm.Client.GetObject(mcm.ctx, mcm.bucketName, filePath, minio.GetObjectOptions{})
if err != nil { if err != nil {
log.Warn("failed to get object", zap.String("path", filePath), zap.Error(err))
return nil, err return nil, err
} }
defer object.Close() defer object.Close()
return ioutil.ReadAll(object) data, err := ioutil.ReadAll(object)
if err != nil {
log.Warn("failed to read object", zap.String("path", filePath), zap.Error(err))
return nil, err
}
return data, nil
} }
func (mcm *MinioChunkManager) MultiRead(keys []string) ([][]byte, error) { func (mcm *MinioChunkManager) MultiRead(keys []string) ([][]byte, error) {
@ -189,7 +215,6 @@ func (mcm *MinioChunkManager) ReadWithPrefix(prefix string) ([]string, [][]byte,
} }
objectsValues, err := mcm.MultiRead(objectsKeys) objectsValues, err := mcm.MultiRead(objectsKeys)
if err != nil { if err != nil {
log.Error(fmt.Sprintf("MinIO load with prefix error. path = %s", prefix), zap.Error(err))
return nil, nil, err return nil, nil, err
} }
@ -209,22 +234,33 @@ func (mcm *MinioChunkManager) ReadAt(filePath string, off int64, length int64) (
opts := minio.GetObjectOptions{} opts := minio.GetObjectOptions{}
err := opts.SetRange(off, off+length-1) err := opts.SetRange(off, off+length-1)
if err != nil { if err != nil {
log.Warn("failed to set range", zap.String("path", filePath), zap.Error(err))
return nil, err return nil, err
} }
object, err := mcm.Client.GetObject(mcm.ctx, mcm.bucketName, filePath, opts) object, err := mcm.Client.GetObject(mcm.ctx, mcm.bucketName, filePath, opts)
if err != nil { if err != nil {
log.Warn("failed to get object", zap.String("path", filePath), zap.Error(err))
return nil, err return nil, err
} }
defer object.Close() defer object.Close()
return ioutil.ReadAll(object) data, err := ioutil.ReadAll(object)
if err != nil {
log.Warn("failed to read object", zap.String("path", filePath), zap.Error(err))
return nil, err
}
return data, nil
} }
// Remove deletes an object with @key. // Remove deletes an object with @key.
func (mcm *MinioChunkManager) Remove(key string) error { func (mcm *MinioChunkManager) Remove(filePath string) error {
err := mcm.Client.RemoveObject(mcm.ctx, mcm.bucketName, key, minio.RemoveObjectOptions{}) err := mcm.Client.RemoveObject(mcm.ctx, mcm.bucketName, filePath, minio.RemoveObjectOptions{})
if err != nil {
log.Warn("failed to remove object", zap.String("path", filePath), zap.Error(err))
return err return err
} }
return nil
}
// MultiRemove deletes a objects with @keys. // MultiRemove deletes a objects with @keys.
func (mcm *MinioChunkManager) MultiRemove(keys []string) error { func (mcm *MinioChunkManager) MultiRemove(keys []string) error {
@ -243,18 +279,10 @@ func (mcm *MinioChunkManager) MultiRemove(keys []string) error {
// RemoveWithPrefix removes all objects with the same prefix @prefix from minio. // RemoveWithPrefix removes all objects with the same prefix @prefix from minio.
func (mcm *MinioChunkManager) RemoveWithPrefix(prefix string) error { func (mcm *MinioChunkManager) RemoveWithPrefix(prefix string) error {
objectsCh := make(chan minio.ObjectInfo) objects := mcm.Client.ListObjects(mcm.ctx, mcm.bucketName, minio.ListObjectsOptions{Prefix: prefix, Recursive: true})
for rErr := range mcm.Client.RemoveObjects(mcm.ctx, mcm.bucketName, objects, minio.RemoveObjectsOptions{GovernanceBypass: true}) {
go func() {
defer close(objectsCh)
for object := range mcm.Client.ListObjects(mcm.ctx, mcm.bucketName, minio.ListObjectsOptions{Prefix: prefix, Recursive: true}) {
objectsCh <- object
}
}()
for rErr := range mcm.Client.RemoveObjects(mcm.ctx, mcm.bucketName, objectsCh, minio.RemoveObjectsOptions{GovernanceBypass: true}) {
if rErr.Err != nil { if rErr.Err != nil {
log.Warn("failed to remove objects", zap.String("prefix", prefix), zap.Error(rErr.Err))
return rErr.Err return rErr.Err
} }
} }
@ -262,11 +290,14 @@ func (mcm *MinioChunkManager) RemoveWithPrefix(prefix string) error {
} }
func (mcm *MinioChunkManager) ListWithPrefix(prefix string) ([]string, error) { func (mcm *MinioChunkManager) ListWithPrefix(prefix string) ([]string, error) {
objects := mcm.Client.ListObjects(mcm.ctx, mcm.bucketName, minio.ListObjectsOptions{Prefix: prefix}) objects := mcm.Client.ListObjects(mcm.ctx, mcm.bucketName, minio.ListObjectsOptions{Prefix: prefix, Recursive: true})
var objectsKeys []string var objectsKeys []string
for object := range objects { for object := range objects {
if object.Err != nil {
log.Warn("failed to list with prefix", zap.String("prefix", prefix), zap.Error(object.Err))
return nil, object.Err
}
objectsKeys = append(objectsKeys, object.Key) objectsKeys = append(objectsKeys, object.Key)
} }
return objectsKeys, nil return objectsKeys, nil

View File

@ -18,6 +18,7 @@ package storage
import ( import (
"context" "context"
"fmt"
"path" "path"
"strconv" "strconv"
"testing" "testing"
@ -163,7 +164,7 @@ func TestMinIOCM(t *testing.T) {
expectedValue [][]byte expectedValue [][]byte
description string description string
}{ }{
{false, []string{"key_1", "key_not_exist"}, [][]byte{[]byte("111"), {}}, "multiload 1 exist 1 not"}, {false, []string{"key_1", "key_not_exist"}, [][]byte{[]byte("111"), nil}, "multiload 1 exist 1 not"},
{true, []string{"abc", "key_3"}, [][]byte{[]byte("123"), []byte("333")}, "multiload 2 exist"}, {true, []string{"abc", "key_3"}, [][]byte{[]byte("123"), []byte("333")}, "multiload 2 exist"},
} }
@ -406,6 +407,7 @@ func TestMinIOCM(t *testing.T) {
assert.Error(t, err) assert.Error(t, err)
assert.Equal(t, p, "") assert.Equal(t, p, "")
}) })
t.Run("test Mmap", func(t *testing.T) { t.Run("test Mmap", func(t *testing.T) {
testMmapRoot := path.Join(testMinIOKVRoot, "mmap") testMmapRoot := path.Join(testMinIOKVRoot, "mmap")
ctx, cancel := context.WithCancel(context.Background()) ctx, cancel := context.WithCancel(context.Background())
@ -426,4 +428,44 @@ func TestMinIOCM(t *testing.T) {
assert.Nil(t, r) assert.Nil(t, r)
}) })
t.Run("test Prefix", func(t *testing.T) {
testPrefix := path.Join(testMinIOKVRoot, "prefix")
ctx, cancel := context.WithCancel(context.Background())
defer cancel()
testCM, err := newMinIOChunkManager(ctx, testBucket)
require.NoError(t, err)
defer testCM.RemoveWithPrefix(testPrefix)
pathB := path.Join("a", "b")
key := path.Join(testPrefix, pathB)
value := []byte("a")
err = testCM.Write(key, value)
assert.NoError(t, err)
pathC := path.Join("a", "c")
key = path.Join(testPrefix, pathC)
err = testCM.Write(key, value)
assert.NoError(t, err)
pathPrefix := path.Join(testPrefix, "a")
r, err := testCM.ListWithPrefix(pathPrefix)
assert.NoError(t, err)
assert.Equal(t, len(r), 2)
testCM.RemoveWithPrefix(testPrefix)
r, err = testCM.ListWithPrefix(pathPrefix)
assert.NoError(t, err)
assert.Equal(t, len(r), 0)
// test wrong prefix
b := make([]byte, 2048)
pathWrong := path.Join(testPrefix, string(b))
_, err = testCM.ListWithPrefix(pathWrong)
assert.Error(t, err)
fmt.Println(err)
})
} }

View File

@ -34,7 +34,7 @@ type ChunkManager interface {
// MultiWrite writes multi @content to @filePath. // MultiWrite writes multi @content to @filePath.
MultiWrite(contents map[string][]byte) error MultiWrite(contents map[string][]byte) error
// Exist returns true if @filePath exists. // Exist returns true if @filePath exists.
Exist(filePath string) bool Exist(filePath string) (bool, error)
// Read reads @filePath and returns content. // Read reads @filePath and returns content.
Read(filePath string) ([]byte, error) Read(filePath string) ([]byte, error)
// Reader return a reader for @filePath // Reader return a reader for @filePath

View File

@ -136,7 +136,7 @@ func (vcm *VectorChunkManager) MultiWrite(contents map[string][]byte) error {
} }
// Exist checks whether vector data is saved to local cache. // Exist checks whether vector data is saved to local cache.
func (vcm *VectorChunkManager) Exist(filePath string) bool { func (vcm *VectorChunkManager) Exist(filePath string) (bool, error) {
return vcm.vectorStorage.Exist(filePath) return vcm.vectorStorage.Exist(filePath)
} }

View File

@ -235,8 +235,9 @@ func TestVectorChunkManager_Write(t *testing.T) {
err = vcm.Write(key, []byte{1}) err = vcm.Write(key, []byte{1})
assert.Nil(t, err) assert.Nil(t, err)
exist := vcm.Exist(key) exist, err := vcm.Exist(key)
assert.True(t, exist) assert.True(t, exist)
assert.NoError(t, err)
contents := map[string][]byte{ contents := map[string][]byte{
"key_1": {111}, "key_1": {111},
@ -245,10 +246,12 @@ func TestVectorChunkManager_Write(t *testing.T) {
err = vcm.MultiWrite(contents) err = vcm.MultiWrite(contents)
assert.NoError(t, err) assert.NoError(t, err)
exist = vcm.Exist("key_1") exist, err = vcm.Exist("key_1")
assert.True(t, exist) assert.True(t, exist)
exist = vcm.Exist("key_2") assert.NoError(t, err)
exist, err = vcm.Exist("key_2")
assert.True(t, exist) assert.True(t, exist)
assert.NoError(t, err)
err = vcm.RemoveWithPrefix(localPath) err = vcm.RemoveWithPrefix(localPath)
assert.NoError(t, err) assert.NoError(t, err)
@ -271,8 +274,9 @@ func TestVectorChunkManager_Remove(t *testing.T) {
err = vcm.Remove(key) err = vcm.Remove(key)
assert.Nil(t, err) assert.Nil(t, err)
exist := vcm.Exist(key) exist, err := vcm.Exist(key)
assert.False(t, exist) assert.False(t, exist)
assert.NoError(t, err)
contents := map[string][]byte{ contents := map[string][]byte{
"key_1": {111}, "key_1": {111},
@ -284,10 +288,12 @@ func TestVectorChunkManager_Remove(t *testing.T) {
err = vcm.MultiRemove([]string{"key_1", "key_2"}) err = vcm.MultiRemove([]string{"key_1", "key_2"})
assert.NoError(t, err) assert.NoError(t, err)
exist = vcm.Exist("key_1") exist, err = vcm.Exist("key_1")
assert.False(t, exist) assert.False(t, exist)
exist = vcm.Exist("key_2") assert.NoError(t, err)
exist, err = vcm.Exist("key_2")
assert.False(t, exist) assert.False(t, exist)
assert.NoError(t, err)
err = vcm.RemoveWithPrefix(localPath) err = vcm.RemoveWithPrefix(localPath)
assert.NoError(t, err) assert.NoError(t, err)

View File

@ -46,8 +46,8 @@ func (mc *MockChunkManager) MultiWrite(contents map[string][]byte) error {
return nil return nil
} }
func (mc *MockChunkManager) Exist(filePath string) bool { func (mc *MockChunkManager) Exist(filePath string) (bool, error) {
return true return true, nil
} }
func (mc *MockChunkManager) Read(filePath string) ([]byte, error) { func (mc *MockChunkManager) Read(filePath string) ([]byte, error) {