milvus/internal/core/src/storage/FileManager.h
congqixia 5ece760d73
fix: Pass fs via FileManagerContext when loading index (#44733)
Related to #44615

---------

Signed-off-by: Congqi Xia <congqi.xia@zilliz.com>
2025-10-11 09:55:57 +08:00

216 lines
6.8 KiB
C++

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once
#include <string>
#include <optional>
#include <memory>
#include "common/Consts.h"
#include "boost/filesystem/path.hpp"
#include "log/Log.h"
#include "storage/ChunkManager.h"
#include "storage/Types.h"
#include "milvus-storage/filesystem/fs.h"
#include "filemanager/FileManager.h"
namespace milvus::storage {
struct FileManagerContext {
FileManagerContext() : chunkManagerPtr(nullptr) {
}
explicit FileManagerContext(const ChunkManagerPtr& chunkManagerPtr)
: chunkManagerPtr(chunkManagerPtr) {
}
FileManagerContext(const FieldDataMeta& fieldDataMeta,
const IndexMeta& indexMeta,
const ChunkManagerPtr& chunkManagerPtr,
milvus_storage::ArrowFileSystemPtr fs)
: fieldDataMeta(fieldDataMeta),
indexMeta(indexMeta),
chunkManagerPtr(chunkManagerPtr),
fs(std::move(fs)) {
}
bool
Valid() const {
return chunkManagerPtr != nullptr;
}
void
set_for_loading_index(bool value) {
for_loading_index = value;
}
void
set_plugin_context(std::shared_ptr<CPluginContext> context) {
plugin_context = context;
}
FieldDataMeta fieldDataMeta;
IndexMeta indexMeta;
ChunkManagerPtr chunkManagerPtr;
milvus_storage::ArrowFileSystemPtr fs;
bool for_loading_index{false};
std::shared_ptr<CPluginContext> plugin_context;
};
#define FILEMANAGER_TRY try {
#define FILEMANAGER_CATCH \
} \
catch (SegcoreError & e) { \
LOG_ERROR("SegcoreError:{} code {}", e.what(), e.get_error_code()); \
return false; \
} \
catch (std::exception & e) { \
LOG_ERROR("Exception:{}", e.what()); \
return false;
#define FILEMANAGER_END }
class FileManagerImpl : public milvus::FileManager {
public:
explicit FileManagerImpl(const FieldDataMeta& field_mata,
IndexMeta index_meta)
: field_meta_(field_mata), index_meta_(std::move(index_meta)) {
}
public:
/**
* @brief Load a file to the local disk, so we can use stl lib to operate it.
*
* @param filename
* @return false if any error, or return true.
*/
virtual bool
LoadFile(const std::string& filename) override = 0;
/**
* @brief Add file to FileManager to manipulate it.
*
* @param filename
* @return false if any error, or return true.
*/
virtual bool
AddFile(const std::string& filename) override = 0;
/**
* @brief Check if a file exists.
*
* @param filename
* @return std::nullopt if any error, or return if the file exists.
*/
virtual std::optional<bool>
IsExisted(const std::string& filename) override = 0;
/**
* @brief Delete a file from FileManager.
*
* @param filename
* @return false if any error, or return true.
*/
virtual bool
RemoveFile(const std::string& filename) override = 0;
virtual bool
AddFileMeta(const FileMeta& file_meta) override = 0;
virtual std::shared_ptr<InputStream>
OpenInputStream(const std::string& filename) override = 0;
virtual std::shared_ptr<OutputStream>
OpenOutputStream(const std::string& filename) override = 0;
public:
virtual std::string
GetName() const = 0;
virtual FieldDataMeta
GetFieldDataMeta() const {
return field_meta_;
}
virtual IndexMeta
GetIndexMeta() const {
return index_meta_;
}
virtual ChunkManagerPtr
GetChunkManager() const {
return rcm_;
}
virtual std::string
GetRemoteIndexObjectPrefix() const {
boost::filesystem::path prefix = rcm_->GetRootPath();
boost::filesystem::path path = std::string(INDEX_ROOT_PATH);
boost::filesystem::path path1 =
std::to_string(index_meta_.build_id) + "/" +
std::to_string(index_meta_.index_version) + "/" +
std::to_string(field_meta_.partition_id) + "/" +
std::to_string(field_meta_.segment_id);
return (prefix / path / path1).string();
}
virtual std::string
GetRemoteIndexObjectPrefixV2() const {
return std::string(INDEX_ROOT_PATH) + "/" +
std::to_string(index_meta_.build_id) + "/" +
std::to_string(index_meta_.index_version) + "/" +
std::to_string(field_meta_.partition_id) + "/" +
std::to_string(field_meta_.segment_id);
}
virtual std::string
GetRemoteIndexFilePrefixV2() const {
boost::filesystem::path bucket = rcm_->GetBucketName();
std::string v1_prefix = GetRemoteIndexObjectPrefix();
if (bucket.empty()) {
return v1_prefix;
} else {
return (bucket / v1_prefix).string();
}
}
virtual std::string
GetRemoteTextLogPrefix() const {
boost::filesystem::path prefix = rcm_->GetRootPath();
boost::filesystem::path path = std::string(TEXT_LOG_ROOT_PATH);
boost::filesystem::path path1 =
std::to_string(index_meta_.build_id) + "/" +
std::to_string(index_meta_.index_version) + "/" +
std::to_string(field_meta_.collection_id) + "/" +
std::to_string(field_meta_.partition_id) + "/" +
std::to_string(field_meta_.segment_id) + "/" +
std::to_string(field_meta_.field_id);
return (prefix / path / path1).string();
}
protected:
// collection meta
FieldDataMeta field_meta_;
// index meta
IndexMeta index_meta_;
ChunkManagerPtr rcm_;
milvus_storage::ArrowFileSystemPtr fs_;
std::shared_ptr<CPluginContext> plugin_context_;
};
using FileManagerImplPtr = std::shared_ptr<FileManagerImpl>;
} // namespace milvus::storage