mirror of
https://gitee.com/milvus-io/milvus.git
synced 2026-01-07 19:31:51 +08:00
* finish configure modifiable and some take effect runtime Signed-off-by: Yhz <yinghao.zou@zilliz.com> * move test file to unittet folder Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add test case for cofig Signed-off-by: Yhz <yinghao.zou@zilliz.com> * fix format issue Signed-off-by: Yhz <yinghao.zou@zilliz.com> * optimize callback Signed-off-by: Yhz <yinghao.zou@zilliz.com> * fix error when get config by http in CPU mode Signed-off-by: Yhz <yinghao.zou@zilliz.com> * update callback map Signed-off-by: Yhz <yinghao.zou@zilliz.com> * correct typo Signed-off-by: Yhz <yinghao.zou@zilliz.com> * update callback register Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add identity in registers Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add identity in FaissPass class Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add comments at cmd test if fail Signed-off-by: Yhz <yinghao.zou@zilliz.com> * remove some comments and add test for validate storage path Signed-off-by: Yhz <yinghao.zou@zilliz.com> * format pass Signed-off-by: Yhz <yinghao.zou@zilliz.com> * remove endpoint info and update CORS Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add test case in web module to test drop a non-existent table Signed-off-by: Yhz <yinghao.zou@zilliz.com> * optimize config store Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add check code in config Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add scheduler gpu handler Signed-off-by: Yhz <yinghao.zou@zilliz.com> * update optimizer faiss pass Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add default value of gpu_enable_ in GpuCacheMgr Signed-off-by: Yhz <yinghao.zou@zilliz.com> * optimize code: remove comments Signed-off-by: Yhz <yinghao.zou@zilliz.com> * format pass Signed-off-by: Yhz <yinghao.zou@zilliz.com> * add gpu macro in optimizer handler module to fix compile bug on cpu version Signed-off-by: Yhz <yinghao.zou@zilliz.com> * change cache setting unit bytes Signed-off-by: Yhz <yinghao.zou@zilliz.com> * rename variables Signed-off-by: Yhz <yinghao.zou@zilliz.com>
81 lines
2.8 KiB
C++
81 lines
2.8 KiB
C++
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License.
|
|
#ifdef MILVUS_GPU_VERSION
|
|
#include "scheduler/optimizer/FaissIVFSQ8HPass.h"
|
|
#include "cache/GpuCacheMgr.h"
|
|
#include "scheduler/SchedInst.h"
|
|
#include "scheduler/Utils.h"
|
|
#include "scheduler/task/SearchTask.h"
|
|
#include "scheduler/tasklabel/SpecResLabel.h"
|
|
#include "server/Config.h"
|
|
#include "utils/Log.h"
|
|
|
|
namespace milvus {
|
|
namespace scheduler {
|
|
|
|
void
|
|
FaissIVFSQ8HPass::Init() {
|
|
#ifdef CUSTOMIZATION
|
|
server::Config& config = server::Config::GetInstance();
|
|
Status s = config.GetEngineConfigGpuSearchThreshold(threshold_);
|
|
if (!s.ok()) {
|
|
threshold_ = std::numeric_limits<int64_t>::max();
|
|
}
|
|
s = config.GetGpuResourceConfigSearchResources(search_gpus_);
|
|
if (!s.ok()) {
|
|
throw std::exception();
|
|
}
|
|
|
|
SetIdentity("FaissIVFSQ8HPass");
|
|
AddGpuEnableListener();
|
|
AddGpuSearchThresholdListener();
|
|
AddGpuSearchResListener();
|
|
#endif
|
|
}
|
|
|
|
bool
|
|
FaissIVFSQ8HPass::Run(const TaskPtr& task) {
|
|
#ifdef CUSTOMIZATION
|
|
if (task->Type() != TaskType::SearchTask) {
|
|
return false;
|
|
}
|
|
|
|
auto search_task = std::static_pointer_cast<XSearchTask>(task);
|
|
if (search_task->file_->engine_type_ != (int)engine::EngineType::FAISS_IVFSQ8H) {
|
|
return false;
|
|
}
|
|
|
|
auto search_job = std::static_pointer_cast<SearchJob>(search_task->job_.lock());
|
|
ResourcePtr res_ptr;
|
|
if (!gpu_enable_) {
|
|
SERVER_LOG_DEBUG << "FaissIVFSQ8HPass: gpu disable, specify cpu to search!";
|
|
res_ptr = ResMgrInst::GetInstance()->GetResource("cpu");
|
|
}
|
|
if (search_job->nq() < threshold_) {
|
|
SERVER_LOG_DEBUG << "FaissIVFSQ8HPass: nq < gpu_search_threshold, specify cpu to search!";
|
|
res_ptr = ResMgrInst::GetInstance()->GetResource("cpu");
|
|
} else {
|
|
auto best_device_id = count_ % search_gpus_.size();
|
|
SERVER_LOG_DEBUG << "FaissIVFSQ8HPass: nq > gpu_search_threshold, specify gpu" << best_device_id
|
|
<< " to search!";
|
|
++count_;
|
|
res_ptr = ResMgrInst::GetInstance()->GetResource(ResourceType::GPU, search_gpus_[best_device_id]);
|
|
}
|
|
auto label = std::make_shared<SpecResLabel>(res_ptr);
|
|
task->label() = label;
|
|
return true;
|
|
#endif
|
|
}
|
|
|
|
} // namespace scheduler
|
|
} // namespace milvus
|
|
#endif
|