mirror of
https://gitee.com/milvus-io/milvus.git
synced 2025-12-30 23:45:28 +08:00
* rename MILVUS_ENABLE_PROFILING to ENABLE_CPU_PROFILING, and add ENABLE_MEM_PROFILING Signed-off-by: feisiyicl <7764126@qq.com> * optimize ReadOnlyArrayInvertedLists Signed-off-by: feisiyicl <7764126@qq.com> * update changelog Signed-off-by: feisiyicl <7764126@qq.com> * retry ci Signed-off-by: feisiyicl <7764126@qq.com> * fix build issue Signed-off-by: feisiyicl <7764126@qq.com>
165 lines
6.2 KiB
C++
165 lines
6.2 KiB
C++
// Licensed to the Apache Software Foundation (ASF) under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing,
|
|
// software distributed under the License is distributed on an
|
|
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
// KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations
|
|
// under the License.
|
|
|
|
#include "server/delivery/request/SearchByIDRequest.h"
|
|
|
|
#include <memory>
|
|
|
|
#include "config/Config.h"
|
|
#include "server/DBWrapper.h"
|
|
#include "utils/CommonUtil.h"
|
|
#include "utils/Log.h"
|
|
#include "utils/TimeRecorder.h"
|
|
#include "utils/ValidationUtil.h"
|
|
|
|
#ifdef ENABLE_CPU_PROFILING
|
|
#include <gperftools/profiler.h>
|
|
#endif
|
|
|
|
namespace milvus {
|
|
namespace server {
|
|
|
|
SearchByIDRequest::SearchByIDRequest(const std::shared_ptr<milvus::server::Context>& context,
|
|
const std::string& collection_name, const std::vector<int64_t>& id_array,
|
|
int64_t topk, const milvus::json& extra_params,
|
|
const std::vector<std::string>& partition_list, TopKQueryResult& result)
|
|
: BaseRequest(context, BaseRequest::kSearchByID),
|
|
collection_name_(collection_name),
|
|
id_array_(id_array),
|
|
topk_(topk),
|
|
extra_params_(extra_params),
|
|
partition_list_(partition_list),
|
|
result_(result) {
|
|
}
|
|
|
|
BaseRequestPtr
|
|
SearchByIDRequest::Create(const std::shared_ptr<milvus::server::Context>& context, const std::string& collection_name,
|
|
const std::vector<int64_t>& id_array, int64_t topk, const milvus::json& extra_params,
|
|
const std::vector<std::string>& partition_list, TopKQueryResult& result) {
|
|
return std::shared_ptr<BaseRequest>(
|
|
new SearchByIDRequest(context, collection_name, id_array, topk, extra_params, partition_list, result));
|
|
}
|
|
|
|
Status
|
|
SearchByIDRequest::OnExecute() {
|
|
try {
|
|
milvus::server::ContextChild pre_tracer(context_, "Pre query");
|
|
|
|
std::string hdr = "SearchByIDRequest(collection=" + collection_name_ + ", k=" + std::to_string(topk_) +
|
|
", extra_params=" + extra_params_.dump() + ")";
|
|
|
|
TimeRecorder rc(hdr);
|
|
|
|
// step 1: check empty id array
|
|
if (id_array_.empty()) {
|
|
return Status(SERVER_INVALID_ARGUMENT, "No vector id specified");
|
|
}
|
|
|
|
// step 2: check collection name
|
|
auto status = ValidationUtil::ValidateCollectionName(collection_name_);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// step 3: check search topk
|
|
status = ValidationUtil::ValidateSearchTopk(topk_);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// step 4: check collection existence
|
|
// only process root collection, ignore partition collection
|
|
engine::meta::CollectionSchema collection_schema;
|
|
collection_schema.collection_id_ = collection_name_;
|
|
status = DBWrapper::DB()->DescribeCollection(collection_schema);
|
|
if (!status.ok()) {
|
|
if (status.code() == DB_NOT_FOUND) {
|
|
return Status(SERVER_COLLECTION_NOT_EXIST, CollectionNotExistMsg(collection_name_));
|
|
} else {
|
|
return status;
|
|
}
|
|
} else {
|
|
if (!collection_schema.owner_collection_.empty()) {
|
|
return Status(SERVER_INVALID_COLLECTION_NAME, CollectionNotExistMsg(collection_name_));
|
|
}
|
|
}
|
|
|
|
// step 5: check search parameters
|
|
status = ValidationUtil::ValidateSearchParams(extra_params_, collection_schema, topk_);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// step 6: check collection's index type supports search by id
|
|
if (collection_schema.engine_type_ != (int32_t)engine::EngineType::FAISS_IDMAP &&
|
|
collection_schema.engine_type_ != (int32_t)engine::EngineType::FAISS_BIN_IDMAP &&
|
|
collection_schema.engine_type_ != (int32_t)engine::EngineType::FAISS_IVFFLAT &&
|
|
collection_schema.engine_type_ != (int32_t)engine::EngineType::FAISS_BIN_IVFFLAT &&
|
|
collection_schema.engine_type_ != (int32_t)engine::EngineType::FAISS_IVFSQ8) {
|
|
std::string err_msg = "Index type " + std::to_string(collection_schema.engine_type_) +
|
|
" does not support SearchByID operation";
|
|
LOG_SERVER_ERROR_ << err_msg;
|
|
return Status(SERVER_UNSUPPORTED_ERROR, err_msg);
|
|
}
|
|
|
|
rc.RecordSection("check validation");
|
|
|
|
// step 7: search vectors
|
|
engine::ResultIds result_ids;
|
|
engine::ResultDistances result_distances;
|
|
|
|
#ifdef ENABLE_CPU_PROFILING
|
|
std::string fname = "/tmp/search_by_id_" + CommonUtil::GetCurrentTimeStr() + ".profiling";
|
|
ProfilerStart(fname.c_str());
|
|
#endif
|
|
|
|
pre_tracer.Finish();
|
|
|
|
status = DBWrapper::DB()->QueryByIDs(context_, collection_name_, partition_list_, (size_t)topk_, extra_params_,
|
|
id_array_, result_ids, result_distances);
|
|
|
|
#ifdef ENABLE_CPU_PROFILING
|
|
ProfilerStop();
|
|
#endif
|
|
|
|
rc.RecordSection("search vectors from engine");
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
if (result_ids.empty()) {
|
|
return Status::OK(); // empty collection
|
|
}
|
|
|
|
// step 8: construct result array
|
|
milvus::server::ContextChild tracer(context_, "Constructing result");
|
|
result_.row_num_ = id_array_.size();
|
|
result_.distance_list_.swap(result_distances);
|
|
result_.id_list_.swap(result_ids);
|
|
|
|
rc.RecordSection("construct result and send");
|
|
rc.ElapseFromBegin("totally cost");
|
|
} catch (std::exception& ex) {
|
|
return Status(SERVER_UNEXPECTED_ERROR, ex.what());
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
} // namespace server
|
|
} // namespace milvus
|