milvus/internal/core/src/storage/InsertData.cpp
xige-16 04082b3de2
Migrate the ability to upload and download binlog to cpp (#22984)
Signed-off-by: xige-16 <xi.ge@zilliz.com>
2023-06-25 14:38:44 +08:00

115 lines
4.0 KiB
C++

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "storage/InsertData.h"
#include "storage/Event.h"
#include "storage/Util.h"
#include "utils/Json.h"
#include "common/FieldMeta.h"
#include "common/Consts.h"
namespace milvus::storage {
// Attach the field data metadata to this object.
//
// The metadata may only be set once: the call asserts that no metadata is
// currently stored, then copies `meta` into `field_data_meta_`.
void
InsertData::SetFieldDataMeta(const FieldDataMeta& meta) {
    // Refuse to silently overwrite metadata that was already provided.
    AssertInfo(!field_data_meta_.has_value(), "field meta has been inited");

    field_data_meta_ = meta;
}
// Serialize this insert data for the given storage medium.
//
// StorageType::Remote    -> serialize_to_remote_file()
// StorageType::LocalDisk -> serialize_to_local_file()
// Any other medium is rejected through PanicInfo.
std::vector<uint8_t>
InsertData::Serialize(StorageType medium) {
    if (medium == StorageType::Remote) {
        return serialize_to_remote_file();
    }
    if (medium == StorageType::LocalDisk) {
        return serialize_to_local_file();
    }

    // No serializer exists for the remaining storage types.
    PanicInfo("unsupported medium type");
}
// TODO :: handle string and bool type
std::vector<uint8_t>
InsertData::serialize_to_remote_file() {
AssertInfo(field_data_meta_.has_value(), "field data not exist");
AssertInfo(field_data_ != nullptr, "empty field data");
DataType data_type = field_data_->get_data_type();
// create descriptor event
DescriptorEvent descriptor_event;
auto& des_event_data = descriptor_event.event_data;
auto& des_fix_part = des_event_data.fix_part;
des_fix_part.collection_id = field_data_meta_->collection_id;
des_fix_part.partition_id = field_data_meta_->partition_id;
des_fix_part.segment_id = field_data_meta_->segment_id;
des_fix_part.field_id = field_data_meta_->field_id;
des_fix_part.start_timestamp = time_range_.first;
des_fix_part.end_timestamp = time_range_.second;
des_fix_part.data_type = milvus::proto::schema::DataType(data_type);
for (auto i = int8_t(EventType::DescriptorEvent);
i < int8_t(EventType::EventTypeEnd);
i++) {
des_event_data.post_header_lengths.push_back(
GetEventFixPartSize(EventType(i)));
}
des_event_data.extras[ORIGIN_SIZE_KEY] =
std::to_string(field_data_->Size());
auto& des_event_header = descriptor_event.event_header;
// TODO :: set timestamp
des_event_header.timestamp_ = 0;
// serialize descriptor event data
auto des_event_bytes = descriptor_event.Serialize();
// create insert event
InsertEvent insert_event;
insert_event.event_offset = des_event_bytes.size();
auto& insert_event_data = insert_event.event_data;
insert_event_data.start_timestamp = time_range_.first;
insert_event_data.end_timestamp = time_range_.second;
insert_event_data.field_data = field_data_;
auto& insert_event_header = insert_event.event_header;
// TODO :: set timestamps
insert_event_header.timestamp_ = 0;
insert_event_header.event_type_ = EventType::InsertEvent;
// serialize insert event
auto insert_event_bytes = insert_event.Serialize();
des_event_bytes.insert(des_event_bytes.end(),
insert_event_bytes.begin(),
insert_event_bytes.end());
return des_event_bytes;
}
// local insert file format
// -------------------------------------------
// | Rows(int) | Dimension(int) | InsertData |
// -------------------------------------------
std::vector<uint8_t>
InsertData::serialize_to_local_file() {
LocalInsertEvent event;
event.field_data = field_data_;
return event.Serialize();
}
} // namespace milvus::storage