milvus/internal/storage/cwrapper/PayloadStream.h
FluorineDog 6412ebc0d4 Add support of metric type in schema, enable binary vector, fix segfault
Signed-off-by: FluorineDog <guilin.gou@zilliz.com>
2020-12-05 06:46:01 +08:00

75 lines
1.8 KiB
C++

#pragma once
#include <arrow/api.h>
#include <arrow/io/interfaces.h>
#include <parquet/arrow/writer.h>
#include <parquet/arrow/reader.h>
#include "ColumnType.h"
namespace wrapper {
// Forward declarations: the payload structs below hold shared_ptrs to these
// stream classes, which are declared in full later in this header.
class PayloadOutputStream;
class PayloadInputStream;

// Named constant for a dimension of -1.
// NOTE(review): judging by the name this marks "no dimension set" (e.g. for
// non-vector columns) — confirm against the code that assigns `dimension`.
constexpr int EMPTY_DIMENSION = -1;

// Plain state bundle for one payload writer.
//
// The scalar members carry default member initializers so that a
// default-constructed instance (for example `new PayloadWriter`) never holds
// an indeterminate value. Code that assigns every field explicitly after
// construction behaves exactly as before.
struct PayloadWriter {
    // Type of the column being written; value-initialized (zero) until set.
    ColumnType columnType{};
    // binary vector, float vector
    // Defaults to EMPTY_DIMENSION until a caller stores a real dimension.
    int dimension = EMPTY_DIMENSION;
    // Arrow array builder associated with this writer; null until assigned.
    std::shared_ptr<arrow::ArrayBuilder> builder;
    // Arrow schema associated with this writer; null until assigned.
    std::shared_ptr<arrow::Schema> schema;
    // Output stream associated with this writer; null until assigned.
    std::shared_ptr<PayloadOutputStream> output;
    // Row counter; starts at zero.
    // NOTE(review): presumably the number of rows appended so far — confirm.
    int rows = 0;
};
// Plain state bundle for one payload reader.
//
// `column_type` and `bValues` carry default member initializers so that a
// default-constructed instance (for example `new PayloadReader`) never holds
// an indeterminate enum value or a wild pointer. Code that assigns every
// field explicitly after construction behaves exactly as before.
struct PayloadReader {
    // Type of the column being read; value-initialized (zero) until set.
    ColumnType column_type{};
    // Input stream associated with this reader; null until assigned.
    std::shared_ptr<PayloadInputStream> input;
    // Parquet-to-Arrow file reader; uniquely owned by this struct.
    std::unique_ptr<parquet::arrow::FileReader> reader;
    // Arrow table, chunked column and array handles; null until assigned.
    std::shared_ptr<arrow::Table> table;
    std::shared_ptr<arrow::ChunkedArray> column;
    std::shared_ptr<arrow::Array> array;
    // Raw pointer to bool values; null until assigned.
    // NOTE(review): ownership is not visible from this header — presumably a
    // buffer allocated and released by the C wrapper; confirm before changing
    // it to an owning type.
    bool *bValues = nullptr;
};
class PayloadOutputStream : public arrow::io::OutputStream {
public:
PayloadOutputStream();
~PayloadOutputStream();
arrow::Status Close() override;
arrow::Result<int64_t> Tell() const override;
bool closed() const override;
arrow::Status Write(const void *data, int64_t nbytes) override;
arrow::Status Flush() override;
public:
const std::vector<uint8_t> &Buffer() const;
private:
std::vector<uint8_t> buffer_;
bool closed_;
};
// Random-access input stream derived from arrow::io::RandomAccessFile and
// constructed from a byte pointer plus a size.
// Only declarations live here; the member functions are defined elsewhere.
// NOTE(review): data_ is a raw pointer, so the stream presumably does not own
// or copy the bytes and the caller must keep them alive — confirm in the
// implementation file.
class PayloadInputStream : public arrow::io::RandomAccessFile {
 public:
    // `data` points at the bytes to read from; `size` is their length.
    PayloadInputStream(const uint8_t *data, int64_t size);
    ~PayloadInputStream();

    // --- Reading (overrides from the Arrow stream interfaces) ---

    // Reads up to `nbytes` bytes into caller-provided storage `out`; the
    // result carries a byte count.
    arrow::Result<int64_t> Read(int64_t nbytes, void *out) override;
    // Reads up to `nbytes` bytes and returns them as an Arrow buffer.
    arrow::Result<std::shared_ptr<arrow::Buffer>> Read(int64_t nbytes) override;

    // --- Positioning and size (overrides) ---

    arrow::Status Seek(int64_t position) override;
    arrow::Result<int64_t> Tell() const override;
    arrow::Result<int64_t> GetSize() override;

    // --- Lifecycle (overrides) ---

    arrow::Status Close() override;
    bool closed() const override;

 private:
    const uint8_t *data_;
    const int64_t size_;
    int64_t tell_;
    bool closed_;
};
}