milvus/internal/core/src/index/ScalarIndex.h
zhagnlu fc876639cf
enhance: support json stats with shredding design (#42534)
#42533

Co-authored-by: luzhang <luzhang@zilliz.com>
2025-09-01 10:49:52 +08:00

180 lines
4.8 KiB
C++

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once
#include <boost/dynamic_bitset.hpp>
#include <map>
#include <memory>
#include <string>
#include "common/Types.h"
#include "common/EasyAssert.h"
#include "index/Index.h"
#include "fmt/format.h"
#include "index/Meta.h"
namespace milvus::index {
enum class ScalarIndexType {
NONE = 0,
BITMAP,
STLSORT,
MARISA,
INVERTED,
HYBRID,
JSONSTATS,
};
inline std::string
ToString(ScalarIndexType type) {
switch (type) {
case ScalarIndexType::NONE:
return "NONE";
case ScalarIndexType::BITMAP:
return "BITMAP";
case ScalarIndexType::STLSORT:
return "STLSORT";
case ScalarIndexType::MARISA:
return "MARISA";
case ScalarIndexType::INVERTED:
return "INVERTED";
case ScalarIndexType::HYBRID:
return "HYBRID";
default:
return "UNKNOWN";
}
}
template <typename T>
class ScalarIndex : public IndexBase {
public:
ScalarIndex(const std::string& index_type) : IndexBase(index_type) {
}
void
BuildWithRawDataForUT(size_t n,
const void* values,
const Config& config = {}) override;
void
BuildWithDataset(const DatasetPtr& dataset,
const Config& config = {}) override {
ThrowInfo(Unsupported,
"scalar index don't support build index with dataset");
};
public:
virtual ScalarIndexType
GetIndexType() const = 0;
virtual void
Build(size_t n, const T* values, const bool* valid_data = nullptr) = 0;
virtual const TargetBitmap
In(size_t n, const T* values) = 0;
virtual const TargetBitmap
IsNull() = 0;
virtual TargetBitmap
IsNotNull() = 0;
virtual const TargetBitmap
InApplyFilter(size_t n,
const T* values,
const std::function<bool(size_t /* offset */)>& filter) {
ThrowInfo(ErrorCode::Unsupported, "InApplyFilter is not implemented");
}
virtual void
InApplyCallback(size_t n,
const T* values,
const std::function<void(size_t /* offset */)>& callback) {
ThrowInfo(ErrorCode::Unsupported, "InApplyCallback is not implemented");
}
virtual const TargetBitmap
NotIn(size_t n, const T* values) = 0;
virtual const TargetBitmap
Range(T value, OpType op) = 0;
virtual const TargetBitmap
Range(T lower_bound_value,
bool lb_inclusive,
T upper_bound_value,
bool ub_inclusive) = 0;
virtual std::optional<T>
Reverse_Lookup(size_t offset) const = 0;
virtual const TargetBitmap
Query(const DatasetPtr& dataset);
virtual bool
SupportPatternMatch() const {
return false;
}
virtual const TargetBitmap
PatternMatch(const std::string& pattern, proto::plan::OpType op) {
ThrowInfo(Unsupported, "pattern match is not supported");
}
virtual bool
IsMmapSupported() const override {
return index_type_ == milvus::index::BITMAP_INDEX_TYPE ||
index_type_ == milvus::index::HYBRID_INDEX_TYPE ||
index_type_ == milvus::index::INVERTED_INDEX_TYPE ||
index_type_ == milvus::index::MARISA_TRIE ||
index_type_ == milvus::index::MARISA_TRIE_UPPER;
}
virtual int64_t
Size() = 0;
virtual bool
SupportRegexQuery() const {
return false;
}
virtual bool
TryUseRegexQuery() const {
return true;
}
virtual const TargetBitmap
RegexQuery(const std::string& pattern) {
ThrowInfo(Unsupported, "regex query is not supported");
}
virtual void
BuildWithFieldData(const std::vector<FieldDataPtr>& field_datas) {
ThrowInfo(Unsupported, "BuildwithFieldData is not supported");
}
virtual void
LoadWithoutAssemble(const BinarySet& binary_set, const Config& config) {
ThrowInfo(Unsupported, "LoadWithoutAssemble is not supported");
}
};
template <typename T>
using ScalarIndexPtr = std::unique_ptr<ScalarIndex<T>>;
} // namespace milvus::index