2019-03-24 17:07:38 +08:00

51 lines
1.5 KiB
Python

from engine.retrieval import search_index
from engine.ingestion import build_index
class Singleton(type):
    """Metaclass that hands out one shared instance per class.

    A class declared with ``metaclass=Singleton`` is constructed only on its
    first call; every later call returns that same object and ignores the
    arguments passed to it.
    """

    # Registry mapping each class to its single instance. It lives on the
    # metaclass, so all classes using ``Singleton`` share this one dict.
    _instances = {}

    def __call__(cls, *args, **kwargs):
        """Return the instance registered for ``cls``, creating it if absent."""
        registry = cls._instances
        if cls in registry:
            return registry[cls]
        # First call for this class: run the normal construction path
        # (``__new__`` + ``__init__``) and remember the result.
        created = super().__call__(*args, **kwargs)
        registry[cls] = created
        return created
class Scheduler(metaclass=Singleton):
    """Runs one vector query against several indexes and combines the hits.

    The ``Singleton`` metaclass means every ``Scheduler()`` call returns the
    same object.
    """

    def Search(self, index_file_key, vectors, k):
        """Validate the query arguments and run the search.

        Args:
            index_file_key: Mapping with a ``'raw'`` entry and an ``'index'``
                entry, each an iterable of keys that are passed to
                ``GetRawData`` and ``GetIndexData`` respectively.
            vectors: Query vectors, forwarded unchanged to
                ``search_by_vectors``.
            k: Result count, forwarded unchanged to ``search_by_vectors``
                and ``search_index.top_k``.

        Returns:
            The ``.vectors`` attribute of the only result when exactly one
            index was searched, otherwise the value returned by
            ``search_index.top_k``.

        Raises:
            ValueError: If ``index_file_key`` is empty, ``vectors`` is
                ``None`` or empty, or ``k`` is ``None`` or zero.
        """
        # Explicit checks instead of ``assert``: assertions are removed when
        # Python runs with -O, and ``assert vectors`` itself raises on a
        # multi-element NumPy array because its truth value is ambiguous.
        if not index_file_key:
            raise ValueError("index_file_key must not be empty")
        if self._is_empty(vectors):
            raise ValueError("vectors must not be empty")
        if not k:
            raise ValueError("k must be a non-zero result count")
        return self.__scheduler(index_file_key, vectors, k)

    @staticmethod
    def _is_empty(value):
        """Return True when ``value`` is None or has no elements."""
        if value is None:
            return True
        try:
            return len(value) == 0
        except TypeError:
            # Unsized objects (scalars, 0-d arrays): fall back to truthiness.
            return not value

    @staticmethod
    def _query_index(index, vectors, k):
        """Wrap ``index`` in a ``FaissSearch`` and run the query against it."""
        return search_index.FaissSearch(index).search_by_vectors(vectors, k)

    def __scheduler(self, index_data_key, vectors, k):
        """Search every index named in ``index_data_key`` and merge the hits.

        Keys under ``'raw'`` are processed first, then keys under ``'index'``;
        results are collected in that order.
        """
        # Read both entries up front so a missing key fails before any work.
        raw_data_list = index_data_key['raw']
        index_data_list = index_data_key['index']

        result_list = []
        for key in raw_data_list:
            raw_data, d = self.GetRawData(key)
            # ``FactoryIndex()`` yields a callable; calling it yields the
            # builder whose ``build`` produces the index.
            index_builder = build_index.FactoryIndex()
            # NOTE(review): an index is rebuilt from raw data on every search
            # (the original comment called this step "silly"); presumably
            # built indexes should be cached -- confirm.
            index = index_builder().build(d, raw_data)
            result_list.append(self._query_index(index, vectors, k))

        result_list.extend(
            self._query_index(self.GetIndexData(key), vectors, k)
            for key in index_data_list
        )

        # NOTE(review): the single-result branch returns ``.vectors`` while the
        # merged branch returns whatever ``top_k`` yields -- confirm callers
        # expect both shapes.
        if len(result_list) == 1:
            return result_list[0].vectors
        # NOTE(review): ``sum`` starts from int 0, so the result objects must
        # support ``0 + result``; with no results at all, 0 is passed to
        # ``top_k`` -- confirm both cases are handled there.
        return search_index.top_k(sum(result_list), k)

    def GetIndexData(self, key):
        """Placeholder: currently does nothing and returns None.

        ``__scheduler`` passes the return value straight to ``FaissSearch``.
        TODO: implement loading of the prebuilt index for ``key``.
        """

    def GetRawData(self, key):
        """Placeholder: currently does nothing and returns None.

        ``__scheduler`` unpacks the return value as ``(raw_data, d)``, so an
        implementation must return exactly two items.
        TODO: implement loading of the raw data for ``key``.
        """