mirror of https://github.com/milvus-io/milvus.git
177 lines
6.3 KiB
Python
177 lines
6.3 KiB
Python
from engine.model.group_table import GroupTable
|
|
from engine.model.file_table import FileTable
|
|
from engine.controller.raw_file_handler import RawFileHandler
|
|
from engine.controller.group_handler import GroupHandler
|
|
from engine.controller.index_file_handler import IndexFileHandler
|
|
from engine.settings import ROW_LIMIT
|
|
from flask import jsonify
|
|
from engine import db
|
|
import sys, os
|
|
|
|
class VectorEngine(object):
|
|
group_dict = None
|
|
|
|
@staticmethod
|
|
def AddGroup(group_id, dimension):
|
|
group = GroupTable.query.filter(GroupTable.group_name==group_id).first()
|
|
if group:
|
|
print('Already create the group: ', group_id)
|
|
return jsonify({'code': 1, 'group_name': group_id, 'file_number': group.file_number})
|
|
else:
|
|
print('To create the group: ', group_id)
|
|
new_group = GroupTable(group_id, dimension)
|
|
GroupHandler.CreateGroupDirectory(group_id)
|
|
|
|
# add into database
|
|
db.session.add(new_group)
|
|
db.session.commit()
|
|
return jsonify({'code': 0, 'group_name': group_id, 'file_number': 0})
|
|
|
|
|
|
@staticmethod
|
|
def GetGroup(group_id):
|
|
group = GroupTable.query.filter(GroupTable.group_name==group_id).first()
|
|
if group:
|
|
print('Found the group: ', group_id)
|
|
return jsonify({'code': 0, 'group_name': group_id, 'file_number': group.file_number})
|
|
else:
|
|
print('Not found the group: ', group_id)
|
|
return jsonify({'code': 1, 'group_name': group_id, 'file_number': 0}) # not found
|
|
|
|
|
|
@staticmethod
|
|
def DeleteGroup(group_id):
|
|
group = GroupTable.query.filter(GroupTable.group_name==group_id).first()
|
|
if(group):
|
|
# old_group = GroupTable(group_id)
|
|
db.session.delete(group)
|
|
db.session.commit()
|
|
GroupHandler.DeleteGroupDirectory(group_id)
|
|
|
|
records = FileTable.query.filter(FileTable.group_name == group_id).all()
|
|
for record in records:
|
|
print("record.group_name: ", record.group_name)
|
|
db.session.delete(record)
|
|
db.session.commit()
|
|
|
|
return jsonify({'code': 0, 'group_name': group_id, 'file_number': group.file_number})
|
|
else:
|
|
return jsonify({'code': 0, 'group_name': group_id, 'file_number': 0})
|
|
|
|
|
|
@staticmethod
|
|
def GetGroupList():
|
|
group = GroupTable.query.all()
|
|
group_list = []
|
|
for group_tuple in group:
|
|
group_item = {}
|
|
group_item['group_name'] = group_tuple.group_name
|
|
group_item['file_number'] = group_tuple.file_number
|
|
group_list.append(group_item)
|
|
|
|
print(group_list)
|
|
return jsonify(results = group_list)
|
|
|
|
|
|
@staticmethod
|
|
def AddVector(group_id, vector):
|
|
print(group_id, vector)
|
|
file = FileTable.query.filter(FileTable.group_name == group_id).filter(FileTable.type == 'raw').first()
|
|
if file:
|
|
print('insert into exist file')
|
|
# insert into raw file
|
|
VectorEngine.InsertVectorIntoRawFile(group_id, file.filename, vector)
|
|
|
|
# check if the file can be indexed
|
|
if file.row_number + 1 >= ROW_LIMIT:
|
|
# read data from raw file
|
|
data = GetVectorsFromRawFile()
|
|
|
|
# create index
|
|
index_filename = file.filename + '_index'
|
|
CreateIndex(group_id, index_filename, data)
|
|
|
|
# update record into database
|
|
FileTable.query.filter(FileTable.group_name == group_id).filter(FileTable.type == 'raw').update({'row_number':file.row_number + 1, 'type': 'index'})
|
|
pass
|
|
|
|
else:
|
|
# we still can insert into exist raw file, update database
|
|
FileTable.query.filter(FileTable.group_name == group_id).filter(FileTable.type == 'raw').update({'row_number':file.row_number + 1})
|
|
db.session.commit()
|
|
print('Update db for raw file insertion')
|
|
pass
|
|
|
|
else:
|
|
print('add a new raw file')
|
|
# first raw file
|
|
raw_filename = group_id + '.raw'
|
|
# create and insert vector into raw file
|
|
VectorEngine.InsertVectorIntoRawFile(group_id, raw_filename, vector)
|
|
# insert a record into database
|
|
db.session.add(FileTable(group_id, raw_filename, 'raw', 1))
|
|
db.session.commit()
|
|
|
|
return jsonify({'code': 0})
|
|
|
|
|
|
@staticmethod
|
|
def SearchVector(group_id, vector, limit):
|
|
# find all files
|
|
files = FileTable.query.filter(FileTable.group_name == group_id).all()
|
|
|
|
for file in files:
|
|
if(file.type == 'raw'):
|
|
# create index
|
|
# add vector list
|
|
# train
|
|
# get topk
|
|
print('search in raw file: ', file.filename)
|
|
pass
|
|
else:
|
|
# get topk
|
|
print('search in index file: ', file.filename)
|
|
data = IndexFileHandler.Read(file.filename, file.type)
|
|
pass
|
|
|
|
# according to difference files get topk of each
|
|
# reduce the topk from them
|
|
# construct response and send back
|
|
return jsonify({'code': 0})
|
|
|
|
|
|
@staticmethod
|
|
def CreateIndex(group_id):
|
|
# create index
|
|
file = FileTable.query.filter(FileTable.group_name == group_id).filter(FileTable.type == 'raw').first()
|
|
path = GroupHandler.GetGroupDirectory(group_id) + '/' + file.filename
|
|
print('Going to create index for: ', path)
|
|
return jsonify({'code': 0})
|
|
|
|
|
|
@staticmethod
|
|
def InsertVectorIntoRawFile(group_id, filename, vector):
|
|
# print(sys._getframe().f_code.co_name, group_id, vector)
|
|
# path = GroupHandler.GetGroupDirectory(group_id) + '/' + filename
|
|
if VectorEngine.group_dict is None:
|
|
# print("VectorEngine.group_dict is None")
|
|
VectorEngine.group_dict = dict()
|
|
VectorEngine.group_dict[group_id] = []
|
|
|
|
VectorEngine.group_dict[group_id].append(vector)
|
|
|
|
print('InsertVectorIntoRawFile: ', VectorEngine.group_dict[group_id])
|
|
|
|
# if filename exist
|
|
# append
|
|
# if filename not exist
|
|
# create file
|
|
# append
|
|
return filename
|
|
|
|
|
|
@staticmethod
|
|
def GetVectorListFromRawFile(group_id, filename):
|
|
return VectorEngine.group_dict[group_id]
|
|
|