mirror of https://github.com/milvus-io/milvus.git
2074 lines
73 KiB
C++
2074 lines
73 KiB
C++
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License.
|
|
|
|
#include "db/DBImpl.h"
|
|
|
|
#include <assert.h>
|
|
#include <fiu-local.h>
|
|
|
|
#include <algorithm>
|
|
#include <boost/filesystem.hpp>
|
|
#include <chrono>
|
|
#include <cstring>
|
|
#include <functional>
|
|
#include <iostream>
|
|
#include <limits>
|
|
#include <set>
|
|
#include <thread>
|
|
#include <utility>
|
|
|
|
#include "Utils.h"
|
|
#include "cache/CpuCacheMgr.h"
|
|
#include "cache/GpuCacheMgr.h"
|
|
#include "db/IDGenerator.h"
|
|
#include "engine/EngineFactory.h"
|
|
#include "index/thirdparty/faiss/utils/distances.h"
|
|
#include "insert/MemMenagerFactory.h"
|
|
#include "meta/MetaConsts.h"
|
|
#include "meta/MetaFactory.h"
|
|
#include "meta/SqliteMetaImpl.h"
|
|
#include "metrics/Metrics.h"
|
|
#include "scheduler/SchedInst.h"
|
|
#include "scheduler/job/BuildIndexJob.h"
|
|
#include "scheduler/job/DeleteJob.h"
|
|
#include "scheduler/job/SearchJob.h"
|
|
#include "segment/SegmentReader.h"
|
|
#include "segment/SegmentWriter.h"
|
|
#include "utils/Exception.h"
|
|
#include "utils/Log.h"
|
|
#include "utils/StringHelpFunctions.h"
|
|
#include "utils/TimeRecorder.h"
|
|
#include "utils/ValidationUtil.h"
|
|
#include "wal/WalDefinations.h"
|
|
|
|
namespace milvus {
|
|
namespace engine {
|
|
|
|
namespace {
|
|
|
|
constexpr uint64_t METRIC_ACTION_INTERVAL = 1;
|
|
constexpr uint64_t COMPACT_ACTION_INTERVAL = 1;
|
|
constexpr uint64_t INDEX_ACTION_INTERVAL = 1;
|
|
|
|
static const Status SHUTDOWN_ERROR = Status(DB_ERROR, "Milvus server is shutdown!");
|
|
|
|
} // namespace
|
|
|
|
DBImpl::DBImpl(const DBOptions& options)
|
|
: options_(options), initialized_(false), merge_thread_pool_(1, 1), index_thread_pool_(1, 1) {
|
|
meta_ptr_ = MetaFactory::Build(options.meta_, options.mode_);
|
|
mem_mgr_ = MemManagerFactory::Build(meta_ptr_, options_);
|
|
|
|
if (options_.wal_enable_) {
|
|
wal::MXLogConfiguration mxlog_config;
|
|
mxlog_config.recovery_error_ignore = options_.recovery_error_ignore_;
|
|
// 2 buffers in the WAL
|
|
mxlog_config.buffer_size = options_.buffer_size_ / 2;
|
|
mxlog_config.mxlog_path = options_.mxlog_path_;
|
|
wal_mgr_ = std::make_shared<wal::WalManager>(mxlog_config);
|
|
}
|
|
|
|
SetIdentity("DBImpl");
|
|
AddCacheInsertDataListener();
|
|
AddUseBlasThresholdListener();
|
|
|
|
Start();
|
|
}
|
|
|
|
DBImpl::~DBImpl() {
|
|
Stop();
|
|
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////
|
|
// external api
|
|
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////
|
|
Status
|
|
DBImpl::Start() {
|
|
if (initialized_.load(std::memory_order_acquire)) {
|
|
return Status::OK();
|
|
}
|
|
|
|
// ENGINE_LOG_TRACE << "DB service start";
|
|
initialized_.store(true, std::memory_order_release);
|
|
|
|
// wal
|
|
if (options_.wal_enable_) {
|
|
auto error_code = DB_ERROR;
|
|
if (wal_mgr_ != nullptr) {
|
|
error_code = wal_mgr_->Init(meta_ptr_);
|
|
}
|
|
if (error_code != WAL_SUCCESS) {
|
|
throw Exception(error_code, "Wal init error!");
|
|
}
|
|
|
|
// recovery
|
|
while (1) {
|
|
wal::MXLogRecord record;
|
|
auto error_code = wal_mgr_->GetNextRecovery(record);
|
|
if (error_code != WAL_SUCCESS) {
|
|
throw Exception(error_code, "Wal recovery error!");
|
|
}
|
|
if (record.type == wal::MXLogType::None) {
|
|
break;
|
|
}
|
|
|
|
ExecWalRecord(record);
|
|
}
|
|
|
|
// for distribute version, some nodes are read only
|
|
if (options_.mode_ != DBOptions::MODE::CLUSTER_READONLY) {
|
|
// background thread
|
|
bg_wal_thread_ = std::thread(&DBImpl::BackgroundWalTask, this);
|
|
}
|
|
|
|
} else {
|
|
// for distribute version, some nodes are read only
|
|
if (options_.mode_ != DBOptions::MODE::CLUSTER_READONLY) {
|
|
// ENGINE_LOG_TRACE << "StartTimerTasks";
|
|
bg_timer_thread_ = std::thread(&DBImpl::BackgroundTimerTask, this);
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::Stop() {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return Status::OK();
|
|
}
|
|
|
|
initialized_.store(false, std::memory_order_release);
|
|
|
|
if (options_.mode_ != DBOptions::MODE::CLUSTER_READONLY) {
|
|
if (options_.wal_enable_) {
|
|
// wait flush merge/buildindex finish
|
|
bg_task_swn_.Notify();
|
|
bg_wal_thread_.join();
|
|
|
|
} else {
|
|
// flush all
|
|
wal::MXLogRecord record;
|
|
record.type = wal::MXLogType::Flush;
|
|
ExecWalRecord(record);
|
|
|
|
// wait merge/buildindex finish
|
|
bg_task_swn_.Notify();
|
|
bg_timer_thread_.join();
|
|
}
|
|
|
|
meta_ptr_->CleanUpShadowFiles();
|
|
}
|
|
|
|
// ENGINE_LOG_TRACE << "DB service stop";
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropAll() {
|
|
return meta_ptr_->DropAll();
|
|
}
|
|
|
|
Status
|
|
DBImpl::CreateCollection(meta::CollectionSchema& collection_schema) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
meta::CollectionSchema temp_schema = collection_schema;
|
|
temp_schema.index_file_size_ *= ONE_MB; // store as MB
|
|
if (options_.wal_enable_) {
|
|
temp_schema.flush_lsn_ = wal_mgr_->CreateCollection(collection_schema.collection_id_);
|
|
}
|
|
|
|
return meta_ptr_->CreateCollection(temp_schema);
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropCollection(const std::string& collection_id) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
if (options_.wal_enable_) {
|
|
wal_mgr_->DropCollection(collection_id);
|
|
}
|
|
|
|
return DropCollectionRecursively(collection_id);
|
|
}
|
|
|
|
Status
|
|
DBImpl::DescribeCollection(meta::CollectionSchema& collection_schema) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
auto stat = meta_ptr_->DescribeCollection(collection_schema);
|
|
collection_schema.index_file_size_ /= ONE_MB; // return as MB
|
|
return stat;
|
|
}
|
|
|
|
Status
|
|
DBImpl::HasCollection(const std::string& collection_id, bool& has_or_not) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
return meta_ptr_->HasCollection(collection_id, has_or_not);
|
|
}
|
|
|
|
Status
|
|
DBImpl::HasNativeCollection(const std::string& collection_id, bool& has_or_not_) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
engine::meta::CollectionSchema collection_schema;
|
|
collection_schema.collection_id_ = collection_id;
|
|
auto status = DescribeCollection(collection_schema);
|
|
if (!status.ok()) {
|
|
has_or_not_ = false;
|
|
return status;
|
|
} else {
|
|
if (!collection_schema.owner_collection_.empty()) {
|
|
has_or_not_ = false;
|
|
return Status(DB_NOT_FOUND, "");
|
|
}
|
|
|
|
has_or_not_ = true;
|
|
return Status::OK();
|
|
}
|
|
}
|
|
|
|
Status
|
|
DBImpl::AllCollections(std::vector<meta::CollectionSchema>& collection_schema_array) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
std::vector<meta::CollectionSchema> all_collections;
|
|
auto status = meta_ptr_->AllCollections(all_collections);
|
|
|
|
// only return real collections, dont return partition collections
|
|
collection_schema_array.clear();
|
|
for (auto& schema : all_collections) {
|
|
if (schema.owner_collection_.empty()) {
|
|
collection_schema_array.push_back(schema);
|
|
}
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetCollectionInfo(const std::string& collection_id, CollectionInfo& collection_info) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
// step1: get all partition ids
|
|
std::vector<std::pair<std::string, std::string>> name2tag = {{collection_id, milvus::engine::DEFAULT_PARTITON_TAG}};
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
auto status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
name2tag.push_back(std::make_pair(schema.collection_id_, schema.partition_tag_));
|
|
}
|
|
|
|
// step2: get native collection info
|
|
std::vector<int> file_types{meta::SegmentSchema::FILE_TYPE::RAW, meta::SegmentSchema::FILE_TYPE::TO_INDEX,
|
|
meta::SegmentSchema::FILE_TYPE::INDEX};
|
|
|
|
static std::map<int32_t, std::string> index_type_name = {
|
|
{(int32_t)engine::EngineType::FAISS_IDMAP, "IDMAP"},
|
|
{(int32_t)engine::EngineType::FAISS_IVFFLAT, "IVFFLAT"},
|
|
{(int32_t)engine::EngineType::FAISS_IVFSQ8, "IVFSQ8"},
|
|
{(int32_t)engine::EngineType::NSG_MIX, "NSG"},
|
|
{(int32_t)engine::EngineType::ANNOY, "ANNOY"},
|
|
{(int32_t)engine::EngineType::FAISS_IVFSQ8H, "IVFSQ8H"},
|
|
{(int32_t)engine::EngineType::FAISS_PQ, "PQ"},
|
|
{(int32_t)engine::EngineType::SPTAG_KDT, "KDT"},
|
|
{(int32_t)engine::EngineType::SPTAG_BKT, "BKT"},
|
|
{(int32_t)engine::EngineType::FAISS_BIN_IDMAP, "IDMAP"},
|
|
{(int32_t)engine::EngineType::FAISS_BIN_IVFFLAT, "IVFFLAT"},
|
|
};
|
|
|
|
for (auto& name_tag : name2tag) {
|
|
meta::SegmentsSchema collection_files;
|
|
status = meta_ptr_->FilesByType(name_tag.first, file_types, collection_files);
|
|
if (!status.ok()) {
|
|
std::string err_msg = "Failed to get collection info: " + status.ToString();
|
|
ENGINE_LOG_ERROR << err_msg;
|
|
return Status(DB_ERROR, err_msg);
|
|
}
|
|
|
|
std::vector<SegmentStat> segments_stat;
|
|
for (auto& file : collection_files) {
|
|
SegmentStat seg_stat;
|
|
seg_stat.name_ = file.segment_id_;
|
|
seg_stat.row_count_ = (int64_t)file.row_count_;
|
|
seg_stat.index_name_ = index_type_name[file.engine_type_];
|
|
seg_stat.data_size_ = (int64_t)file.file_size_;
|
|
segments_stat.emplace_back(seg_stat);
|
|
}
|
|
|
|
PartitionStat partition_stat;
|
|
if (name_tag.first == collection_id) {
|
|
partition_stat.tag_ = milvus::engine::DEFAULT_PARTITON_TAG;
|
|
} else {
|
|
partition_stat.tag_ = name_tag.second;
|
|
}
|
|
|
|
partition_stat.segments_stat_.swap(segments_stat);
|
|
collection_info.partitions_stat_.emplace_back(partition_stat);
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::PreloadCollection(const std::string& collection_id) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
// step 1: get all collection files from parent collection
|
|
meta::SegmentsSchema files_array;
|
|
auto status = GetFilesToSearch(collection_id, files_array);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// step 2: get files from partition collections
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
status = GetFilesToSearch(schema.collection_id_, files_array);
|
|
}
|
|
|
|
int64_t size = 0;
|
|
int64_t cache_total = cache::CpuCacheMgr::GetInstance()->CacheCapacity();
|
|
int64_t cache_usage = cache::CpuCacheMgr::GetInstance()->CacheUsage();
|
|
int64_t available_size = cache_total - cache_usage;
|
|
|
|
// step 3: load file one by one
|
|
ENGINE_LOG_DEBUG << "Begin pre-load collection:" + collection_id + ", totally " << files_array.size()
|
|
<< " files need to be pre-loaded";
|
|
TimeRecorderAuto rc("Pre-load collection:" + collection_id);
|
|
for (auto& file : files_array) {
|
|
EngineType engine_type;
|
|
if (file.file_type_ == meta::SegmentSchema::FILE_TYPE::RAW ||
|
|
file.file_type_ == meta::SegmentSchema::FILE_TYPE::TO_INDEX ||
|
|
file.file_type_ == meta::SegmentSchema::FILE_TYPE::BACKUP) {
|
|
engine_type =
|
|
utils::IsBinaryMetricType(file.metric_type_) ? EngineType::FAISS_BIN_IDMAP : EngineType::FAISS_IDMAP;
|
|
} else {
|
|
engine_type = (EngineType)file.engine_type_;
|
|
}
|
|
|
|
auto json = milvus::json::parse(file.index_params_);
|
|
ExecutionEnginePtr engine =
|
|
EngineFactory::Build(file.dimension_, file.location_, engine_type, (MetricType)file.metric_type_, json);
|
|
fiu_do_on("DBImpl.PreloadCollection.null_engine", engine = nullptr);
|
|
if (engine == nullptr) {
|
|
ENGINE_LOG_ERROR << "Invalid engine type";
|
|
return Status(DB_ERROR, "Invalid engine type");
|
|
}
|
|
|
|
fiu_do_on("DBImpl.PreloadCollection.exceed_cache", size = available_size + 1);
|
|
|
|
try {
|
|
fiu_do_on("DBImpl.PreloadCollection.engine_throw_exception", throw std::exception());
|
|
std::string msg = "Pre-loaded file: " + file.file_id_ + " size: " + std::to_string(file.file_size_);
|
|
TimeRecorderAuto rc_1(msg);
|
|
engine->Load(true);
|
|
|
|
size += engine->Size();
|
|
if (size > available_size) {
|
|
ENGINE_LOG_DEBUG << "Pre-load cancelled since cache is almost full";
|
|
return Status(SERVER_CACHE_FULL, "Cache is full");
|
|
}
|
|
} catch (std::exception& ex) {
|
|
std::string msg = "Pre-load collection encounter exception: " + std::string(ex.what());
|
|
ENGINE_LOG_ERROR << msg;
|
|
return Status(DB_ERROR, msg);
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::UpdateCollectionFlag(const std::string& collection_id, int64_t flag) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
return meta_ptr_->UpdateCollectionFlag(collection_id, flag);
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetCollectionRowCount(const std::string& collection_id, uint64_t& row_count) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
return GetCollectionRowCountRecursively(collection_id, row_count);
|
|
}
|
|
|
|
Status
|
|
DBImpl::CreatePartition(const std::string& collection_id, const std::string& partition_name,
|
|
const std::string& partition_tag) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
uint64_t lsn = 0;
|
|
meta_ptr_->GetCollectionFlushLSN(collection_id, lsn);
|
|
return meta_ptr_->CreatePartition(collection_id, partition_name, partition_tag, lsn);
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropPartition(const std::string& partition_name) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
mem_mgr_->EraseMemVector(partition_name); // not allow insert
|
|
auto status = meta_ptr_->DropPartition(partition_name); // soft delete collection
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << status.message();
|
|
return status;
|
|
}
|
|
|
|
// scheduler will determine when to delete collection files
|
|
auto nres = scheduler::ResMgrInst::GetInstance()->GetNumOfComputeResource();
|
|
scheduler::DeleteJobPtr job = std::make_shared<scheduler::DeleteJob>(partition_name, meta_ptr_, nres);
|
|
scheduler::JobMgrInst::GetInstance()->Put(job);
|
|
job->WaitAndDelete();
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropPartitionByTag(const std::string& collection_id, const std::string& partition_tag) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
std::string partition_name;
|
|
auto status = meta_ptr_->GetPartitionName(collection_id, partition_tag, partition_name);
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << status.message();
|
|
return status;
|
|
}
|
|
|
|
return DropPartition(partition_name);
|
|
}
|
|
|
|
Status
|
|
DBImpl::ShowPartitions(const std::string& collection_id, std::vector<meta::CollectionSchema>& partition_schema_array) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
return meta_ptr_->ShowPartitions(collection_id, partition_schema_array);
|
|
}
|
|
|
|
Status
|
|
DBImpl::InsertVectors(const std::string& collection_id, const std::string& partition_tag, VectorsData& vectors) {
|
|
// ENGINE_LOG_DEBUG << "Insert " << n << " vectors to cache";
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
// insert vectors into target collection
|
|
// (zhiru): generate ids
|
|
if (vectors.id_array_.empty()) {
|
|
SafeIDGenerator& id_generator = SafeIDGenerator::GetInstance();
|
|
Status status = id_generator.GetNextIDNumbers(vectors.vector_count_, vectors.id_array_);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
|
|
Status status;
|
|
if (options_.wal_enable_) {
|
|
std::string target_collection_name;
|
|
status = GetPartitionByTag(collection_id, partition_tag, target_collection_name);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
if (!vectors.float_data_.empty()) {
|
|
wal_mgr_->Insert(collection_id, partition_tag, vectors.id_array_, vectors.float_data_);
|
|
} else if (!vectors.binary_data_.empty()) {
|
|
wal_mgr_->Insert(collection_id, partition_tag, vectors.id_array_, vectors.binary_data_);
|
|
}
|
|
bg_task_swn_.Notify();
|
|
|
|
} else {
|
|
wal::MXLogRecord record;
|
|
record.lsn = 0; // need to get from meta ?
|
|
record.collection_id = collection_id;
|
|
record.partition_tag = partition_tag;
|
|
record.ids = vectors.id_array_.data();
|
|
record.length = vectors.vector_count_;
|
|
if (vectors.binary_data_.empty()) {
|
|
record.type = wal::MXLogType::InsertVector;
|
|
record.data = vectors.float_data_.data();
|
|
record.data_size = vectors.float_data_.size() * sizeof(float);
|
|
} else {
|
|
record.type = wal::MXLogType::InsertBinary;
|
|
record.ids = vectors.id_array_.data();
|
|
record.length = vectors.vector_count_;
|
|
record.data = vectors.binary_data_.data();
|
|
record.data_size = vectors.binary_data_.size() * sizeof(uint8_t);
|
|
}
|
|
|
|
status = ExecWalRecord(record);
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::DeleteVector(const std::string& collection_id, IDNumber vector_id) {
|
|
IDNumbers ids;
|
|
ids.push_back(vector_id);
|
|
return DeleteVectors(collection_id, ids);
|
|
}
|
|
|
|
Status
|
|
DBImpl::DeleteVectors(const std::string& collection_id, IDNumbers vector_ids) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
Status status;
|
|
if (options_.wal_enable_) {
|
|
wal_mgr_->DeleteById(collection_id, vector_ids);
|
|
bg_task_swn_.Notify();
|
|
|
|
} else {
|
|
wal::MXLogRecord record;
|
|
record.lsn = 0; // need to get from meta ?
|
|
record.type = wal::MXLogType::Delete;
|
|
record.collection_id = collection_id;
|
|
record.ids = vector_ids.data();
|
|
record.length = vector_ids.size();
|
|
|
|
status = ExecWalRecord(record);
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::Flush(const std::string& collection_id) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
Status status;
|
|
bool has_collection;
|
|
status = HasCollection(collection_id, has_collection);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
if (!has_collection) {
|
|
ENGINE_LOG_ERROR << "Collection to flush does not exist: " << collection_id;
|
|
return Status(DB_NOT_FOUND, "Collection to flush does not exist");
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Begin flush collection: " << collection_id;
|
|
|
|
if (options_.wal_enable_) {
|
|
ENGINE_LOG_DEBUG << "WAL flush";
|
|
auto lsn = wal_mgr_->Flush(collection_id);
|
|
ENGINE_LOG_DEBUG << "wal_mgr_->Flush";
|
|
if (lsn != 0) {
|
|
bg_task_swn_.Notify();
|
|
flush_task_swn_.Wait();
|
|
ENGINE_LOG_DEBUG << "flush_task_swn_.Wait()";
|
|
}
|
|
|
|
} else {
|
|
ENGINE_LOG_DEBUG << "MemTable flush";
|
|
wal::MXLogRecord record;
|
|
record.type = wal::MXLogType::Flush;
|
|
record.collection_id = collection_id;
|
|
status = ExecWalRecord(record);
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "End flush collection: " << collection_id;
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::Flush() {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Begin flush all collections";
|
|
|
|
Status status;
|
|
if (options_.wal_enable_) {
|
|
ENGINE_LOG_DEBUG << "WAL flush";
|
|
auto lsn = wal_mgr_->Flush();
|
|
if (lsn != 0) {
|
|
bg_task_swn_.Notify();
|
|
flush_task_swn_.Wait();
|
|
}
|
|
} else {
|
|
ENGINE_LOG_DEBUG << "MemTable flush";
|
|
wal::MXLogRecord record;
|
|
record.type = wal::MXLogType::Flush;
|
|
status = ExecWalRecord(record);
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "End flush all collections";
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::Compact(const std::string& collection_id) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
engine::meta::CollectionSchema collection_schema;
|
|
collection_schema.collection_id_ = collection_id;
|
|
auto status = DescribeCollection(collection_schema);
|
|
if (!status.ok()) {
|
|
if (status.code() == DB_NOT_FOUND) {
|
|
ENGINE_LOG_ERROR << "Collection to compact does not exist: " << collection_id;
|
|
return Status(DB_NOT_FOUND, "Collection to compact does not exist");
|
|
} else {
|
|
return status;
|
|
}
|
|
} else {
|
|
if (!collection_schema.owner_collection_.empty()) {
|
|
ENGINE_LOG_ERROR << "Collection to compact does not exist: " << collection_id;
|
|
return Status(DB_NOT_FOUND, "Collection to compact does not exist");
|
|
}
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Before compacting, wait for build index thread to finish...";
|
|
|
|
// WaitBuildIndexFinish();
|
|
|
|
const std::lock_guard<std::mutex> index_lock(build_index_mutex_);
|
|
const std::lock_guard<std::mutex> merge_lock(flush_merge_compact_mutex_);
|
|
|
|
ENGINE_LOG_DEBUG << "Compacting collection: " << collection_id;
|
|
|
|
// Get files to compact from meta.
|
|
std::vector<int> file_types{meta::SegmentSchema::FILE_TYPE::RAW, meta::SegmentSchema::FILE_TYPE::TO_INDEX,
|
|
meta::SegmentSchema::FILE_TYPE::BACKUP};
|
|
meta::SegmentsSchema files_to_compact;
|
|
status = meta_ptr_->FilesByType(collection_id, file_types, files_to_compact);
|
|
if (!status.ok()) {
|
|
std::string err_msg = "Failed to get files to compact: " + status.message();
|
|
ENGINE_LOG_ERROR << err_msg;
|
|
return Status(DB_ERROR, err_msg);
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Found " << files_to_compact.size() << " segment to compact";
|
|
|
|
OngoingFileChecker::GetInstance().MarkOngoingFiles(files_to_compact);
|
|
|
|
Status compact_status;
|
|
for (auto iter = files_to_compact.begin(); iter != files_to_compact.end();) {
|
|
meta::SegmentSchema file = *iter;
|
|
iter = files_to_compact.erase(iter);
|
|
|
|
// Check if the segment needs compacting
|
|
std::string segment_dir;
|
|
utils::GetParentPath(file.location_, segment_dir);
|
|
|
|
segment::SegmentReader segment_reader(segment_dir);
|
|
size_t deleted_docs_size;
|
|
status = segment_reader.ReadDeletedDocsSize(deleted_docs_size);
|
|
if (!status.ok()) {
|
|
OngoingFileChecker::GetInstance().UnmarkOngoingFile(file);
|
|
continue; // skip this file and try compact next one
|
|
}
|
|
|
|
meta::SegmentsSchema files_to_update;
|
|
if (deleted_docs_size != 0) {
|
|
compact_status = CompactFile(collection_id, file, files_to_update);
|
|
|
|
if (!compact_status.ok()) {
|
|
ENGINE_LOG_ERROR << "Compact failed for segment " << file.segment_id_ << ": "
|
|
<< compact_status.message();
|
|
OngoingFileChecker::GetInstance().UnmarkOngoingFile(file);
|
|
continue; // skip this file and try compact next one
|
|
}
|
|
} else {
|
|
OngoingFileChecker::GetInstance().UnmarkOngoingFile(file);
|
|
ENGINE_LOG_DEBUG << "Segment " << file.segment_id_ << " has no deleted data. No need to compact";
|
|
continue; // skip this file and try compact next one
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Updating meta after compaction...";
|
|
status = meta_ptr_->UpdateCollectionFiles(files_to_update);
|
|
OngoingFileChecker::GetInstance().UnmarkOngoingFile(file);
|
|
if (!status.ok()) {
|
|
compact_status = status;
|
|
break; // meta error, could not go on
|
|
}
|
|
}
|
|
|
|
OngoingFileChecker::GetInstance().UnmarkOngoingFiles(files_to_compact);
|
|
|
|
if (compact_status.ok()) {
|
|
ENGINE_LOG_DEBUG << "Finished compacting collection: " << collection_id;
|
|
}
|
|
|
|
return compact_status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::CompactFile(const std::string& collection_id, const meta::SegmentSchema& file,
|
|
meta::SegmentsSchema& files_to_update) {
|
|
ENGINE_LOG_DEBUG << "Compacting segment " << file.segment_id_ << " for collection: " << collection_id;
|
|
|
|
// Create new collection file
|
|
meta::SegmentSchema compacted_file;
|
|
compacted_file.collection_id_ = collection_id;
|
|
// compacted_file.date_ = date;
|
|
compacted_file.file_type_ = meta::SegmentSchema::NEW_MERGE; // TODO: use NEW_MERGE for now
|
|
Status status = meta_ptr_->CreateCollectionFile(compacted_file);
|
|
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to create collection file: " << status.message();
|
|
return status;
|
|
}
|
|
|
|
// Compact (merge) file to the newly created collection file
|
|
|
|
std::string new_segment_dir;
|
|
utils::GetParentPath(compacted_file.location_, new_segment_dir);
|
|
auto segment_writer_ptr = std::make_shared<segment::SegmentWriter>(new_segment_dir);
|
|
|
|
std::string segment_dir_to_merge;
|
|
utils::GetParentPath(file.location_, segment_dir_to_merge);
|
|
|
|
ENGINE_LOG_DEBUG << "Compacting begin...";
|
|
segment_writer_ptr->Merge(segment_dir_to_merge, compacted_file.file_id_);
|
|
|
|
// Serialize
|
|
ENGINE_LOG_DEBUG << "Serializing compacted segment...";
|
|
status = segment_writer_ptr->Serialize();
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to serialize compacted segment: " << status.message();
|
|
compacted_file.file_type_ = meta::SegmentSchema::TO_DELETE;
|
|
auto mark_status = meta_ptr_->UpdateCollectionFile(compacted_file);
|
|
if (mark_status.ok()) {
|
|
ENGINE_LOG_DEBUG << "Mark file: " << compacted_file.file_id_ << " to to_delete";
|
|
}
|
|
return status;
|
|
}
|
|
|
|
// Update collection files state
|
|
// if index type isn't IDMAP, set file type to TO_INDEX if file size exceed index_file_size
|
|
// else set file type to RAW, no need to build index
|
|
if (!utils::IsRawIndexType(compacted_file.engine_type_)) {
|
|
compacted_file.file_type_ = (segment_writer_ptr->Size() >= compacted_file.index_file_size_)
|
|
? meta::SegmentSchema::TO_INDEX
|
|
: meta::SegmentSchema::RAW;
|
|
} else {
|
|
compacted_file.file_type_ = meta::SegmentSchema::RAW;
|
|
}
|
|
compacted_file.file_size_ = segment_writer_ptr->Size();
|
|
compacted_file.row_count_ = segment_writer_ptr->VectorCount();
|
|
|
|
if (compacted_file.row_count_ == 0) {
|
|
ENGINE_LOG_DEBUG << "Compacted segment is empty. Mark it as TO_DELETE";
|
|
compacted_file.file_type_ = meta::SegmentSchema::TO_DELETE;
|
|
}
|
|
|
|
files_to_update.emplace_back(compacted_file);
|
|
|
|
// Set all files in segment to TO_DELETE
|
|
auto& segment_id = file.segment_id_;
|
|
meta::SegmentsSchema segment_files;
|
|
status = meta_ptr_->GetCollectionFilesBySegmentId(segment_id, segment_files);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
for (auto& f : segment_files) {
|
|
f.file_type_ = meta::SegmentSchema::FILE_TYPE::TO_DELETE;
|
|
files_to_update.emplace_back(f);
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Compacted segment " << compacted_file.segment_id_ << " from "
|
|
<< std::to_string(file.file_size_) << " bytes to " << std::to_string(compacted_file.file_size_)
|
|
<< " bytes";
|
|
|
|
if (options_.insert_cache_immediately_) {
|
|
segment_writer_ptr->Cache();
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetVectorByID(const std::string& collection_id, const IDNumber& vector_id, VectorsData& vector) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
bool has_collection;
|
|
auto status = HasCollection(collection_id, has_collection);
|
|
if (!has_collection) {
|
|
ENGINE_LOG_ERROR << "Collection " << collection_id << " does not exist: ";
|
|
return Status(DB_NOT_FOUND, "Collection does not exist");
|
|
}
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
meta::SegmentsSchema files_to_query;
|
|
|
|
std::vector<int> file_types{meta::SegmentSchema::FILE_TYPE::RAW, meta::SegmentSchema::FILE_TYPE::TO_INDEX,
|
|
meta::SegmentSchema::FILE_TYPE::BACKUP};
|
|
meta::SegmentsSchema collection_files;
|
|
status = meta_ptr_->FilesByType(collection_id, file_types, files_to_query);
|
|
if (!status.ok()) {
|
|
std::string err_msg = "Failed to get files for GetVectorByID: " + status.message();
|
|
ENGINE_LOG_ERROR << err_msg;
|
|
return status;
|
|
}
|
|
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
meta::SegmentsSchema files;
|
|
status = meta_ptr_->FilesByType(schema.collection_id_, file_types, files);
|
|
if (!status.ok()) {
|
|
std::string err_msg = "Failed to get files for GetVectorByID: " + status.message();
|
|
ENGINE_LOG_ERROR << err_msg;
|
|
return status;
|
|
}
|
|
files_to_query.insert(files_to_query.end(), std::make_move_iterator(files.begin()),
|
|
std::make_move_iterator(files.end()));
|
|
}
|
|
|
|
if (files_to_query.empty()) {
|
|
ENGINE_LOG_DEBUG << "No files to get vector by id from";
|
|
return Status::OK();
|
|
}
|
|
|
|
cache::CpuCacheMgr::GetInstance()->PrintInfo();
|
|
OngoingFileChecker::GetInstance().MarkOngoingFiles(files_to_query);
|
|
|
|
status = GetVectorByIdHelper(collection_id, vector_id, vector, files_to_query);
|
|
|
|
OngoingFileChecker::GetInstance().UnmarkOngoingFiles(files_to_query);
|
|
cache::CpuCacheMgr::GetInstance()->PrintInfo();
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetVectorIDs(const std::string& collection_id, const std::string& segment_id, IDNumbers& vector_ids) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
// step 1: check collection existence
|
|
bool has_collection;
|
|
auto status = HasCollection(collection_id, has_collection);
|
|
if (!has_collection) {
|
|
ENGINE_LOG_ERROR << "Collection " << collection_id << " does not exist: ";
|
|
return Status(DB_NOT_FOUND, "Collection does not exist");
|
|
}
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// step 2: find segment
|
|
meta::SegmentsSchema collection_files;
|
|
status = meta_ptr_->GetCollectionFilesBySegmentId(segment_id, collection_files);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
if (collection_files.empty()) {
|
|
return Status(DB_NOT_FOUND, "Segment does not exist");
|
|
}
|
|
|
|
// check the segment is belong to this collection
|
|
if (collection_files[0].collection_id_ != collection_id) {
|
|
// the segment could be in a partition under this collection
|
|
meta::CollectionSchema collection_schema;
|
|
collection_schema.collection_id_ = collection_files[0].collection_id_;
|
|
status = DescribeCollection(collection_schema);
|
|
if (collection_schema.owner_collection_ != collection_id) {
|
|
return Status(DB_NOT_FOUND, "Segment does not belong to this collection");
|
|
}
|
|
}
|
|
|
|
// step 3: load segment ids and delete offset
|
|
std::string segment_dir;
|
|
engine::utils::GetParentPath(collection_files[0].location_, segment_dir);
|
|
segment::SegmentReader segment_reader(segment_dir);
|
|
|
|
std::vector<segment::doc_id_t> uids;
|
|
status = segment_reader.LoadUids(uids);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
segment::DeletedDocsPtr deleted_docs_ptr;
|
|
status = segment_reader.LoadDeletedDocs(deleted_docs_ptr);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// step 4: construct id array
|
|
// avoid duplicate offset and erase from max offset to min offset
|
|
auto& deleted_offset = deleted_docs_ptr->GetDeletedDocs();
|
|
std::set<segment::offset_t, std::greater<segment::offset_t>> ordered_offset;
|
|
for (segment::offset_t offset : deleted_offset) {
|
|
ordered_offset.insert(offset);
|
|
}
|
|
for (segment::offset_t offset : ordered_offset) {
|
|
uids.erase(uids.begin() + offset);
|
|
}
|
|
vector_ids.swap(uids);
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetVectorByIdHelper(const std::string& collection_id, IDNumber vector_id, VectorsData& vector,
|
|
const meta::SegmentsSchema& files) {
|
|
ENGINE_LOG_DEBUG << "Getting vector by id in " << files.size() << " files";
|
|
|
|
for (auto& file : files) {
|
|
// Load bloom filter
|
|
std::string segment_dir;
|
|
engine::utils::GetParentPath(file.location_, segment_dir);
|
|
segment::SegmentReader segment_reader(segment_dir);
|
|
segment::IdBloomFilterPtr id_bloom_filter_ptr;
|
|
segment_reader.LoadBloomFilter(id_bloom_filter_ptr);
|
|
|
|
// Check if the id is present in bloom filter.
|
|
if (id_bloom_filter_ptr->Check(vector_id)) {
|
|
// Load uids and check if the id is indeed present. If yes, find its offset.
|
|
std::vector<int64_t> offsets;
|
|
std::vector<segment::doc_id_t> uids;
|
|
auto status = segment_reader.LoadUids(uids);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
auto found = std::find(uids.begin(), uids.end(), vector_id);
|
|
if (found != uids.end()) {
|
|
auto offset = std::distance(uids.begin(), found);
|
|
|
|
// Check whether the id has been deleted
|
|
segment::DeletedDocsPtr deleted_docs_ptr;
|
|
status = segment_reader.LoadDeletedDocs(deleted_docs_ptr);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
auto& deleted_docs = deleted_docs_ptr->GetDeletedDocs();
|
|
|
|
auto deleted = std::find(deleted_docs.begin(), deleted_docs.end(), offset);
|
|
if (deleted == deleted_docs.end()) {
|
|
// Load raw vector
|
|
bool is_binary = utils::IsBinaryMetricType(file.metric_type_);
|
|
size_t single_vector_bytes = is_binary ? file.dimension_ / 8 : file.dimension_ * sizeof(float);
|
|
std::vector<uint8_t> raw_vector;
|
|
status = segment_reader.LoadVectors(offset * single_vector_bytes, single_vector_bytes, raw_vector);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
vector.vector_count_ = 1;
|
|
if (is_binary) {
|
|
vector.binary_data_ = std::move(raw_vector);
|
|
} else {
|
|
std::vector<float> float_vector;
|
|
float_vector.resize(file.dimension_);
|
|
memcpy(float_vector.data(), raw_vector.data(), single_vector_bytes);
|
|
vector.float_data_ = std::move(float_vector);
|
|
}
|
|
return Status::OK();
|
|
}
|
|
}
|
|
} else {
|
|
continue;
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::CreateIndex(const std::string& collection_id, const CollectionIndex& index) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
// serialize memory data
|
|
// std::set<std::string> sync_collection_ids;
|
|
// auto status = SyncMemData(sync_collection_ids);
|
|
auto status = Flush();
|
|
|
|
{
|
|
std::unique_lock<std::mutex> lock(build_index_mutex_);
|
|
|
|
// step 1: check index difference
|
|
CollectionIndex old_index;
|
|
status = DescribeIndex(collection_id, old_index);
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to get collection index info for collection: " << collection_id;
|
|
return status;
|
|
}
|
|
|
|
// step 2: update index info
|
|
CollectionIndex new_index = index;
|
|
new_index.metric_type_ = old_index.metric_type_; // dont change metric type, it was defined by CreateCollection
|
|
if (!utils::IsSameIndex(old_index, new_index)) {
|
|
status = UpdateCollectionIndexRecursively(collection_id, new_index);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
}
|
|
|
|
// step 3: let merge file thread finish
|
|
// to avoid duplicate data bug
|
|
WaitMergeFileFinish();
|
|
|
|
// step 4: wait and build index
|
|
status = index_failed_checker_.CleanFailedIndexFileOfCollection(collection_id);
|
|
status = WaitCollectionIndexRecursively(collection_id, index);
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::DescribeIndex(const std::string& collection_id, CollectionIndex& index) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
return meta_ptr_->DescribeCollectionIndex(collection_id, index);
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropIndex(const std::string& collection_id) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Drop index for collection: " << collection_id;
|
|
return DropCollectionIndexRecursively(collection_id);
|
|
}
|
|
|
|
Status
|
|
DBImpl::QueryByID(const std::shared_ptr<server::Context>& context, const std::string& collection_id,
|
|
const std::vector<std::string>& partition_tags, uint64_t k, const milvus::json& extra_params,
|
|
IDNumber vector_id, ResultIds& result_ids, ResultDistances& result_distances) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
VectorsData vectors_data = VectorsData();
|
|
vectors_data.id_array_.emplace_back(vector_id);
|
|
vectors_data.vector_count_ = 1;
|
|
Status result =
|
|
Query(context, collection_id, partition_tags, k, extra_params, vectors_data, result_ids, result_distances);
|
|
return result;
|
|
}
|
|
|
|
Status
|
|
DBImpl::Query(const std::shared_ptr<server::Context>& context, const std::string& collection_id,
|
|
const std::vector<std::string>& partition_tags, uint64_t k, const milvus::json& extra_params,
|
|
const VectorsData& vectors, ResultIds& result_ids, ResultDistances& result_distances) {
|
|
milvus::server::ContextChild tracer(context, "Query");
|
|
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
Status status;
|
|
meta::SegmentsSchema files_array;
|
|
|
|
if (partition_tags.empty()) {
|
|
// no partition tag specified, means search in whole collection
|
|
// get all collection files from parent collection
|
|
status = GetFilesToSearch(collection_id, files_array);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
status = GetFilesToSearch(schema.collection_id_, files_array);
|
|
}
|
|
|
|
if (files_array.empty()) {
|
|
return Status::OK();
|
|
}
|
|
} else {
|
|
// get files from specified partitions
|
|
std::set<std::string> partition_name_array;
|
|
status = GetPartitionsByTags(collection_id, partition_tags, partition_name_array);
|
|
if (!status.ok()) {
|
|
return status; // didn't match any partition.
|
|
}
|
|
|
|
for (auto& partition_name : partition_name_array) {
|
|
status = GetFilesToSearch(partition_name, files_array);
|
|
}
|
|
|
|
if (files_array.empty()) {
|
|
return Status::OK();
|
|
}
|
|
}
|
|
|
|
cache::CpuCacheMgr::GetInstance()->PrintInfo(); // print cache info before query
|
|
status = QueryAsync(tracer.Context(), files_array, k, extra_params, vectors, result_ids, result_distances);
|
|
cache::CpuCacheMgr::GetInstance()->PrintInfo(); // print cache info after query
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::QueryByFileID(const std::shared_ptr<server::Context>& context, const std::vector<std::string>& file_ids,
|
|
uint64_t k, const milvus::json& extra_params, const VectorsData& vectors, ResultIds& result_ids,
|
|
ResultDistances& result_distances) {
|
|
milvus::server::ContextChild tracer(context, "Query by file id");
|
|
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
// get specified files
|
|
std::vector<size_t> ids;
|
|
for (auto& id : file_ids) {
|
|
std::string::size_type sz;
|
|
ids.push_back(std::stoul(id, &sz));
|
|
}
|
|
|
|
meta::SegmentsSchema search_files;
|
|
auto status = meta_ptr_->FilesByID(ids, search_files);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
fiu_do_on("DBImpl.QueryByFileID.empty_files_array", search_files.clear());
|
|
if (search_files.empty()) {
|
|
return Status(DB_ERROR, "Invalid file id");
|
|
}
|
|
|
|
cache::CpuCacheMgr::GetInstance()->PrintInfo(); // print cache info before query
|
|
status = QueryAsync(tracer.Context(), search_files, k, extra_params, vectors, result_ids, result_distances);
|
|
cache::CpuCacheMgr::GetInstance()->PrintInfo(); // print cache info after query
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::Size(uint64_t& result) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
return SHUTDOWN_ERROR;
|
|
}
|
|
|
|
return meta_ptr_->Size(result);
|
|
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////
|
|
// internal methods
|
|
///////////////////////////////////////////////////////////////////////////////////////////////////////////////////
|
|
Status
|
|
DBImpl::QueryAsync(const std::shared_ptr<server::Context>& context, const meta::SegmentsSchema& files, uint64_t k,
|
|
const milvus::json& extra_params, const VectorsData& vectors, ResultIds& result_ids,
|
|
ResultDistances& result_distances) {
|
|
milvus::server::ContextChild tracer(context, "Query Async");
|
|
server::CollectQueryMetrics metrics(vectors.vector_count_);
|
|
|
|
TimeRecorder rc("");
|
|
|
|
// step 1: construct search job
|
|
auto status = OngoingFileChecker::GetInstance().MarkOngoingFiles(files);
|
|
|
|
ENGINE_LOG_DEBUG << "Engine query begin, index file count: " << files.size();
|
|
scheduler::SearchJobPtr job = std::make_shared<scheduler::SearchJob>(tracer.Context(), k, extra_params, vectors);
|
|
for (auto& file : files) {
|
|
scheduler::SegmentSchemaPtr file_ptr = std::make_shared<meta::SegmentSchema>(file);
|
|
job->AddIndexFile(file_ptr);
|
|
}
|
|
|
|
// step 2: put search job to scheduler and wait result
|
|
scheduler::JobMgrInst::GetInstance()->Put(job);
|
|
job->WaitResult();
|
|
|
|
status = OngoingFileChecker::GetInstance().UnmarkOngoingFiles(files);
|
|
if (!job->GetStatus().ok()) {
|
|
return job->GetStatus();
|
|
}
|
|
|
|
// step 3: construct results
|
|
result_ids = job->GetResultIds();
|
|
result_distances = job->GetResultDistances();
|
|
rc.ElapseFromBegin("Engine query totally cost");
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
void
|
|
DBImpl::BackgroundTimerTask() {
|
|
server::SystemInfo::GetInstance().Init();
|
|
while (true) {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
WaitMergeFileFinish();
|
|
WaitBuildIndexFinish();
|
|
|
|
ENGINE_LOG_DEBUG << "DB background thread exit";
|
|
break;
|
|
}
|
|
|
|
if (options_.auto_flush_interval_ > 0) {
|
|
bg_task_swn_.Wait_For(std::chrono::seconds(options_.auto_flush_interval_));
|
|
} else {
|
|
bg_task_swn_.Wait();
|
|
}
|
|
|
|
StartMetricTask();
|
|
StartMergeTask();
|
|
StartBuildIndexTask();
|
|
}
|
|
}
|
|
|
|
void
|
|
DBImpl::WaitMergeFileFinish() {
|
|
ENGINE_LOG_DEBUG << "Begin WaitMergeFileFinish";
|
|
std::lock_guard<std::mutex> lck(merge_result_mutex_);
|
|
for (auto& iter : merge_thread_results_) {
|
|
iter.wait();
|
|
}
|
|
ENGINE_LOG_DEBUG << "End WaitMergeFileFinish";
|
|
}
|
|
|
|
void
|
|
DBImpl::WaitBuildIndexFinish() {
|
|
ENGINE_LOG_DEBUG << "Begin WaitBuildIndexFinish";
|
|
std::lock_guard<std::mutex> lck(index_result_mutex_);
|
|
for (auto& iter : index_thread_results_) {
|
|
iter.wait();
|
|
}
|
|
ENGINE_LOG_DEBUG << "End WaitBuildIndexFinish";
|
|
}
|
|
|
|
void
|
|
DBImpl::StartMetricTask() {
|
|
static uint64_t metric_clock_tick = 0;
|
|
++metric_clock_tick;
|
|
if (metric_clock_tick % METRIC_ACTION_INTERVAL != 0) {
|
|
return;
|
|
}
|
|
|
|
server::Metrics::GetInstance().KeepingAliveCounterIncrement(METRIC_ACTION_INTERVAL);
|
|
int64_t cache_usage = cache::CpuCacheMgr::GetInstance()->CacheUsage();
|
|
int64_t cache_total = cache::CpuCacheMgr::GetInstance()->CacheCapacity();
|
|
fiu_do_on("DBImpl.StartMetricTask.InvalidTotalCache", cache_total = 0);
|
|
|
|
if (cache_total > 0) {
|
|
double cache_usage_double = cache_usage;
|
|
server::Metrics::GetInstance().CpuCacheUsageGaugeSet(cache_usage_double * 100 / cache_total);
|
|
} else {
|
|
server::Metrics::GetInstance().CpuCacheUsageGaugeSet(0);
|
|
}
|
|
|
|
server::Metrics::GetInstance().GpuCacheUsageGaugeSet();
|
|
uint64_t size;
|
|
Size(size);
|
|
server::Metrics::GetInstance().DataFileSizeGaugeSet(size);
|
|
server::Metrics::GetInstance().CPUUsagePercentSet();
|
|
server::Metrics::GetInstance().RAMUsagePercentSet();
|
|
server::Metrics::GetInstance().GPUPercentGaugeSet();
|
|
server::Metrics::GetInstance().GPUMemoryUsageGaugeSet();
|
|
server::Metrics::GetInstance().OctetsSet();
|
|
|
|
server::Metrics::GetInstance().CPUCoreUsagePercentSet();
|
|
server::Metrics::GetInstance().GPUTemperature();
|
|
server::Metrics::GetInstance().CPUTemperature();
|
|
server::Metrics::GetInstance().PushToGateway();
|
|
}
|
|
|
|
void
|
|
DBImpl::StartMergeTask() {
|
|
static uint64_t compact_clock_tick = 0;
|
|
++compact_clock_tick;
|
|
if (compact_clock_tick % COMPACT_ACTION_INTERVAL != 0) {
|
|
return;
|
|
}
|
|
|
|
if (!options_.wal_enable_) {
|
|
Flush();
|
|
}
|
|
|
|
// ENGINE_LOG_DEBUG << "Begin StartMergeTask";
|
|
// merge task has been finished?
|
|
{
|
|
std::lock_guard<std::mutex> lck(merge_result_mutex_);
|
|
if (!merge_thread_results_.empty()) {
|
|
std::chrono::milliseconds span(10);
|
|
if (merge_thread_results_.back().wait_for(span) == std::future_status::ready) {
|
|
merge_thread_results_.pop_back();
|
|
}
|
|
}
|
|
}
|
|
|
|
// add new merge task
|
|
{
|
|
std::lock_guard<std::mutex> lck(merge_result_mutex_);
|
|
if (merge_thread_results_.empty()) {
|
|
// collect merge files for all collections(if merge_collection_ids_ is empty) for two reasons:
|
|
// 1. other collections may still has un-merged files
|
|
// 2. server may be closed unexpected, these un-merge files need to be merged when server restart
|
|
if (merge_collection_ids_.empty()) {
|
|
std::vector<meta::CollectionSchema> collection_schema_array;
|
|
meta_ptr_->AllCollections(collection_schema_array);
|
|
for (auto& schema : collection_schema_array) {
|
|
merge_collection_ids_.insert(schema.collection_id_);
|
|
}
|
|
}
|
|
|
|
// start merge file thread
|
|
merge_thread_results_.push_back(
|
|
merge_thread_pool_.enqueue(&DBImpl::BackgroundMerge, this, merge_collection_ids_));
|
|
merge_collection_ids_.clear();
|
|
}
|
|
}
|
|
|
|
// ENGINE_LOG_DEBUG << "End StartMergeTask";
|
|
}
|
|
|
|
Status
|
|
DBImpl::MergeFiles(const std::string& collection_id, const meta::SegmentsSchema& files) {
|
|
// const std::lock_guard<std::mutex> lock(flush_merge_compact_mutex_);
|
|
|
|
ENGINE_LOG_DEBUG << "Merge files for collection: " << collection_id;
|
|
|
|
// step 1: create collection file
|
|
meta::SegmentSchema collection_file;
|
|
collection_file.collection_id_ = collection_id;
|
|
collection_file.file_type_ = meta::SegmentSchema::NEW_MERGE;
|
|
Status status = meta_ptr_->CreateCollectionFile(collection_file);
|
|
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to create collection: " << status.ToString();
|
|
return status;
|
|
}
|
|
|
|
// step 2: merge files
|
|
/*
|
|
ExecutionEnginePtr index =
|
|
EngineFactory::Build(collection_file.dimension_, collection_file.location_,
|
|
(EngineType)collection_file.engine_type_, (MetricType)collection_file.metric_type_, collection_file.nlist_);
|
|
*/
|
|
meta::SegmentsSchema updated;
|
|
|
|
std::string new_segment_dir;
|
|
utils::GetParentPath(collection_file.location_, new_segment_dir);
|
|
auto segment_writer_ptr = std::make_shared<segment::SegmentWriter>(new_segment_dir);
|
|
|
|
for (auto& file : files) {
|
|
server::CollectMergeFilesMetrics metrics;
|
|
std::string segment_dir_to_merge;
|
|
utils::GetParentPath(file.location_, segment_dir_to_merge);
|
|
segment_writer_ptr->Merge(segment_dir_to_merge, collection_file.file_id_);
|
|
auto file_schema = file;
|
|
file_schema.file_type_ = meta::SegmentSchema::TO_DELETE;
|
|
updated.push_back(file_schema);
|
|
auto size = segment_writer_ptr->Size();
|
|
if (size >= file_schema.index_file_size_) {
|
|
break;
|
|
}
|
|
}
|
|
|
|
// step 3: serialize to disk
|
|
try {
|
|
status = segment_writer_ptr->Serialize();
|
|
fiu_do_on("DBImpl.MergeFiles.Serialize_ThrowException", throw std::exception());
|
|
fiu_do_on("DBImpl.MergeFiles.Serialize_ErrorStatus", status = Status(DB_ERROR, ""));
|
|
} catch (std::exception& ex) {
|
|
std::string msg = "Serialize merged index encounter exception: " + std::string(ex.what());
|
|
ENGINE_LOG_ERROR << msg;
|
|
status = Status(DB_ERROR, msg);
|
|
}
|
|
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to persist merged segment: " << new_segment_dir << ". Error: " << status.message();
|
|
|
|
// if failed to serialize merge file to disk
|
|
// typical error: out of disk space, out of memory or permission denied
|
|
collection_file.file_type_ = meta::SegmentSchema::TO_DELETE;
|
|
status = meta_ptr_->UpdateCollectionFile(collection_file);
|
|
ENGINE_LOG_DEBUG << "Failed to update file to index, mark file: " << collection_file.file_id_
|
|
<< " to to_delete";
|
|
|
|
return status;
|
|
}
|
|
|
|
// step 4: update collection files state
|
|
// if index type isn't IDMAP, set file type to TO_INDEX if file size exceed index_file_size
|
|
// else set file type to RAW, no need to build index
|
|
if (!utils::IsRawIndexType(collection_file.engine_type_)) {
|
|
collection_file.file_type_ = (segment_writer_ptr->Size() >= collection_file.index_file_size_)
|
|
? meta::SegmentSchema::TO_INDEX
|
|
: meta::SegmentSchema::RAW;
|
|
} else {
|
|
collection_file.file_type_ = meta::SegmentSchema::RAW;
|
|
}
|
|
collection_file.file_size_ = segment_writer_ptr->Size();
|
|
collection_file.row_count_ = segment_writer_ptr->VectorCount();
|
|
updated.push_back(collection_file);
|
|
status = meta_ptr_->UpdateCollectionFiles(updated);
|
|
ENGINE_LOG_DEBUG << "New merged segment " << collection_file.segment_id_ << " of size "
|
|
<< segment_writer_ptr->Size() << " bytes";
|
|
|
|
if (options_.insert_cache_immediately_) {
|
|
segment_writer_ptr->Cache();
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::BackgroundMergeFiles(const std::string& collection_id) {
|
|
const std::lock_guard<std::mutex> lock(flush_merge_compact_mutex_);
|
|
|
|
meta::SegmentsSchema raw_files;
|
|
auto status = meta_ptr_->FilesToMerge(collection_id, raw_files);
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to get merge files for collection: " << collection_id;
|
|
return status;
|
|
}
|
|
|
|
if (raw_files.size() < options_.merge_trigger_number_) {
|
|
ENGINE_LOG_TRACE << "Files number not greater equal than merge trigger number, skip merge action";
|
|
return Status::OK();
|
|
}
|
|
|
|
status = OngoingFileChecker::GetInstance().MarkOngoingFiles(raw_files);
|
|
MergeFiles(collection_id, raw_files);
|
|
status = OngoingFileChecker::GetInstance().UnmarkOngoingFiles(raw_files);
|
|
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
ENGINE_LOG_DEBUG << "Server will shutdown, skip merge action for collection: " << collection_id;
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
void
|
|
DBImpl::BackgroundMerge(std::set<std::string> collection_ids) {
|
|
// ENGINE_LOG_TRACE << " Background merge thread start";
|
|
|
|
Status status;
|
|
for (auto& collection_id : collection_ids) {
|
|
status = BackgroundMergeFiles(collection_id);
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Merge files for collection " << collection_id << " failed: " << status.ToString();
|
|
}
|
|
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
ENGINE_LOG_DEBUG << "Server will shutdown, skip merge action";
|
|
break;
|
|
}
|
|
}
|
|
|
|
meta_ptr_->Archive();
|
|
|
|
{
|
|
uint64_t ttl = 10 * meta::SECOND; // default: file will be hard-deleted few seconds after soft-deleted
|
|
if (options_.mode_ == DBOptions::MODE::CLUSTER_WRITABLE) {
|
|
ttl = meta::HOUR;
|
|
}
|
|
|
|
meta_ptr_->CleanUpFilesWithTTL(ttl);
|
|
}
|
|
|
|
// ENGINE_LOG_TRACE << " Background merge thread exit";
|
|
}
|
|
|
|
void
|
|
DBImpl::StartBuildIndexTask(bool force) {
|
|
static uint64_t index_clock_tick = 0;
|
|
++index_clock_tick;
|
|
if (!force && (index_clock_tick % INDEX_ACTION_INTERVAL != 0)) {
|
|
return;
|
|
}
|
|
|
|
// build index has been finished?
|
|
{
|
|
std::lock_guard<std::mutex> lck(index_result_mutex_);
|
|
if (!index_thread_results_.empty()) {
|
|
std::chrono::milliseconds span(10);
|
|
if (index_thread_results_.back().wait_for(span) == std::future_status::ready) {
|
|
index_thread_results_.pop_back();
|
|
}
|
|
}
|
|
}
|
|
|
|
// add new build index task
|
|
{
|
|
std::lock_guard<std::mutex> lck(index_result_mutex_);
|
|
if (index_thread_results_.empty()) {
|
|
index_thread_results_.push_back(index_thread_pool_.enqueue(&DBImpl::BackgroundBuildIndex, this));
|
|
}
|
|
}
|
|
}
|
|
|
|
void
|
|
DBImpl::BackgroundBuildIndex() {
|
|
std::unique_lock<std::mutex> lock(build_index_mutex_);
|
|
meta::SegmentsSchema to_index_files;
|
|
meta_ptr_->FilesToIndex(to_index_files);
|
|
Status status = index_failed_checker_.IgnoreFailedIndexFiles(to_index_files);
|
|
|
|
if (!to_index_files.empty()) {
|
|
ENGINE_LOG_DEBUG << "Background build index thread begin";
|
|
status = OngoingFileChecker::GetInstance().MarkOngoingFiles(to_index_files);
|
|
|
|
// step 2: put build index task to scheduler
|
|
std::vector<std::pair<scheduler::BuildIndexJobPtr, scheduler::SegmentSchemaPtr>> job2file_map;
|
|
for (auto& file : to_index_files) {
|
|
scheduler::BuildIndexJobPtr job = std::make_shared<scheduler::BuildIndexJob>(meta_ptr_, options_);
|
|
scheduler::SegmentSchemaPtr file_ptr = std::make_shared<meta::SegmentSchema>(file);
|
|
job->AddToIndexFiles(file_ptr);
|
|
scheduler::JobMgrInst::GetInstance()->Put(job);
|
|
job2file_map.push_back(std::make_pair(job, file_ptr));
|
|
}
|
|
|
|
// step 3: wait build index finished and mark failed files
|
|
for (auto iter = job2file_map.begin(); iter != job2file_map.end(); ++iter) {
|
|
scheduler::BuildIndexJobPtr job = iter->first;
|
|
meta::SegmentSchema& file_schema = *(iter->second.get());
|
|
job->WaitBuildIndexFinish();
|
|
if (!job->GetStatus().ok()) {
|
|
Status status = job->GetStatus();
|
|
ENGINE_LOG_ERROR << "Building index job " << job->id() << " failed: " << status.ToString();
|
|
|
|
index_failed_checker_.MarkFailedIndexFile(file_schema, status.message());
|
|
} else {
|
|
ENGINE_LOG_DEBUG << "Building index job " << job->id() << " succeed.";
|
|
|
|
index_failed_checker_.MarkSucceedIndexFile(file_schema);
|
|
}
|
|
status = OngoingFileChecker::GetInstance().UnmarkOngoingFile(file_schema);
|
|
}
|
|
|
|
ENGINE_LOG_DEBUG << "Background build index thread finished";
|
|
}
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetFilesToBuildIndex(const std::string& collection_id, const std::vector<int>& file_types,
|
|
meta::SegmentsSchema& files) {
|
|
files.clear();
|
|
auto status = meta_ptr_->FilesByType(collection_id, file_types, files);
|
|
|
|
// only build index for files that row count greater than certain threshold
|
|
for (auto it = files.begin(); it != files.end();) {
|
|
if ((*it).file_type_ == static_cast<int>(meta::SegmentSchema::RAW) &&
|
|
(*it).row_count_ < meta::BUILD_INDEX_THRESHOLD) {
|
|
it = files.erase(it);
|
|
} else {
|
|
++it;
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetFilesToSearch(const std::string& collection_id, meta::SegmentsSchema& files) {
|
|
ENGINE_LOG_DEBUG << "Collect files from collection: " << collection_id;
|
|
|
|
meta::SegmentsSchema search_files;
|
|
auto status = meta_ptr_->FilesToSearch(collection_id, search_files);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
for (auto& file : search_files) {
|
|
files.push_back(file);
|
|
}
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetPartitionByTag(const std::string& collection_id, const std::string& partition_tag,
|
|
std::string& partition_name) {
|
|
Status status;
|
|
|
|
if (partition_tag.empty()) {
|
|
partition_name = collection_id;
|
|
|
|
} else {
|
|
// trim side-blank of tag, only compare valid characters
|
|
// for example: " ab cd " is treated as "ab cd"
|
|
std::string valid_tag = partition_tag;
|
|
server::StringHelpFunctions::TrimStringBlank(valid_tag);
|
|
|
|
if (valid_tag == milvus::engine::DEFAULT_PARTITON_TAG) {
|
|
partition_name = collection_id;
|
|
return status;
|
|
}
|
|
|
|
status = meta_ptr_->GetPartitionName(collection_id, partition_tag, partition_name);
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << status.message();
|
|
}
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetPartitionsByTags(const std::string& collection_id, const std::vector<std::string>& partition_tags,
|
|
std::set<std::string>& partition_name_array) {
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
auto status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
|
|
for (auto& tag : partition_tags) {
|
|
// trim side-blank of tag, only compare valid characters
|
|
// for example: " ab cd " is treated as "ab cd"
|
|
std::string valid_tag = tag;
|
|
server::StringHelpFunctions::TrimStringBlank(valid_tag);
|
|
|
|
if (valid_tag == milvus::engine::DEFAULT_PARTITON_TAG) {
|
|
partition_name_array.insert(collection_id);
|
|
return status;
|
|
}
|
|
|
|
for (auto& schema : partition_array) {
|
|
if (server::StringHelpFunctions::IsRegexMatch(schema.partition_tag_, valid_tag)) {
|
|
partition_name_array.insert(schema.collection_id_);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (partition_name_array.empty()) {
|
|
return Status(PARTITION_NOT_FOUND, "Cannot find the specified partitions");
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropCollectionRecursively(const std::string& collection_id) {
|
|
// dates partly delete files of the collection but currently we don't support
|
|
ENGINE_LOG_DEBUG << "Prepare to delete collection " << collection_id;
|
|
|
|
Status status;
|
|
if (options_.wal_enable_) {
|
|
wal_mgr_->DropCollection(collection_id);
|
|
}
|
|
|
|
status = mem_mgr_->EraseMemVector(collection_id); // not allow insert
|
|
status = meta_ptr_->DropCollection(collection_id); // soft delete collection
|
|
index_failed_checker_.CleanFailedIndexFileOfCollection(collection_id);
|
|
|
|
// scheduler will determine when to delete collection files
|
|
auto nres = scheduler::ResMgrInst::GetInstance()->GetNumOfComputeResource();
|
|
scheduler::DeleteJobPtr job = std::make_shared<scheduler::DeleteJob>(collection_id, meta_ptr_, nres);
|
|
scheduler::JobMgrInst::GetInstance()->Put(job);
|
|
job->WaitAndDelete();
|
|
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
status = DropCollectionRecursively(schema.collection_id_);
|
|
fiu_do_on("DBImpl.DropCollectionRecursively.failed", status = Status(DB_ERROR, ""));
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::UpdateCollectionIndexRecursively(const std::string& collection_id, const CollectionIndex& index) {
|
|
DropIndex(collection_id);
|
|
|
|
auto status = meta_ptr_->UpdateCollectionIndex(collection_id, index);
|
|
fiu_do_on("DBImpl.UpdateCollectionIndexRecursively.fail_update_collection_index",
|
|
status = Status(DB_META_TRANSACTION_FAILED, ""));
|
|
if (!status.ok()) {
|
|
ENGINE_LOG_ERROR << "Failed to update collection index info for collection: " << collection_id;
|
|
return status;
|
|
}
|
|
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
status = UpdateCollectionIndexRecursively(schema.collection_id_, index);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::WaitCollectionIndexRecursively(const std::string& collection_id, const CollectionIndex& index) {
|
|
// for IDMAP type, only wait all NEW file converted to RAW file
|
|
// for other type, wait NEW/RAW/NEW_MERGE/NEW_INDEX/TO_INDEX files converted to INDEX files
|
|
std::vector<int> file_types;
|
|
if (utils::IsRawIndexType(index.engine_type_)) {
|
|
file_types = {
|
|
static_cast<int32_t>(meta::SegmentSchema::NEW),
|
|
static_cast<int32_t>(meta::SegmentSchema::NEW_MERGE),
|
|
};
|
|
} else {
|
|
file_types = {
|
|
static_cast<int32_t>(meta::SegmentSchema::RAW), static_cast<int32_t>(meta::SegmentSchema::NEW),
|
|
static_cast<int32_t>(meta::SegmentSchema::NEW_MERGE), static_cast<int32_t>(meta::SegmentSchema::NEW_INDEX),
|
|
static_cast<int32_t>(meta::SegmentSchema::TO_INDEX),
|
|
};
|
|
}
|
|
|
|
// get files to build index
|
|
meta::SegmentsSchema collection_files;
|
|
auto status = GetFilesToBuildIndex(collection_id, file_types, collection_files);
|
|
int times = 1;
|
|
|
|
while (!collection_files.empty()) {
|
|
ENGINE_LOG_DEBUG << "Non index files detected! Will build index " << times;
|
|
if (!utils::IsRawIndexType(index.engine_type_)) {
|
|
status = meta_ptr_->UpdateCollectionFilesToIndex(collection_id);
|
|
}
|
|
|
|
std::this_thread::sleep_for(std::chrono::milliseconds(std::min(10 * 1000, times * 100)));
|
|
GetFilesToBuildIndex(collection_id, file_types, collection_files);
|
|
++times;
|
|
|
|
index_failed_checker_.IgnoreFailedIndexFiles(collection_files);
|
|
}
|
|
|
|
// build index for partition
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
status = WaitCollectionIndexRecursively(schema.collection_id_, index);
|
|
fiu_do_on("DBImpl.WaitCollectionIndexRecursively.fail_build_collection_Index_for_partition",
|
|
status = Status(DB_ERROR, ""));
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
|
|
// failed to build index for some files, return error
|
|
std::string err_msg;
|
|
index_failed_checker_.GetErrMsgForCollection(collection_id, err_msg);
|
|
fiu_do_on("DBImpl.WaitCollectionIndexRecursively.not_empty_err_msg", err_msg.append("fiu"));
|
|
if (!err_msg.empty()) {
|
|
return Status(DB_ERROR, err_msg);
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::DropCollectionIndexRecursively(const std::string& collection_id) {
|
|
ENGINE_LOG_DEBUG << "Drop index for collection: " << collection_id;
|
|
index_failed_checker_.CleanFailedIndexFileOfCollection(collection_id);
|
|
auto status = meta_ptr_->DropCollectionIndex(collection_id);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// drop partition index
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
status = DropCollectionIndexRecursively(schema.collection_id_);
|
|
fiu_do_on("DBImpl.DropCollectionIndexRecursively.fail_drop_collection_Index_for_partition",
|
|
status = Status(DB_ERROR, ""));
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::GetCollectionRowCountRecursively(const std::string& collection_id, uint64_t& row_count) {
|
|
row_count = 0;
|
|
auto status = meta_ptr_->Count(collection_id, row_count);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
// get partition row count
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(collection_id, partition_array);
|
|
for (auto& schema : partition_array) {
|
|
uint64_t partition_row_count = 0;
|
|
status = GetCollectionRowCountRecursively(schema.collection_id_, partition_row_count);
|
|
fiu_do_on("DBImpl.GetCollectionRowCountRecursively.fail_get_collection_rowcount_for_partition",
|
|
status = Status(DB_ERROR, ""));
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
row_count += partition_row_count;
|
|
}
|
|
|
|
return Status::OK();
|
|
}
|
|
|
|
Status
|
|
DBImpl::ExecWalRecord(const wal::MXLogRecord& record) {
|
|
fiu_return_on("DBImpl.ExexWalRecord.return", Status(););
|
|
|
|
auto collections_flushed = [&](const std::set<std::string>& collection_ids) -> uint64_t {
|
|
if (collection_ids.empty()) {
|
|
return 0;
|
|
}
|
|
|
|
uint64_t max_lsn = 0;
|
|
if (options_.wal_enable_) {
|
|
for (auto& collection : collection_ids) {
|
|
uint64_t lsn = 0;
|
|
meta_ptr_->GetCollectionFlushLSN(collection, lsn);
|
|
wal_mgr_->CollectionFlushed(collection, lsn);
|
|
if (lsn > max_lsn) {
|
|
max_lsn = lsn;
|
|
}
|
|
}
|
|
}
|
|
|
|
std::lock_guard<std::mutex> lck(merge_result_mutex_);
|
|
for (auto& collection : collection_ids) {
|
|
merge_collection_ids_.insert(collection);
|
|
}
|
|
return max_lsn;
|
|
};
|
|
|
|
Status status;
|
|
|
|
switch (record.type) {
|
|
case wal::MXLogType::InsertBinary: {
|
|
std::string target_collection_name;
|
|
status = GetPartitionByTag(record.collection_id, record.partition_tag, target_collection_name);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
std::set<std::string> flushed_collections;
|
|
status = mem_mgr_->InsertVectors(target_collection_name, record.length, record.ids,
|
|
(record.data_size / record.length / sizeof(uint8_t)),
|
|
(const u_int8_t*)record.data, record.lsn, flushed_collections);
|
|
// even though !status.ok, run
|
|
collections_flushed(flushed_collections);
|
|
|
|
// metrics
|
|
milvus::server::CollectInsertMetrics metrics(record.length, status);
|
|
break;
|
|
}
|
|
|
|
case wal::MXLogType::InsertVector: {
|
|
std::string target_collection_name;
|
|
status = GetPartitionByTag(record.collection_id, record.partition_tag, target_collection_name);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
std::set<std::string> flushed_collections;
|
|
status = mem_mgr_->InsertVectors(target_collection_name, record.length, record.ids,
|
|
(record.data_size / record.length / sizeof(float)),
|
|
(const float*)record.data, record.lsn, flushed_collections);
|
|
// even though !status.ok, run
|
|
collections_flushed(flushed_collections);
|
|
|
|
// metrics
|
|
milvus::server::CollectInsertMetrics metrics(record.length, status);
|
|
break;
|
|
}
|
|
|
|
case wal::MXLogType::Delete: {
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(record.collection_id, partition_array);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
std::vector<std::string> collection_ids{record.collection_id};
|
|
for (auto& partition : partition_array) {
|
|
auto& partition_collection_id = partition.collection_id_;
|
|
collection_ids.emplace_back(partition_collection_id);
|
|
}
|
|
|
|
if (record.length == 1) {
|
|
for (auto& collection_id : collection_ids) {
|
|
status = mem_mgr_->DeleteVector(collection_id, *record.ids, record.lsn);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
} else {
|
|
for (auto& collection_id : collection_ids) {
|
|
status = mem_mgr_->DeleteVectors(collection_id, record.length, record.ids, record.lsn);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
|
|
case wal::MXLogType::Flush: {
|
|
if (!record.collection_id.empty()) {
|
|
// flush one collection
|
|
std::vector<meta::CollectionSchema> partition_array;
|
|
status = meta_ptr_->ShowPartitions(record.collection_id, partition_array);
|
|
if (!status.ok()) {
|
|
return status;
|
|
}
|
|
|
|
std::vector<std::string> collection_ids{record.collection_id};
|
|
for (auto& partition : partition_array) {
|
|
auto& partition_collection_id = partition.collection_id_;
|
|
collection_ids.emplace_back(partition_collection_id);
|
|
}
|
|
|
|
std::set<std::string> flushed_collections;
|
|
for (auto& collection_id : collection_ids) {
|
|
const std::lock_guard<std::mutex> lock(flush_merge_compact_mutex_);
|
|
status = mem_mgr_->Flush(collection_id);
|
|
if (!status.ok()) {
|
|
break;
|
|
}
|
|
flushed_collections.insert(collection_id);
|
|
}
|
|
|
|
collections_flushed(flushed_collections);
|
|
|
|
} else {
|
|
// flush all collections
|
|
std::set<std::string> collection_ids;
|
|
{
|
|
const std::lock_guard<std::mutex> lock(flush_merge_compact_mutex_);
|
|
status = mem_mgr_->Flush(collection_ids);
|
|
}
|
|
|
|
uint64_t lsn = collections_flushed(collection_ids);
|
|
if (options_.wal_enable_) {
|
|
wal_mgr_->RemoveOldFiles(lsn);
|
|
}
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
return status;
|
|
}
|
|
|
|
void
|
|
DBImpl::BackgroundWalTask() {
|
|
server::SystemInfo::GetInstance().Init();
|
|
|
|
std::chrono::system_clock::time_point next_auto_flush_time;
|
|
auto get_next_auto_flush_time = [&]() {
|
|
return std::chrono::system_clock::now() + std::chrono::seconds(options_.auto_flush_interval_);
|
|
};
|
|
if (options_.auto_flush_interval_ > 0) {
|
|
next_auto_flush_time = get_next_auto_flush_time();
|
|
}
|
|
|
|
wal::MXLogRecord record;
|
|
|
|
auto auto_flush = [&]() {
|
|
record.type = wal::MXLogType::Flush;
|
|
record.collection_id.clear();
|
|
ExecWalRecord(record);
|
|
|
|
StartMetricTask();
|
|
StartMergeTask();
|
|
StartBuildIndexTask();
|
|
};
|
|
|
|
while (true) {
|
|
if (options_.auto_flush_interval_ > 0) {
|
|
if (std::chrono::system_clock::now() >= next_auto_flush_time) {
|
|
auto_flush();
|
|
next_auto_flush_time = get_next_auto_flush_time();
|
|
}
|
|
}
|
|
|
|
auto error_code = wal_mgr_->GetNextRecord(record);
|
|
if (error_code != WAL_SUCCESS) {
|
|
ENGINE_LOG_ERROR << "WAL background GetNextRecord error";
|
|
break;
|
|
}
|
|
|
|
if (record.type != wal::MXLogType::None) {
|
|
ExecWalRecord(record);
|
|
if (record.type == wal::MXLogType::Flush) {
|
|
// user req flush
|
|
flush_task_swn_.Notify();
|
|
|
|
// if user flush all manually, update auto flush also
|
|
if (record.collection_id.empty() && options_.auto_flush_interval_ > 0) {
|
|
next_auto_flush_time = get_next_auto_flush_time();
|
|
}
|
|
}
|
|
|
|
} else {
|
|
if (!initialized_.load(std::memory_order_acquire)) {
|
|
auto_flush();
|
|
WaitMergeFileFinish();
|
|
WaitBuildIndexFinish();
|
|
ENGINE_LOG_DEBUG << "WAL background thread exit";
|
|
break;
|
|
}
|
|
|
|
if (options_.auto_flush_interval_ > 0) {
|
|
bg_task_swn_.Wait_Until(next_auto_flush_time);
|
|
} else {
|
|
bg_task_swn_.Wait();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void
|
|
DBImpl::OnCacheInsertDataChanged(bool value) {
|
|
options_.insert_cache_immediately_ = value;
|
|
}
|
|
|
|
void
|
|
DBImpl::OnUseBlasThresholdChanged(int64_t threshold) {
|
|
faiss::distance_compute_blas_threshold = threshold;
|
|
}
|
|
|
|
} // namespace engine
|
|
} // namespace milvus
|