From b576bd6f1fab62eb644720a1d0cf47ff92cf54d7 Mon Sep 17 00:00:00 2001 From: Yu Kun Date: Fri, 23 Aug 2019 11:15:14 +0800 Subject: [PATCH] modify GpuCacheMgr GetInsatnce Former-commit-id: 7323d4a63e58a6e70f8d47f6b2fbe9566197013c --- cpp/src/cache/Cache.h | 4 -- cpp/src/cache/CacheMgr.cpp | 19 ---------- cpp/src/cache/CacheMgr.h | 2 - cpp/src/cache/GpuCacheMgr.cpp | 38 +++++++++++-------- cpp/src/cache/GpuCacheMgr.h | 12 ++++-- .../examples/grpcsimple/src/ClientTest.cpp | 3 -- cpp/src/server/grpc_impl/GrpcRequestTask.cpp | 23 +++++------ cpp/unittest/server/cache_test.cpp | 2 +- 8 files changed, 44 insertions(+), 59 deletions(-) diff --git a/cpp/src/cache/Cache.h b/cpp/src/cache/Cache.h index 6151718530..4d6f32b9eb 100644 --- a/cpp/src/cache/Cache.h +++ b/cpp/src/cache/Cache.h @@ -46,9 +46,6 @@ public: double freemem_percent() const { return freemem_percent_; }; void set_freemem_percent(double percent) { freemem_percent_ = percent; } - void set_gpu_ids(std::vector& gpu_ids) { gpu_ids_ = gpu_ids; } - - std::vector gpu_ids() const { return gpu_ids_; } size_t size() const; bool exists(const std::string& key); @@ -63,7 +60,6 @@ private: int64_t usage_; int64_t capacity_; double freemem_percent_; - std::vector gpu_ids_; LRU lru_; mutable std::mutex mutex_; diff --git a/cpp/src/cache/CacheMgr.cpp b/cpp/src/cache/CacheMgr.cpp index eb3980da61..977c7e1c42 100644 --- a/cpp/src/cache/CacheMgr.cpp +++ b/cpp/src/cache/CacheMgr.cpp @@ -56,7 +56,6 @@ engine::VecIndexPtr CacheMgr::GetIndex(const std::string& key) { } void CacheMgr::InsertItem(const std::string& key, const DataObjPtr& data) { - std::cout << "dashalk\n"; if(cache_ == nullptr) { SERVER_LOG_ERROR << "Cache doesn't exist"; return; @@ -131,24 +130,6 @@ void CacheMgr::SetCapacity(int64_t capacity) { cache_->set_capacity(capacity); } -std::vector CacheMgr::GpuIds() const { - if(cache_ == nullptr) { - SERVER_LOG_ERROR << "Cache doesn't exist"; - std::vector gpu_ids; - return gpu_ids; - } - - return cache_->gpu_ids(); -} - -void CacheMgr::SetGpuIds(std::vector gpu_ids){ - if(cache_ == nullptr) { - SERVER_LOG_ERROR << "Cache doesn't exist"; - return; - } - cache_->set_gpu_ids(gpu_ids); -} - } } } diff --git a/cpp/src/cache/CacheMgr.h b/cpp/src/cache/CacheMgr.h index 9abb30b92f..b6f1ec8ef1 100644 --- a/cpp/src/cache/CacheMgr.h +++ b/cpp/src/cache/CacheMgr.h @@ -33,8 +33,6 @@ public: int64_t CacheUsage() const; int64_t CacheCapacity() const; void SetCapacity(int64_t capacity); - std::vector GpuIds() const; - void SetGpuIds(std::vector gpu_ids); protected: CacheMgr(); diff --git a/cpp/src/cache/GpuCacheMgr.cpp b/cpp/src/cache/GpuCacheMgr.cpp index eb6b1dbeb7..4aa5626348 100644 --- a/cpp/src/cache/GpuCacheMgr.cpp +++ b/cpp/src/cache/GpuCacheMgr.cpp @@ -4,6 +4,7 @@ // Proprietary and confidential. //////////////////////////////////////////////////////////////////////////////// +#include #include "utils/Log.h" #include "GpuCacheMgr.h" #include "server/ServerConfig.h" @@ -18,34 +19,39 @@ std::unordered_map GpuCacheMgr::instance_; namespace { constexpr int64_t unit = 1024 * 1024 * 1024; - void parse_gpu_ids(std::string gpu_ids_str, std::vector& gpu_ids) { - for (auto i = 0; i < gpu_ids_str.length(); ) { - if (gpu_ids_str[i] != ',') { - int id = 0; - while (gpu_ids_str[i] <= '9' && gpu_ids_str[i] >= '0') { - id = id * 10 + gpu_ids_str[i] - '0'; - ++i; - } - gpu_ids.push_back(id); - } else { - ++i; + std::vector load() { + server::ConfigNode& config = server::ServerConfig::GetInstance().GetConfig(server::CONFIG_CACHE); + std::string gpu_ids_str = config.GetValue(server::CONFIG_GPU_IDS, "0,1"); + + std::vector gpu_ids; + + std::stringstream ss(gpu_ids_str); + for (int i; ss >> i;) { + gpu_ids.push_back(i); + if (ss.peek() == ',') { + ss.ignore(); } } + return gpu_ids; } } + +bool GpuCacheMgr::GpuIdInConfig(uint64_t gpu_id) { + static std::vector ids = load(); + for (auto id : ids) { + if (gpu_id == id) return true; + } + return false; +} + GpuCacheMgr::GpuCacheMgr() { server::ConfigNode& config = server::ServerConfig::GetInstance().GetConfig(server::CONFIG_CACHE); - std::string gpu_ids_str = config.GetValue(server::CONFIG_GPU_IDS, "0,1"); int64_t cap = config.GetInt64Value(server::CONFIG_GPU_CACHE_CAPACITY, 2); cap *= unit; cache_ = std::make_shared(cap, 1UL<<32); - std::vector gpu_ids; - parse_gpu_ids(gpu_ids_str, gpu_ids); - cache_->set_gpu_ids(gpu_ids); - double free_percent = config.GetDoubleValue(server::GPU_CACHE_FREE_PERCENT, 0.85); if (free_percent > 0.0 && free_percent <= 1.0) { cache_->set_freemem_percent(free_percent); diff --git a/cpp/src/cache/GpuCacheMgr.h b/cpp/src/cache/GpuCacheMgr.h index 8c6a0c012c..f26dfaa1b7 100644 --- a/cpp/src/cache/GpuCacheMgr.h +++ b/cpp/src/cache/GpuCacheMgr.h @@ -19,12 +19,18 @@ class GpuCacheMgr : public CacheMgr { public: GpuCacheMgr(); -public: + static bool GpuIdInConfig(uint64_t gpu_id); + static CacheMgr* GetInstance(uint64_t gpu_id) { if (instance_.find(gpu_id) == instance_.end()) { std::lock_guard lock(mutex_); - instance_.insert(std::pair(gpu_id, std::make_shared())); -// instance_[gpu_id] = std::make_shared(); + if (instance_.find(gpu_id) == instance_.end()) { + if (GpuIdInConfig(gpu_id)) { + instance_.insert(std::pair(gpu_id, std::make_shared())); + } else { + return nullptr; + } + } } return instance_[gpu_id].get(); } diff --git a/cpp/src/sdk/examples/grpcsimple/src/ClientTest.cpp b/cpp/src/sdk/examples/grpcsimple/src/ClientTest.cpp index 1e44c0e469..f30a23e174 100644 --- a/cpp/src/sdk/examples/grpcsimple/src/ClientTest.cpp +++ b/cpp/src/sdk/examples/grpcsimple/src/ClientTest.cpp @@ -263,9 +263,6 @@ ClientTest::Test(const std::string& address, const std::string& port) { search_record_array.push_back( std::make_pair(record_ids[SEARCH_TARGET], record_array[SEARCH_TARGET])); } - int64_t row_count; - conn->CountTable(TABLE_NAME, row_count); - std::cout << "\t" << TABLE_NAME << "(" << row_count << " rows)" << std::endl; } } diff --git a/cpp/src/server/grpc_impl/GrpcRequestTask.cpp b/cpp/src/server/grpc_impl/GrpcRequestTask.cpp index e10d2ae070..8a6ce0c298 100644 --- a/cpp/src/server/grpc_impl/GrpcRequestTask.cpp +++ b/cpp/src/server/grpc_impl/GrpcRequestTask.cpp @@ -448,18 +448,19 @@ InsertTask::OnExecute() { // TODO: change to one dimension array in protobuf or use multiple-thread to copy the data for (size_t i = 0; i < insert_param_.row_record_array_size(); i++) { + if (insert_param_.row_record_array(i).vector_data().empty()) { + return SetError(SERVER_INVALID_ROWRECORD_ARRAY, "Row record float array is empty"); + } + uint64_t vec_dim = insert_param_.row_record_array(i).vector_data().size(); + if (vec_dim != table_info.dimension_) { + ServerError error_code = SERVER_INVALID_VECTOR_DIMENSION; + std::string error_msg = "Invalid rowrecord dimension: " + std::to_string(vec_dim) + + " vs. table dimension:" + + std::to_string(table_info.dimension_); + return SetError(error_code, error_msg); + } + //TODO: use memcpy for (size_t j = 0; j < table_info.dimension_; j++) { - if (insert_param_.row_record_array(i).vector_data().empty()) { - return SetError(SERVER_INVALID_ROWRECORD_ARRAY, "Row record float array is empty"); - } - uint64_t vec_dim = insert_param_.row_record_array(i).vector_data().size(); - if (vec_dim != table_info.dimension_) { - ServerError error_code = SERVER_INVALID_VECTOR_DIMENSION; - std::string error_msg = "Invalid rowrecord dimension: " + std::to_string(vec_dim) - + " vs. table dimension:" + - std::to_string(table_info.dimension_); - return SetError(error_code, error_msg); - } vec_f[i * table_info.dimension_ + j] = insert_param_.row_record_array(i).vector_data(j); } } diff --git a/cpp/unittest/server/cache_test.cpp b/cpp/unittest/server/cache_test.cpp index a4e19f0a98..d52e34143a 100644 --- a/cpp/unittest/server/cache_test.cpp +++ b/cpp/unittest/server/cache_test.cpp @@ -165,8 +165,8 @@ TEST(CacheTest, GPU_CACHE_TEST) { gpu_mgr->ClearCache(); ASSERT_EQ(gpu_mgr->ItemCount(), 0); - gpu_mgr->SetCapacity(4096000000); for (auto i = 0; i < 3; i++) { + // TODO: use gpu index to mock MockVecIndex *mock_index = new MockVecIndex(); mock_index->ntotal_ = 1000000; //2G engine::VecIndexPtr index(mock_index);