// Licensed to the LF AI & Data foundation under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include #include "storage/DataCodec.h" #include "storage/InsertData.h" #include "storage/IndexData.h" #include "storage/Util.h" #include "common/Consts.h" #include "utils/Json.h" using namespace milvus; TEST(storage, InsertDataBool) { FixedVector data = {true, false, true, false, true}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::BOOL); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::BOOL); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataInt8) { FixedVector data = {1, 2, 3, 4, 5}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::INT8); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::INT8); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataInt16) { FixedVector data = {1, 2, 3, 4, 5}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::INT16); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::INT16); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataInt32) { FixedVector data = {true, false, true, false, true}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::INT32); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::INT32); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataInt64) { FixedVector data = {1, 2, 3, 4, 5}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::INT64); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::INT64); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataString) { FixedVector data = { "test1", "test2", "test3", "test4", "test5"}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::VARCHAR); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::VARCHAR); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); for (int i = 0; i < data.size(); ++i) { new_data[i] = *static_cast(new_payload->RawValue(i)); ASSERT_EQ(new_payload->Size(i), data[i].size()); } ASSERT_EQ(data, new_data); } TEST(storage, InsertDataFloat) { FixedVector data = {1, 2, 3, 4, 5}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::FLOAT); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::FLOAT); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataDouble) { FixedVector data = {1.0, 2.0, 3.0, 4.2, 5.3}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::DOUBLE); field_data->FillFieldData(data.data(), data.size()); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::DOUBLE); ASSERT_EQ(new_payload->get_num_rows(), data.size()); FixedVector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataFloatVector) { std::vector data = {1, 2, 3, 4, 5, 6, 7, 8}; int DIM = 2; auto field_data = milvus::storage::CreateFieldData(storage::DataType::VECTOR_FLOAT, DIM); field_data->FillFieldData(data.data(), data.size() / DIM); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::VECTOR_FLOAT); ASSERT_EQ(new_payload->get_num_rows(), data.size() / DIM); std::vector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->get_num_rows() * sizeof(float) * DIM); ASSERT_EQ(data, new_data); } TEST(storage, InsertDataBinaryVector) { std::vector data = {1, 2, 3, 4, 5, 6, 7, 8}; int DIM = 16; auto field_data = milvus::storage::CreateFieldData(storage::DataType::VECTOR_BINARY, DIM); field_data->FillFieldData(data.data(), data.size() * 8 / DIM); storage::InsertData insert_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; insert_data.SetFieldDataMeta(field_data_meta); insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_insert_data = storage::DeserializeFileData( serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_insert_data->GetCodecType(), storage::InsertDataType); ASSERT_EQ(new_insert_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_payload = new_insert_data->GetFieldData(); ASSERT_EQ(new_payload->get_data_type(), storage::DataType::VECTOR_BINARY); ASSERT_EQ(new_payload->get_num_rows(), data.size() * 8 / DIM); std::vector new_data(data.size()); memcpy(new_data.data(), new_payload->Data(), new_payload->Size()); ASSERT_EQ(data, new_data); } TEST(storage, IndexData) { std::vector data = {1, 2, 3, 4, 5, 6, 7, 8}; auto field_data = milvus::storage::CreateFieldData(storage::DataType::INT8); field_data->FillFieldData(data.data(), data.size()); storage::IndexData index_data(field_data); storage::FieldDataMeta field_data_meta{100, 101, 102, 103}; index_data.SetFieldDataMeta(field_data_meta); index_data.SetTimestamps(0, 100); storage::IndexMeta index_meta{102, 103, 104, 1}; index_data.set_index_meta(index_meta); auto serialized_bytes = index_data.Serialize(storage::StorageType::Remote); std::shared_ptr serialized_data_ptr(serialized_bytes.data(), [&](uint8_t*) {}); auto new_index_data = storage::DeserializeFileData(serialized_data_ptr, serialized_bytes.size()); ASSERT_EQ(new_index_data->GetCodecType(), storage::IndexDataType); ASSERT_EQ(new_index_data->GetTimeRage(), std::make_pair(Timestamp(0), Timestamp(100))); auto new_field_data = new_index_data->GetFieldData(); ASSERT_EQ(new_field_data->get_data_type(), storage::DataType::INT8); ASSERT_EQ(new_field_data->Size(), data.size()); std::vector new_data(data.size()); memcpy(new_data.data(), new_field_data->Data(), new_field_data->Size()); ASSERT_EQ(data, new_data); }