From f5c49d7cc967b85820b2987612c5a2e7c6b1f9a6 Mon Sep 17 00:00:00 2001 From: MrPresent-Han Date: Fri, 27 Dec 2024 01:13:11 -0500 Subject: [PATCH] enhance: refine array view to optimize memory usage(#38736) Signed-off-by: MrPresent-Han --- internal/core/src/common/Array.h | 147 +++++++++--------- internal/core/src/common/Chunk.cpp | 20 ++- internal/core/src/common/ChunkWriter.cpp | 28 ++-- internal/core/src/mmap/ChunkData.h | 36 +++-- internal/core/src/mmap/ChunkVector.h | 3 +- internal/core/src/mmap/Column.h | 20 ++- internal/core/src/mmap/Utils.h | 6 +- .../core/src/segcore/SegmentSealedImpl.cpp | 2 +- .../core/src/storage/MmapChunkManager.cpp | 4 +- internal/core/unittest/test_array.cpp | 55 ++++--- .../core/unittest/test_array_bitmap_index.cpp | 3 - 11 files changed, 183 insertions(+), 141 deletions(-) diff --git a/internal/core/src/common/Array.h b/internal/core/src/common/Array.h index 157fe78702818..bdf62ace88fdc 100644 --- a/internal/core/src/common/Array.h +++ b/internal/core/src/common/Array.h @@ -35,6 +35,27 @@ class Array { ~Array() { delete[] data_; + if (offsets_ptr_) { + // only deallocate offsets for string type array + delete[] offsets_ptr_; + } + } + + Array(char* data, + int len, + size_t size, + DataType element_type, + const uint32_t* offsets_ptr) + : size_(size), length_(len), element_type_(element_type) { + data_ = new char[size]; + std::copy(data, data + size, data_); + if (IsVariableDataType(element_type)) { + AssertInfo(offsets_ptr != nullptr, + "For variable type elements in array, offsets_ptr must " + "be non-null"); + offsets_ptr_ = new uint32_t[len]; + std::copy(offsets_ptr, offsets_ptr + len, offsets_ptr_); + } } explicit Array(const ScalarArray& field_data) { @@ -97,17 +118,19 @@ class Array { case ScalarArray::kStringData: { element_type_ = DataType::STRING; length_ = field_data.string_data().data().size(); - offsets_.reserve(length_); + offsets_ptr_ = new uint32_t[length_]; for (int i = 0; i < length_; ++i) { - offsets_.push_back(size_); - size_ += field_data.string_data().data(i).size(); + offsets_ptr_[i] = size_; + size_ += + field_data.string_data() + .data(i) + .size(); //type risk here between uint32_t vs size_t } - data_ = new char[size_]; for (int i = 0; i < length_; ++i) { std::copy_n(field_data.string_data().data(i).data(), field_data.string_data().data(i).size(), - data_ + offsets_[i]); + data_ + offsets_ptr_[i]); } break; } @@ -117,49 +140,39 @@ class Array { } } - Array(char* data, - size_t size, - DataType element_type, - std::vector&& element_offsets) - : size_(size), - offsets_(std::move(element_offsets)), - element_type_(element_type) { - delete[] data_; - data_ = new char[size]; - std::copy(data, data + size, data_); - if (IsVariableDataType(element_type_)) { - length_ = offsets_.size(); - } else { - // int8, int16, int32 are all promoted to int32 - if (element_type_ == DataType::INT8 || - element_type_ == DataType::INT16) { - length_ = size / sizeof(int32_t); - } else { - length_ = size / GetDataTypeSize(element_type_); - } - } - } - Array(const Array& array) noexcept : length_{array.length_}, size_{array.size_}, element_type_{array.element_type_} { - delete[] data_; data_ = new char[array.size_]; std::copy(array.data_, array.data_ + array.size_, data_); - offsets_ = array.offsets_; + if (IsVariableDataType(array.element_type_)) { + AssertInfo(array.get_offsets_data() != nullptr, + "for array with variable length elements, offsets_ptr" + "must not be nullptr"); + offsets_ptr_ = new uint32_t[length_]; + std::copy_n(array.get_offsets_data(), array.length(), offsets_ptr_); + } } Array& operator=(const Array& array) { delete[] data_; - - data_ = new char[array.size_]; - std::copy(array.data_, array.data_ + array.size_, data_); + if (offsets_ptr_) { + delete[] offsets_ptr_; + } length_ = array.length_; size_ = array.size_; - offsets_ = array.offsets_; element_type_ = array.element_type_; + data_ = new char[array.size_]; + std::copy(array.data_, array.data_ + array.size_, data_); + if (IsVariableDataType(array.get_element_type())) { + AssertInfo(array.get_offsets_data() != nullptr, + "for array with variable length elements, offsets_ptr" + "must not be nullptr"); + offsets_ptr_ = new uint32_t[length_]; + std::copy_n(array.get_offsets_data(), array.length(), offsets_ptr_); + } return *this; } @@ -241,10 +254,11 @@ class Array { length_); if constexpr (std::is_same_v || std::is_same_v) { - size_t element_length = (index == length_ - 1) - ? size_ - offsets_.back() - : offsets_[index + 1] - offsets_[index]; - return T(data_ + offsets_[index], element_length); + size_t element_length = + (index == length_ - 1) + ? size_ - offsets_ptr_[length_ - 1] + : offsets_ptr_[index + 1] - offsets_ptr_[index]; + return T(data_ + offsets_ptr_[index], element_length); } if constexpr (std::is_same_v || std::is_same_v || std::is_same_v || std::is_same_v || @@ -272,14 +286,9 @@ class Array { return reinterpret_cast(data_)[index]; } - const std::vector& - get_offsets() const { - return offsets_; - } - - std::vector - get_offsets_in_copy() const { - return offsets_; + uint32_t* + get_offsets_data() const { + return offsets_ptr_; } ScalarArray @@ -436,8 +445,8 @@ class Array { char* data_{nullptr}; int length_ = 0; int size_ = 0; - std::vector offsets_{}; DataType element_type_ = DataType::NONE; + uint32_t* offsets_ptr_{nullptr}; }; class ArrayView { @@ -445,23 +454,21 @@ class ArrayView { ArrayView() = default; ArrayView(char* data, + int len, size_t size, DataType element_type, - std::vector&& element_offsets) - : size_(size), - offsets_(std::move(element_offsets)), - element_type_(element_type) { - data_ = data; + uint32_t* offsets_ptr) + : data_(data), + length_(len), + size_(size), + element_type_(element_type), + offsets_ptr_(offsets_ptr) { + AssertInfo(data != nullptr, + "data pointer for ArrayView cannot be nullptr"); if (IsVariableDataType(element_type_)) { - length_ = offsets_.size(); - } else { - // int8, int16, int32 are all promoted to int32 - if (element_type_ == DataType::INT8 || - element_type_ == DataType::INT16) { - length_ = size / sizeof(int32_t); - } else { - length_ = size / GetDataTypeSize(element_type_); - } + AssertInfo(offsets_ptr != nullptr, + "for array with variable length elements, offsets_ptr " + "must not be nullptr"); } } @@ -475,10 +482,11 @@ class ArrayView { if constexpr (std::is_same_v || std::is_same_v) { - size_t element_length = (index == length_ - 1) - ? size_ - offsets_.back() - : offsets_[index + 1] - offsets_[index]; - return T(data_ + offsets_[index], element_length); + size_t element_length = + (index == length_ - 1) + ? size_ - offsets_ptr_[length_ - 1] + : offsets_ptr_[index + 1] - offsets_ptr_[index]; + return T(data_ + offsets_ptr_[index], element_length); } if constexpr (std::is_same_v || std::is_same_v || std::is_same_v || std::is_same_v) { @@ -580,11 +588,6 @@ class ArrayView { data() const { return data_; } - // copy to result - std::vector - get_offsets_in_copy() const { - return offsets_; - } bool is_same_array(const proto::plan::Array& arr2) const { @@ -661,8 +664,10 @@ class ArrayView { char* data_{nullptr}; int length_ = 0; int size_ = 0; - std::vector offsets_{}; DataType element_type_ = DataType::NONE; + + //offsets ptr + uint32_t* offsets_ptr_{nullptr}; }; } // namespace milvus diff --git a/internal/core/src/common/Chunk.cpp b/internal/core/src/common/Chunk.cpp index 4b5c17ac1df6e..4cf10955c3f6d 100644 --- a/internal/core/src/common/Chunk.cpp +++ b/internal/core/src/common/Chunk.cpp @@ -15,6 +15,7 @@ #include "common/Span.h" #include "common/Types.h" #include "common/Chunk.h" +#include "log/Log.h" namespace milvus { @@ -51,21 +52,18 @@ ArrayChunk::ConstructViews() { int offset = offsets_lens_[2 * i]; int next_offset = offsets_lens_[2 * (i + 1)]; int len = offsets_lens_[2 * i + 1]; - auto data_ptr = data_ + offset; - auto offsets_len = 0; - std::vector element_indices = {}; + auto offsets_bytes_len = 0; + uint32_t* offsets_ptr = nullptr; if (IsStringDataType(element_type_)) { - offsets_len = len * sizeof(uint64_t); - std::vector tmp( - reinterpret_cast(data_ptr), - reinterpret_cast(data_ptr + offsets_len)); - element_indices = std::move(tmp); + offsets_bytes_len = len * sizeof(uint32_t); + offsets_ptr = reinterpret_cast(data_ptr); } - views_.emplace_back(data_ptr + offsets_len, - next_offset - offset - offsets_len, + views_.emplace_back(data_ptr + offsets_bytes_len, + len, + next_offset - offset - offsets_bytes_len, element_type_, - std::move(element_indices)); + offsets_ptr); } } diff --git a/internal/core/src/common/ChunkWriter.cpp b/internal/core/src/common/ChunkWriter.cpp index dc2d9e4bfe45e..ac4ebd877a71c 100644 --- a/internal/core/src/common/ChunkWriter.cpp +++ b/internal/core/src/common/ChunkWriter.cpp @@ -205,32 +205,32 @@ ArrayChunkWriter::write(std::shared_ptr data) { int offsets_num = row_nums_ + 1; int len_num = row_nums_; - int offset_start_pos = - target_->tell() + sizeof(uint64_t) * (offsets_num + len_num); - std::vector offsets; - std::vector lens; - for (auto& arr : arrays) { - offsets.push_back(offset_start_pos); - lens.push_back(arr.length()); - offset_start_pos += - is_string ? sizeof(uint64_t) * arr.get_offsets().size() : 0; + uint32_t offset_start_pos = + target_->tell() + sizeof(uint32_t) * (offsets_num + len_num); + std::vector offsets(offsets_num); + std::vector lens(len_num); + for (auto i = 0; i < arrays.size(); i++) { + auto& arr = arrays[i]; + offsets[i] = offset_start_pos; + lens[i] = arr.length(); + offset_start_pos += is_string ? sizeof(uint32_t) * lens[i] : 0; offset_start_pos += arr.byte_size(); } offsets.push_back(offset_start_pos); for (int i = 0; i < offsets.size(); i++) { if (i == offsets.size() - 1) { - target_->write(&offsets[i], sizeof(uint64_t)); + target_->write(&offsets[i], sizeof(uint32_t)); break; } - target_->write(&offsets[i], sizeof(uint64_t)); - target_->write(&lens[i], sizeof(uint64_t)); + target_->write(&offsets[i], sizeof(uint32_t)); + target_->write(&lens[i], sizeof(uint32_t)); } for (auto& arr : arrays) { if (is_string) { - target_->write(arr.get_offsets().data(), - arr.get_offsets().size() * sizeof(uint64_t)); + target_->write(arr.get_offsets_data(), + arr.length() * sizeof(uint32_t)); } target_->write(arr.data(), arr.byte_size()); } diff --git a/internal/core/src/mmap/ChunkData.h b/internal/core/src/mmap/ChunkData.h index ec70d94ab6423..842a3792b3dbc 100644 --- a/internal/core/src/mmap/ChunkData.h +++ b/internal/core/src/mmap/ChunkData.h @@ -191,21 +191,35 @@ VariableLengthChunk::set(const Array* src, begin, size_); size_t total_size = 0; - size_t padding_size = 0; for (auto i = 0; i < length; i++) { - total_size += src[i].byte_size() + padding_size; + total_size += src[i].byte_size(); } + if (length > 0 && IsVariableDataType(src[0].get_element_type())) { + for (auto i = 0; i < length; i++) { + total_size += (src[i].length() * sizeof(uint32_t)); + } + } + auto buf = (char*)mcm->Allocate(mmap_descriptor_, total_size); AssertInfo(buf != nullptr, "failed to allocate memory from mmap_manager."); - for (auto i = 0, offset = 0; i < length; i++) { - auto data_size = src[i].byte_size() + padding_size; - char* data_ptr = buf + offset; - std::copy(src[i].data(), src[i].data() + src[i].byte_size(), data_ptr); - data_[i + begin] = ArrayView(data_ptr, - data_size, - src[i].get_element_type(), - src[i].get_offsets_in_copy()); - offset += data_size; + char* data_ptr = buf; + for (auto i = 0; i < length; i++) { + int length = src[i].length(); + uint32_t* src_offsets_ptr = src[i].get_offsets_data(); + auto element_type = src[i].get_element_type(); + // need copy offsets for variable types + uint32_t* target_offsets_ptr = nullptr; + if (IsVariableDataType(element_type)) { + target_offsets_ptr = reinterpret_cast(data_ptr); + std::copy( + src_offsets_ptr, src_offsets_ptr + length, target_offsets_ptr); + data_ptr += length * sizeof(uint32_t); + } + auto data_size = src[i].byte_size(); + std::copy(src[i].data(), src[i].data() + data_size, data_ptr); + data_[i + begin] = ArrayView( + data_ptr, length, data_size, element_type, target_offsets_ptr); + data_ptr += data_size; } } diff --git a/internal/core/src/mmap/ChunkVector.h b/internal/core/src/mmap/ChunkVector.h index 74341195c8edc..5c0a2b4de828c 100644 --- a/internal/core/src/mmap/ChunkVector.h +++ b/internal/core/src/mmap/ChunkVector.h @@ -119,9 +119,10 @@ class ThreadSafeChunkVector : public ChunkVectorBase { } else if constexpr (std::is_same_v) { auto& src = chunk[chunk_offset]; return ArrayView(const_cast(src.data()), + src.length(), src.byte_size(), src.get_element_type(), - src.get_offsets_in_copy()); + src.get_offsets_data()); } else { return chunk[chunk_offset]; } diff --git a/internal/core/src/mmap/Column.h b/internal/core/src/mmap/Column.h index 0862f53b052de..e1034528e8915 100644 --- a/internal/core/src/mmap/Column.h +++ b/internal/core/src/mmap/Column.h @@ -918,7 +918,15 @@ class SingleChunkArrayColumn : public SingleChunkColumnBase { void Append(const Array& array, bool valid_data = false) { indices_.emplace_back(data_size_); - element_indices_.emplace_back(array.get_offsets()); + if (IsVariableDataType(array.get_element_type())) { + element_indices_.emplace_back( + array.get_offsets_data(), + array.get_offsets_data() + array.length()); + } else { + element_indices_.emplace_back(); + } + + // have to copy element offsets from external array if (nullable_) { return SingleChunkColumnBase::Append( static_cast(array.data()), @@ -931,7 +939,7 @@ class SingleChunkArrayColumn : public SingleChunkColumnBase { void Seal(std::vector&& indices = {}, - std::vector>&& element_indices = {}) { + std::vector>&& element_indices = {}) { if (!indices.empty()) { indices_ = std::move(indices); element_indices_ = std::move(element_indices); @@ -946,20 +954,22 @@ class SingleChunkArrayColumn : public SingleChunkColumnBase { views_.reserve(indices_.size()); for (size_t i = 0; i < indices_.size() - 1; i++) { views_.emplace_back(data_ + indices_[i], + element_indices_[i].size(), indices_[i + 1] - indices_[i], element_type_, - std::move(element_indices_[i])); + element_indices_[i].data()); } views_.emplace_back(data_ + indices_.back(), + element_indices_[indices_.size() - 1].size(), data_size_ - indices_.back(), element_type_, - std::move(element_indices_[indices_.size() - 1])); + element_indices_[indices_.size() - 1].data()); element_indices_.clear(); } private: std::vector indices_{}; - std::vector> element_indices_{}; + std::vector> element_indices_{}; // Compatible with current Span type std::vector views_{}; DataType element_type_; diff --git a/internal/core/src/mmap/Utils.h b/internal/core/src/mmap/Utils.h index c93165df31812..a7a4acc3a3cbc 100644 --- a/internal/core/src/mmap/Utils.h +++ b/internal/core/src/mmap/Utils.h @@ -90,7 +90,7 @@ WriteFieldData(File& file, const FieldDataPtr& data, uint64_t& total_written, std::vector& indices, - std::vector>& element_indices, + std::vector>& element_indices, FixedVector& valid_data) { if (IsVariableDataType(data_type)) { // use buffered writer to reduce fwrite/write syscall @@ -131,7 +131,9 @@ WriteFieldData(File& file, indices.push_back(total_written); auto array = static_cast(data->RawValue(i)); bw.Write(array->data(), array->byte_size()); - element_indices.emplace_back(array->get_offsets()); + element_indices.emplace_back( + array->get_offsets_data(), + array->get_offsets_data() + array->length()); total_written += array->byte_size(); } break; diff --git a/internal/core/src/segcore/SegmentSealedImpl.cpp b/internal/core/src/segcore/SegmentSealedImpl.cpp index ee8652da06d50..d8145859d0360 100644 --- a/internal/core/src/segcore/SegmentSealedImpl.cpp +++ b/internal/core/src/segcore/SegmentSealedImpl.cpp @@ -544,7 +544,7 @@ SegmentSealedImpl::MapFieldData(const FieldId field_id, FieldDataInfo& data) { FieldDataPtr field_data; uint64_t total_written = 0; std::vector indices{}; - std::vector> element_indices{}; + std::vector> element_indices{}; FixedVector valid_data{}; while (data.channel->pop(field_data)) { WriteFieldData(file, diff --git a/internal/core/src/storage/MmapChunkManager.cpp b/internal/core/src/storage/MmapChunkManager.cpp index 935e9db2e8260..44547491b4e0a 100644 --- a/internal/core/src/storage/MmapChunkManager.cpp +++ b/internal/core/src/storage/MmapChunkManager.cpp @@ -169,8 +169,10 @@ MmapBlocksHandler::AllocateLargeBlock(const uint64_t size) { if (size + Size() > max_disk_limit_) { PanicInfo(ErrorCode::MemAllocateSizeNotMatch, "Failed to create a new mmap_block, not enough disk for " - "create a new mmap block. Allocated size: {}, Max size: {} " + "create a new mmap block. To Allocate:{} Allocated size: {}, " + "Max size: {} " "under mmap file_prefix: {}", + size, Size(), max_disk_limit_, mmap_file_prefix_); diff --git a/internal/core/unittest/test_array.cpp b/internal/core/unittest/test_array.cpp index 37caa3b64c555..c436a5ea95dc7 100644 --- a/internal/core/unittest/test_array.cpp +++ b/internal/core/unittest/test_array.cpp @@ -18,6 +18,7 @@ TEST(Array, TestConstructArray) { using namespace milvus; int N = 10; + // 1. test int milvus::proto::schema::ScalarField field_int_data; milvus::proto::plan::Array field_int_array; field_int_array.set_same_type(true); @@ -33,28 +34,33 @@ TEST(Array, TestConstructArray) { } ASSERT_TRUE(int_array.is_same_array(field_int_array)); auto int_array_tmp = Array(const_cast(int_array.data()), + int_array.length(), int_array.byte_size(), int_array.get_element_type(), - {}); + int_array.get_offsets_data()); auto int_8_array = Array(const_cast(int_array.data()), + int_array.length(), int_array.byte_size(), DataType::INT8, - {}); + int_array.get_offsets_data()); ASSERT_EQ(int_array.length(), int_8_array.length()); auto int_16_array = Array(const_cast(int_array.data()), + int_array.length(), int_array.byte_size(), DataType::INT16, - {}); + int_array.get_offsets_data()); ASSERT_EQ(int_array.length(), int_16_array.length()); ASSERT_TRUE(int_array_tmp == int_array); auto int_array_view = ArrayView(const_cast(int_array.data()), + int_array.length(), int_array.byte_size(), int_array.get_element_type(), - {}); + int_array.get_offsets_data()); ASSERT_EQ(int_array.length(), int_array_view.length()); ASSERT_EQ(int_array.byte_size(), int_array_view.byte_size()); ASSERT_EQ(int_array.get_element_type(), int_array_view.get_element_type()); + // 2. test long milvus::proto::schema::ScalarField field_long_data; milvus::proto::plan::Array field_long_array; field_long_array.set_same_type(true); @@ -70,19 +76,22 @@ TEST(Array, TestConstructArray) { } ASSERT_TRUE(long_array.is_same_array(field_int_array)); auto long_array_tmp = Array(const_cast(long_array.data()), + long_array.length(), long_array.byte_size(), long_array.get_element_type(), - {}); + long_array.get_offsets_data()); ASSERT_TRUE(long_array_tmp == long_array); auto long_array_view = ArrayView(const_cast(long_array.data()), + long_array.length(), long_array.byte_size(), long_array.get_element_type(), - {}); + long_array.get_offsets_data()); ASSERT_EQ(long_array.length(), long_array_view.length()); ASSERT_EQ(long_array.byte_size(), long_array_view.byte_size()); ASSERT_EQ(long_array.get_element_type(), long_array_view.get_element_type()); + // 3. test string milvus::proto::schema::ScalarField field_string_data; milvus::proto::plan::Array field_string_array; field_string_array.set_same_type(true); @@ -94,32 +103,28 @@ TEST(Array, TestConstructArray) { } auto string_array = Array(field_string_data); ASSERT_EQ(N, string_array.length()); - // ASSERT_EQ(N, string_array.size()); for (int i = 0; i < N; ++i) { ASSERT_EQ(string_array.get_data(i), std::to_string(i)); } ASSERT_TRUE(string_array.is_same_array(field_string_array)); - std::vector string_element_offsets; - std::vector string_view_element_offsets; - for (auto& offset : string_array.get_offsets()) { - string_element_offsets.emplace_back(offset); - string_view_element_offsets.emplace_back(offset); - } auto string_array_tmp = Array(const_cast(string_array.data()), + string_array.length(), string_array.byte_size(), string_array.get_element_type(), - std::move(string_element_offsets)); + string_array.get_offsets_data()); ASSERT_TRUE(string_array_tmp == string_array); auto string_array_view = ArrayView(const_cast(string_array.data()), + string_array.length(), string_array.byte_size(), string_array.get_element_type(), - std::move(string_view_element_offsets)); + string_array.get_offsets_data()); ASSERT_EQ(string_array.length(), string_array_view.length()); ASSERT_EQ(string_array.byte_size(), string_array_view.byte_size()); ASSERT_EQ(string_array.get_element_type(), string_array_view.get_element_type()); + // 4. test bool milvus::proto::schema::ScalarField field_bool_data; milvus::proto::plan::Array field_bool_array; field_bool_array.set_same_type(true); @@ -135,19 +140,22 @@ TEST(Array, TestConstructArray) { } ASSERT_TRUE(bool_array.is_same_array(field_bool_array)); auto bool_array_tmp = Array(const_cast(bool_array.data()), + bool_array.length(), bool_array.byte_size(), bool_array.get_element_type(), - {}); + bool_array.get_offsets_data()); ASSERT_TRUE(bool_array_tmp == bool_array); auto bool_array_view = ArrayView(const_cast(bool_array.data()), + bool_array.length(), bool_array.byte_size(), bool_array.get_element_type(), - {}); + bool_array.get_offsets_data()); ASSERT_EQ(bool_array.length(), bool_array_view.length()); ASSERT_EQ(bool_array.byte_size(), bool_array_view.byte_size()); ASSERT_EQ(bool_array.get_element_type(), bool_array_view.get_element_type()); + //5. test float milvus::proto::schema::ScalarField field_float_data; milvus::proto::plan::Array field_float_array; field_float_array.set_same_type(true); @@ -163,19 +171,22 @@ TEST(Array, TestConstructArray) { } ASSERT_TRUE(float_array.is_same_array(field_float_array)); auto float_array_tmp = Array(const_cast(float_array.data()), + float_array.length(), float_array.byte_size(), float_array.get_element_type(), - {}); + float_array.get_offsets_data()); ASSERT_TRUE(float_array_tmp == float_array); auto float_array_view = ArrayView(const_cast(float_array.data()), + float_array.length(), float_array.byte_size(), float_array.get_element_type(), - {}); + float_array.get_offsets_data()); ASSERT_EQ(float_array.length(), float_array_view.length()); ASSERT_EQ(float_array.byte_size(), float_array_view.byte_size()); ASSERT_EQ(float_array.get_element_type(), float_array_view.get_element_type()); + //6. test double milvus::proto::schema::ScalarField field_double_data; milvus::proto::plan::Array field_double_array; field_double_array.set_same_type(true); @@ -192,14 +203,16 @@ TEST(Array, TestConstructArray) { } ASSERT_TRUE(double_array.is_same_array(field_double_array)); auto double_array_tmp = Array(const_cast(double_array.data()), + double_array.length(), double_array.byte_size(), double_array.get_element_type(), - {}); + double_array.get_offsets_data()); ASSERT_TRUE(double_array_tmp == double_array); auto double_array_view = ArrayView(const_cast(double_array.data()), + double_array.length(), double_array.byte_size(), double_array.get_element_type(), - {}); + double_array.get_offsets_data()); ASSERT_EQ(double_array.length(), double_array_view.length()); ASSERT_EQ(double_array.byte_size(), double_array_view.byte_size()); ASSERT_EQ(double_array.get_element_type(), diff --git a/internal/core/unittest/test_array_bitmap_index.cpp b/internal/core/unittest/test_array_bitmap_index.cpp index b6cad45ce8bdc..b9e17a0a9df76 100644 --- a/internal/core/unittest/test_array_bitmap_index.cpp +++ b/internal/core/unittest/test_array_bitmap_index.cpp @@ -211,7 +211,6 @@ class ArrayBitmapIndexTest : public testing::Test { insert_data.SetTimestamps(0, 100); auto serialized_bytes = insert_data.Serialize(storage::Remote); - auto log_path = fmt::format("/{}/{}/{}/{}/{}/{}", "/tmp/test_array_bitmap", collection_id, @@ -221,7 +220,6 @@ class ArrayBitmapIndexTest : public testing::Test { 0); chunk_manager_->Write( log_path, serialized_bytes.data(), serialized_bytes.size()); - storage::FileManagerContext ctx(field_meta, index_meta, chunk_manager_); std::vector index_files; @@ -241,7 +239,6 @@ class ArrayBitmapIndexTest : public testing::Test { index_files.push_back(key); } } - index::CreateIndexInfo index_info{}; index_info.index_type = milvus::index::HYBRID_INDEX_TYPE; index_info.field_type = DataType::ARRAY;