From d94433ae07c9e7df10c9ac5366a91f530f0f1024 Mon Sep 17 00:00:00 2001 From: Theodore Tsirpanis Date: Wed, 14 Aug 2024 13:15:23 +0300 Subject: [PATCH 1/2] Remove unused `FragmentMetadata::bounding_coords_` field. (#5213) [SC-51602](https://app.shortcut.com/tiledb-inc/story/51602/remove-unused-fragmentmetadata-bounding-coords-field) This field existed in very old pre-2.0 storage format versions and is no longer used by the Core. It is removed from the `FragmentMetadata` class and the `load_bounding_coords` method was updated to skip over these bytes, using a new method added to `Deserializer`. --- TYPE: NO_HISTORY --- tiledb/sm/fragment/fragment_metadata.cc | 17 +++++++---------- tiledb/sm/fragment/fragment_metadata.h | 3 --- .../storage_format/serialization/serializers.h | 15 +++++++++++++++ 3 files changed, 22 insertions(+), 13 deletions(-) diff --git a/tiledb/sm/fragment/fragment_metadata.cc b/tiledb/sm/fragment/fragment_metadata.cc index 5cf2cf3ded4..27bb0498253 100644 --- a/tiledb/sm/fragment/fragment_metadata.cc +++ b/tiledb/sm/fragment/fragment_metadata.cc @@ -1938,22 +1938,19 @@ void FragmentMetadata::expand_non_empty_domain(const NDRange& mbr) { // ===== FORMAT ===== // bounding_coords_num (uint64_t) -// bounding_coords_#1 (void*) bounding_coords_#2 (void*) ... +// bounding_coords_#1 (dim_type[2][n_dims]) +// bounding_coords_#2 (dim_type[2][n_dims]) +// ... +// Note: This version supports only dimensions domains with the same type void FragmentMetadata::load_bounding_coords(Deserializer& deserializer) { // Get number of bounding coordinates - uint64_t bounding_coords_num = 0; - bounding_coords_num = deserializer.read(); + uint64_t bounding_coords_num = deserializer.read(); - // Get bounding coordinates - // Note: This version supports only dimensions domains with the same type auto coord_size{array_schema_->domain().dimension_ptr(0)->coord_size()}; auto dim_num = array_schema_->domain().dim_num(); uint64_t bounding_coords_size = 2 * dim_num * coord_size; - bounding_coords_.resize(bounding_coords_num); - for (uint64_t i = 0; i < bounding_coords_num; ++i) { - bounding_coords_[i].resize(bounding_coords_size); - deserializer.read(&bounding_coords_[i][0], bounding_coords_size); - } + // Skip bounding coordinates. They are not actually being used. + deserializer.skip(bounding_coords_num * bounding_coords_size); } void FragmentMetadata::load_file_sizes(Deserializer& deserializer) { diff --git a/tiledb/sm/fragment/fragment_metadata.h b/tiledb/sm/fragment/fragment_metadata.h index b5ba41a8e32..931d6d0099f 100644 --- a/tiledb/sm/fragment/fragment_metadata.h +++ b/tiledb/sm/fragment/fragment_metadata.h @@ -853,9 +853,6 @@ class FragmentMetadata { */ std::unordered_map idx_map_; - /** A vector storing the first and last coordinates of each tile. */ - std::vector> bounding_coords_; - /** True if the fragment is dense, and false if it is sparse. */ bool dense_; diff --git a/tiledb/storage_format/serialization/serializers.h b/tiledb/storage_format/serialization/serializers.h index 95506e0645b..387abe764fa 100644 --- a/tiledb/storage_format/serialization/serializers.h +++ b/tiledb/storage_format/serialization/serializers.h @@ -184,6 +184,21 @@ class Deserializer { size_ -= size; } + /** + * Advances the deserializer's pointer by a specified number of bytes, without + * reading them. + * + * @param size number of bytes to skip. + */ + void skip(storage_size_t size) { + if (size > size_) { + throw std::logic_error("Reading data past end of serialized data size."); + } + + ptr_ += size; + size_ -= size; + } + /** * Return remaining number of bytes to deserialize. * From 2edb451d4a5f97f473062d49a22ef649c39cc82f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Du=C5=A1an=20Baran?= Date: Thu, 15 Aug 2024 11:41:19 +0200 Subject: [PATCH 2/2] Install pybind from pip. (#5238) This installs pybind11 from PIP so that the windows builds can find it. It is a workaround that will be properly fixed but for now this will unblock the 2.26 release and allow us to merge PRs. [sc-52966] --- TYPE: NO_HISTORY DESC: Use pybind11 from pip. --- .github/workflows/build-windows.yml | 2 ++ test/CMakeLists.txt | 6 +++--- 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/.github/workflows/build-windows.yml b/.github/workflows/build-windows.yml index 7b26ecee8c7..7ff184c78a1 100644 --- a/.github/workflows/build-windows.yml +++ b/.github/workflows/build-windows.yml @@ -136,6 +136,8 @@ jobs: uses: seanmiddleditch/gha-setup-ninja@v4 - name: Prevent vcpkg from building debug variants run: python $env:GITHUB_WORKSPACE/scripts/ci/patch_vcpkg_triplets.py + - name: Install dependencies from pip + run: python -m pip install pybind11[global] - name: Configure TileDB shell: pwsh diff --git a/test/CMakeLists.txt b/test/CMakeLists.txt index bf7c60f6b22..edc9b4b7be2 100644 --- a/test/CMakeLists.txt +++ b/test/CMakeLists.txt @@ -58,9 +58,9 @@ if (${TILEDB_ARROW_TESTS}) if (NOT ${pybind11_FOUND}) # Get the include arguments from the python executable (has "-I" compiler option) execute_process(COMMAND ${Python_EXECUTABLE} -m pybind11 --includes - OUTPUT_VARIABLE CMD_PYBIND11_INCLUDE - RESULT_VARIABLE CMD_PYBIND11_RESULT - OUTPUT_STRIP_TRAILING_WHITESPACE) + OUTPUT_VARIABLE CMD_PYBIND11_INCLUDE + RESULT_VARIABLE CMD_PYBIND11_RESULT + OUTPUT_STRIP_TRAILING_WHITESPACE) if (${CMD_PYBIND11_RESULT}) message(FATAL_ERROR "Unable to find pybind11 via cmake or 'python3 -m pybind11 --includes'") endif()