From 189349ee550cc23b987aa74534ba9f98a03ad563 Mon Sep 17 00:00:00 2001 From: Alan Liddell Date: Thu, 19 Oct 2023 15:29:39 -0400 Subject: [PATCH] Fixes --- src/CMakeLists.txt | 2 - src/writers/shard.writer.cpp | 292 ----------------------------------- src/writers/shard.writer.hh | 63 -------- tests/get-meta.cpp | 7 +- 4 files changed, 2 insertions(+), 362 deletions(-) delete mode 100644 src/writers/shard.writer.cpp delete mode 100644 src/writers/shard.writer.hh diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt index 3f6aa175..5ac73553 100644 --- a/src/CMakeLists.txt +++ b/src/CMakeLists.txt @@ -13,8 +13,6 @@ add_library(${tgt} MODULE writers/writer.cpp writers/chunk.writer.hh writers/chunk.writer.cpp - writers/shard.writer.hh - writers/shard.writer.cpp writers/blosc.compressor.hh writers/blosc.compressor.cpp zarr.hh diff --git a/src/writers/shard.writer.cpp b/src/writers/shard.writer.cpp deleted file mode 100644 index 9449fa0c..00000000 --- a/src/writers/shard.writer.cpp +++ /dev/null @@ -1,292 +0,0 @@ -#include "shard.writer.hh" -#include "../zarr.hh" - -#include -#include - -namespace zarr = acquire::sink::zarr; - -zarr::ShardWriter::ShardWriter(const ImageDims& frame_dims, - const ImageDims& shard_dims, - const ImageDims& tile_dims, - uint32_t frames_per_chunk, - const std::string& data_root, - Zarr* zarr) - : Writer(frame_dims, tile_dims, frames_per_chunk, data_root, zarr) - , shard_dims_{ shard_dims } -{ - shards_per_frame_x_ = - std::ceil((float)frame_dims.cols / (float)shard_dims.cols); - shards_per_frame_y_ = - std::ceil((float)frame_dims.rows / (float)shard_dims.rows); -} - -zarr::ShardWriter::ShardWriter(const ImageDims& frame_dims, - const ImageDims& shard_dims, - const ImageDims& tile_dims, - uint32_t frames_per_chunk, - const std::string& data_root, - Zarr* zarr, - const BloscCompressionParams& compression_params) - : Writer(frame_dims, - tile_dims, - frames_per_chunk, - data_root, - zarr, - compression_params) - , shard_dims_{ shard_dims } -{ - shards_per_frame_x_ = - std::ceil((float)frame_dims.cols / (float)shard_dims.cols); - shards_per_frame_y_ = - std::ceil((float)frame_dims.rows / (float)shard_dims.rows); -} - -bool -zarr::ShardWriter::write(const VideoFrame* frame) noexcept -{ - using namespace std::chrono_literals; - - if (!validate_frame_(frame)) { - // log is written in validate_frame - return false; - } - - try { - if (chunk_buffers_.empty()) { - make_buffers_(); - } - - bytes_to_flush_ += - write_bytes_(frame->data, frame->bytes_of_frame - sizeof(*frame)); - - ++frames_written_; - - // rollover if necessary - const auto frames_this_chunk = frames_written_ % frames_per_chunk_; - if (frames_written_ > 0 && frames_this_chunk == 0) { - flush_(); - rollover_(); - } - - return true; - } catch (const std::exception& exc) { - LOGE("Failed to write frame: %s", exc.what()); - } catch (...) { - LOGE("Failed to write frame (unknown)"); - } - - return false; -} - -uint16_t -zarr::ShardWriter::chunks_per_shard_() const -{ - const uint16_t chunks_per_shard_x = shard_dims_.cols / tile_dims_.cols; - const uint16_t chunks_per_shard_y = shard_dims_.rows / tile_dims_.rows; - return chunks_per_shard_x * chunks_per_shard_y; -} - -uint16_t -zarr::ShardWriter::shards_per_frame_() const -{ - return shards_per_frame_x_ * shards_per_frame_y_; -} - -void -zarr::ShardWriter::make_buffers_() noexcept -{ - const auto nchunks = tiles_per_frame_(); - chunk_buffers_.resize(nchunks); - buffers_ready_ = new bool[nchunks]; - std::fill(buffers_ready_, buffers_ready_ + nchunks, true); - - const auto bytes_of_type = common::bytes_of_type(pixel_type_); - const auto bytes_per_tile = - tile_dims_.cols * tile_dims_.rows * bytes_of_type; - const auto bytes_per_chunk = bytes_per_tile * frames_per_chunk_; - - for (auto& buf : chunk_buffers_) { - buf.resize(frames_per_chunk_ * bytes_per_tile); - std::fill(buf.begin(), buf.end(), 0); - } - - const auto nshards = shards_per_frame_(); - shard_buffers_.resize(nshards); - - for (auto& buf : shard_buffers_) { - buf.resize(chunks_per_shard_() * bytes_per_chunk // data - + 2 * chunks_per_shard_() * sizeof(uint64_t) // indices - ); - } -} - -size_t -zarr::ShardWriter::write_bytes_(const uint8_t* buf, size_t buf_size) noexcept -{ - const auto bytes_of_type = common::bytes_of_type(pixel_type_); - const auto bytes_per_tile = - tile_dims_.cols * tile_dims_.rows * bytes_of_type; - const auto frames_this_chunk = frames_written_ % frames_per_chunk_; - - size_t bytes_written = 0; - - for (auto i = 0; i < tiles_per_frame_y_; ++i) { - for (auto j = 0; j < tiles_per_frame_x_; ++j) { - size_t offset = bytes_per_tile * frames_this_chunk; - - uint8_t* bytes_out = - chunk_buffers_.at(i * tiles_per_frame_x_ + j).data(); - for (auto k = 0; k < tile_dims_.rows; ++k) { - const auto frame_row = i * tile_dims_.rows + k; - if (frame_row < frame_dims_.rows) { - const auto frame_col = j * tile_dims_.cols; - - const auto buf_offset = - bytes_of_type * - (frame_row * frame_dims_.cols + frame_col); - - const auto region_width = - std::min(frame_col + tile_dims_.cols, frame_dims_.cols) - - frame_col; - - const auto nbytes = region_width * bytes_of_type; - memcpy(bytes_out + offset, buf + buf_offset, nbytes); - } - offset += tile_dims_.cols * bytes_of_type; - } - bytes_written += bytes_per_tile; - } - } - - return bytes_written; -} - -void -zarr::ShardWriter::flush_() noexcept -{ - if (bytes_to_flush_ == 0) { - return; - } - - using namespace std::chrono_literals; - const auto bytes_of_type = common::bytes_of_type(pixel_type_); - const auto bytes_per_tile = - tile_dims_.cols * tile_dims_.rows * bytes_of_type; - if (bytes_to_flush_ % bytes_per_tile != 0) { - LOGE("Expected bytes to flush to be a multiple of the " - "number of bytes per tile."); - } - const auto chunks_per_shard = chunks_per_shard_(); - - // create shard files if necessary - if (files_.empty() && !make_files_()) { - zarr_->set_error("Failed to flush."); - return; - } - - // compress buffers - auto chunk_sizes = compress_buffers_(); - const size_t index_size = 2 * chunks_per_shard * sizeof(uint64_t); - - // concatenate chunks into shards - std::vector shard_sizes; - for (auto i = 0; i < shard_buffers_.size(); ++i) { - auto& shard = shard_buffers_.at(i); - size_t shard_size = 0; - std::vector chunk_indices; - - for (auto j = 0; j < chunks_per_shard; ++j) { - chunk_indices.push_back(shard_size); // chunk index - const auto k = i * chunks_per_shard + j; - shard_size += chunk_sizes.at(k); - chunk_indices.push_back(chunk_sizes.at(k)); // chunk extent - } - - // if we're very unlucky we can technically run into this - if (shard.size() < shard_size + index_size) { - shard.resize(shard_size + index_size); - } - - size_t offset = 0; - for (auto j = 0; j < chunks_per_shard; ++j) { - const auto k = i * chunks_per_shard + j; - const auto& chunk = chunk_buffers_.at(k); - memcpy(shard.data() + offset, chunk.data(), chunk_sizes.at(k)); - offset += chunk_sizes.at(k); - } - memcpy(shard.data() + offset, - chunk_indices.data(), - chunk_indices.size() * 8); - offset += chunk_indices.size() * 8; - shard_sizes.push_back(offset); - } - - // write out - std::fill(buffers_ready_, buffers_ready_ + shard_buffers_.size(), false); - { - std::scoped_lock lock(mutex_); - for (auto i = 0; i < files_.size(); ++i) { - const auto& shard = shard_buffers_.at(i); - zarr_->push_to_job_queue(std::move( - [fh = &files_.at(i), - shard = shard.data(), - size = shard_sizes.at(i), - finished = buffers_ready_ + i](std::string& err) -> bool { - bool success = false; - try { - success = file_write(fh, 0, shard, shard + size); - } catch (const std::exception& exc) { - char buf[128]; - snprintf(buf, - sizeof(buf), - "Failed to write shard: %s", - exc.what()); - err = buf; - } catch (...) { - err = "Failed to write shard (unknown)"; - } - *finished = true; - - return success; - })); - } - } - - // wait for all threads to finish - while (!std::all_of(buffers_ready_, - buffers_ready_ + shard_buffers_.size(), - [](const auto& b) { return b; })) { - std::this_thread::sleep_for(500us); - } - - // reset buffers - const auto bytes_per_chunk = - tile_dims_.cols * tile_dims_.rows * bytes_of_type * frames_per_chunk_; - for (auto& buf : chunk_buffers_) { - // absurd edge case we need to account for - if (buf.size() > bytes_per_chunk) { - buf.resize(bytes_per_chunk); - } - - std::fill(buf.begin(), buf.end(), 0); - } - const auto bytes_per_shard = bytes_per_chunk * chunks_per_shard; - for (auto& buf : shard_buffers_) { - // absurd edge case we need to account for - if (buf.size() > bytes_per_shard + index_size) { - buf.resize(bytes_per_shard + index_size); - } - - std::fill(buf.begin(), buf.end(), 0); - } - bytes_to_flush_ = 0; -} - -bool -zarr::ShardWriter::make_files_() noexcept -{ - file_creator_.set_base_dir(data_root_ / ("c" + std::to_string(current_chunk_))); - return file_creator_.create( - 1, shards_per_frame_y_, shards_per_frame_x_, files_); -} diff --git a/src/writers/shard.writer.hh b/src/writers/shard.writer.hh deleted file mode 100644 index 0d05edb3..00000000 --- a/src/writers/shard.writer.hh +++ /dev/null @@ -1,63 +0,0 @@ -#ifndef H_ACQUIRE_ZARR_SHARD_WRITER_V0 -#define H_ACQUIRE_ZARR_SHARD_WRITER_V0 - -#ifndef __cplusplus -#error "This header requires C++20" -#endif - -#include "writer.hh" - -#include "platform.h" -#include "device/props/components.h" - -#include -#include -#include -#include -#include -#include - -namespace fs = std::filesystem; - -namespace acquire::sink::zarr { -struct ShardWriter final : public Writer -{ - public: - ShardWriter() = delete; - ShardWriter(const ImageDims& frame_dims, - const ImageDims& shard_dims, - const ImageDims& tile_dims, - uint32_t frames_per_chunk, - const std::string& data_root, - Zarr* zarr); - - /// Constructor with Blosc compression params - ShardWriter(const ImageDims& frame_dims, - const ImageDims& shard_dims, - const ImageDims& tile_dims, - uint32_t frames_per_chunk, - const std::string& data_root, - Zarr* zarr, - const BloscCompressionParams& compression_params); - ~ShardWriter() override = default; - - [[nodiscard]] bool write(const VideoFrame* frame) noexcept override; - - private: - ImageDims shard_dims_; - uint16_t shards_per_frame_x_; - uint16_t shards_per_frame_y_; - - std::vector> shard_buffers_; - - uint16_t chunks_per_shard_() const; - uint16_t shards_per_frame_() const; - - void make_buffers_() noexcept override; - size_t write_bytes_(const uint8_t* buf, size_t buf_size) noexcept override; - void flush_() noexcept override; - [[nodiscard]] bool make_files_() noexcept override; -}; -} // namespace acquire::sink::zarr - -#endif // H_ACQUIRE_ZARR_SHARD_WRITER_V0 diff --git a/tests/get-meta.cpp b/tests/get-meta.cpp index e12f88fe..9ed0d09e 100644 --- a/tests/get-meta.cpp +++ b/tests/get-meta.cpp @@ -86,9 +86,7 @@ main() CHECK(Device_Ok == storage_get_meta(storage, &metadata)); CHECK(metadata.chunking.supported); - ASSERT_EQ(int, - "%d", - PropertyType_FixedPrecision, + ASSERT_EQ(int, "%d", PropertyType_FixedPrecision, (int)metadata.chunking.max_bytes_per_chunk.type); // minimum cap on chunk size is 16 MiB ASSERT_EQ(int, @@ -101,8 +99,7 @@ main() 1 << 30, (int)metadata.chunking.max_bytes_per_chunk.high); - CHECK((bool)metadata.multiscale.supported != - name.starts_with("ZarrV3")); + CHECK(metadata.multiscale.supported); CHECK(Device_Ok == driver_close_device(device)); }