From b77a44790835e5207958f2ac09eb2cfff6398180 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jean-No=C3=ABl=20Grad?= Date: Fri, 4 Aug 2023 11:10:16 +0200 Subject: [PATCH 1/3] core: Refactor MPI code Factor out code duplication. Make remaining MpiCallbacks return void. --- src/core/communication.hpp | 1 + .../observables/CylindricalDensityProfile.hpp | 6 ++-- .../CylindricalFluxDensityProfile.hpp | 12 ++------ ...BFluxDensityProfileAtParticlePositions.cpp | 10 +++---- .../CylindricalLBVelocityProfile.cpp | 16 +++------- ...alLBVelocityProfileAtParticlePositions.cpp | 16 +++------- .../CylindricalVelocityProfile.hpp | 15 +++------- src/core/observables/DensityProfile.hpp | 8 ++--- src/core/observables/FluxDensityProfile.hpp | 14 ++------- src/core/observables/ForceDensityProfile.hpp | 12 ++------ src/core/observables/LBVelocityProfile.cpp | 18 ++++------- src/core/observables/PidObservable.hpp | 2 +- src/core/observables/utils_histogram.hpp | 30 +++++++++++++++++-- src/core/particle_node.cpp | 26 ++++++++-------- 14 files changed, 80 insertions(+), 106 deletions(-) diff --git a/src/core/communication.hpp b/src/core/communication.hpp index 2f7d149259b..9acdef0c561 100644 --- a/src/core/communication.hpp +++ b/src/core/communication.hpp @@ -47,6 +47,7 @@ #include "MpiCallbacks.hpp" #include +#include #include #include diff --git a/src/core/observables/CylindricalDensityProfile.hpp b/src/core/observables/CylindricalDensityProfile.hpp index 01e387e6ba6..4b0c18f7871 100644 --- a/src/core/observables/CylindricalDensityProfile.hpp +++ b/src/core/observables/CylindricalDensityProfile.hpp @@ -23,6 +23,7 @@ #include "BoxGeometry.hpp" #include "grid.hpp" +#include "utils_histogram.hpp" #include #include @@ -53,9 +54,8 @@ class CylindricalDensityProfile : public CylindricalPidProfileObservable { transform_params->orientation())); } - std::vector global_folded_positions{}; - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, - 0); + auto const global_folded_positions = + detail::gather(comm, local_folded_positions); if (comm.rank() != 0) { return {}; diff --git a/src/core/observables/CylindricalFluxDensityProfile.hpp b/src/core/observables/CylindricalFluxDensityProfile.hpp index 5796705a601..9e27a6c3394 100644 --- a/src/core/observables/CylindricalFluxDensityProfile.hpp +++ b/src/core/observables/CylindricalFluxDensityProfile.hpp @@ -60,21 +60,15 @@ class CylindricalFluxDensityProfile : public CylindricalPidProfileObservable { traits.velocity(p), transform_params->axis(), pos)); } - auto const world_size = comm.size(); - std::vector global_folded_positions{}; - std::vector global_velocities{}; - global_folded_positions.reserve(world_size); - global_velocities.reserve(world_size); - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, - 0); - boost::mpi::gather(comm, local_velocities, global_velocities, 0); + auto const [global_folded_positions, global_velocities] = + detail::gather(comm, local_folded_positions, local_velocities); if (comm.rank() != 0) { return {}; } Utils::CylindricalHistogram histogram(n_bins(), limits()); - accumulate(histogram, global_folded_positions, global_velocities); + detail::accumulate(histogram, global_folded_positions, global_velocities); histogram.normalize(); return histogram.get_histogram(); } diff --git a/src/core/observables/CylindricalLBFluxDensityProfileAtParticlePositions.cpp b/src/core/observables/CylindricalLBFluxDensityProfileAtParticlePositions.cpp index d881e82dcb9..a8360630999 100644 --- a/src/core/observables/CylindricalLBFluxDensityProfileAtParticlePositions.cpp +++ b/src/core/observables/CylindricalLBFluxDensityProfileAtParticlePositions.cpp @@ -61,17 +61,15 @@ CylindricalLBFluxDensityProfileAtParticlePositions::evaluate( local_flux_densities.emplace_back(flux_cyl); } - std::vector global_folded_positions{}; - std::vector global_flux_densities{}; - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, 0); - boost::mpi::gather(comm, local_flux_densities, global_flux_densities, 0); + auto const [global_folded_positions, global_flux_densities] = + detail::gather(comm, local_folded_positions, local_flux_densities); if (comm.rank() != 0) { return {}; } Utils::CylindricalHistogram histogram(n_bins(), limits()); - accumulate(histogram, global_folded_positions, global_flux_densities); - return normalize_by_bin_size(histogram); + detail::accumulate(histogram, global_folded_positions, global_flux_densities); + return detail::normalize_by_bin_size(histogram); } } // namespace Observables diff --git a/src/core/observables/CylindricalLBVelocityProfile.cpp b/src/core/observables/CylindricalLBVelocityProfile.cpp index 2f0ae68ce59..6a12d4285ef 100644 --- a/src/core/observables/CylindricalLBVelocityProfile.cpp +++ b/src/core/observables/CylindricalLBVelocityProfile.cpp @@ -25,9 +25,6 @@ #include #include -#include -#include - #include namespace Observables { @@ -55,21 +52,16 @@ std::vector CylindricalLBVelocityProfile::operator()( } } - auto const world_size = comm.size(); - std::vector global_positions{}; - std::vector global_velocities{}; - global_positions.reserve(world_size); - global_velocities.reserve(world_size); - boost::mpi::gather(comm, local_positions, global_positions, 0); - boost::mpi::gather(comm, local_velocities, global_velocities, 0); + auto const [global_positions, global_velocities] = + detail::gather(comm, local_positions, local_velocities); if (comm.rank() != 0) { return {}; } Utils::CylindricalHistogram histogram(n_bins(), limits()); - accumulate(histogram, global_positions, global_velocities); - return normalize_by_bin_size(histogram); + detail::accumulate(histogram, global_positions, global_velocities); + return detail::normalize_by_bin_size(histogram); } } // namespace Observables diff --git a/src/core/observables/CylindricalLBVelocityProfileAtParticlePositions.cpp b/src/core/observables/CylindricalLBVelocityProfileAtParticlePositions.cpp index a139561a164..f498b168f07 100644 --- a/src/core/observables/CylindricalLBVelocityProfileAtParticlePositions.cpp +++ b/src/core/observables/CylindricalLBVelocityProfileAtParticlePositions.cpp @@ -26,9 +26,6 @@ #include #include -#include -#include - #include #include @@ -59,21 +56,16 @@ std::vector CylindricalLBVelocityProfileAtParticlePositions::evaluate( local_velocities.emplace_back(vel_cyl); } - auto const world_size = comm.size(); - std::vector global_folded_positions{}; - std::vector global_velocities{}; - global_folded_positions.reserve(world_size); - global_velocities.reserve(world_size); - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, 0); - boost::mpi::gather(comm, local_velocities, global_velocities, 0); + auto const [global_folded_positions, global_velocities] = + detail::gather(comm, local_folded_positions, local_velocities); if (comm.rank() != 0) { return {}; } Utils::CylindricalHistogram histogram(n_bins(), limits()); - accumulate(histogram, global_folded_positions, global_velocities); - return normalize_by_bin_size(histogram); + detail::accumulate(histogram, global_folded_positions, global_velocities); + return detail::normalize_by_bin_size(histogram); } } // namespace Observables diff --git a/src/core/observables/CylindricalVelocityProfile.hpp b/src/core/observables/CylindricalVelocityProfile.hpp index ab54d4610d1..394df7cb034 100644 --- a/src/core/observables/CylindricalVelocityProfile.hpp +++ b/src/core/observables/CylindricalVelocityProfile.hpp @@ -28,7 +28,6 @@ #include #include -#include #include namespace Observables { @@ -59,22 +58,16 @@ class CylindricalVelocityProfile : public CylindricalPidProfileObservable { traits.velocity(p), transform_params->axis(), pos)); } - auto const world_size = comm.size(); - std::vector global_folded_positions{}; - std::vector global_velocities{}; - global_folded_positions.reserve(world_size); - global_velocities.reserve(world_size); - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, - 0); - boost::mpi::gather(comm, local_velocities, global_velocities, 0); + auto const [global_folded_positions, global_velocities] = + detail::gather(comm, local_folded_positions, local_velocities); if (comm.rank() != 0) { return {}; } Utils::CylindricalHistogram histogram(n_bins(), limits()); - accumulate(histogram, global_folded_positions, global_velocities); - return normalize_by_bin_size(histogram); + detail::accumulate(histogram, global_folded_positions, global_velocities); + return detail::normalize_by_bin_size(histogram); } std::vector shape() const override { diff --git a/src/core/observables/DensityProfile.hpp b/src/core/observables/DensityProfile.hpp index 325d38908c9..4ebad035dca 100644 --- a/src/core/observables/DensityProfile.hpp +++ b/src/core/observables/DensityProfile.hpp @@ -23,6 +23,7 @@ #include "Particle.hpp" #include "PidProfileObservable.hpp" #include "grid.hpp" +#include "utils_histogram.hpp" #include @@ -49,11 +50,8 @@ class DensityProfile : public PidProfileObservable { folded_position(traits.position(p), box_geo)); } - auto const world_size = comm.size(); - std::vector global_folded_positions{}; - global_folded_positions.reserve(world_size); - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, - 0); + auto const global_folded_positions = + detail::gather(comm, local_folded_positions); if (comm.rank() != 0) { return {}; diff --git a/src/core/observables/FluxDensityProfile.hpp b/src/core/observables/FluxDensityProfile.hpp index 1304ce263eb..1887c8d8c61 100644 --- a/src/core/observables/FluxDensityProfile.hpp +++ b/src/core/observables/FluxDensityProfile.hpp @@ -27,8 +27,6 @@ #include -#include - #include #include #include @@ -60,21 +58,15 @@ class FluxDensityProfile : public PidProfileObservable { local_velocities.emplace_back(traits.velocity(p)); } - auto const world_size = comm.size(); - std::vector global_folded_positions{}; - std::vector global_velocities{}; - global_folded_positions.reserve(world_size); - global_velocities.reserve(world_size); - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, - 0); - boost::mpi::gather(comm, local_velocities, global_velocities, 0); + auto const [global_folded_positions, global_velocities] = + detail::gather(comm, local_folded_positions, local_velocities); if (comm.rank() != 0) { return {}; } Utils::Histogram histogram(n_bins(), limits()); - accumulate(histogram, global_folded_positions, global_velocities); + detail::accumulate(histogram, global_folded_positions, global_velocities); histogram.normalize(); return histogram.get_histogram(); } diff --git a/src/core/observables/ForceDensityProfile.hpp b/src/core/observables/ForceDensityProfile.hpp index 3bdda403ca0..bd3ded0f03e 100644 --- a/src/core/observables/ForceDensityProfile.hpp +++ b/src/core/observables/ForceDensityProfile.hpp @@ -62,21 +62,15 @@ class ForceDensityProfile : public PidProfileObservable { local_forces.emplace_back(traits.force(p)); } - auto const world_size = comm.size(); - std::vector global_folded_positions{}; - std::vector global_forces{}; - global_folded_positions.reserve(world_size); - global_forces.reserve(world_size); - boost::mpi::gather(comm, local_folded_positions, global_folded_positions, - 0); - boost::mpi::gather(comm, local_forces, global_forces, 0); + auto const [global_folded_positions, global_forces] = + detail::gather(comm, local_folded_positions, local_forces); if (comm.rank() != 0) { return {}; } Utils::Histogram histogram(n_bins(), limits()); - accumulate(histogram, global_folded_positions, global_forces); + detail::accumulate(histogram, global_folded_positions, global_forces); histogram.normalize(); return histogram.get_histogram(); } diff --git a/src/core/observables/LBVelocityProfile.cpp b/src/core/observables/LBVelocityProfile.cpp index c15c6c63100..706d824afee 100644 --- a/src/core/observables/LBVelocityProfile.cpp +++ b/src/core/observables/LBVelocityProfile.cpp @@ -24,9 +24,6 @@ #include #include -#include -#include - #include #include @@ -48,23 +45,18 @@ LBVelocityProfile::operator()(boost::mpi::communicator const &comm) const { } } - auto const world_size = comm.size(); - std::vector global_positions{}; - std::vector global_velocities{}; - global_positions.reserve(world_size); - global_velocities.reserve(world_size); - boost::mpi::gather(comm, local_positions, global_positions, 0); - boost::mpi::gather(comm, local_velocities, global_velocities, 0); + auto const [global_positions, global_velocities] = + detail::gather(comm, local_positions, local_velocities); if (comm.rank() != 0) { return {}; } Utils::Histogram histogram(n_bins(), limits()); - accumulate(histogram, global_positions, global_velocities); + detail::accumulate(histogram, global_positions, global_velocities); try { - return normalize_by_bin_size(histogram, allow_empty_bins); - } catch (empty_bin_exception const &) { + return detail::normalize_by_bin_size(histogram, allow_empty_bins); + } catch (detail::empty_bin_exception const &) { throw std::runtime_error( "Decrease sampling delta(s), some bins have no hit"); } diff --git a/src/core/observables/PidObservable.hpp b/src/core/observables/PidObservable.hpp index ee2e0ba3f0f..1f61f9eb97c 100644 --- a/src/core/observables/PidObservable.hpp +++ b/src/core/observables/PidObservable.hpp @@ -31,9 +31,9 @@ #include #include - #include #include +#include #include #include diff --git a/src/core/observables/utils_histogram.hpp b/src/core/observables/utils_histogram.hpp index 7f4bbc003e6..fc0854a3904 100644 --- a/src/core/observables/utils_histogram.hpp +++ b/src/core/observables/utils_histogram.hpp @@ -21,10 +21,36 @@ #include +#include +#include +#include + #include +#include #include -namespace Observables { +namespace Observables::detail { + +/** @brief Gather data from all MPI ranks. */ +template +auto gather(boost::mpi::communicator const &comm, + std::vector const &local_pos) { + std::vector> global_pos{}; + boost::mpi::gather(comm, local_pos, global_pos, 0); + return global_pos; +} + +/** @brief Gather data from all MPI ranks. */ +template +auto gather(boost::mpi::communicator const &comm, + std::vector const &local_pos, + std::vector const &local_val) { + std::vector> global_pos{}; + boost::mpi::gather(comm, local_pos, global_pos, 0); + std::vector> global_val{}; + boost::mpi::gather(comm, local_val, global_val, 0); + return std::make_pair(global_pos, global_val); +} /** @brief Accumulate histogram data gathered from multiple MPI ranks. */ template @@ -58,4 +84,4 @@ auto normalize_by_bin_size(Utils::Histogram &histogram, return hist_data; } -} // Namespace Observables +} // Namespace Observables::detail diff --git a/src/core/particle_node.cpp b/src/core/particle_node.cpp index 8c8d46d37a6..ef66de66b84 100644 --- a/src/core/particle_node.cpp +++ b/src/core/particle_node.cpp @@ -36,6 +36,7 @@ #include #include +#include #include #include #include @@ -155,17 +156,18 @@ Utils::Cache particle_fetch_cache(max_cache_size); void invalidate_fetch_cache() { particle_fetch_cache.invalidate(); } std::size_t fetch_cache_max_size() { return particle_fetch_cache.max_size(); } -static boost::optional get_particle_data_local(int p_id) { - auto p = cell_structure.get_local_particle(p_id); - - if (p and (not p->is_ghost())) { - return *p; +static void mpi_send_particle_data_local(int p_id) { + auto const p = cell_structure.get_local_particle(p_id); + auto const found = p and not p->is_ghost(); + assert(1 == boost::mpi::all_reduce(::comm_cart, static_cast(found), + std::plus<>()) && + "Particle not found"); + if (found) { + ::comm_cart.send(0, 42, *p); } - - return {}; } -REGISTER_CALLBACK_ONE_RANK(get_particle_data_local) +REGISTER_CALLBACK(mpi_send_particle_data_local) const Particle &get_particle_data(int p_id) { auto const pnode = get_particle_node(p_id); @@ -183,10 +185,10 @@ const Particle &get_particle_data(int p_id) { /* Cache miss, fetch the particle, * put it into the cache and return a pointer into the cache. */ - auto const cache_ptr = particle_fetch_cache.put( - p_id, Communication::mpiCallbacks().call(Communication::Result::one_rank, - get_particle_data_local, p_id)); - return *cache_ptr; + Communication::mpiCallbacks().call_all(mpi_send_particle_data_local, p_id); + Particle result{}; + ::comm_cart.recv(boost::mpi::any_source, boost::mpi::any_tag, result); + return *(particle_fetch_cache.put(p_id, std::move(result))); } static void mpi_get_particles_local() { From 959ebd4e870b2de25783dd6caa43de101ebd9af2 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jean-No=C3=ABl=20Grad?= Date: Fri, 4 Aug 2023 11:17:15 +0200 Subject: [PATCH 2/3] core: Remove MpiCallbacks tag dispatch --- src/core/MpiCallbacks.hpp | 371 +--------------------- src/core/communication.hpp | 32 -- src/core/unit_tests/MpiCallbacks_test.cpp | 80 +---- 3 files changed, 16 insertions(+), 467 deletions(-) diff --git a/src/core/MpiCallbacks.hpp b/src/core/MpiCallbacks.hpp index 03f3a014b79..5ea39c0e553 100644 --- a/src/core/MpiCallbacks.hpp +++ b/src/core/MpiCallbacks.hpp @@ -31,28 +31,20 @@ * e.g. to broadcast global variables or run an algorithm in parallel. * * Callbacks are registered on the head node as function pointers via - * the @ref callback_macros "callback macros". The visitor pattern - * allows using arbitrary function signatures. For non-void returning - * callbacks, several return value policies are available: ignore return - * value, return only one value (this is achieved using a boost optional - * that is empty on all but one node), return the value of the head node, - * or return a reduced value (by specifying the reduction operation). + * the @ref REGISTER_CALLBACK. The visitor pattern allows using arbitrary + * function signatures. */ #include #include #include -#include #include -#include #include -#include +#include #include #include -#include -#include #include #include #include @@ -63,26 +55,6 @@ namespace Communication { class MpiCallbacks; -/** - * This namespace contains tag types - * to indicate what to do with the return - * values of callbacks. - */ -namespace Result { -/** %Ignore result */ -struct Ignore {}; -constexpr auto ignore = Ignore{}; -/** Return value from one rank */ -struct OneRank {}; -constexpr auto one_rank = OneRank{}; -/** Return value from the head node */ -struct MainRank {}; -constexpr auto main_rank = MainRank{}; -/** Reduce return value over all ranks */ -struct Reduction {}; -constexpr auto reduction = Reduction{}; -} // namespace Result - namespace detail { /** * @brief Check if a type can be used as a callback argument. @@ -153,8 +125,7 @@ struct callback_concept_t { * @brief Callback without a return value. * * This is an implementation of a callback for a specific callable - * @p F and a set of arguments to call it with, where the there - * is no return value. + * @p F and a set of arguments to call it with. */ template struct callback_void_t final : public callback_concept_t { @@ -171,112 +142,6 @@ struct callback_void_t final : public callback_concept_t { } }; -/** - * @brief Callback where the return value is ignored. - * - * This is an implementation of a callback for a specific callable - * @p F and a set of arguments to call it with, where the valued from - * all ranks are ignored. - */ -template -struct callback_ignore_t final : public callback_concept_t { - F m_f; - - callback_ignore_t(callback_ignore_t const &) = delete; - callback_ignore_t(callback_ignore_t &&) = delete; - - template - explicit callback_ignore_t(FRef &&f) : m_f(std::forward(f)) {} - void operator()(boost::mpi::communicator const &, - boost::mpi::packed_iarchive &ia) const override { - detail::invoke(m_f, ia); - } -}; - -/** - * @brief Callback with a return value from one rank. - * - * This is an implementation of a callback for a specific callable - * @p F and a set of arguments to call it with, where the value from - * one rank is returned. Only one node is allowed to return a value. - */ -template -struct callback_one_rank_t final : public callback_concept_t { - F m_f; - - callback_one_rank_t(callback_one_rank_t const &) = delete; - callback_one_rank_t(callback_one_rank_t &&) = delete; - - template - explicit callback_one_rank_t(FRef &&f) : m_f(std::forward(f)) {} - void operator()(boost::mpi::communicator const &comm, - boost::mpi::packed_iarchive &ia) const override { - auto const result = detail::invoke(m_f, ia); - - assert(1 == boost::mpi::all_reduce(comm, static_cast(!!result), - std::plus<>()) && - "Incorrect number of return values"); - - /* If this rank returned a result, send it to the head node. */ - if (!!result) { - comm.send(0, 42, *result); - } - } -}; - -/** - * @brief Callback with a return value from the head node. - * - * This is an implementation of a callback for a specific callable - * @p F and a set of arguments to call it with, where the value from - * the head node is returned. - */ -template -struct callback_main_rank_t final : public callback_concept_t { - F m_f; - - callback_main_rank_t(callback_main_rank_t const &) = delete; - callback_main_rank_t(callback_main_rank_t &&) = delete; - - template - explicit callback_main_rank_t(FRef &&f) : m_f(std::forward(f)) {} - void operator()(boost::mpi::communicator const &, - boost::mpi::packed_iarchive &ia) const override { - std::ignore = detail::invoke(m_f, ia); - } -}; - -/** - * @brief Callback with return value reduction. - * - * This is an implementation of a callback for a specific callable - * @p F and a set of arguments to call it with, where the return - * value is reduced over the communicator. - */ -template -struct callback_reduce_t final : public callback_concept_t { - Op m_op; - F m_f; - - template - explicit callback_reduce_t(OpRef &&op, FRef &&f) - : m_op(std::forward(op)), m_f(std::forward(f)) {} - - /** - * @brief Execute the callback. - * - * Receive parameters for this callback, and then call it. - * - * @param comm The communicator to receive the parameters on. - */ - void operator()(boost::mpi::communicator const &comm, - boost::mpi::packed_iarchive &ia) const override { - /* Call the callback function, and reduce over the results with - * the stored reduction operation. */ - boost::mpi::reduce(comm, detail::invoke(m_f, ia), m_op, 0); - } -}; - template struct FunctorTypes { using functor_type = F; using return_type = R; @@ -293,7 +158,7 @@ using functor_types = decltype(functor_types_impl(&std::remove_reference_t::operator())); template -auto make_model_impl(Result::Ignore, CRef &&c, FunctorTypes) { +auto make_model_impl(CRef &&c, FunctorTypes) { return std::make_unique>(std::forward(c)); } @@ -304,43 +169,15 @@ auto make_model_impl(Result::Ignore, CRef &&c, FunctorTypes) { * to exist and can not be overloaded. */ template auto make_model(F &&f) { - return make_model_impl(Result::Ignore{}, std::forward(f), - functor_types{}); + return make_model_impl(std::forward(f), functor_types{}); } /** * @brief Make a @ref callback_model_t for a function pointer. - * - * This instantiates an implementation of a callback for a function - * pointer. The main task here is to transfer the signature from - * the pointer to the callback_model_t by template argument type - * deduction. */ template auto make_model(void (*f_ptr)(Args...)) { return std::make_unique>(f_ptr); } - -template -auto make_model(Result::Reduction, R (*f_ptr)(Args...), Op &&op) { - return std::make_unique< - callback_reduce_t, R (*)(Args...), Args...>>( - std::forward(op), f_ptr); -} - -template -auto make_model(Result::Ignore, R (*f_ptr)(Args...)) { - return std::make_unique>(f_ptr); -} - -template -auto make_model(Result::OneRank, R (*f_ptr)(Args...)) { - return std::make_unique>(f_ptr); -} - -template -auto make_model(Result::MainRank, R (*f_ptr)(Args...)) { - return std::make_unique>(f_ptr); -} } // namespace detail /** @@ -484,25 +321,6 @@ class MpiCallbacks { detail::make_model(fp)); } - /** - * @brief Add a new callback with a return value. - * - * Add a new callback to the system. This is a collective - * function that must be run on all nodes. - * @p tag is one of the tag types from @ref Communication::Result, - * which indicates what to do with the return values. - * - * @param tag Tag type indicating return operation - * @param tag_args Argument for the return operation, if any. - * @param fp Pointer to the static callback function to add. - */ - template - static void add_static(Tag tag, R (*fp)(Args...), TagArgs &&...tag_args) { - static_callbacks().emplace_back( - reinterpret_cast(fp), - detail::make_model(tag, fp, std::forward(tag_args)...)); - } - private: /** * @brief Remove callback. @@ -566,8 +384,7 @@ class MpiCallbacks { */ template auto call(void (*fp)(Args...), ArgRef &&...args) const -> - /* Enable only if fp can be called with the provided arguments, - * e.g. if fp(args...) is well-formed. */ + /* enable only if fp can be called with the provided arguments */ std::enable_if_t> { const int id = m_func_ptr_to_id.at(reinterpret_cast(fp)); @@ -585,104 +402,13 @@ class MpiCallbacks { * @param args Arguments for the callback. */ template - void call_all(void (*fp)(Args...), ArgRef &&...args) const { + auto call_all(void (*fp)(Args...), ArgRef &&...args) const -> + /* enable only if fp can be called with the provided arguments */ + std::enable_if_t> { call(fp, args...); fp(args...); } - /** - * @brief Call a callback and reduce the result over all nodes. - * - * This calls a callback on all nodes, including the head node, - * and does a mpi reduction with the registered operation. - * - * This method can only be called on the head node. - */ - template - auto call(Result::Reduction, Op op, R (*fp)(Args...), Args... args) const - -> std::remove_reference_t(), - std::declval()))> { - const int id = m_func_ptr_to_id.at(reinterpret_cast(fp)); - - call(id, args...); - - std::remove_cv_t(), - std::declval()))>> - result{}; - boost::mpi::reduce(m_comm, fp(args...), result, op, 0); - - return result; - } - - /** - * @brief Call a callback and ignore the result over all nodes. - * - * This calls a callback on all nodes, including the head node, - * and ignore all return values. - * - * This method can only be called on the head node. - */ - template - auto call(Result::Ignore, R (*fp)(Args...), ArgRef... args) const - -> std::remove_reference_t { - - const int id = m_func_ptr_to_id.at(reinterpret_cast(fp)); - call(id, args...); - - fp(std::forward(args)...); - - return {}; - } - - /** - * @brief Call a callback and reduce the result over all nodes. - * - * This calls a callback on all nodes, including the head node, - * and returns the value from the node which returned an engaged - * optional. Only one node is allowed to return a value. - * - * This method can only be called on the head node. - */ - template - auto call(Result::OneRank, boost::optional (*fp)(Args...), - ArgRef... args) const -> std::remove_reference_t { - - const int id = m_func_ptr_to_id.at(reinterpret_cast(fp)); - call(id, args...); - - auto const local_result = fp(std::forward(args)...); - - assert(1 == boost::mpi::all_reduce(m_comm, static_cast(!!local_result), - std::plus<>()) && - "Incorrect number of return values"); - - if (!!local_result) { - return *local_result; - } - - std::remove_cv_t> result; - m_comm.recv(boost::mpi::any_source, boost::mpi::any_tag, result); - return result; - } - - /** - * @brief Call a callback and return the result of the head node. - * - * This calls a callback on all nodes, including the head node, - * and returns the value from the head node. - * - * This method can only be called on the head node. - */ - template - auto call(Result::MainRank, R (*fp)(Args...), ArgRef... args) const - -> std::remove_reference_t { - - const int id = m_func_ptr_to_id.at(reinterpret_cast(fp)); - call(id, args...); - - return fp(std::forward(args)...); - } - /** * @brief Start the MPI loop. * @@ -771,20 +497,9 @@ class RegisterCallback { template explicit RegisterCallback(void (*cb)(Args...)) { MpiCallbacks::add_static(cb); } - - template - explicit RegisterCallback(Tag tag, R (*cb)(Args...), TagArgs &&...tag_args) { - MpiCallbacks::add_static(tag, cb, std::forward(tag_args)...); - } }; } /* namespace Communication */ -/** - * @name Callback macros - * @anchor callback_macros - */ -/**@{*/ - /** * @brief Register a static callback without return value. * @@ -798,70 +513,4 @@ class RegisterCallback { static ::Communication::RegisterCallback register_##cb(&(cb)); \ } -/** - * @brief Register a static callback whose return value is reduced. - * - * This registers a function as an mpi callback with - * reduction of the return values from the nodes. - * The macro should be used at global scope. - * - * @param cb A function - * @param op Reduction operation - */ -#define REGISTER_CALLBACK_REDUCTION(cb, op) \ - namespace Communication { \ - static ::Communication::RegisterCallback \ - register_reduction_##cb(::Communication::Result::Reduction{}, &(cb), \ - (op)); \ - } - -/** - * @brief Register a static callback whose return value is to be ignored. - * - * This registers a function as an mpi callback with - * ignored return values. - * The macro should be used at global scope. - * - * @param cb A function - */ -#define REGISTER_CALLBACK_IGNORE(cb) \ - namespace Communication { \ - static ::Communication::RegisterCallback \ - register_ignore_##cb(::Communication::Result::Ignore{}, &(cb)); \ - } - -/** - * @brief Register a static callback which returns a value on only one node. - * - * This registers a function as an mpi callback with - * reduction of the return values from one node - * where the value of the optional is set. - * The macro should be used at global scope. - * - * @param cb A function - */ -#define REGISTER_CALLBACK_ONE_RANK(cb) \ - namespace Communication { \ - static ::Communication::RegisterCallback \ - register_one_rank_##cb(::Communication::Result::OneRank{}, &(cb)); \ - } - -/** - * @brief Register a static callback whose return value is ignored except on - * the head node. - * - * This registers a function as an mpi callback with - * reduction of the return values from the head node. - * The macro should be used at global scope. - * - * @param cb A function - */ -#define REGISTER_CALLBACK_MAIN_RANK(cb) \ - namespace Communication { \ - static ::Communication::RegisterCallback \ - register_main_rank_##cb(::Communication::Result::MainRank{}, &(cb)); \ - } - -/**@}*/ - #endif diff --git a/src/core/communication.hpp b/src/core/communication.hpp index 9acdef0c561..a7dbcf42800 100644 --- a/src/core/communication.hpp +++ b/src/core/communication.hpp @@ -98,38 +98,6 @@ void mpi_call_all(void (*fp)(Args...), ArgRef &&...args) { Communication::mpiCallbacks().call_all(fp, std::forward(args)...); } -/** @brief Call a local function. - * @tparam Tag Any tag type defined in @ref Communication::Result - * @tparam R Return type of the local function - * @tparam Args Local function argument types - * @tparam ArgRef Local function argument types - * @param tag Reduction strategy - * @param fp Local function - * @param args Local function arguments - */ -template -auto mpi_call(Tag tag, R (*fp)(Args...), ArgRef &&...args) { - return Communication::mpiCallbacks().call(tag, fp, - std::forward(args)...); -} - -/** @brief Call a local function. - * @tparam Tag Any tag type defined in @ref Communication::Result - * @tparam TagArg Types of arguments to @p Tag - * @tparam R Return type of the local function - * @tparam Args Local function argument types - * @tparam ArgRef Local function argument types - * @param tag Reduction strategy - * @param tag_arg Arguments to the reduction strategy - * @param fp Local function - * @param args Local function arguments - */ -template -auto mpi_call(Tag tag, TagArg &&tag_arg, R (*fp)(Args...), ArgRef &&...args) { - return Communication::mpiCallbacks().call(tag, std::forward(tag_arg), - fp, std::forward(args)...); -} - /** Process requests from head node. Worker nodes main loop. */ void mpi_loop(); diff --git a/src/core/unit_tests/MpiCallbacks_test.cpp b/src/core/unit_tests/MpiCallbacks_test.cpp index 3afbe3f2a63..27884057ebf 100644 --- a/src/core/unit_tests/MpiCallbacks_test.cpp +++ b/src/core/unit_tests/MpiCallbacks_test.cpp @@ -175,38 +175,20 @@ BOOST_AUTO_TEST_CASE(CallbackHandle) { } } -BOOST_AUTO_TEST_CASE(reduce_callback) { - auto cb = []() -> int { return boost::mpi::communicator().rank(); }; - Communication::MpiCallbacks::add_static(Communication::Result::Reduction{}, - static_cast(cb), - std::plus()); - - boost::mpi::communicator world; - Communication::MpiCallbacks cbs(world); - - if (0 == world.rank()) { - auto const ret = cbs.call(Communication::Result::reduction, - std::plus(), static_cast(cb)); - auto const n = world.size(); - BOOST_CHECK_EQUAL(ret, (n * (n - 1)) / 2); - } else { - cbs.loop(); - } -} - -BOOST_AUTO_TEST_CASE(ignore_callback) { +BOOST_AUTO_TEST_CASE(call) { called = false; - auto cb = []() -> int { return called = true, -1; }; + auto cb = []() { called = true; }; - auto const fp = static_cast(cb); + auto const fp = static_cast(cb); - Communication::MpiCallbacks::add_static(Communication::Result::ignore, fp); + Communication::MpiCallbacks::add_static(fp); boost::mpi::communicator world; Communication::MpiCallbacks cbs(world); if (0 == world.rank()) { - cbs.call(Communication::Result::ignore, fp); + cbs.call(fp); + fp(); } else { cbs.loop(); } @@ -214,56 +196,6 @@ BOOST_AUTO_TEST_CASE(ignore_callback) { BOOST_CHECK(called); } -BOOST_AUTO_TEST_CASE(one_rank_callback) { - auto cb = []() -> boost::optional { - boost::mpi::communicator world; - if (world.rank() == (world.size() - 1)) { - return world.rank(); - } - - return {}; - }; - - auto const fp = static_cast (*)()>(cb); - - Communication::MpiCallbacks::add_static(Communication::Result::one_rank, fp); - - boost::mpi::communicator world; - Communication::MpiCallbacks cbs(world); - - if (0 == world.rank()) { - BOOST_CHECK_EQUAL(cbs.call(Communication::Result::one_rank, fp), - world.size() - 1); - } else { - cbs.loop(); - } -} - -BOOST_AUTO_TEST_CASE(main_rank_callback) { - auto cb = []() -> int { - boost::mpi::communicator world; - if (world.rank() == 0) { - return world.size(); - } - - return -1; - }; - - auto const fp = static_cast(cb); - - Communication::MpiCallbacks::add_static(Communication::Result::main_rank, fp); - - boost::mpi::communicator world; - Communication::MpiCallbacks cbs(world); - - if (0 == world.rank()) { - BOOST_CHECK_EQUAL(cbs.call(Communication::Result::main_rank, fp), - world.size()); - } else { - cbs.loop(); - } -} - BOOST_AUTO_TEST_CASE(call_all) { called = false; auto cb = []() { called = true; }; From 50af4b1e320d0f71b0ca2f15eeca1eb67d0a2985 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jean-No=C3=ABl=20Grad?= Date: Mon, 7 Aug 2023 12:15:14 +0200 Subject: [PATCH 3/3] core: Reserve vector capacity before MPI gather Co-authored-by: Alexander Reinauer <38552369+reinaual@users.noreply.github.com> --- src/core/observables/utils_histogram.hpp | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/core/observables/utils_histogram.hpp b/src/core/observables/utils_histogram.hpp index fc0854a3904..591423e2c3e 100644 --- a/src/core/observables/utils_histogram.hpp +++ b/src/core/observables/utils_histogram.hpp @@ -36,6 +36,7 @@ template auto gather(boost::mpi::communicator const &comm, std::vector const &local_pos) { std::vector> global_pos{}; + global_pos.reserve(comm.size()); boost::mpi::gather(comm, local_pos, global_pos, 0); return global_pos; } @@ -45,9 +46,12 @@ template auto gather(boost::mpi::communicator const &comm, std::vector const &local_pos, std::vector const &local_val) { + auto const world_size = comm.size(); std::vector> global_pos{}; + global_pos.reserve(world_size); boost::mpi::gather(comm, local_pos, global_pos, 0); std::vector> global_val{}; + global_val.reserve(world_size); boost::mpi::gather(comm, local_val, global_val, 0); return std::make_pair(global_pos, global_val); }