From b1d9d973b316207fb3173541df19631e9f4d7a8c Mon Sep 17 00:00:00 2001 From: Lawrence Kidder Date: Fri, 15 Mar 2024 15:07:44 -0400 Subject: [PATCH] Add ability to monitor size of DataBox items - Adds a function to observe the size in bytes of all non-reference items in a DataBox - Adds an observer to gather the sizes in MB of each item (summed over all elements) for the DataBoxes of each component --- src/DataStructures/DataBox/DataBox.hpp | 33 ++++ src/ParallelAlgorithms/Events/CMakeLists.txt | 2 + .../Events/ObserveDataBox.cpp | 14 ++ .../Events/ObserveDataBox.hpp | 166 ++++++++++++++++++ .../DataStructures/DataBox/Test_DataBox.cpp | 36 ++++ 5 files changed, 251 insertions(+) create mode 100644 src/ParallelAlgorithms/Events/ObserveDataBox.cpp create mode 100644 src/ParallelAlgorithms/Events/ObserveDataBox.hpp diff --git a/src/DataStructures/DataBox/DataBox.hpp b/src/DataStructures/DataBox/DataBox.hpp index 92d8ad02de0d..f59d42eba3c0 100644 --- a/src/DataStructures/DataBox/DataBox.hpp +++ b/src/DataStructures/DataBox/DataBox.hpp @@ -10,11 +10,13 @@ #include #include #include +#include #include #include #include #include #include +#include #include #include "DataStructures/DataBox/Access.hpp" @@ -321,6 +323,9 @@ class DataBox> : public Access, template std::string print_items() const; + /// The size in bytes of each item (excluding reference items) + std::map size_of_items() const; + /// Retrieve the tag `Tag`, should be called by the free function db::get template const auto& get() const; @@ -546,6 +551,34 @@ std::string DataBox>::print_items() const { return os.str(); } +template +std::map DataBox>::size_of_items() + const { + std::map result{}; + const auto add_item_size = [this, &result](auto tag_v) { + (void)this; + using tag = tmpl::type_from; + if constexpr (not db::is_reference_tag_v) { + // For item of ItemType::Compute, this will not evaluate its function + // (i.e. if the item has never been evaluated its size will be that of a + // default initialized object) + const auto& item = get_item().get(); + if constexpr (tt::is_a_v) { + if (item == nullptr) { + result[pretty_type::get_name()] = 0; + } else { + result[pretty_type::get_name()] = size_of_object_in_bytes(*item); + } + } else { + result[pretty_type::get_name()] = size_of_object_in_bytes(item); + } + } + }; + tmpl::for_each(add_item_size); + tmpl::for_each(add_item_size); + return result; +} + namespace detail { // This function exists so that the user can look at the template // arguments to find out what triggered the static_assert. diff --git a/src/ParallelAlgorithms/Events/CMakeLists.txt b/src/ParallelAlgorithms/Events/CMakeLists.txt index e3db9dd41dc5..b8fdb56af48d 100644 --- a/src/ParallelAlgorithms/Events/CMakeLists.txt +++ b/src/ParallelAlgorithms/Events/CMakeLists.txt @@ -9,6 +9,7 @@ spectre_target_sources( ${LIBRARY} PRIVATE ObserveAdaptiveSteppingDiagnostics.cpp + ObserveDataBox.cpp ObserveNorms.cpp ) @@ -20,6 +21,7 @@ spectre_target_headers( Factory.hpp MonitorMemory.hpp ObserveAdaptiveSteppingDiagnostics.hpp + ObserveDataBox.hpp ObserveAtExtremum.hpp ObserveFields.hpp ObserveNorms.hpp diff --git a/src/ParallelAlgorithms/Events/ObserveDataBox.cpp b/src/ParallelAlgorithms/Events/ObserveDataBox.cpp new file mode 100644 index 000000000000..52fe0ff2b65a --- /dev/null +++ b/src/ParallelAlgorithms/Events/ObserveDataBox.cpp @@ -0,0 +1,14 @@ +// Distributed under the MIT License. +// See LICENSE.txt for details. + +#include "ParallelAlgorithms/Events/ObserveDataBox.hpp" + +#include + +namespace Events { +ObserveDataBox::ObserveDataBox(CkMigrateMessage* /*m*/) {} + +void ObserveDataBox::pup(PUP::er& p) { Event::pup(p); } + +PUP::able::PUP_ID ObserveDataBox::my_PUP_ID = 0; // NOLINT +} // namespace Events diff --git a/src/ParallelAlgorithms/Events/ObserveDataBox.hpp b/src/ParallelAlgorithms/Events/ObserveDataBox.hpp new file mode 100644 index 000000000000..601396dd07d0 --- /dev/null +++ b/src/ParallelAlgorithms/Events/ObserveDataBox.hpp @@ -0,0 +1,166 @@ +// Distributed under the MIT License. +// See LICENSE.txt for details. + +#pragma once + +#include +#include +#include +#include + +#include "DataStructures/DataBox/DataBox.hpp" +#include "Domain/Structure/ElementId.hpp" +#include "IO/Observer/ObserverComponent.hpp" +#include "IO/Observer/ReductionActions.hpp" +#include "Options/String.hpp" +#include "Parallel/DistributedObject.hpp" +#include "Parallel/GlobalCache.hpp" +#include "Parallel/Invoke.hpp" +#include "Parallel/Reduction.hpp" +#include "ParallelAlgorithms/EventsAndTriggers/Event.hpp" +#include "Utilities/PrettyType.hpp" +#include "Utilities/TMPL.hpp" + +namespace Events { + +namespace detail { + +struct map_add { + std::map operator()( + std::map map_1, + const std::map& map_2) { + for (const auto& [key, value] : map_2) { + map_1.at(key) += value; + } + return map_1; + } +}; + +using ReductionType = Parallel::ReductionData< + // Time + Parallel::ReductionDatum>, + // Map of total mem usage in MB per item in DataBoxes + Parallel::ReductionDatum, map_add>>; + +template +struct ReduceDataBoxSize { + template + static void apply(db::DataBox& /*box*/, + Parallel::GlobalCache& cache, + const ArrayIndex& /*array_index*/, const double time, + const std::map& item_sizes) { + auto& observer_writer_proxy = Parallel::get_parallel_component< + observers::ObserverWriter>(cache); + const std::string subfile_name = + "/DataBoxSizeInMb/" + pretty_type::name(); + std::vector legend; + legend.reserve(item_sizes.size() + 1); + legend.emplace_back("Time"); + std::vector columns; + columns.reserve(item_sizes.size() + 1); + columns.emplace_back(time); + const double scaling = 1.0 / 1048576.0; // so size is in MB + for (const auto& [name, size] : item_sizes) { + legend.emplace_back(name); + columns.emplace_back(scaling * static_cast(size)); + } + Parallel::threaded_action< + observers::ThreadedActions::WriteReductionDataRow>( + // Node 0 is always the writer + observer_writer_proxy[0], subfile_name, legend, + std::make_tuple(columns)); + } +}; + +struct ContributeDataBoxSize { + template + static void apply(db::DataBox& box, + Parallel::GlobalCache& cache, + const ArrayIndex& array_index, const double time) { + const auto& my_proxy = + Parallel::get_parallel_component(cache)[array_index]; + auto& target_proxy = Parallel::get_parallel_component< + observers::ObserverWriter>(cache); + const auto item_sizes = box.size_of_items(); + if constexpr (Parallel::is_singleton_v) { + Parallel::simple_action>( + target_proxy[0], time, item_sizes); + } else { + Parallel::contribute_to_reduction>( + ReductionType{time, item_sizes}, my_proxy, target_proxy[0]); + } + } +}; +} // namespace detail + +/// \brief Event that will collect the size in MBs used by each DataBox item on +/// each parallel component. +/// +/// \details The data will be written to disk in the reductions file under the +/// `/DataBoxSizeInMb/` group. The name of each file is the `pretty_type::name` +/// of each parallel component. There will be a column for each item in the +/// DataBox that is not a subitem or reference item. +class ObserveDataBox : public Event { + public: + /// \cond + explicit ObserveDataBox(CkMigrateMessage* m); + using PUP::able::register_constructor; + WRAPPED_PUPable_decl_template(ObserveDataBox); // NOLINT + /// \endcond + + using options = tmpl::list<>; + static constexpr Options::String help = { + "Observe size (in MB) of each item (except reference items) in each " + "DataBox"}; + + ObserveDataBox() = default; + + using compute_tags_for_observation_box = tmpl::list<>; + + using return_tags = tmpl::list<>; + using argument_tags = tmpl::list<::Tags::DataBox>; + + template + void operator()(const DataBoxType& box, + Parallel::GlobalCache& /*cache*/, + const ArrayIndex& array_index, + const ParallelComponent* /*meta*/, + const ObservationValue& observation_value) const; + + using is_ready_argument_tags = tmpl::list<>; + + template + bool is_ready(Parallel::GlobalCache& /*cache*/, + const ArrayIndex& /*array_index*/, + const Component* const /*meta*/) const { + return true; + } + + bool needs_evolved_variables() const override { return false; } + + // NOLINTNEXTLINE(google-runtime-references) + void pup(PUP::er& p) override; +}; + +template +void ObserveDataBox::operator()( + const DataBoxType& /*box*/, Parallel::GlobalCache& cache, + const ArrayIndex& array_index, const ParallelComponent* const /*meta*/, + const ObservationValue& observation_value) const { + if (is_zeroth_element(array_index)) { + using component_list = + tmpl::push_back; + tmpl::for_each([&observation_value, + &cache](auto component_v) { + using component = tmpl::type_from; + auto& target_proxy = Parallel::get_parallel_component(cache); + Parallel::simple_action( + target_proxy, observation_value.value); + }); + } +} +} // namespace Events diff --git a/tests/Unit/DataStructures/DataBox/Test_DataBox.cpp b/tests/Unit/DataStructures/DataBox/Test_DataBox.cpp index 1e4676be673c..baf7a5a54d25 100644 --- a/tests/Unit/DataStructures/DataBox/Test_DataBox.cpp +++ b/tests/Unit/DataStructures/DataBox/Test_DataBox.cpp @@ -3263,6 +3263,42 @@ void test_output() { remove_whitespace(output_stream); remove_whitespace(expected_stream); CHECK(output_stream == expected_stream); + const auto item_size = box.size_of_items(); + CHECK(item_size.size() == 5); + CHECK(item_size.at("(anonymous namespace)::test_databox_tags::Tag0") == 8); + CHECK(item_size.at("(anonymous namespace)::test_databox_tags::Tag1") == 32); + CHECK(item_size.at("(anonymous namespace)::test_databox_tags::Tag2") == 24); + CHECK(item_size.at("(anonymous namespace)::test_databox_tags::Tag4Compute") == + 8); + CHECK(item_size.at("(anonymous namespace)::test_databox_tags::Tag5Compute") == + 28); + + const auto box_with_ptrs = + db::create, + db::AddComputeTags>( + std::make_unique(3)); + const auto item_size_ptrs = box_with_ptrs.size_of_items(); + CHECK(item_size_ptrs.size() == 3); + CHECK(item_size_ptrs.at( + "(anonymous namespace)::test_databox_tags::Pointer") == 4); + CHECK(item_size_ptrs.at( + "(anonymous " + "namespace)::test_databox_tags::PointerToCounterCompute") == 0); + CHECK(item_size_ptrs.at( + "(anonymous namespace)::test_databox_tags::PointerToSumCompute") == + 0); + db::get(box_with_ptrs); + const auto item_size_ptrs_after = box_with_ptrs.size_of_items(); + CHECK(item_size_ptrs_after.size() == 3); + CHECK(item_size_ptrs_after.at( + "(anonymous namespace)::test_databox_tags::Pointer") == 4); + CHECK(item_size_ptrs_after.at( + "(anonymous " + "namespace)::test_databox_tags::PointerToCounterCompute") == 4); + CHECK(item_size_ptrs_after.at( + "(anonymous namespace)::test_databox_tags::PointerToSumCompute") == + 4); } void test_exception_safety() {