sxs-collaboration · nilsvu · Aug 14, 2024 · Aug 13, 2024 · Aug 13, 2024 · Aug 13, 2024
diff --git a/cmake/AddSpectreExecutable.cmake b/cmake/AddSpectreExecutable.cmake
@@ -26,11 +26,26 @@ function(add_spectre_executable TARGET_NAME)
     PUBLIC
     ${SPECTRE_ALLOCATOR_LIBRARY}
     SpectreAllocator
-    )
+  )
+
+  set(SPECTRE_KOKKOS_LAUNCHER "")
+  if(SPECTRE_KOKKOS)
+    # We need to make sure we don't drop the Kokkos link wrapper
+    get_target_property(
+      SPECTRE_KOKKOS_LAUNCHER
+      ${TARGET_NAME}
+      RULE_LAUNCH_LINK)
+    # get_target_property returns <VAR>-NOTFOUND when the property is unset;
+    # use an empty launcher in that case so it never reaches the link line.
+    if(NOT SPECTRE_KOKKOS_LAUNCHER)
+      set(SPECTRE_KOKKOS_LAUNCHER "")
+    endif()
+  endif()
   set_target_properties(
     ${TARGET_NAME}
     PROPERTIES
-    RULE_LAUNCH_LINK "${CMAKE_BINARY_DIR}/tmp/WrapExecutableLinker.sh"
+    RULE_LAUNCH_LINK
+    "${CMAKE_BINARY_DIR}/tmp/WrapExecutableLinker.sh ${SPECTRE_KOKKOS_LAUNCHER}"
     LINK_DEPENDS "${CMAKE_BINARY_DIR}/tmp/WrapExecutableLinker.sh"
     # Expose readable symbol names in backtrace (adds flags like -rdynamic)
     ENABLE_EXPORTS ON

diff --git a/cmake/SetupKokkos.cmake b/cmake/SetupKokkos.cmake
@@ -27,7 +27,9 @@ if(SPECTRE_KOKKOS)
 
   find_package(Kokkos REQUIRED)
 
-  if (TARGET Kokkos::kokkos AND Kokkos_ENABLE_CUDA)
+  if (TARGET Kokkos::kokkos
+      AND Kokkos_ENABLE_CUDA
+      AND CMAKE_CXX_COMPILER_ID STREQUAL "GNU")
     set_property(TARGET Kokkos::kokkos
       APPEND PROPERTY
       INTERFACE_COMPILE_OPTIONS

diff --git a/cmake/SetupPch.cmake b/cmake/SetupPch.cmake
@@ -49,6 +49,7 @@ target_link_libraries(
   Charmxx::pup
   HDF5::HDF5
   SpectreFlags
+  SpectreKokkos
   )
 
 # Targets can reuse the PCH generated for this library. They must also link

diff --git a/cmake/SpectreAddLibraries.cmake b/cmake/SpectreAddLibraries.cmake
@@ -39,14 +39,28 @@ function(ADD_SPECTRE_LIBRARY LIBRARY_NAME)
       PUBLIC
       ${SPECTRE_ALLOCATOR_LIBRARY}
       SpectreAllocator
-      )
+    )
 
+    set(SPECTRE_KOKKOS_LAUNCHER "")
+    if(SPECTRE_KOKKOS)
+      # We need to make sure we don't drop the Kokkos link wrapper
+      get_target_property(
+        SPECTRE_KOKKOS_LAUNCHER
+        ${LIBRARY_NAME}
+        RULE_LAUNCH_LINK)
+      # get_target_property returns <VAR>-NOTFOUND when the property is unset;
+      # use an empty launcher in that case so it never reaches the link line.
+      if(NOT SPECTRE_KOKKOS_LAUNCHER)
+        set(SPECTRE_KOKKOS_LAUNCHER "")
+      endif()
+    endif()
     set_target_properties(
       ${LIBRARY_NAME}
       PROPERTIES
-      RULE_LAUNCH_LINK "${CMAKE_BINARY_DIR}/tmp/WrapLibraryLinker.sh"
+      RULE_LAUNCH_LINK
+      "${CMAKE_BINARY_DIR}/tmp/WrapLibraryLinker.sh ${SPECTRE_KOKKOS_LAUNCHER}"
       LINK_DEPENDS "${CMAKE_BINARY_DIR}/tmp/WrapLibraryLinker.sh"
-      )
+    )
   endif (NOT ${LIBRARY_TYPE} STREQUAL INTERFACE_LIBRARY)
   if (NOT "${LIBRARY_NAME}" MATCHES "^SpectrePch"
       AND NOT ${LIBRARY_IS_IMPORTED}

diff --git a/src/Domain/BlockLogicalCoordinates.cpp b/src/Domain/BlockLogicalCoordinates.cpp
@@ -17,14 +17,14 @@
 #include "Utilities/ErrorHandling/Error.hpp"
 #include "Utilities/GenerateInstantiations.hpp"
 
-template <size_t Dim, typename Frame>
+template <size_t Dim, typename Fr>
 std::optional<tnsr::I<double, Dim, ::Frame::BlockLogical>>
 block_logical_coordinates_single_point(
-    const tnsr::I<double, Dim, Frame>& input_point, const Block<Dim>& block,
+    const tnsr::I<double, Dim, Fr>& input_point, const Block<Dim>& block,
     const double time, const domain::FunctionsOfTimeMap& functions_of_time) {
   std::optional<tnsr::I<double, Dim, ::Frame::BlockLogical>> logical_point{};
   if (block.is_time_dependent()) {
-    if constexpr (std::is_same_v<Frame, ::Frame::Inertial>) {
+    if constexpr (std::is_same_v<Fr, ::Frame::Inertial>) {
       // Point is in the inertial frame, so we need to map to the grid
       // frame and then the logical frame.
       const auto moving_inv = block.moving_mesh_grid_to_inertial_map().inverse(
@@ -35,7 +35,7 @@ block_logical_coordinates_single_point(
       // logical to grid map is time-independent.
       logical_point =
           block.moving_mesh_logical_to_grid_map().inverse(moving_inv.value());
-    } else if constexpr (std::is_same_v<Frame, ::Frame::Distorted>) {
+    } else if constexpr (std::is_same_v<Fr, ::Frame::Distorted>) {
       // Point is in the distorted frame, so we need to map to the grid
       // frame and then the logical frame.
       if (not block.has_distorted_frame()) {
@@ -78,24 +78,24 @@ block_logical_coordinates_single_point(
       // frames in the block, so make sure Frame is
       // ::Frame::Grid. (The Inertial and Distorted cases were
       // handled above.)
-      static_assert(std::is_same_v<Frame, ::Frame::Grid>,
+      static_assert(std::is_same_v<Fr, ::Frame::Grid>,
                     "Cannot convert from given frame to Grid frame");
 
       // Point is in the grid frame, just map to logical frame.
       logical_point =
           block.moving_mesh_logical_to_grid_map().inverse(input_point);
     }
   } else {  // not block.is_time_dependent()
-    if constexpr (std::is_same_v<Frame, ::Frame::Inertial>) {
+    if constexpr (std::is_same_v<Fr, ::Frame::Inertial>) {
       logical_point = block.stationary_map().inverse(input_point);
     } else {
       // If the map is time-independent, then the grid, distorted, and
       // inertial frames are the same.  So if we are in the grid
       // or distorted frames, convert to the inertial frame
       // (this conversion is just a type conversion).
       // Otherwise throw a static_assert.
-      static_assert(std::is_same_v<Frame, ::Frame::Grid> or
-                        std::is_same_v<Frame, ::Frame::Distorted>,
+      static_assert(std::is_same_v<Fr, ::Frame::Grid> or
+                        std::is_same_v<Fr, ::Frame::Distorted>,
                     "Cannot convert from given frame to Inertial frame");
       tnsr::I<double, Dim, ::Frame::Inertial> x_inertial(0.0);
       for (size_t d = 0; d < Dim; ++d) {
@@ -133,14 +133,14 @@ block_logical_coordinates_single_point(
   return logical_point;
 }
 
-template <size_t Dim, typename Frame>
+template <size_t Dim, typename Fr>
 std::vector<BlockLogicalCoords<Dim>> block_logical_coordinates(
-    const Domain<Dim>& domain, const tnsr::I<DataVector, Dim, Frame>& x,
+    const Domain<Dim>& domain, const tnsr::I<DataVector, Dim, Fr>& x,
     const double time, const domain::FunctionsOfTimeMap& functions_of_time) {
   const size_t num_pts = get<0>(x).size();
   std::vector<BlockLogicalCoords<Dim>> block_coord_holders(num_pts);
   for (size_t s = 0; s < num_pts; ++s) {
-    tnsr::I<double, Dim, Frame> x_frame(0.0);
+    tnsr::I<double, Dim, Fr> x_frame(0.0);
     for (size_t d = 0; d < Dim; ++d) {
       x_frame.get(d) = x.get(d)[s];
     }

diff --git a/src/Domain/BlockLogicalCoordinates.hpp b/src/Domain/BlockLogicalCoordinates.hpp
@@ -62,17 +62,17 @@ using BlockLogicalCoords = std::optional<
 /// typical use cases.  This means that `block_logical_coordinates`
 /// does not assume that grid and distorted frames are equal in
 /// `Block`s that lack a distorted frame.
-template <size_t Dim, typename Frame>
+template <size_t Dim, typename Fr>
 auto block_logical_coordinates(
-    const Domain<Dim>& domain, const tnsr::I<DataVector, Dim, Frame>& x,
+    const Domain<Dim>& domain, const tnsr::I<DataVector, Dim, Fr>& x,
     double time = std::numeric_limits<double>::signaling_NaN(),
     const domain::FunctionsOfTimeMap& functions_of_time = {})
     -> std::vector<BlockLogicalCoords<Dim>>;
 
-template <size_t Dim, typename Frame>
+template <size_t Dim, typename Fr>
 std::optional<tnsr::I<double, Dim, ::Frame::BlockLogical>>
 block_logical_coordinates_single_point(
-    const tnsr::I<double, Dim, Frame>& input_point, const Block<Dim>& block,
+    const tnsr::I<double, Dim, Fr>& input_point, const Block<Dim>& block,
     double time = std::numeric_limits<double>::signaling_NaN(),
     const domain::FunctionsOfTimeMap& functions_of_time = {});
 /// @}
diff --git a/src/Domain/FunctionsOfTime/PiecewisePolynomial.cpp b/src/Domain/FunctionsOfTime/PiecewisePolynomial.cpp
@@ -225,6 +225,13 @@ void PiecewisePolynomial<MaxDeriv>::pup(PUP::er& p) {
 namespace {
 template <size_t MaxDerivPlusOne>
 struct LegacyStoredInfo {
+  LegacyStoredInfo() = default;
+  // The array extent must match the `stored_quantities` member for every
+  // MaxDerivPlusOne, not only for 1.
+  LegacyStoredInfo(double in_time,
+                   std::array<DataVector, MaxDerivPlusOne> in_stored_quantities)
+      : time(in_time), stored_quantities(in_stored_quantities) {}
+
   double time{std::numeric_limits<double>::signaling_NaN()};
   std::array<DataVector, MaxDerivPlusOne> stored_quantities;
 

diff --git a/src/Domain/FunctionsOfTime/QuaternionFunctionOfTime.cpp b/src/Domain/FunctionsOfTime/QuaternionFunctionOfTime.cpp
@@ -116,6 +116,11 @@
 
 namespace {
 struct LegacyStoredInfo {
+  LegacyStoredInfo() = default;
+  LegacyStoredInfo(double in_time,
+                   std::array<DataVector, 1> in_stored_quantities)
+      : time(in_time), stored_quantities(in_stored_quantities) {}
+
   double time{std::numeric_limits<double>::signaling_NaN()};
   std::array<DataVector, 1> stored_quantities;
 

diff --git a/src/Domain/FunctionsOfTime/ThreadsafeList.hpp b/src/Domain/FunctionsOfTime/ThreadsafeList.hpp
@@ -130,7 +130,7 @@ class ThreadsafeList {
   class iterator {
    public:
     using iterator_category = std::input_iterator_tag;
-    using value_type = decltype(ThreadsafeList{}(double{}));
+    using value_type = IntervalInfo;
     using reference = value_type;
     using pointer = std::optional<value_type>;
     using difference_type = std::ptrdiff_t;

diff --git a/src/Domain/FunctionsOfTime/ThreadsafeList.tpp b/src/Domain/FunctionsOfTime/ThreadsafeList.tpp
@@ -19,9 +19,15 @@ namespace domain::FunctionsOfTime::FunctionOfTimeHelpers {
 namespace ThreadsafeList_detail {
 template <typename T>
 struct Interval {
-  double expiration;
-  T data;
-  std::unique_ptr<Interval> previous;
+  Interval() = default;
+  Interval(double in_expiration, T in_data,
+           std::unique_ptr<Interval> in_previous)
+      : expiration(in_expiration),
+        data(std::move(in_data)),
+        previous(std::move(in_previous)) {}
+  double expiration{};
+  T data{};
+  std::unique_ptr<Interval> previous{};
 
   void pup(PUP::er& p);
 };

diff --git a/src/IO/H5/Cce.cpp b/src/IO/H5/Cce.cpp
@@ -141,6 +141,10 @@ Cce::~Cce() {
   // internals of CHECK_H5), so older compilers that we support may not have
   // fixed this bug.
   for (const auto& name_and_dataset : bondi_datasets_) {
+#ifdef __CUDACC__
+    // nvcc warns that 'name' is unused
+    [[maybe_unused]]
+#endif
     const auto& name = name_and_dataset.first;
     const auto& dataset = name_and_dataset.second;
     CHECK_H5(H5Dclose(dataset.id), "Failed to close dataset " << name);

diff --git a/src/IO/Importers/Actions/ReadVolumeData.hpp b/src/IO/Importers/Actions/ReadVolumeData.hpp
@@ -21,6 +21,7 @@
 #include "Domain/Structure/ElementId.hpp"
 #include "IO/H5/AccessType.hpp"
 #include "IO/H5/File.hpp"
+#include "IO/H5/TensorData.hpp"
 #include "IO/H5/VolumeData.hpp"
 #include "IO/Importers/ObservationSelector.hpp"
 #include "IO/Importers/Tags.hpp"

diff --git a/src/NumericalAlgorithms/FiniteDifference/Reconstruct.tpp b/src/NumericalAlgorithms/FiniteDifference/Reconstruct.tpp
@@ -19,15 +19,15 @@
 
 namespace fd::reconstruction {
 namespace detail {
-template <size_t Index, size_t DimToReplace, size_t... Is,
+template <size_t IndexToSet, size_t DimToReplace, size_t... Is,
           size_t Dim = sizeof...(Is)>
 auto generate_index_for_u_to_reconstruct_impl(
     const std::array<size_t, sizeof...(Is)>& indices,
     std::index_sequence<Is...>) -> ::Index<Dim> {
-  return ::Index<Dim>{(DimToReplace != Is ? indices[Is] : Index)...};
+  return ::Index<Dim>{(DimToReplace != Is ? indices[Is] : IndexToSet)...};
 }
 
-template <size_t Index, size_t DimToReplace, size_t NumberOfNeighborCells,
+template <size_t IndexToSet, size_t DimToReplace, size_t NumberOfNeighborCells,
           size_t... Is, size_t Dim = sizeof...(Is)>
 auto generate_upper_volume_index_for_u_to_reconstruct_impl(
     const std::array<size_t, sizeof...(Is)>& indices,
@@ -36,7 +36,7 @@ auto generate_upper_volume_index_for_u_to_reconstruct_impl(
   return ::Index<Dim>{
       (DimToReplace != Is
            ? indices[Is]
-           : (volume_extents[Is] - (NumberOfNeighborCells - Index)))...};
+           : (volume_extents[Is] - (NumberOfNeighborCells - IndexToSet)))...};
 }
 
 template <Side UpperLower, size_t DimToReplace, size_t Dim,

diff --git a/src/NumericalAlgorithms/SphericalHarmonics/TagsTypeAliases.hpp b/src/NumericalAlgorithms/SphericalHarmonics/TagsTypeAliases.hpp
@@ -13,21 +13,20 @@ class DataVector;
 namespace ylm::Tags {
 /// Defines type aliases used in Strahlkorper-related Tags.
 namespace aliases {
-template <typename Frame>
+template <typename Fr>
 using Jacobian =
     Tensor<DataVector, tmpl::integral_list<std::int32_t, 2, 1>,
-           index_list<SpatialIndex<3, UpLo::Up, Frame>,
-                      SpatialIndex<2, UpLo::Lo, ::Frame::Spherical<Frame>>>>;
-template <typename Frame>
+           index_list<SpatialIndex<3, UpLo::Up, Fr>,
+                      SpatialIndex<2, UpLo::Lo, ::Frame::Spherical<Fr>>>>;
+template <typename Fr>
 using InvJacobian =
     Tensor<DataVector, tmpl::integral_list<std::int32_t, 2, 1>,
-           index_list<SpatialIndex<2, UpLo::Up, ::Frame::Spherical<Frame>>,
-                      SpatialIndex<3, UpLo::Lo, Frame>>>;
-template <typename Frame>
-using InvHessian =
-    Tensor<DataVector, tmpl::integral_list<std::int32_t, 3, 2, 1>,
-           index_list<SpatialIndex<2, UpLo::Up, ::Frame::Spherical<Frame>>,
-                      SpatialIndex<3, UpLo::Lo, Frame>,
-                      SpatialIndex<3, UpLo::Lo, Frame>>>;
+           index_list<SpatialIndex<2, UpLo::Up, ::Frame::Spherical<Fr>>,
+                      SpatialIndex<3, UpLo::Lo, Fr>>>;
+template <typename Fr>
+using InvHessian = Tensor<
+    DataVector, tmpl::integral_list<std::int32_t, 3, 2, 1>,
+    index_list<SpatialIndex<2, UpLo::Up, ::Frame::Spherical<Fr>>,
+               SpatialIndex<3, UpLo::Lo, Fr>, SpatialIndex<3, UpLo::Lo, Fr>>>;
 }  // namespace aliases
 }  // namespace ylm::Tags
diff --git a/tools/BlazeExceptions.hpp b/tools/BlazeExceptions.hpp
@@ -3,6 +3,12 @@
 
 #include <csignal>
 
+#ifdef __CUDA_ARCH__
+// When building for Nvidia GPUs we need to disable the use of vector
+// intrinsics.
+#define BLAZE_USE_VECTORIZATION 0
+#endif
+
 #ifndef SPECTRE_BLAZE_EXCEPTIONS_HPP
 #define SPECTRE_BLAZE_EXCEPTIONS_HPP