cpp/latest/GinkgoRBFKernels_8cpp_source.html

#include "mapping/device/GinkgoRBFKernels.hpp"


#include "mapping/impl/BasisFunctions.hpp"

#include "math/math.hpp"


#include <functional>

#include <ginkgo/extensions/kokkos.hpp>

#include <ginkgo/ginkgo.hpp>


using precice::mapping::RadialBasisParameters;

using precice::math::pow_int;


using gko::ext::kokkos::map_data;


namespace precice::mapping {


std::shared_ptr<gko::Executor> create_device_executor(const std::string &execName, bool enableUnifiedMemory)

{

#ifdef KOKKOS_ENABLE_SERIAL

  if (execName == "reference-executor") {

    return gko::ext::kokkos::create_executor(Kokkos::Serial{});

  }

#endif

#ifdef PRECICE_WITH_OPENMP

  if (execName == "omp-executor") {

    return gko::ext::kokkos::create_executor(Kokkos::OpenMP{});

  }

#endif

#ifdef PRECICE_WITH_CUDA

  if (execName == "cuda-executor") {

    if (enableUnifiedMemory) {

      return gko::ext::kokkos::create_executor(Kokkos::Cuda{}, Kokkos::CudaUVMSpace{});

    } else {

      return gko::ext::kokkos::create_executor(Kokkos::Cuda{}, Kokkos::CudaSpace{});

    }

  }

#endif

#ifdef PRECICE_WITH_HIP

  if (execName == "hip-executor") {

    if (enableUnifiedMemory) {

      return gko::ext::kokkos::create_executor(Kokkos::HIP{}, Kokkos::HIPManagedSpace{});

    } else {

      return gko::ext::kokkos::create_executor(Kokkos::HIP{}, Kokkos::HIPSpace{});

    }

  }

#endif

  PRECICE_UNREACHABLE("Executor {} unknown to preCICE", execName);

}


namespace kernel {


/// Fills every entry of @p mtx with a radial-basis-function evaluation.
///
/// For each index pair (i, j) in the full extent of @p mtx the kernel
/// computes the Euclidean distance between support point j and target point i,
/// restricted to the axes flagged in @p activeAxis, and stores
/// `f(distance, rbf_params)` in `mtx(i, j)`.
///
/// Two kernels exist that differ only in how the point matrices are indexed:
/// when @p MemorySpace is Kokkos::HostSpace the points are read as
/// (point, axis), otherwise as (axis, point).
///
/// @tparam MemorySpace      Kokkos memory space used to map the Ginkgo data.
/// @tparam EvalFunctionType Callable invoked as `f(double, RadialBasisParameters)`.
/// @param exec          Not used by this implementation; kept for the interface.
/// @param mtx           Output matrix; its size defines the iteration range.
/// @param activeAxis    Flags selecting the axes that contribute to the distance.
/// @param supportPoints Coordinates of the support points (column index j of @p mtx).
/// @param targetPoints  Coordinates of the target points (row index i of @p mtx).
/// @param f             Basis function to evaluate.
/// @param rbf_params    Parameters forwarded to @p f.
/// @param addPolynomial Not used: previously triggered a zero-store that was
///                      always overwritten by the basis-function value.
/// @param extraDims     Not used by this implementation; kept for the interface.
template <typename MemorySpace, typename EvalFunctionType>
void create_rbf_system_matrix_impl(std::shared_ptr<const gko::Executor>      exec,
                                   gko::ptr_param<GinkgoMatrix>              mtx,
                                   const std::array<bool, 3>                 activeAxis,
                                   gko::ptr_param<GinkgoMatrix>              supportPoints,
                                   gko::ptr_param<GinkgoMatrix>              targetPoints,
                                   EvalFunctionType                          f,
                                   ::precice::mapping::RadialBasisParameters rbf_params,
                                   bool                                      addPolynomial,
                                   unsigned int                              extraDims)
{
  auto k_mtx           = map_data<MemorySpace>(mtx.get());
  auto k_supportPoints = map_data<MemorySpace>(supportPoints.get());
  auto k_targetPoints  = map_data<MemorySpace>(targetPoints.get());

  // the outcome of this if-condition is known at compile time. However, Cuda
  // has issues with constexpr
  if (std::is_same_v<MemorySpace, Kokkos::HostSpace>) {
    // Row-major access
    Kokkos::parallel_for(
        "create_rbf_system_matrix_row_major",
        Kokkos::MDRangePolicy<typename MemorySpace::execution_space, Kokkos::Rank<2>>{{0, 0}, {mtx->get_size()[0], mtx->get_size()[1]}},
        KOKKOS_LAMBDA(const int &i, const int &j) {
          // We need to use a pointer here, because the bound checking of std::array
          // contains some host-only code, which yields errors when compiling in
          // debug mode
          const bool *deviceActiveAxis = activeAxis.data();

          // Accumulate the squared Euclidean distance over the active axes
          double dist = 0;
          for (size_t k = 0; k < activeAxis.size(); ++k) {
            if (deviceActiveAxis[k]) {
              const double diff = k_supportPoints(j, k) - k_targetPoints(i, k);
              dist += diff * diff;
            }
          }
          dist        = Kokkos::sqrt(dist);
          k_mtx(i, j) = f(dist, rbf_params); // Evaluate the RBF function
        });
  } else {
    // Column-major access
    Kokkos::parallel_for(
        "create_rbf_system_matrix_col_major",
        Kokkos::MDRangePolicy<typename MemorySpace::execution_space, Kokkos::Rank<2>>{{0, 0}, {mtx->get_size()[0], mtx->get_size()[1]}},
        KOKKOS_LAMBDA(const int &i, const int &j) {
          // Pointer access for the same reason as in the row-major kernel
          const bool *deviceActiveAxis = activeAxis.data();

          // Accumulate the squared Euclidean distance over the active axes
          double dist = 0;
          for (size_t k = 0; k < activeAxis.size(); ++k) {
            if (deviceActiveAxis[k]) {
              const double diff = k_supportPoints(k, j) - k_targetPoints(k, i);
              dist += diff * diff;
            }
          }
          dist        = Kokkos::sqrt(dist);
          k_mtx(i, j) = f(dist, rbf_params); // Evaluate the RBF function
        });
  }
}


/// Dispatches the RBF system-matrix assembly to the kernel instantiation that
/// matches the run-time type of @p exec.
///
/// The executor is tested against the compiled-in backends in the order
/// reference, OpenMP, CUDA, HIP; the first match selects the Kokkos memory
/// space and the function returns after launching the kernel. For CUDA and
/// HIP, @p unifiedMemory chooses Kokkos::CudaUVMSpace / Kokkos::HIPManagedSpace
/// over Kokkos::CudaSpace / Kokkos::HIPSpace.
///
/// All remaining arguments are forwarded unchanged to
/// create_rbf_system_matrix_impl. An executor that matches no compiled-in
/// backend ends up in PRECICE_UNREACHABLE.
template <typename EvalFunctionType>
void create_rbf_system_matrix(std::shared_ptr<const gko::Executor>      exec,
                              bool                                      unifiedMemory,
                              gko::ptr_param<GinkgoMatrix>              mtx,
                              const std::array<bool, 3>                 activeAxis,
                              gko::ptr_param<GinkgoMatrix>              supportPoints,
                              gko::ptr_param<GinkgoMatrix>              targetPoints,
                              EvalFunctionType                          f,
                              ::precice::mapping::RadialBasisParameters rbf_params,
                              bool                                      addPolynomial,
                              unsigned int                              extraDims)
{
#ifdef KOKKOS_ENABLE_SERIAL
  if (dynamic_cast<const gko::ReferenceExecutor *>(exec.get()) != nullptr) {
    create_rbf_system_matrix_impl<Kokkos::Serial::memory_space>(exec, mtx, activeAxis, supportPoints, targetPoints, f, rbf_params, addPolynomial, extraDims);
    return;
  }
#endif

#ifdef PRECICE_WITH_OPENMP
  if (dynamic_cast<const gko::OmpExecutor *>(exec.get()) != nullptr) {
    create_rbf_system_matrix_impl<Kokkos::OpenMP::memory_space>(exec, mtx, activeAxis, supportPoints, targetPoints, f, rbf_params, addPolynomial, extraDims);
    return;
  }
#endif

#ifdef PRECICE_WITH_CUDA
  if (dynamic_cast<const gko::CudaExecutor *>(exec.get()) != nullptr) {
    if (unifiedMemory) {
      create_rbf_system_matrix_impl<Kokkos::CudaUVMSpace>(exec, mtx, activeAxis, supportPoints, targetPoints, f, rbf_params, addPolynomial, extraDims);
      return;
    }
    create_rbf_system_matrix_impl<Kokkos::CudaSpace>(exec, mtx, activeAxis, supportPoints, targetPoints, f, rbf_params, addPolynomial, extraDims);
    return;
  }
#endif

#ifdef PRECICE_WITH_HIP
  if (dynamic_cast<const gko::HipExecutor *>(exec.get()) != nullptr) {
    if (unifiedMemory) {
      create_rbf_system_matrix_impl<Kokkos::HIPManagedSpace>(exec, mtx, activeAxis, supportPoints, targetPoints, f, rbf_params, addPolynomial, extraDims);
      return;
    }
    create_rbf_system_matrix_impl<Kokkos::HIPSpace>(exec, mtx, activeAxis, supportPoints, targetPoints, f, rbf_params, addPolynomial, extraDims);
    return;
  }
#endif

  // None of the compiled-in backends recognised the executor.
  PRECICE_UNREACHABLE("Executor unknown to preCICE");
}


// Explicitly instantiates create_rbf_system_matrix for one basis-function type.
// The macro body must stay on directly consecutive lines: a blank line after a
// trailing backslash ends the macro definition.
#define PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(_function_type)                                                                            \
  template void create_rbf_system_matrix<_function_type>(std::shared_ptr<const gko::Executor> exec,                                             \
                                                         bool                                 unifiedMemory,                                    \
                                                         gko::ptr_param<GinkgoMatrix> mtx, const std::array<bool, 3> activeAxis,                \
                                                         gko::ptr_param<GinkgoMatrix> supportPoints, gko::ptr_param<GinkgoMatrix> targetPoints, \
                                                         _function_type f, RadialBasisParameters rbf_params, bool addPolynomial, unsigned int extraDims)

// One explicit instantiation per basis function listed below.
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(ThinPlateSplines);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(Multiquadrics);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(InverseMultiquadrics);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(VolumeSplines);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(Gaussian);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(CompactThinPlateSplinesC2);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(CompactPolynomialC0);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(CompactPolynomialC2);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(CompactPolynomialC4);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(CompactPolynomialC6);
PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(CompactPolynomialC8);

// The helper macro is only needed for the instantiations above.
#undef PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX


/// Fills @p mtx from the point coordinates in @p x plus constant columns.
///
/// For every entry (i, j) in the full extent of @p mtx: columns with
/// `j < dims - 1` receive a value read from @p x, all remaining columns are
/// set to 1. When @p MemorySpace is Kokkos::HostSpace the value is read as
/// `x(i, j)`, otherwise as `x(j, i)`.
///
/// @tparam MemorySpace Kokkos memory space used to map the Ginkgo data.
/// @param exec Not used by this implementation; kept for the interface.
/// @param mtx  Output matrix; its size defines the iteration range.
/// @param x    Source of the coordinate values.
/// @param dims Column threshold: `dims - 1` leading columns are copied from @p x.
template <typename MemorySpace>
void fill_polynomial_matrix_impl(std::shared_ptr<const gko::Executor> exec,
                                 gko::ptr_param<GinkgoMatrix>         mtx,
                                 gko::ptr_param<const GinkgoMatrix>   x,
                                 const unsigned int                   dims)
{
  auto k_mtx = map_data<MemorySpace>(mtx.get());
  auto k_x   = map_data<MemorySpace>(x.get());

  // Evaluated once on the host, in the same unsigned arithmetic the kernels
  // compare the column index against.
  const unsigned int copiedColumns = dims - 1;

  if (std::is_same_v<MemorySpace, Kokkos::HostSpace>) {
    Kokkos::parallel_for(
        "fill_polynomial_matrix_row_major",
        Kokkos::MDRangePolicy<typename MemorySpace::execution_space, Kokkos::Rank<2>>{{0, 0}, {mtx->get_size()[0], mtx->get_size()[1]}},
        KOKKOS_LAMBDA(const int &i, const int &j) {
          // Row-major access for the copied columns, constant 1 otherwise
          const double entry = (j < copiedColumns) ? k_x(i, j) : 1.0;
          k_mtx(i, j)        = entry;
        });
  } else {
    Kokkos::parallel_for(
        "fill_polynomial_matrix_col_major",
        Kokkos::MDRangePolicy<typename MemorySpace::execution_space, Kokkos::Rank<2>>{{0, 0}, {mtx->get_size()[0], mtx->get_size()[1]}},
        KOKKOS_LAMBDA(const int &i, const int &j) {
          // Column-major access for the copied columns, constant 1 otherwise
          const double entry = (j < copiedColumns) ? k_x(j, i) : 1.0;
          k_mtx(i, j)        = entry;
        });
  }
}


/// Dispatches the polynomial-matrix fill to the kernel instantiation that
/// matches the run-time type of @p exec.
///
/// The executor is tested against the compiled-in backends in the order
/// reference, OpenMP, CUDA, HIP; the first match selects the Kokkos memory
/// space and the function returns after launching the kernel. For CUDA and
/// HIP, @p unifiedMemory chooses Kokkos::CudaUVMSpace / Kokkos::HIPManagedSpace
/// over Kokkos::CudaSpace / Kokkos::HIPSpace.
///
/// @p mtx, @p x and @p dims are forwarded unchanged to
/// fill_polynomial_matrix_impl. An executor that matches no compiled-in
/// backend ends up in PRECICE_UNREACHABLE.
void fill_polynomial_matrix(std::shared_ptr<const gko::Executor> exec,
                            bool                                 unifiedMemory,
                            gko::ptr_param<GinkgoMatrix>         mtx,
                            gko::ptr_param<const GinkgoMatrix>   x,
                            const unsigned int                   dims)
{
#ifdef KOKKOS_ENABLE_SERIAL
  if (dynamic_cast<const gko::ReferenceExecutor *>(exec.get()) != nullptr) {
    fill_polynomial_matrix_impl<Kokkos::Serial::memory_space>(exec, mtx, x, dims);
    return;
  }
#endif

#ifdef PRECICE_WITH_OPENMP
  if (dynamic_cast<const gko::OmpExecutor *>(exec.get()) != nullptr) {
    fill_polynomial_matrix_impl<Kokkos::OpenMP::memory_space>(exec, mtx, x, dims);
    return;
  }
#endif

#ifdef PRECICE_WITH_CUDA
  if (dynamic_cast<const gko::CudaExecutor *>(exec.get()) != nullptr) {
    if (unifiedMemory) {
      fill_polynomial_matrix_impl<Kokkos::CudaUVMSpace>(exec, mtx, x, dims);
      return;
    }
    fill_polynomial_matrix_impl<Kokkos::CudaSpace>(exec, mtx, x, dims);
    return;
  }
#endif

#ifdef PRECICE_WITH_HIP
  if (dynamic_cast<const gko::HipExecutor *>(exec.get()) != nullptr) {
    if (unifiedMemory) {
      fill_polynomial_matrix_impl<Kokkos::HIPManagedSpace>(exec, mtx, x, dims);
      return;
    }
    fill_polynomial_matrix_impl<Kokkos::HIPSpace>(exec, mtx, x, dims);
    return;
  }
#endif

  // None of the compiled-in backends recognised the executor.
  PRECICE_UNREACHABLE("Executor unknown to preCICE");
}


} // namespace kernel


} // namespace precice::mapping

BasisFunctions.hpp

PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX
#define PRECICE_INSTANTIATE_CREATE_RBF_SYSTEM_MATRIX(_function_type)
Definition GinkgoRBFKernels.cpp:166

GinkgoRBFKernels.hpp

PRECICE_UNREACHABLE
#define PRECICE_UNREACHABLE(...)
Definition assertion.hpp:93

precice::mapping::CompactPolynomialC0
Wendland radial basis function with compact support.
Definition BasisFunctions.hpp:369

precice::mapping::CompactPolynomialC2
Wendland radial basis function with compact support.
Definition BasisFunctions.hpp:421

precice::mapping::CompactPolynomialC4
Wendland radial basis function with compact support.
Definition BasisFunctions.hpp:474

precice::mapping::CompactPolynomialC6
Wendland radial basis function with compact support.
Definition BasisFunctions.hpp:527

precice::mapping::CompactPolynomialC8
Wendland radial basis function with compact support.
Definition BasisFunctions.hpp:579

precice::mapping::CompactThinPlateSplinesC2
Radial basis function with compact support.
Definition BasisFunctions.hpp:317

precice::mapping::Gaussian
Radial basis function with global and compact support.
Definition BasisFunctions.hpp:238

precice::mapping::InverseMultiquadrics
Radial basis function with global support.
Definition BasisFunctions.hpp:167

precice::mapping::Multiquadrics
Radial basis function with global support.
Definition BasisFunctions.hpp:129

precice::mapping::ThinPlateSplines
Radial basis function with global support.
Definition BasisFunctions.hpp:99

precice::mapping::VolumeSplines
Radial basis function with global support.
Definition BasisFunctions.hpp:208

math.hpp

precice::mapping::kernel
Definition GinkgoRBFKernels.cpp:50

precice::mapping::kernel::fill_polynomial_matrix
void fill_polynomial_matrix(std::shared_ptr< const gko::Executor > exec, bool unifiedMemory, gko::ptr_param< GinkgoMatrix > mtx, gko::ptr_param< const GinkgoMatrix > x, const unsigned int dims)
Definition GinkgoRBFKernels.cpp:225

precice::mapping::kernel::fill_polynomial_matrix_impl
void fill_polynomial_matrix_impl(std::shared_ptr< const gko::Executor > exec, gko::ptr_param< GinkgoMatrix > mtx, gko::ptr_param< const GinkgoMatrix > x, const unsigned int dims)
Definition GinkgoRBFKernels.cpp:187

precice::mapping::kernel::create_rbf_system_matrix
void create_rbf_system_matrix(std::shared_ptr< const gko::Executor > exec, bool unifiedMemory, gko::ptr_param< GinkgoMatrix > mtx, const std::array< bool, 3 > activeAxis, gko::ptr_param< GinkgoMatrix > supportPoints, gko::ptr_param< GinkgoMatrix > targetPoints, EvalFunctionType f, ::precice::mapping::RadialBasisParameters rbf_params, bool addPolynomial, unsigned int extraDims)
Definition GinkgoRBFKernels.cpp:120

precice::mapping::kernel::create_rbf_system_matrix_impl
void create_rbf_system_matrix_impl(std::shared_ptr< const gko::Executor > exec, gko::ptr_param< GinkgoMatrix > mtx, const std::array< bool, 3 > activeAxis, gko::ptr_param< GinkgoMatrix > supportPoints, gko::ptr_param< GinkgoMatrix > targetPoints, EvalFunctionType f, ::precice::mapping::RadialBasisParameters rbf_params, bool addPolynomial, unsigned int extraDims)
Definition GinkgoRBFKernels.cpp:53

precice::mapping
Contains data mapping from points to meshes.
Definition AxialGeoMultiscaleMapping.cpp:5

precice::mapping::create_device_executor
std::shared_ptr< gko::Executor > create_device_executor(const std::string &execName, bool enableUnifiedMemory)
Definition GinkgoRBFKernels.cpp:17

precice::math::pow_int
constexpr T pow_int(const T base)
Computes the power of a given number by an integral exponent given at compile time,...
Definition math.hpp:22

precice::mapping::RadialBasisParameters
Wrapper struct that is used to transfer RBF-specific parameters to the GPU.
Definition BasisFunctions.hpp:51