DiFfRG/cpp/integrator__1D__cartesian__gpu_8hh_source.html

#pragma once


#ifdef __CUDACC__


// standard library

#include <future>


// external libraries

#include <rmm/cuda_stream_pool.hpp>

#include <rmm/device_uvector.hpp>

#include <rmm/mr/device/pool_memory_resource.hpp>

#include <thrust/reduce.h>

#include <thrust/transform_reduce.h>


// DiFfRG

#include <DiFfRG/common/cuda_prefix.hh>

#include <DiFfRG/common/quadrature/quadrature_provider.hh>


namespace DiFfRG

{


  template <typename NT, typename KERNEL> class Integrator1DCartesianGPU

  {

  public:

    using ctype = typename get_type::ctype<NT>;


    template <typename... T> struct functor {

    public:


      functor(const ctype *x_quadrature_p, const ctype *x_quadrature_w, const ctype qx_min, const ctype qx_extent,

              const ctype k, T... t)

          : x_quadrature_p(x_quadrature_p), x_quadrature_w(x_quadrature_w), qx_min(qx_min), qx_extent(qx_extent), k(k),

            t(t...)

      {

      }


      __device__ NT operator()(const uint idx) const

      {

        constexpr int d = 1;

        constexpr ctype int_element = powr<-d>(2 * (ctype)M_PI); // fourier factor


        const ctype q = qx_min + qx_extent * x_quadrature_p[idx];

        const ctype weight = qx_extent * x_quadrature_w[idx];


        const NT res = NT(1) * std::apply([&](auto &&...args) { return KERNEL::kernel(q, k, args...); }, t);

        return int_element * res * weight;

      }


    private:

      const ctype *x_quadrature_p;

      const ctype *x_quadrature_w;

      const ctype qx_min, qx_extent;

      const ctype k;

      const std::tuple<T...> t;

    };


    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array<uint, 1> grid_size,

                             const ctype x_extent = 0., const uint max_block_size = 0, const ctype qx_min = -M_PI,

                             const ctype qx_max = M_PI)

        : Integrator1DCartesianGPU(quadrature_provider, grid_size[0], x_extent, qx_min, qx_max)

    {

    }


    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array<uint, 1> grid_size,

                             const JSONValue &json)

        : Integrator1DCartesianGPU(quadrature_provider, grid_size[0], 0.,

                                   json.get_double("/discretization/integration/qx_min", -M_PI),

                                   json.get_double("/discretization/integration/qx_max", M_PI))

    {

    }


    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array<uint, 1> grid_size,

                             const ctype x_extent, const JSONValue &json)

        : Integrator1DCartesianGPU(quadrature_provider, grid_size[0], x_extent,

                                   json.get_double("/discretization/integration/qx_min", -M_PI),

                                   json.get_double("/discretization/integration/qx_max", M_PI))

    {

    }


    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const uint grid_size, const ctype x_extent = 0.,

                             const ctype qx_min = -M_PI, const ctype qx_max = M_PI)

        : grid_size(grid_size)

    {

      ptr_x_quadrature_p = quadrature_provider.get_device_points<ctype>(grid_size);

      ptr_x_quadrature_w = quadrature_provider.get_device_weights<ctype>(grid_size);


      this->qx_min = qx_min;

      this->qx_extent = qx_max - qx_min;

    }


    Integrator1DCartesianGPU(const Integrator1DCartesianGPU &other)

        : grid_size(other.grid_size), ptr_x_quadrature_p(other.ptr_x_quadrature_p),

          ptr_x_quadrature_w(other.ptr_x_quadrature_w)

    {

      qx_min = other.qx_min;

      qx_extent = other.qx_extent;

    }


    void set_qx_min(const ctype qx_min)

    {

      this->qx_extent = this->qx_extent - qx_min + this->qx_min;

      this->qx_min = qx_min;

    }


    void set_qx_max(const ctype qx_max) { this->qx_extent = qx_max - qx_min; }


    template <typename... T> NT get(const ctype k, const T &...t) const

    {

      return KERNEL::constant(k, t...) +

             thrust::transform_reduce(thrust::cuda::par.on(rmm::cuda_stream_per_thread.value()),

                                      thrust::make_counting_iterator<uint>(0),

                                      thrust::make_counting_iterator<uint>(grid_size),

                                      functor<T...>(ptr_x_quadrature_p, ptr_x_quadrature_w, qx_min, qx_extent, k, t...),

                                      NT(0), thrust::plus<NT>());

    }


    template <typename... T> std::future<NT> request(const ctype k, const T &...t) const

    {

      return std::async(std::launch::deferred, [=, this]() { return get(k, t...); });

    }


  private:

    const uint grid_size;


    ctype qx_min = -M_PI;

    ctype qx_extent = 2. * M_PI;


    const ctype *ptr_x_quadrature_p;

    const ctype *ptr_x_quadrature_w;

  };


} // namespace DiFfRG


#else


#ifdef USE_CUDA


namespace DiFfRG

{

  // Forward declaration only: this branch is taken when USE_CUDA is defined but the translation unit is not

  // compiled with __CUDACC__ defined, so the class is declared here without a definition.

  template <typename NT, typename KERNEL> class Integrator1DCartesianGPU;

}


#else


#include <DiFfRG/physics/integration/integrator_1D_cartesian_cpu.hh>


namespace DiFfRG

{

  /**
   * @brief CPU stand-in for Integrator1DCartesianGPU, used when neither __CUDACC__ nor USE_CUDA is defined.
   *
   * Every constructor forwards to Integrator1DCartesianTBB, which this class derives from; no members are added.
   * The max_block_size parameter is accepted but ignored.
   *
   * @tparam NT numerical type of the result.
   * @tparam KERNEL integration kernel type, passed on to Integrator1DCartesianTBB.
   */
  template <typename NT, typename KERNEL> class Integrator1DCartesianGPU : public Integrator1DCartesianTBB<NT, KERNEL>
  {
  public:
    /// Numerical type to be used for integration tasks, e.g. the argument or possible jacobians.
    using ctype = typename get_type::ctype<NT>;

    /**
     * @brief Construct the integrator from a one-element grid-size array.
     *
     * @param quadrature_provider forwarded to the base class.
     * @param grid_size one-element array; its single entry is forwarded to the base class.
     * @param x_extent forwarded to the base class.
     * @param max_block_size ignored.
     * @param qx_min lower bound of the integration range, forwarded to the base class.
     * @param qx_max upper bound of the integration range, forwarded to the base class.
     */
    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array<uint, 1> grid_size,
                             const ctype x_extent, const uint max_block_size = 256, const ctype qx_min = -M_PI,
                             const ctype qx_max = M_PI)
        : Integrator1DCartesianTBB<NT, KERNEL>(quadrature_provider, grid_size[0], x_extent, qx_min, qx_max)
    {
      (void)max_block_size;
    }

    /**
     * @brief Construct the integrator from a scalar grid size.
     *
     * @param quadrature_provider forwarded to the base class.
     * @param grid_size number of quadrature nodes, forwarded to the base class.
     * @param x_extent forwarded to the base class.
     * @param max_block_size ignored.
     * @param qx_min lower bound of the integration range, forwarded to the base class.
     * @param qx_max upper bound of the integration range, forwarded to the base class.
     */
    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const uint grid_size, const ctype x_extent,
                             const uint max_block_size = 256, const ctype qx_min = -M_PI, const ctype qx_max = M_PI)
        // Forward exactly the argument list used by the array overload above; x_extent must be passed only once,
        // otherwise it would take the place of qx_min (or fail to match any base-class constructor).
        : Integrator1DCartesianTBB<NT, KERNEL>(quadrature_provider, grid_size, x_extent, qx_min, qx_max)
    {
      (void)max_block_size;
    }

    /**
     * @brief Construct the integrator from a one-element grid-size array and a JSON configuration.
     *
     * @param quadrature_provider forwarded to the base class.
     * @param grid_size forwarded to the base class.
     * @param x_extent forwarded to the base class.
     * @param json forwarded to the base class.
     */
    Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array<uint, 1> grid_size,
                             const ctype x_extent, const JSONValue &json)
        : Integrator1DCartesianTBB<NT, KERNEL>(quadrature_provider, grid_size, x_extent, json)
    {
    }
  };

} // namespace DiFfRG


#endif


#endif

DiFfRG::Integrator1DCartesianGPU
Integration of an arbitrary 1D function from qx_min to qx_max using CUDA.
Definition integrator_1D_cartesian_gpu.hh:28

DiFfRG::Integrator1DCartesianGPU::ptr_x_quadrature_p
const ctype * ptr_x_quadrature_p
Definition integrator_1D_cartesian_gpu.hh:201

DiFfRG::Integrator1DCartesianGPU::grid_size
const uint grid_size
Definition integrator_1D_cartesian_gpu.hh:196

DiFfRG::Integrator1DCartesianGPU::ctype
typename get_type::ctype< NT > ctype
Numerical type to be used for integration tasks e.g. the argument or possible jacobians.
Definition integrator_1D_cartesian_gpu.hh:33

DiFfRG::Integrator1DCartesianGPU::Integrator1DCartesianGPU
Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array< uint, 1 > grid_size, const JSONValue &json)
Construct a new Integrator1DCartesianGPU object.
Definition integrator_1D_cartesian_gpu.hh:93

DiFfRG::Integrator1DCartesianGPU::ptr_x_quadrature_w
const ctype * ptr_x_quadrature_w
Definition integrator_1D_cartesian_gpu.hh:202

DiFfRG::Integrator1DCartesianGPU::request
std::future< NT > request(const ctype k, const T &...t) const
Get the result of the integration asynchronously.
Definition integrator_1D_cartesian_gpu.hh:190

DiFfRG::Integrator1DCartesianGPU::Integrator1DCartesianGPU
Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array< uint, 1 > grid_size, const ctype x_extent=0., const uint max_block_size=0, const ctype qx_min=-M_PI, const ctype qx_max=M_PI)
Construct a new Integrator1DCartesianGPU object.
Definition integrator_1D_cartesian_gpu.hh:79

DiFfRG::Integrator1DCartesianGPU::qx_min
ctype qx_min
Definition integrator_1D_cartesian_gpu.hh:198

DiFfRG::Integrator1DCartesianGPU::set_qx_min
void set_qx_min(const ctype qx_min)
Set the minimum value of the qx integration range.
Definition integrator_1D_cartesian_gpu.hh:153

DiFfRG::Integrator1DCartesianGPU::Integrator1DCartesianGPU
Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const uint grid_size, const ctype x_extent=0., const ctype qx_min=-M_PI, const ctype qx_max=M_PI)
Construct a new Integrator1DCartesianGPU object.
Definition integrator_1D_cartesian_gpu.hh:126

DiFfRG::Integrator1DCartesianGPU::qx_extent
ctype qx_extent
Definition integrator_1D_cartesian_gpu.hh:199

DiFfRG::Integrator1DCartesianGPU::Integrator1DCartesianGPU
Integrator1DCartesianGPU(QuadratureProvider &quadrature_provider, const std::array< uint, 1 > grid_size, const ctype x_extent, const JSONValue &json)
Construct a new Integrator1DCartesianGPU object.
Definition integrator_1D_cartesian_gpu.hh:109

DiFfRG::Integrator1DCartesianGPU::Integrator1DCartesianGPU
Integrator1DCartesianGPU(const Integrator1DCartesianGPU &other)
Construct a copy of an existing Integrator1DCartesianGPU object.
Definition integrator_1D_cartesian_gpu.hh:142

DiFfRG::Integrator1DCartesianGPU::get
NT get(const ctype k, const T &...t) const
Get the result of the integration.
Definition integrator_1D_cartesian_gpu.hh:172

DiFfRG::Integrator1DCartesianGPU::set_qx_max
void set_qx_max(const ctype qx_max)
Set the maximum value of the qx integration range.
Definition integrator_1D_cartesian_gpu.hh:162

DiFfRG::JSONValue
A wrapper around the boost json value class.
Definition json.hh:19

DiFfRG::QuadratureProvider
A class that provides quadrature points and weights, in host and device memory. The quadrature points...
Definition quadrature_provider.hh:139

DiFfRG::QuadratureProvider::get_device_weights
const NT * get_device_weights(const size_t order, const int device=0, const QuadratureType type=QuadratureType::legendre)
Get the device-side quadrature weights for a quadrature of size quadrature_size.
Definition quadrature_provider.hh:211

DiFfRG::QuadratureProvider::get_device_points
const NT * get_device_points(const size_t order, const int device=0, const QuadratureType type=QuadratureType::legendre)
Get the device-side quadrature points for a quadrature of size quadrature_size.
Definition quadrature_provider.hh:198

cuda_prefix.hh

integrator_1D_cartesian_cpu.hh

DiFfRG::get_type::ctype
typename internal::_ctype< CT >::value ctype
Definition types.hh:106

DiFfRG
Definition complex_math.hh:14

DiFfRG::powr
constexpr __forceinline__ __host__ __device__ NumberType powr(const NumberType x)
A compile-time evaluatable power function for whole number exponents.
Definition math.hh:45

DiFfRG::uint
unsigned int uint
Definition utils.hh:22

quadrature_provider.hh

DiFfRG::Integrator1DCartesianGPU::functor
Custom functor for the thrust::transform_reduce function.
Definition integrator_1D_cartesian_gpu.hh:40

DiFfRG::Integrator1DCartesianGPU::functor::t
const std::tuple< T... > t
Definition integrator_1D_cartesian_gpu.hh:66

DiFfRG::Integrator1DCartesianGPU::functor::k
const ctype k
Definition integrator_1D_cartesian_gpu.hh:65

DiFfRG::Integrator1DCartesianGPU::functor::qx_extent
const ctype qx_extent
Definition integrator_1D_cartesian_gpu.hh:64

DiFfRG::Integrator1DCartesianGPU::functor::x_quadrature_w
const ctype * x_quadrature_w
Definition integrator_1D_cartesian_gpu.hh:63

DiFfRG::Integrator1DCartesianGPU::functor::qx_min
const ctype qx_min
Definition integrator_1D_cartesian_gpu.hh:64

DiFfRG::Integrator1DCartesianGPU::functor::x_quadrature_p
const ctype * x_quadrature_p
Definition integrator_1D_cartesian_gpu.hh:62

DiFfRG::Integrator1DCartesianGPU::functor::operator()
__device__ NT operator()(const uint idx) const
Definition integrator_1D_cartesian_gpu.hh:49

DiFfRG::Integrator1DCartesianGPU::functor::functor
functor(const ctype *x_quadrature_p, const ctype *x_quadrature_w, const ctype qx_min, const ctype qx_extent, const ctype k, T... t)
Definition integrator_1D_cartesian_gpu.hh:42