milupHPC/kernels_8cu_source.html

#include "../../include/processing/kernels.cuh"

#include "../../include/cuda_utils/cuda_launcher.cuh"


namespace Processing {


    namespace Kernel {


        /**
         * Count particles per radial bin (histogram over the distance to the origin).
         *
         * Each thread walks the particle indices below `n` in a grid-stride loop.
         * For every visited particle the Euclidean distance to the origin is
         * computed from the position components selected by `DIM` (x only, x/y,
         * or x/y/z), divided by `deltaRadial` and truncated to an integer bin
         * index; the counter of that bin is then incremented atomically.
         *
         * @param particles particle data providing the position arrays x (, y, z)
         * @param particlesWithin per-bin counters, incremented with atomicAdd
         * @param deltaRadial radial width of a single bin
         * @param n number of particles to process
         *
         * NOTE(review): the bin index is not range-checked here; presumably the
         * caller sizes (and zeroes) particlesWithin for the largest radius - confirm.
         */
        __global__ void particlesWithinRadii(Particles *particles, int *particlesWithin, real deltaRadial, int n) {

            const int firstParticle = threadIdx.x + blockIdx.x * blockDim.x;
            const int gridStep = blockDim.x * gridDim.x;

            for (int i = firstParticle; i < n; i += gridStep) {

                // distance of particle i to the origin
#if DIM == 1
                const real px = particles->x[i];
                const real radius = cuda::math::sqrt(px * px);
#elif DIM == 2
                const real px = particles->x[i];
                const real py = particles->y[i];
                const real radius = cuda::math::sqrt(px * px + py * py);
#else
                const real px = particles->x[i];
                const real py = particles->y[i];
                const real pz = particles->z[i];
                const real radius = cuda::math::sqrt(px * px + py * py + pz * pz);
#endif

                // truncate to the radial bin and count the particle there;
                // atomic because several threads may hit the same bin
                const int bin = (int) (radius / deltaRadial);
                atomicAdd(&particlesWithin[bin], 1);
            }
        }


        /**
         * Convert a per-particle quantity into a radially binned average.
         *
         * Each thread walks the particle indices below `n` in a grid-stride loop.
         * For every visited particle the Euclidean distance to the origin is
         * computed from the position components selected by `DIM`, divided by
         * `deltaRadial` and truncated to an integer bin index. If the bin holds at
         * least one particle according to `particlesWithin`, the particle's
         * `input` value divided by that count is added to `output[bin]`.
         *
         * The accumulation uses atomicAdd: many particles (and therefore many
         * threads) map to the same bin, so a plain `+=` would be a data race and
         * lose contributions.
         *
         * @tparam T value type; must be a type atomicAdd is overloaded for
         *           (atomicAdd on double requires compute capability 6.0+)
         * @param particles particle data providing the position arrays x (, y, z)
         * @param particlesWithin per-bin particle counts (only read here)
         * @param input per-particle values, indexed like the particle arrays
         * @param output per-bin accumulators, indexed by radial bin
         * @param deltaRadial radial width of a single bin
         * @param n number of particles to process
         *
         * NOTE(review): presumably particlesWithin was filled by
         * particlesWithinRadii with the same deltaRadial and output was zeroed
         * by the caller - confirm. The bin index is not range-checked here.
         */
        template<typename T>
        __global__ void
        cartesianToRadial(Particles *particles, int *particlesWithin, T *input, T *output, real deltaRadial, int n) {

            const int firstParticle = threadIdx.x + blockIdx.x * blockDim.x;
            const int gridStep = blockDim.x * gridDim.x;

            for (int i = firstParticle; i < n; i += gridStep) {

                // distance of particle i to the origin
#if DIM == 1
                const real radius = cuda::math::sqrt(particles->x[i] * particles->x[i]);
#elif DIM == 2
                const real radius = cuda::math::sqrt(particles->x[i] * particles->x[i] +
                                                     particles->y[i] * particles->y[i]);
#else
                const real radius = cuda::math::sqrt(particles->x[i] * particles->x[i] +
                                                     particles->y[i] * particles->y[i] +
                                                     particles->z[i] * particles->z[i]);
#endif

                const int bin = (int) (radius / deltaRadial);

                // read the bin population once; skip empty bins to avoid dividing by zero
                const int binCount = particlesWithin[bin];
                if (binCount > 0) {
                    const T contribution = input[i] / binCount;
                    // atomic read-modify-write: several threads may update the same bin
                    atomicAdd(&output[bin], contribution);
                }
            }
        }


        namespace Launch {

            /**
             * Host-side wrapper launching Processing::Kernel::particlesWithinRadii().
             *
             * The kernel is started through cuda::launch with a default-constructed
             * ExecutionPolicy and kernel timing disabled; the value returned by
             * cuda::launch is discarded.
             *
             * @param particles particle data forwarded to the kernel
             * @param particlesWithin per-bin counters forwarded to the kernel
             * @param deltaRadial radial bin width forwarded to the kernel
             * @param n number of particles forwarded to the kernel
             */
            void particlesWithinRadii(Particles *particles, int *particlesWithin, real deltaRadial, int n) {
                ExecutionPolicy launchPolicy;
                // first argument (timeKernel) is false: no timing requested
                cuda::launch(false, launchPolicy, ::Processing::Kernel::particlesWithinRadii,
                             particles, particlesWithin, deltaRadial, n);
            }


            /**
             * Host-side wrapper launching Processing::Kernel::cartesianToRadial<T>().
             *
             * The kernel is started through cuda::launch with a default-constructed
             * ExecutionPolicy and kernel timing disabled; the value returned by
             * cuda::launch is discarded.
             *
             * @tparam T value type of the input and output arrays
             * @param particles particle data forwarded to the kernel
             * @param particlesWithin per-bin particle counts forwarded to the kernel
             * @param input per-particle values forwarded to the kernel
             * @param output per-bin results forwarded to the kernel
             * @param deltaRadial radial bin width forwarded to the kernel
             * @param n number of particles forwarded to the kernel
             */
            template<typename T>
            void cartesianToRadial(Particles *particles, int *particlesWithin, T *input, T *output, real deltaRadial, int n) {
                ExecutionPolicy launchPolicy;
                // first argument (timeKernel) is false: no timing requested
                cuda::launch(false, launchPolicy, ::Processing::Kernel::cartesianToRadial<T>,
                             particles, particlesWithin, input, output, deltaRadial, n);
            }

            // Explicit instantiation for T = real, so the template defined in this
            // translation unit is emitted for that type.
            template void cartesianToRadial<real>(Particles *particles, int *particlesWithin, real *input, real *output, real deltaRadial, int n);

        }


    }

}

ExecutionPolicy
Execution policy/instruction for CUDA kernel execution.
Definition: cuda_launcher.cuh:33

Particles
Particle(s) class based on SoA (Structure of Arrays).
Definition: particles.cuh:50

Particles::x
real * x
(pointer to) x position (array)
Definition: particles.cuh:62

Particles::y
real * y
(pointer to) y position (array)
Definition: particles.cuh:70

Particles::z
real * z
(pointer to) z position (array)
Definition: particles.cuh:78

Kernel
Definition: device_rhs.cuh:7

Processing::Kernel::Launch::cartesianToRadial
void cartesianToRadial(Particles *particles, int *particlesWithin, T *input, T *output, real deltaRadial, int n)
Wrapper for Processing::Kernel::cartesianToRadial().
Definition: kernels.cu:81

Processing::Kernel::Launch::cartesianToRadial< real >
template void cartesianToRadial< real >(Particles *particles, int *particlesWithin, real *input, real *output, real deltaRadial, int n)

Processing::Kernel::Launch::particlesWithinRadii
void particlesWithinRadii(Particles *particles, int *particlesWithin, real deltaRadial, int n)
Wrapper for Processing::Kernel::particlesWithinRadii().
Definition: kernels.cu:75

Processing::Kernel::cartesianToRadial
__global__ void cartesianToRadial(Particles *particles, int *particlesWithin, T *input, T *output, real deltaRadial, int n)
Convert cartesian to radial.
Definition: kernels.cu:40

Processing::Kernel::particlesWithinRadii
__global__ void particlesWithinRadii(Particles *particles, int *particlesWithin, real deltaRadial, int n)
Particles within radius/radii.
Definition: kernels.cu:8

Processing
Definition: kernels.cuh:19

cuda::math::sqrt
__device__ real sqrt(real a)
Square root of a floating point value.
Definition: cuda_utilities.cu:456

cuda::launch
real launch(bool timeKernel, const ExecutionPolicy &policy, void(*f)(Arguments...), Arguments... args)
CUDA execution wrapper function.
Definition: cuda_launcher.cuh:114

real
double real
Definition: parameter.h:15