1#include "../../include/processing/kernels.cuh"
2#include "../../include/cuda_utils/cuda_launcher.cuh"
10 int bodyIndex = threadIdx.x + blockIdx.x * blockDim.x;
11 int stride = blockDim.x * gridDim.x;
17 while ((bodyIndex + offset) < n) {
20 r =
cuda::math::sqrt(particles->
x[bodyIndex + offset] * particles->
x[bodyIndex + offset]);
22 r =
cuda::math::sqrt(particles->
x[bodyIndex + offset] * particles->
x[bodyIndex + offset] +
23 particles->
y[bodyIndex + offset] * particles->
y[bodyIndex + offset]);
25 r =
cuda::math::sqrt(particles->
x[bodyIndex + offset] * particles->
x[bodyIndex + offset] +
26 particles->
y[bodyIndex + offset] * particles->
y[bodyIndex + offset] +
27 particles->
z[bodyIndex + offset] * particles->
z[bodyIndex + offset]);
30 index = (int) (r / deltaRadial);
31 atomicAdd(&particlesWithin[index], 1);
42 int bodyIndex = threadIdx.x + blockIdx.x * blockDim.x;
43 int stride = blockDim.x * gridDim.x;
49 while ((bodyIndex + offset) < n) {
52 r =
cuda::math::sqrt(particles->
x[bodyIndex + offset] * particles->
x[bodyIndex + offset]);
54 r =
cuda::math::sqrt(particles->
x[bodyIndex + offset] * particles->
x[bodyIndex + offset] +
55 particles->
y[bodyIndex + offset] * particles->
y[bodyIndex + offset]);
57 r =
cuda::math::sqrt(particles->
x[bodyIndex + offset] * particles->
x[bodyIndex + offset] +
58 particles->
y[bodyIndex + offset] * particles->
y[bodyIndex + offset] +
59 particles->
z[bodyIndex + offset] * particles->
z[bodyIndex + offset]);
62 index = (int) (r / deltaRadial);
64 if (particlesWithin[index] > 0) {
65 output[index] += input[bodyIndex + offset] / particlesWithin[index];
83 cuda::launch(
false, executionPolicy, ::Processing::Kernel::cartesianToRadial<T>, particles, particlesWithin, input, output, deltaRadial, n);
Execution policy/instruction for CUDA kernel execution.
Particle(s) class based on SoA (Structur of Arrays).
real * x
(pointer to) x position (array)
real * y
(pointer to) y position (array)
real * z
(pointer to) z position (array)
void cartesianToRadial(Particles *particles, int *particlesWithin, T *input, T *output, real deltaRadial, int n)
Wrapper for Processing::Kernel::cartesianToRadial().
template void cartesianToRadial< real >(Particles *particles, int *particlesWithin, real *input, real *output, real deltaRadial, int n)
void particlesWithinRadii(Particles *particles, int *particlesWithin, real deltaRadial, int n)
Wrapper for Processing::Kernel::particlesWithinRadii().
__global__ void cartesianToRadial(Particles *particles, int *particlesWithin, T *input, T *output, real deltaRadial, int n)
Convert cartesian to radial.
__global__ void particlesWithinRadii(Particles *particles, int *particlesWithin, real deltaRadial, int n)
Particles within radius/radii.
__device__ real sqrt(real a)
Square root of a floating point value.
real launch(bool timeKernel, const ExecutionPolicy &policy, void(*f)(Arguments...), Arguments... args)
CUDA execution wrapper function.