Namespaces | |
namespace | Launch |
Functions | |
__global__ void | set (Tree *tree, integer *count, integer *start, integer *child, integer *sorted, integer *index, integer *toDeleteLeaf, integer *toDeleteNode, real *minX, real *maxX) |
Kernel call to setter. More... | |
__global__ void | info (Tree *tree, Particles *particles, integer n, integer m) |
Info Kernel for tree class (for debugging purposes) More... | |
__global__ void | info (Tree *tree, Particles *particles) |
__global__ void | testTree (Tree *tree, Particles *particles, integer n, integer m) |
__global__ void | set (Tree *tree, integer *count, integer *start, integer *child, integer *sorted, integer *index, integer *toDeleteLeaf, integer *toDeleteNode, real *minX, real *maxX, real *minY, real *maxY) |
Kernel call to setter. More... | |
__global__ void | set (Tree *tree, integer *count, integer *start, integer *child, integer *sorted, integer *index, integer *toDeleteLeaf, integer *toDeleteNode, real *minX, real *maxX, real *minY, real *maxY, real *minZ, real *maxZ) |
__global__ void | sumParticles (Tree *tree) |
Kernel call to sum particles within tree. More... | |
__global__ void | buildTree (Tree *tree, Particles *particles, integer n, integer m) |
Kernel to construct the tree using the particles within particles More... | |
__global__ void | prepareSorting (Tree *tree, Particles *particles, integer n, integer m) |
__global__ void | calculateCentersOfMass (Tree *tree, Particles *particles, integer n, integer level) |
Compute center of masses (level wise). More... | |
__global__ void | computeBoundingBox (Tree *tree, Particles *particles, integer *mutex, integer n, integer blockSize) |
Kernel to compute the bounding box/borders of the tree or rather the particles within the tree. More... | |
__global__ void | centerOfMass (Tree *tree, Particles *particles, integer n) |
__global__ void | sort (Tree *tree, integer n, integer m) |
Kernel to sort tree/child indices to optimize cache efficiency. More... | |
__global__ void | getParticleKeys (Tree *tree, Particles *particles, keyType *keys, integer maxLevel, integer n, Curve::Type curveType=Curve::lebesgue) |
Kernel to get all particle's keys. More... | |
__global__ void | globalCOM (Tree *tree, Particles *particles, real com[DIM]) |
Compute center of mass for all particles. More... | |
__global__ void TreeNS::Kernel::buildTree | ( | Tree * | tree, |
Particles * | particles, | ||
integer | n, | ||
integer | m | ||
) |
Kernel to construct the tree using the particles within particles
Corresponding wrapper function: TreeNS::Kernel::Launch::buildTree()
The algorithm shows an iterative tree construction algorithm utilizing lightweight locks for leaf nodes to avoid race conditions. Particles are assigned to threads, those threads insert its body by traversing the tree from root to the correct node trying to lock the corresponding child pointer via the array index "-2" using atomic operations. If the locking is successful the particle is inserted into the tree, releasing the lock and executing a memory fence to ensure visibility for the other threads. If a particle is already stored at the desired node, a new cell is automatically generated or rather requested and the old and new body are inserted correspondingly. However, if the locking is not successful, the thread need to try again until accomplishing the task. This approach is very similar to the one presented in An Efficient CUDA Implementation of the Tree-Based Barnes Hut n-Body Algorithm.
tree | Tree class target instance |
particles | Particles class instance/particles to be inserted in tree |
n | number of particles |
m | number of potential particles to be inserted (needed for start index of nodes) |
Definition at line 768 of file tree.cu.
__global__ void TreeNS::Kernel::calculateCentersOfMass | ( | Tree * | tree, |
Particles * | particles, | ||
integer | n, | ||
integer | level | ||
) |
Compute center of masses (level wise).
The local COM computation kernel is called iteratively starting with the deepest tree level and finishing at the root. The pseudo-particles children entries are weighted to derive the COM, their masses are accumulated and finally the position is normalized by dividing through the summed mass.
tree | Tree class instance |
particles | Particle class instance |
n | Number of particles |
level | Current (relevant) tree level |
Definition at line 1416 of file tree.cu.
__global__ void TreeNS::Kernel::computeBoundingBox | ( | Tree * | tree, |
Particles * | particles, | ||
integer * | mutex, | ||
integer | n, | ||
integer | blockSize | ||
) |
Kernel to compute the bounding box/borders of the tree or rather the particles within the tree.
Corresponding wrapper function: TreeNS::Kernel::Launch::computeBoundingBox()
The algorithm to compute the bounding box is basically a parallel reduction primitive to derive the minimum and maximum for each coordinate axis.
tree | Tree class target instance |
particles | Particles class instance/particles within the tree |
mutex | mutex/lock |
n | number of particles |
blockSize | device block size |
Definition at line 302 of file tree.cu.
__global__ void TreeNS::Kernel::getParticleKeys | ( | Tree * | tree, |
Particles * | particles, | ||
keyType * | keys, | ||
integer | maxLevel, | ||
integer | n, | ||
Curve::Type | curveType = Curve::lebesgue |
||
) |
Kernel to get all particle's keys.
Corresponding wrapper function: TreeNS::Kernel::Launch::getParticleKeys()
Compute center of mass for all particles.
Corresponding wrapper function: TreeNS::Kernel::Launch::globalCOM()
[in] | tree | Tree class instance |
[in] | particles | Particle class instance |
[out] | com | Center of mass |
Definition at line 1645 of file tree.cu.
Info Kernel for tree class (for debugging purposes)
Corresponding wrapper function: TreeNS::Kernel::Launch::info()
tree | |
n | |
m |
__global__ void TreeNS::Kernel::set | ( | Tree * | tree, |
integer * | count, | ||
integer * | start, | ||
integer * | child, | ||
integer * | sorted, | ||
integer * | index, | ||
integer * | toDeleteLeaf, | ||
integer * | toDeleteNode, | ||
real * | minX, | ||
real * | maxX | ||
) |
Kernel call to setter.
Corresponding wrapper function: TreeNS::Kernel::Launch::set()
tree | Tree class instance (to be constructed) |
count | |
start | |
child | |
sorted | |
index | |
toDeleteLeaf | |
toDeleteNode | |
minX | |
maxX |
Kernel to sort tree/child indices to optimize cache efficiency.
Corresponding wrapper function: TreeNS::Kernel::Launch::sort()
tree | Tree class instance |
n | |
m |
__global__ void TreeNS::Kernel::sumParticles | ( | Tree * | tree | ) |
Kernel call to sum particles within tree.
Corresponding wrapper function: TreeNS::Kernel::Launch::sumParticles()
tree | target tree instance |
Definition at line 440 of file tree.cu.