12#ifndef MILUPHPC_TREE_CUH
13#define MILUPHPC_TREE_CUH
15#include "../cuda_utils/cuda_utilities.cuh"
16#include "../parameter.h"
17#include "../particles.cuh"
40 const unsigned char DirTable[12][8] =
41 {{8, 10, 3, 3, 4, 5, 4, 5},
42 {2, 2, 11, 9, 4, 5, 4, 5},
43 {7, 6, 7, 6, 8, 10, 1, 1},
44 {7, 6, 7, 6, 0, 0, 11, 9},
45 {0, 8, 1, 11, 6, 8, 6, 11},
46 {10, 0, 9, 1, 10, 7, 9, 7},
47 {10, 4, 9, 4, 10, 2, 9, 3},
48 {5, 8, 5, 11, 2, 8, 3, 11},
49 {4, 9, 0, 0, 7, 9, 2, 2},
50 {1, 1, 8, 5, 3, 3, 8, 6},
51 {11, 5, 0, 0, 11, 6, 2, 2},
52 {1, 1, 4, 10, 3, 3, 7, 10}};
54 __device__
const unsigned char DirTable[12][8] =
55 {{8, 10, 3, 3, 4, 5, 4, 5},
56 {2, 2, 11, 9, 4, 5, 4, 5},
57 {7, 6, 7, 6, 8, 10, 1, 1},
58 {7, 6, 7, 6, 0, 0, 11, 9},
59 {0, 8, 1, 11, 6, 8, 6, 11},
60 {10, 0, 9, 1, 10, 7, 9, 7},
61 {10, 4, 9, 4, 10, 2, 9, 3},
62 {5, 8, 5, 11, 2, 8, 3, 11},
63 {4, 9, 0, 0, 7, 9, 2, 2},
64 {1, 1, 8, 5, 3, 3, 8, 6},
65 {11, 5, 0, 0, 11, 6, 2, 2},
66 {1, 1, 4, 10, 3, 3, 7, 10}};
83 const unsigned char HilbertTable[12][8] = {{0, 7, 3, 4, 1, 6, 2, 5},
84 {4, 3, 7, 0, 5, 2, 6, 1},
85 {6, 1, 5, 2, 7, 0, 4, 3},
86 {2, 5, 1, 6, 3, 4, 0, 7},
87 {0, 1, 7, 6, 3, 2, 4, 5},
88 {6, 7, 1, 0, 5, 4, 2, 3},
89 {2, 3, 5, 4, 1, 0, 6, 7},
90 {4, 5, 3, 2, 7, 6, 0, 1},
91 {0, 3, 1, 2, 7, 4, 6, 5},
92 {2, 1, 3, 0, 5, 6, 4, 7},
93 {4, 7, 5, 6, 3, 0, 2, 1},
94 {6, 5, 7, 4, 1, 2, 0, 3}};
96 __device__
const unsigned char HilbertTable[12][8] = {{0, 7, 3, 4, 1, 6, 2, 5},
97 {4, 3, 7, 0, 5, 2, 6, 1},
98 {6, 1, 5, 2, 7, 0, 4, 3},
99 {2, 5, 1, 6, 3, 4, 0, 7},
100 {0, 1, 7, 6, 3, 2, 4, 5},
101 {6, 7, 1, 0, 5, 4, 2, 3},
102 {2, 3, 5, 4, 1, 0, 6, 7},
103 {4, 5, 3, 2, 7, 6, 0, 1},
104 {0, 3, 1, 2, 7, 4, 6, 5},
105 {2, 1, 3, 0, 5, 6, 4, 7},
106 {4, 7, 5, 6, 3, 0, 2, 1},
107 {6, 5, 7, 4, 1, 2, 0, 3}};
653 integer blockSize,
bool time=
false);
681namespace UnitTesting {
Particle(s) class based on SoA (Structur of Arrays).
CUDA_CALLABLE_MEMBER void reset(integer index, integer n)
Reset (specific) entries.
integer * index
index used for counting nodes
real * minZ
bounding box minimal z
integer * child
children/child nodes or leaves (beneath)
CUDA_CALLABLE_MEMBER keyType getParticleKey(Particles *particles, integer index, integer maxLevel, Curve::Type curveType=Curve::lebesgue)
Get SFC key of a particle.
real * maxX
bounding box maximal x
integer * sorted
sorted (indices) for better cache performance
integer * count
accumulated nodes/leaves beneath
CUDA_CALLABLE_MEMBER integer sumParticles()
Sum particles in tree.
integer * toDeleteNode
buffer for remembering old indices for rebuilding tree
CUDA_CALLABLE_MEMBER ~Tree()
Destructor.
CUDA_CALLABLE_MEMBER Tree()
Default constructor.
real * minX
bounding box minimal x
integer * start
TODO: describe start.
integer * toDeleteLeaf
buffer for remembering old indices for rebuilding tree
CUDA_CALLABLE_MEMBER integer getTreeLevel(Particles *particles, integer index, integer maxLevel, Curve::Type curveType=Curve::lebesgue)
Get tree level for a (specific) particle.
CUDA_CALLABLE_MEMBER void set(integer *count, integer *start, integer *child, integer *sorted, integer *index, integer *toDeleteLeaf, integer *toDeleteNode, real *minX, real *maxX)
Setter, passing pointer to member variables.
real * maxY
bounding box maximal y
real * minY
bounding box minimal y
real * maxZ
bounding box maximal z
#define CUDA_CALLABLE_MEMBER
Key (keyType) related functions and kernels.
const unsigned char HilbertTable[12][8]
Table needed to convert from Lebesgue to Hilbert keys.
DIM
Table needed to convert from Lebesgue to Hilbert keys.
CUDA_CALLABLE_MEMBER keyType lebesgue2hilbert(keyType lebesgue, integer maxLevel)
Convert a Lebesgue key to a Hilbert key.
real calculateCentersOfMass(Tree *tree, Particles *particles, integer n, integer level, bool time=false)
real prepareSorting(Tree *tree, Particles *particles, integer n, integer m)
real sort(Tree *tree, integer n, integer m, bool time=false)
Wrapper for TreeNS::Kernel::sort()
real centerOfMass(Tree *tree, Particles *particles, integer n, bool time=false)
Wrapper for TreeNS::Kernel::centerOfMass()
real sumParticles(Tree *tree)
Wrapper for TreeNS::Kernel::sumParticles()
real globalCOM(Tree *tree, Particles *particles, real com[DIM])
Wrapper for TreeNS::Kernel::globalCOM()
real testTree(Tree *tree, Particles *particles, integer n, integer m)
real computeBoundingBox(Tree *tree, Particles *particles, integer *mutex, integer n, integer blockSize, bool time=false)
Wrapper for TreeNS::Kernel::computeBoundingBox()
void set(Tree *tree, integer *count, integer *start, integer *child, integer *sorted, integer *index, integer *toDeleteLeaf, integer *toDeleteNode, real *minX, real *maxX)
Wrapper for TreeNS::Kernel::set()
real getParticleKeys(Tree *tree, Particles *particles, keyType *keys, integer maxLevel, integer n, Curve::Type curveType=Curve::lebesgue, bool time=false)
Wrapper for TreeNS::Kernel::getParticleKeys()
real info(Tree *tree, Particles *particles, integer n, integer m)
Wrapper for TreeNS::Kernel::Launch::info()
real buildTree(Tree *tree, Particles *particles, integer n, integer m, bool time=false)
Wrapper for TreeNS::Kernel::buildTree()
__global__ void prepareSorting(Tree *tree, Particles *particles, integer n, integer m)
__global__ void set(Tree *tree, integer *count, integer *start, integer *child, integer *sorted, integer *index, integer *toDeleteLeaf, integer *toDeleteNode, real *minX, real *maxX)
Kernel call to setter.
__global__ void testTree(Tree *tree, Particles *particles, integer n, integer m)
__global__ void info(Tree *tree, Particles *particles, integer n, integer m)
Info Kernel for tree class (for debugging purposes)
__global__ void getParticleKeys(Tree *tree, Particles *particles, keyType *keys, integer maxLevel, integer n, Curve::Type curveType=Curve::lebesgue)
Kernel to get all particle's keys.
__global__ void computeBoundingBox(Tree *tree, Particles *particles, integer *mutex, integer n, integer blockSize)
Kernel to compute the bounding box/borders of the tree or rather the particles within the tree.
__global__ void calculateCentersOfMass(Tree *tree, Particles *particles, integer n, integer level)
Compute center of masses (level wise).
__global__ void sumParticles(Tree *tree)
Kernel call to sum particles within tree.
__global__ void sort(Tree *tree, integer n, integer m)
Kernel to sort tree/child indices to optimize cache efficiency.
__global__ void buildTree(Tree *tree, Particles *particles, integer n, integer m)
Kernel to construct the tree using the particles within particles
__global__ void globalCOM(Tree *tree, Particles *particles, real com[DIM])
Compute center of mass for all particles.
__global__ void centerOfMass(Tree *tree, Particles *particles, integer n)