Memory saving opportunities for lage KDTrees

This commit is contained in:
Guilhem Lavaux 2014-05-30 17:11:49 +02:00
parent 113a14e00c
commit f0a951e38d
4 changed files with 33 additions and 10 deletions

View file

@ -2,6 +2,7 @@ SET(tolink ${GSL_LIBRARIES} CosmoTool ${CosmoTool_LIBS})
include_directories(${CMAKE_SOURCE_DIR}/src)
include_directories(${FFTW3_INCLUDE_DIRS}
${EIGEN3_INCLUDE_DIRS} ${NETCDF_INCLUDE_PATH} ${GSL_INCLUDE_PATH})
include_directories(${CMAKE_SOURCE_DIR}/sample)
IF(SHARP_INCLUDE_PATH)
include_directories(BEFORE ${SHARP_INCLUDE_PATH})

View file

@ -1,3 +1,4 @@
#include "omptl/algorithm"
#include <cassert>
#include "yorick.hpp"
#include "sphSmooth.hpp"
@ -106,7 +107,7 @@ int main(int argc, char **argv)
array3_type out_den_1(boost::extents[Nres][Nres][Nres]);
array4_type out_v3d_1(boost::extents[Nres][Nres][Nres][3]);
array3_type out_rad_1(boost::extents[Nres][Nres][Nres]);
// array3_type out_rad_1(boost::extents[Nres][Nres][Nres]);
cout << "Weighing..." << endl;
@ -174,7 +175,7 @@ int main(int argc, char **argv)
out_v3d_1[rx][ry][rz][1] = 0;
out_v3d_1[rx][ry][rz][2] = 0;
out_den_1[rx][ry][rz] = 0;
out_rad_1[rx][ry][rz] = -1;
//out_rad_1[rx][ry][rz] = -1;
continue;
}
@ -184,9 +185,7 @@ int main(int argc, char **argv)
else
smooth1.fetchNeighbours(c);
float val;
out_rad_1[rx][ry][rz] = smooth1.getSmoothingLen();
//out_rad_1[rx][ry][rz] = smooth1.getSmoothingLen();
out_v3d_1[rx][ry][rz][0] = smooth1.computeSmoothedValue(c, getVelocity<0>);
out_v3d_1[rx][ry][rz][1] = smooth1.computeSmoothedValue(c, getVelocity<1>);
out_v3d_1[rx][ry][rz][2] = smooth1.computeSmoothedValue(c, getVelocity<2>);
@ -196,7 +195,7 @@ int main(int argc, char **argv)
}
}
hdf5_write_array(out_f, "radii", out_rad_1);
//hdf5_write_array(out_f, "radii", out_rad_1);
hdf5_write_array(out_f, "velocity", out_v3d_1);
hdf5_write_array(out_f, "density", out_den_1);

View file

@ -40,6 +40,10 @@ knowledge of the CeCILL license and that you accept its terms.
#include "config.hpp"
#include "bqueue.hpp"
#ifndef __KD_TREE_ACTIVE_CELLS
#define __KD_TREE_ACTIVE_CELLS 1
#endif
namespace CosmoTool {
template<int N, typename CType = ComputePrecision>
@ -52,7 +56,9 @@ namespace CosmoTool {
template<int N, typename ValType, typename CType = ComputePrecision>
struct KDCell
{
#if __KD_TREE_ACTIVE_CELLS == 1
bool active;
#endif
ValType val;
typename KDDef<N,CType>::KDCoordinates coord;
};

View file

@ -184,7 +184,9 @@ namespace CosmoTool {
int axis = level % N;
CoordType d2 = 0;
#if __KD_TREE_ACTIVE_CELLS == 1
if (node->value->active)
#endif
{
for (int j = 0; j < 3; j++)
{
@ -229,6 +231,7 @@ namespace CosmoTool {
uint32_t swapId = Ncells-1;
uint32_t i = 0;
#if __KD_TREE_ACTIVE_CELLS == 1
while (!cells[swapId]->active && swapId > 0)
swapId--;
@ -244,6 +247,7 @@ namespace CosmoTool {
}
i++;
}
#endif
return swapId+1;
}
@ -251,7 +255,7 @@ namespace CosmoTool {
void KD_default_cell_splitter<N,ValType,CType>::operator()(KDCell<N,ValType,CType> **cells, uint32_t Ncells, uint32_t& split_index, int axis, typename KDDef<N,CType>::KDCoordinates minBound, typename KDDef<N,CType>::KDCoordinates maxBound)
{
CellCompare<N,ValType,CType> compare(axis);
std::sort(cells, cells+Ncells, compare);
omptl::sort(cells,cells+Ncells,compare); // std::sort(cells, cells+Ncells, compare);
split_index = Ncells/2;
}
@ -266,10 +270,13 @@ namespace CosmoTool {
if (Ncells == 0)
return 0;
Node *node;
int axis = depth % N;
Node *node = &nodes[lastNode++];
uint32_t mid;
coords tmpBound;
#pragma omp critical
node = &nodes[lastNode++];
// Isolate the environment
splitter(cell0, Ncells, mid, axis, minBound, maxBound);
@ -282,12 +289,20 @@ namespace CosmoTool {
tmpBound[axis] = node->value->coord[axis];
depth++;
node->children[0] = buildTree(cell0, mid, depth, minBound, tmpBound);
#pragma omp task private(tmpBound)
{
node->children[0] = buildTree(cell0, mid, depth, minBound, tmpBound);
}
memcpy(tmpBound, minBound, sizeof(coords));
tmpBound[axis] = node->value->coord[axis];
node->children[1] = buildTree(cell0+mid+1, Ncells-mid-1, depth,
#pragma omp task private(tmpBound)
{
node->children[1] = buildTree(cell0+mid+1, Ncells-mid-1, depth,
tmpBound, maxBound);
}
#pragma omp taskwait
#ifdef __KD_TREE_NUMNODES
node->numNodes = (node->children[0] != 0) ? node->children[0]->numNodes : 0;
@ -304,7 +319,9 @@ namespace CosmoTool {
uint32_t numActive = 0;
for (uint32_t i = 0; i < lastNode; i++)
{
#if __KD_TREE_ACTIVE_CELLS == 1
if (nodes[i].value->active)
#endif
numActive++;
}
return numActive;