Merge branch 'master' of bitbucket.org:glavaux/cosmotool
This commit is contained in:
commit
03033b64b6
@ -70,7 +70,7 @@ SET(CPACK_PACKAGE_DESCRIPTION_SUMMARY "A toolbox for impatient cosmologists")
|
|||||||
SET(CPACK_PACKAGE_VENDOR "Guilhem Lavaux")
|
SET(CPACK_PACKAGE_VENDOR "Guilhem Lavaux")
|
||||||
SET(CPACK_RESOURCE_FILE_LICENSE "${CMAKE_CURRENT_SOURCE_DIR}/LICENCE_CeCILL_V2")
|
SET(CPACK_RESOURCE_FILE_LICENSE "${CMAKE_CURRENT_SOURCE_DIR}/LICENCE_CeCILL_V2")
|
||||||
SET(CPACK_PACKAGE_VERSION_MAJOR "1")
|
SET(CPACK_PACKAGE_VERSION_MAJOR "1")
|
||||||
SET(CPACK_PACKAGE_VERSION_MINOR "1")
|
SET(CPACK_PACKAGE_VERSION_MINOR "2")
|
||||||
SET(CPACK_PACKAGE_VERSION_PATCH "2${EXTRA_VERSION}")
|
SET(CPACK_PACKAGE_VERSION_PATCH "2${EXTRA_VERSION}")
|
||||||
SET(CPACK_PACKAGE_INSTALL_DIRECTORY "CosmoToolbox-${CPACK_PACKAGE_VERSION_MAJOR}.${CPACK_PACKAGE_VERSION_MINOR}")
|
SET(CPACK_PACKAGE_INSTALL_DIRECTORY "CosmoToolbox-${CPACK_PACKAGE_VERSION_MAJOR}.${CPACK_PACKAGE_VERSION_MINOR}")
|
||||||
SET(CPACK_STRIP_FILES "lib/libCosmoTool.so")
|
SET(CPACK_STRIP_FILES "lib/libCosmoTool.so")
|
||||||
|
@ -8,7 +8,7 @@ export CC CXX
|
|||||||
|
|
||||||
# Install a system package required by our library
|
# Install a system package required by our library
|
||||||
#yum install -y atlas-devel
|
#yum install -y atlas-devel
|
||||||
yum install -y cmake3 gsl-devel zlib-devel
|
yum install -y cmake3 gsl-devel zlib-devel fftw3-devel
|
||||||
|
|
||||||
ln -fs /usr/bin/cmake3 /usr/bin/cmake
|
ln -fs /usr/bin/cmake3 /usr/bin/cmake
|
||||||
|
|
||||||
@ -19,17 +19,18 @@ ALL_PYTHON="cp36-cp36m cp37-cp37m cp38-cp38 cp39-cp39"
|
|||||||
for pkg in $ALL_PYTHON; do
|
for pkg in $ALL_PYTHON; do
|
||||||
PYBIN=/opt/python/${pkg}/bin
|
PYBIN=/opt/python/${pkg}/bin
|
||||||
# "${PYBIN}/pip" install -r /io/dev-requirements.txt
|
# "${PYBIN}/pip" install -r /io/dev-requirements.txt
|
||||||
|
"${PYBIN}/pip" install setuptools wheel Cython
|
||||||
"${PYBIN}/pip" install -r /io/requirements.txt
|
"${PYBIN}/pip" install -r /io/requirements.txt
|
||||||
"${PYBIN}/pip" wheel -vvv /io/ -w wheelhouse/
|
"${PYBIN}/pip" wheel -vvv /io/ -w wheelhouse/
|
||||||
done
|
done
|
||||||
|
|
||||||
# Bundle external shared libraries into the wheels
|
# Bundle external shared libraries into the wheels
|
||||||
for whl in wheelhouse/*.whl; do
|
for whl in wheelhouse/cosmotool*.whl; do
|
||||||
auditwheel repair "$whl" --plat $PLAT -w /io/wheelhouse/
|
auditwheel repair "$whl" --plat $PLAT -w /io/wheelhouse/
|
||||||
done
|
done
|
||||||
|
|
||||||
# Install packages and test
|
# Install packages and test
|
||||||
for pkg in $ALL_PYTHON; do
|
#for pkg in $ALL_PYTHON; do
|
||||||
PYBIN=/opt/python/${pkg}/bin
|
# PYBIN=/opt/python/${pkg}/bin
|
||||||
"${PYBIN}/pip" install cosmotool --no-index -f /io/wheelhouse
|
# "${PYBIN}/pip" install cosmotool --no-index -f /io/wheelhouse
|
||||||
done
|
#done
|
||||||
|
12
external/patch-omptl
vendored
12
external/patch-omptl
vendored
@ -92,3 +92,15 @@ diff -ur omptl.orig/omptl_numeric_par.h omptl/omptl_numeric_par.h
|
|||||||
|
|
||||||
namespace omptl
|
namespace omptl
|
||||||
{
|
{
|
||||||
|
diff -ur omptl.orig/omptl_algorithm_par.h omptl/omptl_algorithm_par.h
|
||||||
|
--- omptl.orig/omptl_algorithm_par.h 2021-05-09 14:26:47.227632829 +0300
|
||||||
|
+++ omptl/omptl_algorithm_par.h 2021-05-09 14:27:02.815744567 +0300
|
||||||
|
@@ -1700,7 +1700,7 @@
|
||||||
|
|
||||||
|
std::vector<char> pivot_used(pivots.size(), false); // can't be bool due to parallel write
|
||||||
|
|
||||||
|
- const unsigned max_depth = std::floor(std::tr1::log2(P));
|
||||||
|
+ const unsigned max_depth = unsigned(std::floor(std::tr1::log2(P)));
|
||||||
|
assert(1u << max_depth <= P);
|
||||||
|
for (unsigned i = 0; i < max_depth; ++i)
|
||||||
|
{
|
||||||
|
@ -54,6 +54,10 @@ SET(CMAKE_MODULE_LINKER_FLAGS "${CMAKE_MODULE_LINKER_FLAGS} -Bsymbolic-functions
|
|||||||
if(APPLE)
|
if(APPLE)
|
||||||
set(CMAKE_MODULE_LINKER_FLAGS "-undefined dynamic_lookup")
|
set(CMAKE_MODULE_LINKER_FLAGS "-undefined dynamic_lookup")
|
||||||
endif()
|
endif()
|
||||||
|
IF(NOT APPLE)
|
||||||
|
set(CMAKE_MODULE_LINKER_FLAGS "-Wl,--version-script=${CMAKE_CURRENT_SOURCE_DIR}/cosmotool.version")
|
||||||
|
ENDIF()
|
||||||
|
|
||||||
|
|
||||||
target_link_libraries(_cosmotool PRIVATE ${CosmoTool_local} ${GSL_LIBRARIES})
|
target_link_libraries(_cosmotool PRIVATE ${CosmoTool_local} ${GSL_LIBRARIES})
|
||||||
target_link_libraries(_cosmo_power PRIVATE ${CosmoTool_local} ${GSL_LIBRARIES})
|
target_link_libraries(_cosmo_power PRIVATE ${CosmoTool_local} ${GSL_LIBRARIES})
|
||||||
|
@ -410,7 +410,7 @@ def loadGadget(str filename, int snapshot_id, int gadgetFormat = 1, bool loadPos
|
|||||||
with nogil:
|
with nogil:
|
||||||
data = loadGadgetMulti(filename_bs, snapshot_id, flags, gadgetFormat)
|
data = loadGadgetMulti(filename_bs, snapshot_id, flags, gadgetFormat)
|
||||||
if data == <SimuData*>0:
|
if data == <SimuData*>0:
|
||||||
return None
|
raise RuntimeError("File could not be read")
|
||||||
|
|
||||||
return PySimulationAdaptor(wrap_simudata(data, flags))
|
return PySimulationAdaptor(wrap_simudata(data, flags))
|
||||||
|
|
||||||
|
7
python/cosmotool.version
Normal file
7
python/cosmotool.version
Normal file
@ -0,0 +1,7 @@
|
|||||||
|
CODEABI_1.0 {
|
||||||
|
global:
|
||||||
|
PyInit_*;
|
||||||
|
_init;
|
||||||
|
_fini;
|
||||||
|
local: *;
|
||||||
|
};
|
11
setup.py
11
setup.py
@ -167,15 +167,20 @@ class BuildCMakeExt(build_ext):
|
|||||||
# Change your cmake arguments below as necessary
|
# Change your cmake arguments below as necessary
|
||||||
# Below is just an example set of arguments for building Blender as a Python module
|
# Below is just an example set of arguments for building Blender as a Python module
|
||||||
|
|
||||||
|
compilers=[]
|
||||||
|
if "CC" in os.environ:
|
||||||
|
compilers.append('-DCMAKE_C_COMPILER=' + os.environ["CC"])
|
||||||
|
if "CXX" in os.environ:
|
||||||
|
compilers.append("-DCMAKE_CXX_COMPILER=" + os.environ["CXX"])
|
||||||
|
|
||||||
self.spawn(['cmake', '-H'+SOURCE_DIR, '-B'+self.build_temp,
|
self.spawn(['cmake', '-H'+SOURCE_DIR, '-B'+self.build_temp,
|
||||||
'-DCMAKE_C_COMPILER=' + os.environ["CC"], "-DCMAKE_CXX_COMPILER=" + os.environ["CXX"],
|
|
||||||
'-DENABLE_OPENMP=ON','-DINTERNAL_BOOST=ON','-DINTERNAL_EIGEN=ON',
|
'-DENABLE_OPENMP=ON','-DINTERNAL_BOOST=ON','-DINTERNAL_EIGEN=ON',
|
||||||
'-DINTERNAL_HDF5=ON','-DINTERNAL_NETCDF=ON',
|
'-DINTERNAL_HDF5=ON','-DINTERNAL_NETCDF=ON',
|
||||||
'-DBUILD_PYTHON=ON', '-DINSTALL_PYTHON_LOCAL=OFF',
|
'-DBUILD_PYTHON=ON', '-DINSTALL_PYTHON_LOCAL=OFF',
|
||||||
'-DCOSMOTOOL_PYTHON_PACKAGING=ON',
|
'-DCOSMOTOOL_PYTHON_PACKAGING=ON',
|
||||||
f"-DCYTHON={cython_code}",
|
f"-DCYTHON={cython_code}",
|
||||||
f"-DPYTHON_SITE_PACKAGES={build_dir.absolute()}/private_install",
|
f"-DPYTHON_SITE_PACKAGES={build_dir.absolute()}/private_install",
|
||||||
f"-DPYTHON_EXECUTABLE={sys.executable}"])
|
f"-DPYTHON_EXECUTABLE={sys.executable}"] + compilers)
|
||||||
|
|
||||||
|
|
||||||
self.announce("Building binaries", level=3)
|
self.announce("Building binaries", level=3)
|
||||||
@ -218,7 +223,7 @@ class BuildCMakeExt(build_ext):
|
|||||||
CosmoTool_extension = CMakeExtension(name="cosmotool")
|
CosmoTool_extension = CMakeExtension(name="cosmotool")
|
||||||
|
|
||||||
setup(name='cosmotool',
|
setup(name='cosmotool',
|
||||||
version='1.1.2',
|
version='1.2.2',
|
||||||
packages=["cosmotool"],
|
packages=["cosmotool"],
|
||||||
package_dir={'cosmotool': 'python/cosmotool'},
|
package_dir={'cosmotool': 'python/cosmotool'},
|
||||||
install_requires=['numpy','cffi','numexpr','pyfftw','h5py'],
|
install_requires=['numpy','cffi','numexpr','pyfftw','h5py'],
|
||||||
|
@ -342,12 +342,14 @@ void CosmoPower::normalize(double k_min, double k_max)
|
|||||||
|
|
||||||
normPower = 1;
|
normPower = 1;
|
||||||
|
|
||||||
|
#if 0
|
||||||
ofstream ff("PP_k.txt");
|
ofstream ff("PP_k.txt");
|
||||||
for (int i = 0; i < 100; i++)
|
for (int i = 0; i < 100; i++)
|
||||||
{
|
{
|
||||||
double k = pow(10.0, 8.0*i/100.-4);
|
double k = pow(10.0, 8.0*i/100.-4);
|
||||||
ff << k << " " << power(k) << endl;
|
ff << k << " " << power(k) << endl;
|
||||||
}
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
// gsl_integration_qagiu(&f, 0, 0, TOLERANCE, NUM_ITERATION, w, &normVal, &abserr);
|
// gsl_integration_qagiu(&f, 0, 0, TOLERANCE, NUM_ITERATION, w, &normVal, &abserr);
|
||||||
gsl_integration_qag(&f, x_min, x_max, 0, TOLERANCE, NUM_ITERATION, GSL_INTEG_GAUSS61, w, &normVal, &abserr);
|
gsl_integration_qag(&f, x_min, x_max, 0, TOLERANCE, NUM_ITERATION, GSL_INTEG_GAUSS61, w, &normVal, &abserr);
|
||||||
|
@ -146,9 +146,9 @@ void UnformattedRead::endCheckpoint(bool autodrop)
|
|||||||
recordBuffer = 0;
|
recordBuffer = 0;
|
||||||
}
|
}
|
||||||
if (cSize == Check_32bits) {
|
if (cSize == Check_32bits) {
|
||||||
if (checkPointAccum >= 1<<32UL) {
|
if (checkPointAccum >= 1UL<<32UL) {
|
||||||
always_fail = true;
|
always_fail = true;
|
||||||
checkPointAccum %= (1<<32UL);
|
checkPointAccum %= (1UL<<32UL);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -39,91 +39,112 @@ knowledge of the CeCILL license and that you accept its terms.
|
|||||||
#include <fftw3.h>
|
#include <fftw3.h>
|
||||||
#include <complex>
|
#include <complex>
|
||||||
|
|
||||||
namespace CosmoTool
|
namespace CosmoTool {
|
||||||
{
|
|
||||||
|
|
||||||
static inline void init_fftw_wisdom()
|
static inline void init_fftw_wisdom() {
|
||||||
{
|
fftw_import_system_wisdom();
|
||||||
fftw_import_system_wisdom();
|
fftw_import_wisdom_from_filename("fft_wisdom");
|
||||||
fftw_import_wisdom_from_filename("fft_wisdom");
|
}
|
||||||
}
|
|
||||||
|
|
||||||
static inline void save_fftw_wisdom()
|
static inline void save_fftw_wisdom() {
|
||||||
{
|
fftw_export_wisdom_to_filename("fft_wisdom");
|
||||||
fftw_export_wisdom_to_filename("fft_wisdom");
|
}
|
||||||
}
|
|
||||||
|
|
||||||
template<typename T> class FFTW_Calls {};
|
template <typename T>
|
||||||
|
class FFTW_Calls {};
|
||||||
|
|
||||||
|
#define FFTW_CALLS_BASE(rtype, prefix) \
|
||||||
|
template <> \
|
||||||
|
class FFTW_Calls<rtype> { \
|
||||||
|
public: \
|
||||||
|
typedef rtype real_type; \
|
||||||
|
typedef prefix##_complex complex_type; \
|
||||||
|
typedef prefix##_plan plan_type; \
|
||||||
|
\
|
||||||
|
static complex_type *alloc_complex(size_t N) { \
|
||||||
|
return prefix##_alloc_complex(N); \
|
||||||
|
} \
|
||||||
|
static real_type *alloc_real(size_t N) { return prefix##_alloc_real(N); } \
|
||||||
|
static void free(void *p) { fftw_free(p); } \
|
||||||
|
\
|
||||||
|
static void execute(plan_type p) { prefix##_execute(p); } \
|
||||||
|
static void execute_r2c(plan_type p, real_type *in, complex_type *out) { \
|
||||||
|
prefix##_execute_dft_r2c(p, in, out); \
|
||||||
|
} \
|
||||||
|
static void execute_c2r(plan_type p, complex_type *in, real_type *out) { \
|
||||||
|
prefix##_execute_dft_c2r(p, in, out); \
|
||||||
|
} \
|
||||||
|
static void \
|
||||||
|
execute_r2c(plan_type p, real_type *in, std::complex<real_type> *out) { \
|
||||||
|
prefix##_execute_dft_r2c(p, in, (complex_type *)out); \
|
||||||
|
} \
|
||||||
|
static void \
|
||||||
|
execute_c2r(plan_type p, std::complex<real_type> *in, real_type *out) { \
|
||||||
|
prefix##_execute_dft_c2r(p, (complex_type *)in, out); \
|
||||||
|
} \
|
||||||
|
static void execute_c2c( \
|
||||||
|
plan_type p, std::complex<real_type> *in, \
|
||||||
|
std::complex<real_type> *out) { \
|
||||||
|
prefix##_execute_dft(p, (complex_type *)in, (complex_type *)out); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_r2c_1d( \
|
||||||
|
int Nx, real_type *in, complex_type *out, unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_r2c_1d(Nx, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r_1d( \
|
||||||
|
int Nx, complex_type *in, real_type *out, unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_c2r_1d(Nx, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_r2c_2d( \
|
||||||
|
int Nx, int Ny, real_type *in, complex_type *out, unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_r2c_2d(Nx, Ny, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r_2d( \
|
||||||
|
int Nx, int Ny, complex_type *in, real_type *out, unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_c2r_2d(Nx, Ny, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_r2c_3d( \
|
||||||
|
int Nx, int Ny, int Nz, real_type *in, complex_type *out, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_r2c_3d(Nx, Ny, Nz, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r_3d( \
|
||||||
|
int Nx, int Ny, int Nz, complex_type *in, real_type *out, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_c2r_3d(Nx, Ny, Nz, in, out, flags); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static plan_type plan_dft_r2c( \
|
||||||
|
int rank, const int *n, real_type *in, complex_type *out, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_r2c(rank, n, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r( \
|
||||||
|
int rank, const int *n, complex_type *in, real_type *out, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_c2r(rank, n, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_3d( \
|
||||||
|
int Nx, int Ny, int Nz, complex_type *in, complex_type *out, int sign, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_3d(Nx, Ny, Nz, in, out, sign, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_2d( \
|
||||||
|
int Nx, int Ny, complex_type *in, complex_type *out, int sign, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_2d(Nx, Ny, in, out, sign, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_1d( \
|
||||||
|
int Nx, complex_type *in, complex_type *out, int sign, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_1d(Nx, in, out, sign, flags); \
|
||||||
|
} \
|
||||||
|
static void destroy_plan(plan_type plan) { prefix##_destroy_plan(plan); } \
|
||||||
|
}
|
||||||
|
|
||||||
#define FFTW_CALLS_BASE(rtype, prefix) \
|
FFTW_CALLS_BASE(double, fftw);
|
||||||
template<> \
|
FFTW_CALLS_BASE(float, fftwf);
|
||||||
class FFTW_Calls<rtype> { \
|
|
||||||
public: \
|
|
||||||
typedef rtype real_type; \
|
|
||||||
typedef prefix ## _complex complex_type; \
|
|
||||||
typedef prefix ## _plan plan_type; \
|
|
||||||
\
|
|
||||||
static complex_type *alloc_complex(size_t N) { return prefix ## _alloc_complex(N); } \
|
|
||||||
static real_type *alloc_real(size_t N) { return prefix ## _alloc_real(N); } \
|
|
||||||
static void free(void *p) { fftw_free(p); } \
|
|
||||||
\
|
|
||||||
static void execute(plan_type p) { prefix ## _execute(p); } \
|
|
||||||
static void execute_r2c(plan_type p, real_type *in, complex_type *out) { prefix ## _execute_dft_r2c(p, in, out); } \
|
|
||||||
static void execute_c2r(plan_type p, complex_type *in, real_type *out) { prefix ## _execute_dft_c2r(p, in, out); } \
|
|
||||||
static void execute_r2c(plan_type p, real_type *in, std::complex<real_type> *out) { prefix ## _execute_dft_r2c(p, in, (complex_type*)out); } \
|
|
||||||
static void execute_c2r(plan_type p, std::complex<real_type> *in, real_type *out) { prefix ## _execute_dft_c2r(p, (complex_type*) in, out); } \
|
|
||||||
static void execute_c2c(plan_type p, std::complex<real_type> *in, std::complex<real_type> *out) { prefix ## _execute_dft(p, (complex_type *)in, (complex_type*)out); } \
|
|
||||||
static plan_type plan_dft_r2c_2d(int Nx, int Ny, \
|
|
||||||
real_type *in, complex_type *out, \
|
|
||||||
unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _plan_dft_r2c_2d(Nx, Ny, in, out, \
|
|
||||||
flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_c2r_2d(int Nx, int Ny, \
|
|
||||||
complex_type *in, real_type *out, \
|
|
||||||
unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _plan_dft_c2r_2d(Nx, Ny, in, out, \
|
|
||||||
flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_r2c_3d(int Nx, int Ny, int Nz, \
|
|
||||||
real_type *in, complex_type *out, \
|
|
||||||
unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _plan_dft_r2c_3d(Nx, Ny, Nz, in, out, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_c2r_3d(int Nx, int Ny, int Nz, \
|
|
||||||
complex_type *in, real_type *out, \
|
|
||||||
unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _plan_dft_c2r_3d(Nx, Ny, Nz, in, out, flags); \
|
|
||||||
} \
|
|
||||||
\
|
|
||||||
static plan_type plan_dft_r2c(int rank, const int *n, real_type *in, \
|
|
||||||
complex_type *out, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _plan_dft_r2c(rank, n, in, out, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_c2r(int rank, const int *n, complex_type *in, \
|
|
||||||
real_type *out, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _plan_dft_c2r(rank, n, in, out, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_3d(int Nx, int Ny, int Nz, complex_type *in, complex_type *out, int sign, unsigned flags) { \
|
|
||||||
return prefix ## _plan_dft_3d(Nx, Ny, Nz, in, out, sign, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_2d(int Nx, int Ny, complex_type *in, complex_type *out, int sign, unsigned flags) { \
|
|
||||||
return prefix ## _plan_dft_2d(Nx, Ny, in, out, sign, flags); \
|
|
||||||
} \
|
|
||||||
static void destroy_plan(plan_type plan) { prefix ## _destroy_plan(plan); } \
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
FFTW_CALLS_BASE(double, fftw);
|
|
||||||
FFTW_CALLS_BASE(float, fftwf);
|
|
||||||
#undef FFTW_CALLS_BASE
|
#undef FFTW_CALLS_BASE
|
||||||
};
|
}; // namespace CosmoTool
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
@ -5,110 +5,140 @@
|
|||||||
#include <mpi.h>
|
#include <mpi.h>
|
||||||
#include <fftw3-mpi.h>
|
#include <fftw3-mpi.h>
|
||||||
|
|
||||||
namespace CosmoTool
|
namespace CosmoTool {
|
||||||
{
|
|
||||||
|
|
||||||
static inline void init_fftw_mpi()
|
static inline void init_fftw_mpi() { fftw_mpi_init(); }
|
||||||
{
|
|
||||||
fftw_mpi_init();
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline void done_fftw_mpi()
|
static inline void done_fftw_mpi() { fftw_mpi_cleanup(); }
|
||||||
{
|
|
||||||
fftw_mpi_cleanup();
|
|
||||||
}
|
|
||||||
|
|
||||||
template<typename T> class FFTW_MPI_Calls {};
|
template <typename T>
|
||||||
|
class FFTW_MPI_Calls {};
|
||||||
|
|
||||||
|
#define FFTW_MPI_CALLS_BASE(rtype, prefix) \
|
||||||
|
template <> \
|
||||||
|
class FFTW_MPI_Calls<rtype> { \
|
||||||
|
public: \
|
||||||
|
typedef rtype real_type; \
|
||||||
|
typedef prefix##_complex complex_type; \
|
||||||
|
typedef prefix##_plan plan_type; \
|
||||||
|
\
|
||||||
|
static complex_type *alloc_complex(size_t N) { \
|
||||||
|
return prefix##_alloc_complex(N); \
|
||||||
|
} \
|
||||||
|
static real_type *alloc_real(size_t N) { return prefix##_alloc_real(N); } \
|
||||||
|
static void free(void *p) { fftw_free(p); } \
|
||||||
|
\
|
||||||
|
template <size_t Nd> \
|
||||||
|
static ptrdiff_t local_size( \
|
||||||
|
std::array<ptrdiff_t, Nd> const &N, MPI_Comm comm, \
|
||||||
|
ptrdiff_t *local_n0, ptrdiff_t *local_0_start) { \
|
||||||
|
return prefix##_mpi_local_size( \
|
||||||
|
Nd, N.data(), comm, local_n0, local_0_start); \
|
||||||
|
} \
|
||||||
|
static ptrdiff_t local_size_2d( \
|
||||||
|
ptrdiff_t N0, ptrdiff_t N1, MPI_Comm comm, ptrdiff_t *local_n0, \
|
||||||
|
ptrdiff_t *local_0_start) { \
|
||||||
|
return prefix##_mpi_local_size_2d( \
|
||||||
|
N0, N1, comm, local_n0, local_0_start); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static ptrdiff_t local_size_3d( \
|
||||||
|
ptrdiff_t N0, ptrdiff_t N1, ptrdiff_t N2, MPI_Comm comm, \
|
||||||
|
ptrdiff_t *local_n0, ptrdiff_t *local_0_start) { \
|
||||||
|
return prefix##_mpi_local_size_3d( \
|
||||||
|
N0, N1, N2, comm, local_n0, local_0_start); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static void execute(plan_type p) { prefix##_execute(p); } \
|
||||||
|
static void \
|
||||||
|
execute_c2c(plan_type p, complex_type *in, complex_type *out) { \
|
||||||
|
prefix##_mpi_execute_dft(p, in, out); \
|
||||||
|
} \
|
||||||
|
static void execute_c2c( \
|
||||||
|
plan_type p, std::complex<real_type> *in, \
|
||||||
|
std::complex<real_type> *out) { \
|
||||||
|
prefix##_mpi_execute_dft(p, (complex_type *)in, (complex_type *)out); \
|
||||||
|
} \
|
||||||
|
static void execute_r2c(plan_type p, real_type *in, complex_type *out) { \
|
||||||
|
prefix##_mpi_execute_dft_r2c(p, in, out); \
|
||||||
|
} \
|
||||||
|
static void \
|
||||||
|
execute_c2r(plan_type p, std::complex<real_type> *in, real_type *out) { \
|
||||||
|
prefix##_mpi_execute_dft_c2r(p, (complex_type *)in, out); \
|
||||||
|
} \
|
||||||
|
static void execute_c2r(plan_type p, complex_type *in, real_type *out) { \
|
||||||
|
prefix##_mpi_execute_dft_c2r(p, in, out); \
|
||||||
|
} \
|
||||||
|
static void \
|
||||||
|
execute_r2c(plan_type p, real_type *in, std::complex<real_type> *out) { \
|
||||||
|
prefix##_mpi_execute_dft_r2c(p, in, (complex_type *)out); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static plan_type plan_dft_r2c_1d( \
|
||||||
|
int n, real_type *in, complex_type *out, MPI_Comm, unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_r2c_1d(n, in, out, flags); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static plan_type plan_dft_r2c_2d( \
|
||||||
|
int Nx, int Ny, real_type *in, complex_type *out, MPI_Comm comm, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_r2c_2d(Nx, Ny, in, out, comm, flags); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static plan_type plan_dft_c2r_1d( \
|
||||||
|
int n, complex_type *in, real_type *out, MPI_Comm, unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_c2r_1d(n, in, out, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r_2d( \
|
||||||
|
int Nx, int Ny, complex_type *in, real_type *out, MPI_Comm comm, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_c2r_2d(Nx, Ny, in, out, comm, flags); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static plan_type plan_dft_r2c_3d( \
|
||||||
|
int Nx, int Ny, int Nz, real_type *in, complex_type *out, \
|
||||||
|
MPI_Comm comm, unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_r2c_3d(Nx, Ny, Nz, in, out, comm, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r_3d( \
|
||||||
|
int Nx, int Ny, int Nz, complex_type *in, real_type *out, \
|
||||||
|
MPI_Comm comm, unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_c2r_3d(Nx, Ny, Nz, in, out, comm, flags); \
|
||||||
|
} \
|
||||||
|
\
|
||||||
|
static plan_type plan_dft_r2c( \
|
||||||
|
int rank, const ptrdiff_t *n, real_type *in, complex_type *out, \
|
||||||
|
MPI_Comm comm, unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_r2c(rank, n, in, out, comm, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_c2r( \
|
||||||
|
int rank, const ptrdiff_t *n, complex_type *in, real_type *out, \
|
||||||
|
MPI_Comm comm, unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_c2r(rank, n, in, out, comm, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_3d( \
|
||||||
|
int Nx, int Ny, int Nz, complex_type *in, complex_type *out, \
|
||||||
|
MPI_Comm comm, int sign, unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_3d(Nx, Ny, Nz, in, out, comm, sign, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_2d( \
|
||||||
|
int Nx, int Ny, complex_type *in, complex_type *out, MPI_Comm comm, \
|
||||||
|
int sign, unsigned flags) { \
|
||||||
|
return prefix##_mpi_plan_dft_2d(Nx, Ny, in, out, comm, sign, flags); \
|
||||||
|
} \
|
||||||
|
static plan_type plan_dft_1d( \
|
||||||
|
int Nx, complex_type *in, complex_type *out, MPI_Comm comm, int sign, \
|
||||||
|
unsigned flags) { \
|
||||||
|
return prefix##_plan_dft_1d(Nx, in, out, sign, flags); \
|
||||||
|
} \
|
||||||
|
static void destroy_plan(plan_type plan) { prefix##_destroy_plan(plan); } \
|
||||||
|
}
|
||||||
|
|
||||||
#define FFTW_MPI_CALLS_BASE(rtype, prefix) \
|
FFTW_MPI_CALLS_BASE(double, fftw);
|
||||||
template<> \
|
FFTW_MPI_CALLS_BASE(float, fftwf);
|
||||||
class FFTW_MPI_Calls<rtype> { \
|
|
||||||
public: \
|
|
||||||
typedef rtype real_type; \
|
|
||||||
typedef prefix ## _complex complex_type; \
|
|
||||||
typedef prefix ## _plan plan_type; \
|
|
||||||
\
|
|
||||||
static complex_type *alloc_complex(size_t N) { return prefix ## _alloc_complex(N); } \
|
|
||||||
static real_type *alloc_real(size_t N) { return prefix ## _alloc_real(N); } \
|
|
||||||
static void free(void *p) { fftw_free(p); } \
|
|
||||||
\
|
|
||||||
template<size_t Nd> \
|
|
||||||
static ptrdiff_t local_size(std::array<ptrdiff_t,Nd> const& N, MPI_Comm comm, \
|
|
||||||
ptrdiff_t *local_n0, ptrdiff_t *local_0_start) { \
|
|
||||||
return prefix ## _mpi_local_size(Nd, N.data(), comm, local_n0, local_0_start); \
|
|
||||||
} \
|
|
||||||
static ptrdiff_t local_size_2d(ptrdiff_t N0, ptrdiff_t N1, MPI_Comm comm, \
|
|
||||||
ptrdiff_t *local_n0, ptrdiff_t *local_0_start) { \
|
|
||||||
return prefix ## _mpi_local_size_2d(N0, N1, comm, local_n0, local_0_start); \
|
|
||||||
} \
|
|
||||||
\
|
|
||||||
static ptrdiff_t local_size_3d(ptrdiff_t N0, ptrdiff_t N1, ptrdiff_t N2, MPI_Comm comm, \
|
|
||||||
ptrdiff_t *local_n0, ptrdiff_t *local_0_start) { \
|
|
||||||
return prefix ## _mpi_local_size_3d(N0, N1, N2, comm, local_n0, local_0_start); \
|
|
||||||
} \
|
|
||||||
\
|
|
||||||
static void execute(plan_type p) { prefix ## _execute(p); } \
|
|
||||||
static void execute_c2c(plan_type p, complex_type *in, complex_type *out) { prefix ## _mpi_execute_dft(p, in, out); } \
|
|
||||||
static void execute_c2c(plan_type p, std::complex<real_type> *in, std::complex<real_type> *out) { prefix ## _mpi_execute_dft(p, (complex_type*)in, (complex_type*)out); } \
|
|
||||||
static void execute_r2c(plan_type p, real_type *in, complex_type *out) { prefix ## _mpi_execute_dft_r2c(p, in, out); } \
|
|
||||||
static void execute_c2r(plan_type p, std::complex<real_type> *in, real_type *out) { prefix ## _mpi_execute_dft_c2r(p, (complex_type*)in, out); } \
|
|
||||||
static void execute_c2r(plan_type p, complex_type *in, real_type *out) { prefix ## _mpi_execute_dft_c2r(p, in, out); } \
|
|
||||||
static void execute_r2c(plan_type p, real_type *in, std::complex<real_type> *out) { prefix ## _mpi_execute_dft_r2c(p, in, (complex_type*)out); } \
|
|
||||||
\
|
|
||||||
static plan_type plan_dft_r2c_2d(int Nx, int Ny, \
|
|
||||||
real_type *in, complex_type *out, \
|
|
||||||
MPI_Comm comm, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _mpi_plan_dft_r2c_2d(Nx, Ny, in, out, \
|
|
||||||
comm, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_c2r_2d(int Nx, int Ny, \
|
|
||||||
complex_type *in, real_type *out, \
|
|
||||||
MPI_Comm comm, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _mpi_plan_dft_c2r_2d(Nx, Ny, in, out, \
|
|
||||||
comm, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_r2c_3d(int Nx, int Ny, int Nz, \
|
|
||||||
real_type *in, complex_type *out, \
|
|
||||||
MPI_Comm comm, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _mpi_plan_dft_r2c_3d(Nx, Ny, Nz, in, out, comm, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_c2r_3d(int Nx, int Ny, int Nz, \
|
|
||||||
complex_type *in, real_type *out, \
|
|
||||||
MPI_Comm comm, \
|
|
||||||
unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _mpi_plan_dft_c2r_3d(Nx, Ny, Nz, in, out, comm, flags); \
|
|
||||||
} \
|
|
||||||
\
|
|
||||||
static plan_type plan_dft_r2c(int rank, const ptrdiff_t *n, real_type *in, \
|
|
||||||
complex_type *out, MPI_Comm comm, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _mpi_plan_dft_r2c(rank, n, in, out, comm, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_c2r(int rank, const ptrdiff_t *n, complex_type *in, \
|
|
||||||
real_type *out, MPI_Comm comm, unsigned flags) \
|
|
||||||
{ \
|
|
||||||
return prefix ## _mpi_plan_dft_c2r(rank, n, in, out, comm, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_3d(int Nx, int Ny, int Nz, complex_type *in, complex_type *out, MPI_Comm comm, int sign, unsigned flags) { \
|
|
||||||
return prefix ## _mpi_plan_dft_3d(Nx, Ny, Nz, in, out, comm, sign, flags); \
|
|
||||||
} \
|
|
||||||
static plan_type plan_dft_2d(int Nx, int Ny, complex_type *in, complex_type *out, MPI_Comm comm, int sign, unsigned flags) { \
|
|
||||||
return prefix ## _mpi_plan_dft_2d(Nx, Ny, in, out, comm, sign, flags); \
|
|
||||||
} \
|
|
||||||
static void destroy_plan(plan_type plan) { prefix ## _destroy_plan(plan); } \
|
|
||||||
}
|
|
||||||
|
|
||||||
|
|
||||||
FFTW_MPI_CALLS_BASE(double, fftw);
|
|
||||||
FFTW_MPI_CALLS_BASE(float, fftwf);
|
|
||||||
|
|
||||||
#undef FFTW_MPI_CALLS_BASE
|
#undef FFTW_MPI_CALLS_BASE
|
||||||
|
|
||||||
};
|
}; // namespace CosmoTool
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
@ -144,8 +144,8 @@ namespace CosmoTool {
|
|||||||
bool useBases = false)
|
bool useBases = false)
|
||||||
{
|
{
|
||||||
std::vector<hsize_t> memdims(data.shape(), data.shape() + data.num_dimensions());
|
std::vector<hsize_t> memdims(data.shape(), data.shape() + data.num_dimensions());
|
||||||
H5::DataSpace dataspace(dimensions.size(), dimensions.data());
|
H5::DataSpace dataspace(int(dimensions.size()), dimensions.data());
|
||||||
H5::DataSpace memspace(memdims.size(), memdims.data());
|
H5::DataSpace memspace(int(memdims.size()), memdims.data());
|
||||||
|
|
||||||
if (useBases) {
|
if (useBases) {
|
||||||
std::vector<hsize_t> offsets(data.index_bases(), data.index_bases() + data.num_dimensions());
|
std::vector<hsize_t> offsets(data.index_bases(), data.index_bases() + data.num_dimensions());
|
||||||
@ -398,7 +398,7 @@ namespace CosmoTool {
|
|||||||
hdf5_weak_check_array(data, dimensions);
|
hdf5_weak_check_array(data, dimensions);
|
||||||
|
|
||||||
std::vector<hsize_t> memdims(data.shape(), data.shape() + data.num_dimensions());
|
std::vector<hsize_t> memdims(data.shape(), data.shape() + data.num_dimensions());
|
||||||
H5::DataSpace memspace(memdims.size(), memdims.data());
|
H5::DataSpace memspace(int(memdims.size()), memdims.data());
|
||||||
|
|
||||||
std::vector<hsize_t> offsets(data.index_bases(), data.index_bases() + data.num_dimensions());
|
std::vector<hsize_t> offsets(data.index_bases(), data.index_bases() + data.num_dimensions());
|
||||||
dataspace.selectHyperslab(H5S_SELECT_SET, memdims.data(), offsets.data());
|
dataspace.selectHyperslab(H5S_SELECT_SET, memdims.data(), offsets.data());
|
||||||
|
@ -221,7 +221,7 @@ SimuData *CosmoTool::loadGadgetMulti(const char *fname, int id,
|
|||||||
cerr << "Invalid format while reading header" << endl;
|
cerr << "Invalid format while reading header" << endl;
|
||||||
delete data;
|
delete data;
|
||||||
delete f;
|
delete f;
|
||||||
return 0;
|
throw;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@ -275,7 +275,7 @@ SimuData *CosmoTool::loadGadgetMulti(const char *fname, int id,
|
|||||||
cerr << "Invalid format while reading positions" << endl;
|
cerr << "Invalid format while reading positions" << endl;
|
||||||
delete f;
|
delete f;
|
||||||
delete data;
|
delete data;
|
||||||
return 0;
|
throw;
|
||||||
}
|
}
|
||||||
|
|
||||||
} else {
|
} else {
|
||||||
@ -292,7 +292,7 @@ SimuData *CosmoTool::loadGadgetMulti(const char *fname, int id,
|
|||||||
{
|
{
|
||||||
delete f;
|
delete f;
|
||||||
delete data;
|
delete data;
|
||||||
return 0;
|
throw;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -317,7 +317,7 @@ SimuData *CosmoTool::loadGadgetMulti(const char *fname, int id,
|
|||||||
cerr << "Invalid format while reading velocities" << endl;
|
cerr << "Invalid format while reading velocities" << endl;
|
||||||
delete f;
|
delete f;
|
||||||
delete data;
|
delete data;
|
||||||
return 0;
|
throw;
|
||||||
}
|
}
|
||||||
|
|
||||||
// THE VELOCITIES ARE IN PHYSICAL COORDINATES
|
// THE VELOCITIES ARE IN PHYSICAL COORDINATES
|
||||||
@ -367,7 +367,7 @@ SimuData *CosmoTool::loadGadgetMulti(const char *fname, int id,
|
|||||||
cerr << "Invalid unformatted access while reading ID" << endl;
|
cerr << "Invalid unformatted access while reading ID" << endl;
|
||||||
delete f;
|
delete f;
|
||||||
delete data;
|
delete data;
|
||||||
return 0;
|
throw;
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
f->skip(2*4);
|
f->skip(2*4);
|
||||||
|
Loading…
Reference in New Issue
Block a user