Skip to content
Snippets Groups Projects
Commit eb16cf21 authored by Pietro Incardona
Browse files

Fixing performance

parent 9f032ba7
No related branches found
No related tags found
No related merge requests found
Pipeline #4009 passed
...@@ -64,10 +64,15 @@ Params params; ...@@ -64,10 +64,15 @@ Params params;
typedef struct typedef struct
{ {
openfpm::vector_gpu<aggregate<float[3],int>> d_protein; // _lin = AOS
openfpm::vector_gpu<aggregate<float[3],int>> d_ligand; openfpm::vector_gpu_lin<aggregate<float[3],int>> d_protein;
openfpm::vector_gpu<aggregate<int,float,float,float>> d_forcefield; // AOS
openfpm::vector_gpu_lin<aggregate<float[3],int>> d_ligand;
// AOS
openfpm::vector_gpu_lin<aggregate<int,float,float,float>> d_forcefield;
// SOA
openfpm::vector_gpu<aggregate<float>> d_results; openfpm::vector_gpu<aggregate<float>> d_results;
// SOA
openfpm::vector_gpu<aggregate<float,float,float,float,float,float>> d_poses; openfpm::vector_gpu<aggregate<float,float,float,float,float,float>> d_poses;
openfpm::vector<double> gflops_data; openfpm::vector<double> gflops_data;
...@@ -601,14 +606,18 @@ void loadParameters(int argc, char *argv[], OpenFPM & _openfpm) ...@@ -601,14 +606,18 @@ void loadParameters(int argc, char *argv[], OpenFPM & _openfpm)
fclose(file); fclose(file);
} }
#ifndef __APPLE__
#include <fenv.h> #include <fenv.h>
#include <xmmintrin.h> #include <xmmintrin.h>
#include <pmmintrin.h> #include <pmmintrin.h>
#endif
int main(int argc, char *argv[]) int main(int argc, char *argv[])
{ {
#ifndef __APPLE__
_MM_SET_FLUSH_ZERO_MODE(_MM_FLUSH_ZERO_ON); _MM_SET_FLUSH_ZERO_MODE(_MM_FLUSH_ZERO_ON);
_MM_SET_DENORMALS_ZERO_MODE(_MM_DENORMALS_ZERO_ON); _MM_SET_DENORMALS_ZERO_MODE(_MM_DENORMALS_ZERO_ON);
#endif
init_wrappers(); init_wrappers();
OpenFPM _openfpm; OpenFPM _openfpm;
......
...@@ -5,8 +5,9 @@ CUDA_CC= ...@@ -5,8 +5,9 @@ CUDA_CC=
CUDA_CC_LINK= CUDA_CC_LINK=
ifdef CUDA_ON_CPU ifdef CUDA_ON_CPU
CUDA_CC=mpic++ -x c++ $(INCLUDE_PATH) CUDA_CC=mpic++ -x c++ $(INCLUDE_PATH)
INCLUDE_PATH_NVCC= INCLUDE_PATH_NVCC=
CUDA_CC_LINK=mpic++ CUDA_CC_LINK=mpic++
LIBS_SELECT=$(LIBS)
else else
ifeq (, $(shell which nvcc)) ifeq (, $(shell which nvcc))
CUDA_CC=mpic++ -x c++ $(INCLUDE_PATH) CUDA_CC=mpic++ -x c++ $(INCLUDE_PATH)
......
openfpm_data @ df7c8617
Subproject commit f84f0a370f906dcf2f35ef2747d7adbbe2a397d4 Subproject commit df7c8617df88632b0de820a9f9d258f3d6b86c44
openfpm_devices @ 33dfcd4c
Subproject commit 4e23dd287dd78e69b0072d0b1c3fe832e0c45966 Subproject commit 33dfcd4c1486af8ff33dcb856facd941e044e254
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment