-
Notifications
You must be signed in to change notification settings - Fork 21
/
Copy pathmake_MC-GPU_v1.3.sh
executable file
·47 lines (34 loc) · 2.44 KB
/
make_MC-GPU_v1.3.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
#!/bin/bash
#
# ** Simple script to compile the code MC-GPU v1.3 with CUDA 5.0 **
#
# The installations paths to the CUDA toolkit and SDK (http://www.nvidia.com/cuda) and the MPI
# library path may have to be adapted before runing the script!
# The zlib.h library is used to allow gzip-ed input files.
#
# Default paths:
# CUDA: /usr/local/cuda
# SDK: /usr/local/cuda/samples
# MPI: /usr/include/openmpi
#
#
# @file make_MC-GPU_v1.3.sh
# @author Andreu Badal [Andreu.Badal-Soler(at)fda.hhs.gov]
# @date 2012/12/12
#
# -- Compile GPU code for compute capability 1.3 and 2.0, with MPI:
echo " "
echo " -- Compiling MC-GPU v1.3 with CUDA 5.0 for both compute capability 2.0 and 3.0 (64 bits), with MPI:"
echo " To run a simulation in parallel with openMPI execute:"
echo " $ time mpirun --tag-output -v -x LD_LIBRARY_PATH -hostfile hostfile_gpunodes -n 22 /GPU_cluster/MC-GPU_v1.3.x /GPU_cluster/MC-GPU_v1.3.in | tee MC-GPU_v1.3.out"
echo " "
echo "nvcc MC-GPU_v1.3.cu -o MC-GPU_v1.3.x -m64 -O3 -use_fast_math -DUSING_CUDA -DUSING_MPI -I. -I/usr/local/cuda/include -I/usr/local/cuda/samples/common/inc -I/usr/local/cuda/samples/shared/inc/ -I/usr/include/openmpi -L/usr/lib/ -lmpi -lz --ptxas-options=-v -gencode=arch=compute_20,code=sm_20 -gencode=arch=compute_30,code=sm_30"
nvcc MC-GPU_v1.3.cu -o MC-GPU_v1.3.x -m64 -O3 -use_fast_math -DUSING_CUDA -DUSING_MPI -I. -I/usr/local/cuda/include -I/usr/local/cuda/samples/common/inc -I/usr/local/cuda/samples/shared/inc/ -I/usr/include/openmpi -L/usr/lib/ -lmpi -lz --ptxas-options=-v -gencode=arch=compute_20,code=sm_20 -gencode=arch=compute_30,code=sm_30
# -gencode=arch=compute_13,code=sm_13 -gencode=arch=compute_35,code=sm_35 -gencode=arch=compute_35,code=compute_35
# -- CPU compilation:
# ** GCC (with MPI):
# gcc -x c -DUSING_MPI MC-GPU_v1.3.cu -o MC-GPU_v1.3_gcc_MPI.x -Wall -O3 -ffast-math -ftree-vectorize -ftree-vectorizer-verbose=1 -funroll-loops -static-libgcc -I./ -lm -I/usr/include/openmpi -I/usr/lib/openmpi/include/openmpi/ -L/usr/lib/openmpi/lib -lmpi
# ** Intel compiler (with MPI):
# icc -x c -O3 -ipo -no-prec-div -msse4.2 -parallel -Wall -DUSING_MPI MC-GPU_v1.3.cu -o MC-GPU_v1.3_icc_MPI.x -I./ -lm -I/usr/include/openmpi -L/usr/lib/openmpi/lib/ -lmpi
# ** PGI compiler:
# pgcc -fast,sse -O3 -Mipa=fast -Minfo -csuffix=cu -Mconcur MC-GPU_v1.3.cu -I./ -lm -o MC-GPU_v1.3_PGI.x