root / addons / Build.Debian_CUBLAS.sh
Historique | Voir | Annoter | Télécharger (798 octet)
1 | 9 | equemene | # Script to build HPL using the CUBLAS Fortran thunking wrappers |
---|---|---|---|
2 | 9 | equemene | # |
3 | 9 | equemene | # 2010-11-26 : Initial release |
4 | 9 | equemene | # Emmanuel Quemener <emmanuel.quemener@ens-lyon.fr> |
5 | 9 | equemene | # |
6 | 9 | equemene | # Copy this script into the HPL root folder and execute it from there |
7 | 9 | equemene | |
8 | 9 | equemene | # Define the root folder of the CUDA toolkit (the toolkit's default directory is /usr/local/cuda) |
9 | 9 | equemene | CUDASRC=/opt/cuda |
10 | 9 | equemene | # Remove all object files |
11 | 9 | equemene | find . -name "*.o" -exec rm {} \; |
12 | 9 | equemene | # Copy the sources needed for the CUBLAS thunking approach |
13 | 9 | equemene | cp $CUDASRC/src/fortran_thunking.c $CUDASRC/src/fortran_thunking.h $CUDASRC/src/fortran_common.h . |
14 | 9 | equemene | # Patch Thunking prototypes to compile on Debian Lenny |
15 | 9 | equemene | patch fortran_common.h patch_thunking.h |
16 | 9 | equemene | # Expected patch output: "patching file fortran_common.h"; then compile the thunking wrapper |
17 | 9 | equemene | gcc -funroll-loops -W -I$CUDASRC/include -Wall -O3 -c fortran_thunking.c |
18 | 9 | equemene | # Clean old builds |
19 | 9 | equemene | make arch=Debian_CUBLAS_OpenMPI clean_all_arch |
20 | 9 | equemene | # Compile HPL |
21 | 9 | equemene | make arch=Debian_CUBLAS_OpenMPI |