Révision 146
BLAS/xGEMM/Makefile (revision 146) | ||
---|---|---|
1 | 1 |
SOURCE=xGEMM.c |
2 | 2 |
|
3 |
CC=gcc-4.7
|
|
4 |
FC=gfortran-4.7
|
|
3 |
CC=gcc |
|
4 |
FC=gfortran |
|
5 | 5 |
CFLAGS=-Wall -O3 -ffast-math |
6 | 6 |
LDFLAGS=-lm |
7 | 7 |
CUDASRC=/usr/share/doc/nvidia-cuda-doc/examples/ |
... | ... | |
9 | 9 |
CUDASRCINC=fortran_common.h |
10 | 10 |
CUDAINC=/usr/include |
11 | 11 |
CUDALIB=/usr/lib/x86_64-linux-gnu/ |
12 |
CLBLASINC=/opt/clBLAS/build/include
|
|
13 |
CLBLASLIB=/opt/clBLAS/build/library/
|
|
12 |
CLBLASINC=/usr/include
|
|
13 |
CLBLASLIB=/usr/lib
|
|
14 | 14 |
# CLBLASINC=/opt/clBLAS/src |
15 | 15 |
# CLBLASLIB=/opt/clBLAS/src/library/ |
16 | 16 |
|
... | ... | |
20 | 20 |
|
21 | 21 |
GOTO2=/opt/GotoBLAS2 |
22 | 22 |
|
23 |
OPENBLAS=/usr/lib/openblas-base |
|
23 |
#OPENBLAS=/usr/lib/openblas-base |
|
24 |
OPENBLAS=/usr/lib |
|
24 | 25 |
|
25 | 26 |
ACML=/opt/acml |
26 | 27 |
ACMLINC=$(ACML)/gfortran64_mp/include |
... | ... | |
28 | 29 |
|
29 | 30 |
ATLAS=/usr/lib/atlas-base |
30 | 31 |
|
31 |
EXECUTABLE=cblas fblas gsl cublas thunking openblas acml clblas |
|
32 |
#EXECUTABLE=cblas fblas gsl cublas thunking openblas acml clblas |
|
33 |
#EXECUTABLE=cblas fblas gsl cublas thunking openblas clblas |
|
34 |
#EXECUTABLE=gsl openblas clblas cublas thunking |
|
35 |
#EXECUTABLE=openblas clblas cublas thunking |
|
36 |
#EXECUTABLE=clblas cublas thunking |
|
37 |
EXECUTABLE=openblas |
|
32 | 38 |
|
33 | 39 |
FORMAT=DOUBLE |
34 | 40 |
#FORMAT=FLOAT |
... | ... | |
57 | 63 |
|
58 | 64 |
openblas: $(SOURCE) |
59 | 65 |
|
60 |
$(CC) $(CFLAGS) $(DIRECTIVES) -fopenmp -DFLOAT -DCBLAS $(LDFLAGS) \ |
|
66 |
$(CC) $(CFLAGS) $(DIRECTIVES) -L/usr/include/openblas -fopenmp -DFLOAT -DCBLAS $(LDFLAGS) \
|
|
61 | 67 |
$(SOURCE) $(OPENBLAS)/libopenblas.a -lpthread -o $(SOURCE:.c=)_SP_$@ |
62 | 68 |
|
63 |
$(CC) $(CFLAGS) $(DIRECTIVES) -fopenmp -DDOUBLE -DCBLAS $(LDFLAGS) \ |
|
69 |
$(CC) $(CFLAGS) $(DIRECTIVES) -L/usr/include/openblas -fopenmp -DDOUBLE -DCBLAS $(LDFLAGS) \
|
|
64 | 70 |
$(SOURCE) $(OPENBLAS)/libopenblas.a -lpthread -o $(SOURCE:.c=)_DP_$@ |
65 | 71 |
|
66 | 72 |
acml: $(SOURCE) |
BLAS/xGEMM/xGEMM.c (revision 146) | ||
---|---|---|
37 | 37 |
#include <acml.h> |
38 | 38 |
#else |
39 | 39 |
#include <cblas.h> |
40 |
#include <blaswrap.h> |
|
40 | 41 |
#endif |
41 | 42 |
|
42 | 43 |
#ifdef CLBLAS |
... | ... | |
597 | 598 |
dim,dim,dim,alpha,A,dim,B,dim,beta,C,dim); |
598 | 599 |
cblas_dgemm(CblasRowMajor,CblasTrans,CblasTrans, |
599 | 600 |
dim,dim,dim,alpha,B,dim,A,dim,beta,D,dim); |
601 |
/* dgemm(CblasRowMajor,CblasNoTrans,CblasNoTrans, */ |
|
602 |
/* dim,dim,dim,alpha,A,dim,B,dim,beta,C,dim); */ |
|
603 |
/* dgemm(CblasRowMajor,CblasTrans,CblasTrans, */ |
|
604 |
/* dim,dim,dim,alpha,B,dim,A,dim,beta,D,dim); */ |
|
600 | 605 |
} |
601 | 606 |
|
602 | 607 |
#else |
... | ... | |
607 | 612 |
dim,dim,dim,alpha,A,dim,B,dim,beta,C,dim); |
608 | 613 |
cblas_sgemm(CblasRowMajor,CblasTrans,CblasTrans, |
609 | 614 |
dim,dim,dim,alpha,B,dim,A,dim,beta,D,dim); |
615 |
/* sgemm(CblasRowMajor,CblasNoTrans,CblasNoTrans, */ |
|
616 |
/* dim,dim,dim,alpha,A,dim,B,dim,beta,C,dim); */ |
|
617 |
/* sgemm(CblasRowMajor,CblasTrans,CblasTrans, */ |
|
618 |
/* dim,dim,dim,alpha,B,dim,A,dim,beta,D,dim); */ |
|
610 | 619 |
} |
611 | 620 |
|
612 | 621 |
#endif |
Formats disponibles : Unified diff