Statistiques
| Révision :

root / BLAS / xGEMM / Makefile @ 6

Historique | Voir | Annoter | Télécharger (3,34 ko)

1 1 equemene
SOURCE=xGEMM.c
2 1 equemene
3 1 equemene
CC=gcc
4 1 equemene
CFLAGS=-Wall -O3
5 1 equemene
LDFLAGS=-lm
6 1 equemene
CUDADIR=/opt/cuda
7 1 equemene
CUDASRC=$(CUDADIR)/src
8 1 equemene
THUNKING=fortran_thunking.c
9 1 equemene
CUDASRCINC=fortran_common.h
10 1 equemene
CUDAINC=$(CUDADIR)/include
11 1 equemene
CUDALIB=$(CUDADIR)/lib64
12 1 equemene
13 1 equemene
PATCHTHUNKING=patch_thunking.h
14 1 equemene
15 1 equemene
GSLINC=/usr/include/gsl
16 1 equemene
17 1 equemene
GOTO2=/opt/GotoBLAS2
18 1 equemene
19 6 equemene
OPENBLAS=/opt/OpenBLAS
20 6 equemene
21 1 equemene
ACML=/opt/acml
22 1 equemene
ACMLINC=$(ACML)/gfortran64_mp/include
23 1 equemene
ACMLLIB=$(ACML)/gfortran64_mp/lib
24 1 equemene
25 1 equemene
26 6 equemene
EXECUTABLE=cblas fblas gsl cublas thunking gotoblas openblas acml
27 1 equemene
28 1 equemene
FORMAT=DOUBLE
29 1 equemene
#FORMAT=FLOAT
30 1 equemene
31 1 equemene
#DIRECTIVES=-D$(FORMAT) -DPRINT -DUNIT
32 1 equemene
#DIRECTIVES=-D$(FORMAT) -DUNIT -DRESULTS -DQUIET
33 1 equemene
DIRECTIVES=-DUNIT -DQUIET
34 1 equemene
35 1 equemene
all: $(EXECUTABLE)
36 1 equemene
37 1 equemene
cblas: $(SOURCE)
38 1 equemene
39 1 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DFLOAT -DCBLAS $(LDFLAGS) \
40 1 equemene
		$(SOURCE) -lcblas -o $(SOURCE:.c=)_SP_$@
41 1 equemene
42 1 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DDOUBLE -DCBLAS $(LDFLAGS) \
43 1 equemene
		$(SOURCE) -lcblas -o $(SOURCE:.c=)_DP_$@
44 1 equemene
45 1 equemene
gotoblas: $(SOURCE)
46 1 equemene
47 1 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DFLOAT -DCBLAS $(LDFLAGS) \
48 1 equemene
		$(SOURCE) $(GOTO2)/libgoto2.a -lpthread -o $(SOURCE:.c=)_SP_$@
49 1 equemene
50 1 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DDOUBLE -DCBLAS $(LDFLAGS) \
51 1 equemene
		$(SOURCE) $(GOTO2)/libgoto2.a -lpthread -o $(SOURCE:.c=)_DP_$@
52 1 equemene
53 6 equemene
openblas: $(SOURCE)
54 6 equemene
55 6 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DFLOAT -DCBLAS $(LDFLAGS) \
56 6 equemene
		$(SOURCE) $(OPENBLAS)/libopenblas.a -lpthread -o $(SOURCE:.c=)_SP_$@
57 6 equemene
58 6 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DDOUBLE -DCBLAS $(LDFLAGS) \
59 6 equemene
		$(SOURCE) $(OPENBLAS)/libopenblas.a -lpthread -o $(SOURCE:.c=)_DP_$@
60 6 equemene
61 1 equemene
acml: $(SOURCE)
62 1 equemene
63 1 equemene
	$(CC) -I$(ACMLINC) $(CFLAGS) $(DIRECTIVES) -DFLOAT -DACML $(LDFLAGS) \
64 1 equemene
		$(SOURCE) -L$(ACMLLIB) -lacml_mp -lacml_mv \
65 1 equemene
		-lgomp -lgfortran -lpthread -o $(SOURCE:.c=)_SP_$@
66 1 equemene
67 1 equemene
	$(CC) -I$(ACMLINC) $(CFLAGS) $(DIRECTIVES) -DDOUBLE -DACML $(LDFLAGS) \
68 1 equemene
		$(SOURCE) -L$(ACMLLIB) -lacml_mp -lacml_mv \
69 1 equemene
		-lgomp -lgfortran -lpthread -o $(SOURCE:.c=)_DP_$@
70 1 equemene
71 1 equemene
fblas: $(SOURCE)
72 1 equemene
73 1 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DFLOAT -DFBLAS $(LDFLAGS) \
74 1 equemene
		$(SOURCE) -lf77blas -o $(SOURCE:.c=)_SP_$@
75 1 equemene
76 1 equemene
	$(CC) $(CFLAGS) $(DIRECTIVES) -DDOUBLE -DFBLAS $(LDFLAGS) \
77 1 equemene
		$(SOURCE) -lf77blas -o $(SOURCE:.c=)_DP_$@
78 1 equemene
79 1 equemene
80 1 equemene
gsl: $(SOURCE)
81 1 equemene
82 1 equemene
	$(CC) -I$(GSLINC) $(CFLAGS) $(DIRECTIVES) -DFLOAT \
83 1 equemene
		-DGSL $(LDFLAGS) \
84 1 equemene
		$(SOURCE) -lgslcblas -o $(SOURCE:.c=)_SP_$@
85 1 equemene
86 1 equemene
	$(CC) -I$(GSLINC) $(CFLAGS) $(DIRECTIVES) -DDOUBLE \
87 1 equemene
		-DGSL $(LDFLAGS) \
88 1 equemene
		$(SOURCE) -lgslcblas -o $(SOURCE:.c=)_DP_$@
89 1 equemene
90 1 equemene
cublas: $(SOURCE)
91 1 equemene
92 1 equemene
	$(CC) -I$(CUDAINC) -L$(CUDALIB) $(CFLAGS) -DFLOAT \
93 1 equemene
		-DCUBLAS $(LDFLAGS) \
94 1 equemene
		$(DIRECTIVES) $(SOURCE) -lcublas -o $(SOURCE:.c=)_SP_$@
95 1 equemene
96 1 equemene
	$(CC) -I$(CUDAINC) -L$(CUDALIB) $(CFLAGS) -DDOUBLE \
97 1 equemene
		-DCUBLAS $(LDFLAGS) \
98 1 equemene
		$(DIRECTIVES) $(SOURCE) -lcublas -o $(SOURCE:.c=)_DP_$@
99 1 equemene
100 1 equemene
thunking: $(SOURCE)
101 1 equemene
102 1 equemene
	# Copy of source for thunking CUBLAS approach
103 1 equemene
	cp $(CUDASRC)/$(THUNKING) $(CUDASRC)/$(THUNKING:.c=.h) \
104 1 equemene
		$(CUDASRC)/$(CUDASRCINC) .
105 1 equemene
	# Patch Thunking prototypes to compile on Debian Lenny
106 1 equemene
	patch $(CUDASRCINC) $(PATCHTHUNKING)
107 1 equemene
	$(CC) -I$(CUDAINC) $(CFLAGS) -c $(THUNKING)
108 1 equemene
109 1 equemene
	$(CC) -I$(CUDAINC) -L$(CUDALIB) $(CFLAGS) -DFLOAT -DTHUNKING \
110 1 equemene
		$(LDFLAGS) $(DIRECTIVES) $(SOURCE) \
111 1 equemene
		$(THUNKING:.c=.o) -lcublas -o $(SOURCE:.c=)_SP_$@
112 1 equemene
113 1 equemene
	$(CC) -I$(CUDAINC) -L$(CUDALIB) $(CFLAGS) -DDOUBLE -DTHUNKING \
114 1 equemene
		$(LDFLAGS) $(DIRECTIVES) $(SOURCE) \
115 1 equemene
		$(THUNKING:.c=.o) -lcublas -o $(SOURCE:.c=)_DP_$@
116 1 equemene
117 1 equemene
clean: $(SOURCE)
118 1 equemene
	find . -name "$(SOURCE:.c=)_*" -exec rm {} \;
119 1 equemene
	find . -name "$(THUNKING:.c=)*" -exec rm {} \;
120 1 equemene
	find . -name "*~" -exec rm {} \;
121 1 equemene
	find . -name "$(CUDASRCINC)" -exec rm {} \;
122 1 equemene
123 1 equemene
check: $(EXECUTABLE)
124 1 equemene
125 1 equemene
	$(SOURCE:.c=)_SP_$(EXECUTABLE) 2 1