Statistiques
| Révision :

root / setup / Make.Debian_GotoBLAS2_OpenMPI

Historique | Voir | Annoter | Télécharger (8,99 ko)

1 11 equemene
#
2 11 equemene
#  -- High Performance Computing Linpack Benchmark (HPL)
3 11 equemene
#     HPL - 2.0 - September 10, 2008
4 11 equemene
#     Antoine P. Petitet
5 11 equemene
#     University of Tennessee, Knoxville
6 11 equemene
#     Innovative Computing Laboratory
7 11 equemene
#     (C) Copyright 2000-2008 All Rights Reserved
8 11 equemene
#
9 11 equemene
#  -- Copyright notice and Licensing terms:
10 11 equemene
#
11 11 equemene
#  Redistribution  and  use in  source and binary forms, with or without
12 11 equemene
#  modification, are  permitted provided  that the following  conditions
13 11 equemene
#  are met:
14 11 equemene
#
15 11 equemene
#  1. Redistributions  of  source  code  must retain the above copyright
16 11 equemene
#  notice, this list of conditions and the following disclaimer.
17 11 equemene
#
18 11 equemene
#  2. Redistributions in binary form must reproduce  the above copyright
19 11 equemene
#  notice, this list of conditions,  and the following disclaimer in the
20 11 equemene
#  documentation and/or other materials provided with the distribution.
21 11 equemene
#
22 11 equemene
#  3. All  advertising  materials  mentioning  features  or  use of this
23 11 equemene
#  software must display the following acknowledgement:
24 11 equemene
#  This  product  includes  software  developed  at  the  University  of
25 11 equemene
#  Tennessee, Knoxville, Innovative Computing Laboratory.
26 11 equemene
#
27 11 equemene
#  4. The name of the  University,  the name of the  Laboratory,  or the
28 11 equemene
#  names  of  its  contributors  may  not  be used to endorse or promote
29 11 equemene
#  products  derived   from   this  software  without  specific  written
30 11 equemene
#  permission.
31 11 equemene
#
32 11 equemene
#  -- Disclaimer:
33 11 equemene
#
34 11 equemene
#  THIS  SOFTWARE  IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
35 11 equemene
#  ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,  INCLUDING,  BUT NOT
36 11 equemene
#  LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
37 11 equemene
#  A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
38 11 equemene
#  OR  CONTRIBUTORS  BE  LIABLE FOR ANY  DIRECT,  INDIRECT,  INCIDENTAL,
39 11 equemene
#  SPECIAL,  EXEMPLARY,  OR  CONSEQUENTIAL DAMAGES  (INCLUDING,  BUT NOT
40 11 equemene
#  LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
41 11 equemene
#  DATA OR PROFITS; OR BUSINESS INTERRUPTION)  HOWEVER CAUSED AND ON ANY
42 11 equemene
#  THEORY OF LIABILITY, WHETHER IN CONTRACT,  STRICT LIABILITY,  OR TORT
43 11 equemene
#  (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
44 11 equemene
#  OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
45 11 equemene
# ######################################################################
46 11 equemene
#
47 11 equemene
# ----------------------------------------------------------------------
48 11 equemene
# - shell --------------------------------------------------------------
49 11 equemene
# ----------------------------------------------------------------------
50 11 equemene
#
51 11 equemene
SHELL        = /bin/sh
52 11 equemene
#
53 11 equemene
CD           = cd
54 11 equemene
CP           = cp
55 11 equemene
LN_S         = ln -s
56 11 equemene
MKDIR        = mkdir
57 11 equemene
RM           = /bin/rm -f
58 11 equemene
TOUCH        = touch
59 11 equemene
#
60 11 equemene
# ----------------------------------------------------------------------
61 11 equemene
# - Platform identifier ------------------------------------------------
62 11 equemene
# ----------------------------------------------------------------------
63 11 equemene
#
64 11 equemene
ARCH         = $(arch)
65 11 equemene
#
66 11 equemene
# ----------------------------------------------------------------------
67 11 equemene
# - HPL Directory Structure / HPL library ------------------------------
68 11 equemene
# ----------------------------------------------------------------------
69 11 equemene
#
70 11 equemene
TOPdir       = $(topdir)
71 11 equemene
INCdir       = $(TOPdir)/include
72 11 equemene
BINdir       = $(TOPdir)/bin/$(ARCH)
73 11 equemene
LIBdir       = $(TOPdir)/lib/$(ARCH)
74 11 equemene
#
75 11 equemene
HPLlib       = $(LIBdir)/libhpl.a
76 11 equemene
#
77 11 equemene
# ----------------------------------------------------------------------
78 11 equemene
# - Message Passing library (MPI) --------------------------------------
79 11 equemene
# ----------------------------------------------------------------------
80 11 equemene
# MPinc tells the  C  compiler where to find the Message Passing library
81 11 equemene
# header files,  MPlib  is defined  to be the name of  the library to be
82 11 equemene
# used. The variable MPdir is only used for defining MPinc and MPlib.
83 11 equemene
#
84 11 equemene
MPdir        = /usr/lib/openmpi
85 11 equemene
MPinc        = -I/include/include/openmpi
86 11 equemene
MPlib        = -L$(MPdir)/lib/libmpi.so
87 11 equemene
#
88 11 equemene
# ----------------------------------------------------------------------
89 11 equemene
# - Linear Algebra library (BLAS or VSIPL) -----------------------------
90 11 equemene
# ----------------------------------------------------------------------
91 11 equemene
# LAinc tells the  C  compiler where to find the Linear Algebra  library
92 11 equemene
# header files,  LAlib  is defined  to be the name of  the library to be
93 11 equemene
# used. The variable LAdir is only used for defining LAinc and LAlib.
94 11 equemene
#
95 11 equemene
LAdir        = /opt/GotoBLAS2
96 11 equemene
LAinc        = -I/opt/GotoBLAS2
97 11 equemene
LAlib        = $(LAdir)/libgoto2.a
98 11 equemene
#
99 11 equemene
# ----------------------------------------------------------------------
100 11 equemene
# - F77 / C interface --------------------------------------------------
101 11 equemene
# ----------------------------------------------------------------------
102 11 equemene
# You can skip this section  if and only if  you are not planning to use
103 11 equemene
# a  BLAS  library featuring a Fortran 77 interface.  Otherwise,  it  is
104 11 equemene
# necessary  to  fill out the  F2CDEFS  variable  with  the  appropriate
105 11 equemene
# options.  **One and only one**  option should be chosen in **each** of
106 11 equemene
# the 3 following categories:
107 11 equemene
#
108 11 equemene
# 1) name space (How C calls a Fortran 77 routine)
109 11 equemene
#
110 11 equemene
# -DAdd_              : all lower case and a suffixed underscore  (Suns,
111 11 equemene
#                       Intel, ...),                           [default]
112 11 equemene
# -DNoChange          : all lower case (IBM RS6000),
113 11 equemene
# -DUpCase            : all upper case (Cray),
114 11 equemene
# -DAdd__             : the FORTRAN compiler in use is f2c.
115 11 equemene
#
116 11 equemene
# 2) C and Fortran 77 integer mapping
117 11 equemene
#
118 11 equemene
# -DF77_INTEGER=int   : Fortran 77 INTEGER is a C int,         [default]
119 11 equemene
# -DF77_INTEGER=long  : Fortran 77 INTEGER is a C long,
120 11 equemene
# -DF77_INTEGER=short : Fortran 77 INTEGER is a C short.
121 11 equemene
#
122 11 equemene
# 3) Fortran 77 string handling
123 11 equemene
#
124 11 equemene
# -DStringSunStyle    : The string address is passed at the string loca-
125 11 equemene
#                       tion on the stack, and the string length is then
126 11 equemene
#                       passed as  an  F77_INTEGER  after  all  explicit
127 11 equemene
#                       stack arguments,                       [default]
128 11 equemene
# -DStringStructPtr   : The address  of  a  structure  is  passed  by  a
129 11 equemene
#                       Fortran 77  string,  and the structure is of the
130 11 equemene
#                       form: struct {char *cp; F77_INTEGER len;},
131 11 equemene
# -DStringStructVal   : A structure is passed by value for each  Fortran
132 11 equemene
#                       77 string,  and  the  structure is  of the form:
133 11 equemene
#                       struct {char *cp; F77_INTEGER len;},
134 11 equemene
# -DStringCrayStyle   : Special option for  Cray  machines,  which  uses
135 11 equemene
#                       Cray  fcd  (fortran  character  descriptor)  for
136 11 equemene
#                       interoperation.
137 11 equemene
#
138 11 equemene
F2CDEFS      =
139 11 equemene
#
140 11 equemene
# ----------------------------------------------------------------------
141 11 equemene
# - HPL includes / libraries / specifics -------------------------------
142 11 equemene
# ----------------------------------------------------------------------
143 11 equemene
#
144 11 equemene
HPL_INCLUDES = -I$(INCdir) -I$(INCdir)/$(ARCH) $(LAinc) $(MPinc)
145 11 equemene
HPL_LIBS     = $(HPLlib) $(LAlib) $(MPlib)
146 11 equemene
#
147 11 equemene
# - Compile time options -----------------------------------------------
148 11 equemene
#
149 11 equemene
# -DHPL_COPY_L           force the copy of the panel L before bcast;
150 11 equemene
# -DHPL_CALL_CBLAS       call the cblas interface;
151 11 equemene
# -DHPL_CALL_VSIPL       call the vsip  library;
152 11 equemene
# -DHPL_CALL_CUBLAS      call the CuBLAS library from Nvidia Cuda;
153 11 equemene
# -DHPL_CALL_ACML        call the ACML library from ATI;
154 11 equemene
# -DHPL_CALL_GOTOBLAS    call the ACML library from ATI;
155 11 equemene
156 11 equemene
# -DHPL_DETAILED_TIMING  enable detailed timers;
157 11 equemene
#
158 11 equemene
# By default HPL will:
159 11 equemene
#    *) not copy L before broadcast,
160 11 equemene
#    *) call the BLAS Fortran 77 interface,
161 11 equemene
#    *) not display detailed timing information.
162 11 equemene
#
163 11 equemene
HPL_OPTS     = -DHPL_CALL_CBLAS
164 11 equemene
#
165 11 equemene
# ----------------------------------------------------------------------
166 11 equemene
#
167 11 equemene
HPL_DEFS     = $(F2CDEFS) $(HPL_OPTS) $(HPL_INCLUDES)
168 11 equemene
#
169 11 equemene
# ----------------------------------------------------------------------
170 11 equemene
# - Compilers / linkers - Optimization flags ---------------------------
171 11 equemene
# ----------------------------------------------------------------------
172 11 equemene
#
173 11 equemene
CC           = /usr/bin/mpicc.openmpi
174 11 equemene
CCNOOPT      = $(HPL_DEFS)
175 11 equemene
CCFLAGS      = $(HPL_DEFS) -fomit-frame-pointer -O3 -funroll-loops -W -Wall
176 11 equemene
#
177 11 equemene
# On some platforms,  it is necessary  to use the Fortran linker to find
178 11 equemene
# the Fortran internals used in the BLAS library.
179 11 equemene
#
180 11 equemene
LINKER       = /usr/bin/mpicc.openmpi
181 11 equemene
LINKFLAGS    = $(CCFLAGS)
182 11 equemene
#
183 11 equemene
ARCHIVER     = ar
184 11 equemene
ARFLAGS      = r
185 11 equemene
RANLIB       = echo
186 11 equemene
#
187 11 equemene
# ----------------------------------------------------------------------