Statistiques
| Révision :

root / testing / matgen / HPL_lmul.c @ 9

Historique | Voir | Annoter | Télécharger (5,4 ko)

1
/* 
2
 * -- High Performance Computing Linpack Benchmark (HPL)                
3
 *    HPL - 2.0 - September 10, 2008                          
4
 *    Antoine P. Petitet                                                
5
 *    University of Tennessee, Knoxville                                
6
 *    Innovative Computing Laboratory                                 
7
 *    (C) Copyright 2000-2008 All Rights Reserved                       
8
 *                                                                      
9
 * -- Copyright notice and Licensing terms:                             
10
 *                                                                      
11
 * Redistribution  and  use in  source and binary forms, with or without
12
 * modification, are  permitted provided  that the following  conditions
13
 * are met:                                                             
14
 *                                                                      
15
 * 1. Redistributions  of  source  code  must retain the above copyright
16
 * notice, this list of conditions and the following disclaimer.        
17
 *                                                                      
18
 * 2. Redistributions in binary form must reproduce  the above copyright
19
 * notice, this list of conditions,  and the following disclaimer in the
20
 * documentation and/or other materials provided with the distribution. 
21
 *                                                                      
22
 * 3. All  advertising  materials  mentioning  features  or  use of this
23
 * software must display the following acknowledgement:                 
24
 * This  product  includes  software  developed  at  the  University  of
25
 * Tennessee, Knoxville, Innovative Computing Laboratory.             
26
 *                                                                      
27
 * 4. The name of the  University,  the name of the  Laboratory,  or the
28
 * names  of  its  contributors  may  not  be used to endorse or promote
29
 * products  derived   from   this  software  without  specific  written
30
 * permission.                                                          
31
 *                                                                      
32
 * -- Disclaimer:                                                       
33
 *                                                                      
34
 * THIS  SOFTWARE  IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
35
 * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES,  INCLUDING,  BUT NOT
36
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
37
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
38
 * OR  CONTRIBUTORS  BE  LIABLE FOR ANY  DIRECT,  INDIRECT,  INCIDENTAL,
39
 * SPECIAL,  EXEMPLARY,  OR  CONSEQUENTIAL DAMAGES  (INCLUDING,  BUT NOT
40
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
41
 * DATA OR PROFITS; OR BUSINESS INTERRUPTION)  HOWEVER CAUSED AND ON ANY
42
 * THEORY OF LIABILITY, WHETHER IN CONTRACT,  STRICT LIABILITY,  OR TORT
43
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
44
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
45
 * ---------------------------------------------------------------------
46
 */ 
47
/*
48
 * Include files
49
 */
50
#include "hpl.h"
51

    
52
#ifdef STDC_HEADERS
void HPL_lmul
(
   int *                            K,
   int *                            J,
   int *                            I
)
#else
void HPL_lmul
( K, J, I )
   int *                            K;
   int *                            J;
   int *                            I;
#endif
{
/* 
 * Purpose
 * =======
 *
 * HPL_lmul computes the product of the two long integers K and J and
 * stores it in I.  Each long integer is a 64-bit quantity held in an
 * array of 2 ints: entry 0 supplies the 32 low-order bits and entry 1
 * the 32 high-order bits.  Only the low 64 bits of the product are
 * kept; whatever is carried out of the most significant 16-bit digit
 * is discarded.  The product is formed by hand on 16-bit digits, so
 * that no intermediate value ever needs more than 32 bits.
 *
 * K and J are read completely before anything is stored into I, hence
 * I may refer to the same array as K or J.
 *
 * Arguments
 * =========
 *
 * K       (local input)                 int *
 *         On entry, K is an integer array of dimension 2 holding the
 *         first encoded long integer operand.
 *
 * J       (local input)                 int *
 *         On entry, J is an integer array of dimension 2 holding the
 *         second encoded long integer operand.
 *
 * I       (local output)                int *
 *         On entry, I is an integer array of dimension 2.  On exit, I
 *         holds the encoded low 64 bits of the product K * J.
 *
 * ---------------------------------------------------------------------
 */ 
/*
 * .. Local Variables ..
 */
   const unsigned int         lo16 = 65535u;
   unsigned int               kdig[4], jdig[4], col[5];
   unsigned int               kw, jw, term, carry;
   int                        w, d, i;
/* ..
 * .. Executable Statements ..
 */
/*
 * Cut every 32-bit word of K and J into two 16-bit digits, stored
 * least significant digit first.
 */
   for( w = 0; w < 2; w++ )
   {
      kw = (unsigned int)( K[w] );
      jw = (unsigned int)( J[w] );

      kdig[2*w  ] = kw & lo16;
      kdig[2*w+1] = ( kw >> 16 ) & lo16;
      jdig[2*w  ] = jw & lo16;
      jdig[2*w+1] = ( jw >> 16 ) & lo16;
   }
/*
 * Schoolbook multiplication, one result digit (column) at a time.  On
 * entry to column d, col[d] holds the carries gathered from column d-1;
 * these may exceed 16 bits, so their upper part seeds the carry for
 * column d+1.  A 16-bit by 16-bit product plus a 16-bit digit always
 * fits in 32 bits, so term cannot wrap around.
 */
   col[0] = 0;

   for( d = 0; d < 4; d++ )
   {
      carry   = ( col[d] >> 16 ) & lo16;
      col[d] &= lo16;

      for( i = 0; i <= d; i++ )
      {
         term   = kdig[i] * jdig[d-i] + col[d];
         col[d] = term & lo16;
         carry += ( term >> 16 ) & lo16;
      }
/*
 * For d = 3 this is the overflow past 64 bits; it is never read back.
 */
      col[d+1] = carry;
   }
/*
 * Glue pairs of 16-bit digits back into the two 32-bit output words.
 */
   for( w = 0; w < 2; w++ )
   {
      I[w] = (int)( ( ( col[2*w+1] & lo16 ) << 16 ) | ( col[2*w] & lo16 ) );
   }
/*
 * End of HPL_lmul
 */
}