Statistiques
| Révision :

root / Pi / C / OpenMP / XeonPhi / Pi_OpenMP.c @ 186

Historique | Voir | Annoter | Télécharger (5,49 ko)

1 78 equemene
//
2 78 equemene
// Estimation of Pi using Monte Carlo exploration process
3 83 equemene
// Cecill v2 Emmanuel QUEMENER <emmanuel.quemener@gmail.com>
4 82 equemene
// Exploit OpenMP on Xeon Phi
5 82 equemene
// source /opt/intel/bin/compilervars.sh intel64
6 82 equemene
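// icpc -std=c99 -O3 -o Pi Pi.c -lm
// Select the generator with -DTCONG, -DTSHR3, -DTMWC or -DTKISS and the
// coordinate type with -DTINT32, -DTINT64, -DTFP32 or -DTFP64; add -DLONG
// to count iterations with long long instead of int.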
7 78 equemene
//
8 78 equemene
9 78 equemene
#include <math.h>
10 78 equemene
#include <stdio.h>
11 78 equemene
#include <stdlib.h>
12 78 equemene
#include <omp.h>
13 78 equemene
#include <limits.h>
14 184 equemene
#include <sys/time.h>
15 78 equemene
16 78 equemene
// Marsaglia's simple generators: MWC, SHR3, CONG and their combination KISS.
// Every macro updates `unsigned int` state variables (z, w, jsr, jcong) that
// must be in scope at the point of expansion.
#define znew  ((z=36969*(z&65535)+(z>>16))<<16)
#define wnew  ((w=18000*(w&65535)+(w>>16))&65535)
#define MWC   (znew+wnew)
// The three xorshift steps are chained with the comma operator so that each
// update of jsr is sequenced before the next read. Nesting the assignments
// inside one expression modifies and reads jsr without sequencing, which is
// undefined behaviour in C.
#define SHR3  (jsr^=(jsr<<17),jsr^=(jsr>>13),jsr^=(jsr<<5))
#define CONG  (jcong=69069*jcong+1234567)
#define KISS  ((MWC^CONG)+SHR3)

// Factor (about 2^-32) that scales a 32-bit draw down to the unit interval.
#define UNITSCALE 2.328306435454494e-10f

#define MWCfp  (MWC * UNITSCALE)
#define KISSfp (KISS * UNITSCALE)
#define SHR3fp (SHR3 * UNITSCALE)
#define CONGfp (CONG * UNITSCALE)

#define ITERATIONS 1000000000

#define PARALLELRATE 1024

#ifdef LONG
#define LENGTH long long
#else
#define LENGTH int
#endif

// Fall back to MWC / FP32 when no selector is given, so that a plain build
// without any -D option still compiles.
#if !defined TCONG && !defined TSHR3 && !defined TMWC && !defined TKISS
#define TMWC
#endif
#if !defined TINT32 && !defined TINT64 && !defined TFP32 && !defined TFP64
#define TFP32
#endif

// RNGDRAW is the selected generator. When several selectors are defined the
// first match in the order CONG, SHR3, MWC, KISS wins.
#if defined TCONG
#define RNGDRAW CONG
#elif defined TSHR3
#define RNGDRAW SHR3
#elif defined TMWC
#define RNGDRAW MWC
#else
#define RNGDRAW KISS
#endif

// THEONE is the squared radius of the quarter disc in the units of the
// selected coordinate type: 2^30 for 15-bit coordinates, 2^62 for 31-bit
// coordinates, 1 for floating point coordinates.
#if defined TINT32
#define THEONE 1073741824U
#elif defined TINT64
#define THEONE 4611686018427387904ULL
#elif defined TFP32
#define THEONE 1.0f
#else
#define THEONE 1.0
#endif

// splitter() is host code (it allocates, times and prints), so its prototype
// stays outside the declare target region.
LENGTH splitter(LENGTH iterations,int seed_w,int seed_z,int ParallelRate);

#pragma omp declare target

// Draw `iterations` points (x,y) with the selected generator and return how
// many of them satisfy x*x+y*y < THEONE.
//   iterations : number of points to draw; zero or negative yields 0
//   seed_w     : seed for the w (MWC) and jsr (SHR3) state
//   seed_z     : seed for the z (MWC) and jcong (CONG) state
// The result is fully determined by the arguments and the build selectors.
LENGTH MainLoopGlobal(LENGTH iterations,unsigned int seed_w,unsigned int seed_z)
{
   // Only the state needed by the selected generator is declared.
#if defined TCONG
   unsigned int jcong=seed_z;
#elif defined TSHR3
   unsigned int jsr=seed_w;
#elif defined TMWC
   unsigned int z=seed_z;
   unsigned int w=seed_w;
#else
   unsigned int jcong=seed_z;
   unsigned int jsr=seed_w;
   unsigned int z=seed_z;
   unsigned int w=seed_w;
#endif

   LENGTH total=0;

   for (LENGTH i=0;i<iterations;i++) {

      // x is always drawn before y, each in its own statement.
#if defined TINT32
      // Keep 15 bits so that x*x+y*y stays below 2^31.
      unsigned int x=RNGDRAW>>17;
      unsigned int y=RNGDRAW>>17;
#elif defined TINT64
      // Keep 31 bits; unsigned long long guarantees room for the 2^63 bound
      // on x*x+y*y even where long is only 32 bits wide.
      unsigned long long x=(unsigned long long)(RNGDRAW>>1);
      unsigned long long y=(unsigned long long)(RNGDRAW>>1);
#elif defined TFP32
      float x=RNGDRAW*UNITSCALE;
      float y=RNGDRAW*UNITSCALE;
#else
      // The draw is widened to double before scaling.
      double x=(double)RNGDRAW*UNITSCALE;
      double y=(double)RNGDRAW*UNITSCALE;
#endif

      // Matching test
      total+=((x*x+y*y) < THEONE) ? 1:0;
   }

   return(total);
}

#pragma omp end declare target
132 78 equemene
133 184 equemene
// Split the work into ParallelRate independent chunks, run them in an OpenMP
// target region on device 0, print the per-chunk counts and the timing, and
// return the sum of all counts.
//   iterations   : requested number of draws; each chunk runs
//                  ceil(iterations/ParallelRate) draws, so the work actually
//                  done is rounded up to a multiple of ParallelRate
//   seed_w       : base seed, chunk i uses seed_w+i
//   seed_z       : base seed, chunk i uses seed_z+i
//   ParallelRate : number of chunks, must be at least 1
// Returns 0 after a message on stderr when ParallelRate is not positive or
// the result buffer cannot be allocated.
LENGTH splitter(LENGTH iterations,int seed_w,int seed_z,int ParallelRate) {

  if (ParallelRate < 1) {
    fprintf(stderr,"splitter: ParallelRate must be at least 1 (got %i)\n",ParallelRate);
    return(0);
  }

  // Ceiling division: a remainder costs every chunk one extra draw.
  LENGTH IterationsEach=iterations/ParallelRate;
  if ((iterations%ParallelRate)!=0) {
    IterationsEach++;
  }

  LENGTH *inside=malloc(sizeof *inside*(size_t)ParallelRate);
  if (inside == NULL) {
    fprintf(stderr,"splitter: cannot allocate %i result slots\n",ParallelRate);
    return(0);
  }

  struct timeval tv1,tv2;
  gettimeofday(&tv1, NULL);

  // The map clause copies the per-chunk results back from the device; without
  // it only the pointer value is visible to the target region.
#pragma omp target device(0) map(from:inside[0:ParallelRate])
#pragma omp teams num_teams(60) thread_limit(4)
#pragma omp distribute
  for (int i=0 ; i<ParallelRate; i++) {
    // Offsets are added in unsigned arithmetic, which wraps instead of
    // overflowing; MainLoopGlobal takes unsigned seeds anyway.
    inside[i]=MainLoopGlobal(IterationsEach,
                             (unsigned int)seed_w+(unsigned int)i,
                             (unsigned int)seed_z+(unsigned int)i);
  }

  LENGTH insides=0;
  for (int i=0 ; i<ParallelRate; i++) {
    insides+=inside[i];
  }

  gettimeofday(&tv2, NULL);

  for (int i=0 ; i<ParallelRate; i++) {
    printf("\tFound %lld for process %i\n",(long long)inside[i],i);
  }
  printf("\n");

  double elapsed=(double)((tv2.tv_sec-tv1.tv_sec) * 1000000L +
                          (tv2.tv_usec-tv1.tv_usec))/1000000;

  // Multiply as doubles so the product cannot overflow LENGTH, and report 0
  // when the clock did not advance.
  double itops=(elapsed > 0.0)?(double)ParallelRate*(double)IterationsEach/elapsed:0.0;

  printf("ParallelRate %i\nElapsed Time %.2f\nItops %.0f\n",ParallelRate,elapsed,itops);

  free(inside);
  return(insides);
}
174 78 equemene
175 78 equemene
int main(int argc, char *argv[]) {
176 78 equemene
177 184 equemene
  unsigned int seed_w=110271,seed_z=101008,ParallelRate=PARALLELRATE;
178 78 equemene
  LENGTH iterations=ITERATIONS;
179 82 equemene
  LENGTH insides=0;
180 78 equemene
181 78 equemene
  if (argc > 1) {
182 78 equemene
    iterations=(LENGTH)atoll(argv[1]);
183 184 equemene
    ParallelRate=atoi(argv[2]);
184 78 equemene
  }
185 78 equemene
  else {
186 78 equemene
    printf("\n\tPi : Estimate Pi with Monte Carlo exploration\n\n");
187 78 equemene
    printf("\t\t#1 : number of iterations (default 1 billion)\n");
188 184 equemene
    printf("\t\t#2 : ParallelRate (default 1024)\n\n");
189 78 equemene
  }
190 78 equemene
191 78 equemene
  printf ("\n\tInformation about architecture:\n\n");
192 78 equemene
193 78 equemene
  printf ("\tSizeof int = %lld bytes.\n", (long long)sizeof(int));
194 78 equemene
  printf ("\tSizeof long = %lld bytes.\n", (long long)sizeof(long));
195 78 equemene
  printf ("\tSizeof long long = %lld bytes.\n\n", (long long)sizeof(long long));
196 78 equemene
197 78 equemene
  printf ("\tMax int = %u\n", INT_MAX);
198 78 equemene
  printf ("\tMax long = %ld\n", LONG_MAX);
199 78 equemene
  printf ("\tMax long long = %lld\n\n", LLONG_MAX);
200 78 equemene
201 184 equemene
  insides=splitter(iterations,seed_w,seed_z,ParallelRate);
202 78 equemene
203 184 equemene
  LENGTH total=((iterations%ParallelRate)==0)?iterations:(iterations/ParallelRate+1)*ParallelRate;
204 78 equemene
205 184 equemene
  printf("Inside/Total %ld %ld\nPi estimation %f\n\n",insides,total,(4.*(float)insides/total));
206 78 equemene
207 78 equemene
}