Statistiques
| Révision :

root / Pi / C / OpenMP / Pi_OpenMP.c @ 308

Historique | Voir | Annoter | Télécharger (5,33 ko)

1 8 equemene
//
2 8 equemene
// Estimation of Pi using Monte Carlo exploration process
3 84 equemene
// Cecill v2 Emmanuel QUEMENER <emmanuel.quemener@gmail.com>
4 247 equemene
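// gcc -std=c99 -O3 -fopenmp -DTFP32 -DTMWC -o Pi_OpenMP Pi_OpenMP.c -lm
// (choose one of -DTINT32/-DTINT64/-DTFP32/-DTFP64 and one of
//  -DTCONG/-DTSHR3/-DTMWC/-DTKISS; add -DLONG for long long counters)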
5 8 equemene
//
6 8 equemene
7 8 equemene
#include <math.h>
8 8 equemene
#include <stdio.h>
9 8 equemene
#include <stdlib.h>
10 8 equemene
#include <omp.h>
11 29 equemene
#include <limits.h>
12 185 equemene
#include <sys/time.h>
13 8 equemene
14 8 equemene
// Marsaglia RNG very simple implementation.
// Each macro updates `unsigned int` state variables that must be in scope
// where the macro is used, and evaluates to the next 32-bit draw:
//   MWC  uses z and w (through znew and wnew)
//   SHR3 uses jsr
//   CONG uses jcong
//   KISS combines MWC, CONG and SHR3
#define znew  ((z=36969*(z&65535)+(z>>16))<<16)
#define wnew  ((w=18000*(w&65535)+(w>>16))&65535)
#define MWC   (znew+wnew)
// The three xor-shift steps are separated by comma operators: nesting the
// assignments in a single expression would read jsr while an unsequenced
// assignment modifies it, which is undefined behavior in C.
#define SHR3  (jsr^=(jsr<<17),jsr^=(jsr>>13),jsr^=(jsr<<5))
#define CONG  (jcong=69069*jcong+1234567)
#define KISS  ((MWC^CONG)+SHR3)

// Floating-point variants: the 32-bit draw scaled by roughly 2^-32.
// They are intentionally NOT parenthesized: callers write `(double)MWCfp`
// and rely on the cast binding to the integer draw before the product.
#define MWCfp MWC * 2.328306435454494e-10f
#define KISSfp KISS * 2.328306435454494e-10f
#define SHR3fp SHR3 * 2.328306435454494e-10f
#define CONGfp CONG * 2.328306435454494e-10f
26 8 equemene
27 8 equemene
// Number of Monte Carlo draws used when none is given on the command line.
#define ITERATIONS 1000000000

// Number of work slices used when none is given on the command line.
#define PARALLELRATE 1024

// Integer type of the iteration and hit counters:
// long long when built with -DLONG, int otherwise.
#ifdef LONG
#define LENGTH long long
#else
#define LENGTH int
#endif
36 8 equemene
37 8 equemene
LENGTH MainLoopGlobal(LENGTH iterations,unsigned int seed_w,unsigned int seed_z)
38 8 equemene
{
39 84 equemene
#if defined TCONG
40 84 equemene
   unsigned int jcong=seed_z;
41 84 equemene
#elif defined TSHR3
42 84 equemene
   unsigned int jsr=seed_w;
43 84 equemene
#elif defined TMWC
44 8 equemene
   unsigned int z=seed_z;
45 8 equemene
   unsigned int w=seed_w;
46 84 equemene
#elif defined TKISS
47 84 equemene
   unsigned int jcong=seed_z;
48 84 equemene
   unsigned int jsr=seed_w;
49 84 equemene
   unsigned int z=seed_z;
50 84 equemene
   unsigned int w=seed_w;
51 84 equemene
#endif
52 8 equemene
53 8 equemene
   LENGTH total=0;
54 84 equemene
55 8 equemene
   for (LENGTH i=0;i<iterations;i++) {
56 8 equemene
57 84 equemene
#if defined TINT32
58 84 equemene
    #define THEONE 1073741824
59 84 equemene
    #if defined TCONG
60 84 equemene
        unsigned int x=CONG>>17 ;
61 84 equemene
        unsigned int y=CONG>>17 ;
62 84 equemene
    #elif defined TSHR3
63 84 equemene
        unsigned int x=SHR3>>17 ;
64 84 equemene
        unsigned int y=SHR3>>17 ;
65 84 equemene
    #elif defined TMWC
66 84 equemene
        unsigned int x=MWC>>17 ;
67 84 equemene
        unsigned int y=MWC>>17 ;
68 84 equemene
    #elif defined TKISS
69 84 equemene
        unsigned int x=KISS>>17 ;
70 84 equemene
        unsigned int y=KISS>>17 ;
71 84 equemene
    #endif
72 84 equemene
#elif defined TINT64
73 84 equemene
    #define THEONE 4611686018427387904
74 84 equemene
    #if defined TCONG
75 84 equemene
        unsigned long x=(unsigned long)(CONG>>1) ;
76 84 equemene
        unsigned long y=(unsigned long)(CONG>>1) ;
77 84 equemene
    #elif defined TSHR3
78 84 equemene
        unsigned long x=(unsigned long)(SHR3>>1) ;
79 84 equemene
        unsigned long y=(unsigned long)(SHR3>>1) ;
80 84 equemene
    #elif defined TMWC
81 84 equemene
        unsigned long x=(unsigned long)(MWC>>1) ;
82 84 equemene
        unsigned long y=(unsigned long)(MWC>>1) ;
83 84 equemene
    #elif defined TKISS
84 84 equemene
        unsigned long x=(unsigned long)(KISS>>1) ;
85 84 equemene
        unsigned long y=(unsigned long)(KISS>>1) ;
86 84 equemene
    #endif
87 84 equemene
#elif defined TFP32
88 84 equemene
    #define THEONE 1.0f
89 84 equemene
    #if defined TCONG
90 84 equemene
        float x=CONGfp ;
91 84 equemene
        float y=CONGfp ;
92 84 equemene
    #elif defined TSHR3
93 84 equemene
        float x=SHR3fp ;
94 84 equemene
        float y=SHR3fp ;
95 84 equemene
    #elif defined TMWC
96 84 equemene
        float x=MWCfp ;
97 84 equemene
        float y=MWCfp ;
98 84 equemene
    #elif defined TKISS
99 84 equemene
      float x=KISSfp ;
100 84 equemene
      float y=KISSfp ;
101 84 equemene
    #endif
102 84 equemene
#elif defined TFP64
103 84 equemene
    #define THEONE 1.0f
104 84 equemene
    #if defined TCONG
105 84 equemene
        double x=(double)CONGfp ;
106 84 equemene
        double y=(double)CONGfp ;
107 84 equemene
    #elif defined TSHR3
108 84 equemene
        double x=(double)SHR3fp ;
109 84 equemene
        double y=(double)SHR3fp ;
110 84 equemene
    #elif defined TMWC
111 84 equemene
        double x=(double)MWCfp ;
112 84 equemene
        double y=(double)MWCfp ;
113 84 equemene
    #elif defined TKISS
114 84 equemene
        double x=(double)KISSfp ;
115 84 equemene
        double y=(double)KISSfp ;
116 84 equemene
    #endif
117 84 equemene
#endif
118 8 equemene
119 84 equemene
      unsigned long inside=((x*x+y*y) < THEONE) ? 1:0;
120 8 equemene
      total+=inside;
121 8 equemene
   }
122 8 equemene
123 8 equemene
   return(total);
124 8 equemene
}
125 8 equemene
126 185 equemene
//
// Run the estimation as ParallelRate slices inside an OpenMP parallel loop
// and return the total number of hits.
//
// Slice i calls MainLoopGlobal() on IterationsEach draws with the seeds
// (seed_w+i, seed_z+i); IterationsEach is iterations/ParallelRate rounded up,
// so ParallelRate*IterationsEach draws are performed in total.
// Prints the count found by each slice, then the elapsed wall-clock time and
// the number of draws per second (plain and log10).
// Terminates the program when ParallelRate is outside [1, INT_MAX] or when
// the per-slice counters cannot be allocated.
//
LENGTH splitter(LENGTH iterations,unsigned int seed_w,unsigned int seed_z,unsigned int ParallelRate)
{
  struct timeval tv1,tv2;

  // 0 would divide by zero below; values above INT_MAX cannot be walked by
  // the int loop index used for the slices.
  if (ParallelRate==0 || ParallelRate>(unsigned int)INT_MAX) {
    fprintf(stderr,"splitter: ParallelRate must be in [1, %d]\n",INT_MAX);
    exit(EXIT_FAILURE);
  }
  const int slices=(int)ParallelRate;

  // Round up so that no requested iteration is dropped.
  LENGTH IterationsEach=iterations/ParallelRate;
  if ((iterations%ParallelRate)!=0) {
    IterationsEach++;
  }

  LENGTH *inside=calloc((size_t)slices,sizeof *inside);
  if (inside==NULL) {
    fprintf(stderr,"splitter: cannot allocate %d counters\n",slices);
    exit(EXIT_FAILURE);
  }

  gettimeofday(&tv1, NULL);

  // Every iteration writes only its own inside[i] slot.
#pragma omp parallel for
  for (int i=0 ; i<slices; i++) {
    inside[i]=MainLoopGlobal(IterationsEach,seed_w+i,seed_z+i);
  }

  LENGTH insides=0;
  for (int i=0 ; i<slices; i++) {
    insides+=inside[i];
  }

  gettimeofday(&tv2, NULL);

  for (int i=0 ; i<slices; i++) {
    printf("\tFound %lld for ParallelRate %i\n",(long long)inside[i],i);
  }
  printf("\n");

  // Computed in double so that neither long runs nor large workloads can
  // overflow an integer intermediate.
  double elapsed=(double)(tv2.tv_sec-tv1.tv_sec)+
                 (double)(tv2.tv_usec-tv1.tv_usec)/1000000.0;

  double itops=(double)slices*(double)IterationsEach/elapsed;

  printf("ParallelRate %i\nElapsed Time %.2f\nItops %.0f\nLogItops %.2f\n",slices,elapsed,itops,log10(itops));

  free(inside);

  return(insides);
}
163 78 equemene
164 78 equemene
165 8 equemene
int main(int argc, char *argv[]) {
166 8 equemene
167 185 equemene
  unsigned int seed_w=110271,seed_z=101008,ParallelRate=PARALLELRATE;
168 78 equemene
  LENGTH iterations=ITERATIONS,insides=0;
169 78 equemene
170 8 equemene
  if (argc > 1) {
171 31 equemene
    iterations=(LENGTH)atoll(argv[1]);
172 247 equemene
    if (argc > 2) {
173 247 equemene
      ParallelRate=atoi(argv[2]);
174 247 equemene
    }
175 8 equemene
  }
176 8 equemene
  else {
177 10 equemene
    printf("\n\tPi : Estimate Pi with Monte Carlo exploration\n\n");
178 10 equemene
    printf("\t\t#1 : number of iterations (default 1 billion)\n");
179 185 equemene
    printf("\t\t#2 : number of ParallelRate (default 1024)\n\n");
180 8 equemene
  }
181 8 equemene
182 29 equemene
  printf ("\n\tInformation about architecture:\n\n");
183 29 equemene
184 29 equemene
  printf ("\tSizeof int = %lld bytes.\n", (long long)sizeof(int));
185 29 equemene
  printf ("\tSizeof long = %lld bytes.\n", (long long)sizeof(long));
186 29 equemene
  printf ("\tSizeof long long = %lld bytes.\n\n", (long long)sizeof(long long));
187 29 equemene
188 29 equemene
  printf ("\tMax int = %u\n", INT_MAX);
189 29 equemene
  printf ("\tMax long = %ld\n", LONG_MAX);
190 29 equemene
  printf ("\tMax long long = %lld\n\n", LLONG_MAX);
191 29 equemene
192 185 equemene
  insides=splitter(iterations,seed_w,seed_z,ParallelRate);
193 8 equemene
194 185 equemene
  LENGTH total=((iterations%ParallelRate)==0)?iterations:(iterations/ParallelRate+1)*ParallelRate;
195 185 equemene
196 185 equemene
  printf("Inside/Total %ld %ld\nPi estimation %f\n\n",(long int)insides,(long int)total,(4.*(float)insides/total));
197 8 equemene
198 8 equemene
}