root / ETSN / MySteps_6_openmp.c @ 301
Historique | Voir | Annoter | Télécharger (3,18 ko)
/* Simple SillySum function in C and OpenMP/C */
/* Build with the serial reference run    : gcc -fopenmp -O3 -o MySteps_6_openmp MySteps_6_openmp.c -lm -lgomp */
/* Build without the serial reference run : gcc -DNOSERIAL -fopenmp -O3 -o MySteps_6_openmp_NoSerial MySteps_6_openmp.c -lm -lgomp */
4 | 296 | equemene | |
#include <errno.h>
#include <limits.h>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <sys/time.h>
9 | 296 | equemene | |
10 | 296 | equemene | #define PI 3.141592653589793 |
11 | 296 | equemene | |
12 | 296 | equemene | #define MYFLOAT float |
13 | 296 | equemene | |
14 | 296 | equemene | MYFLOAT MySillyFunction(MYFLOAT x) |
15 | 296 | equemene | { |
16 | 296 | equemene | return(pow(sqrt(log(exp(atanh(tanh(asinh(sinh(acosh(cosh(atan(tan(asin(sin(acos(cos(x))))))))))))))),2)); |
17 | 296 | equemene | } |
18 | 296 | equemene | |
19 | 296 | equemene | void MySillySum(MYFLOAT *res, MYFLOAT *a, MYFLOAT *b,int calls, int size) |
20 | 296 | equemene | { |
21 | 296 | equemene | for (uint i=0; i<size;i++) |
22 | 296 | equemene | { |
23 | 296 | equemene | MYFLOAT ai=a[i]; |
24 | 296 | equemene | MYFLOAT bi=b[i]; |
25 | 296 | equemene | |
26 | 296 | equemene | for (int c=0;c<calls;c++) |
27 | 296 | equemene | { |
28 | 296 | equemene | ai=MySillyFunction(ai); |
29 | 296 | equemene | bi=MySillyFunction(bi); |
30 | 296 | equemene | } |
31 | 296 | equemene | |
32 | 296 | equemene | res[i] = ai + bi; |
33 | 296 | equemene | } |
34 | 296 | equemene | } |
35 | 296 | equemene | |
36 | 296 | equemene | void MySillySumOMP(MYFLOAT *res, MYFLOAT *a, MYFLOAT *b,int calls, int size) |
37 | 296 | equemene | { |
38 | 296 | equemene | #pragma omp parallel for |
39 | 296 | equemene | for (uint i=0; i<size;i++) |
40 | 296 | equemene | { |
41 | 296 | equemene | MYFLOAT ai=a[i]; |
42 | 296 | equemene | MYFLOAT bi=b[i]; |
43 | 296 | equemene | |
44 | 296 | equemene | for (int c=0;c<calls;c++) |
45 | 296 | equemene | { |
46 | 296 | equemene | ai=MySillyFunction(ai); |
47 | 296 | equemene | bi=MySillyFunction(bi); |
48 | 296 | equemene | } |
49 | 296 | equemene | |
50 | 296 | equemene | res[i] = ai + bi; |
51 | 296 | equemene | } |
52 | 296 | equemene | } |
53 | 296 | equemene | |
54 | 296 | equemene | MYFLOAT MyNorm(MYFLOAT *a,MYFLOAT *b,int size)
|
55 | 296 | equemene | { |
56 | 296 | equemene | MYFLOAT norm=0.;
|
57 | 296 | equemene | |
58 | 296 | equemene | for (int i=0;i<size;i++) |
59 | 296 | equemene | { |
60 | 296 | equemene | norm+=pow(a[i]-b[i],2);
|
61 | 296 | equemene | } |
62 | 296 | equemene | |
63 | 296 | equemene | return(sqrt(norm));
|
64 | 296 | equemene | } |
65 | 296 | equemene | |
66 | 296 | equemene | void MyPrint(MYFLOAT *a,int size) |
67 | 296 | equemene | { |
68 | 296 | equemene | printf("[");
|
69 | 296 | equemene | for (int i=0;i<size;i++) |
70 | 296 | equemene | { |
71 | 296 | equemene | printf(" %.8e ",a[i]);
|
72 | 296 | equemene | } |
73 | 296 | equemene | printf("]\n");
|
74 | 296 | equemene | } |
75 | 296 | equemene | |
76 | 296 | equemene | int main(int argc,char *argv[]) |
77 | 296 | equemene | { |
78 | 296 | equemene | float *a,*b,*res,*resacc;
|
79 | 296 | equemene | int size=1024; |
80 | 296 | equemene | int calls=1; |
81 | 296 | equemene | struct timeval tv1,tv2;
|
82 | 296 | equemene | |
83 | 296 | equemene | if (argc > 1) { |
84 | 296 | equemene | size=(int)atoll(argv[1]); |
85 | 296 | equemene | calls=(int)atoll(argv[2]); |
86 | 296 | equemene | } |
87 | 296 | equemene | else {
|
88 | 296 | equemene | printf("\n\tPi : Estimate SillySum\n\n\t\t#1 : size (default 1024)\n\t\t#2 : calls (default 1)\n\n");
|
89 | 296 | equemene | } |
90 | 296 | equemene | |
91 | 296 | equemene | printf("%i %i\n",size,calls);
|
92 | 296 | equemene | |
93 | 296 | equemene | a=(float*)malloc(size*sizeof(MYFLOAT)); |
94 | 296 | equemene | b=(float*)malloc(size*sizeof(MYFLOAT)); |
95 | 296 | equemene | res=(float*)malloc(size*sizeof(MYFLOAT)); |
96 | 296 | equemene | resacc=(float*)malloc(size*sizeof(MYFLOAT)); |
97 | 296 | equemene | |
98 | 296 | equemene | srand(110271);
|
99 | 296 | equemene | |
100 | 296 | equemene | for (int i=0;i<size;i++) |
101 | 296 | equemene | { |
102 | 296 | equemene | a[i]=(MYFLOAT)rand()/(MYFLOAT)RAND_MAX; |
103 | 296 | equemene | b[i]=(MYFLOAT)rand()/(MYFLOAT)RAND_MAX; |
104 | 296 | equemene | res[i]=0.;
|
105 | 296 | equemene | resacc[i]=0.;
|
106 | 296 | equemene | } |
107 | 296 | equemene | |
108 | 296 | equemene | #ifndef NOSERIAL
|
109 | 296 | equemene | gettimeofday(&tv1, NULL);
|
110 | 296 | equemene | MySillySum(res,a,b,calls,size); |
111 | 296 | equemene | gettimeofday(&tv2, NULL);
|
112 | 296 | equemene | #endif
|
113 | 296 | equemene | |
114 | 296 | equemene | MYFLOAT elapsed=(MYFLOAT)((tv2.tv_sec-tv1.tv_sec) * 1000000L +
|
115 | 296 | equemene | (tv2.tv_usec-tv1.tv_usec))/1000000;
|
116 | 296 | equemene | |
117 | 296 | equemene | gettimeofday(&tv1, NULL);
|
118 | 296 | equemene | MySillySumOMP(resacc,a,b,calls,size); |
119 | 296 | equemene | gettimeofday(&tv2, NULL);
|
120 | 296 | equemene | |
121 | 296 | equemene | MYFLOAT elapsedAcc=(MYFLOAT)((tv2.tv_sec-tv1.tv_sec) * 1000000L +
|
122 | 296 | equemene | (tv2.tv_usec-tv1.tv_usec))/1000000;
|
123 | 296 | equemene | |
124 | 296 | equemene | #ifndef NOSERIAL
|
125 | 296 | equemene | MYFLOAT MyChecker=MyNorm(res,resacc,size); |
126 | 296 | equemene | printf("Norm: %.8e\n",MyChecker);
|
127 | 296 | equemene | #endif
|
128 | 296 | equemene | |
129 | 296 | equemene | #ifdef VERBOSE
|
130 | 296 | equemene | MyPrint(res,size); |
131 | 296 | equemene | MyPrint(resacc,size); |
132 | 296 | equemene | #endif
|
133 | 296 | equemene | |
134 | 296 | equemene | #ifndef NOSERIAL
|
135 | 296 | equemene | printf("Elapsed Time: %.3f\n",elapsed);
|
136 | 296 | equemene | #endif
|
137 | 296 | equemene | |
138 | 296 | equemene | printf("OMP Elapsed Time: %.3f\n",elapsedAcc);
|
139 | 296 | equemene | |
140 | 296 | equemene | #ifndef NOSERIAL
|
141 | 299 | equemene | printf("NativeRate: %.lld\n",(unsigned long)((float)size/elapsed)); |
142 | 296 | equemene | #endif
|
143 | 296 | equemene | printf("OMPRate: %.lld\n",(unsigned long)((float)size/elapsedAcc)); |
144 | 296 | equemene | |
145 | 296 | equemene | #ifndef NOSERIAL
|
146 | 296 | equemene | printf("AccRatio: %.3f\n",elapsed/elapsedAcc);
|
147 | 296 | equemene | #endif
|
148 | 296 | equemene | |
149 | 296 | equemene | free(a); |
150 | 296 | equemene | free(b); |
151 | 296 | equemene | free(res); |
152 | 296 | equemene | free(resacc); |
153 | 296 | equemene | } |