-
Notifications
You must be signed in to change notification settings - Fork 17
/
Copy pathmandelbrot-openmp-offload.cc
75 lines (58 loc) · 2.3 KB
/
mandelbrot-openmp-offload.cc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
#include "common.inc"
#pragma omp declare target
template<bool WithMoment>
double Iterate(double zr, double zi)
{
const double escape_radius_squared = ESCAPE_RADIUS_SQUARED;
const int maxiter = MAXITER;
double cr = zr, sr = cr;
double ci = zi, si = ci;
double dist;
int iter = maxiter, notescaped = -1;
if(zr*(1+zr*(8*zr*zr+(16*zi*zi-3)))+zi*zi*(8*zi*zi-3) < 3./32 || ((zr+1)*(zr+1)+zi*zi)<1./16) { notescaped=iter=0; }
while(notescaped)
{
double r2 = cr * cr;
double i2 = ci * ci;
dist = r2 + i2;
notescaped &= ((iter != 0) & (dist < escape_radius_squared)) ? -1 : 0;
iter += notescaped;
double ri = cr * ci;
ci = zi + (ri * 2);
cr = zr + (r2 - i2);
if(WithMoment)
{
bool notmoment = iter & (iter-1);
iter = (cr == sr && ci == si) ? 0 : iter;
sr = notmoment ? sr : cr;
si = notmoment ? si : ci;
}
}
return iter ? std::log2( maxiter-iter + 1 - std::log2(std::log2(dist) / 2)) * (4/std::log2(std::exp(1.))) : 0;
}
#pragma omp end declare target
int main()
{
static double results[Xres*Yres];
bool NeedMoment = true;
std::vector<unsigned> pixels (Xres * Yres);
MAINLOOP_START(1);
while(MAINLOOP_GET_CONDITION())
{
double zr, zi, xscale, yscale; MAINLOOP_SET_COORDINATES();
#pragma omp target firstprivate(zr,zi,xscale,yscale,NeedMoment) map(from:results[0:Xres*Yres])
#pragma omp teams distribute parallel for collapse(2) dist_schedule(static,64)
for(unsigned y=0; y<Yres; ++y)
for(unsigned x=0; x<Xres; ++x)
results[y*Xres+x] = NeedMoment ? Iterate<true>( zr+xscale*int(x-Xres/2), zi+yscale*int(y-Yres/2) )
: Iterate<false>( zr+xscale*int(x-Xres/2), zi+yscale*int(y-Yres/2) );
unsigned n_inside = std::count_if(results, results+Xres*Yres, std::bind1st(std::equal_to<double>(), 0.));
NeedMoment = n_inside >= (Xres*Yres)/1024;
#pragma omp parallel for /* This part is run natively */
for(unsigned y=0; y<Yres; ++y)
for(unsigned x=0; x<Xres; ++x)
pixels[y*Xres + x] = Color(x,y, results[y*Xres+x]);
MAINLOOP_PUT_RESULT(pixels);
}
MAINLOOP_FINISH();
}