added cuda file
This commit is contained in:
106
examples_ptx/mandelbrot_tasks/mandelbrot_tasks.cu
Normal file
106
examples_ptx/mandelbrot_tasks/mandelbrot_tasks.cu
Normal file
@@ -0,0 +1,106 @@
|
||||
/*
|
||||
Copyright (c) 2010-2012, Intel Corporation
|
||||
All rights reserved.
|
||||
|
||||
Redistribution and use in source and binary forms, with or without
|
||||
modification, are permitted provided that the following conditions are
|
||||
met:
|
||||
|
||||
* Redistributions of source code must retain the above copyright
|
||||
notice, this list of conditions and the following disclaimer.
|
||||
|
||||
* Redistributions in binary form must reproduce the above copyright
|
||||
notice, this list of conditions and the following disclaimer in the
|
||||
documentation and/or other materials provided with the distribution.
|
||||
|
||||
* Neither the name of Intel Corporation nor the names of its
|
||||
contributors may be used to endorse or promote products derived from
|
||||
this software without specific prior written permission.
|
||||
|
||||
|
||||
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
|
||||
IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
||||
TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
||||
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
|
||||
OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||
*/
|
||||
|
||||
#include "cuda_helpers.cuh"
|
||||
|
||||
__device__
|
||||
static inline int
|
||||
mandel(float c_re, float c_im, int count) {
|
||||
float z_re = c_re, z_im = c_im;
|
||||
int i;
|
||||
for (i = 0; i < count; ++i) {
|
||||
if (z_re * z_re + z_im * z_im > 4.0f)
|
||||
break;
|
||||
|
||||
float new_re = z_re*z_re - z_im*z_im;
|
||||
float new_im = 2.f * z_re * z_im;
|
||||
z_re = c_re + new_re;
|
||||
z_im = c_im + new_im;
|
||||
}
|
||||
|
||||
return i;
|
||||
}
|
||||
|
||||
|
||||
/* Task to compute the Mandelbrot iterations for a single scanline.
|
||||
*/
|
||||
__global__ void
|
||||
mandelbrot_scanline( float x0, float dx,
|
||||
float y0, float dy,
|
||||
int width, int height,
|
||||
int xspan, int yspan,
|
||||
int maxIterations, int output[]) {
|
||||
const int xstart = taskIndex0 * xspan;
|
||||
const int xend = min(xstart + xspan, width);
|
||||
|
||||
const int ystart = taskIndex1 * yspan;
|
||||
const int yend = min(ystart + yspan, height);
|
||||
|
||||
for ( int yi = ystart; yi < yend; yi++)
|
||||
for ( int xi = xstart+programIndex; xi < xend; xi += programCount)
|
||||
{
|
||||
const float x = x0 + xi * dx;
|
||||
const float y = y0 + yi * dy;
|
||||
|
||||
const int res = mandel(x,y,maxIterations);
|
||||
const int index = yi * width + xi;
|
||||
if (xi < xend)
|
||||
output[index] = res;
|
||||
}
|
||||
}
|
||||
|
||||
extern "C" __global__ void
|
||||
mandelbrot_ispc___export( float x0, float y0,
|
||||
float x1, float y1,
|
||||
int width, int height,
|
||||
int maxIterations, int output[]) {
|
||||
float dx = (x1 - x0) / width;
|
||||
float dy = (y1 - y0) / height;
|
||||
const int xspan = 64; /* make sure it is big enough to avoid false-sharing */
|
||||
const int yspan = 16;
|
||||
|
||||
|
||||
launch(width/xspan, height/yspan, 1, mandelbrot_scanline)
|
||||
(x0, dx, y0, dy, width, height, xspan, yspan, maxIterations, output);
|
||||
cudaDeviceSynchronize();
|
||||
}
|
||||
|
||||
extern "C" __host__ void
|
||||
mandelbrot_ispc( float x0, float y0,
|
||||
float x1, float y1,
|
||||
int width, int height,
|
||||
int maxIterations, int output[])
|
||||
{
|
||||
mandelbrot_ispc___export<<<1,32>>>(x0,y0,x1,y1,width,height,maxIterations,output);
|
||||
cudaDeviceSynchronize();
|
||||
}
|
||||
Reference in New Issue
Block a user