added volume rendering example
This commit is contained in:
2
examples/portable/volume_rendering/.gitignore
vendored
Normal file
2
examples/portable/volume_rendering/.gitignore
vendored
Normal file
@@ -0,0 +1,2 @@
|
|||||||
|
mandelbrot
|
||||||
|
*.ppm
|
||||||
8
examples/portable/volume_rendering/Makefile_cpu
Normal file
8
examples/portable/volume_rendering/Makefile_cpu
Normal file
@@ -0,0 +1,8 @@
|
|||||||
|
|
||||||
|
EXAMPLE=volume
|
||||||
|
CPP_SRC=volume.cpp
|
||||||
|
ISPC_SRC=volume.ispc
|
||||||
|
ISPC_IA_TARGETS=avx1-i32x8
|
||||||
|
ISPC_ARM_TARGETS=neon
|
||||||
|
|
||||||
|
include ../common_cpu.mk
|
||||||
13
examples/portable/volume_rendering/Makefile_gpu
Normal file
13
examples/portable/volume_rendering/Makefile_gpu
Normal file
@@ -0,0 +1,13 @@
|
|||||||
|
PROG=volume
|
||||||
|
ISPC_SRC=volume.ispc
|
||||||
|
CU_SRC=volume.cu
|
||||||
|
CXX_SRC=volume.cpp
|
||||||
|
PTXCC_REGMAX=64
|
||||||
|
|
||||||
|
LLVM_GPU=1
|
||||||
|
NVVM_GPU=1
|
||||||
|
|
||||||
|
include ../common_gpu.mk
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
13
examples/portable/volume_rendering/Makefile_ptx
Normal file
13
examples/portable/volume_rendering/Makefile_ptx
Normal file
@@ -0,0 +1,13 @@
|
|||||||
|
PROG=volume
|
||||||
|
ISPC_SRC=volume.ispc
|
||||||
|
CU_SRC=volume.cu
|
||||||
|
CXX_SRC=volume.cpp
|
||||||
|
PTXCC_REGMAX=64
|
||||||
|
|
||||||
|
#LLVM_GPU=1
|
||||||
|
NVVM_GPU=1
|
||||||
|
|
||||||
|
include ../common_ptx.mk
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
11
examples/portable/volume_rendering/camera.dat
Normal file
11
examples/portable/volume_rendering/camera.dat
Normal file
@@ -0,0 +1,11 @@
|
|||||||
|
896 1184
|
||||||
|
|
||||||
|
0.000155 0.000000 0.000000 -0.069927
|
||||||
|
0.000000 -0.000155 0.000000 0.093236
|
||||||
|
0.000000 0.000000 0.000000 1.000000
|
||||||
|
0.000000 0.000000 -99.999001 100.000000
|
||||||
|
|
||||||
|
1.000000 0.000000 0.000000 1.000000
|
||||||
|
0.000000 0.980129 -0.198360 2.900000
|
||||||
|
0.000000 0.198360 0.980129 -10.500000
|
||||||
|
0.000000 0.000000 0.000000 1.000000
|
||||||
5
examples/portable/volume_rendering/density_highres.vol
Normal file
5
examples/portable/volume_rendering/density_highres.vol
Normal file
File diff suppressed because one or more lines are too long
4
examples/portable/volume_rendering/density_lowres.vol
Normal file
4
examples/portable/volume_rendering/density_lowres.vol
Normal file
File diff suppressed because one or more lines are too long
183
examples/portable/volume_rendering/volume.cpp
Normal file
183
examples/portable/volume_rendering/volume.cpp
Normal file
@@ -0,0 +1,183 @@
|
|||||||
|
/*
|
||||||
|
Copyright (c) 2011, Intel Corporation
|
||||||
|
All rights reserved.
|
||||||
|
|
||||||
|
Redistribution and use in source and binary forms, with or without
|
||||||
|
modification, are permitted provided that the following conditions are
|
||||||
|
met:
|
||||||
|
|
||||||
|
* Redistributions of source code must retain the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer.
|
||||||
|
|
||||||
|
* Redistributions in binary form must reproduce the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer in the
|
||||||
|
documentation and/or other materials provided with the distribution.
|
||||||
|
|
||||||
|
* Neither the name of Intel Corporation nor the names of its
|
||||||
|
contributors may be used to endorse or promote products derived from
|
||||||
|
this software without specific prior written permission.
|
||||||
|
|
||||||
|
|
||||||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
|
||||||
|
IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
||||||
|
TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
||||||
|
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
|
||||||
|
OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||||
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||||
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||||
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||||
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||||
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||||
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#ifdef _MSC_VER
|
||||||
|
#define _CRT_SECURE_NO_WARNINGS
|
||||||
|
#define NOMINMAX
|
||||||
|
#pragma warning (disable: 4244)
|
||||||
|
#pragma warning (disable: 4305)
|
||||||
|
#endif
|
||||||
|
|
||||||
|
#include <cstdio>
|
||||||
|
#include <algorithm>
|
||||||
|
#include "timing.h"
|
||||||
|
#include "ispc_malloc.h"
|
||||||
|
#include "volume_ispc.h"
|
||||||
|
using namespace ispc;
|
||||||
|
|
||||||
|
/* Write a PPM image file with the image */
|
||||||
|
static void
|
||||||
|
writePPM(float *buf, int width, int height, const char *fn) {
|
||||||
|
FILE *fp = fopen(fn, "wb");
|
||||||
|
fprintf(fp, "P6\n");
|
||||||
|
fprintf(fp, "%d %d\n", width, height);
|
||||||
|
fprintf(fp, "255\n");
|
||||||
|
for (int i = 0; i < width*height; ++i) {
|
||||||
|
float v = buf[i] * 255.f;
|
||||||
|
if (v < 0.f) v = 0.f;
|
||||||
|
else if (v > 255.f) v = 255.f;
|
||||||
|
unsigned char c = (unsigned char)v;
|
||||||
|
for (int j = 0; j < 3; ++j)
|
||||||
|
fputc(c, fp);
|
||||||
|
}
|
||||||
|
fclose(fp);
|
||||||
|
printf("Wrote image file %s\n", fn);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Load image and viewing parameters from a camera data file.
|
||||||
|
FIXME: we should add support to be able to specify viewing parameters
|
||||||
|
in the program here directly. */
|
||||||
|
static void
|
||||||
|
loadCamera(const char *fn, int *width, int *height, float raster2camera[4][4],
|
||||||
|
float camera2world[4][4]) {
|
||||||
|
FILE *f = fopen(fn, "r");
|
||||||
|
if (!f) {
|
||||||
|
perror(fn);
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
if (fscanf(f, "%d %d", width, height) != 2) {
|
||||||
|
fprintf(stderr, "Unexpected end of file in camera file\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
for (int i = 0; i < 4; ++i) {
|
||||||
|
for (int j = 0; j < 4; ++j) {
|
||||||
|
if (fscanf(f, "%f", &raster2camera[i][j]) != 1) {
|
||||||
|
fprintf(stderr, "Unexpected end of file in camera file\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
for (int i = 0; i < 4; ++i) {
|
||||||
|
for (int j = 0; j < 4; ++j) {
|
||||||
|
if (fscanf(f, "%f", &camera2world[i][j]) != 1) {
|
||||||
|
fprintf(stderr, "Unexpected end of file in camera file\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
fclose(f);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Load a volume density file. Expects the number of x, y, and z samples
|
||||||
|
as the first three values (as integer strings), then x*y*z
|
||||||
|
floating-point values (also as strings) to give the densities. */
|
||||||
|
static float *
|
||||||
|
loadVolume(const char *fn, int n[3]) {
|
||||||
|
FILE *f = fopen(fn, "r");
|
||||||
|
if (!f) {
|
||||||
|
perror(fn);
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (fscanf(f, "%d %d %d", &n[0], &n[1], &n[2]) != 3) {
|
||||||
|
fprintf(stderr, "Couldn't find resolution at start of density file\n");
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
|
||||||
|
int count = n[0] * n[1] * n[2];
|
||||||
|
float *v = new float[count];
|
||||||
|
for (int i = 0; i < count; ++i) {
|
||||||
|
if (fscanf(f, "%f", &v[i]) != 1) {
|
||||||
|
fprintf(stderr, "Unexpected end of file at %d'th density value\n", i);
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return v;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
int main(int argc, char *argv[]) {
|
||||||
|
static unsigned int test_iterations[] = {3, 7, 1};
|
||||||
|
if (argc < 3) {
|
||||||
|
fprintf(stderr, "usage: volume <camera.dat> <volume_density.vol> [ispc iterations] [tasks iterations] [serial iterations]\n");
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
if (argc == 6) {
|
||||||
|
for (int i = 0; i < 3; i++) {
|
||||||
|
test_iterations[i] = atoi(argv[3 + i]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
//
|
||||||
|
// Load viewing data and the volume density data
|
||||||
|
//
|
||||||
|
int width, height;
|
||||||
|
|
||||||
|
float *camera2world_ispc = new float[4*4];
|
||||||
|
float *raster2camera_ispc = new float[4*4];
|
||||||
|
float (*camera2world )[4] = (float (*)[4])camera2world_ispc;
|
||||||
|
float (*raster2camera)[4] = (float (*)[4])raster2camera_ispc;
|
||||||
|
|
||||||
|
loadCamera(argv[1], &width, &height, raster2camera, camera2world);
|
||||||
|
float *image = new float[width*height];
|
||||||
|
|
||||||
|
int *n = new int[3];
|
||||||
|
float *density = loadVolume(argv[2], n);
|
||||||
|
|
||||||
|
// Clear out the buffer
|
||||||
|
for (int i = 0; i < width * height; ++i)
|
||||||
|
image[i] = 0.;
|
||||||
|
|
||||||
|
//
|
||||||
|
// Compute the image using the ispc implementation that also uses
|
||||||
|
// tasks; report the minimum time of three runs.
|
||||||
|
//
|
||||||
|
double minISPCtasks = 1e30;
|
||||||
|
for (int i = 0; i < test_iterations[1]; ++i) {
|
||||||
|
reset_and_start_timer();
|
||||||
|
volume_ispc_tasks(density, n, raster2camera, camera2world,
|
||||||
|
width, height, image);
|
||||||
|
double dt = get_elapsed_msec();
|
||||||
|
printf("@time of ISPC + TASKS run:\t\t\t[%.3f] msec\n", dt);
|
||||||
|
minISPCtasks = std::min(minISPCtasks, dt);
|
||||||
|
}
|
||||||
|
|
||||||
|
printf("[volume ispc + tasks]:\t\t[%.3f] msec\n", minISPCtasks);
|
||||||
|
writePPM(image, width, height, "volume-ispc-tasks.ppm");
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
454
examples/portable/volume_rendering/volume.cu
Normal file
454
examples/portable/volume_rendering/volume.cu
Normal file
@@ -0,0 +1,454 @@
|
|||||||
|
/*
|
||||||
|
Copyright (c) 2011, Intel Corporation
|
||||||
|
All rights reserved.
|
||||||
|
|
||||||
|
Redistribution and use in source and binary forms, with or without
|
||||||
|
modification, are permitted provided that the following conditions are
|
||||||
|
met:
|
||||||
|
|
||||||
|
* Redistributions of source code must retain the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer.
|
||||||
|
|
||||||
|
* Redistributions in binary form must reproduce the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer in the
|
||||||
|
documentation and/or other materials provided with the distribution.
|
||||||
|
|
||||||
|
* Neither the name of Intel Corporation nor the names of its
|
||||||
|
contributors may be used to endorse or promote products derived from
|
||||||
|
this software without specific prior written permission.
|
||||||
|
|
||||||
|
|
||||||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
|
||||||
|
IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
||||||
|
TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
||||||
|
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
|
||||||
|
OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||||
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||||
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||||
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||||
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||||
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||||
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include "cuda_helpers.cuh"
|
||||||
|
__device__ static inline float clamp(float v, float low, float high)
|
||||||
|
{
|
||||||
|
return min(max(v, low), high);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
#define float3 Float3
|
||||||
|
struct Float3
|
||||||
|
{
|
||||||
|
float x,y,z;
|
||||||
|
__device__ friend Float3 operator+(const Float3 a, const Float3 b)
|
||||||
|
{
|
||||||
|
Float3 c;
|
||||||
|
c.x = a.x+b.x;
|
||||||
|
c.y = a.y+b.y;
|
||||||
|
c.z = a.z+b.z;
|
||||||
|
return c;
|
||||||
|
}
|
||||||
|
__device__ friend Float3 operator-(const Float3 a, const Float3 b)
|
||||||
|
{
|
||||||
|
Float3 c;
|
||||||
|
c.x = a.x-b.x;
|
||||||
|
c.y = a.y-b.y;
|
||||||
|
c.z = a.z-b.z;
|
||||||
|
return c;
|
||||||
|
}
|
||||||
|
__device__ friend Float3 operator/(const Float3 a, const Float3 b)
|
||||||
|
{
|
||||||
|
Float3 c;
|
||||||
|
c.x = a.x/b.x;
|
||||||
|
c.y = a.y/b.y;
|
||||||
|
c.z = a.z/b.z;
|
||||||
|
return c;
|
||||||
|
}
|
||||||
|
__device__ friend Float3 operator*(const Float3 a, const Float3 b)
|
||||||
|
{
|
||||||
|
Float3 c;
|
||||||
|
c.x = a.x*b.x;
|
||||||
|
c.y = a.y*b.y;
|
||||||
|
c.z = a.z*b.z;
|
||||||
|
return c;
|
||||||
|
}
|
||||||
|
__device__ friend Float3 operator*(const Float3 a, const float b)
|
||||||
|
{
|
||||||
|
Float3 c;
|
||||||
|
c.x = a.x*b;
|
||||||
|
c.y = a.y*b;
|
||||||
|
c.z = a.z*b;
|
||||||
|
return c;
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
struct Ray {
|
||||||
|
float3 origin, dir;
|
||||||
|
};
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static void
|
||||||
|
generateRay(const float raster2camera[4][4],
|
||||||
|
const float camera2world[4][4],
|
||||||
|
float x, float y, Ray &ray) {
|
||||||
|
// transform raster coordinate (x, y, 0) to camera space
|
||||||
|
float camx = raster2camera[0][0] * x + raster2camera[0][1] * y + raster2camera[0][3];
|
||||||
|
float camy = raster2camera[1][0] * x + raster2camera[1][1] * y + raster2camera[1][3];
|
||||||
|
float camz = raster2camera[2][3];
|
||||||
|
float camw = raster2camera[3][3];
|
||||||
|
camx /= camw;
|
||||||
|
camy /= camw;
|
||||||
|
camz /= camw;
|
||||||
|
|
||||||
|
ray.dir.x = camera2world[0][0] * camx + camera2world[0][1] * camy + camera2world[0][2] * camz;
|
||||||
|
ray.dir.y = camera2world[1][0] * camx + camera2world[1][1] * camy + camera2world[1][2] * camz;
|
||||||
|
ray.dir.z = camera2world[2][0] * camx + camera2world[2][1] * camy + camera2world[2][2] * camz;
|
||||||
|
|
||||||
|
ray.origin.x = camera2world[0][3] / camera2world[3][3];
|
||||||
|
ray.origin.y = camera2world[1][3] / camera2world[3][3];
|
||||||
|
ray.origin.z = camera2world[2][3] / camera2world[3][3];
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline bool
|
||||||
|
Inside(float3 p, float3 pMin, float3 pMax) {
|
||||||
|
return (p.x >= pMin.x && p.x <= pMax.x &&
|
||||||
|
p.y >= pMin.y && p.y <= pMax.y &&
|
||||||
|
p.z >= pMin.z && p.z <= pMax.z);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static bool
|
||||||
|
IntersectP(Ray ray, float3 pMin, float3 pMax, float &hit0, float &hit1) {
|
||||||
|
float t0 = -1e30f, t1 = 1e30f;
|
||||||
|
|
||||||
|
float3 tNear = (pMin - ray.origin) / ray.dir;
|
||||||
|
float3 tFar = (pMax - ray.origin) / ray.dir;
|
||||||
|
if (tNear.x > tFar.x) {
|
||||||
|
float tmp = tNear.x;
|
||||||
|
tNear.x = tFar.x;
|
||||||
|
tFar.x = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.x, t0);
|
||||||
|
t1 = min(tFar.x, t1);
|
||||||
|
|
||||||
|
if (tNear.y > tFar.y) {
|
||||||
|
float tmp = tNear.y;
|
||||||
|
tNear.y = tFar.y;
|
||||||
|
tFar.y = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.y, t0);
|
||||||
|
t1 = min(tFar.y, t1);
|
||||||
|
|
||||||
|
if (tNear.z > tFar.z) {
|
||||||
|
float tmp = tNear.z;
|
||||||
|
tNear.z = tFar.z;
|
||||||
|
tFar.z = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.z, t0);
|
||||||
|
t1 = min(tFar.z, t1);
|
||||||
|
|
||||||
|
if (t0 <= t1) {
|
||||||
|
hit0 = t0;
|
||||||
|
hit1 = t1;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline float Lerp(float t, float a, float b) {
|
||||||
|
return (1.f - t) * a + t * b;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline float D(int x, int y, int z, int nVoxels[3],
|
||||||
|
float density[]) {
|
||||||
|
x = clamp(x, 0, nVoxels[0]-1);
|
||||||
|
y = clamp(y, 0, nVoxels[1]-1);
|
||||||
|
z = clamp(z, 0, nVoxels[2]-1);
|
||||||
|
|
||||||
|
return density[z*nVoxels[0]*nVoxels[1] + y*nVoxels[0] + x];
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline float3 Offset(float3 p, float3 pMin, float3 pMax) {
|
||||||
|
return (p - pMin) / (pMax - pMin);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline float Density(float3 Pobj, float3 pMin, float3 pMax,
|
||||||
|
float density[], int nVoxels[3]) {
|
||||||
|
if (!Inside(Pobj, pMin, pMax))
|
||||||
|
return 0;
|
||||||
|
// Compute voxel coordinates and offsets for _Pobj_
|
||||||
|
float3 vox = Offset(Pobj, pMin, pMax);
|
||||||
|
vox.x = vox.x * nVoxels[0] - .5f;
|
||||||
|
vox.y = vox.y * nVoxels[1] - .5f;
|
||||||
|
vox.z = vox.z * nVoxels[2] - .5f;
|
||||||
|
int vx = (int)(vox.x), vy = (int)(vox.y), vz = (int)(vox.z);
|
||||||
|
float dx = vox.x - vx, dy = vox.y - vy, dz = vox.z - vz;
|
||||||
|
|
||||||
|
// Trilinearly interpolate density values to compute local density
|
||||||
|
float d00 = Lerp(dx, D(vx, vy, vz, nVoxels, density),
|
||||||
|
D(vx+1, vy, vz, nVoxels, density));
|
||||||
|
float d10 = Lerp(dx, D(vx, vy+1, vz, nVoxels, density),
|
||||||
|
D(vx+1, vy+1, vz, nVoxels, density));
|
||||||
|
float d01 = Lerp(dx, D(vx, vy, vz+1, nVoxels, density),
|
||||||
|
D(vx+1, vy, vz+1, nVoxels, density));
|
||||||
|
float d11 = Lerp(dx, D(vx, vy+1, vz+1, nVoxels, density),
|
||||||
|
D(vx+1, vy+1, vz+1, nVoxels, density));
|
||||||
|
float d0 = Lerp(dy, d00, d10);
|
||||||
|
float d1 = Lerp(dy, d01, d11);
|
||||||
|
return Lerp(dz, d0, d1);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Returns the transmittance between two points p0 and p1, in a volume
|
||||||
|
with extent (pMin,pMax) with transmittance coefficient sigma_t,
|
||||||
|
defined by nVoxels[3] voxels in each dimension in the given density
|
||||||
|
array. */
|
||||||
|
__device__ static inline float
|
||||||
|
transmittance(float3 p0, float3 p1, float3 pMin,
|
||||||
|
float3 pMax, float sigma_t,
|
||||||
|
float density[], int nVoxels[3]) {
|
||||||
|
float rayT0, rayT1;
|
||||||
|
Ray ray;
|
||||||
|
ray.origin = p1;
|
||||||
|
ray.dir = p0 - p1;
|
||||||
|
|
||||||
|
// Find the parametric t range along the ray that is inside the volume.
|
||||||
|
if (!IntersectP(ray, pMin, pMax, rayT0, rayT1))
|
||||||
|
return 1.f;
|
||||||
|
|
||||||
|
rayT0 = max(rayT0, 0.f);
|
||||||
|
|
||||||
|
// Accumulate beam transmittance in tau
|
||||||
|
float tau = 0.0f;
|
||||||
|
float rayLength = sqrt(ray.dir.x * ray.dir.x + ray.dir.y * ray.dir.y +
|
||||||
|
ray.dir.z * ray.dir.z);
|
||||||
|
float stepDist = 0.2f;
|
||||||
|
float stepT = stepDist / rayLength;
|
||||||
|
|
||||||
|
float t = rayT0;
|
||||||
|
float3 pos = ray.origin + ray.dir * rayT0;
|
||||||
|
float3 dirStep = ray.dir * stepT;
|
||||||
|
while (t < rayT1) {
|
||||||
|
tau += stepDist * sigma_t * Density(pos, pMin, pMax, density, nVoxels);
|
||||||
|
pos = pos + dirStep;
|
||||||
|
t += stepT;
|
||||||
|
}
|
||||||
|
|
||||||
|
return exp(-tau);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline float
|
||||||
|
distanceSquared(float3 a, float3 b) {
|
||||||
|
float3 d = a-b;
|
||||||
|
return d.x*d.x + d.y*d.y + d.z*d.z;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__device__ static inline float
|
||||||
|
raymarch(float density[], int nVoxels[3], Ray ray) {
|
||||||
|
float rayT0, rayT1;
|
||||||
|
float3 pMin = {.3f, -.2f, .3f}, pMax = {1.8f, 2.3f, 1.8f};
|
||||||
|
float3 lightPos = { -1.f, 4., 1.5f };
|
||||||
|
|
||||||
|
if (!IntersectP(ray, pMin, pMax, rayT0, rayT1))
|
||||||
|
return 0.f;
|
||||||
|
|
||||||
|
rayT0 = max(rayT0, 0.f);
|
||||||
|
|
||||||
|
// Parameters that define the volume scattering characteristics and
|
||||||
|
// sampling rate for raymarching
|
||||||
|
float Le = .25f; // Emission coefficient
|
||||||
|
float sigma_a = 10.f; // Absorption coefficient
|
||||||
|
float sigma_s = 10.f; // Scattering coefficient
|
||||||
|
float stepDist = 0.025f; // Ray step amount
|
||||||
|
float lightIntensity = 40.0f; // Light source intensity
|
||||||
|
|
||||||
|
float tau = 0.f; // accumulated beam transmittance
|
||||||
|
float L = 0.f; // radiance along the ray
|
||||||
|
float rayLength = sqrt(ray.dir.x * ray.dir.x + ray.dir.y * ray.dir.y +
|
||||||
|
ray.dir.z * ray.dir.z);
|
||||||
|
float stepT = stepDist / rayLength;
|
||||||
|
|
||||||
|
float t = rayT0;
|
||||||
|
float3 pos = ray.origin + ray.dir * rayT0;
|
||||||
|
float3 dirStep = ray.dir * stepT;
|
||||||
|
while (t < rayT1)
|
||||||
|
{
|
||||||
|
float d = Density(pos, pMin, pMax, density, nVoxels);
|
||||||
|
|
||||||
|
// terminate once attenuation is high
|
||||||
|
float atten = exp(-tau);
|
||||||
|
if (atten < .005f)
|
||||||
|
break;
|
||||||
|
|
||||||
|
// direct lighting
|
||||||
|
float Li = lightIntensity / distanceSquared(lightPos, pos) *
|
||||||
|
transmittance(lightPos, pos, pMin, pMax, sigma_a + sigma_s,
|
||||||
|
density, nVoxels);
|
||||||
|
L += stepDist * atten * d * sigma_s * (Li + Le);
|
||||||
|
|
||||||
|
// update beam transmittance
|
||||||
|
tau += stepDist * (sigma_a + sigma_s) * d;
|
||||||
|
|
||||||
|
pos = pos + dirStep;
|
||||||
|
t += stepT;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Gamma correction
|
||||||
|
return pow(L, 1.f / 2.2f);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Utility routine used by both the task-based and the single-core entrypoints.
|
||||||
|
Renders a tile of the image, covering [x0,x0) * [y0, y1), storing the
|
||||||
|
result into the image[] array.
|
||||||
|
*/
|
||||||
|
__device__ static void
|
||||||
|
volume_tile(int x0, int y0, int x1,
|
||||||
|
int y1, float density[], int nVoxels[3],
|
||||||
|
const float raster2camera[4][4],
|
||||||
|
const float camera2world[4][4],
|
||||||
|
int width, int height, float image[]) {
|
||||||
|
// Work on 4x4=16 pixel big tiles of the image. This function thus
|
||||||
|
// implicitly assumes that both (x1-x0) and (y1-y0) are evenly divisble
|
||||||
|
// by 4.
|
||||||
|
for (int y = y0; y < y1; y += 8) {
|
||||||
|
for (int x = x0; x < x1; x += 8) {
|
||||||
|
for (int ob = 0; ob < 64; ob += programCount)
|
||||||
|
{
|
||||||
|
const int o = ob + programIndex;
|
||||||
|
|
||||||
|
|
||||||
|
// These two arrays encode the mapping from [0,15] to
|
||||||
|
// offsets within the 4x4 pixel block so that we render
|
||||||
|
// each pixel inside the block
|
||||||
|
const int xoffsets[16] = { 0, 1, 0, 1, 2, 3, 2, 3,
|
||||||
|
0, 1, 0, 1, 2, 3, 2, 3 };
|
||||||
|
const int yoffsets[16] = { 0, 0, 1, 1, 0, 0, 1, 1,
|
||||||
|
2, 2, 3, 3, 2, 2, 3, 3 };
|
||||||
|
|
||||||
|
const int xblock[4] = {0, 4, 0, 4};
|
||||||
|
const int yblock[4] = {0, 0, 4, 4};
|
||||||
|
|
||||||
|
// Figure out the pixel to render for this program instance
|
||||||
|
const int xo = x + xblock[o/16] + xoffsets[o&15];
|
||||||
|
const int yo = y + yblock[o/16] + yoffsets[o&15];
|
||||||
|
|
||||||
|
// Use viewing parameters to compute the corresponding ray
|
||||||
|
// for the pixel
|
||||||
|
Ray ray;
|
||||||
|
generateRay(raster2camera, camera2world, xo, yo, ray);
|
||||||
|
|
||||||
|
// And raymarch through the volume to compute the pixel's
|
||||||
|
// value
|
||||||
|
int offset = yo * width + xo;
|
||||||
|
if (xo < x1 && yo < y1)
|
||||||
|
image[offset] = raymarch(density, nVoxels, ray);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
__global__ void
|
||||||
|
volume_task(float density[], int _nVoxels[3],
|
||||||
|
const float _raster2camera[4][4],
|
||||||
|
const float _camera2world[4][4],
|
||||||
|
int width, int height, float image[]) {
|
||||||
|
if (taskIndex0 >= taskCount0) return;
|
||||||
|
|
||||||
|
#if 0
|
||||||
|
int nVoxels[3];
|
||||||
|
nVoxels[0] = _nVoxels[0];
|
||||||
|
nVoxels[1] = _nVoxels[1];
|
||||||
|
nVoxels[2] = _nVoxels[2];
|
||||||
|
|
||||||
|
float raster2camera[4][4];
|
||||||
|
raster2camera[0][0] = _raster2camera[0][0];
|
||||||
|
raster2camera[0][1] = _raster2camera[0][1];
|
||||||
|
raster2camera[0][2] = _raster2camera[0][2];
|
||||||
|
raster2camera[0][3] = _raster2camera[0][3];
|
||||||
|
raster2camera[1][0] = _raster2camera[1][0];
|
||||||
|
raster2camera[1][1] = _raster2camera[1][1];
|
||||||
|
raster2camera[1][2] = _raster2camera[1][2];
|
||||||
|
raster2camera[1][3] = _raster2camera[1][3];
|
||||||
|
raster2camera[2][0] = _raster2camera[2][0];
|
||||||
|
raster2camera[2][1] = _raster2camera[2][1];
|
||||||
|
raster2camera[2][2] = _raster2camera[2][2];
|
||||||
|
raster2camera[2][3] = _raster2camera[2][3];
|
||||||
|
raster2camera[3][0] = _raster2camera[3][0];
|
||||||
|
raster2camera[3][1] = _raster2camera[3][1];
|
||||||
|
raster2camera[3][2] = _raster2camera[3][2];
|
||||||
|
raster2camera[3][3] = _raster2camera[3][3];
|
||||||
|
|
||||||
|
float camera2world[4][4];
|
||||||
|
camera2world[0][0] = _camera2world[0][0];
|
||||||
|
camera2world[0][1] = _camera2world[0][1];
|
||||||
|
camera2world[0][2] = _camera2world[0][2];
|
||||||
|
camera2world[0][3] = _camera2world[0][3];
|
||||||
|
camera2world[1][0] = _camera2world[1][0];
|
||||||
|
camera2world[1][1] = _camera2world[1][1];
|
||||||
|
camera2world[1][2] = _camera2world[1][2];
|
||||||
|
camera2world[1][3] = _camera2world[1][3];
|
||||||
|
camera2world[2][0] = _camera2world[2][0];
|
||||||
|
camera2world[2][1] = _camera2world[2][1];
|
||||||
|
camera2world[2][2] = _camera2world[2][2];
|
||||||
|
camera2world[2][3] = _camera2world[2][3];
|
||||||
|
camera2world[3][0] = _camera2world[3][0];
|
||||||
|
camera2world[3][1] = _camera2world[3][1];
|
||||||
|
camera2world[3][2] = _camera2world[3][2];
|
||||||
|
camera2world[3][3] = _camera2world[3][3];
|
||||||
|
#else
|
||||||
|
#define nVoxels _nVoxels
|
||||||
|
#define raster2camera _raster2camera
|
||||||
|
#define camera2world _camera2world
|
||||||
|
#endif
|
||||||
|
|
||||||
|
int dx = 8, dy = 8; // must match value in volume_ispc_tasks
|
||||||
|
int xbuckets = (width + (dx-1)) / dx;
|
||||||
|
int ybuckets = (height + (dy-1)) / dy;
|
||||||
|
|
||||||
|
int x0 = (taskIndex % xbuckets) * dx;
|
||||||
|
int y0 = (taskIndex / xbuckets) * dy;
|
||||||
|
int x1 = x0 + dx, y1 = y0 + dy;
|
||||||
|
x1 = min(x1, width);
|
||||||
|
y1 = min(y1, height);
|
||||||
|
|
||||||
|
volume_tile(x0, y0, x1, y1, density, nVoxels, raster2camera,
|
||||||
|
camera2world, width, height, image);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
extern "C"
|
||||||
|
__global__ void
|
||||||
|
volume_ispc_tasks___export( float density[], int nVoxels[3],
|
||||||
|
const float raster2camera[4][4],
|
||||||
|
const float camera2world[4][4],
|
||||||
|
int width, int height, float image[]) {
|
||||||
|
// Launch tasks to work on (dx,dy)-sized tiles of the image
|
||||||
|
int dx = 8, dy = 8;
|
||||||
|
int nTasks = ((width+(dx-1))/dx) * ((height+(dy-1))/dy);
|
||||||
|
launch(nTasks,1,1,volume_task)
|
||||||
|
(density, nVoxels, raster2camera, camera2world,
|
||||||
|
width, height, image);
|
||||||
|
cudaDeviceSynchronize();
|
||||||
|
}
|
||||||
|
|
||||||
|
extern "C"
|
||||||
|
__host__ void
|
||||||
|
volume_ispc_tasks( float density[], int nVoxels[3],
|
||||||
|
const float raster2camera[4][4],
|
||||||
|
const float camera2world[4][4],
|
||||||
|
int width, int height, float image[]) {
|
||||||
|
volume_ispc_tasks___export<<<1,32>>>(density, nVoxels, raster2camera, camera2world, width, height,image);
|
||||||
|
cudaDeviceSynchronize();
|
||||||
|
}
|
||||||
413
examples/portable/volume_rendering/volume.ispc
Normal file
413
examples/portable/volume_rendering/volume.ispc
Normal file
@@ -0,0 +1,413 @@
|
|||||||
|
/*
|
||||||
|
Copyright (c) 2011, Intel Corporation
|
||||||
|
All rights reserved.
|
||||||
|
|
||||||
|
Redistribution and use in source and binary forms, with or without
|
||||||
|
modification, are permitted provided that the following conditions are
|
||||||
|
met:
|
||||||
|
|
||||||
|
* Redistributions of source code must retain the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer.
|
||||||
|
|
||||||
|
* Redistributions in binary form must reproduce the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer in the
|
||||||
|
documentation and/or other materials provided with the distribution.
|
||||||
|
|
||||||
|
* Neither the name of Intel Corporation nor the names of its
|
||||||
|
contributors may be used to endorse or promote products derived from
|
||||||
|
this software without specific prior written permission.
|
||||||
|
|
||||||
|
|
||||||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
|
||||||
|
IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
||||||
|
TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
||||||
|
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
|
||||||
|
OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||||
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||||
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||||
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||||
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||||
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||||
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
*/
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
typedef float<3> float3;
|
||||||
|
|
||||||
|
struct Ray {
|
||||||
|
float3 origin, dir;
|
||||||
|
};
|
||||||
|
|
||||||
|
|
||||||
|
static inline void
|
||||||
|
generateRay(const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
float x, float y, Ray &ray) {
|
||||||
|
// transform raster coordinate (x, y, 0) to camera space
|
||||||
|
float camx = raster2camera[0][0] * x + raster2camera[0][1] * y + raster2camera[0][3];
|
||||||
|
float camy = raster2camera[1][0] * x + raster2camera[1][1] * y + raster2camera[1][3];
|
||||||
|
float camz = raster2camera[2][3];
|
||||||
|
float camw = raster2camera[3][3];
|
||||||
|
camx /= camw;
|
||||||
|
camy /= camw;
|
||||||
|
camz /= camw;
|
||||||
|
|
||||||
|
ray.dir.x = camera2world[0][0] * camx + camera2world[0][1] * camy + camera2world[0][2] * camz;
|
||||||
|
ray.dir.y = camera2world[1][0] * camx + camera2world[1][1] * camy + camera2world[1][2] * camz;
|
||||||
|
ray.dir.z = camera2world[2][0] * camx + camera2world[2][1] * camy + camera2world[2][2] * camz;
|
||||||
|
|
||||||
|
ray.origin.x = camera2world[0][3] / camera2world[3][3];
|
||||||
|
ray.origin.y = camera2world[1][3] / camera2world[3][3];
|
||||||
|
ray.origin.z = camera2world[2][3] / camera2world[3][3];
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline bool
|
||||||
|
Inside(float3 p, float3 pMin, float3 pMax) {
|
||||||
|
return (p.x >= pMin.x && p.x <= pMax.x &&
|
||||||
|
p.y >= pMin.y && p.y <= pMax.y &&
|
||||||
|
p.z >= pMin.z && p.z <= pMax.z);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline bool
|
||||||
|
IntersectP(Ray ray, float3 pMin, float3 pMax, float &hit0, float &hit1) {
|
||||||
|
float t0 = -1e30, t1 = 1e30;
|
||||||
|
|
||||||
|
float3 tNear = (pMin - ray.origin) / ray.dir;
|
||||||
|
float3 tFar = (pMax - ray.origin) / ray.dir;
|
||||||
|
if (tNear.x > tFar.x) {
|
||||||
|
float tmp = tNear.x;
|
||||||
|
tNear.x = tFar.x;
|
||||||
|
tFar.x = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.x, t0);
|
||||||
|
t1 = min(tFar.x, t1);
|
||||||
|
|
||||||
|
if (tNear.y > tFar.y) {
|
||||||
|
float tmp = tNear.y;
|
||||||
|
tNear.y = tFar.y;
|
||||||
|
tFar.y = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.y, t0);
|
||||||
|
t1 = min(tFar.y, t1);
|
||||||
|
|
||||||
|
if (tNear.z > tFar.z) {
|
||||||
|
float tmp = tNear.z;
|
||||||
|
tNear.z = tFar.z;
|
||||||
|
tFar.z = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.z, t0);
|
||||||
|
t1 = min(tFar.z, t1);
|
||||||
|
|
||||||
|
if (t0 <= t1) {
|
||||||
|
hit0 = t0;
|
||||||
|
hit1 = t1;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float Lerp(float t, float a, float b) {
|
||||||
|
return (1.f - t) * a + t * b;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float D(int x, int y, int z, uniform int nVoxels[3],
|
||||||
|
uniform float density[]) {
|
||||||
|
x = clamp(x, 0, nVoxels[0]-1);
|
||||||
|
y = clamp(y, 0, nVoxels[1]-1);
|
||||||
|
z = clamp(z, 0, nVoxels[2]-1);
|
||||||
|
|
||||||
|
return density[z*nVoxels[0]*nVoxels[1] + y*nVoxels[0] + x];
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float3 Offset(float3 p, float3 pMin, float3 pMax) {
|
||||||
|
return (p - pMin) / (pMax - pMin);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float Density(float3 Pobj, float3 pMin, float3 pMax,
|
||||||
|
uniform float density[], uniform int nVoxels[3]) {
|
||||||
|
if (!Inside(Pobj, pMin, pMax))
|
||||||
|
return 0;
|
||||||
|
// Compute voxel coordinates and offsets for _Pobj_
|
||||||
|
float3 vox = Offset(Pobj, pMin, pMax);
|
||||||
|
vox.x = vox.x * nVoxels[0] - .5f;
|
||||||
|
vox.y = vox.y * nVoxels[1] - .5f;
|
||||||
|
vox.z = vox.z * nVoxels[2] - .5f;
|
||||||
|
int vx = (int)(vox.x), vy = (int)(vox.y), vz = (int)(vox.z);
|
||||||
|
float dx = vox.x - vx, dy = vox.y - vy, dz = vox.z - vz;
|
||||||
|
|
||||||
|
// Trilinearly interpolate density values to compute local density
|
||||||
|
float d00 = Lerp(dx, D(vx, vy, vz, nVoxels, density),
|
||||||
|
D(vx+1, vy, vz, nVoxels, density));
|
||||||
|
float d10 = Lerp(dx, D(vx, vy+1, vz, nVoxels, density),
|
||||||
|
D(vx+1, vy+1, vz, nVoxels, density));
|
||||||
|
float d01 = Lerp(dx, D(vx, vy, vz+1, nVoxels, density),
|
||||||
|
D(vx+1, vy, vz+1, nVoxels, density));
|
||||||
|
float d11 = Lerp(dx, D(vx, vy+1, vz+1, nVoxels, density),
|
||||||
|
D(vx+1, vy+1, vz+1, nVoxels, density));
|
||||||
|
float d0 = Lerp(dy, d00, d10);
|
||||||
|
float d1 = Lerp(dy, d01, d11);
|
||||||
|
return Lerp(dz, d0, d1);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Returns the transmittance between two points p0 and p1, in a volume
|
||||||
|
with extent (pMin,pMax) with transmittance coefficient sigma_t,
|
||||||
|
defined by nVoxels[3] voxels in each dimension in the given density
|
||||||
|
array. */
|
||||||
|
static inline float
|
||||||
|
transmittance(uniform float3 p0, float3 p1, uniform float3 pMin,
|
||||||
|
uniform float3 pMax, uniform float sigma_t,
|
||||||
|
uniform float density[], uniform int nVoxels[3]) {
|
||||||
|
float rayT0, rayT1;
|
||||||
|
Ray ray;
|
||||||
|
ray.origin = p1;
|
||||||
|
ray.dir = p0 - p1;
|
||||||
|
|
||||||
|
// Find the parametric t range along the ray that is inside the volume.
|
||||||
|
if (!IntersectP(ray, pMin, pMax, rayT0, rayT1))
|
||||||
|
return 1.;
|
||||||
|
|
||||||
|
rayT0 = max(rayT0, 0.f);
|
||||||
|
|
||||||
|
// Accumulate beam transmittance in tau
|
||||||
|
float tau = 0;
|
||||||
|
float rayLength = sqrt(ray.dir.x * ray.dir.x + ray.dir.y * ray.dir.y +
|
||||||
|
ray.dir.z * ray.dir.z);
|
||||||
|
const uniform float stepDist = 0.2;
|
||||||
|
float stepT = stepDist / rayLength;
|
||||||
|
|
||||||
|
float t = rayT0;
|
||||||
|
float3 pos = ray.origin + ray.dir * rayT0;
|
||||||
|
float3 dirStep = ray.dir * stepT;
|
||||||
|
while (t < rayT1) {
|
||||||
|
tau += stepDist * sigma_t * Density(pos, pMin, pMax, density, nVoxels);
|
||||||
|
pos = pos + dirStep;
|
||||||
|
t += stepT;
|
||||||
|
}
|
||||||
|
|
||||||
|
return exp(-tau);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float
|
||||||
|
distanceSquared(float3 a, float3 b) {
|
||||||
|
float3 d = a-b;
|
||||||
|
return d.x*d.x + d.y*d.y + d.z*d.z;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float
|
||||||
|
raymarch(uniform float density[], uniform int nVoxels[3], Ray ray) {
|
||||||
|
float rayT0, rayT1;
|
||||||
|
const uniform float3 pMin = {.3, -.2, .3}, pMax = {1.8, 2.3, 1.8};
|
||||||
|
const uniform float3 lightPos = { -1, 4, 1.5 };
|
||||||
|
|
||||||
|
if (!IntersectP(ray, pMin, pMax, rayT0, rayT1))
|
||||||
|
return 0.;
|
||||||
|
|
||||||
|
rayT0 = max(rayT0, 0.f);
|
||||||
|
|
||||||
|
// Parameters that define the volume scattering characteristics and
|
||||||
|
// sampling rate for raymarching
|
||||||
|
const uniform float Le = .25; // Emission coefficient
|
||||||
|
const uniform float sigma_a = 10; // Absorption coefficient
|
||||||
|
const uniform float sigma_s = 10; // Scattering coefficient
|
||||||
|
const uniform float stepDist = 0.025; // Ray step amount
|
||||||
|
const uniform float lightIntensity = 40; // Light source intensity
|
||||||
|
|
||||||
|
float tau = 0.f; // accumulated beam transmittance
|
||||||
|
float L = 0; // radiance along the ray
|
||||||
|
float rayLength = sqrt(ray.dir.x * ray.dir.x + ray.dir.y * ray.dir.y +
|
||||||
|
ray.dir.z * ray.dir.z);
|
||||||
|
float stepT = stepDist / rayLength;
|
||||||
|
|
||||||
|
float t = rayT0;
|
||||||
|
float3 pos = ray.origin + ray.dir * rayT0;
|
||||||
|
float3 dirStep = ray.dir * stepT;
|
||||||
|
while (t < rayT1)
|
||||||
|
{
|
||||||
|
float d = Density(pos, pMin, pMax, density, nVoxels);
|
||||||
|
|
||||||
|
// terminate once attenuation is high
|
||||||
|
float atten = exp(-tau);
|
||||||
|
if (atten < .005)
|
||||||
|
break;
|
||||||
|
|
||||||
|
// direct lighting
|
||||||
|
float Li = lightIntensity / distanceSquared(lightPos, pos) *
|
||||||
|
transmittance(lightPos, pos, pMin, pMax, sigma_a + sigma_s,
|
||||||
|
density, nVoxels);
|
||||||
|
L += stepDist * atten * d * sigma_s * (Li + Le);
|
||||||
|
|
||||||
|
// update beam transmittance
|
||||||
|
tau += stepDist * (sigma_a + sigma_s) * d;
|
||||||
|
|
||||||
|
pos = pos + dirStep;
|
||||||
|
t += stepT;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Gamma correction
|
||||||
|
return pow(L, 1.f / 2.2f);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Utility routine used by both the task-based and the single-core entrypoints.
|
||||||
|
Renders a tile of the image, covering [x0,x0) * [y0, y1), storing the
|
||||||
|
result into the image[] array.
|
||||||
|
*/
|
||||||
|
static inline void
|
||||||
|
volume_tile(uniform int x0, uniform int y0, uniform int x1,
|
||||||
|
uniform int y1, uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
// Work on 4x4=16 pixel big tiles of the image. This function thus
|
||||||
|
// implicitly assumes that both (x1-x0) and (y1-y0) are evenly divisble
|
||||||
|
// by 4.
|
||||||
|
#if 0
|
||||||
|
for (uniform int y = y0; y < y1; y += 8)
|
||||||
|
for (uniform int x = x0; x < x1; x += 8)
|
||||||
|
foreach (o = 0 ... 64)
|
||||||
|
{
|
||||||
|
// These two arrays encode the mapping from [0,15] to
|
||||||
|
// offsets within the 4x4 pixel block so that we render
|
||||||
|
// each pixel inside the block
|
||||||
|
const uniform int xoffsets[16] = { 0, 1, 0, 1, 2, 3, 2, 3,
|
||||||
|
0, 1, 0, 1, 2, 3, 2, 3 };
|
||||||
|
const uniform int yoffsets[16] = { 0, 0, 1, 1, 0, 0, 1, 1,
|
||||||
|
2, 2, 3, 3, 2, 2, 3, 3 };
|
||||||
|
|
||||||
|
const uniform int xblock[4] = {0, 4, 0, 4};
|
||||||
|
const uniform int yblock[4] = {0, 0, 4, 4};
|
||||||
|
|
||||||
|
// Figure out the pixel to render for this program instance
|
||||||
|
const int xo = x + xblock[o/16] + xoffsets[o&15];
|
||||||
|
const int yo = y + yblock[o/16] + yoffsets[o&15];
|
||||||
|
|
||||||
|
// Use viewing parameters to compute the corresponding ray
|
||||||
|
// for the pixel
|
||||||
|
Ray ray;
|
||||||
|
generateRay(raster2camera, camera2world, xo, yo, ray);
|
||||||
|
|
||||||
|
// And raymarch through the volume to compute the pixel's
|
||||||
|
// value
|
||||||
|
int offset = yo * width + xo;
|
||||||
|
if (xo < x1 && yo < y1)
|
||||||
|
image[offset] = raymarch(density, nVoxels, ray);
|
||||||
|
}
|
||||||
|
#else
|
||||||
|
foreach_tiled (y = y0 ... y1, x = x0 ... x1)
|
||||||
|
{
|
||||||
|
// Use viewing parameters to compute the corresponding ray
|
||||||
|
// for the pixel
|
||||||
|
Ray ray;
|
||||||
|
generateRay(raster2camera, camera2world, x, y, ray);
|
||||||
|
|
||||||
|
// And raymarch through the volume to compute the pixel's
|
||||||
|
// value
|
||||||
|
int offset = y * width + x;
|
||||||
|
image[offset] = raymarch(density, nVoxels, ray);
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
task void
|
||||||
|
volume_task(uniform float density[], uniform int _nVoxels[3],
|
||||||
|
const uniform float _raster2camera[4][4],
|
||||||
|
const uniform float _camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[])
|
||||||
|
{
|
||||||
|
if (taskIndex >= taskCount) return;
|
||||||
|
|
||||||
|
#if 1 /* cannot pass shared memory pointers to functions, need to find a way to solve this one :S */
|
||||||
|
uniform int nVoxels[3];
|
||||||
|
nVoxels[0] = _nVoxels[0];
|
||||||
|
nVoxels[1] = _nVoxels[1];
|
||||||
|
nVoxels[2] = _nVoxels[2];
|
||||||
|
|
||||||
|
uniform float raster2camera[4][4];
|
||||||
|
raster2camera[0][0] = _raster2camera[0][0];
|
||||||
|
raster2camera[0][1] = _raster2camera[0][1];
|
||||||
|
raster2camera[0][2] = _raster2camera[0][2];
|
||||||
|
raster2camera[0][3] = _raster2camera[0][3];
|
||||||
|
raster2camera[1][0] = _raster2camera[1][0];
|
||||||
|
raster2camera[1][1] = _raster2camera[1][1];
|
||||||
|
raster2camera[1][2] = _raster2camera[1][2];
|
||||||
|
raster2camera[1][3] = _raster2camera[1][3];
|
||||||
|
raster2camera[2][0] = _raster2camera[2][0];
|
||||||
|
raster2camera[2][1] = _raster2camera[2][1];
|
||||||
|
raster2camera[2][2] = _raster2camera[2][2];
|
||||||
|
raster2camera[2][3] = _raster2camera[2][3];
|
||||||
|
raster2camera[3][0] = _raster2camera[3][0];
|
||||||
|
raster2camera[3][1] = _raster2camera[3][1];
|
||||||
|
raster2camera[3][2] = _raster2camera[3][2];
|
||||||
|
raster2camera[3][3] = _raster2camera[3][3];
|
||||||
|
|
||||||
|
uniform float camera2world[4][4];
|
||||||
|
camera2world[0][0] = _camera2world[0][0];
|
||||||
|
camera2world[0][1] = _camera2world[0][1];
|
||||||
|
camera2world[0][2] = _camera2world[0][2];
|
||||||
|
camera2world[0][3] = _camera2world[0][3];
|
||||||
|
camera2world[1][0] = _camera2world[1][0];
|
||||||
|
camera2world[1][1] = _camera2world[1][1];
|
||||||
|
camera2world[1][2] = _camera2world[1][2];
|
||||||
|
camera2world[1][3] = _camera2world[1][3];
|
||||||
|
camera2world[2][0] = _camera2world[2][0];
|
||||||
|
camera2world[2][1] = _camera2world[2][1];
|
||||||
|
camera2world[2][2] = _camera2world[2][2];
|
||||||
|
camera2world[2][3] = _camera2world[2][3];
|
||||||
|
camera2world[3][0] = _camera2world[3][0];
|
||||||
|
camera2world[3][1] = _camera2world[3][1];
|
||||||
|
camera2world[3][2] = _camera2world[3][2];
|
||||||
|
camera2world[3][3] = _camera2world[3][3];
|
||||||
|
#else
|
||||||
|
#define nVoxels _nVoxels
|
||||||
|
#define raster2camera _raster2camera
|
||||||
|
#define camera2world _camera2world
|
||||||
|
#endif
|
||||||
|
|
||||||
|
const uniform int dx = 8, dy = 8; // must match value in volume_ispc_tasks
|
||||||
|
const uniform int xbuckets = (width + (dx-1)) / dx;
|
||||||
|
const uniform int ybuckets = (height + (dy-1)) / dy;
|
||||||
|
|
||||||
|
const uniform int x0 = (taskIndex % xbuckets) * dx;
|
||||||
|
const uniform int y0 = (taskIndex / xbuckets) * dy;
|
||||||
|
const uniform int x1 = min(x0 + dx, width);
|
||||||
|
const uniform int y1 = min(y0 + dy, height);
|
||||||
|
|
||||||
|
volume_tile(x0, y0, x1, y1, density, nVoxels, raster2camera,
|
||||||
|
camera2world, width, height, image);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
export void
|
||||||
|
volume_ispc(uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
volume_tile(0, 0, width, height, density, nVoxels, raster2camera,
|
||||||
|
camera2world, width, height, image);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
export void
|
||||||
|
volume_ispc_tasks(uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
// Launch tasks to work on (dx,dy)-sized tiles of the image
|
||||||
|
const uniform int dx = 8, dy = 8;
|
||||||
|
const uniform int nTasks = ((width+(dx-1))/dx) * ((height+(dy-1))/dy);
|
||||||
|
launch[nTasks] volume_task(density, nVoxels, raster2camera, camera2world,
|
||||||
|
width, height, image);
|
||||||
|
sync;
|
||||||
|
}
|
||||||
341
examples/portable/volume_rendering/volume.orig.ispc
Normal file
341
examples/portable/volume_rendering/volume.orig.ispc
Normal file
@@ -0,0 +1,341 @@
|
|||||||
|
/*
|
||||||
|
Copyright (c) 2011, Intel Corporation
|
||||||
|
All rights reserved.
|
||||||
|
|
||||||
|
Redistribution and use in source and binary forms, with or without
|
||||||
|
modification, are permitted provided that the following conditions are
|
||||||
|
met:
|
||||||
|
|
||||||
|
* Redistributions of source code must retain the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer.
|
||||||
|
|
||||||
|
* Redistributions in binary form must reproduce the above copyright
|
||||||
|
notice, this list of conditions and the following disclaimer in the
|
||||||
|
documentation and/or other materials provided with the distribution.
|
||||||
|
|
||||||
|
* Neither the name of Intel Corporation nor the names of its
|
||||||
|
contributors may be used to endorse or promote products derived from
|
||||||
|
this software without specific prior written permission.
|
||||||
|
|
||||||
|
|
||||||
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
|
||||||
|
IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
|
||||||
|
TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
||||||
|
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
|
||||||
|
OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
||||||
|
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
||||||
|
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
||||||
|
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
|
||||||
|
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
|
||||||
|
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||||
|
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
*/
|
||||||
|
|
||||||
|
typedef float<3> float3;
|
||||||
|
|
||||||
|
struct Ray {
|
||||||
|
float3 origin, dir;
|
||||||
|
};
|
||||||
|
|
||||||
|
|
||||||
|
static void
|
||||||
|
generateRay(const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
float x, float y, Ray &ray) {
|
||||||
|
// transform raster coordinate (x, y, 0) to camera space
|
||||||
|
float camx = raster2camera[0][0] * x + raster2camera[0][1] * y + raster2camera[0][3];
|
||||||
|
float camy = raster2camera[1][0] * x + raster2camera[1][1] * y + raster2camera[1][3];
|
||||||
|
float camz = raster2camera[2][3];
|
||||||
|
float camw = raster2camera[3][3];
|
||||||
|
camx /= camw;
|
||||||
|
camy /= camw;
|
||||||
|
camz /= camw;
|
||||||
|
|
||||||
|
ray.dir.x = camera2world[0][0] * camx + camera2world[0][1] * camy + camera2world[0][2] * camz;
|
||||||
|
ray.dir.y = camera2world[1][0] * camx + camera2world[1][1] * camy + camera2world[1][2] * camz;
|
||||||
|
ray.dir.z = camera2world[2][0] * camx + camera2world[2][1] * camy + camera2world[2][2] * camz;
|
||||||
|
|
||||||
|
ray.origin.x = camera2world[0][3] / camera2world[3][3];
|
||||||
|
ray.origin.y = camera2world[1][3] / camera2world[3][3];
|
||||||
|
ray.origin.z = camera2world[2][3] / camera2world[3][3];
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline bool
|
||||||
|
Inside(float3 p, float3 pMin, float3 pMax) {
|
||||||
|
return (p.x >= pMin.x && p.x <= pMax.x &&
|
||||||
|
p.y >= pMin.y && p.y <= pMax.y &&
|
||||||
|
p.z >= pMin.z && p.z <= pMax.z);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static bool
|
||||||
|
IntersectP(Ray ray, float3 pMin, float3 pMax, float &hit0, float &hit1) {
|
||||||
|
float t0 = -1e30, t1 = 1e30;
|
||||||
|
|
||||||
|
float3 tNear = (pMin - ray.origin) / ray.dir;
|
||||||
|
float3 tFar = (pMax - ray.origin) / ray.dir;
|
||||||
|
if (tNear.x > tFar.x) {
|
||||||
|
float tmp = tNear.x;
|
||||||
|
tNear.x = tFar.x;
|
||||||
|
tFar.x = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.x, t0);
|
||||||
|
t1 = min(tFar.x, t1);
|
||||||
|
|
||||||
|
if (tNear.y > tFar.y) {
|
||||||
|
float tmp = tNear.y;
|
||||||
|
tNear.y = tFar.y;
|
||||||
|
tFar.y = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.y, t0);
|
||||||
|
t1 = min(tFar.y, t1);
|
||||||
|
|
||||||
|
if (tNear.z > tFar.z) {
|
||||||
|
float tmp = tNear.z;
|
||||||
|
tNear.z = tFar.z;
|
||||||
|
tFar.z = tmp;
|
||||||
|
}
|
||||||
|
t0 = max(tNear.z, t0);
|
||||||
|
t1 = min(tFar.z, t1);
|
||||||
|
|
||||||
|
if (t0 <= t1) {
|
||||||
|
hit0 = t0;
|
||||||
|
hit1 = t1;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float Lerp(float t, float a, float b) {
|
||||||
|
return (1.f - t) * a + t * b;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float D(int x, int y, int z, uniform int nVoxels[3],
|
||||||
|
uniform float density[]) {
|
||||||
|
x = clamp(x, 0, nVoxels[0]-1);
|
||||||
|
y = clamp(y, 0, nVoxels[1]-1);
|
||||||
|
z = clamp(z, 0, nVoxels[2]-1);
|
||||||
|
|
||||||
|
return density[z*nVoxels[0]*nVoxels[1] + y*nVoxels[0] + x];
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float3 Offset(float3 p, float3 pMin, float3 pMax) {
|
||||||
|
return (p - pMin) / (pMax - pMin);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static float Density(float3 Pobj, float3 pMin, float3 pMax,
|
||||||
|
uniform float density[], uniform int nVoxels[3]) {
|
||||||
|
if (!Inside(Pobj, pMin, pMax))
|
||||||
|
return 0;
|
||||||
|
// Compute voxel coordinates and offsets for _Pobj_
|
||||||
|
float3 vox = Offset(Pobj, pMin, pMax);
|
||||||
|
vox.x = vox.x * nVoxels[0] - .5f;
|
||||||
|
vox.y = vox.y * nVoxels[1] - .5f;
|
||||||
|
vox.z = vox.z * nVoxels[2] - .5f;
|
||||||
|
int vx = (int)(vox.x), vy = (int)(vox.y), vz = (int)(vox.z);
|
||||||
|
float dx = vox.x - vx, dy = vox.y - vy, dz = vox.z - vz;
|
||||||
|
|
||||||
|
// Trilinearly interpolate density values to compute local density
|
||||||
|
float d00 = Lerp(dx, D(vx, vy, vz, nVoxels, density),
|
||||||
|
D(vx+1, vy, vz, nVoxels, density));
|
||||||
|
float d10 = Lerp(dx, D(vx, vy+1, vz, nVoxels, density),
|
||||||
|
D(vx+1, vy+1, vz, nVoxels, density));
|
||||||
|
float d01 = Lerp(dx, D(vx, vy, vz+1, nVoxels, density),
|
||||||
|
D(vx+1, vy, vz+1, nVoxels, density));
|
||||||
|
float d11 = Lerp(dx, D(vx, vy+1, vz+1, nVoxels, density),
|
||||||
|
D(vx+1, vy+1, vz+1, nVoxels, density));
|
||||||
|
float d0 = Lerp(dy, d00, d10);
|
||||||
|
float d1 = Lerp(dy, d01, d11);
|
||||||
|
return Lerp(dz, d0, d1);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Returns the transmittance between two points p0 and p1, in a volume
|
||||||
|
with extent (pMin,pMax) with transmittance coefficient sigma_t,
|
||||||
|
defined by nVoxels[3] voxels in each dimension in the given density
|
||||||
|
array. */
|
||||||
|
static float
|
||||||
|
transmittance(uniform float3 p0, float3 p1, uniform float3 pMin,
|
||||||
|
uniform float3 pMax, uniform float sigma_t,
|
||||||
|
uniform float density[], uniform int nVoxels[3]) {
|
||||||
|
float rayT0, rayT1;
|
||||||
|
Ray ray;
|
||||||
|
ray.origin = p1;
|
||||||
|
ray.dir = p0 - p1;
|
||||||
|
|
||||||
|
// Find the parametric t range along the ray that is inside the volume.
|
||||||
|
if (!IntersectP(ray, pMin, pMax, rayT0, rayT1))
|
||||||
|
return 1.;
|
||||||
|
|
||||||
|
rayT0 = max(rayT0, 0.f);
|
||||||
|
|
||||||
|
// Accumulate beam transmittance in tau
|
||||||
|
float tau = 0;
|
||||||
|
float rayLength = sqrt(ray.dir.x * ray.dir.x + ray.dir.y * ray.dir.y +
|
||||||
|
ray.dir.z * ray.dir.z);
|
||||||
|
uniform float stepDist = 0.2;
|
||||||
|
float stepT = stepDist / rayLength;
|
||||||
|
|
||||||
|
float t = rayT0;
|
||||||
|
float3 pos = ray.origin + ray.dir * rayT0;
|
||||||
|
float3 dirStep = ray.dir * stepT;
|
||||||
|
while (t < rayT1) {
|
||||||
|
tau += stepDist * sigma_t * Density(pos, pMin, pMax, density, nVoxels);
|
||||||
|
pos = pos + dirStep;
|
||||||
|
t += stepT;
|
||||||
|
}
|
||||||
|
|
||||||
|
return exp(-tau);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static inline float
|
||||||
|
distanceSquared(float3 a, float3 b) {
|
||||||
|
float3 d = a-b;
|
||||||
|
return d.x*d.x + d.y*d.y + d.z*d.z;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
static float
|
||||||
|
raymarch(uniform float density[], uniform int nVoxels[3], Ray ray) {
|
||||||
|
float rayT0, rayT1;
|
||||||
|
uniform float3 pMin = {.3, -.2, .3}, pMax = {1.8, 2.3, 1.8};
|
||||||
|
uniform float3 lightPos = { -1, 4, 1.5 };
|
||||||
|
|
||||||
|
cif (!IntersectP(ray, pMin, pMax, rayT0, rayT1))
|
||||||
|
return 0.;
|
||||||
|
|
||||||
|
rayT0 = max(rayT0, 0.f);
|
||||||
|
|
||||||
|
// Parameters that define the volume scattering characteristics and
|
||||||
|
// sampling rate for raymarching
|
||||||
|
uniform float Le = .25; // Emission coefficient
|
||||||
|
uniform float sigma_a = 10; // Absorption coefficient
|
||||||
|
uniform float sigma_s = 10; // Scattering coefficient
|
||||||
|
uniform float stepDist = 0.025; // Ray step amount
|
||||||
|
uniform float lightIntensity = 40; // Light source intensity
|
||||||
|
|
||||||
|
float tau = 0.f; // accumulated beam transmittance
|
||||||
|
float L = 0; // radiance along the ray
|
||||||
|
float rayLength = sqrt(ray.dir.x * ray.dir.x + ray.dir.y * ray.dir.y +
|
||||||
|
ray.dir.z * ray.dir.z);
|
||||||
|
float stepT = stepDist / rayLength;
|
||||||
|
|
||||||
|
float t = rayT0;
|
||||||
|
float3 pos = ray.origin + ray.dir * rayT0;
|
||||||
|
float3 dirStep = ray.dir * stepT;
|
||||||
|
cwhile (t < rayT1) {
|
||||||
|
float d = Density(pos, pMin, pMax, density, nVoxels);
|
||||||
|
|
||||||
|
// terminate once attenuation is high
|
||||||
|
float atten = exp(-tau);
|
||||||
|
if (atten < .005)
|
||||||
|
break;
|
||||||
|
|
||||||
|
// direct lighting
|
||||||
|
float Li = lightIntensity / distanceSquared(lightPos, pos) *
|
||||||
|
transmittance(lightPos, pos, pMin, pMax, sigma_a + sigma_s,
|
||||||
|
density, nVoxels);
|
||||||
|
L += stepDist * atten * d * sigma_s * (Li + Le);
|
||||||
|
|
||||||
|
// update beam transmittance
|
||||||
|
tau += stepDist * (sigma_a + sigma_s) * d;
|
||||||
|
|
||||||
|
pos = pos + dirStep;
|
||||||
|
t += stepT;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Gamma correction
|
||||||
|
return pow(L, 1.f / 2.2f);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
/* Utility routine used by both the task-based and the single-core entrypoints.
|
||||||
|
Renders a tile of the image, covering [x0,x0) * [y0, y1), storing the
|
||||||
|
result into the image[] array.
|
||||||
|
*/
|
||||||
|
static void
|
||||||
|
volume_tile(uniform int x0, uniform int y0, uniform int x1,
|
||||||
|
uniform int y1, uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
// Work on 4x4=16 pixel big tiles of the image. This function thus
|
||||||
|
// implicitly assumes that both (x1-x0) and (y1-y0) are evenly divisble
|
||||||
|
// by 4.
|
||||||
|
for (uniform int y = y0; y < y1; y += 4) {
|
||||||
|
for (uniform int x = x0; x < x1; x += 4) {
|
||||||
|
foreach (o = 0 ... 16) {
|
||||||
|
// These two arrays encode the mapping from [0,15] to
|
||||||
|
// offsets within the 4x4 pixel block so that we render
|
||||||
|
// each pixel inside the block
|
||||||
|
const uniform int xoffsets[16] = { 0, 1, 0, 1, 2, 3, 2, 3,
|
||||||
|
0, 1, 0, 1, 2, 3, 2, 3 };
|
||||||
|
const uniform int yoffsets[16] = { 0, 0, 1, 1, 0, 0, 1, 1,
|
||||||
|
2, 2, 3, 3, 2, 2, 3, 3 };
|
||||||
|
|
||||||
|
// Figure out the pixel to render for this program instance
|
||||||
|
int xo = x + xoffsets[o], yo = y + yoffsets[o];
|
||||||
|
|
||||||
|
// Use viewing parameters to compute the corresponding ray
|
||||||
|
// for the pixel
|
||||||
|
Ray ray;
|
||||||
|
generateRay(raster2camera, camera2world, xo, yo, ray);
|
||||||
|
|
||||||
|
// And raymarch through the volume to compute the pixel's
|
||||||
|
// value
|
||||||
|
int offset = yo * width + xo;
|
||||||
|
image[offset] = raymarch(density, nVoxels, ray);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
task void
|
||||||
|
volume_task(uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
uniform int dx = 8, dy = 8; // must match value in volume_ispc_tasks
|
||||||
|
uniform int xbuckets = (width + (dx-1)) / dx;
|
||||||
|
uniform int ybuckets = (height + (dy-1)) / dy;
|
||||||
|
|
||||||
|
uniform int x0 = (taskIndex % xbuckets) * dx;
|
||||||
|
uniform int y0 = (taskIndex / xbuckets) * dy;
|
||||||
|
uniform int x1 = x0 + dx, y1 = y0 + dy;
|
||||||
|
x1 = min(x1, width);
|
||||||
|
y1 = min(y1, height);
|
||||||
|
|
||||||
|
volume_tile(x0, y0, x1, y1, density, nVoxels, raster2camera,
|
||||||
|
camera2world, width, height, image);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
export void
|
||||||
|
volume_ispc(uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
volume_tile(0, 0, width, height, density, nVoxels, raster2camera,
|
||||||
|
camera2world, width, height, image);
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
export void
|
||||||
|
volume_ispc_tasks(uniform float density[], uniform int nVoxels[3],
|
||||||
|
const uniform float raster2camera[4][4],
|
||||||
|
const uniform float camera2world[4][4],
|
||||||
|
uniform int width, uniform int height, uniform float image[]) {
|
||||||
|
// Launch tasks to work on (dx,dy)-sized tiles of the image
|
||||||
|
uniform int dx = 8, dy = 8;
|
||||||
|
uniform int nTasks = ((width+(dx-1))/dx) * ((height+(dy-1))/dy);
|
||||||
|
launch[nTasks] volume_task(density, nVoxels, raster2camera, camera2world,
|
||||||
|
width, height, image);
|
||||||
|
}
|
||||||
34
examples/portable/volume_rendering/volume.vcxproj
Normal file
34
examples/portable/volume_rendering/volume.vcxproj
Normal file
@@ -0,0 +1,34 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<Project DefaultTargets="Build" ToolsVersion="4.0" xmlns="http://schemas.microsoft.com/developer/msbuild/2003">
|
||||||
|
<ItemGroup Label="ProjectConfigurations">
|
||||||
|
<ProjectConfiguration Include="Debug|Win32">
|
||||||
|
<Configuration>Debug</Configuration>
|
||||||
|
<Platform>Win32</Platform>
|
||||||
|
</ProjectConfiguration>
|
||||||
|
<ProjectConfiguration Include="Debug|x64">
|
||||||
|
<Configuration>Debug</Configuration>
|
||||||
|
<Platform>x64</Platform>
|
||||||
|
</ProjectConfiguration>
|
||||||
|
<ProjectConfiguration Include="Release|Win32">
|
||||||
|
<Configuration>Release</Configuration>
|
||||||
|
<Platform>Win32</Platform>
|
||||||
|
</ProjectConfiguration>
|
||||||
|
<ProjectConfiguration Include="Release|x64">
|
||||||
|
<Configuration>Release</Configuration>
|
||||||
|
<Platform>x64</Platform>
|
||||||
|
</ProjectConfiguration>
|
||||||
|
</ItemGroup>
|
||||||
|
<PropertyGroup Label="Globals">
|
||||||
|
<ProjectGuid>{dee5733a-e93e-449d-9114-9bffcaeb4df9}</ProjectGuid>
|
||||||
|
<Keyword>Win32Proj</Keyword>
|
||||||
|
<RootNamespace>volume</RootNamespace>
|
||||||
|
<ISPC_file>volume</ISPC_file>
|
||||||
|
<default_targets>sse2,sse4-x2,avx1-i32x8</default_targets>
|
||||||
|
</PropertyGroup>
|
||||||
|
<Import Project="..\common.props" />
|
||||||
|
<ItemGroup>
|
||||||
|
<ClCompile Include="volume.cpp" />
|
||||||
|
<ClCompile Include="volume_serial.cpp" />
|
||||||
|
<ClCompile Include="../tasksys.cpp" />
|
||||||
|
</ItemGroup>
|
||||||
|
</Project>
|
||||||
Reference in New Issue
Block a user