Hand-wired CDP (CUDA Dynamic Parallelism) launch

This commit is contained in:
Evghenii
2013-11-12 11:25:43 +01:00
parent 4e5299a9bf
commit f445a470df
2 changed files with 10 additions and 3 deletions

View File

@@ -417,6 +417,11 @@ void ao_ispc_tasks(
const int nby = ntiley;
const int nbz = 1;
const dim3 blocks (nbx, nby, nbz);
ao_task<<<blocks, 128>>>(w,h,nsubsamples,image);
if (threadIdx.x == 0)
{
printf(" --- using CDP -- \n");
ao_task<<<blocks, 128>>>(w,h,nsubsamples,image);
}
cudaDeviceSynchronize();
}
#endif

View File

@@ -340,8 +340,10 @@ extern "C"
const char * module = &module_str[0];
#endif
CUmodule cudaModule = loadModule(module);
CUfunction cudaFunction = getFunction(cudaModule, func_name);
deviceLaunch(cudaFunction, countx, county, countz, func_args);
// CUfunction cudaFunction = getFunction(cudaModule, func_name);
// deviceLaunch(cudaFunction, countx, county, countz, func_args);
CUfunction cudaFunction = getFunction(cudaModule, "ao_ispc_tasks");
deviceLaunch(cudaFunction, 1, 1, 1, func_args);
unloadModule(cudaModule);
}
void CUDASync(void *handle)