Mercurial > hg > Papers > 2022 > soto-sigos
view Paper/src/cuLaunchKernel.cbc @ 14:ba98083f9853 default tip
FIX
author | soto <soto@cr.ie.u-ryukyu.ac.jp> |
---|---|
date | Fri, 27 May 2022 12:31:39 +0900 |
parents | 14a0e409d574 |
children |
line wrap: on
line source
int computeblockDim(int count, int maxThreadPerBlock) { return count < maxThreadPerBlock ? count : maxThreadPerBlock; } __code execCUDAExecutor(struct CUDAExecutor* executor, struct Context* task, __code next(...)) { // check data parallelism task if (task->iterate) { struct MultiDimIterator* iterator = &task->iterator->iterator->MultiDimIterator; // compute block thread size int blockDimX = computeblockDim(iterator->x, executor->maxThreadPerBlock); int blockDimY = computeblockDim(iterator->y, executor->maxThreadPerBlock); int blockDimZ = computeblockDim(iterator->z, executor->maxThreadPerBlock); checkCudaErrors(cuLaunchKernel(task->function, iterator->x/blockDimX, iterator->y/blockDimY, iterator->z/blockDimZ, blockDimX, blockDimY, blockDimZ, 0, NULL, (void**)executor->kernelParams, NULL)); } ... }