annotate paper/src/cuLaunchKernel.cbc @ 2:c7acb9211784

add code, figure. and paper fix content
author ryokka
date Mon, 27 Jan 2020 20:41:36 +0900
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
/*
 * Pick the number of threads to use along one dimension of a CUDA block.
 *
 * count             - number of work items along this dimension
 * maxThreadPerBlock - upper bound on the value returned
 *
 * Returns the smaller of count and maxThreadPerBlock, clamped to at least 1.
 */
int computeblockDim(int count, int maxThreadPerBlock) {
    int dim = count < maxThreadPerBlock ? count : maxThreadPerBlock;

    // The caller divides an extent by this value and hands it to
    // cuLaunchKernel as a block dimension, so it must never be zero or
    // negative (an empty extent or a zero limit would otherwise yield 0).
    return dim < 1 ? 1 : dim;
}
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
4
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
5 __code execCUDAExecutor(struct CUDAExecutor* executor, struct Context* task, __code next(...)) {
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
6 // check data parallelism task
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
7 if (task->iterate) {
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
8 struct MultiDimIterator* iterator = &task->iterator->iterator->MultiDimIterator;
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
9
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
10 // compute block thread size
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
11 int blockDimX = computeblockDim(iterator->x, executor->maxThreadPerBlock);
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
12 int blockDimY = computeblockDim(iterator->y, executor->maxThreadPerBlock);
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
13 int blockDimZ = computeblockDim(iterator->z, executor->maxThreadPerBlock);
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
14
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
15 checkCudaErrors(cuLaunchKernel(task->function,
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
16 iterator->x/blockDimX, iterator->y/blockDimY, iterator->z/blockDimZ,
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
17 blockDimX, blockDimY, blockDimZ,
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
18 0, NULL, (void**)executor->kernelParams, NULL));
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
19 }
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
20 ...
c7acb9211784 add code, figure. and paper fix content
ryokka
parents:
diff changeset
21 }