We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 8d7e2f8, commit d68d0b8 (Copy full SHA for d68d0b8)
1 file changed
src/infiniop/ops/sum/nvidia/sum_nvidia.cu
@@ -107,6 +107,8 @@ infiniStatus_t Descriptor::calculate(
107
CALCULATE_SUM_WITH_BLOCK_SIZE(CUDA_BLOCK_SIZE_1024)
108
} else if (_opaque->internal->maxThreadsPerBlock() == CUDA_BLOCK_SIZE_512) {
109
CALCULATE_SUM_WITH_BLOCK_SIZE(CUDA_BLOCK_SIZE_512)
110
+ } else if (_opaque->internal->maxThreadsPerBlock() == CUDA_BLOCK_SIZE_2048) {
111
+ CALCULATE_SUM_WITH_BLOCK_SIZE(CUDA_BLOCK_SIZE_2048)
112
} else if (_opaque->internal->maxThreadsPerBlock() == CUDA_BLOCK_SIZE_4096) {
113
CALCULATE_SUM_WITH_BLOCK_SIZE(CUDA_BLOCK_SIZE_4096)
114
} else {
0 commit comments