We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b09ce70, commit bbe8597 (Copy full SHA for bbe8597)
examples/plain-malloc/source/main.cpp
@@ -45,7 +45,7 @@ auto makeExecutionDetails() {
45
cudaDeviceSetLimit(cudaLimitMallocHeapSize, 1024U * 1024U * 1024U);
46
#endif
47
uint32_t const numThreadsPerBlock = 256U;
48
- uint32_t const numThreads = 4U * numThreadsPerBlock;
+ uint32_t const numThreads = 16U * numThreadsPerBlock;
49
auto workdiv = [numThreads, numThreadsPerBlock]() -> alpaka::WorkDivMembers<Dim, Idx> {
50
if constexpr (std::is_same_v<alpaka::AccToTag<Acc>, alpaka::TagCpuSerial>) {
51
return {{1U}, {1U}, {numThreads}};
0 commit comments