|
9 | 9 | #include <tuple> |
10 | 10 | #include <utility> |
11 | 11 | #include <variant> |
12 | | -#ifdef alpaka_ACC_GPU_CUDA_ENABLED |
| 12 | +#ifdef ALPAKA_ACC_GPU_CUDA_ENABLED |
13 | 13 | # include <cuda_runtime.h> |
14 | 14 | #endif // ALPAKA_ACC_GPU_CUDA_ENABLED |
15 | 15 |
|
@@ -41,8 +41,11 @@ namespace membenchmc::Actions { |
41 | 41 | auto makeExecutionDetails() { |
42 | 42 | auto const platformAcc = alpaka::Platform<Acc>{}; |
43 | 43 | auto const dev = alpaka::getDevByIdx(platformAcc, 0); |
| 44 | +#ifdef ALPAKA_ACC_GPU_CUDA_ENABLED |
| 45 | + cudaDeviceSetLimit(cudaLimitMallocHeapSize, 1024U * 1024U * 1024U); |
| 46 | +#endif |
44 | 47 | uint32_t const numThreadsPerBlock = 256U; |
45 | | - uint32_t const numThreads = 8U * numThreadsPerBlock; |
| 48 | + uint32_t const numThreads = 4U * numThreadsPerBlock; |
46 | 49 | auto workdiv = [numThreads, numThreadsPerBlock]() -> alpaka::WorkDivMembers<Dim, Idx> { |
47 | 50 | if constexpr (std::is_same_v<alpaka::AccToTag<Acc>, alpaka::TagCpuSerial>) { |
48 | 51 | return {{1U}, {1U}, {numThreads}}; |
@@ -175,8 +178,6 @@ struct IotaReductionChecker { |
175 | 178 | if (range.data() == nullptr) { |
176 | 179 | return std::make_tuple(Actions::CHECK, Payload(std::make_pair(false, Reason::nullpointer))); |
177 | 180 | } |
178 | | - static_assert(decltype(isSpan(range))::value, |
179 | | - "We expected a span pointing to the allocated memory here."); |
180 | 181 | auto uintRange = convertDataType<uint32_t>(range); |
181 | 182 | std::iota(std::begin(uintRange), std::end(uintRange), currentValue); |
182 | 183 | size_t n = uintRange.size(); |
@@ -222,7 +223,7 @@ template <typename T> struct AcumulateChecksProvider { |
222 | 223 | namespace setups { |
223 | 224 | struct SingleSizeMallocRecipe { |
224 | 225 | static constexpr std::uint32_t allocationSize{ALLOCATION_SIZE}; |
225 | | - static constexpr std::uint32_t numAllocations{16U}; |
| 226 | + static constexpr std::uint32_t numAllocations{256U}; |
226 | 227 | std::array<std::byte*, numAllocations> pointers{{}}; |
227 | 228 | std::uint32_t counter{0U}; |
228 | 229 |
|
|
0 commit comments