We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents 46a6cac + b6c3b69 commit 430e559Copy full SHA for 430e559
paddle/fluid/platform/cuda_device_function.h
@@ -53,10 +53,12 @@ inline static int RoundToPowerOfTwo(int dim) {
53
__VA_ARGS__; \
54
} break
55
56
-#define CUDA_LAUNCH_KERNEL_HELPER(...) \
57
- CUDA_LAUNCH_KERNEL_BASE(256, ##__VA_ARGS__); \
58
- CUDA_LAUNCH_KERNEL_BASE(128, ##__VA_ARGS__); \
59
- CUDA_LAUNCH_KERNEL_BASE(64, ##__VA_ARGS__); \
+#define CUDA_LAUNCH_KERNEL_HELPER(...) \
+ CUDA_LAUNCH_KERNEL_BASE(1024, ##__VA_ARGS__); \
+ CUDA_LAUNCH_KERNEL_BASE(512, ##__VA_ARGS__); \
+ CUDA_LAUNCH_KERNEL_BASE(256, ##__VA_ARGS__); \
60
+ CUDA_LAUNCH_KERNEL_BASE(128, ##__VA_ARGS__); \
61
+ CUDA_LAUNCH_KERNEL_BASE(64, ##__VA_ARGS__); \
62
CUDA_LAUNCH_KERNEL_BASE(32, ##__VA_ARGS__);
63
64
template <typename T>
0 commit comments