We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 022b909, commit 9e9cb6f. Copy full SHA for 9e9cb6f
cuda/include/cuda_utils.h
@@ -10,7 +10,7 @@
10
11
#include <vector>
12
13
-#define TOTAL_THREADS 512
+#define TOTAL_THREADS 1024
14
15
inline int opt_n_threads(int work_size) {
16
const int pow_2 = std::log(static_cast<double>(work_size)) / std::log(2.0);
0 commit comments