|
5 | 5 | // RUN: %cladclang_cuda -Xclang -plugin-arg-clad -Xclang -disable-tbr -I%S/../../include --cuda-path=%cudapath \ |
6 | 6 | // RUN: --cuda-gpu-arch=%cudaarch %cudaldflags -oGradientKernels.out %s |
7 | 7 | // |
8 | | -// RUN: ./GradientKernels.out | %filecheck_exec %s |
| 8 | +// RUN: %cudarun ./GradientKernels.out | %filecheck_exec %s |
9 | 9 | // |
10 | 10 | // REQUIRES: cuda-runtime |
11 | 11 |
|
@@ -1019,11 +1019,11 @@ __global__ void injective_reassignment_loop(int *a) { |
1019 | 1019 |
|
1020 | 1020 | int main(void) { |
1021 | 1021 | int *a, *d_a; |
1022 | | - cudaMalloc(&a, sizeof(int)); |
1023 | | - cudaMalloc(&d_a, sizeof(int)); |
| 1022 | + cudaMalloc(&a, 2 * sizeof(int)); |
| 1023 | + cudaMalloc(&d_a, 2 * sizeof(int)); |
1024 | 1024 |
|
1025 | | - TEST(kernel, dim3(1), dim3(1), 0, false, a, d_a, 1); // CHECK-EXEC: 10 |
1026 | | - TEST(kernel, dim3(1), dim3(1), 0, true, a, d_a, 1); // CHECK-EXEC: 10 |
| 1025 | + TEST(kernel, dim3(1), dim3(1), 0, false, a, d_a, 2); // CHECK-EXEC: 10 |
| 1026 | + TEST(kernel, dim3(1), dim3(1), 0, true, a, d_a, 2); // CHECK-EXEC: 10 |
1027 | 1027 |
|
1028 | 1028 | auto error = clad::gradient(fake_kernel); |
1029 | 1029 | error.execute_kernel(dim3(1), dim3(1), a, d_a); // CHECK-EXEC: Use execute() for non-global CUDA kernels |
@@ -1146,12 +1146,12 @@ int main(void) { |
1146 | 1146 | TEST_2(indices_lin_comb, dim3(1), dim3(5, 1, 1), 0, false, "out, in", dummy_out, dummy_in, d_out, d_in, 5); // CHECK-EXEC: 20, 25, 45, 15, 15 |
1147 | 1147 |
|
1148 | 1148 | int *n, *d_n; |
1149 | | - cudaMalloc(&n, sizeof(int)); |
1150 | | - cudaMalloc(&d_n, sizeof(int)); |
| 1149 | + cudaMalloc(&n, 2 * sizeof(int)); |
| 1150 | + cudaMalloc(&d_n, 2 * sizeof(int)); |
1151 | 1151 |
|
1152 | | - TEST(kernel_device_injective, dim3(1), dim3(1), 0, false, n, d_n, 1); // CHECK-EXEC: 4 |
1153 | | - TEST(injective_reassignment, dim3(1), dim3(1), 0, false, n, d_n, 1); // CHECK-EXEC: 1 |
1154 | | - TEST(injective_reassignment_loop, dim3(1), dim3(1), 0, false, n, d_n, 1); // CHECK-EXEC: 1 |
| 1152 | + TEST(kernel_device_injective, dim3(1), dim3(1), 0, false, n, d_n, 2); // CHECK-EXEC: 4 |
| 1153 | + TEST(injective_reassignment, dim3(1), dim3(1), 0, false, n, d_n, 2); // CHECK-EXEC: 1 |
| 1154 | + TEST(injective_reassignment_loop, dim3(1), dim3(1), 0, false, n, d_n,2); // CHECK-EXEC: 1 |
1155 | 1155 |
|
1156 | 1156 | cudaFree(dummy_in); |
1157 | 1157 | cudaFree(dummy_out); |
|
0 commit comments