Skip to content

Commit be0698e

Browse files
committed
Update movmatrix.cu
Update LIT test.
1 parent e99cbec commit be0698e

File tree

1 file changed

+3
-4
lines changed

1 file changed

+3
-4
lines changed

clang/test/dpct/asm/movmatrix.cu

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
// UNSUPPORTED: cuda-8.0, cuda-9.0, cuda-9.1, cuda-9.2, cuda-10.0, cuda-10.1, cuda-10.2
22
// UNSUPPORTED: v8.0, v9.0, v9.1, v9.2, v10.0, v10.1, v10.2
3-
// RUN: dpct --format-range=none -out-root %T/mov %s --cuda-include-path="%cuda-path/include" -- -std=c++14 -x cuda --cuda-host-only
3+
// RUN: dpct --format-range=none -out-root %T/movmatrix %s --cuda-include-path="%cuda-path/include" -- -std=c++14 -x cuda --cuda-host-only
44
// RUN: FileCheck %s --match-full-lines --input-file %T/movmatrix/movmatrix.dp.cpp
55
// RUN: %if build_lit %{icpx -c -fsycl %T/movmatrix/movmatrix.dp.cpp -o %T/movmatrix/movmatrix.dp.o %}
66

@@ -18,10 +18,9 @@ using bf16_2 = __nv_bfloat162;
1818
// Only .m8n8.b16
1919
//
2020

21-
__device__ inline void movmatrix(bf16_2 &dst, const bf16_2 &src) {
22-
23-
// CHECK: dpct::experimental::matrix::movmatrix(*(uint32_t *)(&dst), (*(uint32_t *)(&src)));;
21+
__global__ void movmatrix(bf16_2 &dst, const bf16_2 &src) {
2422

23+
// CHECK: dpct::experimental::matrix::movmatrix(*(uint32_t *)(&dst), (*(uint32_t *)(&src)));
2524
asm volatile("movmatrix.sync.aligned.m8n8.trans.b16 %0, %1;\n"
2625
: "+r"(*(uint32_t *)(&dst))
2726
: "r"(*(uint32_t *)(&src)));

0 commit comments

Comments (0)