Skip to content

Commit c4c8083

Browse files
committed
fixup! [DirectX] Use scalar arguments for @llvm.dx.dot intrinsics
1 parent 1fa97b4 commit c4c8083

File tree

1 file changed

+8
-2
lines changed

1 file changed

+8
-2
lines changed

clang/test/CodeGenDirectX/Builtins/dot2add.c

Lines changed: 8 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,13 @@ typedef half half2 __attribute__((ext_vector_type(2)));
17 17
// CHECK-NEXT: [[TMP0:%.*]] = load <2 x half>, ptr [[X_ADDR]], align 4
18 18
// CHECK-NEXT: [[TMP1:%.*]] = load <2 x half>, ptr [[Y_ADDR]], align 4
19 19
// CHECK-NEXT: [[TMP2:%.*]] = load float, ptr [[Z_ADDR]], align 4
20-
// CHECK-NEXT: [[DX_DOT2ADD:%.*]] = call float @llvm.dx.dot2add.v2f16(<2 x half> [[TMP0]], <2 x half> [[TMP1]], float [[TMP2]])
20+
// CHECK-NEXT: [[TMP3:%.*]] = extractelement <2 x half> [[TMP0]], i32 0
21+
// CHECK-NEXT: [[TMP4:%.*]] = extractelement <2 x half> [[TMP0]], i32 1
22+
// CHECK-NEXT: [[TMP5:%.*]] = extractelement <2 x half> [[TMP1]], i32 0
23+
// CHECK-NEXT: [[TMP6:%.*]] = extractelement <2 x half> [[TMP1]], i32 1
24+
// CHECK-NEXT: [[DX_DOT2ADD:%.*]] = call float @llvm.dx.dot2add(float [[TMP2]], half [[TMP3]], half [[TMP4]], half [[TMP5]], half [[TMP6]])
21 25
// CHECK-NEXT: ret float [[DX_DOT2ADD]]
22 26
//
23-
float test_dot2add(half2 X, half2 Y, float Z) { return __builtin_dx_dot2add(X, Y, Z); }
27+
float test_dot2add(half2 X, half2 Y, float Z) {
28+
return __builtin_dx_dot2add(X, Y, Z);
29+
}

0 commit comments

Comments
 (0)