|
33 | 33 | define amdgpu_kernel void @test_mfma_f32_16x16x2bf16(ptr addrspace(1) %arg) #0 { |
34 | 34 | bb: |
35 | 35 | %in.1 = load <16 x float>, ptr addrspace(1) %arg |
36 | | - %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.16x16x2bf16(<2 x i16> undef, <2 x i16> undef, <16 x float> %in.1, i32 0, i32 0, i32 0) |
| 36 | + %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.16x16x2bf16(<2 x i16> poison, <2 x i16> poison, <16 x float> %in.1, i32 0, i32 0, i32 0) |
37 | 37 | store <16 x float> %mai.1, ptr addrspace(1) %arg |
38 | 38 | ret void |
39 | 39 | } |
|
43 | 43 | define amdgpu_kernel void @test_mfma_f32_4x4x2bf16(ptr addrspace(1) %arg) #0 { |
44 | 44 | bb: |
45 | 45 | %in.1 = load <4 x float>, ptr addrspace(1) %arg |
46 | | - %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.4x4x2bf16(<2 x i16> undef, <2 x i16> undef, <4 x float> %in.1, i32 0, i32 0, i32 0) |
| 46 | + %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.4x4x2bf16(<2 x i16> poison, <2 x i16> poison, <4 x float> %in.1, i32 0, i32 0, i32 0) |
47 | 47 | store <4 x float> %mai.1, ptr addrspace(1) %arg |
48 | 48 | ret void |
49 | 49 | } |
|
53 | 53 | define amdgpu_kernel void @test_mfma_f32_32x32x4bf16(ptr addrspace(1) %arg) #0 { |
54 | 54 | bb: |
55 | 55 | %in.1 = load <16 x float>, ptr addrspace(1) %arg |
56 | | - %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.32x32x4bf16(<2 x i16> undef, <2 x i16> undef, <16 x float> %in.1, i32 0, i32 0, i32 0) |
| 56 | + %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.32x32x4bf16(<2 x i16> poison, <2 x i16> poison, <16 x float> %in.1, i32 0, i32 0, i32 0) |
57 | 57 | store <16 x float> %mai.1, ptr addrspace(1) %arg |
58 | 58 | ret void |
59 | 59 | } |
|
63 | 63 | define amdgpu_kernel void @test_mfma_f32_16x16x8bf16(ptr addrspace(1) %arg) #0 { |
64 | 64 | bb: |
65 | 65 | %in.1 = load <4 x float>, ptr addrspace(1) %arg |
66 | | - %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.16x16x8bf16(<2 x i16> undef, <2 x i16> undef, <4 x float> %in.1, i32 0, i32 0, i32 0) |
| 66 | + %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.16x16x8bf16(<2 x i16> poison, <2 x i16> poison, <4 x float> %in.1, i32 0, i32 0, i32 0) |
67 | 67 | store <4 x float> %mai.1, ptr addrspace(1) %arg |
68 | 68 | ret void |
69 | 69 | } |
|
73 | 73 | define amdgpu_kernel void @test_mfma_f32_32x32x4bf16_1k(ptr addrspace(1) %arg) #0 { |
74 | 74 | bb: |
75 | 75 | %in.1 = load <32 x float>, ptr addrspace(1) %arg |
76 | | - %mai.1 = tail call <32 x float> @llvm.amdgcn.mfma.f32.32x32x4bf16.1k(<4 x i16> undef, <4 x i16> undef, <32 x float> %in.1, i32 0, i32 0, i32 0) |
| 76 | + %mai.1 = tail call <32 x float> @llvm.amdgcn.mfma.f32.32x32x4bf16.1k(<4 x i16> poison, <4 x i16> poison, <32 x float> %in.1, i32 0, i32 0, i32 0) |
77 | 77 | store <32 x float> %mai.1, ptr addrspace(1) %arg |
78 | 78 | ret void |
79 | 79 | } |
|
83 | 83 | define amdgpu_kernel void @test_mfma_f32_16x16x4bf16_1k(ptr addrspace(1) %arg) #0 { |
84 | 84 | bb: |
85 | 85 | %in.1 = load <16 x float>, ptr addrspace(1) %arg |
86 | | - %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.16x16x4bf16.1k(<4 x i16> undef, <4 x i16> undef, <16 x float> %in.1, i32 0, i32 0, i32 0) |
| 86 | + %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.16x16x4bf16.1k(<4 x i16> poison, <4 x i16> poison, <16 x float> %in.1, i32 0, i32 0, i32 0) |
87 | 87 | store <16 x float> %mai.1, ptr addrspace(1) %arg |
88 | 88 | ret void |
89 | 89 | } |
|
93 | 93 | define amdgpu_kernel void @test_mfma_f32_4x4x4bf16_1k(ptr addrspace(1) %arg) #0 { |
94 | 94 | bb: |
95 | 95 | %in.1 = load <4 x float>, ptr addrspace(1) %arg |
96 | | - %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.4x4x4bf16.1k(<4 x i16> undef, <4 x i16> undef, <4 x float> %in.1, i32 0, i32 0, i32 0) |
| 96 | + %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.4x4x4bf16.1k(<4 x i16> poison, <4 x i16> poison, <4 x float> %in.1, i32 0, i32 0, i32 0) |
97 | 97 | store <4 x float> %mai.1, ptr addrspace(1) %arg |
98 | 98 | ret void |
99 | 99 | } |
|
103 | 103 | define amdgpu_kernel void @test_mfma_f32_32x32x8bf16_1k(ptr addrspace(1) %arg) #0 { |
104 | 104 | bb: |
105 | 105 | %in.1 = load <16 x float>, ptr addrspace(1) %arg |
106 | | - %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.32x32x8bf16.1k(<4 x i16> undef, <4 x i16> undef, <16 x float> %in.1, i32 0, i32 0, i32 0) |
| 106 | + %mai.1 = tail call <16 x float> @llvm.amdgcn.mfma.f32.32x32x8bf16.1k(<4 x i16> poison, <4 x i16> poison, <16 x float> %in.1, i32 0, i32 0, i32 0) |
107 | 107 | store <16 x float> %mai.1, ptr addrspace(1) %arg |
108 | 108 | ret void |
109 | 109 | } |
|
113 | 113 | define amdgpu_kernel void @test_mfma_f32_16x16x16bf16_1k(ptr addrspace(1) %arg) #0 { |
114 | 114 | bb: |
115 | 115 | %in.1 = load <4 x float>, ptr addrspace(1) %arg |
116 | | - %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.16x16x16bf16.1k(<4 x i16> undef, <4 x i16> undef, <4 x float> %in.1, i32 0, i32 0, i32 0) |
| 116 | + %mai.1 = tail call <4 x float> @llvm.amdgcn.mfma.f32.16x16x16bf16.1k(<4 x i16> poison, <4 x i16> poison, <4 x float> %in.1, i32 0, i32 0, i32 0) |
117 | 117 | store <4 x float> %mai.1, ptr addrspace(1) %arg |
118 | 118 | ret void |
119 | 119 | } |
|
0 commit comments