|
4 | 4 | typedef float float4 __attribute__((ext_vector_type(4))); |
5 | 5 | typedef float float16 __attribute__((ext_vector_type(16))); |
6 | 6 | typedef half half8 __attribute__((ext_vector_type(8))); |
| 7 | +typedef half half16 __attribute__((ext_vector_type(16))); |
7 | 8 | typedef __bf16 bfloat8 __attribute__((ext_vector_type(8))); |
| 9 | +typedef __bf16 bfloat16 __attribute__((ext_vector_type(16))); |
| 10 | +typedef unsigned int uint2 __attribute__((ext_vector_type(2))); |
| 11 | +typedef int int4 __attribute__((ext_vector_type(4))); |
| 12 | +typedef int int8 __attribute__((ext_vector_type(8))); |
| 13 | +typedef int int16 __attribute__((ext_vector_type(16))); |
8 | 14 |
|
9 | 15 | void test(__global float4* out0, half8 a0, half8 b0, float4 c0, |
10 | 16 | __global float16* out1, half8 a1, half8 b1, float16 c1, |
11 | | - __global float16* out2, bfloat8 a2, bfloat8 b2, float16 c2) { |
| 17 | + __global float16* out2, bfloat8 a2, bfloat8 b2, float16 c2, |
| 18 | + __global int4* out3, int4 a3, int4 b3, int4 c3, |
| 19 | + __global int16* out4, int4 a4, int4 b4, int16 c4, |
| 20 | + __global float4* out5, bfloat8 a5, bfloat8 b5, float4 c5, |
| 21 | + __global float4* out6, half8 a6, half16 b6, float4 c6, |
| 22 | + __global float16* out7, half8 a7, half16 b7, float16 c7, |
| 23 | + __global float4* out8, bfloat8 a8, bfloat16 b8, float4 c8, |
| 24 | + __global float16* out9, bfloat8 a9, bfloat16 b9, float16 c9, |
| 25 | + __global int4* out10, int4 a10, int8 b10, int4 c10, |
| 26 | + __global int16* out11, int4 a11, int8 b11, int16 c11, |
| 27 | + __global float4* out12, int4 a12, int8 b12, float4 c12, |
| 28 | + __global float16* out13, int4 a13, int8 b13, float16 c13, |
| 29 | + __global float4* out14, int8 a14, int8 b14, float4 c14, int d14, int e14, |
| 30 | + __global float16* out15, int8 a15, int8 b15, float16 c15, int d15, int e15) { |
12 | 31 | *out0 = __builtin_amdgcn_mfma_f32_16x16x32_f16(a0, b0, c0, 0, 0, 0); // expected-error{{'__builtin_amdgcn_mfma_f32_16x16x32_f16' needs target feature gfx950-insts}} |
13 | 32 | *out1 = __builtin_amdgcn_mfma_f32_32x32x16_f16(a1, b1, c1, 0, 0, 0); // expected-error{{'__builtin_amdgcn_mfma_f32_32x32x16_f16' needs target feature gfx950-insts}} |
14 | 33 | *out2 = __builtin_amdgcn_mfma_f32_32x32x16_bf16(a2, b2, c2, 0, 0, 0); // expected-error{{'__builtin_amdgcn_mfma_f32_32x32x16_bf16' needs target feature gfx950-insts}} |
| 34 | + *out14 = __builtin_amdgcn_mfma_scale_f32_16x16x128_f8f6f4(a14, b14, c14, 0, 0, 0, d14, 0, e14); // expected-error{{'__builtin_amdgcn_mfma_scale_f32_16x16x128_f8f6f4' needs target feature gfx950-insts}} |
| 35 | + *out15 = __builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4(a15, b15, c15, 0, 0, 0, d15, 0, e15); // expected-error{{'__builtin_amdgcn_mfma_scale_f32_32x32x64_f8f6f4' needs target feature gfx950-insts}} |
15 | 36 | } |
0 commit comments