|
1 | 1 | // NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --version 5 |
2 | | -// RUN: %clang_cc1 -triple arm64-none-linux-gnu -target-feature +neon -target-feature +fullfp16 -target-feature +v8.6a -target-feature +i8mm \ |
| 2 | +// RUN: %clang_cc1 -triple arm64-none-linux-gnu -target-feature +neon -target-feature +fullfp16 -target-feature +v8.6a -target-feature +i8mm -target-feature +f8f16mm -target-feature +f8f32mm -target-feature +fp8 \ |
3 | 3 | // RUN: -disable-O0-optnone -emit-llvm -o - %s \ |
4 | 4 | // RUN: | opt -S -passes=mem2reg,sroa \ |
5 | 5 | // RUN: | FileCheck %s |
@@ -32,6 +32,31 @@ uint32x4_t test_vmmlaq_u32(uint32x4_t r, uint8x16_t a, uint8x16_t b) { |
32 | 32 | return vmmlaq_u32(r, a, b); |
33 | 33 | } |
34 | 34 |
|
| 35 | +// CHECK-LABEL: define dso_local <8 x half> @test_vmmlaq_f16_mf8( |
| 36 | +// CHECK-SAME: <8 x half> noundef [[P0:%.*]], <16 x i8> [[P1:%.*]], <16 x i8> [[P2:%.*]], i64 noundef [[P3:%.*]]) #[[ATTR0]] { |
| 37 | +// CHECK-NEXT: [[ENTRY:.*:]] |
| 38 | +// CHECK-NEXT: [[TMP0:%.*]] = bitcast <8 x half> [[P0]] to <8 x i16> |
| 39 | +// CHECK-NEXT: [[TMP1:%.*]] = bitcast <8 x i16> [[TMP0]] to <16 x i8> |
| 40 | +// CHECK-NEXT: call void @llvm.aarch64.set.fpmr(i64 [[P3]]) |
| 41 | +// CHECK-NEXT: [[FMMLA_I:%.*]] = bitcast <16 x i8> [[TMP1]] to <8 x half> |
| 42 | +// CHECK-NEXT: [[FMMLA1_I:%.*]] = call <8 x half> @llvm.aarch64.neon.fmmla.v8f16(<8 x half> [[FMMLA_I]], <16 x i8> [[P1]], <16 x i8> [[P2]]) |
| 43 | +// CHECK-NEXT: ret <8 x half> [[FMMLA1_I]] |
| 44 | +// |
| 45 | +float16x8_t test_vmmlaq_f16_mf8(float16x8_t p0, mfloat8x16_t p1, mfloat8x16_t p2, fpm_t p3) { |
| 46 | + return vmmlaq_f16_mf8_fpm(p0, p1, p2, p3); |
| 47 | +} |
| 48 | + |
| 49 | +// CHECK-LABEL: define dso_local <4 x float> @test_vmmlaq_f32_mf8( |
| 50 | +// CHECK-SAME: <4 x float> noundef [[P0:%.*]], <16 x i8> [[P1:%.*]], <16 x i8> [[P2:%.*]], i64 noundef [[P3:%.*]]) #[[ATTR0]] { |
| 51 | +// CHECK-NEXT: [[ENTRY:.*:]] |
| 52 | +// CHECK-NEXT: call void @llvm.aarch64.set.fpmr(i64 [[P3]]) |
| 53 | +// CHECK-NEXT: [[FMMLA_I:%.*]] = call <4 x float> @llvm.aarch64.neon.fmmla.v4f32(<4 x float> [[P0]], <16 x i8> [[P1]], <16 x i8> [[P2]]) |
| 54 | +// CHECK-NEXT: ret <4 x float> [[FMMLA_I]] |
| 55 | +// |
| 56 | +float32x4_t test_vmmlaq_f32_mf8(float32x4_t p0, mfloat8x16_t p1, mfloat8x16_t p2, fpm_t p3) { |
| 57 | + return vmmlaq_f32_mf8_fpm(p0, p1, p2, p3); |
| 58 | +} |
| 59 | + |
35 | 60 | // CHECK-LABEL: define dso_local <4 x i32> @test_vusmmlaq_s32( |
36 | 61 | // CHECK-SAME: <4 x i32> noundef [[R:%.*]], <16 x i8> noundef [[A:%.*]], <16 x i8> noundef [[B:%.*]]) #[[ATTR0]] { |
37 | 62 | // CHECK-NEXT: [[ENTRY:.*:]] |
|
0 commit comments