Commit 4a79123
committed
[AArch64] Implement NEON FP8 intrinsics for fused multiply-add (indexed)
This patch adds the following intrinsics:
* Floating-point multiply-add long to half-precision (vector, by element)
float16x8_t vmlalbq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlalbq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
* Floating-point multiply-add long-long to single-precision (vector, by element)
float32x4_t vmlallbbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
[fixup] Update intrinsics definitions
[fixup] Regenerate tests

1 parent e677f83 commit 4a79123
File tree
9 files changed
+445
-24
lines changed
- clang
- include/clang/Basic
- lib/CodeGen
- test
- CodeGen/AArch64/fp8-intrinsics
- Sema/aarch64-fp8-intrinsics
- llvm
- include/llvm/IR
- lib/Target/AArch64
- test/CodeGen/AArch64
9 files changed
+445
-24
lines changed

| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
2169 | 2169 | | |
2170 | 2170 | | |
2171 | 2171 | | |
| 2172 | + | |
| 2173 | + | |
| 2174 | + | |
| 2175 | + | |
| 2176 | + | |
| 2177 | + | |
| 2178 | + | |
| 2179 | + | |
| 2180 | + | |
| 2181 | + | |
| 2182 | + | |
| 2183 | + | |
| 2184 | + | |
| 2185 | + | |
2172 | 2186 | | |
2173 | 2187 | | |
2174 | 2188 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
6770 | 6770 | | |
6771 | 6771 | | |
6772 | 6772 | | |
6773 | | - | |
| 6773 | + | |
6774 | 6774 | | |
6775 | 6775 | | |
6776 | 6776 | | |
6777 | 6777 | | |
6778 | 6778 | | |
6779 | 6779 | | |
6780 | | - | |
| 6780 | + | |
6781 | 6781 | | |
6782 | 6782 | | |
6783 | 6783 | | |
6784 | 6784 | | |
6785 | 6785 | | |
6786 | 6786 | | |
6787 | 6787 | | |
| 6788 | + | |
| 6789 | + | |
| 6790 | + | |
| 6791 | + | |
| 6792 | + | |
| 6793 | + | |
| 6794 | + | |
| 6795 | + | |
| 6796 | + | |
| 6797 | + | |
| 6798 | + | |
| 6799 | + | |
| 6800 | + | |
| 6801 | + | |
| 6802 | + | |
6788 | 6803 | | |
6789 | 6804 | | |
6790 | 6805 | | |
| |||
12778 | 12793 | | |
12779 | 12794 | | |
12780 | 12795 | | |
12781 | | - | |
| 12796 | + | |
12782 | 12797 | | |
12783 | 12798 | | |
12784 | 12799 | | |
| |||
14053 | 14068 | | |
14054 | 14069 | | |
14055 | 14070 | | |
14056 | | - | |
| 14071 | + | |
14057 | 14072 | | |
14058 | 14073 | | |
14059 | 14074 | | |
14060 | 14075 | | |
14061 | | - | |
| 14076 | + | |
14062 | 14077 | | |
14063 | 14078 | | |
14064 | 14079 | | |
14065 | 14080 | | |
14066 | 14081 | | |
14067 | 14082 | | |
14068 | | - | |
| 14083 | + | |
14069 | 14084 | | |
14070 | 14085 | | |
14071 | 14086 | | |
14072 | 14087 | | |
14073 | | - | |
| 14088 | + | |
14074 | 14089 | | |
14075 | 14090 | | |
14076 | 14091 | | |
| |||
14096 | 14111 | | |
14097 | 14112 | | |
14098 | 14113 | | |
14099 | | - | |
| 14114 | + | |
| 14115 | + | |
| 14116 | + | |
| 14117 | + | |
| 14118 | + | |
| 14119 | + | |
| 14120 | + | |
| 14121 | + | |
| 14122 | + | |
| 14123 | + | |
| 14124 | + | |
| 14125 | + | |
| 14126 | + | |
| 14127 | + | |
| 14128 | + | |
| 14129 | + | |
| 14130 | + | |
| 14131 | + | |
| 14132 | + | |
| 14133 | + | |
| 14134 | + | |
| 14135 | + | |
| 14136 | + | |
| 14137 | + | |
| 14138 | + | |
| 14139 | + | |
| 14140 | + | |
| 14141 | + | |
| 14142 | + | |
| 14143 | + | |
| 14144 | + | |
| 14145 | + | |
| 14146 | + | |
| 14147 | + | |
| 14148 | + | |
| 14149 | + | |
14100 | 14150 | | |
14101 | 14151 | | |
14102 | 14152 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
4699 | 4699 | | |
4700 | 4700 | | |
4701 | 4701 | | |
4702 | | - | |
| 4702 | + | |
| 4703 | + | |
| 4704 | + | |
| 4705 | + | |
| 4706 | + | |
4703 | 4707 | | |
4704 | 4708 | | |
4705 | 4709 | | |
| |||
0 commit comments