Commit afc66a8
committed
[AArch64] Implement NEON FP8 intrinsics for fused multiply-add (indexed)
This patch adds the following intrinsics:
* Floating-point multiply-add long to half-precision (vector, by element)
float16x8_t vmlalbq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlalbq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
* Floating-point multiply-add long-long to single-precision (vector, by element)
float32x4_t vmlallbbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
[fixup] Update intrinsics definitions
[fixup] Regenerate tests
1 parent 2ceaf4b commit afc66a8
File tree
9 files changed
+445
-24
lines changed
- clang
- include/clang/Basic
- lib/CodeGen
- test
- CodeGen/AArch64/fp8-intrinsics
- Sema/aarch64-fp8-intrinsics
- llvm
- include/llvm/IR
- lib/Target/AArch64
- test/CodeGen/AArch64
9 files changed
+445
-24
lines changed

| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
2175 | 2175 | | |
2176 | 2176 | | |
2177 | 2177 | | |
| 2178 | + | |
| 2179 | + | |
| 2180 | + | |
| 2181 | + | |
| 2182 | + | |
| 2183 | + | |
| 2184 | + | |
| 2185 | + | |
| 2186 | + | |
| 2187 | + | |
| 2188 | + | |
| 2189 | + | |
| 2190 | + | |
| 2191 | + | |
2178 | 2192 | | |
2179 | 2193 | | |
2180 | 2194 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
6910 | 6910 | | |
6911 | 6911 | | |
6912 | 6912 | | |
6913 | | - | |
| 6913 | + | |
6914 | 6914 | | |
6915 | 6915 | | |
6916 | 6916 | | |
6917 | 6917 | | |
6918 | 6918 | | |
6919 | 6919 | | |
6920 | | - | |
| 6920 | + | |
6921 | 6921 | | |
6922 | 6922 | | |
6923 | 6923 | | |
6924 | 6924 | | |
6925 | 6925 | | |
6926 | 6926 | | |
6927 | 6927 | | |
| 6928 | + | |
| 6929 | + | |
| 6930 | + | |
| 6931 | + | |
| 6932 | + | |
| 6933 | + | |
| 6934 | + | |
| 6935 | + | |
| 6936 | + | |
| 6937 | + | |
| 6938 | + | |
| 6939 | + | |
| 6940 | + | |
| 6941 | + | |
| 6942 | + | |
6928 | 6943 | | |
6929 | 6944 | | |
6930 | 6945 | | |
| |||
12883 | 12898 | | |
12884 | 12899 | | |
12885 | 12900 | | |
12886 | | - | |
| 12901 | + | |
12887 | 12902 | | |
12888 | 12903 | | |
12889 | 12904 | | |
| |||
14158 | 14173 | | |
14159 | 14174 | | |
14160 | 14175 | | |
14161 | | - | |
| 14176 | + | |
14162 | 14177 | | |
14163 | 14178 | | |
14164 | 14179 | | |
14165 | 14180 | | |
14166 | | - | |
| 14181 | + | |
14167 | 14182 | | |
14168 | 14183 | | |
14169 | 14184 | | |
14170 | 14185 | | |
14171 | 14186 | | |
14172 | 14187 | | |
14173 | | - | |
| 14188 | + | |
14174 | 14189 | | |
14175 | 14190 | | |
14176 | 14191 | | |
14177 | 14192 | | |
14178 | | - | |
| 14193 | + | |
14179 | 14194 | | |
14180 | 14195 | | |
14181 | 14196 | | |
| |||
14201 | 14216 | | |
14202 | 14217 | | |
14203 | 14218 | | |
14204 | | - | |
| 14219 | + | |
| 14220 | + | |
| 14221 | + | |
| 14222 | + | |
| 14223 | + | |
| 14224 | + | |
| 14225 | + | |
| 14226 | + | |
| 14227 | + | |
| 14228 | + | |
| 14229 | + | |
| 14230 | + | |
| 14231 | + | |
| 14232 | + | |
| 14233 | + | |
| 14234 | + | |
| 14235 | + | |
| 14236 | + | |
| 14237 | + | |
| 14238 | + | |
| 14239 | + | |
| 14240 | + | |
| 14241 | + | |
| 14242 | + | |
| 14243 | + | |
| 14244 | + | |
| 14245 | + | |
| 14246 | + | |
| 14247 | + | |
| 14248 | + | |
| 14249 | + | |
| 14250 | + | |
| 14251 | + | |
| 14252 | + | |
| 14253 | + | |
| 14254 | + | |
14205 | 14255 | | |
14206 | 14256 | | |
14207 | 14257 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
4698 | 4698 | | |
4699 | 4699 | | |
4700 | 4700 | | |
4701 | | - | |
| 4701 | + | |
| 4702 | + | |
| 4703 | + | |
| 4704 | + | |
| 4705 | + | |
4702 | 4706 | | |
4703 | 4707 | | |
4704 | 4708 | | |
| |||
0 commit comments