Commit 880e69b
committed
[AArch64] Implement NEON FP8 intrinsics for fused multiply-add (indexed)
This patch adds the following intrinsics:
* Floating-point multiply-add long to half-precision (vector, by element)
float16x8_t vmlalbq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlalbq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
* Floating-point multiply-add long-long to single-precision (vector, by element)
float32x4_t vmlallbbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
1 parent 2b939e3 commit 880e69b
File tree
9 files changed
+429
-24
lines changed
- clang
- include/clang/Basic
- lib/CodeGen
- test
- CodeGen/AArch64/fp8-intrinsics
- Sema/aarch64-fp8-intrinsics
- llvm
- include/llvm/IR
- lib/Target/AArch64
- test/CodeGen/AArch64
9 files changed
+429
-24
lines changed

| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
2175 | 2175 | | |
2176 | 2176 | | |
2177 | 2177 | | |
| 2178 | + | |
| 2179 | + | |
| 2180 | + | |
| 2181 | + | |
| 2182 | + | |
| 2183 | + | |
| 2184 | + | |
| 2185 | + | |
| 2186 | + | |
| 2187 | + | |
| 2188 | + | |
| 2189 | + | |
| 2190 | + | |
| 2191 | + | |
2178 | 2192 | | |
2179 | 2193 | | |
2180 | 2194 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
6909 | 6909 | | |
6910 | 6910 | | |
6911 | 6911 | | |
6912 | | - | |
| 6912 | + | |
6913 | 6913 | | |
6914 | 6914 | | |
6915 | 6915 | | |
6916 | 6916 | | |
6917 | 6917 | | |
6918 | 6918 | | |
6919 | | - | |
| 6919 | + | |
6920 | 6920 | | |
6921 | 6921 | | |
6922 | 6922 | | |
6923 | 6923 | | |
6924 | 6924 | | |
6925 | 6925 | | |
6926 | 6926 | | |
| 6927 | + | |
| 6928 | + | |
| 6929 | + | |
| 6930 | + | |
| 6931 | + | |
| 6932 | + | |
| 6933 | + | |
| 6934 | + | |
| 6935 | + | |
| 6936 | + | |
| 6937 | + | |
| 6938 | + | |
| 6939 | + | |
| 6940 | + | |
| 6941 | + | |
6927 | 6942 | | |
6928 | 6943 | | |
6929 | 6944 | | |
| |||
12882 | 12897 | | |
12883 | 12898 | | |
12884 | 12899 | | |
12885 | | - | |
| 12900 | + | |
12886 | 12901 | | |
12887 | 12902 | | |
12888 | 12903 | | |
| |||
14157 | 14172 | | |
14158 | 14173 | | |
14159 | 14174 | | |
14160 | | - | |
| 14175 | + | |
14161 | 14176 | | |
14162 | 14177 | | |
14163 | 14178 | | |
14164 | 14179 | | |
14165 | | - | |
| 14180 | + | |
14166 | 14181 | | |
14167 | 14182 | | |
14168 | 14183 | | |
14169 | 14184 | | |
14170 | 14185 | | |
14171 | 14186 | | |
14172 | | - | |
| 14187 | + | |
14173 | 14188 | | |
14174 | 14189 | | |
14175 | 14190 | | |
14176 | 14191 | | |
14177 | | - | |
| 14192 | + | |
14178 | 14193 | | |
14179 | 14194 | | |
14180 | 14195 | | |
| |||
14200 | 14215 | | |
14201 | 14216 | | |
14202 | 14217 | | |
14203 | | - | |
| 14218 | + | |
| 14219 | + | |
| 14220 | + | |
| 14221 | + | |
| 14222 | + | |
| 14223 | + | |
| 14224 | + | |
| 14225 | + | |
| 14226 | + | |
| 14227 | + | |
| 14228 | + | |
| 14229 | + | |
| 14230 | + | |
| 14231 | + | |
| 14232 | + | |
| 14233 | + | |
| 14234 | + | |
| 14235 | + | |
| 14236 | + | |
| 14237 | + | |
| 14238 | + | |
| 14239 | + | |
| 14240 | + | |
| 14241 | + | |
| 14242 | + | |
| 14243 | + | |
| 14244 | + | |
| 14245 | + | |
| 14246 | + | |
| 14247 | + | |
| 14248 | + | |
| 14249 | + | |
| 14250 | + | |
| 14251 | + | |
| 14252 | + | |
| 14253 | + | |
14204 | 14254 | | |
14205 | 14255 | | |
14206 | 14256 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
4689 | 4689 | | |
4690 | 4690 | | |
4691 | 4691 | | |
4692 | | - | |
| 4692 | + | |
| 4693 | + | |
| 4694 | + | |
| 4695 | + | |
| 4696 | + | |
4693 | 4697 | | |
4694 | 4698 | | |
4695 | 4699 | | |
| |||
0 commit comments