Commit 1cde192
committed
[AArch64] Implement NEON FP8 intrinsics for fused multiply-add (indexed)
This patch adds the following intrinsics:
* Floating-point multiply-add long to half-precision (vector, by element)
float16x8_t vmlalbq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlalbq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_lane_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float16x8_t vmlaltq_laneq_f16_mf8_fpm(float16x8_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
* Floating-point multiply-add long-long to single-precision (vector, by element)
float32x4_t vmlallbbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallbtq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlalltbq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_lane_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x8_t vm, __builtin_constant_p(lane), fpm_t fpm)
float32x4_t vmlallttq_laneq_f32_mf8_fpm(float32x4_t vd, mfloat8x16_t vn, mfloat8x16_t vm, __builtin_constant_p(lane), fpm_t fpm)
1 parent 660fdce commit 1cde192
File tree
9 files changed
+429
-24
lines changed
- clang
- include/clang/Basic
- lib/CodeGen
- test
- CodeGen/AArch64/fp8-intrinsics
- Sema/aarch64-fp8-intrinsics
- llvm
- include/llvm/IR
- lib/Target/AArch64
- test/CodeGen/AArch64
9 files changed
+429
-24
lines changed

| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
2179 | 2179 | | |
2180 | 2180 | | |
2181 | 2181 | | |
| 2182 | + | |
| 2183 | + | |
| 2184 | + | |
| 2185 | + | |
| 2186 | + | |
| 2187 | + | |
| 2188 | + | |
| 2189 | + | |
| 2190 | + | |
| 2191 | + | |
| 2192 | + | |
| 2193 | + | |
| 2194 | + | |
| 2195 | + | |
2182 | 2196 | | |
2183 | 2197 | | |
2184 | 2198 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
6880 | 6880 | | |
6881 | 6881 | | |
6882 | 6882 | | |
6883 | | - | |
| 6883 | + | |
6884 | 6884 | | |
6885 | 6885 | | |
6886 | 6886 | | |
6887 | 6887 | | |
6888 | 6888 | | |
6889 | 6889 | | |
6890 | | - | |
| 6890 | + | |
6891 | 6891 | | |
6892 | 6892 | | |
6893 | 6893 | | |
6894 | 6894 | | |
6895 | 6895 | | |
6896 | 6896 | | |
6897 | 6897 | | |
| 6898 | + | |
| 6899 | + | |
| 6900 | + | |
| 6901 | + | |
| 6902 | + | |
| 6903 | + | |
| 6904 | + | |
| 6905 | + | |
| 6906 | + | |
| 6907 | + | |
| 6908 | + | |
| 6909 | + | |
| 6910 | + | |
| 6911 | + | |
| 6912 | + | |
6898 | 6913 | | |
6899 | 6914 | | |
6900 | 6915 | | |
| |||
12840 | 12855 | | |
12841 | 12856 | | |
12842 | 12857 | | |
12843 | | - | |
| 12858 | + | |
12844 | 12859 | | |
12845 | 12860 | | |
12846 | 12861 | | |
| |||
14115 | 14130 | | |
14116 | 14131 | | |
14117 | 14132 | | |
14118 | | - | |
| 14133 | + | |
14119 | 14134 | | |
14120 | 14135 | | |
14121 | 14136 | | |
14122 | 14137 | | |
14123 | | - | |
| 14138 | + | |
14124 | 14139 | | |
14125 | 14140 | | |
14126 | 14141 | | |
14127 | 14142 | | |
14128 | 14143 | | |
14129 | 14144 | | |
14130 | | - | |
| 14145 | + | |
14131 | 14146 | | |
14132 | 14147 | | |
14133 | 14148 | | |
14134 | 14149 | | |
14135 | | - | |
| 14150 | + | |
14136 | 14151 | | |
14137 | 14152 | | |
14138 | 14153 | | |
| |||
14158 | 14173 | | |
14159 | 14174 | | |
14160 | 14175 | | |
14161 | | - | |
| 14176 | + | |
| 14177 | + | |
| 14178 | + | |
| 14179 | + | |
| 14180 | + | |
| 14181 | + | |
| 14182 | + | |
| 14183 | + | |
| 14184 | + | |
| 14185 | + | |
| 14186 | + | |
| 14187 | + | |
| 14188 | + | |
| 14189 | + | |
| 14190 | + | |
| 14191 | + | |
| 14192 | + | |
| 14193 | + | |
| 14194 | + | |
| 14195 | + | |
| 14196 | + | |
| 14197 | + | |
| 14198 | + | |
| 14199 | + | |
| 14200 | + | |
| 14201 | + | |
| 14202 | + | |
| 14203 | + | |
| 14204 | + | |
| 14205 | + | |
| 14206 | + | |
| 14207 | + | |
| 14208 | + | |
| 14209 | + | |
| 14210 | + | |
| 14211 | + | |
14162 | 14212 | | |
14163 | 14213 | | |
14164 | 14214 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
4655 | 4655 | | |
4656 | 4656 | | |
4657 | 4657 | | |
4658 | | - | |
| 4658 | + | |
| 4659 | + | |
| 4660 | + | |
| 4661 | + | |
| 4662 | + | |
4659 | 4663 | | |
4660 | 4664 | | |
4661 | 4665 | | |
| |||
0 commit comments