@@ -146,6 +146,9 @@ TARGET_BUILTIN(__builtin_ia32_tcvtrowps2pbf16l_internal, "V32yUsUsV256iUi", "n",
146146TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phh_internal, " V32xUsUsV256iUi" , " n" , " amx-avx512,avx10.2-512" )
147147TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phl_internal, " V32xUsUsV256iUi" , " n" , " amx-avx512,avx10.2-512" )
148148TARGET_BUILTIN(__builtin_ia32_tilemovrow_internal, " V16iUsUsV256iUi" , " n" , " amx-avx512,avx10.2-512" )
149+ TARGET_BUILTIN(__builtin_ia32_tmmultf32ps_internal, " V256iUsUsUsV256iV256iV256i" , " n" , " amx-tf32" )
150+ TARGET_BUILTIN(__builtin_ia32_ttmmultf32ps_internal, " V256iUsUsUsV256iV256iV256i" , " n" , " amx-tf32,amx-transpose" )
151+
149152// AMX
150153TARGET_BUILTIN(__builtin_ia32_tile_loadconfig, " vvC*" , " n" , " amx-tile" )
151154TARGET_BUILTIN(__builtin_ia32_tile_storeconfig, " vvC*" , " n" , " amx-tile" )
@@ -186,10 +189,6 @@ TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phh, "V32xIUcUi", "n", "amx-avx512,avx10
186189TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phl, " V32xIUcUi" , " n" , " amx-avx512,avx10.2-512" )
187190TARGET_BUILTIN(__builtin_ia32_tilemovrow, " V16iIUcUi" , " n" , " amx-avx512,avx10.2-512" )
188191
189- TARGET_BUILTIN(__builtin_ia32_prefetchi, " vvC*Ui" , " nc" , " prefetchi" )
190- TARGET_BUILTIN(__builtin_ia32_cmpccxadd32, " Siv*SiSiIi" , " n" , " cmpccxadd" )
191- TARGET_BUILTIN(__builtin_ia32_cmpccxadd64, " SLLiSLLi*SLLiSLLiIi" , " n" , " cmpccxadd" )
192-
193192// AMX_FP16 FP16
194193TARGET_BUILTIN(__builtin_ia32_tdpfp16ps, " vIUcIUcIUc" , " n" , " amx-fp16" )
195194
@@ -199,6 +198,14 @@ TARGET_BUILTIN(__builtin_ia32_tdpbhf8ps, "vIUcUIcUIc", "n", "amx-fp8")
199198TARGET_BUILTIN(__builtin_ia32_tdphbf8ps, " vIUcUIcUIc" , " n" , " amx-fp8" )
200199TARGET_BUILTIN(__builtin_ia32_tdphf8ps, " vIUcUIcUIc" , " n" , " amx-fp8" )
201200
201+ // AMX TF32
202+ TARGET_BUILTIN(__builtin_ia32_tmmultf32ps, " vIUcIUcIUc" , " n" , " amx-tf32" )
203+ TARGET_BUILTIN(__builtin_ia32_ttmmultf32ps, " vIUcIUcIUc" , " n" , " amx-tf32,amx-transpose" )
204+
205+ TARGET_BUILTIN(__builtin_ia32_prefetchi, " vvC*Ui" , " nc" , " prefetchi" )
206+ TARGET_BUILTIN(__builtin_ia32_cmpccxadd32, " Siv*SiSiIi" , " n" , " cmpccxadd" )
207+ TARGET_BUILTIN(__builtin_ia32_cmpccxadd64, " SLLiSLLi*SLLiSLLiIi" , " n" , " cmpccxadd" )
208+
202209// RAO-INT
203210TARGET_BUILTIN(__builtin_ia32_aadd64, " vv*SOi" , " n" , " raoint" )
204211TARGET_BUILTIN(__builtin_ia32_aand64, " vv*SOi" , " n" , " raoint" )
0 commit comments