@@ -139,6 +139,9 @@ TARGET_BUILTIN(__builtin_ia32_tcvtrowps2pbf16l_internal, "V32yUsUsV256iUi", "n",
139 139 TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phh_internal, "V32xUsUsV256iUi", "n", "amx-avx512,avx10.2-512")
140 140 TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phl_internal, "V32xUsUsV256iUi", "n", "amx-avx512,avx10.2-512")
141 141 TARGET_BUILTIN(__builtin_ia32_tilemovrow_internal, "V16iUsUsV256iUi", "n", "amx-avx512,avx10.2-512")
142+ TARGET_BUILTIN(__builtin_ia32_tmmultf32ps_internal, "V256iUsUsUsV256iV256iV256i", "n", "amx-tf32")
143+ TARGET_BUILTIN(__builtin_ia32_ttmmultf32ps_internal, "V256iUsUsUsV256iV256iV256i", "n", "amx-tf32,amx-transpose")
144+
142 145 // AMX
143 146 TARGET_BUILTIN(__builtin_ia32_tile_loadconfig, "vvC*", "n", "amx-tile")
144 147 TARGET_BUILTIN(__builtin_ia32_tile_storeconfig, "vvC*", "n", "amx-tile")
@@ -172,10 +175,6 @@ TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phh, "V32xIUcUi", "n", "amx-avx512,avx10
172 175 TARGET_BUILTIN(__builtin_ia32_tcvtrowps2phl, "V32xIUcUi", "n", "amx-avx512,avx10.2-512")
173 176 TARGET_BUILTIN(__builtin_ia32_tilemovrow, "V16iIUcUi", "n", "amx-avx512,avx10.2-512")
174 177
175- TARGET_BUILTIN(__builtin_ia32_prefetchi, "vvC*Ui", "nc", "prefetchi")
176- TARGET_BUILTIN(__builtin_ia32_cmpccxadd32, "Siv*SiSiIi", "n", "cmpccxadd")
177- TARGET_BUILTIN(__builtin_ia32_cmpccxadd64, "SLLiSLLi*SLLiSLLiIi", "n", "cmpccxadd")
178-
179 178 // AMX_FP16 FP16
180 179 TARGET_BUILTIN(__builtin_ia32_tdpfp16ps, "vIUcIUcIUc", "n", "amx-fp16")
181 180
@@ -185,6 +184,14 @@ TARGET_BUILTIN(__builtin_ia32_tdpbhf8ps, "vIUcUIcUIc", "n", "amx-fp8")
185 184 TARGET_BUILTIN(__builtin_ia32_tdphbf8ps, "vIUcUIcUIc", "n", "amx-fp8")
186 185 TARGET_BUILTIN(__builtin_ia32_tdphf8ps, "vIUcUIcUIc", "n", "amx-fp8")
187 186
187+ // AMX TF32
188+ TARGET_BUILTIN(__builtin_ia32_tmmultf32ps, "vIUcIUcIUc", "n", "amx-tf32")
189+ TARGET_BUILTIN(__builtin_ia32_ttmmultf32ps, "vIUcIUcIUc", "n", "amx-tf32,amx-transpose")
190+
191+ TARGET_BUILTIN(__builtin_ia32_prefetchi, "vvC*Ui", "nc", "prefetchi")
192+ TARGET_BUILTIN(__builtin_ia32_cmpccxadd32, "Siv*SiSiIi", "n", "cmpccxadd")
193+ TARGET_BUILTIN(__builtin_ia32_cmpccxadd64, "SLLiSLLi*SLLiSLLiIi", "n", "cmpccxadd")
194+
188 195 // RAO-INT
189 196 TARGET_BUILTIN(__builtin_ia32_aadd64, "vv*SOi", "n", "raoint")
190 197 TARGET_BUILTIN(__builtin_ia32_aand64, "vv*SOi", "n", "raoint")
0 commit comments