@@ -2573,7 +2573,7 @@ define void @vec384_i8_widen_to_i24_factor3_broadcast_to_v16i24_factor16(ptr %in
25732573; AVX512F-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
25742574; AVX512F-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,15,3,4,15,6,7,15,9,10,15,12,13,15]
25752575; AVX512F-NEXT: vpbroadcastb %xmm0, %ymm0
2576- ; AVX512F-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
2576+ ; AVX512F-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
25772577; AVX512F-NEXT: vpaddb (%rdx), %ymm1, %ymm1
25782578; AVX512F-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
25792579; AVX512F-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -2590,7 +2590,7 @@ define void @vec384_i8_widen_to_i24_factor3_broadcast_to_v16i24_factor16(ptr %in
25902590; AVX512DQ-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
25912591; AVX512DQ-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,15,3,4,15,6,7,15,9,10,15,12,13,15]
25922592; AVX512DQ-NEXT: vpbroadcastb %xmm0, %ymm0
2593- ; AVX512DQ-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
2593+ ; AVX512DQ-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
25942594; AVX512DQ-NEXT: vpaddb (%rdx), %ymm1, %ymm1
25952595; AVX512DQ-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
25962596; AVX512DQ-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -2835,7 +2835,7 @@ define void @vec384_i8_widen_to_i48_factor6_broadcast_to_v8i48_factor8(ptr %in.v
28352835; AVX512F-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
28362836; AVX512F-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,2,3,4,15,6,7,8,9,10,15,12,13,14]
28372837; AVX512F-NEXT: vpbroadcastb %xmm0, %ymm0
2838- ; AVX512F-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
2838+ ; AVX512F-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
28392839; AVX512F-NEXT: vpaddb (%rdx), %ymm1, %ymm1
28402840; AVX512F-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
28412841; AVX512F-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -2852,7 +2852,7 @@ define void @vec384_i8_widen_to_i48_factor6_broadcast_to_v8i48_factor8(ptr %in.v
28522852; AVX512DQ-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
28532853; AVX512DQ-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,2,3,4,15,6,7,8,9,10,15,12,13,14]
28542854; AVX512DQ-NEXT: vpbroadcastb %xmm0, %ymm0
2855- ; AVX512DQ-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
2855+ ; AVX512DQ-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
28562856; AVX512DQ-NEXT: vpaddb (%rdx), %ymm1, %ymm1
28572857; AVX512DQ-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
28582858; AVX512DQ-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -2868,7 +2868,7 @@ define void @vec384_i8_widen_to_i48_factor6_broadcast_to_v8i48_factor8(ptr %in.v
28682868; AVX512BW-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
28692869; AVX512BW-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,2,3,4,15,6,7,8,9,10,15,12,13,14]
28702870; AVX512BW-NEXT: vpbroadcastb %xmm0, %ymm0
2871- ; AVX512BW-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
2871+ ; AVX512BW-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
28722872; AVX512BW-NEXT: vinserti64x4 $1, %ymm0, %zmm1, %zmm0
28732873; AVX512BW-NEXT: vpaddb (%rdx), %zmm0, %zmm0
28742874; AVX512BW-NEXT: vmovdqa64 %zmm0, (%rcx)
@@ -3096,7 +3096,7 @@ define void @vec384_i8_widen_to_i96_factor12_broadcast_to_v4i96_factor4(ptr %in.
30963096; AVX512F-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
30973097; AVX512F-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,2,3,4,5,6,7,8,9,10,15,12,13,14]
30983098; AVX512F-NEXT: vpbroadcastb %xmm0, %ymm0
3099- ; AVX512F-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3099+ ; AVX512F-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
31003100; AVX512F-NEXT: vpaddb (%rdx), %ymm1, %ymm1
31013101; AVX512F-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
31023102; AVX512F-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -3113,7 +3113,7 @@ define void @vec384_i8_widen_to_i96_factor12_broadcast_to_v4i96_factor4(ptr %in.
31133113; AVX512DQ-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
31143114; AVX512DQ-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,2,3,4,5,6,7,8,9,10,15,12,13,14]
31153115; AVX512DQ-NEXT: vpbroadcastb %xmm0, %ymm0
3116- ; AVX512DQ-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3116+ ; AVX512DQ-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
31173117; AVX512DQ-NEXT: vpaddb (%rdx), %ymm1, %ymm1
31183118; AVX512DQ-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
31193119; AVX512DQ-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -3129,7 +3129,7 @@ define void @vec384_i8_widen_to_i96_factor12_broadcast_to_v4i96_factor4(ptr %in.
31293129; AVX512BW-NEXT: vpalignr {{.*#+}} xmm1 = xmm1[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15],xmm0[0]
31303130; AVX512BW-NEXT: vpshufb {{.*#+}} xmm1 = xmm1[15,0,1,2,3,4,5,6,7,8,9,10,15,12,13,14]
31313131; AVX512BW-NEXT: vpbroadcastb %xmm0, %ymm0
3132- ; AVX512BW-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3132+ ; AVX512BW-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
31333133; AVX512BW-NEXT: vinserti64x4 $1, %ymm0, %zmm1, %zmm0
31343134; AVX512BW-NEXT: vpaddb (%rdx), %zmm0, %zmm0
31353135; AVX512BW-NEXT: vmovdqa64 %zmm0, (%rcx)
@@ -3612,7 +3612,7 @@ define void @vec384_i16_widen_to_i48_factor3_broadcast_to_v8i48_factor8(ptr %in.
36123612; AVX512F-NEXT: vpaddb (%rsi), %xmm0, %xmm0
36133613; AVX512F-NEXT: vpbroadcastw %xmm0, %ymm0
36143614; AVX512F-NEXT: vpblendw {{.*#+}} xmm1 = xmm0[0],xmm1[1,2],xmm0[3],xmm1[4,5],xmm0[6],xmm1[7]
3615- ; AVX512F-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3615+ ; AVX512F-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
36163616; AVX512F-NEXT: vpaddb (%rdx), %ymm1, %ymm1
36173617; AVX512F-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
36183618; AVX512F-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -3628,7 +3628,7 @@ define void @vec384_i16_widen_to_i48_factor3_broadcast_to_v8i48_factor8(ptr %in.
36283628; AVX512DQ-NEXT: vpaddb (%rsi), %xmm0, %xmm0
36293629; AVX512DQ-NEXT: vpbroadcastw %xmm0, %ymm0
36303630; AVX512DQ-NEXT: vpblendw {{.*#+}} xmm1 = xmm0[0],xmm1[1,2],xmm0[3],xmm1[4,5],xmm0[6],xmm1[7]
3631- ; AVX512DQ-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3631+ ; AVX512DQ-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
36323632; AVX512DQ-NEXT: vpaddb (%rdx), %ymm1, %ymm1
36333633; AVX512DQ-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
36343634; AVX512DQ-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -3864,7 +3864,7 @@ define void @vec384_i16_widen_to_i96_factor6_broadcast_to_v4i96_factor4(ptr %in.
38643864; AVX512F-NEXT: vpaddb (%rsi), %xmm0, %xmm0
38653865; AVX512F-NEXT: vpbroadcastw %xmm0, %ymm0
38663866; AVX512F-NEXT: vpblendw {{.*#+}} xmm1 = xmm0[0],xmm1[1,2,3,4,5],xmm0[6],xmm1[7]
3867- ; AVX512F-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3867+ ; AVX512F-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
38683868; AVX512F-NEXT: vpaddb (%rdx), %ymm1, %ymm1
38693869; AVX512F-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
38703870; AVX512F-NEXT: vmovdqa %ymm0, 32(%rcx)
@@ -3880,7 +3880,7 @@ define void @vec384_i16_widen_to_i96_factor6_broadcast_to_v4i96_factor4(ptr %in.
38803880; AVX512DQ-NEXT: vpaddb (%rsi), %xmm0, %xmm0
38813881; AVX512DQ-NEXT: vpbroadcastw %xmm0, %ymm0
38823882; AVX512DQ-NEXT: vpblendw {{.*#+}} xmm1 = xmm0[0],xmm1[1,2,3,4,5],xmm0[6],xmm1[7]
3883- ; AVX512DQ-NEXT: vinserti128 $1, %xmm0, % ymm1, % ymm1
3883+ ; AVX512DQ-NEXT: vpblendd {{.*#+}} ymm1 = ymm1[0,1,2,3],ymm0[4,5,6,7]
38843884; AVX512DQ-NEXT: vpaddb (%rdx), %ymm1, %ymm1
38853885; AVX512DQ-NEXT: vpaddb 32(%rdx), %ymm0, %ymm0
38863886; AVX512DQ-NEXT: vmovdqa %ymm0, 32(%rcx)
0 commit comments