Skip to content
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
48 changes: 24 additions & 24 deletions bench/boost/optimized/dump_ssse3.ll
Original file line number Diff line number Diff line change
Expand Up @@ -1263,9 +1263,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux32dump_data_char_ssse3_slow_ps
%30 = or disjoint <16 x i8> %27, splat (i8 48)
%31 = bitcast <2 x i64> %.084.i to <16 x i8>
%32 = select <16 x i1> %26, <16 x i8> %31, <16 x i8> zeroinitializer
%33 = add <16 x i8> %32, %29
%33 = add nuw nsw <16 x i8> %32, %29
%34 = select <16 x i1> %28, <16 x i8> %31, <16 x i8> zeroinitializer
%35 = add <16 x i8> %34, %30
%35 = add nuw nsw <16 x i8> %34, %30
%36 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%37 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%38 = shufflevector <16 x i8> %36, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1345,9 +1345,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux32dump_data_char_ssse3_slow_ps
%74 = or disjoint <16 x i8> %69, splat (i8 48)
%75 = or disjoint <16 x i8> %72, splat (i8 48)
%76 = select <16 x i1> %70, <16 x i8> %55, <16 x i8> zeroinitializer
%77 = add <16 x i8> %76, %74
%77 = add nuw nsw <16 x i8> %76, %74
%78 = select <16 x i1> %73, <16 x i8> %55, <16 x i8> zeroinitializer
%79 = add <16 x i8> %78, %75
%79 = add nuw nsw <16 x i8> %78, %75
%80 = shufflevector <16 x i8> %77, <16 x i8> %79, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%81 = shufflevector <16 x i8> %77, <16 x i8> %79, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%82 = shufflevector <16 x i8> %80, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1384,9 +1384,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux32dump_data_char_ssse3_slow_ps
%104 = or disjoint <16 x i8> %99, splat (i8 48)
%105 = or disjoint <16 x i8> %102, splat (i8 48)
%106 = select <16 x i1> %100, <16 x i8> %58, <16 x i8> zeroinitializer
%107 = add <16 x i8> %106, %104
%107 = add nuw nsw <16 x i8> %106, %104
%108 = select <16 x i1> %103, <16 x i8> %58, <16 x i8> zeroinitializer
%109 = add <16 x i8> %108, %105
%109 = add nuw nsw <16 x i8> %108, %105
%110 = shufflevector <16 x i8> %107, <16 x i8> %109, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%111 = shufflevector <16 x i8> %107, <16 x i8> %109, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%112 = shufflevector <16 x i8> %110, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1509,9 +1509,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux33dump_data_wchar_ssse3_slow_p
%30 = or disjoint <16 x i8> %27, splat (i8 48)
%31 = bitcast <2 x i64> %.084.i to <16 x i8>
%32 = select <16 x i1> %26, <16 x i8> %31, <16 x i8> zeroinitializer
%33 = add <16 x i8> %32, %29
%33 = add nuw nsw <16 x i8> %32, %29
%34 = select <16 x i1> %28, <16 x i8> %31, <16 x i8> zeroinitializer
%35 = add <16 x i8> %34, %30
%35 = add nuw nsw <16 x i8> %34, %30
%36 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%37 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%38 = shufflevector <16 x i8> %36, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1634,9 +1634,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux33dump_data_wchar_ssse3_slow_p
%108 = or disjoint <16 x i8> %103, splat (i8 48)
%109 = or disjoint <16 x i8> %106, splat (i8 48)
%110 = select <16 x i1> %104, <16 x i8> %88, <16 x i8> zeroinitializer
%111 = add <16 x i8> %110, %108
%111 = add nuw nsw <16 x i8> %110, %108
%112 = select <16 x i1> %107, <16 x i8> %88, <16 x i8> zeroinitializer
%113 = add <16 x i8> %112, %109
%113 = add nuw nsw <16 x i8> %112, %109
%114 = shufflevector <16 x i8> %111, <16 x i8> %113, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%115 = shufflevector <16 x i8> %111, <16 x i8> %113, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%116 = shufflevector <16 x i8> %114, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1715,9 +1715,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux33dump_data_wchar_ssse3_slow_p
%171 = or disjoint <16 x i8> %166, splat (i8 48)
%172 = or disjoint <16 x i8> %169, splat (i8 48)
%173 = select <16 x i1> %167, <16 x i8> %91, <16 x i8> zeroinitializer
%174 = add <16 x i8> %173, %171
%174 = add nuw nsw <16 x i8> %173, %171
%175 = select <16 x i1> %170, <16 x i8> %91, <16 x i8> zeroinitializer
%176 = add <16 x i8> %175, %172
%176 = add nuw nsw <16 x i8> %175, %172
%177 = shufflevector <16 x i8> %174, <16 x i8> %176, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%178 = shufflevector <16 x i8> %174, <16 x i8> %176, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%179 = shufflevector <16 x i8> %177, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1885,9 +1885,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux34dump_data_char16_ssse3_slow_
%30 = or disjoint <16 x i8> %27, splat (i8 48)
%31 = bitcast <2 x i64> %.084.i to <16 x i8>
%32 = select <16 x i1> %26, <16 x i8> %31, <16 x i8> zeroinitializer
%33 = add <16 x i8> %32, %29
%33 = add nuw nsw <16 x i8> %32, %29
%34 = select <16 x i1> %28, <16 x i8> %31, <16 x i8> zeroinitializer
%35 = add <16 x i8> %34, %30
%35 = add nuw nsw <16 x i8> %34, %30
%36 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%37 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%38 = shufflevector <16 x i8> %36, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -1980,9 +1980,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux34dump_data_char16_ssse3_slow_
%84 = or disjoint <16 x i8> %79, splat (i8 48)
%85 = or disjoint <16 x i8> %82, splat (i8 48)
%86 = select <16 x i1> %80, <16 x i8> %64, <16 x i8> zeroinitializer
%87 = add <16 x i8> %86, %84
%87 = add nuw nsw <16 x i8> %86, %84
%88 = select <16 x i1> %83, <16 x i8> %64, <16 x i8> zeroinitializer
%89 = add <16 x i8> %88, %85
%89 = add nuw nsw <16 x i8> %88, %85
%90 = shufflevector <16 x i8> %87, <16 x i8> %89, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%91 = shufflevector <16 x i8> %87, <16 x i8> %89, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%92 = shufflevector <16 x i8> %90, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -2031,9 +2031,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux34dump_data_char16_ssse3_slow_
%123 = or disjoint <16 x i8> %118, splat (i8 48)
%124 = or disjoint <16 x i8> %121, splat (i8 48)
%125 = select <16 x i1> %119, <16 x i8> %67, <16 x i8> zeroinitializer
%126 = add <16 x i8> %125, %123
%126 = add nuw nsw <16 x i8> %125, %123
%127 = select <16 x i1> %122, <16 x i8> %67, <16 x i8> zeroinitializer
%128 = add <16 x i8> %127, %124
%128 = add nuw nsw <16 x i8> %127, %124
%129 = shufflevector <16 x i8> %126, <16 x i8> %128, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%130 = shufflevector <16 x i8> %126, <16 x i8> %128, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%131 = shufflevector <16 x i8> %129, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -2171,9 +2171,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux34dump_data_char32_ssse3_slow_
%30 = or disjoint <16 x i8> %27, splat (i8 48)
%31 = bitcast <2 x i64> %.084.i to <16 x i8>
%32 = select <16 x i1> %26, <16 x i8> %31, <16 x i8> zeroinitializer
%33 = add <16 x i8> %32, %29
%33 = add nuw nsw <16 x i8> %32, %29
%34 = select <16 x i1> %28, <16 x i8> %31, <16 x i8> zeroinitializer
%35 = add <16 x i8> %34, %30
%35 = add nuw nsw <16 x i8> %34, %30
%36 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%37 = shufflevector <16 x i8> %33, <16 x i8> %35, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%38 = shufflevector <16 x i8> %36, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -2296,9 +2296,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux34dump_data_char32_ssse3_slow_
%108 = or disjoint <16 x i8> %103, splat (i8 48)
%109 = or disjoint <16 x i8> %106, splat (i8 48)
%110 = select <16 x i1> %104, <16 x i8> %88, <16 x i8> zeroinitializer
%111 = add <16 x i8> %110, %108
%111 = add nuw nsw <16 x i8> %110, %108
%112 = select <16 x i1> %107, <16 x i8> %88, <16 x i8> zeroinitializer
%113 = add <16 x i8> %112, %109
%113 = add nuw nsw <16 x i8> %112, %109
%114 = shufflevector <16 x i8> %111, <16 x i8> %113, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%115 = shufflevector <16 x i8> %111, <16 x i8> %113, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%116 = shufflevector <16 x i8> %114, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down Expand Up @@ -2377,9 +2377,9 @@ define hidden void @_ZN5boost3log11v2_mt_posix3aux34dump_data_char32_ssse3_slow_
%171 = or disjoint <16 x i8> %166, splat (i8 48)
%172 = or disjoint <16 x i8> %169, splat (i8 48)
%173 = select <16 x i1> %167, <16 x i8> %91, <16 x i8> zeroinitializer
%174 = add <16 x i8> %173, %171
%174 = add nuw nsw <16 x i8> %173, %171
%175 = select <16 x i1> %170, <16 x i8> %91, <16 x i8> zeroinitializer
%176 = add <16 x i8> %175, %172
%176 = add nuw nsw <16 x i8> %175, %172
%177 = shufflevector <16 x i8> %174, <16 x i8> %176, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23>
%178 = shufflevector <16 x i8> %174, <16 x i8> %176, <16 x i32> <i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
%179 = shufflevector <16 x i8> %177, <16 x i8> <i8 0, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison, i8 poison>, <16 x i32> <i32 16, i32 0, i32 1, i32 16, i32 2, i32 3, i32 16, i32 4, i32 5, i32 16, i32 6, i32 7, i32 16, i32 8, i32 9, i32 16>
Expand Down
12 changes: 6 additions & 6 deletions bench/libquic/optimized/poly1305_vec.ll
Original file line number Diff line number Diff line change
Expand Up @@ -1228,7 +1228,7 @@ poly1305_combine.exit: ; preds = %12, %24
%309 = add <2 x i64> %299, %308
%310 = bitcast <2 x i64> %301 to <4 x i32>
%311 = extractelement <4 x i32> %310, i64 0
%312 = sext i32 %311 to i64
%312 = zext nneg i32 %311 to i64
%313 = lshr i64 %312, 26
%314 = and i64 %312, 67108863
%315 = bitcast <2 x i64> %303 to <4 x i32>
Expand All @@ -1239,13 +1239,13 @@ poly1305_combine.exit: ; preds = %12, %24
%320 = and i64 %318, 67108863
%321 = bitcast <2 x i64> %305 to <4 x i32>
%322 = extractelement <4 x i32> %321, i64 0
%323 = sext i32 %322 to i64
%324 = add nsw i64 %319, %323
%323 = zext nneg i32 %322 to i64
%324 = add nuw nsw i64 %319, %323
%325 = lshr i64 %324, 26
%326 = bitcast <2 x i64> %307 to <4 x i32>
%327 = extractelement <4 x i32> %326, i64 0
%328 = sext i32 %327 to i64
%329 = add nsw i64 %325, %328
%328 = zext nneg i32 %327 to i64
%329 = add nuw nsw i64 %325, %328
%330 = lshr i64 %329, 26
%331 = and i64 %329, 67108863
%332 = bitcast <2 x i64> %309 to <4 x i32>
Expand All @@ -1263,7 +1263,7 @@ poly1305_combine.exit: ; preds = %12, %24
%343 = or disjoint i64 %.masked.i, %340
store i64 %343, ptr %.phi.trans.insert, align 32, !tbaa !10
%344 = lshr i64 %341, 18
%345 = shl nsw i64 %324, 8
%345 = shl nuw nsw i64 %324, 8
%346 = and i64 %345, 17179868928
%347 = shl nuw nsw i64 %331, 34
%.masked366.i = and i64 %347, 17575006175232
Expand Down
8 changes: 4 additions & 4 deletions bench/libwebp/optimized/lossless_enc_sse2.ll
Original file line number Diff line number Diff line change
Expand Up @@ -140,7 +140,7 @@ define internal void @TransformColor_SSE2(ptr noalias noundef %0, ptr noalias no
%38 = shl <8 x i16> %34, splat (i16 8)
%39 = tail call <8 x i16> @llvm.x86.sse2.pmulh.w(<8 x i16> %38, <8 x i16> %29)
%40 = bitcast <8 x i16> %39 to <4 x i32>
%41 = lshr <4 x i32> %40, splat (i32 16)
%41 = lshr exact <4 x i32> %40, splat (i32 16)
%42 = bitcast <4 x i32> %41 to <16 x i8>
%43 = bitcast <8 x i16> %37 to <16 x i8>
%44 = add <16 x i8> %42, %43
Expand Down Expand Up @@ -233,9 +233,9 @@ define internal void @CollectColorBlueTransforms_SSE2(ptr noalias noundef %0, i3
%44 = bitcast <2 x i64> %31 to <16 x i8>
%45 = bitcast <8 x i16> %41 to <16 x i8>
%46 = bitcast <8 x i16> %36 to <4 x i32>
%47 = lshr <4 x i32> %46, splat (i32 16)
%47 = lshr exact <4 x i32> %46, splat (i32 16)
%48 = bitcast <8 x i16> %37 to <4 x i32>
%49 = lshr <4 x i32> %48, splat (i32 16)
%49 = lshr exact <4 x i32> %48, splat (i32 16)
%50 = bitcast <4 x i32> %47 to <16 x i8>
%51 = add <16 x i8> %50, %43
%52 = sub <16 x i8> %42, %51
Expand Down Expand Up @@ -968,7 +968,7 @@ define internal void @BundleColorMap_SSE2(ptr noalias noundef %0, i32 noundef %1
%37 = lshr <4 x i32> %36, splat (i32 12)
%38 = bitcast <4 x i32> %37 to <2 x i64>
%39 = or <2 x i64> %35, splat (i64 -72057589759737856)
%40 = or <2 x i64> %39, %38
%40 = or disjoint <2 x i64> %39, %38
store <2 x i64> %40, ptr %.3103, align 1, !tbaa !7
%41 = getelementptr inbounds nuw i8, ptr %.3103, i64 16
%indvars.iv.next = add nuw nsw i64 %indvars.iv, 16
Expand Down
2 changes: 1 addition & 1 deletion bench/libwebp/optimized/lossless_sse2.ll
Original file line number Diff line number Diff line change
Expand Up @@ -1332,7 +1332,7 @@ define internal void @TransformColorInverse_SSE2(ptr noundef %0, ptr noundef %1,
%43 = shl <8 x i16> %42, splat (i16 8)
%44 = tail call <8 x i16> @llvm.x86.sse2.pmulh.w(<8 x i16> %43, <8 x i16> %30)
%45 = bitcast <8 x i16> %44 to <4 x i32>
%46 = lshr <4 x i32> %45, splat (i32 8)
%46 = lshr exact <4 x i32> %45, splat (i32 8)
%47 = bitcast <4 x i32> %46 to <16 x i8>
%48 = bitcast <8 x i16> %43 to <16 x i8>
%49 = add <16 x i8> %48, %47
Expand Down
4 changes: 2 additions & 2 deletions bench/llama.cpp/optimized/ggml-cpu-quants.ll
Original file line number Diff line number Diff line change
Expand Up @@ -1703,7 +1703,7 @@ define void @ggml_vec_dot_q4_K_q8_K(i32 noundef %0, ptr noalias noundef writeonl
%50 = insertelement <4 x i32> %49, i32 %40, i64 2
%51 = insertelement <4 x i32> %50, i32 %39, i64 3
%52 = bitcast <4 x i32> %51 to <16 x i8>
%53 = zext <16 x i8> %52 to <16 x i16>
%53 = zext nneg <16 x i8> %52 to <16 x i16>
%54 = getelementptr inbounds nuw i8, ptr %22, i64 260
%55 = load <4 x i64>, ptr %54, align 1, !tbaa !4
%56 = bitcast <16 x i16> %53 to <8 x i32>
Expand Down Expand Up @@ -1846,7 +1846,7 @@ define void @ggml_vec_dot_q5_K_q8_K(i32 noundef %0, ptr noalias noundef writeonl
%47 = insertelement <4 x i32> %46, i32 %39, i64 2
%48 = insertelement <4 x i32> %47, i32 %38, i64 3
%49 = bitcast <4 x i32> %48 to <16 x i8>
%50 = zext <16 x i8> %49 to <16 x i16>
%50 = zext nneg <16 x i8> %49 to <16 x i16>
%51 = getelementptr inbounds nuw i8, ptr %21, i64 260
%52 = load <4 x i64>, ptr %51, align 1, !tbaa !4
%53 = bitcast <16 x i16> %50 to <8 x i32>
Expand Down
Loading