@@ -244,9 +244,9 @@ define void @tail_predicate_without_optsize(ptr %p, i8 %a, i8 %b, i8 %c, i32 %n)
244244; DEFAULT-NEXT: br label %[[VECTOR_BODY:.*]]
245245; DEFAULT: [[VECTOR_BODY]]:
246246; DEFAULT-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_STORE_CONTINUE36:.*]] ]
247- ; DEFAULT-NEXT: [[VEC_IND:%.*]] = phi <16 x i64 > [ <i64 0, i64 1, i64 2, i64 3, i64 4, i64 5, i64 6, i64 7, i64 8, i64 9, i64 10, i64 11, i64 12, i64 13, i64 14, i64 15>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_STORE_CONTINUE36]] ]
247+ ; DEFAULT-NEXT: [[VEC_IND:%.*]] = phi <16 x i8 > [ <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_STORE_CONTINUE36]] ]
248248; DEFAULT-NEXT: [[VEC_IND1:%.*]] = phi <16 x i8> [ <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT2:%.*]], %[[PRED_STORE_CONTINUE36]] ]
249- ; DEFAULT-NEXT: [[TMP0:%.*]] = icmp ule <16 x i64 > [[VEC_IND]], splat (i64 14)
249+ ; DEFAULT-NEXT: [[TMP0:%.*]] = icmp ule <16 x i8 > [[VEC_IND]], splat (i8 14)
250250; DEFAULT-NEXT: [[TMP1:%.*]] = mul <16 x i8> [[BROADCAST_SPLAT]], [[VEC_IND1]]
251251; DEFAULT-NEXT: [[TMP2:%.*]] = lshr <16 x i8> [[VEC_IND1]], splat (i8 1)
252252; DEFAULT-NEXT: [[TMP3:%.*]] = mul <16 x i8> [[TMP2]], [[BROADCAST_SPLAT4]]
@@ -398,7 +398,7 @@ define void @tail_predicate_without_optsize(ptr %p, i8 %a, i8 %b, i8 %c, i32 %n)
398398; DEFAULT-NEXT: store i8 [[TMP71]], ptr [[TMP70]], align 1
399399; DEFAULT-NEXT: br label %[[PRED_STORE_CONTINUE36]]
400400; DEFAULT: [[PRED_STORE_CONTINUE36]]:
401- ; DEFAULT-NEXT: [[VEC_IND_NEXT]] = add <16 x i64 > [[VEC_IND]], splat (i64 16)
401+ ; DEFAULT-NEXT: [[VEC_IND_NEXT]] = add <16 x i8 > [[VEC_IND]], splat (i8 16)
402402; DEFAULT-NEXT: [[VEC_IND_NEXT2]] = add <16 x i8> [[VEC_IND1]], splat (i8 16)
403403; DEFAULT-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 16
404404; DEFAULT-NEXT: br i1 true, label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP5:![0-9]+]]
@@ -439,9 +439,9 @@ define void @tail_predicate_without_optsize(ptr %p, i8 %a, i8 %b, i8 %c, i32 %n)
439439; OPTSIZE-NEXT: br label %[[VECTOR_BODY:.*]]
440440; OPTSIZE: [[VECTOR_BODY]]:
441441; OPTSIZE-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_STORE_CONTINUE36:.*]] ]
442- ; OPTSIZE-NEXT: [[VEC_IND:%.*]] = phi <16 x i64 > [ <i64 0, i64 1, i64 2, i64 3, i64 4, i64 5, i64 6, i64 7, i64 8, i64 9, i64 10, i64 11, i64 12, i64 13, i64 14, i64 15>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_STORE_CONTINUE36]] ]
442+ ; OPTSIZE-NEXT: [[VEC_IND:%.*]] = phi <16 x i8 > [ <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_STORE_CONTINUE36]] ]
443443; OPTSIZE-NEXT: [[VEC_IND1:%.*]] = phi <16 x i8> [ <i8 0, i8 1, i8 2, i8 3, i8 4, i8 5, i8 6, i8 7, i8 8, i8 9, i8 10, i8 11, i8 12, i8 13, i8 14, i8 15>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT2:%.*]], %[[PRED_STORE_CONTINUE36]] ]
444- ; OPTSIZE-NEXT: [[TMP72:%.*]] = icmp ule <16 x i64 > [[VEC_IND]], splat (i64 14)
444+ ; OPTSIZE-NEXT: [[TMP72:%.*]] = icmp ule <16 x i8 > [[VEC_IND]], splat (i8 14)
445445; OPTSIZE-NEXT: [[TMP1:%.*]] = mul <16 x i8> [[BROADCAST_SPLAT]], [[VEC_IND1]]
446446; OPTSIZE-NEXT: [[TMP2:%.*]] = lshr <16 x i8> [[VEC_IND1]], splat (i8 1)
447447; OPTSIZE-NEXT: [[TMP3:%.*]] = mul <16 x i8> [[TMP2]], [[BROADCAST_SPLAT4]]
@@ -593,7 +593,7 @@ define void @tail_predicate_without_optsize(ptr %p, i8 %a, i8 %b, i8 %c, i32 %n)
593593; OPTSIZE-NEXT: store i8 [[TMP71]], ptr [[TMP70]], align 1
594594; OPTSIZE-NEXT: br label %[[PRED_STORE_CONTINUE36]]
595595; OPTSIZE: [[PRED_STORE_CONTINUE36]]:
596- ; OPTSIZE-NEXT: [[VEC_IND_NEXT]] = add <16 x i64 > [[VEC_IND]], splat (i64 16)
596+ ; OPTSIZE-NEXT: [[VEC_IND_NEXT]] = add <16 x i8 > [[VEC_IND]], splat (i8 16)
597597; OPTSIZE-NEXT: [[VEC_IND_NEXT2]] = add <16 x i8> [[VEC_IND1]], splat (i8 16)
598598; OPTSIZE-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 16
599599; OPTSIZE-NEXT: br i1 true, label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP3:![0-9]+]]
0 commit comments