@@ -68,28 +68,32 @@ define i32 @iv_zext_zext_gt_slt(i32 %iter.count, ptr %ptr) {
6868; CHECK-LABEL: define i32 @iv_zext_zext_gt_slt(
6969; CHECK-SAME: i32 [[ITER_COUNT:%.*]], ptr [[PTR:%.*]]) {
7070; CHECK-NEXT: [[ENTRY:.*]]:
71- ; CHECK-NEXT: [[TMP0:%.*]] = sext i32 [[ITER_COUNT]] to i64
71+ ; CHECK-NEXT: [[TMP0:%.*]] = add nsw i32 [[ITER_COUNT]], -1
7272; CHECK-NEXT: br label %[[OUTER_LOOP:.*]]
7373; CHECK: [[PH_LOOPEXIT:.*]]:
7474; CHECK-NEXT: br label %[[PH:.*]]
7575; CHECK: [[PH]]:
76+ ; CHECK-NEXT: [[INDVARS_IV_NEXT3:%.*]] = add i32 [[INDVARS_IV1:%.*]], -1
7677; CHECK-NEXT: br label %[[OUTER_LOOP]]
7778; CHECK: [[OUTER_LOOP]]:
78- ; CHECK-NEXT: [[INDVARS_IV1:%.*]] = phi i64 [ [[INDVARS_IV_NEXT2:%.*]], %[[PH]] ], [ [[TMP0]], %[[ENTRY]] ]
79- ; CHECK-NEXT: [[INDVARS_IV_NEXT2]] = add nsw i64 [[INDVARS_IV1]], -1
79+ ; CHECK-NEXT: [[INDVARS_IV1]] = phi i32 [ [[INDVARS_IV_NEXT3]], %[[PH]] ], [ [[TMP0]], %[[ENTRY]] ]
80+ ; CHECK-NEXT: [[IV_OUTER:%.*]] = phi i32 [ [[IV_OUTER_1:%.*]], %[[PH]] ], [ [[ITER_COUNT]], %[[ENTRY]] ]
81+ ; CHECK-NEXT: [[IV_OUTER_1]] = add nsw i32 [[IV_OUTER]], -1
82+ ; CHECK-NEXT: [[INDVARS_IV_NEXT2:%.*]] = zext nneg i32 [[IV_OUTER_1]] to i64
8083; CHECK-NEXT: [[GEP_OUTER:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[INDVARS_IV_NEXT2]]
8184; CHECK-NEXT: store i8 0, ptr [[GEP_OUTER]], align 1
82- ; CHECK-NEXT: [[EXIT_COND_OUTER:%.*]] = icmp samesign ugt i64 [[INDVARS_IV1 ]], 1
85+ ; CHECK-NEXT: [[EXIT_COND_OUTER:%.*]] = icmp samesign ugt i32 [[IV_OUTER ]], 1
8386; CHECK-NEXT: br i1 [[EXIT_COND_OUTER]], label %[[INNER_LOOP_PREHEADER:.*]], label %[[PH]]
8487; CHECK: [[INNER_LOOP_PREHEADER]]:
88+ ; CHECK-NEXT: [[WIDE_TRIP_COUNT:%.*]] = zext i32 [[INDVARS_IV1]] to i64
8589; CHECK-NEXT: br label %[[INNER_LOOP:.*]]
8690; CHECK: [[INNER_LOOP]]:
8791; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i64 [ 0, %[[INNER_LOOP_PREHEADER]] ], [ [[INDVARS_IV_NEXT:%.*]], %[[INNER_LOOP]] ]
8892; CHECK-NEXT: [[GEP_INNER:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[INDVARS_IV]]
8993; CHECK-NEXT: store i8 0, ptr [[GEP_INNER]], align 1
9094; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add nuw nsw i64 [[INDVARS_IV]], 1
91- ; CHECK-NEXT: [[EXIT_COND_INNER :%.*]] = icmp slt i64 [[INDVARS_IV_NEXT]], [[INDVARS_IV_NEXT2 ]]
92- ; CHECK-NEXT: br i1 [[EXIT_COND_INNER ]], label %[[INNER_LOOP]], label %[[PH_LOOPEXIT]]
95+ ; CHECK-NEXT: [[EXITCOND :%.*]] = icmp ne i64 [[INDVARS_IV_NEXT]], [[WIDE_TRIP_COUNT ]]
96+ ; CHECK-NEXT: br i1 [[EXITCOND ]], label %[[INNER_LOOP]], label %[[PH_LOOPEXIT]]
9397; CHECK: [[EXIT:.*:]]
9498; CHECK-NEXT: ret i32 0
9599;
@@ -424,28 +428,32 @@ define i32 @iv_sext_sext_gt_slt(i32 %iter.count, ptr %ptr) {
424428; CHECK-LABEL: define i32 @iv_sext_sext_gt_slt(
425429; CHECK-SAME: i32 [[ITER_COUNT:%.*]], ptr [[PTR:%.*]]) {
426430; CHECK-NEXT: [[ENTRY:.*]]:
431+ ; CHECK-NEXT: [[TMP1:%.*]] = add nsw i32 [[ITER_COUNT]], -1
427432; CHECK-NEXT: [[TMP0:%.*]] = sext i32 [[ITER_COUNT]] to i64
428433; CHECK-NEXT: br label %[[OUTER_LOOP:.*]]
429434; CHECK: [[PH_LOOPEXIT:.*]]:
430435; CHECK-NEXT: br label %[[PH:.*]]
431436; CHECK: [[PH]]:
437+ ; CHECK-NEXT: [[INDVARS_IV_NEXT3:%.*]] = add i32 [[INDVARS_IV2:%.*]], -1
432438; CHECK-NEXT: br label %[[OUTER_LOOP]]
433439; CHECK: [[OUTER_LOOP]]:
434440; CHECK-NEXT: [[INDVARS_IV1:%.*]] = phi i64 [ [[INDVARS_IV_NEXT2:%.*]], %[[PH]] ], [ [[TMP0]], %[[ENTRY]] ]
441+ ; CHECK-NEXT: [[INDVARS_IV2]] = phi i32 [ [[INDVARS_IV_NEXT3]], %[[PH]] ], [ [[TMP1]], %[[ENTRY]] ]
435442; CHECK-NEXT: [[INDVARS_IV_NEXT2]] = add nsw i64 [[INDVARS_IV1]], -1
436443; CHECK-NEXT: [[GEP_OUTER:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[INDVARS_IV_NEXT2]]
437444; CHECK-NEXT: store i8 0, ptr [[GEP_OUTER]], align 1
438445; CHECK-NEXT: [[EXIT_COND_OUTER:%.*]] = icmp samesign ugt i64 [[INDVARS_IV1]], 1
439446; CHECK-NEXT: br i1 [[EXIT_COND_OUTER]], label %[[INNER_LOOP_PREHEADER:.*]], label %[[PH]]
440447; CHECK: [[INNER_LOOP_PREHEADER]]:
448+ ; CHECK-NEXT: [[WIDE_TRIP_COUNT:%.*]] = zext i32 [[INDVARS_IV2]] to i64
441449; CHECK-NEXT: br label %[[INNER_LOOP:.*]]
442450; CHECK: [[INNER_LOOP]]:
443451; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i64 [ 0, %[[INNER_LOOP_PREHEADER]] ], [ [[INDVARS_IV_NEXT:%.*]], %[[INNER_LOOP]] ]
444452; CHECK-NEXT: [[GEP_INNER:%.*]] = getelementptr i8, ptr [[PTR]], i64 [[INDVARS_IV]]
445453; CHECK-NEXT: store i8 0, ptr [[GEP_INNER]], align 1
446454; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add nuw nsw i64 [[INDVARS_IV]], 1
447- ; CHECK-NEXT: [[EXIT_COND_INNER :%.*]] = icmp slt i64 [[INDVARS_IV_NEXT]], [[INDVARS_IV_NEXT2 ]]
448- ; CHECK-NEXT: br i1 [[EXIT_COND_INNER ]], label %[[INNER_LOOP]], label %[[PH_LOOPEXIT]]
455+ ; CHECK-NEXT: [[EXITCOND :%.*]] = icmp ne i64 [[INDVARS_IV_NEXT]], [[WIDE_TRIP_COUNT ]]
456+ ; CHECK-NEXT: br i1 [[EXITCOND ]], label %[[INNER_LOOP]], label %[[PH_LOOPEXIT]]
449457; CHECK: [[EXIT:.*:]]
450458; CHECK-NEXT: ret i32 0
451459;
0 commit comments