Skip to content

Commit b51b967

Browse files
committed
[LV] Add test for more precise no-free checks.
1 parent 3e54505 commit b51b967

File tree

1 file changed

+192
-0
lines changed

1 file changed

+192
-0
lines changed

llvm/test/Transforms/LoopVectorize/dereferenceable-info-from-assumption-constant-size.ll

Lines changed: 192 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1519,6 +1519,196 @@ exit:
15191519
declare ptr @get_ptr()
15201520
declare void @may_free()
15211521

1522+
define void @deref_assumption_in_header_constant_trip_count_nofree_via_context(ptr noalias noundef %a, ptr noalias %b, ptr noalias %c) nosync {
1523+
; CHECK-LABEL: define void @deref_assumption_in_header_constant_trip_count_nofree_via_context(
1524+
; CHECK-SAME: ptr noalias noundef [[A:%.*]], ptr noalias [[B:%.*]], ptr noalias [[C:%.*]]) #[[ATTR2:[0-9]+]] {
1525+
; CHECK-NEXT: [[ENTRY:.*:]]
1526+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[A]], i64 4), "dereferenceable"(ptr [[A]], i64 4000) ]
1527+
; CHECK-NEXT: br label %[[VECTOR_PH:.*]]
1528+
; CHECK: [[VECTOR_PH]]:
1529+
; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
1530+
; CHECK: [[VECTOR_BODY]]:
1531+
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2:.*]] ]
1532+
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[INDEX]]
1533+
; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <2 x i32>, ptr [[TMP0]], align 4
1534+
; CHECK-NEXT: [[TMP1:%.*]] = icmp slt <2 x i32> [[WIDE_LOAD]], zeroinitializer
1535+
; CHECK-NEXT: [[TMP2:%.*]] = extractelement <2 x i1> [[TMP1]], i32 0
1536+
; CHECK-NEXT: br i1 [[TMP2]], label %[[PRED_LOAD_IF:.*]], label %[[PRED_LOAD_CONTINUE:.*]]
1537+
; CHECK: [[PRED_LOAD_IF]]:
1538+
; CHECK-NEXT: [[TMP3:%.*]] = add i64 [[INDEX]], 0
1539+
; CHECK-NEXT: [[TMP4:%.*]] = getelementptr i32, ptr [[A]], i64 [[TMP3]]
1540+
; CHECK-NEXT: [[TMP5:%.*]] = load i32, ptr [[TMP4]], align 4
1541+
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <2 x i32> poison, i32 [[TMP5]], i32 0
1542+
; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE]]
1543+
; CHECK: [[PRED_LOAD_CONTINUE]]:
1544+
; CHECK-NEXT: [[TMP7:%.*]] = phi <2 x i32> [ poison, %[[VECTOR_BODY]] ], [ [[TMP6]], %[[PRED_LOAD_IF]] ]
1545+
; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x i1> [[TMP1]], i32 1
1546+
; CHECK-NEXT: br i1 [[TMP8]], label %[[PRED_LOAD_IF1:.*]], label %[[PRED_LOAD_CONTINUE2]]
1547+
; CHECK: [[PRED_LOAD_IF1]]:
1548+
; CHECK-NEXT: [[TMP9:%.*]] = add i64 [[INDEX]], 1
1549+
; CHECK-NEXT: [[TMP10:%.*]] = getelementptr i32, ptr [[A]], i64 [[TMP9]]
1550+
; CHECK-NEXT: [[TMP11:%.*]] = load i32, ptr [[TMP10]], align 4
1551+
; CHECK-NEXT: [[TMP12:%.*]] = insertelement <2 x i32> [[TMP7]], i32 [[TMP11]], i32 1
1552+
; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE2]]
1553+
; CHECK: [[PRED_LOAD_CONTINUE2]]:
1554+
; CHECK-NEXT: [[TMP13:%.*]] = phi <2 x i32> [ [[TMP7]], %[[PRED_LOAD_CONTINUE]] ], [ [[TMP12]], %[[PRED_LOAD_IF1]] ]
1555+
; CHECK-NEXT: [[PREDPHI:%.*]] = select <2 x i1> [[TMP1]], <2 x i32> [[TMP13]], <2 x i32> [[WIDE_LOAD]]
1556+
; CHECK-NEXT: [[TMP14:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[INDEX]]
1557+
; CHECK-NEXT: store <2 x i32> [[PREDPHI]], ptr [[TMP14]], align 4
1558+
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2
1559+
; CHECK-NEXT: [[TMP15:%.*]] = icmp eq i64 [[INDEX_NEXT]], 1000
1560+
; CHECK-NEXT: br i1 [[TMP15]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP20:![0-9]+]]
1561+
; CHECK: [[MIDDLE_BLOCK]]:
1562+
; CHECK-NEXT: br label %[[EXIT:.*]]
1563+
; CHECK: [[SCALAR_PH:.*]]:
1564+
; CHECK-NEXT: br label %[[LOOP_HEADER:.*]]
1565+
; CHECK: [[LOOP_HEADER]]:
1566+
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP_LATCH:.*]] ]
1567+
; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr i32, ptr [[A]], i64 [[IV]]
1568+
; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[IV]]
1569+
; CHECK-NEXT: [[L_B:%.*]] = load i32, ptr [[GEP_B]], align 4
1570+
; CHECK-NEXT: [[C_1:%.*]] = icmp sge i32 [[L_B]], 0
1571+
; CHECK-NEXT: br i1 [[C_1]], label %[[LOOP_LATCH]], label %[[LOOP_THEN:.*]]
1572+
; CHECK: [[LOOP_THEN]]:
1573+
; CHECK-NEXT: [[L_A:%.*]] = load i32, ptr [[GEP_A]], align 4
1574+
; CHECK-NEXT: br label %[[LOOP_LATCH]]
1575+
; CHECK: [[LOOP_LATCH]]:
1576+
; CHECK-NEXT: [[MERGE:%.*]] = phi i32 [ [[L_A]], %[[LOOP_THEN]] ], [ [[L_B]], %[[LOOP_HEADER]] ]
1577+
; CHECK-NEXT: [[GEP_C:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[IV]]
1578+
; CHECK-NEXT: store i32 [[MERGE]], ptr [[GEP_C]], align 4
1579+
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
1580+
; CHECK-NEXT: [[EC:%.*]] = icmp eq i64 [[IV_NEXT]], 1000
1581+
; CHECK-NEXT: br i1 [[EC]], label %[[EXIT]], label %[[LOOP_HEADER]]
1582+
; CHECK: [[EXIT]]:
1583+
; CHECK-NEXT: ret void
1584+
;
1585+
entry:
1586+
call void @llvm.assume(i1 true) [ "align"(ptr %a, i64 4), "dereferenceable"(ptr %a, i64 4000) ]
1587+
br label %loop.header
1588+
1589+
loop.header:
1590+
%iv = phi i64 [ 0, %entry ], [ %iv.next, %loop.latch ]
1591+
%gep.a = getelementptr i32, ptr %a, i64 %iv
1592+
%gep.b = getelementptr inbounds i32, ptr %b, i64 %iv
1593+
%l.b = load i32, ptr %gep.b, align 4
1594+
%c.1 = icmp sge i32 %l.b, 0
1595+
br i1 %c.1, label %loop.latch, label %loop.then
1596+
1597+
loop.then:
1598+
%l.a = load i32, ptr %gep.a, align 4
1599+
br label %loop.latch
1600+
1601+
loop.latch:
1602+
%merge = phi i32 [ %l.a, %loop.then ], [ %l.b, %loop.header ]
1603+
%gep.c = getelementptr inbounds i32, ptr %c, i64 %iv
1604+
store i32 %merge, ptr %gep.c, align 4
1605+
%iv.next = add nuw nsw i64 %iv, 1
1606+
%ec = icmp eq i64 %iv.next, 1000
1607+
br i1 %ec, label %exit, label %loop.header
1608+
1609+
exit:
1610+
ret void
1611+
}
1612+
1613+
define void @deref_assumption_in_header_constant_trip_count_may_free(ptr noalias noundef %a, ptr noalias %b, ptr noalias %c) nosync {
1614+
; CHECK-LABEL: define void @deref_assumption_in_header_constant_trip_count_may_free(
1615+
; CHECK-SAME: ptr noalias noundef [[A:%.*]], ptr noalias [[B:%.*]], ptr noalias [[C:%.*]]) #[[ATTR2]] {
1616+
; CHECK-NEXT: [[ENTRY:.*:]]
1617+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[A]], i64 4), "dereferenceable"(ptr [[A]], i64 4000) ]
1618+
; CHECK-NEXT: call void @may_free()
1619+
; CHECK-NEXT: br label %[[VECTOR_PH:.*]]
1620+
; CHECK: [[VECTOR_PH]]:
1621+
; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
1622+
; CHECK: [[VECTOR_BODY]]:
1623+
; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2:.*]] ]
1624+
; CHECK-NEXT: [[VEC_IND:%.*]] = phi <2 x i64> [ <i64 0, i64 1>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2]] ]
1625+
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr i32, ptr [[A]], <2 x i64> [[VEC_IND]]
1626+
; CHECK-NEXT: [[TMP1:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 0
1627+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[TMP1]], i64 4), "dereferenceable"(ptr [[TMP1]], i64 4) ]
1628+
; CHECK-NEXT: [[TMP2:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 1
1629+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[TMP2]], i64 4), "dereferenceable"(ptr [[TMP2]], i64 4) ]
1630+
; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[INDEX]]
1631+
; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <2 x i32>, ptr [[TMP3]], align 4
1632+
; CHECK-NEXT: [[TMP4:%.*]] = icmp slt <2 x i32> [[WIDE_LOAD]], zeroinitializer
1633+
; CHECK-NEXT: [[TMP5:%.*]] = extractelement <2 x i1> [[TMP4]], i32 0
1634+
; CHECK-NEXT: br i1 [[TMP5]], label %[[PRED_LOAD_IF:.*]], label %[[PRED_LOAD_CONTINUE:.*]]
1635+
; CHECK: [[PRED_LOAD_IF]]:
1636+
; CHECK-NEXT: [[TMP6:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 0
1637+
; CHECK-NEXT: [[TMP7:%.*]] = load i32, ptr [[TMP6]], align 4
1638+
; CHECK-NEXT: [[TMP8:%.*]] = insertelement <2 x i32> poison, i32 [[TMP7]], i32 0
1639+
; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE]]
1640+
; CHECK: [[PRED_LOAD_CONTINUE]]:
1641+
; CHECK-NEXT: [[TMP9:%.*]] = phi <2 x i32> [ poison, %[[VECTOR_BODY]] ], [ [[TMP8]], %[[PRED_LOAD_IF]] ]
1642+
; CHECK-NEXT: [[TMP10:%.*]] = extractelement <2 x i1> [[TMP4]], i32 1
1643+
; CHECK-NEXT: br i1 [[TMP10]], label %[[PRED_LOAD_IF1:.*]], label %[[PRED_LOAD_CONTINUE2]]
1644+
; CHECK: [[PRED_LOAD_IF1]]:
1645+
; CHECK-NEXT: [[TMP11:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 1
1646+
; CHECK-NEXT: [[TMP12:%.*]] = load i32, ptr [[TMP11]], align 4
1647+
; CHECK-NEXT: [[TMP13:%.*]] = insertelement <2 x i32> [[TMP9]], i32 [[TMP12]], i32 1
1648+
; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE2]]
1649+
; CHECK: [[PRED_LOAD_CONTINUE2]]:
1650+
; CHECK-NEXT: [[TMP14:%.*]] = phi <2 x i32> [ [[TMP9]], %[[PRED_LOAD_CONTINUE]] ], [ [[TMP13]], %[[PRED_LOAD_IF1]] ]
1651+
; CHECK-NEXT: [[PREDPHI:%.*]] = select <2 x i1> [[TMP4]], <2 x i32> [[TMP14]], <2 x i32> [[WIDE_LOAD]]
1652+
; CHECK-NEXT: [[TMP15:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[INDEX]]
1653+
; CHECK-NEXT: store <2 x i32> [[PREDPHI]], ptr [[TMP15]], align 4
1654+
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2
1655+
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <2 x i64> [[VEC_IND]], splat (i64 2)
1656+
; CHECK-NEXT: [[TMP16:%.*]] = icmp eq i64 [[INDEX_NEXT]], 1000
1657+
; CHECK-NEXT: br i1 [[TMP16]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP21:![0-9]+]]
1658+
; CHECK: [[MIDDLE_BLOCK]]:
1659+
; CHECK-NEXT: br label %[[EXIT:.*]]
1660+
; CHECK: [[SCALAR_PH:.*]]:
1661+
; CHECK-NEXT: br label %[[LOOP_HEADER:.*]]
1662+
; CHECK: [[LOOP_HEADER]]:
1663+
; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP_LATCH:.*]] ]
1664+
; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr i32, ptr [[A]], i64 [[IV]]
1665+
; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[GEP_A]], i64 4), "dereferenceable"(ptr [[GEP_A]], i64 4) ]
1666+
; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[IV]]
1667+
; CHECK-NEXT: [[L_B:%.*]] = load i32, ptr [[GEP_B]], align 4
1668+
; CHECK-NEXT: [[C_1:%.*]] = icmp sge i32 [[L_B]], 0
1669+
; CHECK-NEXT: br i1 [[C_1]], label %[[LOOP_LATCH]], label %[[LOOP_THEN:.*]]
1670+
; CHECK: [[LOOP_THEN]]:
1671+
; CHECK-NEXT: [[L_A:%.*]] = load i32, ptr [[GEP_A]], align 4
1672+
; CHECK-NEXT: br label %[[LOOP_LATCH]]
1673+
; CHECK: [[LOOP_LATCH]]:
1674+
; CHECK-NEXT: [[MERGE:%.*]] = phi i32 [ [[L_A]], %[[LOOP_THEN]] ], [ [[L_B]], %[[LOOP_HEADER]] ]
1675+
; CHECK-NEXT: [[GEP_C:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[IV]]
1676+
; CHECK-NEXT: store i32 [[MERGE]], ptr [[GEP_C]], align 4
1677+
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
1678+
; CHECK-NEXT: [[EC:%.*]] = icmp eq i64 [[IV_NEXT]], 1000
1679+
; CHECK-NEXT: br i1 [[EC]], label %[[EXIT]], label %[[LOOP_HEADER]]
1680+
; CHECK: [[EXIT]]:
1681+
; CHECK-NEXT: ret void
1682+
;
1683+
entry:
1684+
call void @llvm.assume(i1 true) [ "align"(ptr %a, i64 4), "dereferenceable"(ptr %a, i64 4000) ]
1685+
call void @may_free()
1686+
br label %loop.header
1687+
1688+
loop.header:
1689+
%iv = phi i64 [ 0, %entry ], [ %iv.next, %loop.latch ]
1690+
%gep.a = getelementptr i32, ptr %a, i64 %iv
1691+
call void @llvm.assume(i1 true) [ "align"(ptr %gep.a, i64 4), "dereferenceable"(ptr %gep.a, i64 4) ]
1692+
%gep.b = getelementptr inbounds i32, ptr %b, i64 %iv
1693+
%l.b = load i32, ptr %gep.b, align 4
1694+
%c.1 = icmp sge i32 %l.b, 0
1695+
br i1 %c.1, label %loop.latch, label %loop.then
1696+
1697+
loop.then:
1698+
%l.a = load i32, ptr %gep.a, align 4
1699+
br label %loop.latch
1700+
1701+
loop.latch:
1702+
%merge = phi i32 [ %l.a, %loop.then ], [ %l.b, %loop.header ]
1703+
%gep.c = getelementptr inbounds i32, ptr %c, i64 %iv
1704+
store i32 %merge, ptr %gep.c, align 4
1705+
%iv.next = add nuw nsw i64 %iv, 1
1706+
%ec = icmp eq i64 %iv.next, 1000
1707+
br i1 %ec, label %exit, label %loop.header
1708+
1709+
exit:
1710+
ret void
1711+
}
15221712
;.
15231713
; CHECK: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]], [[META2:![0-9]+]]}
15241714
; CHECK: [[META1]] = !{!"llvm.loop.isvectorized", i32 1}
@@ -1540,4 +1730,6 @@ declare void @may_free()
15401730
; CHECK: [[LOOP17]] = distinct !{[[LOOP17]], [[META1]], [[META2]]}
15411731
; CHECK: [[LOOP18]] = distinct !{[[LOOP18]], [[META1]], [[META2]]}
15421732
; CHECK: [[LOOP19]] = distinct !{[[LOOP19]], [[META1]], [[META2]]}
1733+
; CHECK: [[LOOP20]] = distinct !{[[LOOP20]], [[META1]], [[META2]]}
1734+
; CHECK: [[LOOP21]] = distinct !{[[LOOP21]], [[META1]], [[META2]]}
15431735
;.

0 commit comments

Comments
 (0)