@@ -1519,6 +1519,196 @@ exit:
15191519declare ptr @get_ptr ()
15201520declare void @may_free ()
15211521
1522+ define void @deref_assumption_in_header_constant_trip_count_nofree_via_context (ptr noalias noundef %a , ptr noalias %b , ptr noalias %c ) nosync {
1523+ ; CHECK-LABEL: define void @deref_assumption_in_header_constant_trip_count_nofree_via_context(
1524+ ; CHECK-SAME: ptr noalias noundef [[A:%.*]], ptr noalias [[B:%.*]], ptr noalias [[C:%.*]]) #[[ATTR2:[0-9]+]] {
1525+ ; CHECK-NEXT: [[ENTRY:.*:]]
1526+ ; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[A]], i64 4), "dereferenceable"(ptr [[A]], i64 4000) ]
1527+ ; CHECK-NEXT: br label %[[VECTOR_PH:.*]]
1528+ ; CHECK: [[VECTOR_PH]]:
1529+ ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
1530+ ; CHECK: [[VECTOR_BODY]]:
1531+ ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2:.*]] ]
1532+ ; CHECK-NEXT: [[TMP0:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[INDEX]]
1533+ ; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <2 x i32>, ptr [[TMP0]], align 4
1534+ ; CHECK-NEXT: [[TMP1:%.*]] = icmp slt <2 x i32> [[WIDE_LOAD]], zeroinitializer
1535+ ; CHECK-NEXT: [[TMP2:%.*]] = extractelement <2 x i1> [[TMP1]], i32 0
1536+ ; CHECK-NEXT: br i1 [[TMP2]], label %[[PRED_LOAD_IF:.*]], label %[[PRED_LOAD_CONTINUE:.*]]
1537+ ; CHECK: [[PRED_LOAD_IF]]:
1538+ ; CHECK-NEXT: [[TMP3:%.*]] = add i64 [[INDEX]], 0
1539+ ; CHECK-NEXT: [[TMP4:%.*]] = getelementptr i32, ptr [[A]], i64 [[TMP3]]
1540+ ; CHECK-NEXT: [[TMP5:%.*]] = load i32, ptr [[TMP4]], align 4
1541+ ; CHECK-NEXT: [[TMP6:%.*]] = insertelement <2 x i32> poison, i32 [[TMP5]], i32 0
1542+ ; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE]]
1543+ ; CHECK: [[PRED_LOAD_CONTINUE]]:
1544+ ; CHECK-NEXT: [[TMP7:%.*]] = phi <2 x i32> [ poison, %[[VECTOR_BODY]] ], [ [[TMP6]], %[[PRED_LOAD_IF]] ]
1545+ ; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x i1> [[TMP1]], i32 1
1546+ ; CHECK-NEXT: br i1 [[TMP8]], label %[[PRED_LOAD_IF1:.*]], label %[[PRED_LOAD_CONTINUE2]]
1547+ ; CHECK: [[PRED_LOAD_IF1]]:
1548+ ; CHECK-NEXT: [[TMP9:%.*]] = add i64 [[INDEX]], 1
1549+ ; CHECK-NEXT: [[TMP10:%.*]] = getelementptr i32, ptr [[A]], i64 [[TMP9]]
1550+ ; CHECK-NEXT: [[TMP11:%.*]] = load i32, ptr [[TMP10]], align 4
1551+ ; CHECK-NEXT: [[TMP12:%.*]] = insertelement <2 x i32> [[TMP7]], i32 [[TMP11]], i32 1
1552+ ; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE2]]
1553+ ; CHECK: [[PRED_LOAD_CONTINUE2]]:
1554+ ; CHECK-NEXT: [[TMP13:%.*]] = phi <2 x i32> [ [[TMP7]], %[[PRED_LOAD_CONTINUE]] ], [ [[TMP12]], %[[PRED_LOAD_IF1]] ]
1555+ ; CHECK-NEXT: [[PREDPHI:%.*]] = select <2 x i1> [[TMP1]], <2 x i32> [[TMP13]], <2 x i32> [[WIDE_LOAD]]
1556+ ; CHECK-NEXT: [[TMP14:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[INDEX]]
1557+ ; CHECK-NEXT: store <2 x i32> [[PREDPHI]], ptr [[TMP14]], align 4
1558+ ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2
1559+ ; CHECK-NEXT: [[TMP15:%.*]] = icmp eq i64 [[INDEX_NEXT]], 1000
1560+ ; CHECK-NEXT: br i1 [[TMP15]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP20:![0-9]+]]
1561+ ; CHECK: [[MIDDLE_BLOCK]]:
1562+ ; CHECK-NEXT: br label %[[EXIT:.*]]
1563+ ; CHECK: [[SCALAR_PH:.*]]:
1564+ ; CHECK-NEXT: br label %[[LOOP_HEADER:.*]]
1565+ ; CHECK: [[LOOP_HEADER]]:
1566+ ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP_LATCH:.*]] ]
1567+ ; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr i32, ptr [[A]], i64 [[IV]]
1568+ ; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[IV]]
1569+ ; CHECK-NEXT: [[L_B:%.*]] = load i32, ptr [[GEP_B]], align 4
1570+ ; CHECK-NEXT: [[C_1:%.*]] = icmp sge i32 [[L_B]], 0
1571+ ; CHECK-NEXT: br i1 [[C_1]], label %[[LOOP_LATCH]], label %[[LOOP_THEN:.*]]
1572+ ; CHECK: [[LOOP_THEN]]:
1573+ ; CHECK-NEXT: [[L_A:%.*]] = load i32, ptr [[GEP_A]], align 4
1574+ ; CHECK-NEXT: br label %[[LOOP_LATCH]]
1575+ ; CHECK: [[LOOP_LATCH]]:
1576+ ; CHECK-NEXT: [[MERGE:%.*]] = phi i32 [ [[L_A]], %[[LOOP_THEN]] ], [ [[L_B]], %[[LOOP_HEADER]] ]
1577+ ; CHECK-NEXT: [[GEP_C:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[IV]]
1578+ ; CHECK-NEXT: store i32 [[MERGE]], ptr [[GEP_C]], align 4
1579+ ; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
1580+ ; CHECK-NEXT: [[EC:%.*]] = icmp eq i64 [[IV_NEXT]], 1000
1581+ ; CHECK-NEXT: br i1 [[EC]], label %[[EXIT]], label %[[LOOP_HEADER]]
1582+ ; CHECK: [[EXIT]]:
1583+ ; CHECK-NEXT: ret void
1584+ ;
1585+ entry:
1586+ call void @llvm.assume (i1 true ) [ "align" (ptr %a , i64 4 ), "dereferenceable" (ptr %a , i64 4000 ) ]
1587+ br label %loop.header
1588+
1589+ loop.header:
1590+ %iv = phi i64 [ 0 , %entry ], [ %iv.next , %loop.latch ]
1591+ %gep.a = getelementptr i32 , ptr %a , i64 %iv
1592+ %gep.b = getelementptr inbounds i32 , ptr %b , i64 %iv
1593+ %l.b = load i32 , ptr %gep.b , align 4
1594+ %c.1 = icmp sge i32 %l.b , 0
1595+ br i1 %c.1 , label %loop.latch , label %loop.then
1596+
1597+ loop.then:
1598+ %l.a = load i32 , ptr %gep.a , align 4
1599+ br label %loop.latch
1600+
1601+ loop.latch:
1602+ %merge = phi i32 [ %l.a , %loop.then ], [ %l.b , %loop.header ]
1603+ %gep.c = getelementptr inbounds i32 , ptr %c , i64 %iv
1604+ store i32 %merge , ptr %gep.c , align 4
1605+ %iv.next = add nuw nsw i64 %iv , 1
1606+ %ec = icmp eq i64 %iv.next , 1000
1607+ br i1 %ec , label %exit , label %loop.header
1608+
1609+ exit:
1610+ ret void
1611+ }
1612+
1613+ define void @deref_assumption_in_header_constant_trip_count_may_free (ptr noalias noundef %a , ptr noalias %b , ptr noalias %c ) nosync {
1614+ ; CHECK-LABEL: define void @deref_assumption_in_header_constant_trip_count_may_free(
1615+ ; CHECK-SAME: ptr noalias noundef [[A:%.*]], ptr noalias [[B:%.*]], ptr noalias [[C:%.*]]) #[[ATTR2]] {
1616+ ; CHECK-NEXT: [[ENTRY:.*:]]
1617+ ; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[A]], i64 4), "dereferenceable"(ptr [[A]], i64 4000) ]
1618+ ; CHECK-NEXT: call void @may_free()
1619+ ; CHECK-NEXT: br label %[[VECTOR_PH:.*]]
1620+ ; CHECK: [[VECTOR_PH]]:
1621+ ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
1622+ ; CHECK: [[VECTOR_BODY]]:
1623+ ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2:.*]] ]
1624+ ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <2 x i64> [ <i64 0, i64 1>, %[[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], %[[PRED_LOAD_CONTINUE2]] ]
1625+ ; CHECK-NEXT: [[TMP0:%.*]] = getelementptr i32, ptr [[A]], <2 x i64> [[VEC_IND]]
1626+ ; CHECK-NEXT: [[TMP1:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 0
1627+ ; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[TMP1]], i64 4), "dereferenceable"(ptr [[TMP1]], i64 4) ]
1628+ ; CHECK-NEXT: [[TMP2:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 1
1629+ ; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[TMP2]], i64 4), "dereferenceable"(ptr [[TMP2]], i64 4) ]
1630+ ; CHECK-NEXT: [[TMP3:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[INDEX]]
1631+ ; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <2 x i32>, ptr [[TMP3]], align 4
1632+ ; CHECK-NEXT: [[TMP4:%.*]] = icmp slt <2 x i32> [[WIDE_LOAD]], zeroinitializer
1633+ ; CHECK-NEXT: [[TMP5:%.*]] = extractelement <2 x i1> [[TMP4]], i32 0
1634+ ; CHECK-NEXT: br i1 [[TMP5]], label %[[PRED_LOAD_IF:.*]], label %[[PRED_LOAD_CONTINUE:.*]]
1635+ ; CHECK: [[PRED_LOAD_IF]]:
1636+ ; CHECK-NEXT: [[TMP6:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 0
1637+ ; CHECK-NEXT: [[TMP7:%.*]] = load i32, ptr [[TMP6]], align 4
1638+ ; CHECK-NEXT: [[TMP8:%.*]] = insertelement <2 x i32> poison, i32 [[TMP7]], i32 0
1639+ ; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE]]
1640+ ; CHECK: [[PRED_LOAD_CONTINUE]]:
1641+ ; CHECK-NEXT: [[TMP9:%.*]] = phi <2 x i32> [ poison, %[[VECTOR_BODY]] ], [ [[TMP8]], %[[PRED_LOAD_IF]] ]
1642+ ; CHECK-NEXT: [[TMP10:%.*]] = extractelement <2 x i1> [[TMP4]], i32 1
1643+ ; CHECK-NEXT: br i1 [[TMP10]], label %[[PRED_LOAD_IF1:.*]], label %[[PRED_LOAD_CONTINUE2]]
1644+ ; CHECK: [[PRED_LOAD_IF1]]:
1645+ ; CHECK-NEXT: [[TMP11:%.*]] = extractelement <2 x ptr> [[TMP0]], i32 1
1646+ ; CHECK-NEXT: [[TMP12:%.*]] = load i32, ptr [[TMP11]], align 4
1647+ ; CHECK-NEXT: [[TMP13:%.*]] = insertelement <2 x i32> [[TMP9]], i32 [[TMP12]], i32 1
1648+ ; CHECK-NEXT: br label %[[PRED_LOAD_CONTINUE2]]
1649+ ; CHECK: [[PRED_LOAD_CONTINUE2]]:
1650+ ; CHECK-NEXT: [[TMP14:%.*]] = phi <2 x i32> [ [[TMP9]], %[[PRED_LOAD_CONTINUE]] ], [ [[TMP13]], %[[PRED_LOAD_IF1]] ]
1651+ ; CHECK-NEXT: [[PREDPHI:%.*]] = select <2 x i1> [[TMP4]], <2 x i32> [[TMP14]], <2 x i32> [[WIDE_LOAD]]
1652+ ; CHECK-NEXT: [[TMP15:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[INDEX]]
1653+ ; CHECK-NEXT: store <2 x i32> [[PREDPHI]], ptr [[TMP15]], align 4
1654+ ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 2
1655+ ; CHECK-NEXT: [[VEC_IND_NEXT]] = add <2 x i64> [[VEC_IND]], splat (i64 2)
1656+ ; CHECK-NEXT: [[TMP16:%.*]] = icmp eq i64 [[INDEX_NEXT]], 1000
1657+ ; CHECK-NEXT: br i1 [[TMP16]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP21:![0-9]+]]
1658+ ; CHECK: [[MIDDLE_BLOCK]]:
1659+ ; CHECK-NEXT: br label %[[EXIT:.*]]
1660+ ; CHECK: [[SCALAR_PH:.*]]:
1661+ ; CHECK-NEXT: br label %[[LOOP_HEADER:.*]]
1662+ ; CHECK: [[LOOP_HEADER]]:
1663+ ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP_LATCH:.*]] ]
1664+ ; CHECK-NEXT: [[GEP_A:%.*]] = getelementptr i32, ptr [[A]], i64 [[IV]]
1665+ ; CHECK-NEXT: call void @llvm.assume(i1 true) [ "align"(ptr [[GEP_A]], i64 4), "dereferenceable"(ptr [[GEP_A]], i64 4) ]
1666+ ; CHECK-NEXT: [[GEP_B:%.*]] = getelementptr inbounds i32, ptr [[B]], i64 [[IV]]
1667+ ; CHECK-NEXT: [[L_B:%.*]] = load i32, ptr [[GEP_B]], align 4
1668+ ; CHECK-NEXT: [[C_1:%.*]] = icmp sge i32 [[L_B]], 0
1669+ ; CHECK-NEXT: br i1 [[C_1]], label %[[LOOP_LATCH]], label %[[LOOP_THEN:.*]]
1670+ ; CHECK: [[LOOP_THEN]]:
1671+ ; CHECK-NEXT: [[L_A:%.*]] = load i32, ptr [[GEP_A]], align 4
1672+ ; CHECK-NEXT: br label %[[LOOP_LATCH]]
1673+ ; CHECK: [[LOOP_LATCH]]:
1674+ ; CHECK-NEXT: [[MERGE:%.*]] = phi i32 [ [[L_A]], %[[LOOP_THEN]] ], [ [[L_B]], %[[LOOP_HEADER]] ]
1675+ ; CHECK-NEXT: [[GEP_C:%.*]] = getelementptr inbounds i32, ptr [[C]], i64 [[IV]]
1676+ ; CHECK-NEXT: store i32 [[MERGE]], ptr [[GEP_C]], align 4
1677+ ; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
1678+ ; CHECK-NEXT: [[EC:%.*]] = icmp eq i64 [[IV_NEXT]], 1000
1679+ ; CHECK-NEXT: br i1 [[EC]], label %[[EXIT]], label %[[LOOP_HEADER]]
1680+ ; CHECK: [[EXIT]]:
1681+ ; CHECK-NEXT: ret void
1682+ ;
1683+ entry:
1684+ call void @llvm.assume (i1 true ) [ "align" (ptr %a , i64 4 ), "dereferenceable" (ptr %a , i64 4000 ) ]
1685+ call void @may_free ()
1686+ br label %loop.header
1687+
1688+ loop.header:
1689+ %iv = phi i64 [ 0 , %entry ], [ %iv.next , %loop.latch ]
1690+ %gep.a = getelementptr i32 , ptr %a , i64 %iv
1691+ call void @llvm.assume (i1 true ) [ "align" (ptr %gep.a , i64 4 ), "dereferenceable" (ptr %gep.a , i64 4 ) ]
1692+ %gep.b = getelementptr inbounds i32 , ptr %b , i64 %iv
1693+ %l.b = load i32 , ptr %gep.b , align 4
1694+ %c.1 = icmp sge i32 %l.b , 0
1695+ br i1 %c.1 , label %loop.latch , label %loop.then
1696+
1697+ loop.then:
1698+ %l.a = load i32 , ptr %gep.a , align 4
1699+ br label %loop.latch
1700+
1701+ loop.latch:
1702+ %merge = phi i32 [ %l.a , %loop.then ], [ %l.b , %loop.header ]
1703+ %gep.c = getelementptr inbounds i32 , ptr %c , i64 %iv
1704+ store i32 %merge , ptr %gep.c , align 4
1705+ %iv.next = add nuw nsw i64 %iv , 1
1706+ %ec = icmp eq i64 %iv.next , 1000
1707+ br i1 %ec , label %exit , label %loop.header
1708+
1709+ exit:
1710+ ret void
1711+ }
15221712;.
15231713; CHECK: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]], [[META2:![0-9]+]]}
15241714; CHECK: [[META1]] = !{!"llvm.loop.isvectorized", i32 1}
@@ -1540,4 +1730,6 @@ declare void @may_free()
15401730; CHECK: [[LOOP17]] = distinct !{[[LOOP17]], [[META1]], [[META2]]}
15411731; CHECK: [[LOOP18]] = distinct !{[[LOOP18]], [[META1]], [[META2]]}
15421732; CHECK: [[LOOP19]] = distinct !{[[LOOP19]], [[META1]], [[META2]]}
1733+ ; CHECK: [[LOOP20]] = distinct !{[[LOOP20]], [[META1]], [[META2]]}
1734+ ; CHECK: [[LOOP21]] = distinct !{[[LOOP21]], [[META1]], [[META2]]}
15431735;.
0 commit comments