@@ -467,83 +467,3 @@ loop:
467467exit:
468468 ret i32 %red.next
469469}
470-
471- define i64 @partial_reduction_mul_two_users (i64 %n , ptr %a , i16 %b , i32 %c ) {
472- ; CHECK-LABEL: define i64 @partial_reduction_mul_two_users(
473- ; CHECK-SAME: i64 [[N:%.*]], ptr [[A:%.*]], i16 [[B:%.*]], i32 [[C:%.*]]) #[[ATTR0]] {
474- ; CHECK-NEXT: [[ENTRY:.*]]:
475- ; CHECK-NEXT: [[TMP0:%.*]] = add i64 [[N]], 1
476- ; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[TMP0]], 8
477- ; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
478- ; CHECK: [[VECTOR_PH]]:
479- ; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i64 [[TMP0]], 8
480- ; CHECK-NEXT: [[N_VEC:%.*]] = sub i64 [[TMP0]], [[N_MOD_VF]]
481- ; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <8 x i16> poison, i16 [[B]], i64 0
482- ; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <8 x i16> [[BROADCAST_SPLATINSERT]], <8 x i16> poison, <8 x i32> zeroinitializer
483- ; CHECK-NEXT: [[TMP1:%.*]] = sext <8 x i16> [[BROADCAST_SPLAT]] to <8 x i32>
484- ; CHECK-NEXT: [[TMP2:%.*]] = mul <8 x i32> [[TMP1]], [[TMP1]]
485- ; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
486- ; CHECK: [[VECTOR_BODY]]:
487- ; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
488- ; CHECK-NEXT: [[VEC_PHI:%.*]] = phi <4 x i64> [ zeroinitializer, %[[VECTOR_PH]] ], [ [[PARTIAL_REDUCE:%.*]], %[[VECTOR_BODY]] ]
489- ; CHECK-NEXT: [[TMP4:%.*]] = load i16, ptr [[A]], align 2
490- ; CHECK-NEXT: [[BROADCAST_SPLATINSERT1:%.*]] = insertelement <8 x i16> poison, i16 [[TMP4]], i64 0
491- ; CHECK-NEXT: [[BROADCAST_SPLAT2:%.*]] = shufflevector <8 x i16> [[BROADCAST_SPLATINSERT1]], <8 x i16> poison, <8 x i32> zeroinitializer
492- ; CHECK-NEXT: [[TMP3:%.*]] = zext <8 x i32> [[TMP2]] to <8 x i64>
493- ; CHECK-NEXT: [[PARTIAL_REDUCE]] = call <4 x i64> @llvm.vector.partial.reduce.add.v4i64.v8i64(<4 x i64> [[VEC_PHI]], <8 x i64> [[TMP3]])
494- ; CHECK-NEXT: [[TMP5:%.*]] = sext <8 x i16> [[BROADCAST_SPLAT2]] to <8 x i32>
495- ; CHECK-NEXT: [[TMP6:%.*]] = sext <8 x i32> [[TMP5]] to <8 x i64>
496- ; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i64 [[INDEX]], 8
497- ; CHECK-NEXT: [[TMP7:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]]
498- ; CHECK-NEXT: br i1 [[TMP7]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP18:![0-9]+]]
499- ; CHECK: [[MIDDLE_BLOCK]]:
500- ; CHECK-NEXT: [[TMP8:%.*]] = call i64 @llvm.vector.reduce.add.v4i64(<4 x i64> [[PARTIAL_REDUCE]])
501- ; CHECK-NEXT: [[VECTOR_RECUR_EXTRACT:%.*]] = extractelement <8 x i64> [[TMP6]], i32 7
502- ; CHECK-NEXT: [[CMP_N:%.*]] = icmp eq i64 [[TMP0]], [[N_VEC]]
503- ; CHECK-NEXT: br i1 [[CMP_N]], label %[[EXIT:.*]], label %[[SCALAR_PH]]
504- ; CHECK: [[SCALAR_PH]]:
505- ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ]
506- ; CHECK-NEXT: [[SCALAR_RECUR_INIT:%.*]] = phi i64 [ [[VECTOR_RECUR_EXTRACT]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ]
507- ; CHECK-NEXT: [[BC_MERGE_RDX:%.*]] = phi i64 [ [[TMP8]], %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ]
508- ; CHECK-NEXT: br label %[[LOOP:.*]]
509- ; CHECK: [[LOOP]]:
510- ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ [[BC_RESUME_VAL]], %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
511- ; CHECK-NEXT: [[RES1:%.*]] = phi i64 [ [[SCALAR_RECUR_INIT]], %[[SCALAR_PH]] ], [ [[LOAD_EXT_EXT:%.*]], %[[LOOP]] ]
512- ; CHECK-NEXT: [[RES2:%.*]] = phi i64 [ [[BC_MERGE_RDX]], %[[SCALAR_PH]] ], [ [[ADD:%.*]], %[[LOOP]] ]
513- ; CHECK-NEXT: [[LOAD:%.*]] = load i16, ptr [[A]], align 2
514- ; CHECK-NEXT: [[IV_NEXT]] = add i64 [[IV]], 1
515- ; CHECK-NEXT: [[CONV:%.*]] = sext i16 [[B]] to i32
516- ; CHECK-NEXT: [[MUL:%.*]] = mul i32 [[CONV]], [[CONV]]
517- ; CHECK-NEXT: [[MUL_EXT:%.*]] = zext i32 [[MUL]] to i64
518- ; CHECK-NEXT: [[ADD]] = add i64 [[RES2]], [[MUL_EXT]]
519- ; CHECK-NEXT: [[OR:%.*]] = or i32 [[MUL]], [[C]]
520- ; CHECK-NEXT: [[LOAD_EXT:%.*]] = sext i16 [[LOAD]] to i32
521- ; CHECK-NEXT: [[LOAD_EXT_EXT]] = sext i32 [[LOAD_EXT]] to i64
522- ; CHECK-NEXT: [[EXITCOND740_NOT:%.*]] = icmp eq i64 [[IV]], [[N]]
523- ; CHECK-NEXT: br i1 [[EXITCOND740_NOT]], label %[[EXIT]], label %[[LOOP]], !llvm.loop [[LOOP19:![0-9]+]]
524- ; CHECK: [[EXIT]]:
525- ; CHECK-NEXT: [[ADD_LCSSA:%.*]] = phi i64 [ [[ADD]], %[[LOOP]] ], [ [[TMP8]], %[[MIDDLE_BLOCK]] ]
526- ; CHECK-NEXT: ret i64 [[ADD_LCSSA]]
527- ;
528- entry:
529- br label %loop
530-
531- loop:
532- %iv = phi i64 [ 0 , %entry ], [ %iv.next , %loop ]
533- %res1 = phi i64 [ 0 , %entry ], [ %load.ext.ext , %loop ]
534- %res2 = phi i64 [ 0 , %entry ], [ %add , %loop ]
535- %load = load i16 , ptr %a , align 2
536- %iv.next = add i64 %iv , 1
537- %conv = sext i16 %b to i32
538- %mul = mul i32 %conv , %conv
539- %mul.ext = zext i32 %mul to i64
540- %add = add i64 %res2 , %mul.ext
541- %second_use = or i32 %mul , %c ; this value is otherwise unused, but that's sufficient for the test
542- %load.ext = sext i16 %load to i32
543- %load.ext.ext = sext i32 %load.ext to i64
544- %exitcond740.not = icmp eq i64 %iv , %n
545- br i1 %exitcond740.not , label %exit , label %loop
546-
547- exit:
548- ret i64 %add
549- }
0 commit comments