|
| 1 | +; REQUIRES: asserts |
| 2 | +; RUN: opt -passes=loop-vectorize -mtriple riscv64 -mattr=+v -vectorizer-maximize-bandwidth -debug-only=loop-vectorize,vplan -disable-output -S < %s 2>&1 | FileCheck %s --check-prefixes=CHECK-REGS-VP |
| 3 | + |
| 4 | +define i32 @dotp(ptr %a, ptr %b) { |
| 5 | +; CHECK-REGS-VP: LV(REG): VF = vscale x 16 |
| 6 | +; CHECK-REGS-VP-NEXT: LV(REG): Found max usage: 2 item |
| 7 | +; CHECK-REGS-VP-NEXT: LV(REG): RegisterClass: RISCV::GPRRC, 6 registers |
| 8 | +; CHECK-REGS-VP-NEXT: LV(REG): RegisterClass: RISCV::VRRC, 24 registers |
| 9 | +; CHECK-REGS-VP-NEXT: LV(REG): Found invariant usage: 1 item |
| 10 | +; CHECK-REGS-VP-NEXT: LV(REG): RegisterClass: RISCV::GPRRC, 1 registers |
| 11 | +; CHECK-REGS-VP: LV: Selecting VF: vscale x 16. |
| 12 | +entry: |
| 13 | + br label %for.body |
| 14 | + |
| 15 | +for.body: ; preds = %for.body, %entry |
| 16 | + %iv = phi i64 [ 0, %entry ], [ %iv.next, %for.body ] |
| 17 | + %accum = phi i32 [ 0, %entry ], [ %add, %for.body ] |
| 18 | + %gep.a = getelementptr i8, ptr %a, i64 %iv |
| 19 | + %load.a = load i8, ptr %gep.a, align 1 |
| 20 | + %ext.a = zext i8 %load.a to i32 |
| 21 | + %gep.b = getelementptr i8, ptr %b, i64 %iv |
| 22 | + %load.b = load i8, ptr %gep.b, align 1 |
| 23 | + %ext.b = zext i8 %load.b to i32 |
| 24 | + %mul = mul i32 %ext.b, %ext.a |
| 25 | + %sub = sub i32 0, %mul |
| 26 | + %add = add i32 %accum, %sub |
| 27 | + %iv.next = add i64 %iv, 1 |
| 28 | + %exitcond.not = icmp eq i64 %iv.next, 1024 |
| 29 | + br i1 %exitcond.not, label %for.exit, label %for.body |
| 30 | + |
| 31 | +for.exit: ; preds = %for.body |
| 32 | + ret i32 %add |
| 33 | +} |
0 commit comments