Skip to content

Commit 956be69

Browse files
committed
optimized getrf_single.c for POWER8
1 parent 6a2bde7 commit 956be69

File tree

1 file changed

+7
-0
lines changed

1 file changed

+7
-0
lines changed

lapack/getrf/getrf_single.c

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -77,10 +77,17 @@ blasint CNAME(blas_arg_t *args, BLASLONG *range_m, BLASLONG *range_n, FLOAT *sa,
77 77
blocking = (mn / 2 + GEMM_UNROLL_N - 1) & ~(GEMM_UNROLL_N - 1);
78 78
if (blocking > GEMM_Q) blocking = GEMM_Q;
79 79

80+
#ifdef POWER8
81+
if (blocking <= GEMM_UNROLL_N) {
82+
info = GETF2(args, NULL, range_n, sa, sb, 0);
83+
return info;
84+
}
85+
#else
80 86
if (blocking <= GEMM_UNROLL_N * 2) {
81 87
info = GETF2(args, NULL, range_n, sa, sb, 0);
82 88
return info;
83 89
}
90+
#endif
84 91

85 92
sbb = (FLOAT *)((((BLASULONG)(sb + blocking * blocking * COMPSIZE) + GEMM_ALIGN) & ~GEMM_ALIGN) + GEMM_OFFSET_B);
86 93

0 commit comments

Comments
 (0)