Skip to content

Commit b4cc4be

Browse files
authored
Merge pull request #5410 from martin-frbg/issue5404
Adjust multithreading threshold in S/DGER and add an intermediate step
2 parents 0968ddd + 30d11bc commit b4cc4be

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

interface/ger.c

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -180,8 +180,10 @@ void CNAME(enum CBLAS_ORDER order,
180 180
181 181   #ifdef SMPTEST
182 182     // Threshold chosen so that speed-up is > 1 on a Xeon E5-2630
183     -   if(1L * m * n > 2048L * GEMM_MULTITHREAD_THRESHOLD)
    183 +   if(1L * m * n > 20480L * GEMM_MULTITHREAD_THRESHOLD)
184 184       nthreads = num_cpu_avail(2);
    185 +   else if(1L * m * n > 2048L * GEMM_MULTITHREAD_THRESHOLD)
    186 +     nthreads = MIN(3,num_cpu_avail(2));
185 187     else
186 188       nthreads = 1;
187 189

0 commit comments

Comments
 (0)