Skip to content

Commit 9ebe748

Browse files
committed
shorter patch; new performance data for zgemm
1 parent f02baa1 commit 9ebe748

File tree

2 files changed

+5
-14
lines changed

2 files changed

+5
-14
lines changed

cscs-checks/libraries/magma/magma_checks.py

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -40,6 +40,7 @@ def __init__(self, subtest):
4040
},
4141
}
4242
elif subtest == 'zgemm':
43+
self.executable_opts = ['--range 1088:3136:1024']
4344
self.perf_patterns = {
4445
'magma': sn.extractsingle(
4546
r'MAGMA GFlops: (?P<magma_gflops>\S+)',
@@ -51,12 +52,12 @@ def __init__(self, subtest):
5152
}
5253
self.reference = {
5354
'daint:gpu': {
54-
'magma': (3749, -0.05, None, 'Gflop/s'),
55-
'cublas': (4050, -0.05, None, 'Gflop/s'),
55+
'magma': (3692.65, -0.05, None, 'Gflop/s'),
56+
'cublas': (4269.31, -0.0847, None, 'Gflop/s'),
5657
},
5758
'dom:gpu': {
58-
'magma': (3749, -0.05, None, 'Gflop/s'),
59-
'cublas': (4050, -0.05, None, 'Gflop/s'),
59+
'magma': (3692.65, -0.05, None, 'Gflop/s'),
60+
'cublas': (4269.31, -0.0847, None, 'Gflop/s'),
6061
},
6162
}
6263
elif subtest == 'zsymmetrize':

cscs-checks/libraries/magma/src/patch.txt

Lines changed: 0 additions & 10 deletions
Original file line number | Diff line number | Diff line change
@@ -67,16 +67,6 @@ diff -Naur src/testing_zgemm.cpp src_patched/testing_zgemm.cpp
6767

6868
// Allow 3*eps; complex needs 2*sqrt(2) factor; see Higham, 2002, sec. 3.6.
6969
double eps = lapackf77_dlamch("E");
70-
@@ -87,7 +88,8 @@
71-
g_platform_str, g_platform_str );
72-
#endif
73-
printf("%%========================================================================================================\n");
74-
- for( int itest = 0; itest < opts.ntest; ++itest ) {
75-
+//ajajajaj for( int itest = 0; itest < opts.ntest; ++itest ) {
76-
+ for( int itest = 0; itest < 3; itest++ ) {
77-
for( int iter = 0; iter < opts.niter; ++iter ) {
78-
M = opts.msize[itest];
79-
N = opts.nsize[itest];
8070
@@ -220,6 +222,9 @@
8171
cpu_perf, 1000.*cpu_time,
8272
magma_error, dev_error,

0 commit comments

Comments
 (0)