@@ -42,78 +42,60 @@ def __init__(self, subtest):
4242 elif subtest == 'zgemm' :
4343 self .perf_patterns = {
4444 'magma' : sn .extractsingle (r'MAGMA GFlops: (?P<magma_gflops>\S+)' ,
45- self .stdout , 'magma_gflops' , float ),
45+ self .stdout , 'magma_gflops' , float , 2 ),
4646 'cublas' : sn .extractsingle (
4747 r'cuBLAS GFlops: (?P<cublas_gflops>\S+)' , self .stdout ,
48- 'cublas_gflops' , float ),
49- 'cpu' : sn .extractsingle (r'CPU GFlops: (?P<cpu_gflops>\S+)' ,
50- self .stdout , 'cpu_gflops' , float )
48+ 'cublas_gflops' , float , 2 )
5149 }
5250 self .reference = {
5351 'daint:gpu' : {
54- 'magma' : (3344 , - 0.05 , None , 'Gflop/s' ),
55- 'cublas' : (3709 , - 0.05 , None , 'Gflop/s' ),
56- 'cpu' : (42.8 , - 0.27 , None , 'Gflop/s' ),
52+ 'magma' : (3749 , - 0.05 , None , 'Gflop/s' ),
53+ 'cublas' : (4050 , - 0.05 , None , 'Gflop/s' ),
5754 },
5855 'dom:gpu' : {
59- 'magma' : (3344 , - 0.05 , None , 'Gflop/s' ),
60- 'cublas' : (3709 , - 0.05 , None , 'Gflop/s' ),
61- 'cpu' : (42.8 , - 0.27 , None , 'Gflop/s' ),
56+ 'magma' : (3749 , - 0.05 , None , 'Gflop/s' ),
57+ 'cublas' : (4050 , - 0.05 , None , 'Gflop/s' ),
6258 },
6359 }
6460 elif subtest == 'zsymmetrize' :
6561 self .perf_patterns = {
66- 'cpu_perf' : sn .extractsingle (r'CPU performance: (\S+)' ,
67- self .stdout , 1 , float ),
6862 'gpu_perf' : sn .extractsingle (r'GPU performance: (\S+)' ,
6963 self .stdout , 1 , float ),
7064 }
7165 self .reference = {
7266 'daint:gpu' : {
73- 'cpu_perf' : (0.91 , - 0.05 , None , 'GB/s' ),
7467 'gpu_perf' : (158.3 , - 0.05 , None , 'GB/s' ),
7568 },
7669 'dom:gpu' : {
77- 'cpu_perf' : (0.91 , - 0.05 , None , 'GB/s' ),
7870 'gpu_perf' : (158.3 , - 0.05 , None , 'GB/s' ),
7971 },
8072 }
8173 elif subtest == 'ztranspose' :
8274 self .perf_patterns = {
83- 'cpu_perf' :
84- sn .extractsingle (r'CPU performance: (?P<cpu_performance>\S+)' ,
85- self .stdout , 'cpu_performance' , float ),
8675 'gpu_perf' :
8776 sn .extractsingle (r'GPU performance: (?P<gpu_performance>\S+)' ,
8877 self .stdout , 'gpu_performance' , float )
8978 }
9079 self .reference = {
9180 'daint:gpu' : {
92- 'cpu_perf' : (1.51 , - 0.05 , None , 'GB/s' ),
9381 'gpu_perf' : (498.2 , - 0.05 , None , 'GB/s' ),
9482 },
9583 'dom:gpu' : {
96- 'cpu_perf' : (1.51 , - 0.05 , None , 'GB/s' ),
9784 'gpu_perf' : (498.2 , - 0.05 , None , 'GB/s' ),
9885 },
9986 }
10087 elif subtest == 'zunmbr' :
10188 # This test fails to compile with Magma 2.4
10289 self .perf_patterns = {
103- 'cpu_perf' :
104- sn .extractsingle (r'CPU performance: (?P<cpu_performance>\S+)' ,
105- self .stdout , 'cpu_performance' , float ),
10690 'gpu_perf' :
10791 sn .extractsingle (r'GPU performance: (?P<gpu_performance>\S+)' ,
10892 self .stdout , 'gpu_performance' , float )
10993 }
11094 self .reference = {
11195 'daint:gpu' : {
112- 'cpu_perf' : (36.6 , - 0.05 , None , 'Gflop/s' ),
11396 'gpu_perf' : (254.7 , - 0.05 , None , 'Gflop/s' ),
11497 },
11598 'dom:gpu' : {
116- 'cpu_perf' : (36.6 , - 0.05 , None , 'Gflop/s' ),
11799 'gpu_perf' : (254.7 , - 0.05 , None , 'Gflop/s' ),
118100 },
119101 }
0 commit comments