Skip to content

Commit acc6889

Browse files
committed
added numQueues to performance data
1 parent f6ae9ac commit acc6889

File tree

5 files changed

+10
-12
lines changed

5 files changed

+10
-12
lines changed

doc/performance/clBLAS_2.7.1/S9150/cgemmNT_S9150_14.50.2_2.7.1_8.csv

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,label,GFLOPS
1+
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,numQueues,label,GFLOPS
22
8,8,8,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,cgemm,gpu,clblas,4,S9150_14.50.2,0.361199
33
16,16,16,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,cgemm,gpu,clblas,4,S9150_14.50.2,2.2276
44
24,24,24,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,cgemm,gpu,clblas,4,S9150_14.50.2,2.32776

doc/performance/clBLAS_2.7.1/S9150/dgemmNT_S9150_14.50.2_2.7.1_8.csv

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,label,GFLOPS
1+
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,numQueues,label,GFLOPS
22
8,8,8,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,dgemm,gpu,clblas,4,S9150_14.50.2,0.0782277
33
16,16,16,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,dgemm,gpu,clblas,4,S9150_14.50.2,0.5681
44
24,24,24,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,dgemm,gpu,clblas,4,S9150_14.50.2,0.516013

doc/performance/clBLAS_2.7.1/S9150/sgemmNT_S9150_14.50.2_2.7.1_8.csv

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,label,GFLOPS
1+
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,numQueues,label,GFLOPS
22
8,8,8,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,sgemm,gpu,clblas,4,S9150_14.50.2,0.0752941
33
16,16,16,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,sgemm,gpu,clblas,4,S9150_14.50.2,0.630639
44
24,24,24,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,sgemm,gpu,clblas,4,S9150_14.50.2,0.645378

doc/performance/clBLAS_2.7.1/S9150/zgemmNT_S9150_14.50.2_2.7.1_8.csv

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,label,GFLOPS
1+
m,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,numQueues,label,GFLOPS
22
8,8,8,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,zgemm,gpu,clblas,4,S9150_14.50.2,0.286634
33
16,16,16,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,zgemm,gpu,clblas,4,S9150_14.50.2,2.31086
44
24,24,24,0,0,0,0,0,0,1.0,1.0,column,none,transpose,left,upper,unit,zgemm,gpu,clblas,4,S9150_14.50.2,2.20435

src/scripts/perf/blasPerformanceTesting.py

Lines changed: 6 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -1,12 +1,12 @@
11
# ########################################################################
22
# Copyright 2013 Advanced Micro Devices, Inc.
3-
#
3+
#
44
# Licensed under the Apache License, Version 2.0 (the "License");
55
# you may not use this file except in compliance with the License.
66
# You may obtain a copy of the License at
7-
#
7+
#
88
# http://www.apache.org/licenses/LICENSE-2.0
9-
#
9+
#
1010
# Unless required by applicable law or agreed to in writing, software
1111
# distributed under the License is distributed on an "AS IS" BASIS,
1212
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
@@ -23,8 +23,6 @@
2323

2424
# Common data and functions for the performance suite
2525

26-
tableHeader = 'lengthx,lengthy,lengthz,batch,device,inlay,outlay,place,ldsComp,ldsFrac,cache,xfactor,label,GFLOPS'
27-
2826
class TestCombination:
2927
def __init__(self,
3028
lengthx, lengthy, lengthz, batchsize,
@@ -115,7 +113,7 @@ def executable(library):
115113

116114
def max_mem_available_in_bytes(exe, device):
117115
arguments = [exe, '-i', device]
118-
116+
119117
deviceInfo = subprocess.check_output(arguments, stderr=subprocess.STDOUT).split(os.linesep)
120118
deviceInfo = itertools.ifilter( lambda x: x.count('MAX_MEM_ALLOC_SIZE'), deviceInfo)
121119
deviceInfo = list(itertools.islice(deviceInfo, None))
@@ -250,7 +248,7 @@ def decode_parameter_problemsize(problemsize):
250248
return problemsize
251249

252250
def blas_table_header():
253-
return 'm,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,label,GFLOPS'
251+
return 'm,n,k,lda,ldb,ldc,offa,offb,offc,alpha,beta,order,transa,transb,side,uplo,diag,function,device,library,numQueues,label,GFLOPS'
254252

255253
class BlasTestCombination:
256254
def __init__(self,
@@ -329,5 +327,5 @@ def open_file( filename ):
329327
filename = filename + datetime.now().isoformat().replace(':','.')
330328
message = 'A file with the name ' + oldname + ' already exists. Changing filename to ' + filename
331329
print message
332-
330+
333331
return open(filename, 'w')

0 commit comments

Comments
 (0)