Skip to content

Commit f7397fe

Browse files
shehzan10 authored and pavanky committed
Add cl_khr_fp64 when using double precision
1 parent 596925c commit f7397fe

7 files changed

+13
-0
lines changed

src/library/blas/AutoGemm/KernelOpenCL.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,13 @@ def makeOpenCLKernelString(kernel):
2525
kStr += "/* %s */" % kernel.getName()
2626
kStr += endLine
2727

28+
####################################
29+
# Double precision pragma
30+
prec = kernel.getName()[0].lower()
31+
if prec == "d" or prec == "z":
32+
kStr += endLine
33+
kStr += "#pragma OPENCL EXTENSION cl_khr_fp64 : enable" + endLine
34+
2835
####################################
2936
# kernel parameters
3037
kStr += endLine

src/library/blas/AutoGemm/UserGemmKernelSources/dgemm_Col_NN_B0_MX048_NX048_KX08_src.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@ const unsigned int dgemm_Col_NN_B0_MX048_NX048_KX08_microTileNumCols = 6;
1818
const unsigned int dgemm_Col_NN_B0_MX048_NX048_KX08_unroll = 8;
1919

2020
const char * const dgemm_Col_NN_B0_MX048_NX048_KX08_src = STRINGIFY(
21+
#pragma OPENCL EXTENSION cl_khr_fp64 : enable \n
2122

2223
#define M6x6 \
2324
rA[0] = lA[offA + 0];\

src/library/blas/AutoGemm/UserGemmKernelSources/dgemm_Col_NN_B1_MX048_NX048_KX08_src.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@ const unsigned int dgemm_Col_NN_B1_MX048_NX048_KX08_microTileNumCols = 6;
1818
const unsigned int dgemm_Col_NN_B1_MX048_NX048_KX08_unroll = 8;
1919

2020
const char * const dgemm_Col_NN_B1_MX048_NX048_KX08_src = STRINGIFY(
21+
#pragma OPENCL EXTENSION cl_khr_fp64 : enable \n
2122

2223
#define M6x6 \
2324
rA[0] = lA[offA + 0]; \

src/library/blas/AutoGemm/UserGemmKernelSources/dgemm_Col_NT_B0_MX048_NX048_KX08_src.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@ const unsigned int dgemm_Col_NT_B0_MX048_NX048_KX08_microTileNumCols = 6;
1818
const unsigned int dgemm_Col_NT_B0_MX048_NX048_KX08_unroll = 8;
1919

2020
const char * const dgemm_Col_NT_B0_MX048_NX048_KX08_src = STRINGIFY(
21+
#pragma OPENCL EXTENSION cl_khr_fp64 : enable \n
2122
\n
2223
\ntypedef union _GPtr {
2324
\n __global float *f;

src/library/blas/AutoGemm/UserGemmKernelSources/dgemm_Col_NT_B1_MX048_NX048_KX08_src.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@ const unsigned int dgemm_Col_NT_B1_MX048_NX048_KX08_microTileNumCols = 6;
1818
const unsigned int dgemm_Col_NT_B1_MX048_NX048_KX08_unroll = 8;
1919

2020
const char * const dgemm_Col_NT_B1_MX048_NX048_KX08_src = STRINGIFY(
21+
#pragma OPENCL EXTENSION cl_khr_fp64 : enable \n
2122
\n
2223
\ntypedef union _GPtr {
2324
\n __global float *f;

src/library/blas/AutoGemm/UserGemmKernelSources/dgemm_Col_TN_B0_MX048_NX048_KX08_src.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@ const unsigned int dgemm_Col_TN_B0_MX048_NX048_KX08_microTileNumCols = 6;
1818
const unsigned int dgemm_Col_TN_B0_MX048_NX048_KX08_unroll = 8;
1919

2020
const char * const dgemm_Col_TN_B0_MX048_NX048_KX08_src = STRINGIFY(
21+
#pragma OPENCL EXTENSION cl_khr_fp64 : enable \n
2122

2223
__attribute__( (reqd_work_group_size(8, 8, 1)) )
2324
__kernel void dgemm_Col_TN_B0_MX048_NX048_KX08_src (

src/library/blas/AutoGemm/UserGemmKernelSources/dgemm_Col_TN_B1_MX048_NX048_KX08_src.cpp

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,6 +18,7 @@ const unsigned int dgemm_Col_TN_B1_MX048_NX048_KX08_microTileNumCols = 6;
1818
const unsigned int dgemm_Col_TN_B1_MX048_NX048_KX08_unroll = 8;
1919

2020
const char * const dgemm_Col_TN_B1_MX048_NX048_KX08_src = STRINGIFY(
21+
#pragma OPENCL EXTENSION cl_khr_fp64 : enable \n
2122

2223
__attribute__( (reqd_work_group_size(8, 8, 1)) )
2324
__kernel void dgemm_Col_TN_B1_MX048_NX048_KX08_src (

0 commit comments

Comments
 (0)