Skip to content

Commit 76d3e84

Browse files
shawngu-quic and lhez
authored and committed
Keep GGML_OPENCL_SOA_Q default
1 parent 29b73d4 commit 76d3e84

File tree

2 files changed

+3
-10
lines changed

2 files changed

+3
-10
lines changed

ggml/src/ggml-opencl/CMakeLists.txt

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -13,9 +13,8 @@ if (GGML_OPENCL_PROFILING)
1313
message(STATUS "OpenCL profiling enabled (increases CPU overhead)")
1414
add_compile_definitions(GGML_OPENCL_PROFILING)
1515
endif ()
16-
if (GGML_OPENCL_SOA_Q)
17-
add_compile_definitions(GGML_OPENCL_SOA_Q)
18-
endif()
16+
17+
add_compile_definitions(GGML_OPENCL_SOA_Q)
1918

2019
add_compile_definitions(GGML_OPENCL_TARGET_VERSION=${GGML_OPENCL_TARGET_VERSION})
2120

ggml/src/ggml-opencl/ggml-opencl.cpp

Lines changed: 1 addition & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -3477,7 +3477,6 @@ static void ggml_backend_opencl_buffer_set_tensor(ggml_backend_buffer_t buffer,
34773477
cl_image_format img_format_q = {CL_RG, CL_UNSIGNED_INT32};
34783478
cl_image_desc img_desc_q = {CL_MEM_OBJECT_IMAGE1D_BUFFER, static_cast<size_t>(tensor->ne[0] * tensor->ne[1] * tensor->ne[2] / 32 * 2), 0,0,0,0,0,0,0, extra->q};
34793479
extra->q_img = clCreateImage(context, CL_MEM_READ_ONLY, &img_format_q, &img_desc_q, NULL, &err);
3480-
CL_CHECK(clReleaseMemObject(extra->q));
34813480

34823481
tensor->extra = extra;
34833482

@@ -7172,14 +7171,9 @@ static void ggml_cl_mul_mat_id(ggml_backend_t backend, const ggml_tensor * src0,
71727171
} else {
71737172
GGML_ASSERT(false && "TODO: Unknown GPU");
71747173
}
7175-
7176-
#ifdef GGML_OPENCL_SOA_Q
7174+
71777175
CL_CHECK(clSetKernelArg(kernel, 0, sizeof(cl_mem), &extra0_q4_0->q));
71787176
CL_CHECK(clSetKernelArg(kernel, 1, sizeof(cl_mem), &extra0_q4_0->d));
7179-
#else
7180-
CL_CHECK(clSetKernelArg(kernel, 0, sizeof(cl_mem), &extra0->data_device));
7181-
CL_CHECK(clSetKernelArg(kernel, 1, sizeof(cl_ulong), &offset0));
7182-
#endif
71837177
CL_CHECK(clSetKernelArg(kernel, 2, sizeof(cl_mem), &extra1->data_device));
71847178
CL_CHECK(clSetKernelArg(kernel, 3, sizeof(cl_ulong), &offset1));
71857179
CL_CHECK(clSetKernelArg(kernel, 4, sizeof(cl_mem), &extra2->data_device));

0 commit comments

Comments
 (0)