Skip to content

Commit fad3960

Browse files
committed
add log
1 parent d70d9f0 commit fad3960

File tree

2 files changed: 3 additions and 3 deletions

2 files changed

+3
-3
lines changed

ggml/src/ggml-cuda/fattn.cu

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -7,11 +7,9 @@
77
#include "fattn-vec-f32.cuh"
88
#include "fattn-wmma-f16.cuh"
99
#include "fattn.cuh"
10-
#include "ggml-impl.h"
1110

1211
template <int D, int ncols2>
1312
static void ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1(ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
14-
GGML_LOG_INFO("ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1: D=%d, ncols2=%d", D, ncols2);
1513
const ggml_tensor * Q = dst->src[0];
1614

1715
if (Q->ne[1] <= 8/ncols2) {
@@ -34,7 +32,6 @@ static void ggml_cuda_flash_attn_ext_mma_f16_switch_ncols1(ggml_backend_cuda_con
3432

3533
template <int ncols2>
3634
static void ggml_cuda_flash_attn_ext_mma_f16_switch_hs(ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
37-
GGML_LOG_INFO("ggml_cuda_flash_attn_ext_mma_f16_switch_hs: ncols2=%d", ncols2);
3835
const ggml_tensor * Q = dst->src[0];
3936

4037
switch (Q->ne[0]) {

ggml/src/ggml-cuda/pad.cu

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,7 @@ static void pad_f32_cuda(const float * x, float * dst,
5757
dim3 gridDim(num_blocks, ne1, ne2*ne3);
5858
pad_f32<<<gridDim, CUDA_PAD_BLOCK_SIZE, 0, stream>>>(x, dst, ne0, ne00, ne01, ne02, ne03);
5959
}
60+
#include "ggml-impl.h"
6061

6162
static void pad_f16_cuda(const half * x, half * dst,
6263
const int ne00, const int ne01, const int ne02, const int ne03,
@@ -73,6 +74,8 @@ void ggml_cuda_op_pad(ggml_backend_cuda_context & ctx, ggml_tensor * dst) {
7374
GGML_ASSERT(src0->type == GGML_TYPE_F32 || src0->type == GGML_TYPE_F16);
7475
GGML_ASSERT(dst->type == src0->type);
7576
GGML_ASSERT(src0->ne[3] == 1 && dst->ne[3] == 1); // just 3D tensors
77+
GGML_LOG_INFO("ggml_cuda_op_pad: type=%d, ne0=%d, ne1=%d, ne2=%d, ne3=%d, ne0=%d, ne1=%d, ne2=%d, ne3=%d\n",
78+
src0->type, src0->ne[0], src0->ne[1], src0->ne[2], src0->ne[3], dst->ne[0], dst->ne[1], dst->ne[2], dst->ne[3]);
7679

7780
if (src0->type == GGML_TYPE_F32) {
7881
const float * src0_d = (const float *)src0->data;

0 commit comments

Comments (0)