Skip to content

Commit 3e3a878

Browse files
committed
Use ggml_barrier instead of ggml_barrier_numa_aware for the src1 data barrier, as this barrier only happens on a few cores
1 parent ab80f55 commit 3e3a878

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

ggml/src/ggml-cpu/ggml-cpu-aarch64.cpp

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6111,7 +6111,7 @@ template <typename BLOC_TYPE, int64_t INTER_SIZE, int64_t NB_COLS, ggml_type PAR
61116111
from_float((float *) ((char *) src1->data + i11 * nb11), (void *) (wdata + i11 * nbw1), ne10);
61126112
}
61136113

6114-
ggml_barrier_numa_aware(params->threadpool, ith, GGML_BARRIER_NODE_LAST);
6114+
ggml_barrier(params->threadpool);
61156115

61166116
const void * src1_wdata = params->wdata;
61176117
const size_t src1_col_stride = ggml_row_size(PARAM_TYPE, ne10);
@@ -6219,7 +6219,7 @@ template <typename BLOC_TYPE, int64_t INTER_SIZE, int64_t NB_COLS, ggml_type PAR
62196219
}
62206220
}
62216221

6222-
ggml_barrier_numa_aware(params->threadpool, ith, GGML_BARRIER_NODE_LAST);
6222+
ggml_barrier(params->threadpool);
62236223

62246224
// compute each matrix multiplication in sequence
62256225
for (int cur_a = 0; cur_a < n_as; ++cur_a) {

0 commit comments

Comments
 (0)