Skip to content

Commit d42bc91

Browse files
committed
Iterate on the MUL_MAT_ID kernel (not yet tested at inference time)
1 parent 600cba7 commit d42bc91

File tree

8 files changed

+1096
-36
lines changed

8 files changed

+1096
-36
lines changed

.devcontainer/tasks.json

Lines changed: 5 additions & 36 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,10 @@
88
"args": [
99
"-B", "build",
1010
"-DCMAKE_BUILD_TYPE=Debug",
11-
"-DCMAKE_EXPORT_COMPILE_COMMANDS=ON"
11+
"-DCMAKE_EXPORT_COMPILE_COMMANDS=ON",
12+
"-DGGML_NUMA_MIRROR=ON",
13+
"-DGGML_OPENMP=ON",
14+
"-DCMAKE_C_FLAGS:STRING=-march=native"
1215
],
1316
"group": "build",
1417
"presentation": {
@@ -28,7 +31,7 @@
2831
"command": "bash",
2932
"args": [
3033
"-c",
31-
"cmake -B build -DCMAKE_BUILD_TYPE=Debug -DCMAKE_EXPORT_COMPILE_COMMANDS=ON -DGGML_NUMA_MIRROR=ON -DGGML_AVX512=ON -DGGML_AVX512_VNNI=ON -DGGML_AVX512_VBMI=ON -DGGML_AVX512_BF16=ON && cmake --build build --parallel"
34+
"cmake -B build -DCMAKE_BUILD_TYPE=Debug -DCMAKE_EXPORT_COMPILE_COMMANDS=ON -DGGML_NUMA_MIRROR=ON -DCMAKE_C_FLAGS:STRING=-march=native && cmake --build build --parallel"
3235
],
3336
"group": {
3437
"kind": "build",
@@ -83,40 +86,6 @@
8386
"$gcc"
8487
],
8588
"detail": "Build release version with NUMA support"
86-
},
87-
{
88-
"label": "test-cpu-topology",
89-
"type": "shell",
90-
"command": "./build/bin/llama-server",
91-
"args": [
92-
"--cpu-topology"
93-
],
94-
"group": "test",
95-
"presentation": {
96-
"echo": true,
97-
"reveal": "always",
98-
"focus": false,
99-
"panel": "shared"
100-
},
101-
"dependsOn": "cmake-build",
102-
"detail": "Test consolidated CPU/GPU/NUMA topology and threading plan"
103-
},
104-
{
105-
"label": "check-numa",
106-
"type": "shell",
107-
"command": "bash",
108-
"args": [
109-
"-c",
110-
"echo '=== NUMA Hardware ===' && numactl --hardware && echo -e '\\n=== CPU Info ===' && lscpu && echo -e '\\n=== Topology ===' && hwloc-info"
111-
],
112-
"group": "test",
113-
"presentation": {
114-
"echo": true,
115-
"reveal": "always",
116-
"focus": false,
117-
"panel": "shared"
118-
},
119-
"detail": "Check NUMA and CPU topology information"
12089
}
12190
]
12291
}

ggml/src/ggml-cpu/CMakeLists.txt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,8 @@ function(ggml_add_cpu_backend_variant_impl tag_name)
5757
ggml-cpu/numa-kernels/sub.h
5858
ggml-cpu/numa-kernels/mul_mat.c
5959
ggml-cpu/numa-kernels/mul_mat.h
60+
ggml-cpu/numa-kernels/mul_mat_id.c
61+
ggml-cpu/numa-kernels/mul_mat_id.h
6062
ggml-cpu/numa-kernels/rope.c
6163
ggml-cpu/numa-kernels/rope.h
6264
ggml-cpu/numa-kernels/noop.c

0 commit comments

Comments
 (0)