We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7e5d0ee, commit 5d10e3a (Copy full SHA for 5d10e3a)
src/llama-hparams.h
@@ -6,7 +6,7 @@
6
7
// bump if necessary
8
#define LLAMA_MAX_LAYERS 512
9
-#define LLAMA_MAX_EXPERTS 256 // DeepSeekV3
+#define LLAMA_MAX_EXPERTS 384 // Kimi-K2
10
11
enum llama_expert_gating_func_type {
12
LLAMA_EXPERT_GATING_FUNC_TYPE_NONE = 0,
0 commit comments