We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ccbe419, commit 97b117c (Copy full SHA for 97b117c)
src/llama-hparams.h
@@ -6,7 +6,7 @@
6
7
// bump if necessary
8
#define LLAMA_MAX_LAYERS 512
9
-#define LLAMA_MAX_EXPERTS 256 // DeepSeekV3
+#define LLAMA_MAX_EXPERTS 384 // DeepSeekV3=256 Kimi-K2=384
10
11
enum llama_expert_gating_func_type {
12
LLAMA_EXPERT_GATING_FUNC_TYPE_NONE = 0,
0 commit comments