Skip to content

Commit 20b1dc9

Browse files
authored
Merge branch 'ggml-org:master' into mradermacher
2 parents 34fe8c7 + 670e136 commit 20b1dc9

File tree

2 files changed

+6
-4
lines changed

2 files changed

+6
-4
lines changed

.devops/nix/package.nix

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -47,6 +47,7 @@ let
4747
inherit (lib)
4848
cmakeBool
4949
cmakeFeature
50+
optionalAttrs
5051
optionals
5152
strings
5253
;
@@ -197,7 +198,7 @@ effectiveStdenv.mkDerivation (finalAttrs: {
197198
];
198199

199200
# Environment variables needed for ROCm
200-
env = optionals useRocm {
201+
env = optionalAttrs useRocm {
201202
ROCM_PATH = "${rocmPackages.clr}";
202203
HIP_DEVICE_LIB_PATH = "${rocmPackages.rocm-device-libs}/amdgcn/bitcode";
203204
};

convert_hf_to_gguf.py

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -2910,11 +2910,12 @@ def set_gguf_parameters(self):
29102910
self.gguf_writer.add_expert_used_count(self.hparams["moe_k"])
29112911
self.gguf_writer.add_interleave_moe_layer_step(self.hparams["moe_layer_interval"])
29122912
self.gguf_writer.add_leading_dense_block_count(self.hparams["moe_layer_start_index"])
2913-
self.gguf_writer.add_rope_freq_base(self.hparams["rope_theta"])
29142913
if (moe_intermediate_size := self.hparams.get("moe_intermediate_size")) is not None:
29152914
self.gguf_writer.add_expert_feed_forward_length(moe_intermediate_size)
2916-
if (shared_expert_intermediate_size := self.hparams.get('intermediate_size')) is not None and (num_key_value_heads := self.hparams.get('num_key_value_heads')) is not None:
2917-
self.gguf_writer.add_expert_shared_feed_forward_length(shared_expert_intermediate_size // num_key_value_heads)
2915+
if (shared_expert_count := self.hparams.get('moe_num_shared_experts')) is not None:
2916+
self.gguf_writer.add_expert_shared_count(shared_expert_count)
2917+
if shared_expert_count > 0 and (shared_expert_intermediate_size := self.hparams.get('intermediate_size')) is not None and (num_key_value_heads := self.hparams.get('num_key_value_heads')) is not None:
2918+
self.gguf_writer.add_expert_shared_feed_forward_length(shared_expert_intermediate_size // num_key_value_heads)
29182919

29192920
def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]:
29202921
# Modify correction bias name as in DeepseekV2

0 commit comments

Comments
 (0)