We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3b7e1a2, commit b44d392 (Copy full SHA for b44d392)
xllm/core/layers/npu/npu_qwen3_moe_decoder_layer_impl.cpp
@@ -557,7 +557,9 @@ void NpuQwen3MoeDecoderLayerImpl::process_general_weights(
557
558
if (index == IN_QKV_WEIGHT_1 || index == IN_QKV_WEIGHT_2 ||
559
index == IN_QKV_BIAS_1 || index == IN_QKV_BIAS_2 ||
560
- index == IN_QKV_DESCALE_1 || index == IN_QKV_DESCALE_2) {
+ index == IN_QKV_DESCALE_1 || index == IN_QKV_DESCALE_2 ||
561
+ index == IN_QKV_OFFSET_1 || index == IN_QKV_OFFSET_2 ||
562
+ index == IN_QKV_SCALE_1 || index == IN_QKV_SCALE_2) {
563
if (n_kv_heads_ < dp_local_tp_size_) {
564
int32_t repeat_times = (dp_local_tp_size_ / n_kv_heads_);
565
0 commit comments