bugfix: resolve compilation issues when building without the USE_NPU_TORCH definition.

yingxudeng · yingxudeng · commit 1a5e2f0292d6 · 2025-11-06T20:23:15.000+08:00
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -298,7 +298,7 @@ else()
 endif()
 
 if(USE_NPU)
-  add_definitions(-DUSE_NPU_TORCH)
+  # add_definitions(-DUSE_NPU_TORCH)
   add_definitions(-DUSE_NPU)
   add_definitions(-DBUILD_LIBTORCH)
   add_definitions(-DTORCH_SETCUSTOMHANDLER=ON)
diff --git a/xllm/models/llm/qwen3.h b/xllm/models/llm/qwen3.h
@@ -45,7 +45,7 @@ class QWen3ModelImpl : public LlmModelImplBase<QWen3DecoderLayer> {
         xllm::layer::RmsNorm(
             model_args.hidden_size(), model_args.rms_norm_eps(), options));
 #else
-    norm_ = register_module("norm", layer::RmsNorm(context));
+    norm_ = register_module("norm", layer::NpuRmsNorm(context));
 #endif
     for (auto i = 0; i < FLAGS_micro_batch_num; i++) {
 #if defined(USE_NPU_TORCH)
diff --git a/xllm/models/llm/qwen3_moe.h b/xllm/models/llm/qwen3_moe.h
@@ -274,10 +274,13 @@ class Qwen3MoeModelImpl : public torch::nn::Module {
   torch::Dtype dtype_;
   layer::WordEmbedding embed_tokens_{nullptr};
   layer::AttentionMask attn_mask_;
-  layer::RmsNorm norm_{nullptr};
+
 #if defined(USE_NPU)
   torch::Tensor cos_sin_;
   layer::PosEmbedding atb_pos_emb_{nullptr};
+  layer::NpuRmsNorm norm_{nullptr};
+#else
+  layer::RmsNorm norm_{nullptr};
 #endif
 };
 TORCH_MODULE(Qwen3MoeModel);