feat: qwen3 export to HF (#873)

ashors1 · abdalgader-a · web-flow · commit d73c942cdb57 · 2025-08-08T16:27:15.000Z
Signed-off-by: Abdalgader Abubaker <136640907+abdalgader-a@users.noreply.github.com>
Signed-off-by: Anna Shors <ashors@nvidia.com>
Co-authored-by: Abdalgader Abubaker <136640907+abdalgader-a@users.noreply.github.com>
diff --git a/.gitmodules b/.gitmodules
@@ -1,7 +1,7 @@
 [submodule "3rdparty/NeMo"]
 	path = 3rdparty/NeMo-workspace/NeMo
 	url = https://github.com/NVIDIA/NeMo.git
-	branch = zhiyul/yukih/prepare-refit-info
+	branch = ashors/rl-qwen3-export
 	shallow = true
 [submodule "3rdparty/Megatron-LM"]
 	path = 3rdparty/Megatron-LM-workspace/Megatron-LM
diff --git a/3rdparty/NeMo-workspace/NeMo b/3rdparty/NeMo-workspace/NeMo
@@ -1 +1 @@
-Subproject commit 8ddf4387344c6423763ec9ee0c9a755cbb5d8d35
+Subproject commit aaefedd1d13f4ccd5cd06a19e06f1df33589a235
diff --git a/nemo_rl/models/megatron/community_import.py b/nemo_rl/models/megatron/community_import.py
@@ -85,9 +85,14 @@ def export_model_from_megatron(
         from nemo.tron.converter.qwen import HFQwen2Exporter
 
         exporter_cls = HFQwen2Exporter
+
+    elif hf_config.model_type in ("qwen3", "qwen3_moe"):
+        from nemo.tron.converter.qwen import HFQwen3Exporter
+
+        exporter_cls = HFQwen3Exporter
     else:
         raise ValueError(
-            f"Unknown model: {hf_model_name}. Currently, only Qwen2 and Llama are supported. "
+            f"Unknown model: {hf_model_name}. Currently, only Qwen2, Qwen3 and Llama are supported. "
             "If you'd like to run with a different model, please raise an issue or consider adding your own converter."
         )
     print(f"Exporting model {hf_model_name} to {output_path}...")