Remove gpt-oss hybrid swa gate for trtllm_mha (#19079)

mmangkad · web-flow · commit 35ef38c61b2d · 2026-02-27T10:30:00.000-08:00
diff --git a/python/sglang/srt/server_args.py b/python/sglang/srt/server_args.py
@@ -1356,16 +1356,6 @@ def _handle_model_specific_adjustments(self):
                 f"- Decode: {decode_attn_backend}\n"
             )
 
-            if (
-                prefill_attn_backend == "trtllm_mha"
-                or decode_attn_backend == "trtllm_mha"
-            ):
-                # TODO: support swa kv indices translation for trtllm_mha attention backend
-                self.disable_hybrid_swa_memory = True
-                logger.warning(
-                    "Disable hybrid SWA memory for GPT-OSS model with trtllm_mha attention backend."
-                )
-
             quant_method = get_quantization_config(hf_config)
             is_mxfp4_quant_format = quant_method == "mxfp4"
             if is_blackwell_supported():