Skip to content

Commit ec25768

Browse files
Lay2000 and aoyuli authored
fix: support use_sync flag in xFuserLongContextAttention (#505)
Co-authored-by: aoyuli <aoyuli@bytedance.com>
1 parent a440a6e commit ec25768

File tree

1 file changed

+2
-0
lines changed

1 file changed

+2
-0
lines changed

xfuser/core/long_ctx_attention/hybrid/attn_layer.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -29,6 +29,7 @@ def __init__(
2929
ring_impl_type: str = "basic",
3030
use_pack_qkv: bool = False,
3131
use_kv_cache: bool = False,
32+
use_sync: bool = False,
3233
attn_type: AttnType = AttnType.FA,
3334
attn_processor: torch.nn.Module = None,
3435
) -> None:
@@ -47,6 +48,7 @@ def __init__(
4748
gather_idx=gather_idx,
4849
ring_impl_type=ring_impl_type,
4950
use_pack_qkv=use_pack_qkv,
51+
use_sync=use_sync,
5052
attn_type = attn_type,
5153
)
5254
self.use_kv_cache = use_kv_cache

0 commit comments

Comments (0)