We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 0d131f8, commit 498ae4c (Copy full SHA for 498ae4c)
nemo_automodel/_transformers/auto_model.py
@@ -434,7 +434,7 @@ def from_pretrained(
434
use_sdpa_patching: bool = True,
435
sdpa_method: Optional[List[SDPBackend]] = None,
436
torch_dtype="auto",
437
- attn_implementation: str = "sdpa", #flash_attention_2",
+ attn_implementation: str = "flash_attention_2",
438
quantization_config=None,
439
force_hf: bool = False,
440
**kwargs,
0 commit comments