pytorch
diff --git a/‎backends/arm/_passes/arm_pass_manager.py‎
Lines changed: 4 additions & 0 deletions b/‎backends/arm/_passes/arm_pass_manager.py‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎backends/arm/_passes/decompose_softmax_pass.py‎
Lines changed: 5 additions & 1 deletion b/‎backends/arm/_passes/decompose_softmax_pass.py‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎backends/arm/operator_support/tosa_supported_operators.py‎
Lines changed: 2 additions & 0 deletions b/‎backends/arm/operator_support/tosa_supported_operators.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎backends/arm/operators/__init__.py‎
Lines changed: 1 addition & 0 deletions b/‎backends/arm/operators/__init__.py‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎backends/arm/operators/op_neg.py‎
Lines changed: 78 additions & 0 deletions b/‎backends/arm/operators/op_neg.py‎
Lines changed: 78 additions & 0 deletions
diff --git a/‎backends/arm/quantizer/quantization_annotator.py‎
Lines changed: 3 additions & 0 deletions b/‎backends/arm/quantizer/quantization_annotator.py‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎backends/arm/test/models/test_conformer.py‎
Lines changed: 13 additions & 7 deletions b/‎backends/arm/test/models/test_conformer.py‎
Lines changed: 13 additions & 7 deletions
diff --git a/‎backends/arm/test/ops/test_neg.py‎
Lines changed: 66 additions & 0 deletions b/‎backends/arm/test/ops/test_neg.py‎
Lines changed: 66 additions & 0 deletions
diff --git a/‎backends/arm/test/ops/test_sdpa.py‎
Lines changed: 45 additions & 0 deletions b/‎backends/arm/test/ops/test_sdpa.py‎
Lines changed: 45 additions & 0 deletions
diff --git a/‎backends/cadence/aot/TARGETS‎
Lines changed: 1 addition & 0 deletions b/‎backends/cadence/aot/TARGETS‎
Lines changed: 1 addition & 0 deletions
@@ -59,6 +59,9 @@
 )
 
 from executorch.backends.arm.tosa_specification import Tosa_0_80, TosaSpecification
+from executorch.backends.transforms.decompose_sdpa import (
+    DecomposeScaledDotProductAttention,
+)
 from executorch.backends.transforms.fuse_view_copy import FuseViewCopyTransform
 from executorch.backends.xnnpack._passes.remove_getitem_op import RemoveGetItemPass
 from executorch.exir import ExportedProgram
@@ -194,6 +197,7 @@ def transform_to_backend_pipeline(self, exported_program: ExportedProgram):
             )
 
     def transform_for_annotation_pipeline(self, graph_module: GraphModule):
+        self.add_pass(DecomposeScaledDotProductAttention())
         self.add_pass(ReplaceScalarWithTensorArgPassTOSABI())
         self.add_pass(ScalarsToAttributePass())
         self.add_pass(DecomposeLayerNormPass())
 
@@ -8,7 +8,11 @@
 from executorch.exir.pass_base import ExportPass
 
 # For BI case
-torch_softmax = (torch.ops.aten.softmax.int, torch.ops.aten.log_softmax.int)
+torch_softmax = (
+    torch.ops.aten.softmax.int,
+    torch.ops.aten._safe_softmax.default,
+    torch.ops.aten.log_softmax.int,
+)
 # For MI case
 edge_softmax = (
     exir_ops.edge.aten._softmax.default,
 
@@ -194,6 +194,7 @@ def is_node_supported(
             exir_ops.edge.aten.mul.Tensor,
             exir_ops.edge.aten.ne.Tensor,
             exir_ops.edge.aten.ne.Scalar,
+            exir_ops.edge.aten.neg.default,
             exir_ops.edge.aten.add.Scalar,
             exir_ops.edge.aten.sub.Scalar,
             exir_ops.edge.aten.mul.Scalar,
@@ -311,6 +312,7 @@ class CheckProperQuantization(OperatorSupportBase):
         exir_ops.edge.aten.max_pool2d_with_indices.default,
         exir_ops.edge.aten.mm.default,
         exir_ops.edge.aten.mul.Tensor,
+        exir_ops.edge.aten.neg.default,
         exir_ops.edge.aten.relu.default,
         exir_ops.edge.aten.sub.Tensor,
         exir_ops.edge.aten.upsample_bilinear2d.vec,
 
@@ -31,6 +31,7 @@
     op_maximum,
     op_minimum,
     op_mul,
+    op_neg,
     op_permute,
     op_pow,
     op_reciprocal,
 
@@ -0,0 +1,78 @@
+# Copyright 2025 Arm Limited and/or its affiliates.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+# pyre-unsafe
+from typing import List
+
+import torch.fx
+
+import tosa_tools.v0_80.serializer.tosa_serializer as ts  # type: ignore
+from executorch.backends.arm._passes.fold_qdq_with_annotated_qparams_pass import (
+    get_input_qparams,
+    get_output_qparams,
+)
+from executorch.backends.arm.operators.node_visitor import (
+    NodeVisitor,
+    register_node_visitor,
+)
+
+from executorch.backends.arm.tosa_mapping import TosaArg
+
+
+def get_negate_zero_points(node: torch.fx.Node, dtype: ts.DType) -> tuple[int, int]:
+    """
+    Look up the zero points handed to TOSA NEGATE as (input1_zp, output_zp).
+
+    For INT8 they are read from entry 0 of the node's input and output
+    qparams; every other dtype yields (0, 0).
+    """
+    if dtype != ts.DType.INT8:
+        return (0, 0)
+
+    input_zp = get_input_qparams(node)[0].zp
+    output_zp = get_output_qparams(node)[0].zp
+    return (input_zp, output_zp)
+
+
+@register_node_visitor
+class NegVisitor(NodeVisitor):
+    """Node visitor that serializes `aten.neg.default` as one TOSA NEGATE operator."""
+
+    target = "aten.neg.default"
+
+    # Dtypes accepted by define_node; any other input dtype raises ValueError.
+    supported_dtypes = {
+        ts.DType.INT8,
+        ts.DType.INT16,
+        ts.DType.INT32,
+        ts.DType.FP16,
+        ts.DType.BF16,
+        ts.DType.FP32,
+    }
+
+    def __init__(self, *args):
+        super().__init__(*args)
+
+    def define_node(
+        self,
+        node: torch.fx.Node,
+        tosa_graph: ts.TosaSerializer,
+        inputs: List[TosaArg],
+        output: TosaArg,
+    ) -> None:
+        """
+        Add a NEGATE operator for `node` to `tosa_graph`.
+
+        Args:
+            node: FX node being lowered; used to look up the zero points.
+            tosa_graph: serializer that receives the operator.
+            inputs: operands of the node; only inputs[0] is read.
+            output: tensor that receives the negated result.
+
+        Raises:
+            ValueError: if the input dtype is not in `supported_dtypes`, or
+                if the input and output dtypes differ.
+        """
+        if inputs[0].dtype not in self.supported_dtypes:
+            raise ValueError(f"Unsupported dtype for NEGATE: {inputs[0].dtype}")
+
+        if inputs[0].dtype != output.dtype:
+            # The trailing space keeps the two adjacent literals from running
+            # together as "dtype.Got".
+            raise ValueError(
+                "All inputs and output need same dtype. "
+                f"Got {inputs[0].dtype=}, {output.dtype=}"
+            )
+        input_zp, output_zp = get_negate_zero_points(node, inputs[0].dtype)
+
+        attr = ts.TosaSerializerAttribute()
+        attr.NegateAttribute(input1_zp=input_zp, output_zp=output_zp)
+        tosa_graph.addOperator(
+            ts.TosaOp.Op().NEGATE,
+            [inputs[0].name],
+            [output.name],
+            attributes=attr,
+        )
@@ -375,6 +375,9 @@ def any_or_hardtanh_min_zero(n: Node):
             )
         ]
         quant_properties.quant_output = _QuantProperty(0, shared_qspec)  # type: ignore[arg-type]
+    elif node.target in (torch.ops.aten.neg.default,):
+        quant_properties.quant_inputs = [_QuantProperty(0, input_act_qspec)]
+        quant_properties.quant_output = _QuantProperty(0, input_act_qspec)
     elif node.target in _one_to_one:
         quant_properties.quant_inputs = [_QuantProperty(0, input_act_qspec)]
         quant_properties.quant_output = _QuantProperty(0, output_act_qspec)
 
@@ -83,7 +83,6 @@ def test_conformer_tosa_BI(self):
             )
         )
 
-    @unittest.expectedFailure  # TODO(MLETORCH-635)
     def test_conformer_u55_BI(self):
         tester = (
             ArmTester(
@@ -97,13 +96,20 @@ def test_conformer_u55_BI(self):
             .to_executorch()
             .serialize()
         )
+
         if conftest.is_option_enabled("corstone_fvp"):
-            tester.run_method_and_compare_outputs(
-                qtol=1.0,
-                rtol=1.0,
-                atol=5.0,
-                inputs=get_test_inputs(self.dim, self.lengths, self.num_examples),
-            )
+            # TODO(MLETORCH-635): the FVP comparison is still expected to fail.
+            # A try/except Exception around self.fail() would swallow its own
+            # AssertionError; assertRaises reports an unexpected pass instead.
+            with self.assertRaises(
+                Exception,
+                msg="TODO(MLETORCH-635): Expected failure under FVP option, but test passed.",
+            ):
+                tester.run_method_and_compare_outputs(
+                    qtol=1.0,
+                    rtol=1.0,
+                    atol=5.0,
+                    inputs=get_test_inputs(self.dim, self.lengths, self.num_examples),
+                )
 
     @unittest.expectedFailure  # TODO(MLETORCH-635)
     def test_conformer_u85_BI(self):
 
@@ -0,0 +1,66 @@
+# Copyright 2025 Arm Limited and/or its affiliates.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+
+from typing import Dict, Tuple
+
+import torch
+from executorch.backends.arm.test import common
+from executorch.backends.arm.test.tester.test_pipeline import (
+    EthosU55PipelineBI,
+    EthosU85PipelineBI,
+    TosaPipelineBI,
+    TosaPipelineMI,
+)
+
+input_t1 = Tuple[torch.Tensor]
+
+
+class Neg(torch.nn.Module):
+    """Test module whose forward returns torch.neg of its input."""
+
+    # Op identifiers handed to the test pipelines together with the module.
+    aten_op = "torch.ops.aten.neg.default"
+    exir_op = "executorch_exir_dialects_edge__ops_aten_neg_default"
+
+    # Named test inputs; each value is a one-element tuple holding the tensor.
+    test_data: Dict[str, input_t1] = {
+        "rank_1_ramp": (torch.arange(-16, 16, 0.2),),
+        "rank_2_rand_uniform": (torch.rand(10, 10) - 0.5,),
+        "rank_3_all_ones": (torch.ones(10, 10, 10),),
+        "rank_4_all_zeros": (torch.zeros(1, 10, 10, 10),),
+        "rank_4_randn_pos": (torch.randn(1, 4, 4, 4) + 10,),
+        "rank_4_randn_neg": (torch.randn(1, 4, 4, 4) - 10,),
+    }
+
+    def forward(self, x: torch.Tensor):
+        # Element-wise negation of x.
+        return torch.neg(x)
+
+
+@common.parametrize("test_data", Neg.test_data)
+def test_neg_tosa_MI(test_data: input_t1):
+    """Build a TosaPipelineMI for Neg with one parametrized input and run it."""
+    TosaPipelineMI[input_t1](
+        Neg(),
+        test_data,
+        Neg.aten_op,
+        Neg.exir_op,
+    ).run()
+
+
+@common.parametrize("test_data", Neg.test_data)
+def test_neg_tosa_BI(test_data: input_t1):
+    """Build a TosaPipelineBI for Neg with one parametrized input and run it."""
+    TosaPipelineBI[input_t1](
+        Neg(),
+        test_data,
+        Neg.aten_op,
+        Neg.exir_op,
+    ).run()
+
+
+@common.parametrize("test_data", Neg.test_data)
+@common.XfailIfNoCorstone300
+def test_neg_u55_BI(test_data: input_t1):
+    """Build an EthosU55PipelineBI for Neg with run_on_fvp=True and run it."""
+    module = Neg()
+    u55_pipeline = EthosU55PipelineBI[input_t1](
+        module, test_data, Neg.aten_op, Neg.exir_op, run_on_fvp=True
+    )
+    u55_pipeline.run()
+
+
+@common.parametrize("test_data", Neg.test_data)
+@common.XfailIfNoCorstone320
+def test_neg_u85_BI(test_data: input_t1):
+    """Build an EthosU85PipelineBI for Neg with run_on_fvp=True and run it."""
+    module = Neg()
+    u85_pipeline = EthosU85PipelineBI[input_t1](
+        module, test_data, Neg.aten_op, Neg.exir_op, run_on_fvp=True
+    )
+    u85_pipeline.run()
@@ -0,0 +1,45 @@
+# Copyright 2025 Arm Limited and/or its affiliates.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+
+from typing import Tuple
+
+import torch
+
+from executorch.backends.arm.test.tester.test_pipeline import (
+    TosaPipelineBI,
+    TosaPipelineMI,
+)
+
+
+class SDPA(torch.nn.Module):
+    """Module whose forward calls scaled_dot_product_attention with no mask,
+    zero dropout and is_causal=False."""
+
+    def forward(self, query, key, value):
+        attention = torch.nn.functional.scaled_dot_product_attention(
+            query,
+            key,
+            value,
+            attn_mask=None,
+            dropout_p=0.0,
+            is_causal=False,
+        )
+        return attention
+
+
+input_t = Tuple[torch.Tensor, torch.Tensor, torch.Tensor]
+
+
+def test_sdpa_MI():
+    """Run SDPA through TosaPipelineMI after removing the "check_count.exir" stage."""
+    qkv = tuple(torch.randn(1, 3, 197, 64) for _ in range(3))
+    mi_pipeline = TosaPipelineMI[input_t](SDPA(), qkv, [], [])
+    mi_pipeline.pop_stage("check_count.exir")
+    mi_pipeline.run()
+
+
+def test_sdpa_BI():
+    """Run SDPA through TosaPipelineBI after removing three pipeline stages."""
+    qkv = tuple(torch.randn(1, 3, 197, 64) for _ in range(3))
+    bi_pipeline = TosaPipelineBI[input_t](SDPA(), qkv, [], [])
+    skipped_stages = (
+        "check.quant_nodes",
+        "check_count.exir",
+        "run_method_and_compare_outputs",  # TODO: reference is not quantized
+    )
+    for stage_name in skipped_stages:
+        bi_pipeline.pop_stage(stage_name)
+    bi_pipeline.run()
@@ -347,6 +347,7 @@ python_unittest(
         ":compiler",
         "//caffe2:torch",
         "//executorch/backends/cadence/aot:compiler",
+        "//executorch/backends/cadence/aot:graph_builder",
         "//executorch/backends/cadence/aot:ops_registrations",
         "//executorch/backends/cadence/aot:pass_utils",
         "//executorch/backends/cadence/aot:remove_ops",
Original file line number	Diff line number	Diff line change
`@@ -375,6 +375,9 @@ def any_or_hardtanh_min_zero(n: Node):`
`375`	`375`	`)`
`376`	`376`	`]`
`377`	`377`	`quant_properties.quant_output = _QuantProperty(0, shared_qspec) # type: ignore[arg-type]`
	`378`	`+ elif node.target in (torch.ops.aten.neg.default,):`
	`379`	`+ quant_properties.quant_inputs = [_QuantProperty(0, input_act_qspec)]`
	`380`	`+ quant_properties.quant_output = _QuantProperty(0, input_act_qspec)`
`378`	`381`	`elif node.target in _one_to_one:`
`379`	`382`	`quant_properties.quant_inputs = [_QuantProperty(0, input_act_qspec)]`
`380`	`383`	`quant_properties.quant_output = _QuantProperty(0, output_act_qspec)`