pytorch
diff --git a/‎.ci/scripts/utils.sh‎
Lines changed: 1 addition & 2 deletions b/‎.ci/scripts/utils.sh‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎backends/vulkan/runtime/graph/ops/glsl/tan.glsl‎
Lines changed: 60 additions & 0 deletions b/‎backends/vulkan/runtime/graph/ops/glsl/tan.glsl‎
Lines changed: 60 additions & 0 deletions
diff --git a/‎backends/vulkan/runtime/graph/ops/glsl/tan.yaml‎
Lines changed: 13 additions & 0 deletions b/‎backends/vulkan/runtime/graph/ops/glsl/tan.yaml‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎backends/vulkan/runtime/graph/ops/impl/Tan.cpp‎
Lines changed: 64 additions & 0 deletions b/‎backends/vulkan/runtime/graph/ops/impl/Tan.cpp‎
Lines changed: 64 additions & 0 deletions
diff --git a/‎backends/vulkan/test/op_tests/cases.py‎
Lines changed: 16 additions & 0 deletions b/‎backends/vulkan/test/op_tests/cases.py‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎devtools/inspector/tests/TARGETS‎
Lines changed: 13 additions & 0 deletions b/‎devtools/inspector/tests/TARGETS‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎devtools/inspector/tests/inspector_test_utils.py‎
Lines changed: 118 additions & 0 deletions b/‎devtools/inspector/tests/inspector_test_utils.py‎
Lines changed: 118 additions & 0 deletions
@@ -158,8 +158,7 @@ build_executorch_runner() {
 cmake_install_executorch_lib() {
   echo "Installing libexecutorch.a and libportable_kernels.a"
   clean_executorch_install_folders
-  retry cmake -DBUCK2="$BUCK" \
-          -DCMAKE_INSTALL_PREFIX=cmake-out \
+  retry cmake -DCMAKE_INSTALL_PREFIX=cmake-out \
           -DCMAKE_BUILD_TYPE=Release \
           -DPYTHON_EXECUTABLE="$PYTHON_EXECUTABLE" \
           -Bcmake-out .
 
@@ -0,0 +1,60 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ * All rights reserved.
+ *
+ * This source code is licensed under the BSD-style license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+
+#version 450 core
+
+#define PRECISION ${PRECISION}
+
+#define VEC4_T ${texel_load_type(DTYPE, STORAGE)}
+#define T ${buffer_scalar_type(DTYPE)}
+
+${define_active_storage_type(STORAGE)}
+
+#include "indexing_utils.h"
+
+${define_required_extensions(DTYPE)}
+
+layout(std430) buffer;
+
+${layout_declare_tensor(0, "w", "t_out", DTYPE, STORAGE)}
+${layout_declare_tensor(1, "r", "t_in", DTYPE, STORAGE)}
+$if STORAGE == "buffer":
+  ${layout_declare_ubo(2, "int", "numel")}
+$else:
+  ${layout_declare_ubo(2, "ivec3", "out_limits")}
+
+layout(local_size_x_id = 0, local_size_y_id = 1, local_size_z_id = 2) in;
+
+#include "activations.h"
+
+#ifdef USING_BUFFER
+
+// Buffer storage variant: the x component of the global invocation ID is
+// used directly as the element index into t_in / t_out.
+void main() {
+  const int idx = int(gl_GlobalInvocationID.x);
+
+  // Invocations at or beyond numel have no element to process.
+  if (idx < numel) {
+    // Evaluate tan() in float, then convert to the buffer scalar type T.
+    t_out[idx] = T(tan(float(t_in[idx])));
+  }
+}
+
+#else
+
+// Texture storage variant: each invocation reads the texel at its global
+// position, applies tan() component-wise and stores the result at the same
+// position in t_out.
+void main() {
+  const ivec3 texel_pos = ivec3(gl_GlobalInvocationID);
+
+  // Only positions strictly below out_limits on every axis are processed.
+  if (all(lessThan(texel_pos, out_limits))) {
+    const VEC4_T in_texel = texelFetch(t_in, texel_pos, 0);
+    imageStore(t_out, texel_pos, VEC4_T(tan(in_texel)));
+  }
+}
+
+#endif
@@ -0,0 +1,13 @@
+# Codegen parameters for the tan shader template. DTYPE and STORAGE are the
+# placeholders referenced by tan.glsl; the lists below enumerate the values
+# each one may take (half/float and texture3d/buffer).
+# NOTE(review): presumably one shader variant is emitted per DTYPE x STORAGE
+# combination - confirm against the shader codegen.
+tan:
+  parameter_names_with_default_values:
+    DTYPE: float
+    STORAGE: texture3d
+  generate_variant_forall:
+    DTYPE:
+      - VALUE: half
+      - VALUE: float
+    STORAGE:
+      - VALUE: texture3d
+      - VALUE: buffer
+  shader_variants:
+    - NAME: tan
@@ -0,0 +1,64 @@
+/*
+ * Copyright (c) Meta Platforms, Inc. and affiliates.
+ * All rights reserved.
+ *
+ * This source code is licensed under the BSD-style license found in the
+ * LICENSE file in the root directory of this source tree.
+ */
+
+#include <executorch/backends/vulkan/runtime/graph/ops/OperatorRegistry.h>
+
+#include <executorch/backends/vulkan/runtime/graph/ops/impl/utils/TensorUtils.h>
+#include <executorch/backends/vulkan/runtime/graph/ops/utils/ShaderNameUtils.h>
+
+namespace vkcompute {
+
+using namespace utils;
+
+/*
+ * Resize callback for the tan dispatch node. Gives the output tensor
+ * (args[0].refs[0]) the same sizes as the input tensor (args[1].refs[0]).
+ * extra_args is not used.
+ */
+void resize_tan_node(
+    ComputeGraph* graph,
+    const std::vector<ArgGroup>& args,
+    const std::vector<ValueRef>& extra_args) {
+  (void)extra_args;
+
+  const ValueRef out_ref = args[0].refs[0];
+  const ValueRef in_ref = args[1].refs[0];
+
+  vTensorPtr out_tensor = graph->get_tensor(out_ref);
+  vTensorPtr in_tensor = graph->get_tensor(in_ref);
+  out_tensor->virtual_resize(in_tensor->sizes());
+}
+
+/*
+ * Appends a DispatchNode to `graph` that computes out = tan(in).
+ *
+ * The shader name is "tan" plus a dtype suffix and a storage-type suffix,
+ * both derived from `out`. `out` is bound for writing and `in` for reading,
+ * and resize_tan_node is installed as the resize callback.
+ */
+void add_tan_node(ComputeGraph& graph, const ValueRef in, const ValueRef out) {
+  std::string kernel_name = "tan";
+  add_dtype_suffix(kernel_name, graph.dtype_of(out));
+  add_storage_type_suffix(kernel_name, graph.storage_type_of(out));
+
+  // The tan shader declares a different UBO at binding 2 depending on the
+  // storage type: `int numel` for buffers and `ivec3 out_limits` for
+  // textures. Bind the one that matches the variant selected above;
+  // otherwise the buffer variant's bounds check reads the wrong data.
+  vkapi::ParamsBindList ubos({});
+  if (graph.storage_type_of(out) == utils::kBuffer) {
+    ubos.append({graph.numel_ubo(out)});
+  } else {
+    ubos.append({graph.logical_limits_ubo(out)});
+  }
+
+  graph.execute_nodes().emplace_back(new DispatchNode(
+      graph,
+      VK_KERNEL_FROM_STR(kernel_name),
+      graph.create_global_wg_size(out),
+      graph.create_local_wg_size(out),
+      // Inputs and Outputs
+      {{out, vkapi::kWrite}, {in, vkapi::kRead}},
+      // Shader params buffers
+      ubos,
+      // Push Constants
+      {},
+      // Specialization Constants
+      {},
+      // Resize Args
+      {},
+      // Resizing Logic
+      resize_tan_node));
+}
+
+/*
+ * Operator entry point for tan. Treats args[0] as the input value and
+ * args[1] as the output value and forwards them to add_tan_node.
+ */
+void tan(ComputeGraph& graph, const std::vector<ValueRef>& args) {
+  const ValueRef in = args[0];
+  const ValueRef out = args[1];
+  add_tan_node(graph, in, out);
+}
+
+// Registers the tan() function above as the handler for aten.tan.default.
+REGISTER_OPERATORS {
+  VK_REGISTER_OP(aten.tan.default, tan);
+}
+
+} // namespace vkcompute
@@ -1171,6 +1171,22 @@ def get_unary_ops_inputs():
     return test_suite
 
 
+# separate test suite from unary_ops for learning purposes
+@register_test_suite("aten.tan.default")
+def get_tan_inputs():
+    test_suite = VkTestSuite(
+        [
+            (M1,),
+            (M1, M2),
+            (S1, M1, M2),
+            (S1, S2, S2, M2),
+        ]
+    )
+    test_suite.storage_types = ["utils::kTexture3D", "utils::kBuffer"]
+    test_suite.dtypes = ["at::kFloat", "at::kHalf"]
+    return test_suite
+
+
 @register_test_suite("aten._native_batch_norm_legit_no_training.default")
 def get_native_batch_norm_inputs():
     Test = namedtuple(
 
@@ -1,4 +1,5 @@
 load("@fbcode_macros//build_defs:python_unittest.bzl", "python_unittest")
+load("@fbcode_macros//build_defs:python_library.bzl", "python_library")
 
 oncall("executorch")
 
@@ -13,6 +14,7 @@ python_unittest(
         "//executorch/devtools/inspector:inspector",
         "//executorch/devtools/inspector:lib",
         "//executorch/exir:lib",
+        "//executorch/devtools/inspector/tests:inspector_test_utils",
     ],
 )
 
@@ -48,5 +50,16 @@ python_unittest(
         "//executorch/devtools/inspector:lib",
         "//executorch/devtools/inspector:intermediate_output_capturer",
         "//executorch/exir:lib",
+        "//executorch/devtools/inspector/tests:inspector_test_utils",
+    ],
+)
+
+# Helper library built from inspector_test_utils.py; it is listed in the deps
+# of python_unittest targets in this file and itself depends on torch.
+python_library(
+    name = "inspector_test_utils",
+    srcs = [
+        "inspector_test_utils.py",
+    ],
+    deps = [
+        "//caffe2:torch",
     ],
 )
@@ -0,0 +1,118 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+
+# pyre-unsafe
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+
+
+class ConvlLinearModel(nn.Module):
+    """
+    A neural network model with a convolutional layer followed by a linear layer.
+
+    All weights and biases are set to fixed constants, and the class also
+    provides a fixed input (get_input) together with a table of expected
+    intermediate values for that input (get_expected_intermediate_outputs).
+
+    NOTE(review): the class name is spelled "ConvlLinearModel", while the
+    module-level registry exposes it under the key "ConvLinearModel".
+    """
+
+    def __init__(self):
+        super(ConvlLinearModel, self).__init__()
+        # 1-in/1-out 3x3 convolution; stride 1 with padding 1 keeps the
+        # spatial size of the input unchanged.
+        self.conv_layer = nn.Conv2d(
+            in_channels=1, out_channels=1, kernel_size=3, stride=1, padding=1
+        )
+        # Replace the default initialisation with constant values.
+        self.conv_layer.weight = nn.Parameter(
+            torch.tensor([[[[0.1, 0.2, 0.3], [0.4, 0.5, 0.6], [0.7, 0.8, 0.9]]]])
+        )
+        self.conv_layer.bias = nn.Parameter(torch.tensor([0.0]))
+
+        # in_features=4 matches the flattened 2x2 conv output produced for the
+        # input returned by get_input().
+        self.linear_layer = nn.Linear(in_features=4, out_features=2)
+        self.linear_layer.weight = nn.Parameter(
+            torch.tensor([[0.1, 0.2, 0.3, 0.4], [0.5, 0.6, 0.7, 0.8]])
+        )
+        self.linear_layer.bias = nn.Parameter(torch.tensor([0.0, 0.0]))
+        # Constant tensors used by the elementwise steps in forward(); they
+        # are created with requires_grad=False.
+        self.additional_bias = nn.Parameter(
+            torch.tensor([0.5, -0.5]), requires_grad=False
+        )
+        self.scale_factor = nn.Parameter(torch.tensor([2.0, 0.5]), requires_grad=False)
+
+    def forward(self, x):
+        """
+        Run conv -> flatten -> linear, then a chain of elementwise ops
+        (add, sub, mul, div, relu, sigmoid), and split the result along dim 1
+        into two outputs.
+
+        The values in get_expected_intermediate_outputs() follow these
+        statements one by one, so changing or reordering a statement here
+        requires updating that table.
+        """
+        x = self.conv_layer(x)
+        # Flatten everything except the batch dimension.
+        x = x.view(x.size(0), -1)
+        x = self.linear_layer(x)
+        x = x + self.additional_bias
+        x = x - 0.1
+        x = x * self.scale_factor
+        x = x / (self.scale_factor + 1.0)
+        x = F.relu(x)
+        x = torch.sigmoid(x)
+        # Chunks of size 1 along dim 1: one tensor per linear output feature.
+        output1, output2 = torch.split(x, 1, dim=1)
+        return output1, output2
+
+    @staticmethod
+    def get_input():
+        """
+        Returns the pre-defined input tensor for this model.
+        """
+        return torch.tensor([[[[1.0, 2.0], [3.0, 4.0]]]], requires_grad=True)
+
+    @staticmethod
+    def get_expected_intermediate_outputs():
+        """
+        Returns the expected outputs of the debug handles and intermediate output mapping for this model for the given input.
+
+        Keys are 1-tuples holding a debug handle; values are a tensor, or a
+        list of tensors for the final split.
+        """
+        return {
+            # Convolution output, then its flattened view.
+            (10,): torch.tensor([[[[7.7000, 6.7000], [4.7000, 3.7000]]]]),
+            (11,): torch.tensor([[7.7000, 6.7000, 4.7000, 3.7000]]),
+            # Equals the linear layer's weight transposed (4x2).
+            (12,): torch.tensor(
+                [
+                    [0.1000, 0.5000],
+                    [0.2000, 0.6000],
+                    [0.3000, 0.7000],
+                    [0.4000, 0.8000],
+                ]
+            ),
+            # Linear output, + additional_bias, - 0.1, * scale_factor.
+            (13,): torch.tensor([[5.0000, 14.1200]]),
+            (14,): torch.tensor([[5.5000, 13.6200]]),
+            (15,): torch.tensor([[5.4000, 13.5200]]),
+            (16,): torch.tensor([[10.8000, 6.7600]]),
+            # scale_factor + 1.0, i.e. the divisor used in the next step.
+            (17,): torch.tensor([3.0000, 1.5000]),
+            # Division result, relu (values already positive), sigmoid.
+            (18,): torch.tensor([[3.6000, 4.5067]]),
+            (19,): torch.tensor([[3.6000, 4.5067]]),
+            (20,): torch.tensor([[0.9734, 0.9891]]),
+            # The two tensors produced by torch.split.
+            (21,): [torch.tensor([[0.9734]]), torch.tensor([[0.9891]])],
+        }
+
+
+# Global model registry
+model_registry = {
+    "ConvLinearModel": ConvlLinearModel,
+    # Add new models here
+}
+
+
+def check_if_final_outputs_match(model_name, actual_outputs_with_handles):
+    """
+    Checks if the actual outputs match the expected outputs for the specified model.
+    Returns True if all outputs match, otherwise returns False.
+    """
+    model_instance = model_registry[model_name]
+    expected_outputs_with_handles = model_instance.get_expected_intermediate_outputs()
+    if len(actual_outputs_with_handles) != len(expected_outputs_with_handles):
+        return False
+    for debug_handle, expected_output in expected_outputs_with_handles.items():
+        actual_output = actual_outputs_with_handles.get(debug_handle)
+        if actual_output is None:
+            return False
+        if isinstance(expected_output, list):
+            if not isinstance(actual_output, list):
+                return False
+            if len(actual_output) != len(expected_output):
+                return False
+            for actual, expected in zip(actual_output, expected_output):
+                if not torch.allclose(actual, expected, rtol=1e-4, atol=1e-5):
+                    return False
+        else:
+            if not torch.allclose(actual_output, expected_output, rtol=1e-4, atol=1e-5):
+                return False
+    return True