|
5 | 5 | #include <executorch/backends/cadence/reference/kernels/kernels.h> |
6 | 6 | #include <executorch/backends/cadence/reference/operators/operators.h> |
7 | 7 |
|
// Expand into a templated kernel applying an elementwise arithmetic operator
// to two quantized tensors: dequantize both operands to float, combine with
// OP, and requantize into `out`. Supported layouts are (a) both inputs with
// identical element counts and (b) a single-element (scalar) second input;
// anything else trips the debug check below.
#define DECLARE_POINTWISE_TENSOR_QUANTIZED_BINARY_OP(BINARY_FUNC_NAME, OP)     \
  template <typename T>                                                        \
  void BINARY_FUNC_NAME(                                                       \
      const ::executorch::aten::Tensor& X,                                     \
      float X_scale,                                                           \
      int32_t X_zero_point,                                                    \
      const ::executorch::aten::Tensor& Y,                                     \
      float Y_scale,                                                           \
      int32_t Y_zero_point,                                                    \
      float out_scale,                                                         \
      int32_t out_zero_point,                                                  \
      ::executorch::aten::Tensor& out) {                                       \
    const size_t x_n = X.numel();                                              \
    const size_t y_n = Y.numel();                                              \
    /* quantize() takes the reciprocal scale, so invert once up front. */      \
    const float recip_out_scale = 1.0f / out_scale;                            \
    const T* __restrict__ x_ptr = X.const_data_ptr<T>();                       \
    const T* __restrict__ y_ptr = Y.const_data_ptr<T>();                       \
    T* __restrict__ out_ptr = out.mutable_data_ptr<T>();                       \
    if (y_n == x_n) {                                                          \
      /* Case 1: operands have the same number of elements. */                 \
      for (size_t idx = 0; idx < x_n; ++idx) {                                 \
        const float lhs =                                                      \
            kernels::dequantize<T>(x_ptr[idx], X_scale, X_zero_point);         \
        const float rhs =                                                      \
            kernels::dequantize<T>(y_ptr[idx], Y_scale, Y_zero_point);         \
        out_ptr[idx] = kernels::quantize<T>(                                   \
            lhs OP rhs, recip_out_scale, out_zero_point);                      \
      }                                                                        \
    } else if (y_n == 1) {                                                     \
      /* Case 2: Y is a scalar tensor; dequantize it once, reuse per lane. */  \
      const float rhs =                                                        \
          kernels::dequantize<T>(y_ptr[0], Y_scale, Y_zero_point);             \
      for (size_t idx = 0; idx < x_n; ++idx) {                                 \
        const float lhs =                                                      \
            kernels::dequantize<T>(x_ptr[idx], X_scale, X_zero_point);         \
        out_ptr[idx] = kernels::quantize<T>(                                   \
            lhs OP rhs, recip_out_scale, out_zero_point);                      \
      }                                                                        \
    } else {                                                                   \
      /* Any other shape pairing is unsupported broadcasting. */               \
      ET_DCHECK_MSG(false, "Unsupported broadcasting");                        \
    }                                                                          \
  }
50 | | - |
51 | 8 | template <typename T> |
52 | 9 | inline __attribute__((always_inline)) void quantized_linear_per_tensor_( |
53 | 10 | const ::executorch::aten::Tensor& src, |
|
0 commit comments