
Commit ee07051

Collect a torch::stable wishlist in src/libtorchaudio/stable

1 parent 48081cf commit ee07051

File tree

4 files changed: +608 -0 lines changed

src/libtorchaudio/stable/Device.h

Lines changed: 47 additions & 0 deletions
@@ -0,0 +1,47 @@
#pragma once

/*
  This header file provides the torchaudio::stable::Device struct, a
  torch::stable::Tensor-compatible analog of c10::Device defined in
  c10/core/Device.h.

  TODO: remove this header file when torch::stable provides all
  features implemented here.
*/

#include <torch/csrc/stable/accelerator.h>

namespace torchaudio::stable {

using DeviceType = int32_t;
using torch::stable::accelerator::DeviceIndex;

struct Device {

  Device(DeviceType type, DeviceIndex index = -1)
      : type_(type), index_(index) {
    // TODO: validate();
  }

  /// Returns the type of device this is.
  DeviceType type() const noexcept {
    return type_;
  }

  /// Returns the optional index.
  DeviceIndex index() const noexcept {
    return index_;
  }

 private:
  DeviceType type_;
  DeviceIndex index_ = -1;
};

// A convenience function, not a part of torch::stable
inline Device cpu_device() {
  Device d(aoti_torch_device_type_cpu(), 0);
  return d;
}

} // namespace torchaudio::stable
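
For orientation, a minimal usage sketch (not part of the commit). It assumes aoti_torch_device_type_cuda() is exported by the same AOTI shim that provides aoti_torch_device_type_cpu(); adjust if that symbol differs.

#include <libtorchaudio/stable/Device.h>

// Sketch only: construct devices and compare their types.
inline bool example_runs_on_cpu() {
  torchaudio::stable::Device cpu = torchaudio::stable::cpu_device();
  // Assumed shim call; index 0 selects the first CUDA device.
  torchaudio::stable::Device cuda0(aoti_torch_device_type_cuda(), /*index=*/0);
  return cpu.type() != cuda0.type() &&
         cpu.type() == aoti_torch_device_type_cpu();
}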
Lines changed: 217 additions & 0 deletions
@@ -0,0 +1,217 @@
#pragma once
/*
  This header file provides torchaudio::stable::TensorAccessor
  templates that are torch::stable::Tensor-compatible analogs of
  at::TensorAccessor defined in ATen/core/TensorAccessor.h.

  TODO: remove this header file when torch::stable provides all
  features implemented here.
*/

// #include <libtorchaudio/stable/Device.h>

#include <torch/headeronly/macros/Macros.h>
#include <algorithm> // std::copy
#include <type_traits>

namespace torchaudio::stable {

template <typename T>
struct DefaultPtrTraits {
  typedef T* PtrType;
};

#if defined(__CUDACC__) || defined(__HIPCC__)
template <typename T>
struct RestrictPtrTraits {
  typedef T* __restrict__ PtrType;
};
#endif

template <typename T, size_t N, template <typename U> class PtrTraits = DefaultPtrTraits, typename index_t = int64_t>
class TensorAccessorBase {
 public:
  typedef typename PtrTraits<T>::PtrType PtrType;

  C10_HOST_DEVICE TensorAccessorBase(
      PtrType data_,
      const index_t* sizes_,
      const index_t* strides_)
      : data_(data_) /*, sizes_(sizes_), strides_(strides_)*/ {
    // Originally, TensorAccessor is a view of sizes and strides as
    // these are ArrayRef instances. Until torch::stable supports
    // ArrayRef-like features, we store copies of sizes and strides:
    for (auto i = 0; i < N; ++i) {
      this->sizes_[i] = sizes_[i];
      this->strides_[i] = strides_[i];
    }
  }

  C10_HOST_DEVICE PtrType data() {
    return data_;
  }
  C10_HOST_DEVICE const PtrType data() const {
    return data_;
  }

 protected:
  PtrType data_;
  /*
  const index_t* sizes_;
  const index_t* strides_;
  */
  // NOLINTNEXTLINE(*c-arrays*)
  index_t sizes_[N];
  // NOLINTNEXTLINE(*c-arrays*)
  index_t strides_[N];
};

template <typename T, size_t N, template <typename U> class PtrTraits = DefaultPtrTraits, typename index_t = int64_t>
class TensorAccessor : public TensorAccessorBase<T, N, PtrTraits, index_t> {
 public:
  typedef typename PtrTraits<T>::PtrType PtrType;

  C10_HOST_DEVICE TensorAccessor(
      PtrType data_,
      const index_t* sizes_,
      const index_t* strides_)
      : TensorAccessorBase<T, N, PtrTraits, index_t>(data_, sizes_, strides_) {}

  C10_HOST_DEVICE TensorAccessor<T, N - 1, PtrTraits, index_t> operator[](index_t i) {
    return TensorAccessor<T, N - 1, PtrTraits, index_t>(this->data_ + this->strides_[0] * i, this->sizes_ + 1, this->strides_ + 1);
  }

  C10_HOST_DEVICE const TensorAccessor<T, N - 1, PtrTraits, index_t> operator[](index_t i) const {
    return TensorAccessor<T, N - 1, PtrTraits, index_t>(this->data_ + this->strides_[0] * i, this->sizes_ + 1, this->strides_ + 1);
  }
};

template <typename T, template <typename U> class PtrTraits, typename index_t>
class TensorAccessor<T, 1, PtrTraits, index_t> : public TensorAccessorBase<T, 1, PtrTraits, index_t> {
 public:
  typedef typename PtrTraits<T>::PtrType PtrType;

  C10_HOST_DEVICE TensorAccessor(
      PtrType data_,
      const index_t* sizes_,
      const index_t* strides_)
      : TensorAccessorBase<T, 1, PtrTraits, index_t>(data_, sizes_, strides_) {}
  C10_HOST_DEVICE T& operator[](index_t i) {
    // NOLINTNEXTLINE(clang-analyzer-core.NullDereference)
    return this->data_[this->strides_[0] * i];
  }
  C10_HOST_DEVICE const T& operator[](index_t i) const {
    return this->data_[this->strides_[0] * i];
  }
};

template <typename T, size_t N, template <typename U> class PtrTraits = DefaultPtrTraits, typename index_t = int64_t>
class GenericPackedTensorAccessorBase {
 public:
  typedef typename PtrTraits<T>::PtrType PtrType;
  C10_HOST GenericPackedTensorAccessorBase(
      PtrType data_,
      const index_t* sizes_,
      const index_t* strides_)
      : data_(data_) {
    std::copy(sizes_, sizes_ + N, std::begin(this->sizes_));
    std::copy(strides_, strides_ + N, std::begin(this->strides_));
  }

  template <typename source_index_t, class = std::enable_if_t<std::is_same_v<source_index_t, int64_t>>>
  C10_HOST GenericPackedTensorAccessorBase(
      PtrType data_,
      const source_index_t* sizes_,
      const source_index_t* strides_)
      : data_(data_) {
    for (auto i = 0; i < N; ++i) {
      this->sizes_[i] = sizes_[i];
      this->strides_[i] = strides_[i];
    }
  }

  C10_HOST_DEVICE PtrType data() {
    return data_;
  }
  C10_HOST_DEVICE const PtrType data() const {
    return data_;
  }

 protected:
  PtrType data_;
  // NOLINTNEXTLINE(*c-arrays*)
  index_t sizes_[N];
  // NOLINTNEXTLINE(*c-arrays*)
  index_t strides_[N];
  C10_HOST void bounds_check_(index_t i) const {
    STD_TORCH_CHECK(
        0 <= i && i < index_t{N},
        "Index ",
        i,
        " is not within bounds of a tensor of dimension ",
        N);
  }
};

template <typename T, size_t N, template <typename U> class PtrTraits = DefaultPtrTraits, typename index_t = int64_t>
class GenericPackedTensorAccessor : public GenericPackedTensorAccessorBase<T, N, PtrTraits, index_t> {
 public:
  typedef typename PtrTraits<T>::PtrType PtrType;

  C10_HOST GenericPackedTensorAccessor(
      PtrType data_,
      const index_t* sizes_,
      const index_t* strides_)
      : GenericPackedTensorAccessorBase<T, N, PtrTraits, index_t>(data_, sizes_, strides_) {}

  // if index_t is not int64_t, we want to have an int64_t constructor
  template <typename source_index_t, class = std::enable_if_t<std::is_same_v<source_index_t, int64_t>>>
  C10_HOST GenericPackedTensorAccessor(
      PtrType data_,
      const source_index_t* sizes_,
      const source_index_t* strides_)
      : GenericPackedTensorAccessorBase<T, N, PtrTraits, index_t>(data_, sizes_, strides_) {}

  C10_DEVICE TensorAccessor<T, N - 1, PtrTraits, index_t> operator[](index_t i) {
    index_t* new_sizes = this->sizes_ + 1;
    index_t* new_strides = this->strides_ + 1;
    return TensorAccessor<T, N - 1, PtrTraits, index_t>(this->data_ + this->strides_[0] * i, new_sizes, new_strides);
  }

  C10_DEVICE const TensorAccessor<T, N - 1, PtrTraits, index_t> operator[](index_t i) const {
    const index_t* new_sizes = this->sizes_ + 1;
    const index_t* new_strides = this->strides_ + 1;
    return TensorAccessor<T, N - 1, PtrTraits, index_t>(this->data_ + this->strides_[0] * i, new_sizes, new_strides);
  }
};

template <typename T, template <typename U> class PtrTraits, typename index_t>
class GenericPackedTensorAccessor<T, 1, PtrTraits, index_t> : public GenericPackedTensorAccessorBase<T, 1, PtrTraits, index_t> {
 public:
  typedef typename PtrTraits<T>::PtrType PtrType;
  C10_HOST GenericPackedTensorAccessor(
      PtrType data_,
      const index_t* sizes_,
      const index_t* strides_)
      : GenericPackedTensorAccessorBase<T, 1, PtrTraits, index_t>(data_, sizes_, strides_) {}

  template <typename source_index_t, class = std::enable_if_t<std::is_same_v<source_index_t, int64_t>>>
  C10_HOST GenericPackedTensorAccessor(
      PtrType data_,
      const source_index_t* sizes_,
      const source_index_t* strides_)
      : GenericPackedTensorAccessorBase<T, 1, PtrTraits, index_t>(data_, sizes_, strides_) {}

  C10_DEVICE T& operator[](index_t i) {
    return this->data_[this->strides_[0] * i];
  }
  C10_DEVICE const T& operator[](index_t i) const {
    return this->data_[this->strides_[0] * i];
  }
};

template <typename T, size_t N, template <typename U> class PtrTraits = DefaultPtrTraits>
using PackedTensorAccessor32 = GenericPackedTensorAccessor<T, N, PtrTraits, int32_t>;

template <typename T, size_t N, template <typename U> class PtrTraits = DefaultPtrTraits>
using PackedTensorAccessor64 = GenericPackedTensorAccessor<T, N, PtrTraits, int64_t>;

} // namespace torchaudio::stable
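
A brief host-side usage sketch (not part of the commit). It assumes torch::stable::Tensor exposes data_ptr(), size(i), and stride(i); the packed variants are intended to be passed by value into CUDA/HIP kernels, in the same spirit as at::PackedTensorAccessor32/64.

#include <libtorchaudio/stable/TensorAccessor.h>
#include <torch/csrc/stable/tensor.h>

// Sketch only: sum a (possibly strided) 2-D float tensor on the host.
inline float sum2d(const torch::stable::Tensor& t) {
  const int64_t sizes[2] = {t.size(0), t.size(1)};
  const int64_t strides[2] = {t.stride(0), t.stride(1)};
  torchaudio::stable::TensorAccessor<float, 2> acc(
      static_cast<float*>(t.data_ptr()), sizes, strides);
  float total = 0.0f;
  for (int64_t i = 0; i < sizes[0]; ++i) {
    for (int64_t j = 0; j < sizes[1]; ++j) {
      total += acc[i][j];
    }
  }
  return total;
}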
Lines changed: 77 additions & 0 deletions
@@ -0,0 +1,77 @@
#pragma once
/*
  This header file provides the CPP macro

    STABLE_DISPATCH_FLOATING_TYPES_AND_HALF(TYPE, NAME, ...)

  which is a torch::stable::Tensor-compatible analog of

    AT_DISPATCH_FLOATING_TYPES_AND_HALF(TYPE, NAME, ...)

  TODO: remove this header file when torch::stable provides all
  features implemented here.
*/

#include <torch/headeronly/util/Exception.h>
#include <torch/headeronly/core/ScalarType.h>

namespace torchaudio::stable {

using torch::headeronly::ScalarType;

namespace impl {

template <ScalarType N>
struct ScalarTypeToCPPType;

#define SPECIALIZE_ScalarTypeToCPPType(cpp_type, scalar_type) \
  template <>                                                 \
  struct ScalarTypeToCPPType<ScalarType::scalar_type> {       \
    using type = cpp_type;                                    \
  };

AT_FORALL_SCALAR_TYPES_WITH_COMPLEX_AND_QINTS(SPECIALIZE_ScalarTypeToCPPType)

#undef SPECIALIZE_ScalarTypeToCPPType

template <ScalarType N>
using ScalarTypeToCPPTypeT = typename ScalarTypeToCPPType<N>::type;

} // namespace impl

} // namespace torchaudio::stable

#define STABLE_DISPATCH_CASE(enum_type, ...)                                                      \
  case enum_type: {                                                                               \
    using scalar_t [[maybe_unused]] = torchaudio::stable::impl::ScalarTypeToCPPTypeT<enum_type>;  \
    return __VA_ARGS__();                                                                         \
  }

#define STABLE_DISPATCH_SWITCH(TYPE, NAME, ...)    \
  [&] {                                            \
    const auto& the_type = TYPE;                   \
    constexpr const char* at_dispatch_name = NAME; \
    switch (the_type) {                            \
      __VA_ARGS__                                  \
      default:                                     \
        STD_TORCH_CHECK(                           \
            false,                                 \
            '"',                                   \
            at_dispatch_name,                      \
            "\" not implemented for '",            \
            toString(the_type),                    \
            "'");                                  \
    }                                              \
  }()

#define STABLE_DISPATCH_CASE_FLOATING_TYPES_AND_HALF(...) \
  STABLE_DISPATCH_CASE(ScalarType::Double, __VA_ARGS__)   \
  STABLE_DISPATCH_CASE(ScalarType::Float, __VA_ARGS__)    \
  STABLE_DISPATCH_CASE(ScalarType::Half, __VA_ARGS__)

#define STABLE_DISPATCH_FLOATING_TYPES_AND_HALF(TYPE, NAME, ...) \
  STABLE_DISPATCH_SWITCH(                                        \
      TYPE, NAME, STABLE_DISPATCH_CASE_FLOATING_TYPES_AND_HALF(__VA_ARGS__))
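
A usage sketch (not part of the commit), mirroring how AT_DISPATCH_FLOATING_TYPES_AND_HALF is typically used. It assumes the dispatch header above is included and that the tensor's dtype is available as a torch::headeronly::ScalarType (written as t.scalar_type() here purely for illustration).

#include <torch/csrc/stable/tensor.h>

using torchaudio::stable::ScalarType; // needed at the macro expansion site

// Sketch only: scale every element of a float/double/half tensor in place.
inline void scale_(torch::stable::Tensor& t, double factor) {
  STABLE_DISPATCH_FLOATING_TYPES_AND_HALF(t.scalar_type(), "scale_", [&] {
    auto* data = static_cast<scalar_t*>(t.data_ptr());
    for (int64_t i = 0; i < t.numel(); ++i) {
      data[i] = static_cast<scalar_t>(static_cast<double>(data[i]) * factor);
    }
  });
}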
