nikic
diff --git a/‎mlir/include/mlir/Dialect/Tensor/IR/CMakeLists.txt
Lines changed: 5 additions & 0 deletions b/‎mlir/include/mlir/Dialect/Tensor/IR/CMakeLists.txt
Lines changed: 5 additions & 0 deletions
diff --git a/‎mlir/include/mlir/Dialect/Tensor/IR/Tensor.h
Lines changed: 8 additions & 0 deletions b/‎mlir/include/mlir/Dialect/Tensor/IR/Tensor.h
Lines changed: 8 additions & 0 deletions
diff --git a/‎mlir/include/mlir/Dialect/Tensor/IR/TensorAttrDefs.td
Lines changed: 82 additions & 0 deletions b/‎mlir/include/mlir/Dialect/Tensor/IR/TensorAttrDefs.td
Lines changed: 82 additions & 0 deletions
diff --git a/‎mlir/include/mlir/Dialect/Tensor/IR/TensorOps.td
Lines changed: 1 addition & 0 deletions b/‎mlir/include/mlir/Dialect/Tensor/IR/TensorOps.td
Lines changed: 1 addition & 0 deletions
diff --git a/‎mlir/include/mlir/IR/CMakeLists.txt
Lines changed: 5 additions & 0 deletions b/‎mlir/include/mlir/IR/CMakeLists.txt
Lines changed: 5 additions & 0 deletions
diff --git a/‎mlir/include/mlir/IR/TensorEncoding.h
Lines changed: 21 additions & 0 deletions b/‎mlir/include/mlir/IR/TensorEncoding.h
Lines changed: 21 additions & 0 deletions
diff --git a/‎mlir/include/mlir/IR/TensorEncoding.td
Lines changed: 44 additions & 0 deletions b/‎mlir/include/mlir/IR/TensorEncoding.td
Lines changed: 44 additions & 0 deletions
diff --git a/‎mlir/lib/Dialect/Tensor/IR/CMakeLists.txt
Lines changed: 1 addition & 0 deletions b/‎mlir/lib/Dialect/Tensor/IR/CMakeLists.txt
Lines changed: 1 addition & 0 deletions
diff --git a/‎mlir/lib/Dialect/Tensor/IR/TensorDialect.cpp
Lines changed: 159 additions & 0 deletions b/‎mlir/lib/Dialect/Tensor/IR/TensorDialect.cpp
Lines changed: 159 additions & 0 deletions
@@ -1,2 +1,7 @@
 add_mlir_dialect(TensorOps tensor)
 add_mlir_doc(TensorOps TensorOps Dialects/ -gen-dialect-doc)
+
+set(LLVM_TARGET_DEFINITIONS TensorAttrDefs.td)
+mlir_tablegen(TensorAttrDefs.h.inc -gen-attrdef-decls)
+mlir_tablegen(TensorAttrDefs.cpp.inc -gen-attrdef-defs)
+add_public_tablegen_target(MLIRTensorAttrDefsIncGen)
@@ -13,6 +13,7 @@
 #include "mlir/IR/Dialect.h"
 #include "mlir/IR/OpDefinition.h"
 #include "mlir/IR/OpImplementation.h"
+#include "mlir/IR/TensorEncoding.h"
 #include "mlir/Interfaces/CastInterfaces.h"
 #include "mlir/Interfaces/ControlFlowInterfaces.h"
 #include "mlir/Interfaces/SideEffectInterfaces.h"
@@ -23,6 +24,13 @@
 
 #include "mlir/Dialect/Tensor/IR/TensorOpsDialect.h.inc"
 
+//===----------------------------------------------------------------------===//
+// Tensor Dialect Attributes
+//===----------------------------------------------------------------------===//
+
+#define GET_ATTRDEF_CLASSES
+#include "mlir/Dialect/Tensor/IR/TensorAttrDefs.h.inc"
+
 //===----------------------------------------------------------------------===//
 // Tensor Dialect Operations
 //===----------------------------------------------------------------------===//
 
@@ -0,0 +1,82 @@
+//===-- TensorAttrDefs.td - Tensor Attributes Definitions --*- tablegen -*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+#ifndef TENSOR_ATTRDEFS
+#define TENSOR_ATTRDEFS
+
+include "mlir/Dialect/Tensor/IR/TensorBase.td"
+include "mlir/IR/TensorEncoding.td"
+
+// All of the Tensor attributes will extend this class.
+class Tensor_Attr<string name,
+                  list<Trait> traits = []> : AttrDef<Tensor_Dialect, name, traits>;
+
+// Sparse tensor encoding attribute.
+def SparseTensorEncodingAttr : Tensor_Attr<"SparseTensorEncoding",
+         [ DeclareAttrInterfaceMethods<VerifiableTensorEncoding> ] > {
+  let mnemonic = "sparse";
+
+  let description = [{
+    An attribute to encode "TACO"-style information (see tensor-compiler.org)
+    on the sparsity of tensors. The semantics are defined by means of the
+    methods getDimLevelType(), getDimOrdering(), getPointerType(), and
+    getIndexType(), documented below. The encoding is eventually used by
+    a `sparse compiler` pass to generate sparse code fully automatically
+    for all tensor expressions that involve tensors with a sparse encoding.
+    Compiler passes that run before this sparse compiler pass need to be
+    aware of the semantics of tensor types with such an encoding.
+  }];
+
+  // All data is stored in a dictionary, interpreted by the methods below.
+  let parameters = (
+    ins
+    "DictionaryAttr":$dict
+  );
+
+  let extraClassDeclaration = [{
+    // Dimension level types that define sparse tensors:
+    //   Dense      - dimension is dense, every entry is stored
+    //   Compressed - dimension is sparse, only nonzeros are stored
+    //   Singleton  - dimension contains single coordinate, no siblings
+    enum class DimLevelType {
+      Dense, Compressed, Singleton
+    };
+
+    // Returns the dimension level type in the given dimension `dim`
+    // of this tensor type. The choices, defined by the `DimLevelType`
+    // enum, are `dense` (the dimension should be stored in its entirety),
+    // `compressed` (only non-zero regions or elements should be stored),
+    // or `singleton` (no sibling elements for parent).
+    DimLevelType getDimLevelType(unsigned dim) const;
+
+    // Returns the dimension order of this tensor type as an AffineMap.
+    // Unlike dense storage, most sparse storage schemes do not provide
+    // fast random access. This affine map specifies the order of
+    // dimensions that should be support by the sparse storage scheme
+    // (e.g. (i,j) -> (i,j) requests 2-d row-wise and (i,j) -> (j,i)
+    // requests 2-d column-wise storage).
+    // TODO: block structure with higher-dim inputs
+    AffineMap getDimOrdering() const;
+
+    // Returns the required bit width for pointer storage. A narrow width
+    // reduces the memory footprint of overhead storage, as long as the
+    // width suffices to define the total required range (viz. the maximum
+    // number of stored entries over all indirection dimensions). The choices
+    // are `8`, `16`, `32`, `64`, or `0` for a native width.
+    unsigned getPointerBitWidth() const;
+
+    // Returns the required bit width for index storage. A narrow width
+    // reduces the memory footprint of overhead storage, as long as the
+    // width suffices to define the total required range (viz. the maximum
+    // value of each tensor index over all dimensions). The choices are `8`,
+    // `16`, `32`, `64`, or `0` for a native width.
+    unsigned getIndexBitWidth() const;
+  }];
+}
+
+#endif // LLVMIR_ATTRDEFS
@@ -10,6 +10,7 @@
 #define TENSOR_OPS
 
 include "mlir/Dialect/Tensor/IR/TensorBase.td"
+include "mlir/Dialect/Tensor/IR/TensorAttrDefs.td"
 include "mlir/Interfaces/CastInterfaces.td"
 include "mlir/Interfaces/ControlFlowInterfaces.td"
 include "mlir/Interfaces/SideEffectInterfaces.td"
 
@@ -26,6 +26,11 @@ mlir_tablegen(BuiltinTypes.h.inc -gen-typedef-decls)
 mlir_tablegen(BuiltinTypes.cpp.inc -gen-typedef-defs)
 add_public_tablegen_target(MLIRBuiltinTypesIncGen)
 
+set(LLVM_TARGET_DEFINITIONS TensorEncoding.td)
+mlir_tablegen(TensorEncInterfaces.h.inc -gen-attr-interface-decls)
+mlir_tablegen(TensorEncInterfaces.cpp.inc -gen-attr-interface-defs)
+add_public_tablegen_target(MLIRTensorEncodingIncGen)
+
 add_mlir_doc(BuiltinAttributes BuiltinAttributes Dialects/ -gen-attrdef-doc)
 add_mlir_doc(BuiltinLocationAttributes BuiltinLocationAttributes Dialects/ -gen-attrdef-doc)
 add_mlir_doc(BuiltinOps BuiltinOps Dialects/ -gen-op-doc)
 
@@ -0,0 +1,21 @@
+//===- TensorEncoding.h - MLIR Tensor Encoding Declarations------*- C++ -*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+#ifndef MLIR_IR_TENSORENCODING_H
+#define MLIR_IR_TENSORENCODING_H
+
+#include "mlir/IR/AffineMap.h"
+#include "mlir/IR/OpDefinition.h"
+
+//===----------------------------------------------------------------------===//
+// Tablegen Type Declarations
+//===----------------------------------------------------------------------===//
+
+#include "mlir/IR/TensorEncInterfaces.h.inc"
+
+#endif // MLIR_IR_TENSORENCODING_H
@@ -0,0 +1,44 @@
+//===- TensorEncoding.td - Tensor encoding interfaces ------*- tablegen -*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+//
+// Defines the interfaces associated with tensor encoding attributes.
+//
+//===----------------------------------------------------------------------===//
+
+#ifndef MLIR_IR_TENSORINTERFACES
+#define MLIR_IR_TENSORINTERFACES
+
+include "mlir/IR/OpBase.td"
+
+//===----------------------------------------------------------------------===//
+// Attribute interface to verify a tensor encoding.
+//===----------------------------------------------------------------------===//
+
+def VerifiableTensorEncoding : AttrInterface<"VerifiableTensorEncoding"> {
+  let cppNamespace = "::mlir";
+  let description = [{
+    Verifies an encoding attribute for a tensor.
+  }];
+  let methods = [
+    InterfaceMethod<
+      /*desc=*/[{
+        Verifies the encoding is valid for a tensor type with the
+        given shape and element type. Generates a diagnostic using
+        the supplied callback on failure.
+      }],
+      /*retTy=*/"::mlir::LogicalResult",
+      /*methodName=*/"verifyEncoding",
+      /*args=*/(ins
+        "ArrayRef<int64_t>":$shape,
+        "Type":$elementType,
+        "::llvm::function_ref<::mlir::InFlightDiagnostic()>":$emitError)
+    >,
+  ];
+}
+
+#endif // MLIR_IR_TENSORINTERFACES
@@ -7,6 +7,7 @@ add_mlir_dialect_library(MLIRTensor
 
   DEPENDS
   MLIRTensorOpsIncGen
+  MLIRTensorAttrDefsIncGen
 
   LINK_COMPONENTS
   Core
 
@@ -7,11 +7,142 @@
 //===----------------------------------------------------------------------===//
 
 #include "mlir/Dialect/Tensor/IR/Tensor.h"
+#include "mlir/IR/DialectImplementation.h"
 #include "mlir/Transforms/InliningUtils.h"
+#include "llvm/ADT/TypeSwitch.h"
 
 using namespace mlir;
 using namespace mlir::tensor;
 
+//===----------------------------------------------------------------------===//
+// TableGen'd Attributes Methods
+//===----------------------------------------------------------------------===//
+
+#define GET_ATTRDEF_CLASSES
+#include "mlir/Dialect/Tensor/IR/TensorAttrDefs.cpp.inc"
+
+// Dictionary keys.
+static constexpr StringRef getSparseDimLevelTypeAttrName() {
+  return "sparseDimLevelType";
+}
+static constexpr StringRef getSparseDimOrderingAttrName() {
+  return "sparseDimOrdering";
+}
+static constexpr StringRef getSparsePointerBitWidthAttrName() {
+  return "sparsePointerBitWidth";
+}
+static constexpr StringRef getSparseIndexBitWidthAttrName() {
+  return "sparseIndexBitWidth";
+}
+
+// Dictionary values.
+static constexpr StringRef getDenseDimLevelTypeVal() { return "dense"; }
+static constexpr StringRef getCompressedDimLevelTypeVal() {
+  return "compressed";
+}
+static constexpr StringRef getSingletonDimLevelTypeVal() { return "singleton"; }
+
+Attribute SparseTensorEncodingAttr::parse(MLIRContext *context,
+                                          DialectAsmParser &parser, Type type) {
+  if (failed(parser.parseLess()))
+    return {};
+  DictionaryAttr dict;
+  if (failed(parser.parseAttribute(dict)))
+    return {};
+  if (failed(parser.parseGreater()))
+    return {};
+  return SparseTensorEncodingAttr::get(context, dict);
+}
+
+void SparseTensorEncodingAttr::print(DialectAsmPrinter &printer) const {
+  printer << "sparse<" << getDict() << ">";
+}
+
+LogicalResult SparseTensorEncodingAttr::verifyEncoding(
+    llvm::ArrayRef<int64_t> shape, Type elementType,
+    llvm::function_ref<mlir::InFlightDiagnostic()> emitError) const {
+  unsigned size = shape.size();
+  for (const NamedAttribute &attr : getDict()) {
+    if (attr.first == getSparseDimLevelTypeAttrName()) {
+      // Dimension level type verification.
+      auto arrayAttr = attr.second.dyn_cast<ArrayAttr>();
+      if (!arrayAttr || size != static_cast<int64_t>(arrayAttr.size()))
+        return emitError() << "expected an array of size " << size
+                           << " for dimension level types";
+      for (unsigned i = 0; i < size; i++) {
+        auto strAttr = arrayAttr[i].dyn_cast<StringAttr>();
+        if (!strAttr)
+          return emitError()
+                 << "expected string value in dimension level types";
+        auto strVal = strAttr.getValue();
+        if (strVal != getDenseDimLevelTypeVal() &&
+            strVal != getCompressedDimLevelTypeVal() &&
+            strVal != getSingletonDimLevelTypeVal())
+          return emitError() << "unexpected dimension level type: " << strAttr;
+      }
+    } else if (attr.first == getSparseDimOrderingAttrName()) {
+      // Dimension order verification.
+      auto affineAttr = attr.second.dyn_cast<AffineMapAttr>();
+      if (!affineAttr)
+        return emitError() << "expected an affine map for dimension ordering";
+      AffineMap map = affineAttr.getValue();
+      if (size != map.getNumResults() || !map.isPermutation())
+        return emitError() << "expected a permutation affine map of size "
+                           << size << " for dimension ordering";
+    } else if (attr.first == getSparsePointerBitWidthAttrName() ||
+               attr.first == getSparseIndexBitWidthAttrName()) {
+      // Pointer or index bitwidth verification.
+      auto intAttr = attr.second.dyn_cast<IntegerAttr>();
+      if (!intAttr)
+        return emitError() << "expected an integral bitwidth";
+      switch (intAttr.getInt()) {
+      case 0:
+      case 8:
+      case 16:
+      case 32:
+      case 64:
+        continue;
+      default:
+        return emitError() << "unexpected bitwidth: " << intAttr.getInt();
+      }
+    } else {
+      return emitError() << "unexpected key: " << attr.first.str();
+    }
+  }
+  return success();
+}
+
+SparseTensorEncodingAttr::DimLevelType
+SparseTensorEncodingAttr::getDimLevelType(unsigned dim) const {
+  if (auto value = getDict().get(getSparseDimLevelTypeAttrName())) {
+    auto strVal =
+        value.dyn_cast<ArrayAttr>()[dim].cast<StringAttr>().getValue();
+    if (strVal == getCompressedDimLevelTypeVal())
+      return DimLevelType::Compressed;
+    if (strVal == getSingletonDimLevelTypeVal())
+      return DimLevelType::Singleton;
+  }
+  return DimLevelType::Dense;
+}
+
+AffineMap SparseTensorEncodingAttr::getDimOrdering() const {
+  if (auto value = getDict().get(getSparseDimOrderingAttrName()))
+    return value.cast<AffineMapAttr>().getValue();
+  return {};
+}
+
+unsigned SparseTensorEncodingAttr::getPointerBitWidth() const {
+  if (auto value = getDict().get(getSparsePointerBitWidthAttrName()))
+    return value.cast<IntegerAttr>().getInt();
+  return 0;
+}
+
+unsigned SparseTensorEncodingAttr::getIndexBitWidth() const {
+  if (auto value = getDict().get(getSparseIndexBitWidthAttrName()))
+    return value.cast<IntegerAttr>().getInt();
+  return 0;
+}
+
 //===----------------------------------------------------------------------===//
 // TensorDialect Dialect Interfaces
 //===----------------------------------------------------------------------===//
@@ -30,10 +161,38 @@ struct TensorInlinerInterface : public DialectInlinerInterface {
 };
 } // end anonymous namespace
 
+//===----------------------------------------------------------------------===//
+// TensorDialect Methods
+//===----------------------------------------------------------------------===//
+
 void TensorDialect::initialize() {
+  addAttributes<
+#define GET_ATTRDEF_LIST
+#include "mlir/Dialect/Tensor/IR/TensorAttrDefs.cpp.inc"
+      >();
   addOperations<
 #define GET_OP_LIST
 #include "mlir/Dialect/Tensor/IR/TensorOps.cpp.inc"
       >();
   addInterfaces<TensorInlinerInterface>();
 }
+
+Attribute TensorDialect::parseAttribute(DialectAsmParser &parser,
+                                        Type type) const {
+  StringRef attrTag;
+  if (failed(parser.parseKeyword(&attrTag)))
+    return Attribute();
+  Attribute attr;
+  auto parseResult =
+      generatedAttributeParser(getContext(), parser, attrTag, type, attr);
+  if (parseResult.hasValue())
+    return attr;
+  parser.emitError(parser.getNameLoc(), "unknown tensor attribute");
+  return Attribute();
+}
+
+void TensorDialect::printAttribute(::mlir::Attribute attr,
+                                   ::mlir::DialectAsmPrinter &printer) const {
+  if (succeeded(generatedAttributePrinter(attr, printer)))
+    return;
+}