llvm
diff --git a/‎mlir/include/mlir/Dialect/XeGPU/uArch/IntelGpuXe2.h‎
Lines changed: 170 additions & 22 deletions b/‎mlir/include/mlir/Dialect/XeGPU/uArch/IntelGpuXe2.h‎
Lines changed: 170 additions & 22 deletions
diff --git a/‎mlir/include/mlir/Dialect/XeGPU/uArch/uArchBase.h‎
Lines changed: 43 additions & 0 deletions b/‎mlir/include/mlir/Dialect/XeGPU/uArch/uArchBase.h‎
Lines changed: 43 additions & 0 deletions
diff --git a/‎mlir/include/mlir/Dialect/XeGPU/uArch/uArchInterfaces.h‎
Lines changed: 0 additions & 74 deletions b/‎mlir/include/mlir/Dialect/XeGPU/uArch/uArchInterfaces.h‎
Lines changed: 0 additions & 74 deletions
diff --git a/‎mlir/lib/Dialect/LLVMIR/CMakeLists.txt‎
Lines changed: 0 additions & 1 deletion b/‎mlir/lib/Dialect/LLVMIR/CMakeLists.txt‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎mlir/lib/Dialect/LLVMIR/IR/XeVMDialect.cpp‎
Lines changed: 0 additions & 1 deletion b/‎mlir/lib/Dialect/LLVMIR/IR/XeVMDialect.cpp‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎mlir/lib/Dialect/XeGPU/CMakeLists.txt‎
Lines changed: 0 additions & 1 deletion b/‎mlir/lib/Dialect/XeGPU/CMakeLists.txt‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎mlir/lib/Dialect/XeGPU/IR/CMakeLists.txt‎
Lines changed: 0 additions & 1 deletion b/‎mlir/lib/Dialect/XeGPU/IR/CMakeLists.txt‎
Lines changed: 0 additions & 1 deletion
@@ -15,17 +15,22 @@
 #ifndef MLIR_DIALECT_XEGPU_UARCH_INTELGPUXE2_H
 #define MLIR_DIALECT_XEGPU_UARCH_INTELGPUXE2_H
 
-#include "mlir/Dialect/XeGPU/uArch/uArchInterfaces.h"
+#include "mlir/Dialect/XeGPU/uArch/uArchBase.h"
 #include "mlir/IR/BuiltinTypes.h"
 #include "mlir/IR/TypeUtilities.h"
+#include "llvm/Support/DebugLog.h"
 #include <map>
 #include <string>
 #include <vector>
 
+#define DEBUG_TYPE "xegpu-uarch"
+
+using namespace mlir;
+using namespace mlir::xegpu::uArch;
+
 namespace mlir {
 namespace xegpu {
 namespace uArch {
-namespace Xe2Plus {
 struct XeCoreInfo {
   uint32_t num_threads;
   SharedMemory shared_memory;
@@ -61,30 +66,27 @@ struct DPASInstruction : public Instruction, public MMAInstructionInterface {
 
   // Override all virtuals from MatrixOpInterface
   virtual std::vector<std::pair<uint32_t, uint32_t>>
-  getSupportedShapes(mlir::Type dataType, MMAOpndKind matrixType) override;
-  virtual std::vector<mlir::Type>
-  getSupportedTypes(MLIRContext &context, MMAOpndKind matrixType) override;
+  getSupportedShapes(Type dataType, MMAOpndKind matrixType) override;
+  virtual std::vector<Type> getSupportedTypes(MLIRContext &context,
+                                              MMAOpndKind matrixType) override;
   virtual bool
   checkSupportedShapesAndTypes(std::pair<uint32_t, uint32_t> AShape,
                                std::pair<uint32_t, uint32_t> BShape,
                                std::pair<uint32_t, uint32_t> CShape,
-                               std::pair<uint32_t, uint32_t> DShape,
-                               mlir::Type AType, mlir::Type BType,
-                               mlir::Type CType, mlir::Type DType) override;
-  virtual bool checkSupportedTypes(mlir::Type AType, mlir::Type BType,
-                                   mlir::Type CType, mlir::Type DType) override;
+                               std::pair<uint32_t, uint32_t> DShape, Type AType,
+                               Type BType, Type CType, Type DType) override;
+  virtual bool checkSupportedTypes(Type AType, Type BType, Type CType,
+                                   Type DType) override;
   virtual bool validate(std::pair<uint32_t, uint32_t> AShape,
                         std::pair<uint32_t, uint32_t> BShape,
                         std::pair<uint32_t, uint32_t> CShape,
-                        std::pair<uint32_t, uint32_t> DShape, mlir::Type AType,
-                        mlir::Type BType, mlir::Type CType,
-                        mlir::Type DType) override;
-  virtual std::vector<uint32_t> getSupportedM(mlir::Type type) override;
-  virtual std::vector<uint32_t> getSupportedK(mlir::Type type) override;
-  virtual std::vector<uint32_t> getSupportedN(mlir::Type type) override;
+                        std::pair<uint32_t, uint32_t> DShape, Type AType,
+                        Type BType, Type CType, Type DType) override;
+  virtual std::vector<uint32_t> getSupportedM(Type type) override;
+  virtual std::vector<uint32_t> getSupportedK(Type type) override;
+  virtual std::vector<uint32_t> getSupportedN(Type type) override;
 };
 
-namespace PVCuArch {
 struct PVCuArch : public Xe2Plus {
   // Maintaines ownership of the instructions owned by PVUarch
   std::vector<std::shared_ptr<Instruction>> owned_instructions;
@@ -120,9 +122,7 @@ struct PVCuArch : public Xe2Plus {
     owned_instructions.push_back(dpas);
   }
 };
-} // namespace PVCuArch
 
-namespace BMGuArch {
 struct BMGuArch : public Xe2Plus {
   // Maintaines ownership of the instructions owned by PVUarch
   std::vector<std::shared_ptr<Instruction>> owned_instructions;
@@ -156,11 +156,159 @@ struct BMGuArch : public Xe2Plus {
     owned_instructions.push_back(dpas);
   }
 };
-} // namespace BMGuArch
-
-} // namespace Xe2Plus
 } // namespace uArch
 } // namespace xegpu
 } // namespace mlir
 
+/// Returns every (first, second) shape DPAS accepts for the operand selected
+/// by `matrixType` when its element type is `dataType`.
+///
+/// The result is the cross product of the supported sizes of the two
+/// dimensions that make up the operand: A is MxK, B is KxN, C and D are MxN.
+///
+/// Only the two dimensions the operand actually uses are queried. K is not
+/// needed for C/D, so a C/D query no longer runs into the type assertion in
+/// getSupportedK() (e.g. for an absent accumulator type).
+///
+/// An out-of-range `matrixType` yields an empty list.
+inline std::vector<std::pair<uint32_t, uint32_t>>
+DPASInstruction::getSupportedShapes(Type dataType, MMAOpndKind matrixType) {
+  // Cartesian product of two dimension lists; the outer dimension varies
+  // slowest.
+  auto combineVectors = [](const std::vector<uint32_t> &outer,
+                           const std::vector<uint32_t> &inner)
+      -> std::vector<std::pair<uint32_t, uint32_t>> {
+    std::vector<std::pair<uint32_t, uint32_t>> result;
+    result.reserve(outer.size() * inner.size());
+    for (uint32_t x : outer)
+      for (uint32_t y : inner)
+        result.emplace_back(x, y);
+    return result;
+  };
+
+  switch (matrixType) {
+  case MMAOpndKind::MatrixA: {
+    const auto M = getSupportedM(dataType);
+    const auto K = getSupportedK(dataType);
+    return combineVectors(M, K);
+  }
+  case MMAOpndKind::MatrixB: {
+    const auto K = getSupportedK(dataType);
+    const auto N = getSupportedN(dataType);
+    return combineVectors(K, N);
+  }
+  case MMAOpndKind::MatrixC:
+  case MMAOpndKind::MatrixD: {
+    // Accumulator and result share the MxN shape; K plays no role here.
+    const auto M = getSupportedM(dataType);
+    const auto N = getSupportedN(dataType);
+    return combineVectors(M, N);
+  }
+  }
+  // Unknown operand kind: nothing is supported.
+  return {};
+}
+
+/// Returns the element types DPAS accepts for the operand `matrixType`.
+///
+/// The types are created in `context`, so they compare equal to other types
+/// obtained from that same context.
+///   - A and B: bf16, f16, tf32
+///   - C and D: bf16, f16, f32
+inline std::vector<Type>
+DPASInstruction::getSupportedTypes(MLIRContext &context,
+                                   MMAOpndKind matrixType) {
+  Type bf16Type = BFloat16Type::get(&context);
+  Type f16Type = Float16Type::get(&context);
+  Type tf32Type = FloatTF32Type::get(&context);
+  Type f32Type = Float32Type::get(&context);
+
+  switch (matrixType) {
+  case MMAOpndKind::MatrixA:
+  case MMAOpndKind::MatrixB:
+    return {bf16Type, f16Type, tf32Type};
+  case MMAOpndKind::MatrixC:
+  case MMAOpndKind::MatrixD:
+    return {bf16Type, f16Type, f32Type};
+  }
+  // The switch covers every enumerator. Without this, control could fall off
+  // the end of a non-void function (undefined behavior, and a -Wreturn-type
+  // warning on some compilers).
+  llvm_unreachable("Unknown MMAOpndKind");
+}
+
+/// Returns true if the element types of the A, B, accumulator (C) and result
+/// (D) matrices form a combination DPAS supports. `CType` may be null, in
+/// which case the accumulator is not checked.
+///
+/// Rules, selected by the A/B element type:
+///   - f16:  A == B; C (if present) and D are each f32 or f16.
+///   - bf16: A == B; C (if present) and D are each f32 or bf16.
+///   - tf32: A == B; C (if present) and D are f32.
+///   - otherwise: A and B must both be 2-, 4- or 8-bit integers (C and D are
+///     not checked on this path).
+///
+/// A rejected combination is reported through LDBG() before returning false.
+inline bool DPASInstruction::checkSupportedTypes(Type AType, Type BType,
+                                                 Type CType, Type DType) {
+  // Integer element widths accepted for the A and B operands.
+  auto isSupportedInt = [](Type t) {
+    return t.isInteger(2) || t.isInteger(4) || t.isInteger(8);
+  };
+
+  if (AType.isF16() || BType.isF16()) {
+    if (AType != BType || (CType && (!CType.isF32() && !CType.isF16())) ||
+        (!DType.isF32() && !DType.isF16())) {
+      LDBG() << "Unsupported dpas combinations of Dst, Acc, A and B matrices.";
+      return false;
+    }
+  } else if (AType.isBF16() || BType.isBF16()) {
+    if (AType != BType || (CType && (!CType.isF32() && !CType.isBF16())) ||
+        (!DType.isF32() && !DType.isBF16())) {
+      LDBG() << "Unsupported dpas combinations of Dst, Acc, A and B matrices.";
+      return false;
+    }
+  } else if (AType.isTF32() || BType.isTF32()) {
+    // The accumulator check must look at CType itself. Testing DType here
+    // (as the F16/BF16 branches do not) would let a non-f32 accumulator
+    // through whenever the result type is f32.
+    if (AType != BType || (CType && !CType.isF32()) || !DType.isF32()) {
+      LDBG() << "Unsupported dpas combinations of Dst, Acc, A and B matrices.";
+      return false;
+    }
+  } else if (!isSupportedInt(AType) || !isSupportedInt(BType)) {
+    // Both inputs have to be supported integers; rejecting only when *both*
+    // are unsupported would accept mixed pairs such as i8 x f32.
+    LDBG() << "Unsupported dpas combinations of Dst, Acc, A and B matrices.";
+    return false;
+  }
+
+  return true;
+}
+
+/// Returns true only if each of the four operand shapes is among the shapes
+/// supported for that operand's element type and the element-type
+/// combination itself is supported.
+///
+/// All four supported-shape lists are computed up front; the type
+/// combination is examined last, and only when every shape matched.
+inline bool DPASInstruction::checkSupportedShapesAndTypes(
+    std::pair<uint32_t, uint32_t> AShape, std::pair<uint32_t, uint32_t> BShape,
+    std::pair<uint32_t, uint32_t> CShape, std::pair<uint32_t, uint32_t> DShape,
+    Type AType, Type BType, Type CType, Type DType) {
+  const auto shapesForA = getSupportedShapes(AType, MMAOpndKind::MatrixA);
+  const auto shapesForB = getSupportedShapes(BType, MMAOpndKind::MatrixB);
+  const auto shapesForC = getSupportedShapes(CType, MMAOpndKind::MatrixC);
+  const auto shapesForD = getSupportedShapes(DType, MMAOpndKind::MatrixD);
+
+  if (!llvm::is_contained(shapesForA, AShape))
+    return false;
+  if (!llvm::is_contained(shapesForB, BShape))
+    return false;
+  if (!llvm::is_contained(shapesForC, CShape))
+    return false;
+  if (!llvm::is_contained(shapesForD, DShape))
+    return false;
+
+  return checkSupportedTypes(AType, BType, CType, DType);
+}
+
+/// Validates a DPAS configuration. This forwards all shapes and element
+/// types, unchanged, to checkSupportedShapesAndTypes() and returns its
+/// result.
+inline bool DPASInstruction::validate(std::pair<uint32_t, uint32_t> AShape,
+                                      std::pair<uint32_t, uint32_t> BShape,
+                                      std::pair<uint32_t, uint32_t> CShape,
+                                      std::pair<uint32_t, uint32_t> DShape,
+                                      Type AType, Type BType, Type CType,
+                                      Type DType) {
+  const bool isSupported = checkSupportedShapesAndTypes(
+      AShape, BShape, CShape, DShape, AType, BType, CType, DType);
+  return isSupported;
+}
+
+/// Returns the supported M sizes: every value from 1 through 8. The element
+/// type is not consulted.
+inline std::vector<uint32_t> DPASInstruction::getSupportedM(Type type) {
+  std::vector<uint32_t> mSizes;
+  for (uint32_t m = 1; m <= 8; ++m)
+    mSizes.push_back(m);
+  return mSizes;
+}
+
+/// Returns the single supported K size for an element type, chosen by the
+/// type's bit width: 2 or 4 bits -> 64, 8 bits -> 32, 16 bits -> 16,
+/// 32 bits -> 8.
+///
+/// `type` must be an integer or floating-point type (asserted); any other
+/// bit width is treated as unreachable.
+inline std::vector<uint32_t> DPASInstruction::getSupportedK(Type type) {
+  assert(type.isIntOrFloat() && "Matrix type must be int or float");
+  switch (type.getIntOrFloatBitWidth()) {
+  case 2:
+  case 4:
+    return {64};
+  case 8:
+    return {32};
+  case 16:
+    return {16};
+  case 32:
+    return {8};
+  default:
+    llvm_unreachable("Invalid int or float");
+  }
+}
+
+/// Returns the supported N sizes: only 16. The element type is not
+/// consulted.
+inline std::vector<uint32_t> DPASInstruction::getSupportedN(Type type) {
+  std::vector<uint32_t> nSizes;
+  nSizes.push_back(16);
+  return nSizes;
+}
+
 #endif // MLIR_DIALECT_XEGPU_UARCH_INTELGPUXE2H
@@ -199,6 +199,49 @@ struct SharedMemory {
   // @TODO: Add more fields as needed (e.g., latency, throughput, bandwidth)
 };
 
+//===----------------------------------------------------------------------===//
+// Interfaces
+//===----------------------------------------------------------------------===//
+// Selects which operand of a matrix multiply-accumulate instruction a query
+// refers to. In the Xe2 DPAS implementation, A shapes are built from (M, K),
+// B shapes from (K, N), and both C and D shapes from (M, N).
+enum class MMAOpndKind { MatrixA, MatrixB, MatrixC, MatrixD };
+// Interface for instructions that perform a matrix multiply-accumulate. It
+// exposes queries for the operand shapes and element types an instruction
+// supports, plus checks for a concrete combination of the A, B, C and D
+// operands. Every method is pure virtual.
+struct MMAInstructionInterface {
+  // Returns the supported shapes, as pairs of dimension sizes, for the
+  // operand `matrixType` when its element type is `dataType`.
+  virtual std::vector<std::pair<uint32_t, uint32_t>>
+  getSupportedShapes(Type dataType, MMAOpndKind matrixType) = 0;
+  // Returns the element types supported for the operand `matrixType`.
+  //
+  // @TODO: This method takes a context object as a parameter so that the Type
+  // objects are created in that context. Type objects are uniqued per
+  // context, so checks such as "aType == bType" (where aType and bType denote
+  // the same type) only work when both types come from the same context.
+  //
+  // One alternative is an enum that represents each type, but that puts an
+  // extra burden on the user to convert the enums to concrete types. In fact,
+  // a utility converting enum to Type (and vice versa) would still have to
+  // use the context object.
+  //
+  // Until we have a better solution, we stick to passing the context object
+  // to this method.
+  virtual std::vector<Type> getSupportedTypes(MLIRContext &context,
+                                              MMAOpndKind matrixType) = 0;
+  // Checks the four operand shapes together with the four operand element
+  // types; returns true if the combination is supported.
+  virtual bool
+  checkSupportedShapesAndTypes(std::pair<uint32_t, uint32_t> AShape,
+                               std::pair<uint32_t, uint32_t> BShape,
+                               std::pair<uint32_t, uint32_t> CShape,
+                               std::pair<uint32_t, uint32_t> DShape, Type AType,
+                               Type BType, Type CType, Type DType) = 0;
+  // Checks only the element types of the four operands; returns true if the
+  // combination is supported.
+  virtual bool checkSupportedTypes(Type AType, Type BType, Type CType,
+                                   Type DType) = 0;
+  // Validates the given operand shapes and element types for this
+  // instruction.
+  virtual bool validate(std::pair<uint32_t, uint32_t> AShape,
+                        std::pair<uint32_t, uint32_t> BShape,
+                        std::pair<uint32_t, uint32_t> CShape,
+                        std::pair<uint32_t, uint32_t> DShape, Type AType,
+                        Type BType, Type CType, Type DType) = 0;
+  // Return the supported sizes of the M, K and N dimensions, respectively,
+  // for the element type `type`.
+  virtual std::vector<uint32_t> getSupportedM(Type type) = 0;
+  virtual std::vector<uint32_t> getSupportedK(Type type) = 0;
+  virtual std::vector<uint32_t> getSupportedN(Type type) = 0;
+
+  // Virtual so implementations can be destroyed through this interface.
+  virtual ~MMAInstructionInterface() = default;
+};
+
 } // namespace uArch
 } // namespace xegpu
 } // namespace mlir
 
@@ -128,6 +128,5 @@ add_mlir_dialect_library(MLIRXeVMDialect
   MLIRDialectUtils
   MLIRIR
   MLIRLLVMDialect
-  MLIRXeGPUuArch
   MLIRSideEffectInterfaces
 )
@@ -8,7 +8,6 @@
 #include "mlir/Dialect/LLVMIR/XeVMDialect.h"
 #include "mlir/Dialect/GPU/IR/CompilationInterfaces.h"
 #include "mlir/Dialect/Utils/StaticValueUtils.h"
-#include "mlir/Dialect/XeGPU/uArch/IntelGpuXe2.h"
 #include "mlir/IR/DialectImplementation.h"
 #include "llvm/ADT/TypeSwitch.h"
 #include "llvm/Support/FileSystem.h"
 
@@ -1,4 +1,3 @@
 add_subdirectory(IR)
 add_subdirectory(Transforms)
-add_subdirectory(uArch)
 add_subdirectory(Utils)
@@ -18,7 +18,6 @@ add_mlir_dialect_library(MLIRXeGPUDialect
   MLIRArithUtils
   MLIRDialectUtils
   MLIRIR
-  MLIRXeGPUuArch
   MLIRViewLikeInterface
   MLIRVectorDialect
 )
Original file line number	Diff line number	Diff line change
`@@ -128,6 +128,5 @@ add_mlir_dialect_library(MLIRXeVMDialect`
`128`	`128`	`MLIRDialectUtils`
`129`	`129`	`MLIRIR`
`130`	`130`	`MLIRLLVMDialect`
`131`		`- MLIRXeGPUuArch`
`132`	`131`	`MLIRSideEffectInterfaces`
`133`	`132`	`)`
Original file line number	Diff line number	Diff line change
`@@ -18,7 +18,6 @@ add_mlir_dialect_library(MLIRXeGPUDialect`
`18`	`18`	`MLIRArithUtils`
`19`	`19`	`MLIRDialectUtils`
`20`	`20`	`MLIRIR`
`21`		`- MLIRXeGPUuArch`
`22`	`21`	`MLIRViewLikeInterface`
`23`	`22`	`MLIRVectorDialect`
`24`	`23`	`)`