Address review comments.

mshahneo · mshahneo · commit 38ff707197ab · 2025-09-25T15:49:17.000Z
Use LLVM data structures whenever possible.
diff --git a/mlir/include/mlir/Dialect/XeGPU/uArch/IntelGpuXe2.h b/mlir/include/mlir/Dialect/XeGPU/uArch/IntelGpuXe2.h
@@ -18,10 +18,10 @@
 #include "mlir/Dialect/XeGPU/uArch/uArchBase.h"
 #include "mlir/IR/BuiltinTypes.h"
 #include "mlir/IR/TypeUtilities.h"
+#include "llvm/ADT/SmallVector.h"
 #include "llvm/Support/DebugLog.h"
 #include <map>
 #include <string>
-#include <vector>
 
 #define DEBUG_TYPE "xegpu-uarch"
 
@@ -47,28 +47,29 @@ struct XeCoreInfo {
 
 struct Xe2Plus : public uArch {
   XeCoreInfo xe_core;
-  Xe2Plus(
-      const std::string &archName, const std::string &archDescription,
-      const XeCoreInfo &xeCore,
-      const std::map<RegisterFileType, RegisterFileInfo> &regInfo = {},
-      const std::vector<CacheInfo> &cacheInfo = {},
-      const std::map<std::string, std::shared_ptr<Instruction>> &instrs = {})
+  Xe2Plus(const std::string &archName, const std::string &archDescription,
+          const XeCoreInfo &xeCore,
+          const std::map<RegisterFileType, RegisterFileInfo> &regInfo = {},
+          const llvm::SmallVector<CacheInfo, 4> &cacheInfo = {},
+          const std::map<InstructionKind, std::shared_ptr<Instruction>>
+              &instrs = {})
       : uArch(archName, archDescription, regInfo, cacheInfo, instrs),
         xe_core(xeCore) {}
 };
 
 // struct to represent DPAS instruction
 struct DPASInstruction : public Instruction, public MMAInstructionInterface {
   DPASInstruction()
-      : Instruction("dpas",                   // name
-                    "Dot Product Accumulate") // description
+      : Instruction(InstructionKind::DPAS,      // kind
+                    "Dot Product Accumulate",   // description
+                    InstructionScope::Subgroup) // scope
   {}
 
   // Override all virtuals from MatrixOpInterface
-  virtual std::vector<std::pair<uint32_t, uint32_t>>
+  virtual llvm::SmallVector<std::pair<uint32_t, uint32_t>, 16>
   getSupportedShapes(Type dataType, MMAOpndKind matrixType) override;
-  virtual std::vector<Type> getSupportedTypes(MLIRContext &context,
-                                              MMAOpndKind matrixType) override;
+  virtual llvm::SmallVector<Type, 8>
+  getSupportedTypes(MLIRContext &context, MMAOpndKind matrixType) override;
   virtual bool
   checkSupportedShapesAndTypes(std::pair<uint32_t, uint32_t> AShape,
                                std::pair<uint32_t, uint32_t> BShape,
@@ -82,14 +83,14 @@ struct DPASInstruction : public Instruction, public MMAInstructionInterface {
                         std::pair<uint32_t, uint32_t> CShape,
                         std::pair<uint32_t, uint32_t> DShape, Type AType,
                         Type BType, Type CType, Type DType) override;
-  virtual std::vector<uint32_t> getSupportedM(Type type) override;
-  virtual std::vector<uint32_t> getSupportedK(Type type) override;
-  virtual std::vector<uint32_t> getSupportedN(Type type) override;
+  virtual llvm::SmallVector<uint32_t, 8> getSupportedM(Type type) override;
+  virtual llvm::SmallVector<uint32_t, 8> getSupportedK(Type type) override;
+  virtual llvm::SmallVector<uint32_t, 8> getSupportedN(Type type) override;
 };
 
 struct PVCuArch : public Xe2Plus {
   // Maintaines ownership of the instructions owned by PVUarch
-  std::vector<std::shared_ptr<Instruction>> owned_instructions;
+  llvm::SmallVector<std::shared_ptr<Instruction>, 8> owned_instructions;
   PVCuArch()
       : Xe2Plus("pvc",                        // archName
                 "Ponte Vecchio Architecture", // archDescription
@@ -115,17 +116,16 @@ struct PVCuArch : public Xe2Plus {
     this->cacheInfo.push_back(
         CacheInfo(512 * 1024, 64, CacheHierarchyLevel::L2));
 
-    // Add the instructions
+    // Add the instructions
     auto dpas = std::make_shared<DPASInstruction>();
-    instructions.emplace(dpas->getName(), dpas);
-    // instructions[dpas->name] = dpas.get();
+    instructions.emplace(dpas->getInstructionKind(), dpas);
     owned_instructions.push_back(dpas);
   }
 };
 
 struct BMGuArch : public Xe2Plus {
   // Maintaines ownership of the instructions owned by PVUarch
-  std::vector<std::shared_ptr<Instruction>> owned_instructions;
+  llvm::SmallVector<std::shared_ptr<Instruction>, 8> owned_instructions;
   BMGuArch()
       : Xe2Plus("bmg",                     // archName
                 "Battlemage Architecture", // archDescription
@@ -151,21 +151,20 @@ struct BMGuArch : public Xe2Plus {
 
     // Add the instructions
     auto dpas = std::make_shared<DPASInstruction>();
-    instructions.emplace(dpas->getName(), dpas);
-    // instructions[dpas->name] = dpas.get();
+    instructions.emplace(dpas->getInstructionKind(), dpas);
     owned_instructions.push_back(dpas);
   }
 };
 } // namespace uArch
 } // namespace xegpu
 } // namespace mlir
 
-inline std::vector<std::pair<uint32_t, uint32_t>>
+inline llvm::SmallVector<std::pair<uint32_t, uint32_t>, 16>
 DPASInstruction::getSupportedShapes(Type dataType, MMAOpndKind matrixType) {
-  auto combineVectors = [](const std::vector<uint32_t> &a,
-                           const std::vector<uint32_t> &b)
-      -> std::vector<std::pair<uint32_t, uint32_t>> {
-    std::vector<std::pair<uint32_t, uint32_t>> result;
+  auto combineVectors = [](const llvm::SmallVector<uint32_t, 8> &a,
+                           const llvm::SmallVector<uint32_t, 8> &b)
+      -> llvm::SmallVector<std::pair<uint32_t, uint32_t>, 16> {
+    llvm::SmallVector<std::pair<uint32_t, uint32_t>, 16> result;
     for (unsigned x : a) {
       for (unsigned y : b) {
         result.emplace_back(x, y);
@@ -177,7 +176,7 @@ DPASInstruction::getSupportedShapes(Type dataType, MMAOpndKind matrixType) {
   auto M = getSupportedM(dataType);
   auto K = getSupportedK(dataType);
   auto N = getSupportedN(dataType);
-  std::vector<std::pair<unsigned, unsigned>> resultMatrix;
+  llvm::SmallVector<std::pair<unsigned, unsigned>, 16> resultMatrix;
 
   switch (matrixType) {
   case MMAOpndKind::MatrixA:
@@ -196,7 +195,7 @@ DPASInstruction::getSupportedShapes(Type dataType, MMAOpndKind matrixType) {
   return resultMatrix;
 }
 
-inline std::vector<Type>
+inline llvm::SmallVector<Type, 8>
 DPASInstruction::getSupportedTypes(MLIRContext &context,
                                    MMAOpndKind matrixType) {
   Type bf16Type = BFloat16Type::get(&context);
@@ -207,17 +206,14 @@ DPASInstruction::getSupportedTypes(MLIRContext &context,
   switch (matrixType) {
   case MMAOpndKind::MatrixA:
     return {bf16Type, f16Type, tf32Type};
-    break;
   case MMAOpndKind::MatrixB:
     return {bf16Type, f16Type, tf32Type};
-    break;
   case MMAOpndKind::MatrixC:
     return {bf16Type, f16Type, f32Type};
-    break;
   case MMAOpndKind::MatrixD:
     return {bf16Type, f16Type, f32Type};
-    break;
   }
+  return {};
 }
 
 inline bool DPASInstruction::checkSupportedTypes(Type AType, Type BType,
@@ -276,11 +272,13 @@ inline bool DPASInstruction::validate(std::pair<uint32_t, uint32_t> AShape,
                                       BType, CType, DType);
 }
 
-inline std::vector<uint32_t> DPASInstruction::getSupportedM(Type type) {
+inline llvm::SmallVector<uint32_t, 8>
+DPASInstruction::getSupportedM(Type type) {
   return {1, 2, 3, 4, 5, 6, 7, 8};
 }
 
-inline std::vector<uint32_t> DPASInstruction::getSupportedK(Type type) {
+inline llvm::SmallVector<uint32_t, 8>
+DPASInstruction::getSupportedK(Type type) {
   // assert if data type is not int or float type
   assert(type.isIntOrFloat() && "Matrix type must be int or float");
   auto bitWidth = type.getIntOrFloatBitWidth();
@@ -307,8 +305,9 @@ inline std::vector<uint32_t> DPASInstruction::getSupportedK(Type type) {
   return {kSize};
 }
 
-inline std::vector<uint32_t> DPASInstruction::getSupportedN(Type type) {
+inline llvm::SmallVector<uint32_t, 8>
+DPASInstruction::getSupportedN(Type type) {
   return {16};
 }
 
-#endif // MLIR_DIALECT_XEGPU_UARCH_INTELGPUXE2H
+#endif // MLIR_DIALECT_XEGPU_UARCH_INTELGPUXE2_H
diff --git a/mlir/include/mlir/Dialect/XeGPU/uArch/uArchBase.h b/mlir/include/mlir/Dialect/XeGPU/uArch/uArchBase.h
@@ -23,6 +23,7 @@
 #include <tuple>
 
 #include "mlir/IR/Types.h"
+#include "llvm/ADT/SmallVector.h"
 
 namespace mlir {
 namespace xegpu {
@@ -31,12 +32,33 @@ namespace uArch {
 // An enum class to represent the scope of an instruction
 enum class InstructionScope { WorkItem, Subgroup, Workgroup, Cluster };
 
-enum class InstructionName {
-  DPAS, // Dot Product Accumulate Systolic (DPAS) is a matrix multiply-add
-        // operation
+enum class InstructionKind {
+  DPAS, // Dot Product Accumulate Systolic (DPAS) is a matrix
+        // multiply-add operation
   // Add more instructions as needed
 };
 
+// Returns the lower-case mnemonic for an instruction kind, e.g. "dpas".
+// Marked inline because it is defined in a header: without it, every
+// translation unit that includes this file emits its own external
+// definition, which violates the ODR and fails at link time.
+inline llvm::StringRef toString(InstructionKind name) {
+  switch (name) {
+  case InstructionKind::DPAS:
+    return "dpas";
+  }
+  llvm_unreachable("Unknown InstructionKind");
+}
+
+// Parses an instruction mnemonic, ignoring case. Returns std::nullopt when
+// the string does not name a known InstructionKind. Inline for the same
+// header-definition reason as toString.
+inline std::optional<InstructionKind>
+parseInstructionKind(llvm::StringRef str) {
+  if (str.equals_insensitive("dpas"))
+    return InstructionKind::DPAS;
+  return std::nullopt;
+}
+
 // A struct to represent basic information about an instruction
 // This struct is used to represent the information about an instruction in the
 // uArch The information includes:
@@ -56,17 +71,17 @@ enum class InstructionName {
 
 struct Instruction {
   // @TODO: Add more fields as needed
-  Instruction(std::string name, std::string desc)
-      : name(std::move(name)), description(std::move(desc)) {}
+  Instruction(InstructionKind kind, std::string desc, InstructionScope scope)
+      : instKind(kind), description(std::move(desc)), scope(scope) {}
 
   virtual ~Instruction() = default;
   // Get methods
-  std::string getName() { return name; }
+  InstructionKind getInstructionKind() { return instKind; }
   std::string getDescription() { return description; }
   InstructionScope getScope() { return scope; }
 
 protected:
-  std::string name;
+  InstructionKind instKind;
   std::string description;
   InstructionScope scope;
 };
@@ -78,23 +93,25 @@ enum class RegisterFileType : uint8_t { GRF, ARF };
 struct RegisterFileInfo {
   // Constructor
   RegisterFileInfo() = default;
-  RegisterFileInfo(uint32_t size, const std::vector<RegisterFileMode> &mode,
-                   const std::vector<uint32_t> &numRegs)
+  RegisterFileInfo(uint32_t size,
+                   const llvm::SmallVector<RegisterFileMode, 4> &mode,
+                   const llvm::SmallVector<uint32_t, 4> &numRegs)
       : size(size), mode(mode), numRegsPerThreadPerMode(numRegs) {}
 
   uint32_t getSize() const { return size; }
-  const std::vector<RegisterFileMode> &getModes() const { return mode; }
-  const std::vector<uint32_t> &getNumRegsPerThreadPerMode() const {
+  const llvm::SmallVector<RegisterFileMode, 4> &getModes() const {
+    return mode;
+  }
+  const llvm::SmallVector<uint32_t, 4> &getNumRegsPerThreadPerMode() const {
     return numRegsPerThreadPerMode;
   }
 
 protected:
-  uint32_t size;                      // size per register in bits
-  std::vector<RegisterFileMode> mode; // e.g., "small", "large" GRF modes
-  std::vector<uint32_t>
+  uint32_t size; // size per register in bits
+  llvm::SmallVector<RegisterFileMode, 4>
+      mode; // e.g., "small", "large" GRF modes
+  llvm::SmallVector<uint32_t, 4>
       numRegsPerThreadPerMode; // number of registers per thread per mode
-  // TODO: Add more fields as needed (e.g., num_banks, bank_size, num_ports,
-  // port_width, bank_conflicts)
 };
 
 enum class CacheHierarchyLevel { L1 = 1, L2 = 2, L3 = 3 };
@@ -136,8 +153,8 @@ struct uArch {
   uArch(const std::string &name, const std::string &description,
         const std::map<RegisterFileType, RegisterFileInfo> &register_file_info =
             {},
-        const std::vector<CacheInfo> &cache_info = {},
-        const std::map<std::string, std::shared_ptr<Instruction>>
+        const llvm::SmallVector<CacheInfo, 4> &cache_info = {},
+        const std::map<InstructionKind, std::shared_ptr<Instruction>>
             &instructions = {})
       : name(name), description(description),
         registerFileInfo(register_file_info), cacheInfo(cache_info),
@@ -153,34 +170,36 @@ struct uArch {
     return registerFileInfo;
   }
 
-  const std::vector<CacheInfo> &getCacheInfo() const { return cacheInfo; }
+  const llvm::SmallVector<CacheInfo, 4> &getCacheInfo() const {
+    return cacheInfo;
+  }
 
-  const std::map<std::string, std::shared_ptr<Instruction>> &
+  const std::map<InstructionKind, std::shared_ptr<Instruction>> &
   getInstructions() const {
     return instructions;
   }
 
   // Get the name of the supported instruction names for that
   // architecture. It returns the names of the instructions added to the uArch.
-  std::vector<std::string> getSupportedInstructionNames() const {
-    std::vector<std::string> instructionNames;
+  llvm::SmallVector<StringRef, 8> getSupportedInstructionNames() const {
+    llvm::SmallVector<StringRef, 8> instructionNames;
     for (const auto &inst : instructions) {
-      instructionNames.push_back(inst.first);
+      instructionNames.push_back(toString(inst.first));
     }
     return instructionNames;
   }
 
   // Checks if an instruction is supported in this uArch
-  bool checkSupportedInstruction(const std::string &instructionName) const {
-    return instructions.find(instructionName) != instructions.end();
+  bool checkSupportedInstruction(InstructionKind instr) const {
+    return instructions.find(instr) != instructions.end();
   }
 
 protected:
   std::string name; // Similar to target triple
   std::string description;
   std::map<RegisterFileType, RegisterFileInfo> registerFileInfo;
-  std::vector<CacheInfo> cacheInfo;
-  std::map<std::string, std::shared_ptr<Instruction>> instructions;
+  llvm::SmallVector<CacheInfo, 4> cacheInfo;
+  std::map<InstructionKind, std::shared_ptr<Instruction>> instructions;
 };
 
 // A struct to represent shared memory information
@@ -205,7 +224,7 @@ struct SharedMemory {
 enum class MMAOpndKind { MatrixA, MatrixB, MatrixC, MatrixD };
 struct MMAInstructionInterface {
   // Get supported Matrix shapes
-  virtual std::vector<std::pair<uint32_t, uint32_t>>
+  virtual llvm::SmallVector<std::pair<uint32_t, uint32_t>, 16>
   getSupportedShapes(Type dataType, MMAOpndKind matrixType) = 0;
   // @TODO: This method takes an context object as a parameter, this is to
   // create the Type objects from the same context. Since type objects are
@@ -220,8 +239,8 @@ struct MMAInstructionInterface {
   //
   // Untill we have a better solution, we stick to passing context object to
   // this method.
-  virtual std::vector<Type> getSupportedTypes(MLIRContext &context,
-                                              MMAOpndKind matrixType) = 0;
+  virtual llvm::SmallVector<Type, 8>
+  getSupportedTypes(MLIRContext &context, MMAOpndKind matrixType) = 0;
   virtual bool
   checkSupportedShapesAndTypes(std::pair<uint32_t, uint32_t> AShape,
                                std::pair<uint32_t, uint32_t> BShape,
@@ -235,9 +254,9 @@ struct MMAInstructionInterface {
                         std::pair<uint32_t, uint32_t> CShape,
                         std::pair<uint32_t, uint32_t> DShape, Type AType,
                         Type BType, Type CType, Type DType) = 0;
-  virtual std::vector<uint32_t> getSupportedM(Type type) = 0;
-  virtual std::vector<uint32_t> getSupportedK(Type type) = 0;
-  virtual std::vector<uint32_t> getSupportedN(Type type) = 0;
+  virtual llvm::SmallVector<uint32_t, 8> getSupportedM(Type type) = 0;
+  virtual llvm::SmallVector<uint32_t, 8> getSupportedK(Type type) = 0;
+  virtual llvm::SmallVector<uint32_t, 8> getSupportedN(Type type) = 0;
 
   virtual ~MMAInstructionInterface() = default;
 };