Remove Intel-specific code from the TritonGPU dialect

chengjunlu · chengjunlu · commit 4bf30c45d74a · 2024-12-06T15:41:25.000Z
diff --git a/lib/Dialect/TritonGPU/IR/Dialect.cpp b/lib/Dialect/TritonGPU/IR/Dialect.cpp
@@ -5,9 +5,6 @@
 
 #include "mlir/IR/DialectImplementation.h"
 #include "mlir/IR/OpImplementation.h"
-
-#include "intel/include/Dialect/TritonIntelGPU/IR/Dialect.h"
-
 #include "mlir/Support/LLVM.h"
 #include "triton/Analysis/Utility.h"
 #include "triton/Dialect/Triton/IR/Utility.h"
@@ -325,11 +322,11 @@ SmallVector<unsigned> getOrder(Attribute layout) {
     // with Intel layouts.
     // More details:
     // https://github.com/intel/intel-xpu-backend-for-triton/pull/2517
-    if (dyn_cast<intel::DpasEncodingAttr>(dotLayout.getParent())) {
-      SmallVector<unsigned> order(rank);
-      std::iota(order.rbegin(), order.rend(), 0);
-      return order;
-    }
+    //    if (dyn_cast<intel::DpasEncodingAttr>(dotLayout.getParent())) {
+    //      SmallVector<unsigned> order(rank);
+    //      std::iota(order.rbegin(), order.rend(), 0);
+    //      return order;
+    //    }
     return getOrderForDotOperand(dotLayout.getOpIdx(), rank, /*kMajor*/ true);
   }
   if (auto sliceLayout = dyn_cast<SliceEncodingAttr>(layout)) {
@@ -1129,10 +1126,11 @@ unsigned DotOperandEncodingAttr::getTotalElemsPerThread(ArrayRef<int64_t> shape,
       return amdWmmaParent.getTotalElemsPerThreadForOperand(
           shape, eltTy, getKWidth(), getOpIdx());
     }
-    if (auto dpasParent = mlir::dyn_cast<intel::DpasEncodingAttr>(mmaParent)) {
-      return dpasParent.getTotalElemsPerThreadForOperand(
-          shape, eltTy, getKWidth(), getOpIdx());
-    }
+    //    if (auto dpasParent =
+    //    mlir::dyn_cast<intel::DpasEncodingAttr>(mmaParent)) {
+    //      return dpasParent.getTotalElemsPerThreadForOperand(
+    //          shape, eltTy, getKWidth(), getOpIdx());
+    //    }
   }
   if (auto blockedLayout = mlir::dyn_cast<BlockedEncodingAttr>(getParent())) {
     auto shapePerCTA = getShapePerCTA(*this, shape);
@@ -1197,17 +1195,19 @@ SmallVector<unsigned> DotOperandEncodingAttr::getWarpOrder() const {
   return {};
 }
 SmallVector<unsigned> DotOperandEncodingAttr::getThreadOrder() const {
-  // FIXME: delete if branch for `DpasEncodingAttr` and provide more
-  // general solution to make `getOrderForDotOperand` function compatible
-  // with Intel layouts.
-  // More details:
-  // https://github.com/intel/intel-xpu-backend-for-triton/pull/2517
-  if (mlir::dyn_cast<intel::DpasEncodingAttr>(getParent())) {
-    return ::getOrder(*this);
-  } else {
-    return getOrderForDotOperand(getOpIdx(), getWarpsPerCTA().size(),
-                                 /*kMajor*/ true);
-  }
+  // Always uses the k-major order from `getOrderForDotOperand`. The Intel
+  // `DpasEncodingAttr` special case below is disabled because this file no
+  // longer includes the Intel dialect header; a general way to support Intel
+  // layouts in `getOrderForDotOperand` is still needed. More details:
+  // https://github.com/intel/intel-xpu-backend-for-triton/pull/2517
+  //  if (mlir::dyn_cast<intel::DpasEncodingAttr>(getParent())) {
+  //    return ::getOrder(*this);
+  //  } else {
+  //    return getOrderForDotOperand(getOpIdx(), getWarpsPerCTA().size(),
+  //                                 /*kMajor*/ true);
+  //  }
+  return getOrderForDotOperand(getOpIdx(), getWarpsPerCTA().size(),
+                               /*kMajor*/ true);
 }
 
 LogicalResult DotOperandEncodingAttr::verify(
@@ -1250,19 +1250,16 @@ LogicalResult DotOperandEncodingAttr::verify(
     return success();
   }
 
-  if (auto parentAttr = mlir::dyn_cast<intel::DpasEncodingAttr>(parent)) {
-    if (kWidth != parentAttr.getOpsPerChannel())
-      return emitError() << "ttg.dot_op kWidth parameter must match the "
-                            "parent's opsPerChannel";
-    return success();
-  }
-
-  if (auto parentAttr = mlir::dyn_cast<intel::WarpEncodingAttr>(parent)) {
-    if (kWidth != 0)
-      return emitError() << "ttg.dot_op kWidth parameter is not supported "
-                            "when the parent is a warp layout";
+  if (mlir::isa<MmaEncodingTrait>(parent)) {
     return success();
   }
+  // WarpEncodingAttr now has MmaEncodingTrait (branch above); old check:
+  //  if (auto parentAttr = mlir::dyn_cast<intel::WarpEncodingAttr>(parent)) {
+  //    if (kWidth != 0)
+  //      return emitError() << "ttg.dot_op kWidth parameter is not supported "
+  //                            "when the parent is a warp layout";
+  //    return success();
+  //  }
 
   if (auto parentAttr = mlir::dyn_cast<BlockedEncodingAttr>(parent)) {
     if (kWidth != 0)
@@ -2527,9 +2524,6 @@ class TritonGPUOpAsmInterface : public OpAsmDialectInterface {
     } else if (auto linearAttr = mlir::dyn_cast<LinearEncodingAttr>(attr)) {
       os << "linear";
       return AliasResult::FinalAlias;
-    } else if (auto warpAttr = mlir::dyn_cast<intel::WarpEncodingAttr>(attr)) {
-      os << "warp";
-      return AliasResult::FinalAlias;
     } /* else if (auto sliceAttr = dyn_cast<SliceEncodingAttr>(attr)) {
       os << "slice";
       return AliasResult::FinalAlias;
@@ -3248,8 +3242,7 @@ struct CanonicalizeConvertFromConvert
     auto srcType = op.getSrc().getType();
     auto dstType = op.getType();
     if (mlir::isa<DotOperandEncodingAttr>(dstType.getEncoding()) &&
-        (mlir::isa<NvidiaMmaEncodingAttr>(srcType.getEncoding()) ||
-         mlir::isa<intel::DpasEncodingAttr>(srcType.getEncoding())))
+        mlir::isa<NvidiaMmaEncodingAttr>(srcType.getEncoding()))
       return failure();
 
     // for hopper MMAv3
diff --git a/third_party/intel/include/Dialect/TritonIntelGPU/IR/TritonIntelGPUAttrDefs.td b/third_party/intel/include/Dialect/TritonIntelGPU/IR/TritonIntelGPUAttrDefs.td
@@ -125,7 +125,7 @@ along the row (resp. col) dimension.
 //===----------------------------------------------------------------------===//
 
 def WarpEncodingAttr : TritonGPU_Attr<"WarpEncoding", "intel_warp_encoding",
-                                     [], TritonIntelGPU_Dialect> {
+                                     [MmaEncodingTrait], TritonIntelGPU_Dialect> {
   let mnemonic = "warp";
 
   let description = [{
@@ -144,6 +144,27 @@ def WarpEncodingAttr : TritonGPU_Attr<"WarpEncoding", "intel_warp_encoding",
   let extraClassDeclaration = [{
     unsigned getTotalElemsPerThread(ArrayRef<int64_t> shape, Type eltTy) const;
     SmallVector<unsigned> getElemsPerThread(ArrayRef<int64_t> shape, Type eltTy) const;
+
+    // Placeholder definitions, presumably needed because WarpEncodingAttr now
+    // lists MmaEncodingTrait. None is implemented for the warp layout yet:
+    // each call aborts through llvm::report_fatal_error.
+
+    SmallVector<unsigned> getRepOrderForOperand(int opIdx) const {
+      llvm::report_fatal_error("NYI. WarpEncodingAttr::getRepOrderForOperand");
+    }
+
+    bool supportReduction() const {
+      llvm::report_fatal_error("NYI. WarpEncodingAttr::supportReduction");
+    }
+
+    SmallVector<unsigned> getSizePerThreadForOperand(int kWidth, unsigned opIdx) const {
+      llvm::report_fatal_error("NYI. WarpEncodingAttr::getSizePerThreadForOperand");
+    }
+
+    SmallVector<unsigned> getElemsPerThreadForOperands(ArrayRef<int64_t> shape, Type eltTy, unsigned opIdx) const {
+      llvm::report_fatal_error("NYI. WarpEncodingAttr::getElemsPerThreadForOperands");
+    }
+
   }];
 
   let hasCustomAssemblyFormat = 1;