llvm
diff --git a/‎mlir/include/mlir/Dialect/XeGPU/IR/XeGPUAttrs.td
Lines changed: 6 additions & 0 deletions b/‎mlir/include/mlir/Dialect/XeGPU/IR/XeGPUAttrs.td
Lines changed: 6 additions & 0 deletions
diff --git a/‎mlir/include/mlir/Dialect/XeGPU/Transforms/Passes.td
Lines changed: 13 additions & 0 deletions b/‎mlir/include/mlir/Dialect/XeGPU/Transforms/Passes.td
Lines changed: 13 additions & 0 deletions
diff --git a/‎mlir/include/mlir/Dialect/XeGPU/Utils/XeGPUUtils.h
Lines changed: 59 additions & 0 deletions b/‎mlir/include/mlir/Dialect/XeGPU/Utils/XeGPUUtils.h
Lines changed: 59 additions & 0 deletions
diff --git a/‎mlir/lib/Dialect/XeGPU/Transforms/CMakeLists.txt
Lines changed: 1 addition & 0 deletions b/‎mlir/lib/Dialect/XeGPU/Transforms/CMakeLists.txt
Lines changed: 1 addition & 0 deletions
@@ -295,11 +295,17 @@ def XeGPU_LayoutAttr : XeGPUAttr<"Layout", "layout"> {
     }
 
     LayoutAttr dropSgLayoutAndData() {
+      // Avoid building an attribute in which every field is nullptr, which may cause a segmentation fault.
+      if (!getInstData() && !getLaneLayout())
+        return nullptr;
       return LayoutAttr::get(getContext(), nullptr, nullptr, getInstData(),
                              getLaneLayout(), getLaneData(), getOrder());
     }
 
     LayoutAttr dropInstData() {
+      // Avoid building an attribute in which every field is nullptr, which may cause a segmentation fault.
+      if (!getSgLayout() && !getLaneLayout())
+        return nullptr;
       return LayoutAttr::get(getContext(), getSgLayout(), getSgData(), nullptr,
                              getLaneLayout(), getLaneData(), getOrder());
     }
 
@@ -45,4 +45,17 @@ def XeGPUWgToSgDistribute : Pass<"xegpu-wg-to-sg-distribute"> {
                            "gpu::GPUDialect", "index::IndexDialect"];
 }
 
+def XeGPUBlocking: Pass<"xegpu-blocking"> {
+  let summary = "Block XeGPU ops into smaller size.";
+  let description = [{
+    This pass partitions operations that process large shapes into multiple
+    operations on smaller shapes, as specified by the inst_data in the layout
+    attribute. This enables each resulting operation to be efficiently mapped
+    to a hardware instruction.
+  }];
+  let dependentDialects = [
+      "memref::MemRefDialect", "xegpu::XeGPUDialect", "vector::VectorDialect"
+  ];
+}
+
 #endif // MLIR_DIALECT_XEGPU_TRANSFORMS_PASSES_TD
@@ -13,6 +13,12 @@
 namespace mlir {
 
 class VectorType;
+class OpOperand;
+class OpResult;
+class OpBuilder;
+class ValueRange;
+class TypeConverter;
+
 namespace xegpu {
 class LayoutAttr;
 class TensorDescType;
@@ -50,6 +56,59 @@ FailureOr<VectorType> getDistributedVectorType(xegpu::TensorDescType tdescTy);
 FailureOr<VectorType> getDistributedVectorType(VectorType originalType,
                                                LayoutAttr layout);
 
+/// Return the attribute name for the OpOperand to attach LayoutAttr
+std::string getLayoutName(const OpOperand &operand);
+
+/// Return the attribute name for the OpResult to attach LayoutAttr
+std::string getLayoutName(const OpResult result);
+
+/// Retrieves the LayoutAttr associated with a given Value. For TensorDescType
+/// values, the LayoutAttr is extracted from the TensorDescType itself. For
+/// other values, it is obtained from the attributes of the defining operation.
+/// Returns nullptr if no LayoutAttr is found.
+LayoutAttr getLayoutAttr(const Value value);
+
+/// Retrieves the LayoutAttr associated with a given OpOperand. It will
+/// first check the operand_layout_{id} of the owner operation. If not found,
+/// it will check the operand itself and its defining op.
+LayoutAttr getLayoutAttr(const OpOperand &opr);
+
+/// Sets the LayoutAttr for a given OpOperand or OpResult by attaching
+/// it to the owner's dictionary attributes
+template <typename T,
+          typename = std::enable_if_t<std::is_same_v<T, OpOperand> ||
+                                      std::is_same_v<T, OpResult>>>
+void setLayoutAttr(const T &operandOrResult, const LayoutAttr layout);
+
+/// Set the LayoutAttr for each OpOperand and OpResult of the given operation.
+/// If the operation contains regions, it is also applied recursively to the
+/// contained operations
+void setLayoutAttrs(Operation *op,
+                    function_ref<LayoutAttr(Value)> getLayoutImpl);
+
+/// Extract a set of small vectors from a value with a given shape using
+/// vector.extract_strided_slice.
+SmallVector<Value> extractVectorsWithShapeFromValue(OpBuilder &builder,
+                                                    Location loc, Value value,
+                                                    ArrayRef<int64_t> shape);
+
+/// Create a vector of the given shape from a set of values using
+/// vector.insert_strided_slice.
+Value createVectorWithShapeFromValues(OpBuilder &builder, Location loc,
+                                      ValueRange values,
+                                      ArrayRef<int64_t> shape);
+
+/// Do type conversion for SCF structural ops, e.g., scf.for using SCF structure
+/// type conversion patterns. Since VectorType cannot carry the layout
+/// attribute, which is needed to guide the type conversion for XeGPU, they are
+/// first converted into RankedTensorType, where the layout attribute can be
+/// attached. And then upstream SCF structural type conversion patterns are
+/// applied with the provided converter.
+/// TODO: This is a temporary solution. We should refactor it when context-aware
+/// type conversion is available.
+void doSCFStructuralTypeConversionWithTensorType(Operation *op,
+                                                 TypeConverter converter);
+
 } // namespace xegpu
 
 } // namespace mlir
 
@@ -1,4 +1,5 @@
 add_mlir_dialect_library(MLIRXeGPUTransforms
+  XeGPUBlocking.cpp
   XeGPUFoldAliasOps.cpp
   XeGPUSubgroupDistribute.cpp
   XeGPUUnroll.cpp
Original file line number	Diff line number	Diff line change
`@@ -295,11 +295,17 @@ def XeGPU_LayoutAttr : XeGPUAttr<"Layout", "layout"> {`
`295`	`295`	`}`
`296`	`296`
`297`	`297`	`LayoutAttr dropSgLayoutAndData() {`
	`298`	`+ // Avoid building an attribute in which every field is nullptr, which may cause a segmentation fault.`
	`299`	`+ if (!getInstData() && !getLaneLayout())`
	`300`	`+ return nullptr;`
`298`	`301`	`return LayoutAttr::get(getContext(), nullptr, nullptr, getInstData(),`
`299`	`302`	`getLaneLayout(), getLaneData(), getOrder());`
`300`	`303`	`}`
`301`	`304`
`302`	`305`	`LayoutAttr dropInstData() {`
	`306`	`+ // Avoid building an attribute in which every field is nullptr, which may cause a segmentation fault.`
	`307`	`+ if (!getSgLayout() && !getLaneLayout())`
	`308`	`+ return nullptr;`
`303`	`309`	`return LayoutAttr::get(getContext(), getSgLayout(), getSgData(), nullptr,`
`304`	`310`	`getLaneLayout(), getLaneData(), getOrder());`
`305`	`311`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,5 @@`
`1`	`1`	`add_mlir_dialect_library(MLIRXeGPUTransforms`
	`2`	`+ XeGPUBlocking.cpp`
`2`	`3`	`XeGPUFoldAliasOps.cpp`
`3`	`4`	`XeGPUSubgroupDistribute.cpp`
`4`	`5`	`XeGPUUnroll.cpp`