|
| 1 | +//===- XeGPUTransformOps.td - XeGPU transformation ops -----*- tablegen -*-===// |
| 2 | +// |
| 3 | +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | +// See https://llvm.org/LICENSE.txt for license information. |
| 5 | +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | +// |
| 7 | +//===----------------------------------------------------------------------===// |
| 8 | + |
| 9 | +#ifndef XEGPU_EXTENSION |
| 10 | +#define XEGPU_EXTENSION |
| 11 | + |
| 12 | +include "mlir/Dialect/Transform/IR/TransformDialect.td" |
| 13 | +include "mlir/Dialect/Transform/Interfaces/TransformInterfaces.td" |
| 14 | +include "mlir/Dialect/Transform/IR/TransformTypes.td" |
| 15 | +include "mlir/IR/OpBase.td" |
| 16 | +include "mlir/Interfaces/SideEffectInterfaces.td" |
| 17 | + |
// Transform op that hoists XeGPU tensor-descriptor creation out of a loop.
//
// The op carries TransformEachOpTrait, so it is applied to every payload op
// associated with the `$loop` handle one at a time through the `applyToOne`
// hook declared below. Both `applyToOne` and the memory-effects methods
// (DeclareOpInterfaceMethods<MemoryEffectsOpInterface>) are only declared
// here; their definitions live in the C++ implementation.
//
// NOTE(review): the description does not state what `$transformed` points
// to -- presumably the rewritten loop; confirm against the C++ side.
def XeGPUHoistDescOp : Op<Transform_Dialect, "xegpu.hoist_desc_ops", [
  TransformOpInterface, TransformEachOpTrait,
  DeclareOpInterfaceMethods<MemoryEffectsOpInterface>
]> {

  let summary = "Hoists xegpu tile descriptor ops outside the containing loop";
  let description = [{
    Hoists `xegpu.create_nd_tdesc` out of the loop. If the
    descriptor's offset is loop dependent, a `xegpu.update_nd_offset` op is
    inserted in the loop to increment the offset.
  }];

  // Handle to the loop(s) to process, and the handle produced by the op.
  let arguments = (ins TransformHandleTypeInterface : $loop);
  let results = (outs TransformHandleTypeInterface : $transformed);

  let assemblyFormat = "$loop attr-dict `:` functional-type(operands, results)";

  // Per-payload-op entry point required by TransformEachOpTrait.
  let extraClassDeclaration = [{
    ::mlir::DiagnosedSilenceableFailure applyToOne(
        ::mlir::transform::TransformRewriter & rewriter,
        ::mlir::Operation * target,
        ::mlir::transform::ApplyToEachResultList & results,
        ::mlir::transform::TransformState & state);
  }];
}
| 43 | + |
// Transform op that annotates one operand of a `xegpu.dpas` op with a
// `xegpu.layout` attribute.
//
// The op carries TransformEachOpTrait, so it is applied to every payload op
// associated with the `$dpasOp` handle one at a time through the
// `applyToOne` hook declared below. It produces no result handles.
def XeGPUSetDPASLayoutOp : Op<Transform_Dialect, "xegpu.set_dpas_layout", [
  TransformOpInterface, TransformEachOpTrait,
  DeclareOpInterfaceMethods<MemoryEffectsOpInterface>
]> {

  let summary = "Set xegpu.layout attribute to a DPAS op operand.";
  let description = [{
    Given a `xegpu.dpas` operation, this transform adds a `xegpu.layout`
    attribute to the tensor descriptor of one of its operands. The target
    operand is selected by the `tileIndex` attribute (spelled `index` in the
    assembly format). The layout is defined by the `sg_layout`, `sg_data`
    and `inst_data` attributes. The `load_data` attribute defines the tile
    size used for loading the data. It must be a multiple of the `inst_data`
    size.
  }];

  let arguments = (ins TransformHandleTypeInterface : $dpasOp,
                       I64Attr : $tileIndex,
                       DenseI32ArrayAttr : $sgLayout,
                       DenseI32ArrayAttr : $sgData,
                       DenseI32ArrayAttr : $loadData,
                       DenseI32ArrayAttr : $instData);

  let results = (outs);

  // The two string literals are concatenated by TableGen into one format.
  let assemblyFormat =
      "$dpasOp `index` `=` $tileIndex `sg_layout` `=` $sgLayout `sg_data` `=` "
      "$sgData `load_data` `=` $loadData `inst_data` `=` $instData attr-dict `:` type($dpasOp)";

  // Per-payload-op entry point required by TransformEachOpTrait.
  let extraClassDeclaration = [{
    ::mlir::DiagnosedSilenceableFailure applyToOne(
        ::mlir::transform::TransformRewriter & rewriter,
        ::mlir::Operation * target,
        ::mlir::transform::ApplyToEachResultList & results,
        ::mlir::transform::TransformState & state);
  }];
}
| 80 | + |
// Transform op that inserts `xegpu.prefetch` ops for one matmul operand.
//
// Unlike the other ops in this file it does not use TransformEachOpTrait:
// the TransformOpInterface methods are declared through
// DeclareOpInterfaceMethods and defined in the C++ implementation, so no
// `applyToOne` hook is declared here. MemoryEffectsOpInterface is listed
// without DeclareOpInterfaceMethods; the effects are expected to come from
// FunctionalStyleTransformOpTrait (see the MLIR Transform dialect docs).
//
// NOTE(review): `$loopOp` is presumably the `scf.for` that contains
// `$dpasOp`; the description does not say so explicitly -- confirm.
def XeGPUInsertPrefetchOp : Op<Transform_Dialect, "xegpu.insert_prefetch",
    [FunctionalStyleTransformOpTrait, MemoryEffectsOpInterface,
     DeclareOpInterfaceMethods<TransformOpInterface>]> {

  let summary = "Adds xegpu prefetch ops to matmul operand tiles.";
  let description = [{
    Given a `xegpu.dpas` operation residing in a `scf.for` loop, this
    transform inserts cooperative `xegpu.prefetch` operations for the A
    (index = 0) or B (index = 1) operand. The prefetch tile size is
    determined by the `sg_layout` and `sg_data` attributes.
  }];

  let arguments = (ins TransformHandleTypeInterface : $dpasOp,
                       TransformHandleTypeInterface : $loopOp,
                       I64Attr : $tileIndex,
                       DenseI32ArrayAttr : $sgLayout,
                       DenseI32ArrayAttr : $sgData);

  let results = (outs TransformHandleTypeInterface : $transformedDpasOp,
                      TransformHandleTypeInterface : $transformedLoopOp);

  // The two string literals are concatenated by TableGen into one format.
  let assemblyFormat =
      "$dpasOp $loopOp `index` `=` $tileIndex `sg_layout` `=` $sgLayout `sg_data` `=` "
      "$sgData attr-dict `:` functional-type(operands, results)";
}
| 103 | + |
// TODO: Handle this with the GPU transform ops instead. Attach a gpu mapping
// to the scf.forall op and convert it to a gpu.launch op with something like
// transform.gpu.map_forall_to_blocks.
//
// Transform op that sets the thread count of a `gpu.launch` op. It is applied
// to each payload op of the `$launchOp` handle through `applyToOne` and
// produces no result handles.
def XeGPUSetGPULaunchThreadsOp : Op<
    Transform_Dialect, "xegpu.set_gpu_launch_threads",
    [TransformOpInterface,
     TransformEachOpTrait,
     DeclareOpInterfaceMethods<MemoryEffectsOpInterface>]> {
  let summary = "Set number of threads for a given gpu.launch operation";
  let description = [{Set number of threads for a given gpu.launch operation}];

  // Target handle followed by the requested thread counts.
  let arguments = (ins
    TransformHandleTypeInterface:$launchOp,
    DenseI32ArrayAttr:$threads
  );
  let results = (outs);

  let assemblyFormat =
    "$launchOp `threads` `=` $threads attr-dict `:` type($launchOp)";

  // Hook invoked once per payload op (TransformEachOpTrait).
  let extraClassDeclaration = [{
    ::mlir::DiagnosedSilenceableFailure
    applyToOne(::mlir::transform::TransformRewriter &rewriter,
               ::mlir::Operation *target,
               ::mlir::transform::ApplyToEachResultList &results,
               ::mlir::transform::TransformState &state);
  }];
}
| 131 | + |
| 132 | +#endif // XEGPU_EXTENSION |
0 commit comments