| //===- TestTilingInterface.cpp - Test tiling using `TilingInterface` -----===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file implements a pass for testing tiling operations using |
| // `TilingInterface`. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include <optional> |
| #include <utility> |
| |
| #include "mlir/Dialect/Affine/IR/AffineOps.h" |
| #include "mlir/Dialect/Func/IR/FuncOps.h" |
| #include "mlir/Dialect/GPU/IR/GPUDialect.h" |
| #include "mlir/Dialect/Linalg/IR/Linalg.h" |
| #include "mlir/Dialect/Linalg/Transforms/TilingInterfaceImpl.h" |
| #include "mlir/Dialect/Linalg/Transforms/Transforms.h" |
| #include "mlir/Dialect/MemRef/IR/MemRef.h" |
| #include "mlir/Dialect/SCF/IR/SCF.h" |
| #include "mlir/Dialect/SCF/Transforms/TileUsingInterface.h" |
| #include "mlir/Dialect/Tensor/IR/Tensor.h" |
| #include "mlir/Dialect/Tensor/IR/TensorTilingInterfaceImpl.h" |
| #include "mlir/Interfaces/TilingInterface.h" |
| #include "mlir/Pass/Pass.h" |
| #include "mlir/Pass/PassManager.h" |
| #include "mlir/Transforms/GreedyPatternRewriteDriver.h" |
| #include "llvm/ADT/TypeSwitch.h" |
| |
| using namespace mlir; |
| |
| // TODO: this file should disappear and instead tests should make use of the |
| // transform dialect. |
| namespace { |
| |
| /// Marker used as attribute name in generated Linalg rewriting transformations. |
| const StringLiteral kTransformMarker = "__internal_transform__"; |
| |
| /// Helper class to control application of linalg transformation patterns. |
| /// Control comes in 2 forms: |
| /// 1. attribute matching and setting behavior using the attribute named |
| /// `kTransformMarker`. This can be used to build a state machine |
| /// using attributes and incrementally applying patterns to advance states. |
| /// 2. filter function, which is a simple lambda on the Operation* that |
| /// returns a LogicalResult. |
| struct TransformationFilter { |
| using FilterFunction = std::function<LogicalResult(Operation *)>; |
| |
| explicit TransformationFilter( |
| ArrayRef<StringAttr> matchDisjunction = {}, |
| std::optional<StringAttr> replacement = std::nullopt); |
| |
| explicit TransformationFilter( |
| const FilterFunction &f, ArrayRef<StringAttr> matchDisjunction = {}, |
| std::optional<StringAttr> replacement = std::nullopt); |
| |
| TransformationFilter(TransformationFilter &&) = default; |
| TransformationFilter(const TransformationFilter &) = default; |
| LogicalResult checkAndNotify(PatternRewriter &rewriter, Operation *op) const; |
| void replaceTransformationFilter(PatternRewriter &rewriter, |
| Operation *op) const; |
| |
| TransformationFilter &addFilter(const FilterFunction &f) { |
| if (f) |
| filters.push_back(f); |
| return *this; |
| } |
| |
| template <typename... OpTypes> |
| TransformationFilter &addOpFilter() { |
| return addFilter( |
| [](Operation *op) { return success(isa<OpTypes...>(op)); }); |
| } |
| |
| TransformationFilter &addOpNameFilter(StringRef opName) { |
| return addFilter([opName](Operation *op) { |
| return success(op->getName().getStringRef() == opName); |
| }); |
| } |
| |
| TransformationFilter &setMatchByDefault() { |
| matchByDefault = true; |
| return *this; |
| } |
| |
| private: |
| SmallVector<FilterFunction> filters; |
| SmallVector<StringAttr> matchDisjunction; |
| std::optional<StringAttr> replacement; |
| /// When set to true, if the attribute is not set, it will be treated as |
| /// a match. Default is false. |
| bool matchByDefault; |
| }; |
| |
| TransformationFilter::TransformationFilter( |
| ArrayRef<StringAttr> matchDisjunction, |
| std::optional<StringAttr> replacement) |
| : matchDisjunction(matchDisjunction.begin(), matchDisjunction.end()), |
| replacement(replacement), matchByDefault(false) {} |
| |
| LogicalResult TransformationFilter::checkAndNotify(PatternRewriter &rewriter, |
| Operation *op) const { |
| if (llvm::any_of(filters, |
| [&](const FilterFunction &f) { return failed(f(op)); })) |
| return failure(); |
| |
| auto attr = op->template getAttrOfType<StringAttr>(kTransformMarker); |
| |
| if (!attr) { |
| // 1. Has no filter case and matchDisjunction is empty. |
| if (matchDisjunction.empty() || matchByDefault) |
| return success(); |
| |
| // 2. Has no filter but was expecting a filter. |
| return rewriter.notifyMatchFailure(op, [&](Diagnostic &diag) { |
| diag << " does not have any filter from list: "; |
| interleaveComma(matchDisjunction, diag); |
| }); |
| } |
| |
| // 4. Match explicit filter. |
| for (auto filter : matchDisjunction) |
| if (attr.getValue() == filter) |
| return success(); |
| |
| // 5. Fail to match. |
| return rewriter.notifyMatchFailure(op, [&](Diagnostic &diag) { |
| diag << " does not have any filter from list: "; |
| interleaveComma(matchDisjunction, diag); |
| }); |
| } |
| |
| void TransformationFilter::replaceTransformationFilter( |
| PatternRewriter &rewriter, Operation *op) const { |
| if (replacement.has_value()) |
| op->setAttr(kTransformMarker, *replacement); |
| else |
| op->removeAttr(rewriter.getStringAttr(kTransformMarker)); |
| } |
| |
| /// Pattern for testing `TileUsingSCFForOp` pattern (that tiles operations using |
| /// the `TilingInterface` with `scf.for` ops for iterating over the tiles) while |
| /// using a `filter` to avoid recursive application. |
| struct TestTileUsingSCFForOp |
| : public OpInterfaceRewritePattern<TilingInterface> { |
| TestTileUsingSCFForOp(MLIRContext *context, scf::SCFTilingOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| /// Construct a generic pattern applied to `opName`. |
| TestTileUsingSCFForOp(StringRef opName, MLIRContext *context, |
| scf::SCFTilingOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| LogicalResult matchAndRewrite(TilingInterface op, |
| PatternRewriter &rewriter) const override { |
| if (failed(filter.checkAndNotify(rewriter, op))) |
| return failure(); |
| |
| FailureOr<scf::SCFTilingResult> tilingResult = |
| scf::tileUsingSCFForOp(rewriter, op, options); |
| if (failed(tilingResult)) |
| return rewriter.notifyMatchFailure(op, "failed to tile operation"); |
| |
| if (op->getNumResults()) { |
| rewriter.replaceOp(op, tilingResult->replacements); |
| } else { |
| rewriter.eraseOp(op); |
| } |
| |
| for (auto *tiledOp : tilingResult->tiledOps) |
| filter.replaceTransformationFilter(rewriter, tiledOp); |
| return success(); |
| } |
| |
| private: |
| scf::SCFTilingOptions options; |
| TransformationFilter filter; |
| }; |
| |
| /// Pattern for testing `tileUsingSCFForallOp` (that tiles operations using |
| /// the `TilingInterface` with `scf.forall` ops for iterating over the tiles) |
| /// while using a `filter` to avoid recursive application. |
| struct TestTileUsingSCFForallOp |
| : public OpInterfaceRewritePattern<TilingInterface> { |
| TestTileUsingSCFForallOp(MLIRContext *context, scf::SCFTilingOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| /// Construct a generic pattern applied to `opName`. |
| TestTileUsingSCFForallOp(StringRef opName, MLIRContext *context, |
| scf::SCFTilingOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| LogicalResult matchAndRewrite(TilingInterface op, |
| PatternRewriter &rewriter) const override { |
| if (failed(filter.checkAndNotify(rewriter, op))) |
| return failure(); |
| |
| FailureOr<scf::SCFTilingResult> tilingResult = |
| scf::tileUsingSCFForallOp(rewriter, op, options); |
| if (failed(tilingResult)) |
| return rewriter.notifyMatchFailure(op, "failed to tile operation"); |
| |
| if (op->getNumResults()) { |
| rewriter.replaceOp(op, tilingResult->replacements); |
| } else { |
| rewriter.eraseOp(op); |
| } |
| |
| for (auto *tiledOp : tilingResult->tiledOps) |
| filter.replaceTransformationFilter(rewriter, tiledOp); |
| return success(); |
| } |
| |
| private: |
| scf::SCFTilingOptions options; |
| TransformationFilter filter; |
| }; |
| |
| /// Pattern for testing `TileConsumerAndFuseProducersUsingSCFForOp` pattern |
| /// (that tiles and fuses operations using the `TilingInterface` with `scf.for` |
| /// ops for iterating over the tiles) while using a `filter` to avoid recursive |
| /// application. |
| struct TestTileConsumerAndFuseProducersGreedilyUsingSCFForOp |
| : public OpInterfaceRewritePattern<TilingInterface> { |
| TestTileConsumerAndFuseProducersGreedilyUsingSCFForOp( |
| MLIRContext *context, scf::SCFTileAndFuseOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| /// Construct a generic pattern applied to `opName`. |
| TestTileConsumerAndFuseProducersGreedilyUsingSCFForOp( |
| StringRef opName, MLIRContext *context, |
| scf::SCFTileAndFuseOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| LogicalResult matchAndRewrite(TilingInterface op, |
| PatternRewriter &rewriter) const override { |
| if (failed(filter.checkAndNotify(rewriter, op))) |
| return failure(); |
| |
| FailureOr<scf::SCFTileAndFuseResult> tileAndFuseResult = |
| scf::tileConsumerAndFuseProducerGreedilyUsingSCFForOp(rewriter, op, |
| options); |
| if (failed(tileAndFuseResult)) { |
| return failure(); |
| } |
| // Replace the tiled op with replacements. |
| SmallVector<Value> replacements(op->getNumResults()); |
| for (const auto &result : llvm::enumerate(op->getResults())) { |
| replacements[result.index()] = |
| tileAndFuseResult->replacements.lookup(result.value()); |
| } |
| rewriter.replaceOp(op, replacements); |
| |
| filter.replaceTransformationFilter( |
| rewriter, tileAndFuseResult->tiledAndFusedOps.front()); |
| return success(); |
| } |
| |
| private: |
| scf::SCFTileAndFuseOptions options; |
| TransformationFilter filter; |
| }; |
| |
| /// Pattern to tile a consumer and fuse producer with it |
| /// while reconstructing the value of the fused producer |
| /// from within the loop nest to replace any external |
| /// uses of the producer. In general yielding the producer |
| /// this way requires a guarantee that the slice of the producer |
| /// is not computed redundantly within the tiled loops. An analysis that |
| /// figures it out has shown to be very complex. So this is left as a caller |
| /// side determination. In this test pattern it is assumed that the tile sizes |
| /// are selected such that all producers when fused into the tiled loops do no |
| /// have redundant computation. |
| struct TestTileConsumerFuseAndYieldProducerUsingSCFForOp |
| : public OpInterfaceRewritePattern<TilingInterface> { |
| |
| TestTileConsumerFuseAndYieldProducerUsingSCFForOp( |
| MLIRContext *context, scf::SCFTilingOptions options, |
| TransformationFilter filter = TransformationFilter(), |
| PatternBenefit benefit = 1) |
| : OpInterfaceRewritePattern<TilingInterface>(context, benefit), |
| options(std::move(options)), filter(std::move(filter)) {} |
| |
| LogicalResult matchAndRewrite(TilingInterface rootOp, |
| PatternRewriter &rewriter) const override { |
| if (failed(filter.checkAndNotify(rewriter, rootOp))) |
| return failure(); |
| |
| // Collect list of operations that can be tiled and fused. |
| llvm::SmallDenseSet<Operation *> tiledAndFusedOps = |
| collectTiledAndFusedOps(rootOp); |
| auto isIgnoredUser = [&](Operation *user, scf::ForOp outerMostTiledLoop) { |
| return tiledAndFusedOps.count(user) || isa<tensor::DimOp>(user) || |
| outerMostTiledLoop->isAncestor(user); |
| }; |
| |
| // The rest of this method is similar to |
| // scf::tileConsumerAndFuseProducerGreedilyUsingSCFForOp, except that also |
| // yields replacements for values of the fused producer. |
| |
| // 1. Tile the consumer. |
| SmallVector<OpResult> yieldedValuesToOrigValues; |
| FailureOr<scf::SCFTilingResult> tilingResult = |
| scf::tileUsingSCFForOp(rewriter, rootOp, options); |
| if (failed(tilingResult)) { |
| return rewriter.notifyMatchFailure(rootOp, |
| "failed to tile base operation"); |
| } |
| yieldedValuesToOrigValues.append(rootOp->result_begin(), |
| rootOp->result_end()); |
| |
| // 2. Tiling each operation results in generation of slices. The source of |
| // these slices could be producers that can be fused into the tiled loops by |
| // computing the slices of these producers in-place. This results in more |
| // slices created for operands of the "fused producer". This open up more |
| // opportunities for fusion. Use a worklist to fuse greedily. |
| auto addCandidateSlices = |
| [](Operation *fusedOp, std::deque<tensor::ExtractSliceOp> &candidates) { |
| for (Value operand : fusedOp->getOperands()) |
| if (auto sliceOp = operand.getDefiningOp<tensor::ExtractSliceOp>()) |
| candidates.push_back(sliceOp); |
| }; |
| |
| std::deque<tensor::ExtractSliceOp> candidates; |
| addCandidateSlices(tilingResult->tiledOps.back(), candidates); |
| OpBuilder::InsertionGuard g(rewriter); |
| auto forLoops = llvm::to_vector(llvm::map_range( |
| tilingResult->loops, [](auto op) { return cast<scf::ForOp>(op); })); |
| while (!candidates.empty()) { |
| // Traverse the slices in BFS fashion. |
| tensor::ExtractSliceOp candidateSliceOp = candidates.front(); |
| candidates.pop_front(); |
| |
| // Materialize the slice of the producer in place. |
| std::optional<scf::SCFFuseProducerOfSliceResult> fusedProducer = |
| tileAndFuseProducerOfSlice(rewriter, candidateSliceOp, forLoops); |
| if (!fusedProducer) |
| continue; |
| |
| // Check if the fused producer has other uses that require the value |
| // to be yielded from within the tiled loop. |
| OpResult untiledProducer = fusedProducer->origProducer; |
| if (llvm::any_of(untiledProducer.getUsers(), [&](Operation *user) { |
| return !isIgnoredUser(user, forLoops.front()); |
| })) { |
| yieldReplacementForFusedProducer(rewriter, candidateSliceOp, |
| fusedProducer.value(), forLoops); |
| yieldedValuesToOrigValues.push_back(untiledProducer); |
| } |
| |
| // Add more fusion candidates to the worklist. |
| if (auto fusedProducerOp = |
| fusedProducer->tiledAndFusedProducer.getDefiningOp()) |
| addCandidateSlices(fusedProducerOp, candidates); |
| } |
| |
| scf::ForOp outermostLoop = forLoops.front(); |
| for (auto [index, origVal] : llvm::enumerate(yieldedValuesToOrigValues)) { |
| Value replacement = outermostLoop.getResult(index); |
| rewriter.replaceUsesWithIf(origVal, replacement, [&](OpOperand &use) { |
| return !isIgnoredUser(use.getOwner(), outermostLoop); |
| }); |
| } |
| rewriter.eraseOp(rootOp); |
| filter.replaceTransformationFilter(rewriter, tilingResult->tiledOps.back()); |
| return success(); |
| } |
| |
| private: |
| /// Starting from `op` walk all operands backwards to find all |
| /// potentially fusable operations, i.e. operations that implement |
| /// the `TilingInterface`. |
| llvm::SmallDenseSet<Operation *> |
| collectTiledAndFusedOps(Operation *op) const { |
| SmallVector<Operation *> worklist; |
| llvm::SmallDenseSet<Operation *> producers; |
| worklist.push_back(op); |
| producers.insert(op); |
| while (!worklist.empty()) { |
| Operation *current = worklist.pop_back_val(); |
| for (OpOperand &operand : current->getOpOperands()) { |
| Operation *producer = operand.get().getDefiningOp(); |
| if (!producer || !isa<TilingInterface>(producer) || |
| producers.count(producer)) |
| continue; |
| worklist.push_back(producer); |
| producers.insert(producer); |
| } |
| } |
| return producers; |
| } |
| |
| scf::SCFTilingOptions options; |
| TransformationFilter filter; |
| }; |
| |
| /// Pattern to lower operations that implement the `TilingInterface` to |
| /// loops/scalar IR using `scf.for`. |
| struct LowerToLoopsUsingSCFForOp |
| : public OpInterfaceRewritePattern<TilingInterface> { |
| using OpInterfaceRewritePattern<TilingInterface>::OpInterfaceRewritePattern; |
| |
| /// `matchAndRewrite` implementation that returns the significant transformed |
| /// pieces of IR. |
| LogicalResult matchAndRewrite(TilingInterface op, |
| PatternRewriter &rewriter) const override { |
| FailureOr<SmallVector<scf::ForOp>> loops = |
| scf::lowerToLoopsUsingSCFForOp(rewriter, op); |
| if (failed(loops)) |
| return rewriter.notifyMatchFailure(op, "failed to lower to loops"); |
| rewriter.eraseOp(op); |
| return loops; |
| } |
| }; |
| |
| /// Test pass for testing the use of `TilingInterface`. |
| struct TestTilingInterfacePass |
| : public PassWrapper<TestTilingInterfacePass, OperationPass<func::FuncOp>> { |
| MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(TestTilingInterfacePass) |
| |
| TestTilingInterfacePass() = default; |
| TestTilingInterfacePass(const TestTilingInterfacePass &pass) |
| : PassWrapper(pass) {} |
| void getDependentDialects(DialectRegistry ®istry) const override { |
| registry.insert<affine::AffineDialect, gpu::GPUDialect, |
| linalg::LinalgDialect, memref::MemRefDialect, |
| scf::SCFDialect, tensor::TensorDialect>(); |
| linalg::registerTilingInterfaceExternalModels(registry); |
| tensor::registerTilingInterfaceExternalModels(registry); |
| } |
| StringRef getArgument() const final { return "test-tiling-interface"; } |
| StringRef getDescription() const final { |
| return "Test tiling using TilingInterface"; |
| } |
| |
| Option<bool> testTiling{ |
| *this, "tile-using-scf-for", |
| llvm::cl::desc( |
| "Test tiling using TilingInterface with scf.for operations"), |
| llvm::cl::init(false)}; |
| |
| Option<bool> testTilingForAll{ |
| *this, "tile-using-scf-forall", |
| llvm::cl::desc( |
| "Test tiling using TilingInterface with scf.forall operations"), |
| llvm::cl::init(false)}; |
| |
| Option<bool> testTileConsumerFuseAndYieldProducer{ |
| *this, "tile-consumer-fuse-and-yield-producer-using-scf-for", |
| llvm::cl::desc( |
| "Test tile and fuse transformation while yielding fused producer " |
| "replacements using TilingInterface with scf.for operations"), |
| llvm::cl::init(false)}; |
| |
| Option<bool> testTileConsumerAndFuseProducer{ |
| *this, "tile-consumer-and-fuse-producer-using-scf-for", |
| llvm::cl::desc("Test tile and fuse transformation using TilingInterface " |
| "with scf.for operations"), |
| llvm::cl::init(false)}; |
| |
| Option<bool> testLoweringToScalar{ |
| *this, "lower-to-scalar-using-scf-for", |
| llvm::cl::desc("Test lowering to scalar implementation using " |
| "TilingInterface with scf.for operations"), |
| llvm::cl::init(false)}; |
| |
| void runOnOperation() override; |
| |
| private: |
| void addTestPatterns(MLIRContext *context, RewritePatternSet &patterns); |
| }; |
| } // namespace |
| |
| static void addPatternForTiling(MLIRContext *context, |
| RewritePatternSet &patterns, |
| StringRef filterName, |
| ArrayRef<int64_t> tileSizes, |
| ArrayRef<int64_t> interchange = {}) { |
| scf::SCFTilingOptions tilingOptions; |
| SmallVector<OpFoldResult> tileSizesOfr = |
| getAsIndexOpFoldResult(context, tileSizes); |
| tilingOptions.setTileSizes(tileSizesOfr).setInterchange(interchange); |
| TransformationFilter filter(StringAttr::get(context, filterName), |
| StringAttr::get(context, "tiled")); |
| patterns.add<TestTileUsingSCFForOp>(context, tilingOptions, filter); |
| } |
| |
| static void addPatternForTilingUsingForall( |
| MLIRContext *context, RewritePatternSet &patterns, StringRef filterName, |
| ArrayRef<int64_t> tileSizes, |
| ArrayRef<DeviceMappingAttrInterface> mapping = {}, |
| ArrayRef<int64_t> interchange = {}) { |
| scf::SCFTilingOptions tilingOptions; |
| SmallVector<OpFoldResult> tileSizesOfr = |
| getAsIndexOpFoldResult(context, tileSizes); |
| tilingOptions.setTileSizes(tileSizesOfr).setInterchange(interchange); |
| tilingOptions.setMapping(mapping); |
| TransformationFilter filter(StringAttr::get(context, filterName), |
| StringAttr::get(context, "tiled")); |
| patterns.add<TestTileUsingSCFForallOp>(context, tilingOptions, filter); |
| } |
| |
| static void addPatternForTileFuseAndYield(MLIRContext *context, |
| RewritePatternSet &patterns, |
| StringRef filterName, |
| ArrayRef<int64_t> tileSizes, |
| ArrayRef<int64_t> interchange = {}) { |
| scf::SCFTilingOptions tilingOptions; |
| SmallVector<OpFoldResult> tileSizesOfr = |
| getAsIndexOpFoldResult(context, tileSizes); |
| tilingOptions.setTileSizes(tileSizesOfr).setInterchange(interchange); |
| TransformationFilter filter(StringAttr::get(context, filterName), |
| StringAttr::get(context, "tiled")); |
| patterns.add<TestTileConsumerFuseAndYieldProducerUsingSCFForOp>( |
| context, tilingOptions, filter); |
| } |
| |
| static void addPatternForTileAndFuse(MLIRContext *context, |
| RewritePatternSet &patterns, |
| StringRef filterName, |
| ArrayRef<int64_t> tileSizes, |
| ArrayRef<int64_t> interchange = {}) { |
| scf::SCFTileAndFuseOptions tileAndFuseOptions; |
| SmallVector<OpFoldResult> tileSizesOfr = |
| getAsIndexOpFoldResult(context, tileSizes); |
| tileAndFuseOptions.tilingOptions.setTileSizes(tileSizesOfr) |
| .setInterchange(interchange); |
| TransformationFilter filter(StringAttr::get(context, filterName), |
| StringAttr::get(context, "tiled")); |
| patterns.add<TestTileConsumerAndFuseProducersGreedilyUsingSCFForOp>( |
| context, tileAndFuseOptions, filter); |
| } |
| |
| void TestTilingInterfacePass::addTestPatterns(MLIRContext *context, |
| RewritePatternSet &patterns) { |
| if (testTiling) { |
| // 1. Tiling M and N dims of `linalg.matmul` on tensors. |
| addPatternForTiling(context, patterns, "simple_gemm", {10, 20}); |
| // 2. Tiling M, N and K of `linalg.matmul` on buffers. |
| addPatternForTiling(context, patterns, "simple_gemm_memref", {10, 20, 30}); |
| // 3. Tiling 3D parallel generic op which implements a transpose |
| addPatternForTiling(context, patterns, "parallel_generic_transpose", |
| {10, 0, 20}); |
| // 4. Tiling 2D conv op. |
| addPatternForTiling(context, patterns, "simple_conv", |
| {0, 0, 0, 0, 10, 20, 30}); |
| // 5. Tiling a simple op with `linalg.index` inside. |
| addPatternForTiling(context, patterns, "indexed_semantics", {10, 20}); |
| // 6. Tiling + interchange of an operation |
| addPatternForTiling(context, patterns, "gemm_interchange", {10, 20, 30}, |
| {1, 2, 0}); |
| // 7. Tiling for 2D pad tensor operations. |
| addPatternForTiling(context, patterns, "pad_2dtiling", {2, 3}); |
| // 8. Tiling inner dimension of 2d pad tensor operations. |
| addPatternForTiling(context, patterns, "pad_inner_tiling", {0, 3}); |
| // 9. Tiling inner dimension of 2d pad tensor operations. |
| addPatternForTiling(context, patterns, "pad_outer_tiling", {2, 3}); |
| // 10. Tiling M and N dims of `linalg.copy` on memrefs. |
| addPatternForTiling(context, patterns, "simple_copy_memref", {10, 20}); |
| // 11. Tiling scalar operations. |
| addPatternForTiling(context, patterns, "scalar_op", {}); |
| return; |
| } |
| if (testTilingForAll) { |
| // 1. Tiling M and N dims of `linalg.matmul` on tensors. |
| addPatternForTilingUsingForall( |
| context, patterns, "simple_gemm", {10, 20}, |
| {gpu::GPUBlockMappingAttr::get(context, gpu::MappingId::DimY), |
| gpu::GPUBlockMappingAttr::get(context, gpu::MappingId::DimX)}); |
| // 2. Tiling 3D parallel generic op which implements a transpose. |
| addPatternForTilingUsingForall(context, patterns, |
| "parallel_generic_transpose", {10, 0, 20}); |
| // 3. Tiling 2D conv op. |
| addPatternForTilingUsingForall(context, patterns, "simple_conv", |
| {0, 0, 0, 0, 10, 20, 30}); |
| // 4. Tiling a simple op with `linalg.index` inside. |
| addPatternForTilingUsingForall(context, patterns, "indexed_semantics", |
| {10, 20}); |
| return; |
| } |
| if (testTileConsumerAndFuseProducer) { |
| // 1. Tile and fuse of gemm with fill producer and bias-add consumer. |
| addPatternForTileAndFuse(context, patterns, "fusion", {10, 20}); |
| // 2. Tile and fuse sequence of GEMMs, by fusing only along M. |
| addPatternForTileAndFuse(context, patterns, "gemm_fusion", {10}); |
| // 3. Tile and fuse gemm with consumer + interchange of tiled loops. |
| addPatternForTileAndFuse(context, patterns, "gemm_interchange_fusion", |
| {10, 20}, {1, 0}); |
| // 4. Tile and fuse matmul + transpose(matmul). Will introduce redundant |
| // computations. |
| addPatternForTileAndFuse(context, patterns, "gemm_plus_gemm_fusion", |
| {10, 20}); |
| // 5. Tile and fuse a sequence of GEMMs by tiling and fusing only along M |
| // dimension. |
| addPatternForTileAndFuse(context, patterns, "gemm_sequence_fusion", {10}); |
| // 6. Fusion of back-to-back-reduction ops |
| addPatternForTileAndFuse(context, patterns, "reduction_sequence_fusion", |
| {10}); |
| return; |
| } |
| if (testTileConsumerFuseAndYieldProducer) { |
| // 1. Fusion of back-to-back-reduction ops |
| addPatternForTileFuseAndYield(context, patterns, |
| "gemm_sequence_fusion_and_yield", {10}); |
| return; |
| } |
| if (testLoweringToScalar) { |
| patterns.add<LowerToLoopsUsingSCFForOp>(context); |
| } |
| } |
| |
| void TestTilingInterfacePass::runOnOperation() { |
| MLIRContext *context = &getContext(); |
| |
| RewritePatternSet tilingPatterns(context); |
| addTestPatterns(context, tilingPatterns); |
| if (failed(applyPatternsAndFoldGreedily(getOperation(), |
| std::move(tilingPatterns)))) |
| return signalPassFailure(); |
| } |
| |
| namespace mlir { |
| namespace test { |
| void registerTestTilingInterface() { |
| PassRegistration<TestTilingInterfacePass>(); |
| } |
| } // namespace test |
| } // namespace mlir |