#include "mlir/Dialect/Arith/IR/Arith.h"
#include "mlir/Dialect/Func/IR/FuncOps.h"
#include "mlir/Dialect/GPU/Transforms/Passes.h"
#include "mlir/Dialect/Index/IR/IndexDialect.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/Vector/IR/VectorOps.h"
#include "mlir/IR/PatternMatch.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Transforms/GreedyPatternRewriteDriver.h"
using namespace mlir;
namespace {
/// Test-only module pass that collects the GPU dialect rewrite patterns via
/// `populateGpuRewritePatterns` and applies them with the greedy pattern
/// rewrite driver. Exposed on the command line as `test-gpu-rewrite`.
struct TestGpuRewritePass
    : public PassWrapper<TestGpuRewritePass, OperationPass<ModuleOp>> {
  MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(TestGpuRewritePass)

  /// Registers the arith, func, index and memref dialects as dependencies of
  /// this pass.
  void getDependentDialects(DialectRegistry &registry) const override {
    registry.insert<arith::ArithDialect, func::FuncDialect, index::IndexDialect,
                    memref::MemRefDialect>();
  }

  /// Command-line flag used to select this pass.
  StringRef getArgument() const final { return "test-gpu-rewrite"; }

  /// One-line summary of what the pass does.
  StringRef getDescription() const final {
    return "Applies all rewrite patterns within the GPU dialect.";
  }

  /// Populates the GPU rewrite patterns and runs them greedily over the
  /// module this pass is anchored on.
  void runOnOperation() override {
    RewritePatternSet patterns(&getContext());
    populateGpuRewritePatterns(patterns);
    // The driver's result is deliberately discarded: the pass does not signal
    // failure based on it.
    (void)applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
  }
};
/// Test-only module pass that applies the `gpu.subgroup_reduce` break-down
/// patterns and, when `expand-to-shuffles` is set, the patterns that lower
/// subgroup reductions to shuffle ops. Exposed on the command line as
/// `test-gpu-subgroup-reduce-lowering`.
struct TestGpuSubgroupReduceLoweringPass
    : public PassWrapper<TestGpuSubgroupReduceLoweringPass,
                         OperationPass<ModuleOp>> {
  MLIR_DEFINE_EXPLICIT_INTERNAL_INLINE_TYPE_ID(
      TestGpuSubgroupReduceLoweringPass)

  TestGpuSubgroupReduceLoweringPass() = default;

  /// Copy-constructs only the `PassWrapper` base. `expandToShuffles` is not
  /// copied member-wise; it is rebuilt from its default member initializer and
  /// is therefore bound to the new `*this`.
  TestGpuSubgroupReduceLoweringPass(
      const TestGpuSubgroupReduceLoweringPass &pass)
      : PassWrapper(pass) {}

  /// Registers the arith and vector dialects as dependencies of this pass.
  void getDependentDialects(DialectRegistry &registry) const override {
    registry.insert<arith::ArithDialect, vector::VectorDialect>();
  }

  /// Command-line flag used to select this pass.
  StringRef getArgument() const final {
    return "test-gpu-subgroup-reduce-lowering";
  }

  /// One-line summary of what the pass does.
  StringRef getDescription() const final {
    return "Applies gpu.subgroup_reduce lowering patterns.";
  }

  /// Pass option `expand-to-shuffles` (default: false). When true, the
  /// shuffle-lowering patterns are added in `runOnOperation`.
  Option<bool> expandToShuffles{
      *this, "expand-to-shuffles",
      llvm::cl::desc("Expand subgroup_reduce ops to shuffle ops."),
      llvm::cl::init(false)};

  /// Builds the pattern set according to the pass options and applies it
  /// greedily to the module this pass is anchored on.
  void runOnOperation() override {
    RewritePatternSet patterns(&getContext());

    // The break-down patterns get an explicit benefit of 2 -- presumably so
    // they are preferred over the shuffle-lowering patterns added below, which
    // are registered without an explicit benefit.
    // NOTE(review): the "Subgrup" spelling matches the declaration in
    // mlir/Dialect/GPU/Transforms/Passes.h at this revision; keep in sync.
    populateGpuBreakDownSubgrupReducePatterns(patterns,
                                              /*maxShuffleBitwidth=*/32,
                                              PatternBenefit(2));

    // NOTE(review): the "Pattenrs" spelling likewise mirrors the upstream
    // declaration.
    if (expandToShuffles)
      populateGpuLowerSubgroupReduceToShufflePattenrs(
          patterns, /*subgroupSize=*/32, /*shuffleBitwidth=*/32);

    // The driver's result is deliberately discarded: the pass does not signal
    // failure based on it.
    (void)applyPatternsAndFoldGreedily(getOperation(), std::move(patterns));
  }
};
}
namespace mlir {
void registerTestGpuLoweringPasses() {
PassRegistration<TestGpuRewritePass>();
PassRegistration<TestGpuSubgroupReduceLoweringPass>();
}
}