xref: /llvm-project/mlir/lib/Conversion/SCFToGPU/SCFToGPUPass.cpp (revision 4c48f016effde67d500fc95290096aec9f3bdb70)
//===- SCFToGPUPass.cpp - Convert a loop nest to a GPU kernel -----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

94ead2cf7SAlex Zinenko #include "mlir/Conversion/SCFToGPU/SCFToGPUPass.h"
1067d0d7acSMichele Scuttari 
114ead2cf7SAlex Zinenko #include "mlir/Conversion/SCFToGPU/SCFToGPU.h"
124ead2cf7SAlex Zinenko #include "mlir/Dialect/Affine/IR/AffineOps.h"
13abc362a1SJakub Kuderski #include "mlir/Dialect/Arith/IR/Arith.h"
14b1e1bbaeSAlexander Belyaev #include "mlir/Dialect/Complex/IR/Complex.h"
15d7ef488bSMogball #include "mlir/Dialect/GPU/IR/GPUDialect.h"
168b68da2cSAlex Zinenko #include "mlir/Dialect/SCF/IR/SCF.h"
1767d0d7acSMichele Scuttari #include "mlir/Pass/Pass.h"
184ead2cf7SAlex Zinenko #include "mlir/Transforms/DialectConversion.h"
194ead2cf7SAlex Zinenko #include "llvm/ADT/ArrayRef.h"
204ead2cf7SAlex Zinenko #include "llvm/Support/CommandLine.h"
214ead2cf7SAlex Zinenko 
2267d0d7acSMichele Scuttari namespace mlir {
2367d0d7acSMichele Scuttari #define GEN_PASS_DEF_CONVERTAFFINEFORTOGPU
2467d0d7acSMichele Scuttari #define GEN_PASS_DEF_CONVERTPARALLELLOOPTOGPU
2567d0d7acSMichele Scuttari #include "mlir/Conversion/Passes.h.inc"
2667d0d7acSMichele Scuttari } // namespace mlir
2767d0d7acSMichele Scuttari 
284ead2cf7SAlex Zinenko using namespace mlir;
294ead2cf7SAlex Zinenko using namespace mlir::scf;
304ead2cf7SAlex Zinenko 
314ead2cf7SAlex Zinenko namespace {
324ead2cf7SAlex Zinenko // A pass that traverses top-level loops in the function and converts them to
334ead2cf7SAlex Zinenko // GPU launch operations.  Nested launches are not allowed, so this does not
344ead2cf7SAlex Zinenko // walk the function recursively to avoid considering nested loops.
3567d0d7acSMichele Scuttari struct ForLoopMapper : public impl::ConvertAffineForToGPUBase<ForLoopMapper> {
364ead2cf7SAlex Zinenko   ForLoopMapper() = default;
ForLoopMapper__anond710c38d0111::ForLoopMapper374ead2cf7SAlex Zinenko   ForLoopMapper(unsigned numBlockDims, unsigned numThreadDims) {
384ead2cf7SAlex Zinenko     this->numBlockDims = numBlockDims;
394ead2cf7SAlex Zinenko     this->numThreadDims = numThreadDims;
404ead2cf7SAlex Zinenko   }
414ead2cf7SAlex Zinenko 
runOnOperation__anond710c38d0111::ForLoopMapper4241574554SRiver Riddle   void runOnOperation() override {
43ecba7c58SRiver Riddle     for (Operation &op : llvm::make_early_inc_range(
44ecba7c58SRiver Riddle              getOperation().getFunctionBody().getOps())) {
45*4c48f016SMatthias Springer       if (auto forOp = dyn_cast<affine::AffineForOp>(&op)) {
464ead2cf7SAlex Zinenko         if (failed(convertAffineLoopNestToGPULaunch(forOp, numBlockDims,
474ead2cf7SAlex Zinenko                                                     numThreadDims)))
484ead2cf7SAlex Zinenko           signalPassFailure();
494ead2cf7SAlex Zinenko       }
504ead2cf7SAlex Zinenko     }
514ead2cf7SAlex Zinenko   }
524ead2cf7SAlex Zinenko };
534ead2cf7SAlex Zinenko 
544ead2cf7SAlex Zinenko struct ParallelLoopToGpuPass
5567d0d7acSMichele Scuttari     : public impl::ConvertParallelLoopToGpuBase<ParallelLoopToGpuPass> {
runOnOperation__anond710c38d0111::ParallelLoopToGpuPass564ead2cf7SAlex Zinenko   void runOnOperation() override {
57dc4e913bSChris Lattner     RewritePatternSet patterns(&getContext());
583a506b31SChris Lattner     populateParallelLoopToGPUPatterns(patterns);
594ead2cf7SAlex Zinenko     ConversionTarget target(getContext());
6033a58c1cSStephan Herhut     target.markUnknownOpDynamicallyLegal([](Operation *) { return true; });
615da2423bSStephan Herhut     configureParallelLoopToGPULegality(target);
623fffffa8SRiver Riddle     if (failed(applyPartialConversion(getOperation(), target,
633fffffa8SRiver Riddle                                       std::move(patterns))))
644ead2cf7SAlex Zinenko       signalPassFailure();
65ec03bbe8SVladislav Vinogradov     finalizeParallelLoopToGPUConversion(getOperation());
664ead2cf7SAlex Zinenko   }
674ead2cf7SAlex Zinenko };
684ead2cf7SAlex Zinenko 
694ead2cf7SAlex Zinenko } // namespace
704ead2cf7SAlex Zinenko 
7147f175b0SRiver Riddle std::unique_ptr<InterfacePass<FunctionOpInterface>>
createAffineForToGPUPass(unsigned numBlockDims,unsigned numThreadDims)722bcd1927SMaheshRavishankar mlir::createAffineForToGPUPass(unsigned numBlockDims, unsigned numThreadDims) {
734ead2cf7SAlex Zinenko   return std::make_unique<ForLoopMapper>(numBlockDims, numThreadDims);
744ead2cf7SAlex Zinenko }
7547f175b0SRiver Riddle std::unique_ptr<InterfacePass<FunctionOpInterface>>
createAffineForToGPUPass()7647f175b0SRiver Riddle mlir::createAffineForToGPUPass() {
774ead2cf7SAlex Zinenko   return std::make_unique<ForLoopMapper>();
784ead2cf7SAlex Zinenko }
79039b969bSMichele Scuttari 
createParallelLoopToGpuPass()80039b969bSMichele Scuttari std::unique_ptr<Pass> mlir::createParallelLoopToGpuPass() {
81039b969bSMichele Scuttari   return std::make_unique<ParallelLoopToGpuPass>();
82039b969bSMichele Scuttari }
83