mlir/lib/Conversion/SCFToGPU/SCFToGPUPass.cpp

//===- SCFToGPUPass.cpp - Convert a loop nest to a GPU kernel -----------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "mlir/Conversion/SCFToGPU/SCFToGPUPass.h"
#include "../PassDetail.h"
#include "mlir/Conversion/SCFToGPU/SCFToGPU.h"
#include "mlir/Dialect/Affine/IR/AffineOps.h"
#include "mlir/Dialect/GPU/GPUDialect.h"
#include "mlir/Dialect/SCF/SCF.h"
#include "mlir/Dialect/StandardOps/IR/Ops.h"
#include "mlir/Transforms/DialectConversion.h"

#include "llvm/ADT/ArrayRef.h"
#include "llvm/Support/CommandLine.h"

using namespace mlir;
using namespace mlir::scf;

namespace {
// Function pass that visits only the operations nested immediately inside the
// function body and hands every AffineForOp found there to
// convertAffineLoopNestToGPULaunch.  The walk is deliberately non-recursive:
// nested launches are not allowed, so loops nested inside other operations
// must not be considered on their own.
struct ForLoopMapper : public ConvertAffineForToGPUBase<ForLoopMapper> {
  ForLoopMapper() = default;

  // Overrides the numBlockDims / numThreadDims members inherited from the
  // pass base class with the values supplied by the caller.
  ForLoopMapper(unsigned numBlockDims, unsigned numThreadDims) {
    this->numBlockDims = numBlockDims;
    this->numThreadDims = numThreadDims;
  }

  void runOnFunction() override {
    // The early-increment range advances the iterator before the loop body
    // runs, so the current operation may be replaced during the conversion.
    auto topLevelOps = llvm::make_early_inc_range(getFunction().getOps());
    for (Operation &candidate : topLevelOps) {
      auto affineLoop = dyn_cast<AffineForOp>(&candidate);
      if (!affineLoop)
        continue;

      // A failed conversion marks the pass as failed; the remaining
      // top-level operations are still visited.
      if (failed(convertAffineLoopNestToGPULaunch(affineLoop, numBlockDims,
                                                  numThreadDims)))
        signalPassFailure();
    }
  }
};

// Pass that runs a partial dialect conversion over the current operation
// using the patterns registered by populateParallelLoopToGPUPatterns.  The
// conversion target declares scf::ParallelOp illegal, so the pass fails if
// the conversion does not succeed.
struct ParallelLoopToGpuPass
    : public ConvertParallelLoopToGpuBase<ParallelLoopToGpuPass> {
  void runOnOperation() override {
    auto &context = getContext();

    // Legality: the Standard, Affine, GPU and SCF dialects are declared
    // legal as a whole; scf::ParallelOp is then singled out as illegal.
    ConversionTarget target(context);
    target.addLegalDialect<StandardOpsDialect>();
    target.addLegalDialect<AffineDialect>();
    target.addLegalDialect<gpu::GPUDialect>();
    target.addLegalDialect<scf::SCFDialect>();
    target.addIllegalOp<scf::ParallelOp>();

    // Rewrite patterns used by the conversion driver.
    OwningRewritePatternList patterns;
    populateParallelLoopToGPUPatterns(patterns, &context);

    auto status = applyPartialConversion(getOperation(), target, patterns);
    if (failed(status))
      signalPassFailure();
  }
};

} // namespace

/// Creates a ForLoopMapper pass whose numBlockDims and numThreadDims are set
/// to the given values; the pass forwards them to
/// convertAffineLoopNestToGPULaunch for every top-level affine loop.
std::unique_ptr<OperationPass<FuncOp>>
mlir::createAffineForToGPUPass(unsigned numBlockDims, unsigned numThreadDims) {
  std::unique_ptr<OperationPass<FuncOp>> pass =
      std::make_unique<ForLoopMapper>(numBlockDims, numThreadDims);
  return pass;
}
/// Creates a default-constructed ForLoopMapper pass, i.e. one that leaves
/// numBlockDims and numThreadDims at whatever the pass base class provides.
std::unique_ptr<OperationPass<FuncOp>> mlir::createAffineForToGPUPass() {
  std::unique_ptr<OperationPass<FuncOp>> pass =
      std::make_unique<ForLoopMapper>();
  return pass;
}

/// Creates an instance of ParallelLoopToGpuPass, returned through the generic
/// Pass interface.
std::unique_ptr<Pass> mlir::createParallelLoopToGpuPass() {
  std::unique_ptr<Pass> pass = std::make_unique<ParallelLoopToGpuPass>();
  return pass;
}
[mlir] Rename conversions involving ex-Loop dialect to mention SCF 2020-05-14 14:41:35 +02:00			`//===- SCFToGPUPass.cpp - Convert a loop nest to a GPU kernel -----------===//`
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00			`//`
Mass update the MLIR license header to mention "Part of the LLVM project" 2020-01-26 03:58:30 +00:00			`// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.`
Adjust License.txt file to use the LLVM license 2019-12-23 09:35:36 -08:00			`// See https://llvm.org/LICENSE.txt for license information.`
			`// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception`
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00			`//`
Adjust License.txt file to use the LLVM license 2019-12-23 09:35:36 -08:00			`//===----------------------------------------------------------------------===//`
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00
[mlir] Rename conversions involving ex-Loop dialect to mention SCF 2020-05-14 14:41:35 +02:00			`#include "mlir/Conversion/SCFToGPU/SCFToGPUPass.h"`
[mlir][Pass] Update the PassGen to generate base classes instead of utilities 2020-04-07 13:58:12 -07:00			`#include "../PassDetail.h"`
[mlir] Rename conversions involving ex-Loop dialect to mention SCF 2020-05-14 14:41:35 +02:00			`#include "mlir/Conversion/SCFToGPU/SCFToGPU.h"`
[mlir][NFC] Cleanup AffineOps directory structure 2020-03-20 14:18:47 -07:00			`#include "mlir/Dialect/Affine/IR/AffineOps.h"`
[MLIR][GPU] Properly model step in parallel loop to gpu conversion. 2020-02-24 16:02:50 +01:00			`#include "mlir/Dialect/GPU/GPUDialect.h"`
[mlir] NFC: Rename LoopOps dialect to SCF (Structured Control Flow) 2020-05-11 15:00:48 +02:00			`#include "mlir/Dialect/SCF/SCF.h"`
Move StandardOps/Ops.h to StandardOps/IR/Ops.h 2020-02-21 11:54:49 -08:00			`#include "mlir/Dialect/StandardOps/IR/Ops.h"`
[MLIR][GPU] Properly model step in parallel loop to gpu conversion. 2020-02-24 16:02:50 +01:00			`#include "mlir/Transforms/DialectConversion.h"`
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00
Support lowering of imperfectly nested loops into GPU dialect. 2019-11-01 10:51:33 -07:00			`#include "llvm/ADT/ArrayRef.h"`
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00			`#include "llvm/Support/CommandLine.h"`

			`using namespace mlir;`
[mlir] NFC: Rename LoopOps dialect to SCF (Structured Control Flow) 2020-05-11 15:00:48 +02:00			`using namespace mlir::scf;`
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00
			`namespace {`
			`// A pass that traverses top-level loops in the function and converts them to`
			`// GPU launch operations. Nested launches are not allowed, so this does not`
			`// walk the function recursively to avoid considering nested loops.`
[mlir][SCFToGPU] Remove conversions from scf.for to gpu.launch. 2020-06-01 22:42:33 -07:00			`struct ForLoopMapper : public ConvertAffineForToGPUBase<ForLoopMapper> {`
[mlir] Move several static cl::opts to be pass options instead. 2020-03-21 15:08:49 -07:00			`ForLoopMapper() = default;`
			`ForLoopMapper(unsigned numBlockDims, unsigned numThreadDims) {`
			`this->numBlockDims = numBlockDims;`
			`this->numThreadDims = numThreadDims;`
			`}`
Expose AffineToGPUPass for use with PassManager 2019-07-01 00:47:58 -07:00
Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00			`void runOnFunction() override {`
[mlir][IR] Add a Region::getOps method that returns a range of immediately nested operations 2020-05-04 17:46:06 -07:00			`for (Operation &op : llvm::make_early_inc_range(getFunction().getOps())) {`
			`if (auto forOp = dyn_cast<AffineForOp>(&op)) {`
			`if (failed(convertAffineLoopNestToGPULaunch(forOp, numBlockDims,`
			`numThreadDims)))`
			`signalPassFailure();`
Support lowering of imperfectly nested loops into GPU dialect. 2019-11-01 10:51:33 -07:00			`}`
			`}`
			`}`
			`};`

[mlir][Pass] Remove the use of CRTP from the Pass classes 2020-04-07 13:56:16 -07:00			`struct ParallelLoopToGpuPass`
[mlir][Pass] Update the PassGen to generate base classes instead of utilities 2020-04-07 13:58:12 -07:00			`: public ConvertParallelLoopToGpuBase<ParallelLoopToGpuPass> {`
[MLIR][GPU] Properly model step in parallel loop to gpu conversion. 2020-02-24 16:02:50 +01:00			`void runOnOperation() override {`
			`OwningRewritePatternList patterns;`
			`populateParallelLoopToGPUPatterns(patterns, &getContext());`
			`ConversionTarget target(getContext());`
			`target.addLegalDialect<StandardOpsDialect>();`
[mlir][NFC] Cleanup AffineOps directory structure 2020-03-20 14:18:47 -07:00			`target.addLegalDialect<AffineDialect>();`
[MLIR][GPU] Properly model step in parallel loop to gpu conversion. 2020-02-24 16:02:50 +01:00			`target.addLegalDialect<gpu::GPUDialect>();`
[mlir] NFC: Rename LoopOps dialect to SCF (Structured Control Flow) 2020-05-11 15:00:48 +02:00			`target.addLegalDialect<scf::SCFDialect>();`
			`target.addIllegalOp<scf::ParallelOp>();`
[MLIR][GPU] Properly model step in parallel loop to gpu conversion. 2020-02-24 16:02:50 +01:00			`if (failed(applyPartialConversion(getOperation(), target, patterns)))`
			`signalPassFailure();`
			`}`
			`};`

Convert a nest affine loops to a GPU kernel 2019-06-14 01:56:19 -07:00			`} // namespace`

[mlir][Pass] Remove the use of CRTP from the Pass classes 2020-04-07 13:56:16 -07:00			`std::unique_ptr<OperationPass<FuncOp>>`
[mlir][SCFToGPU] Remove conversions from scf.for to gpu.launch. 2020-06-01 22:42:33 -07:00			`mlir::createAffineForToGPUPass(unsigned numBlockDims, unsigned numThreadDims) {`
Change from llvm::make_unique to std::make_unique 2019-08-17 11:05:35 -07:00			`return std::make_unique<ForLoopMapper>(numBlockDims, numThreadDims);`
Expose AffineToGPUPass for use with PassManager 2019-07-01 00:47:58 -07:00			`}`
[mlir][SCFToGPU] Remove conversions from scf.for to gpu.launch. 2020-06-01 22:42:33 -07:00			`std::unique_ptr<OperationPass<FuncOp>> mlir::createAffineForToGPUPass() {`
[mlir][Pass] Move the registration of conversion passes to tablegen 2020-04-01 01:49:43 -07:00			`return std::make_unique<ForLoopMapper>();`
			`}`
Expose AffineToGPUPass for use with PassManager 2019-07-01 00:47:58 -07:00
[MLIR][GPU] Properly model step in parallel loop to gpu conversion. 2020-02-24 16:02:50 +01:00			`std::unique_ptr<Pass> mlir::createParallelLoopToGpuPass() {`
			`return std::make_unique<ParallelLoopToGpuPass>();`
			`}`