Files
llvm-project/mlir/lib/Transforms/LoopUnroll.cpp
T

192 lines
7.1 KiB
C++
Raw Normal View History

//===- LoopUnroll.cpp - Code to perform loop unrolling --------------------===//
//
// Copyright 2019 The MLIR Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
//
// This file implements loop unrolling.
//
//===----------------------------------------------------------------------===//
#include "mlir/Transforms/Passes.h"
#include "mlir/Analysis/LoopAnalysis.h"
#include "mlir/Dialect/AffineOps/AffineOps.h"
#include "mlir/IR/AffineExpr.h"
#include "mlir/IR/AffineMap.h"
2018-07-24 20:01:16 -07:00
#include "mlir/IR/Builders.h"
2019-02-19 17:17:46 -08:00
#include "mlir/Pass/Pass.h"
#include "mlir/Transforms/LoopUtils.h"
#include "llvm/ADT/DenseMap.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/Debug.h"
2018-07-24 20:01:16 -07:00
using namespace mlir;
// Tag for this pass; also used below to build the name of the option category.
#define DEBUG_TYPE "affine-loop-unroll"
// Category grouping the command-line options declared in this file; its name
// is the string "affine-loop-unroll options".
static llvm::cl::OptionCategory clOptionsCategory(DEBUG_TYPE " options");
// "unroll-factor": when it occurs on the command line, loops are unrolled by
// this factor, unless a callback or a factor passed to the pass constructor
// takes precedence (see LoopUnroll::runOnAffineForOp).
static llvm::cl::opt<unsigned> clUnrollFactor(
"unroll-factor",
llvm::cl::desc("Use this unroll factor for all loops being unrolled"),
llvm::cl::cat(clOptionsCategory));
// "unroll-full": requests complete unrolling. Note that the pass only checks
// whether the flag occurs on the command line, not the boolean value given.
static llvm::cl::opt<bool> clUnrollFull("unroll-full",
llvm::cl::desc("Fully unroll loops"),
llvm::cl::cat(clOptionsCategory));
// "unroll-num-reps": how many times the gather-and-unroll step over innermost
// loops is repeated; a single repetition is used when the flag is absent.
static llvm::cl::opt<unsigned> clUnrollNumRepetitions(
"unroll-num-reps",
llvm::cl::desc("Unroll innermost loops repeatedly this many times"),
llvm::cl::cat(clOptionsCategory));
// "unroll-full-threshold" (hidden option): only consulted when "unroll-full"
// is also present, in which case every loop whose constant trip count is less
// than or equal to this value is fully unrolled.
static llvm::cl::opt<unsigned> clUnrollFullThreshold(
"unroll-full-threshold", llvm::cl::Hidden,
llvm::cl::desc(
"Unroll all loops with trip count less than or equal to this"),
llvm::cl::cat(clOptionsCategory));
2018-07-24 20:01:16 -07:00
namespace {
/// Pass that unrolls 'affine.for' loops of a function.
///
/// In its normal mode the pass repeatedly collects the innermost loops and
/// unrolls each of them. When both the full-unroll flag and a full-unroll
/// threshold are given on the command line, it instead fully unrolls every
/// loop whose constant trip count is less than or equal to that threshold;
/// this second mode exists for testing, in particular for exercising the
/// unrolling of outer loops.
struct LoopUnroll : public FunctionPass<LoopUnroll> {
  /// Factor applied when no callback, argument, or command-line option selects
  /// a different behavior.
  static const unsigned kDefaultUnrollFactor = 4;

  /// All arguments are optional: an absent `unrollFactor` / `unrollFull`
  /// defers to the command-line options, and a null `getUnrollFactor` disables
  /// the per-loop callback.
  explicit LoopUnroll(
      Optional<unsigned> unrollFactor = None, Optional<bool> unrollFull = None,
      const std::function<unsigned(AffineForOp)> &getUnrollFactor = nullptr)
      : unrollFactor(unrollFactor), unrollFull(unrollFull),
        getUnrollFactor(getUnrollFactor) {}

  /// Entry point: runs the pass over the current function.
  void runOnFunction() override;

  /// Unrolls a single 'affine.for' op; yields failure when nothing was done.
  LogicalResult runOnAffineForOp(AffineForOp forOp);

  /// Unroll factor supplied at construction, if any.
  const Optional<unsigned> unrollFactor;

  /// Full-unroll request supplied at construction, if any.
  const Optional<bool> unrollFull;

  /// Per-loop unroll factor callback. When it holds a callable target it wins
  /// over both the constructor arguments and the command-line options.
  const std::function<unsigned(AffineForOp)> getUnrollFactor;
};
} // end anonymous namespace
2018-07-24 20:01:16 -07:00
void LoopUnroll::runOnFunction() {
2018-07-27 10:58:14 -07:00
// Gathers all innermost loops through a post order pruned walk.
struct InnermostLoopGatherer {
2018-07-27 10:58:14 -07:00
// Store innermost loops as we walk.
std::vector<AffineForOp> loops;
2018-07-27 10:58:14 -07:00
2019-07-09 16:17:55 -07:00
void walkPostOrder(FuncOp f) {
2019-07-01 10:29:09 -07:00
for (auto &b : f)
walkPostOrder(b.begin(), b.end());
}
bool walkPostOrder(Block::iterator Start, Block::iterator End) {
bool hasInnerLoops = false;
// We need to walk all elements since all innermost loops need to be
// gathered as opposed to determining whether this list has any inner
// loops or not.
2018-07-27 10:58:14 -07:00
while (Start != End)
hasInnerLoops |= walkPostOrder(&(*Start++));
return hasInnerLoops;
2018-07-24 20:01:16 -07:00
}
bool walkPostOrder(Operation *opInst) {
bool hasInnerLoops = false;
2019-03-14 10:38:44 -07:00
for (auto &region : opInst->getRegions())
for (auto &block : region)
hasInnerLoops |= walkPostOrder(block.begin(), block.end());
2019-05-11 18:59:54 -07:00
if (isa<AffineForOp>(opInst)) {
if (!hasInnerLoops)
2019-05-11 17:57:32 -07:00
loops.push_back(cast<AffineForOp>(opInst));
return true;
}
return hasInnerLoops;
}
};
if (clUnrollFull.getNumOccurrences() > 0 &&
clUnrollFullThreshold.getNumOccurrences() > 0) {
// Store short loops as we walk.
std::vector<AffineForOp> loops;
// Gathers all loops with trip count <= minTripCount. Do a post order walk
// so that loops are gathered from innermost to outermost (or else unrolling
// an outer one may delete gathered inner ones).
2019-08-29 13:04:22 -07:00
getFunction().walk([&](AffineForOp forOp) {
Optional<uint64_t> tripCount = getConstantTripCount(forOp);
if (tripCount.hasValue() && tripCount.getValue() <= clUnrollFullThreshold)
loops.push_back(forOp);
});
for (auto forOp : loops)
loopUnrollFull(forOp);
return;
}
unsigned numRepetitions = clUnrollNumRepetitions.getNumOccurrences() > 0
? clUnrollNumRepetitions
: 1;
// If the call back is provided, we will recurse until no loops are found.
2019-07-09 16:17:55 -07:00
FuncOp func = getFunction();
for (unsigned i = 0; i < numRepetitions || getUnrollFactor; i++) {
InnermostLoopGatherer ilg;
2019-07-01 10:29:09 -07:00
ilg.walkPostOrder(func);
auto &loops = ilg.loops;
if (loops.empty())
break;
bool unrolled = false;
for (auto forOp : loops)
unrolled |= succeeded(runOnAffineForOp(forOp));
if (!unrolled)
// Break out if nothing was unrolled.
break;
}
2018-08-06 18:40:34 -07:00
}
/// Unrolls one 'affine.for' op and reports whether the unrolling utility
/// succeeded (success) or did nothing (failure).
///
/// The way to unroll is chosen from the first source that applies:
///   1. the per-loop factor callback,
///   2. the factor passed to the pass constructor,
///   3. the "unroll-factor" command-line option,
///   4. a full-unroll request (command line or constructor),
///   5. the default factor of 4.
LogicalResult LoopUnroll::runOnAffineForOp(AffineForOp forOp) {
  // 1. A callback, when present, decides the factor for this loop.
  if (getUnrollFactor)
    return loopUnrollByFactor(forOp, getUnrollFactor(forOp));

  // 2./3. An explicit factor; the constructor argument beats the command
  // line.
  const bool factorFromCaller = unrollFactor.hasValue();
  const bool factorFromCmdLine = clUnrollFactor.getNumOccurrences() > 0;
  if (factorFromCaller || factorFromCmdLine) {
    const unsigned factor = factorFromCaller
                                ? unrollFactor.getValue()
                                : static_cast<unsigned>(clUnrollFactor);
    return loopUnrollByFactor(forOp, factor);
  }

  // 4. Complete unrolling. For the command-line flag only its presence is
  // checked; the constructor argument must be present and true.
  const bool fullFromCmdLine = clUnrollFull.getNumOccurrences() > 0;
  const bool fullFromCaller = unrollFull.hasValue() && unrollFull.getValue();
  if (fullFromCmdLine || fullFromCaller)
    return loopUnrollFull(forOp);

  // 5. Nothing was requested: fall back to the default factor.
  return loopUnrollByFactor(forOp, kDefaultUnrollFactor);
}
/// Creates a loop unrolling pass instance.
///
/// `unrollFactor` and `unrollFull` use -1 as the "not specified" sentinel; any
/// other value is forwarded to the pass (as an unsigned factor and as a
/// boolean, respectively). `getUnrollFactor` is forwarded unchanged.
std::unique_ptr<OpPassBase<FuncOp>> mlir::createLoopUnrollPass(
    int unrollFactor, int unrollFull,
    const std::function<unsigned(AffineForOp)> &getUnrollFactor) {
  // Default-constructed optionals hold no value, which is what -1 maps to.
  Optional<unsigned> factorArg;
  if (unrollFactor != -1)
    factorArg = static_cast<unsigned>(unrollFactor);

  Optional<bool> fullArg;
  if (unrollFull != -1)
    fullArg = (unrollFull != 0);

  return std::make_unique<LoopUnroll>(factorArg, fullArg, getUnrollFactor);
}
// Static registration object that associates the LoopUnroll pass with the
// name "affine-loop-unroll" and the description "Unroll loops".
static PassRegistration<LoopUnroll> pass("affine-loop-unroll", "Unroll loops");