Make this dependent only on the minsize attribute and drop the pipeline handling. Rename the enable-loop-header-duplication option to enable-loop-header-duplication-at-minsize to clarify that it controls header duplication at minsize only (in other cases it is enabled by default, independently of this option).
108 lines
4.2 KiB
C++
108 lines
4.2 KiB
C++
//===- LoopRotation.cpp - Loop Rotation Pass ------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements Loop Rotation Pass.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/Transforms/Scalar/LoopRotation.h"
|
|
#include "llvm/Analysis/AssumptionCache.h"
|
|
#include "llvm/Analysis/InstructionSimplify.h"
|
|
#include "llvm/Analysis/LazyBlockFrequencyInfo.h"
|
|
#include "llvm/Analysis/LoopInfo.h"
|
|
#include "llvm/Analysis/LoopPass.h"
|
|
#include "llvm/Analysis/MemorySSA.h"
|
|
#include "llvm/Analysis/MemorySSAUpdater.h"
|
|
#include "llvm/Analysis/ScalarEvolution.h"
|
|
#include "llvm/Analysis/TargetTransformInfo.h"
|
|
#include "llvm/Support/CommandLine.h"
|
|
#include "llvm/Transforms/Scalar.h"
|
|
#include "llvm/Transforms/Utils/LoopRotationUtils.h"
|
|
#include "llvm/Transforms/Utils/LoopUtils.h"
|
|
#include <optional>
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "loop-rotate"
|
|
|
|
static cl::opt<unsigned> DefaultRotationThreshold(
|
|
"rotation-max-header-size", cl::init(16), cl::Hidden,
|
|
cl::desc("The default maximum header size for automatic loop rotation"));
|
|
|
|
static cl::opt<bool> PrepareForLTOOption(
|
|
"rotation-prepare-for-lto", cl::init(false), cl::Hidden,
|
|
cl::desc("Run loop-rotation in the prepare-for-lto stage. This option "
|
|
"should be used for testing only."));
|
|
|
|
// Experimentally allow loop header duplication. This should allow for better
|
|
// optimization at Oz, since loop-idiom recognition can then recognize things
|
|
// like memcpy. If this ends up being useful for many targets, we should drop
|
|
// this flag and make a code generation option that can be controlled
|
|
// independent of the opt level and exposed through the frontend.
|
|
static cl::opt<bool> EnableLoopHeaderDuplicationAtMinSize(
|
|
"enable-loop-header-duplication-at-minsize", cl::init(false), cl::Hidden,
|
|
cl::desc("Enable loop header duplication even for minsize"));
|
|
|
|
LoopRotatePass::LoopRotatePass(bool EnableHeaderDuplication, bool PrepareForLTO,
|
|
bool CheckExitCount)
|
|
: EnableHeaderDuplication(EnableHeaderDuplication),
|
|
PrepareForLTO(PrepareForLTO), CheckExitCount(CheckExitCount) {}
|
|
|
|
void LoopRotatePass::printPipeline(
|
|
raw_ostream &OS, function_ref<StringRef(StringRef)> MapClassName2PassName) {
|
|
static_cast<PassInfoMixin<LoopRotatePass> *>(this)->printPipeline(
|
|
OS, MapClassName2PassName);
|
|
OS << "<";
|
|
if (!EnableHeaderDuplication)
|
|
OS << "no-";
|
|
OS << "header-duplication;";
|
|
|
|
if (!PrepareForLTO)
|
|
OS << "no-";
|
|
OS << "prepare-for-lto;";
|
|
|
|
if (!CheckExitCount)
|
|
OS << "no-";
|
|
OS << "check-exit-count";
|
|
OS << ">";
|
|
}
|
|
|
|
PreservedAnalyses LoopRotatePass::run(Loop &L, LoopAnalysisManager &AM,
|
|
LoopStandardAnalysisResults &AR,
|
|
LPMUpdater &) {
|
|
// Vectorization requires loop-rotation. Use default threshold for loops the
|
|
// user explicitly marked for vectorization, even when header duplication is
|
|
// disabled.
|
|
int Threshold = EnableHeaderDuplication &&
|
|
(!L.getHeader()->getParent()->hasMinSize() ||
|
|
EnableLoopHeaderDuplicationAtMinSize ||
|
|
hasVectorizeTransformation(&L) == TM_ForcedByUser)
|
|
? DefaultRotationThreshold
|
|
: 0;
|
|
const DataLayout &DL = L.getHeader()->getDataLayout();
|
|
const SimplifyQuery SQ = getBestSimplifyQuery(AR, DL);
|
|
|
|
std::optional<MemorySSAUpdater> MSSAU;
|
|
if (AR.MSSA)
|
|
MSSAU = MemorySSAUpdater(AR.MSSA);
|
|
bool Changed =
|
|
LoopRotation(&L, &AR.LI, &AR.TTI, &AR.AC, &AR.DT, &AR.SE,
|
|
MSSAU ? &*MSSAU : nullptr, SQ, false, Threshold, false,
|
|
PrepareForLTO || PrepareForLTOOption, CheckExitCount);
|
|
|
|
if (!Changed)
|
|
return PreservedAnalyses::all();
|
|
|
|
if (AR.MSSA && VerifyMemorySSA)
|
|
AR.MSSA->verifyMemorySSA();
|
|
|
|
auto PA = getLoopPassPreservedAnalyses();
|
|
if (AR.MSSA)
|
|
PA.preserve<MemorySSAAnalysis>();
|
|
return PA;
|
|
}
|