This reverts commit a1d11348ab.
Two problems have been identified:
- The expansion for powi was functionally wrong - the second argument
stays scalar even when the first is a vector.
- AArch64 uses the Expand option on libcalls to select vector libcalls
in some cases. The test coverage for this uses -start-after which
happens to miss this pass.
63 lines
2.3 KiB
C++
63 lines
2.3 KiB
C++
//===- LowerVectorIntrinsics.cpp ------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/Transforms/Utils/LowerVectorIntrinsics.h"
|
|
#include "llvm/IR/IRBuilder.h"
|
|
#include "llvm/IR/Module.h"
|
|
|
|
#define DEBUG_TYPE "lower-vector-intrinsics"
|
|
|
|
using namespace llvm;
|
|
|
|
/// Rewrite the vector intrinsic call \p CI as an explicit loop that invokes
/// the same intrinsic, overloaded on the vector's element type, once per lane.
///
/// The block containing \p CI is split at \p CI and a new single-block loop is
/// placed between the two halves. On each iteration the loop extracts one lane
/// from a running vector (seeded with operand 0 of \p CI), calls the scalar
/// intrinsic on it, and inserts the result back into the same lane. The exit
/// test sits at the bottom of the loop, so the body always runs at least once.
/// Afterwards every use of \p CI is redirected to the vector produced by the
/// loop and \p CI is erased.
///
/// NOTE(review): because the running vector is seeded with the operand and
/// also used as the replacement for \p CI, this appears to assume the call's
/// result type equals its operand type -- confirm against callers.
///
/// \param M  Module in which the scalar intrinsic declaration is looked up or
///           inserted, and whose DataLayout supplies the loop index type.
/// \param CI Call to expand; operand 0 must have vector type (enforced by
///           cast<>).
/// \returns Always true.
bool llvm::lowerUnaryVectorIntrinsicAsLoop(Module &M, CallInst *CI) {
  Value *Input = CI->getArgOperand(0);
  auto *VecTy = cast<VectorType>(Input->getType());

  BasicBlock *HeadBB = CI->getParent();
  LLVMContext &Ctx = HeadBB->getContext();
  // Loop counter uses the DataLayout's index type for address space 0.
  Type *IdxTy = M.getDataLayout().getIndexType(Ctx, 0);

  // Carve the CFG into Head -> Body -> Tail, where Tail begins at CI. The
  // branch left behind by the split is retargeted at the (still empty) body.
  BasicBlock *TailBB = HeadBB->splitBasicBlock(CI);
  BasicBlock *BodyBB =
      BasicBlock::Create(Ctx, "", HeadBB->getParent(), TailBB);
  Instruction *HeadTerm = HeadBB->getTerminator();
  HeadTerm->setSuccessor(0, BodyBB);

  // Preheader: materialise the number of lanes just before the branch.
  IRBuilder<> HeadBuilder(HeadTerm);
  Value *TripCount =
      HeadBuilder.CreateElementCount(IdxTy, VecTy->getElementCount());

  // Body: two PHIs carry the lane index and the partially rewritten vector.
  IRBuilder<> BodyBuilder(BodyBB);

  PHINode *Lane = BodyBuilder.CreatePHI(IdxTy, 2);
  Lane->addIncoming(ConstantInt::get(IdxTy, 0U), HeadBB);
  PHINode *Acc = BodyBuilder.CreatePHI(VecTy, 2);
  Acc->addIncoming(Input, HeadBB);

  // Apply the element-typed overload of the intrinsic to the current lane and
  // write the result back into that lane.
  Value *Scalar = BodyBuilder.CreateExtractElement(Acc, Lane);
  Type *ElemTy = VecTy->getElementType();
  Function *ScalarFn =
      Intrinsic::getOrInsertDeclaration(&M, CI->getIntrinsicID(), ElemTy);
  Value *ScalarRes = BodyBuilder.CreateCall(ScalarFn, Scalar);
  Value *Updated = BodyBuilder.CreateInsertElement(Acc, ScalarRes, Lane);
  Acc->addIncoming(Updated, BodyBB);

  // Advance the lane index; leave the loop once it reaches the lane count.
  Value *NextLane = BodyBuilder.CreateAdd(Lane, ConstantInt::get(IdxTy, 1U));
  Lane->addIncoming(NextLane, BodyBB);

  Value *Done = BodyBuilder.CreateICmpEQ(NextLane, TripCount);
  BodyBuilder.CreateCondBr(Done, TailBB, BodyBB);

  // The vector produced by the loop stands in for the original call.
  CI->replaceAllUsesWith(Updated);
  CI->eraseFromParent();
  return true;
}
|