//===- LowerVectorIntrinsics.cpp ------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "llvm/Transforms/Utils/LowerVectorIntrinsics.h"
#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Operator.h"
#include "llvm/Support/Debug.h"
|
|
|
|
// Debug category name for this file; presumably consumed by the debug-output
// macros from llvm/Support/Debug.h (no use is visible in this file).
#define DEBUG_TYPE "lower-vector-intrinsics"
|
|
|
|
// Make names from the llvm namespace usable unqualified in the definitions
// below.
using namespace llvm;
|
|
|
|
/// Rewrite a call to a unary vector intrinsic as a loop that applies the
/// scalar overload of the same intrinsic to one element per iteration.
///
/// The block containing \p CI is split in front of \p CI and a new
/// single-block loop is placed between the two halves:
///
///   PreLoopBB  - computes the element count (constant for fixed vectors,
///                vscale * MinNumElements for scalable vectors)
///   LoopBB     - extracts element i, calls the scalar intrinsic, inserts the
///                result back at index i, and exits once i + 1 == count
///   PostLoopBB - the remainder of the original block
///
/// All uses of \p CI are replaced with the vector produced by the loop and
/// \p CI is erased.
///
/// \param M  Module in which the scalar intrinsic declaration is looked up or
///           created.
/// \param CI Call to lower. Its first argument must have a (fixed or
///           scalable) vector type; anything else trips the cast<> below.
/// \returns true unconditionally; the IR is always modified.
bool llvm::lowerUnaryVectorIntrinsicAsLoop(Module &M, CallInst *CI) {
  Value *SrcVec = CI->getArgOperand(0);
  auto *VecTy = cast<VectorType>(SrcVec->getType());

  BasicBlock *PreLoopBB = CI->getParent();
  Function *ParentFunc = PreLoopBB->getParent();
  LLVMContext &Ctx = PreLoopBB->getContext();

  // Split in front of the call, then reroute the branch that terminates
  // PreLoopBB so that control reaches PostLoopBB only through the new loop.
  BasicBlock *PostLoopBB = PreLoopBB->splitBasicBlock(CI);
  BasicBlock *LoopBB = BasicBlock::Create(Ctx, "", ParentFunc, PostLoopBB);
  PreLoopBB->getTerminator()->setSuccessor(0, LoopBB);

  // Loop preheader: materialize the number of elements to process.
  IRBuilder<> PreLoopBuilder(PreLoopBB->getTerminator());
  Type *Int64Ty = PreLoopBuilder.getInt64Ty();
  Value *LoopEnd = nullptr;
  if (auto *ScalableVecTy = dyn_cast<ScalableVectorType>(VecTy)) {
    // The element count is only known at run time: vscale * MinNumElements.
    Value *VScale = PreLoopBuilder.CreateVScale(ConstantInt::get(Int64Ty, 1));
    Value *N = ConstantInt::get(Int64Ty, ScalableVecTy->getMinNumElements());
    LoopEnd = PreLoopBuilder.CreateMul(VScale, N);
  } else {
    auto *FixedVecTy = cast<FixedVectorType>(VecTy);
    LoopEnd = ConstantInt::get(Int64Ty, FixedVecTy->getNumElements());
  }

  // Loop body.
  IRBuilder<> LoopBuilder(LoopBB);
  // A builder positioned on an empty block has no current debug location, so
  // give every instruction of the expansion the location of the call it
  // replaces (the preheader builder already inherits one from the terminator).
  LoopBuilder.SetCurrentDebugLocation(CI->getDebugLoc());

  PHINode *LoopIndex = LoopBuilder.CreatePHI(Int64Ty, 2);
  LoopIndex->addIncoming(ConstantInt::get(Int64Ty, 0U), PreLoopBB);
  // Carries the partially processed vector: elements below LoopIndex already
  // hold results, the rest still hold the original inputs.
  PHINode *Vec = LoopBuilder.CreatePHI(VecTy, 2);
  Vec->addIncoming(SrcVec, PreLoopBB);

  Value *Elem = LoopBuilder.CreateExtractElement(Vec, LoopIndex);
  Function *ScalarDecl = Intrinsic::getOrInsertDeclaration(
      &M, CI->getIntrinsicID(), VecTy->getElementType());
  CallInst *Res = LoopBuilder.CreateCall(ScalarDecl, Elem);
  // Preserve the fast-math flags of the vector call on each scalar call;
  // otherwise the lowering silently discards them. Both sides are checked
  // because the flag accessors assert on non floating-point operations.
  if (isa<FPMathOperator>(CI) && isa<FPMathOperator>(Res))
    Res->copyFastMathFlags(CI);
  Value *NewVec = LoopBuilder.CreateInsertElement(Vec, Res, LoopIndex);
  Vec->addIncoming(NewVec, LoopBB);

  Value *One = ConstantInt::get(Int64Ty, 1U);
  Value *NextLoopIndex = LoopBuilder.CreateAdd(LoopIndex, One);
  LoopIndex->addIncoming(NextLoopIndex, LoopBB);

  // Leave the loop once the incremented index reaches the element count.
  Value *ExitCond =
      LoopBuilder.CreateICmp(CmpInst::ICMP_EQ, NextLoopIndex, LoopEnd);
  LoopBuilder.CreateCondBr(ExitCond, PostLoopBB, LoopBB);

  // On loop exit NewVec holds a result in every lane and dominates
  // PostLoopBB, so it can stand in for the original call.
  CI->replaceAllUsesWith(NewVec);
  CI->eraseFromParent();
  return true;
}
|