
This Change adds support for two SiFive vendor attributes in clang: - "SiFive-CLIC-preemptible" - "SiFive-CLIC-stack-swap" These can be given together, and can be combined with "machine", but cannot be combined with any other interrupt attribute values. These are handled primarily in RISCVFrameLowering: - "SiFive-CLIC-stack-swap" entails swapping `sp` with `sf.mscratchcsw` at function entry and exit, which holds the trap stack pointer. - "SiFive-CLIC-preemptible" entails saving `mcause` and `mepc` before re-enabling interrupts using `mstatus`. To save these, `s0` and `s1` are first spilled to the stack, and then the values are read into these registers. If these registers are used in the function, their values will be spilled a second time onto the stack with the generic callee-saved-register handling. At the end of the function interrupts are disabled again before `mepc` and `mcause` are restored. This Change also adds support for the following two experimental extensions, which only contain CSRs: - XSfsclic - for SiFive's CLIC Supervisor-Mode CSRs - XSfmclic - for SiFive's CLIC Machine-Mode CSRs The latter is needed for interrupt support. The CFI information for this implementation is not correct, but I'd prefer to correct this in a follow-up. While it's unlikely anyone wants to unwind through a handler, the CFI information is also used by debuggers so it would be good to get it right. Co-authored-by: Ana Pazos <apazos@quicinc.com>
878 lines
33 KiB
C++
878 lines
33 KiB
C++
//===- RISCV.cpp ----------------------------------------------------------===//
|
||
//
|
||
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||
// See https://llvm.org/LICENSE.txt for license information.
|
||
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||
//
|
||
//===----------------------------------------------------------------------===//
|
||
|
||
#include "ABIInfoImpl.h"
|
||
#include "TargetInfo.h"
|
||
#include "llvm/TargetParser/RISCVTargetParser.h"
|
||
|
||
using namespace clang;
|
||
using namespace clang::CodeGen;
|
||
|
||
//===----------------------------------------------------------------------===//
|
||
// RISC-V ABI Implementation
|
||
//===----------------------------------------------------------------------===//
|
||
|
||
namespace {
|
||
class RISCVABIInfo : public DefaultABIInfo {
|
||
private:
|
||
// Size of the integer ('x') registers in bits.
|
||
unsigned XLen;
|
||
// Size of the floating point ('f') registers in bits. Note that the target
|
||
// ISA might have a wider FLen than the selected ABI (e.g. an RV32IF target
|
||
// with soft float ABI has FLen==0).
|
||
unsigned FLen;
|
||
const int NumArgGPRs;
|
||
const int NumArgFPRs;
|
||
const bool EABI;
|
||
bool detectFPCCEligibleStructHelper(QualType Ty, CharUnits CurOff,
|
||
llvm::Type *&Field1Ty,
|
||
CharUnits &Field1Off,
|
||
llvm::Type *&Field2Ty,
|
||
CharUnits &Field2Off) const;
|
||
|
||
bool detectVLSCCEligibleStruct(QualType Ty, unsigned ABIVLen,
|
||
llvm::Type *&VLSType) const;
|
||
|
||
public:
|
||
RISCVABIInfo(CodeGen::CodeGenTypes &CGT, unsigned XLen, unsigned FLen,
|
||
bool EABI)
|
||
: DefaultABIInfo(CGT), XLen(XLen), FLen(FLen), NumArgGPRs(EABI ? 6 : 8),
|
||
NumArgFPRs(FLen != 0 ? 8 : 0), EABI(EABI) {}
|
||
|
||
// DefaultABIInfo's classifyReturnType and classifyArgumentType are
|
||
// non-virtual, but computeInfo is virtual, so we overload it.
|
||
void computeInfo(CGFunctionInfo &FI) const override;
|
||
|
||
ABIArgInfo classifyArgumentType(QualType Ty, bool IsFixed, int &ArgGPRsLeft,
|
||
int &ArgFPRsLeft, unsigned ABIVLen) const;
|
||
ABIArgInfo classifyReturnType(QualType RetTy, unsigned ABIVLen) const;
|
||
|
||
RValue EmitVAArg(CodeGenFunction &CGF, Address VAListAddr, QualType Ty,
|
||
AggValueSlot Slot) const override;
|
||
|
||
ABIArgInfo extendType(QualType Ty, llvm::Type *CoerceTy = nullptr) const;
|
||
|
||
bool detectFPCCEligibleStruct(QualType Ty, llvm::Type *&Field1Ty,
|
||
CharUnits &Field1Off, llvm::Type *&Field2Ty,
|
||
CharUnits &Field2Off, int &NeededArgGPRs,
|
||
int &NeededArgFPRs) const;
|
||
ABIArgInfo coerceAndExpandFPCCEligibleStruct(llvm::Type *Field1Ty,
|
||
CharUnits Field1Off,
|
||
llvm::Type *Field2Ty,
|
||
CharUnits Field2Off) const;
|
||
|
||
ABIArgInfo coerceVLSVector(QualType Ty, unsigned ABIVLen = 0) const;
|
||
|
||
using ABIInfo::appendAttributeMangling;
|
||
void appendAttributeMangling(TargetClonesAttr *Attr, unsigned Index,
|
||
raw_ostream &Out) const override;
|
||
void appendAttributeMangling(StringRef AttrStr,
|
||
raw_ostream &Out) const override;
|
||
};
|
||
} // end anonymous namespace
|
||
|
||
void RISCVABIInfo::appendAttributeMangling(TargetClonesAttr *Attr,
|
||
unsigned Index,
|
||
raw_ostream &Out) const {
|
||
appendAttributeMangling(Attr->getFeatureStr(Index), Out);
|
||
}
|
||
|
||
void RISCVABIInfo::appendAttributeMangling(StringRef AttrStr,
|
||
raw_ostream &Out) const {
|
||
if (AttrStr == "default") {
|
||
Out << ".default";
|
||
return;
|
||
}
|
||
|
||
Out << '.';
|
||
|
||
SmallVector<StringRef, 8> Attrs;
|
||
AttrStr.split(Attrs, ';');
|
||
|
||
// Only consider the arch string.
|
||
StringRef ArchStr;
|
||
for (auto &Attr : Attrs) {
|
||
if (Attr.starts_with("arch="))
|
||
ArchStr = Attr;
|
||
}
|
||
|
||
// Extract features string.
|
||
SmallVector<StringRef, 8> Features;
|
||
ArchStr.consume_front("arch=");
|
||
ArchStr.split(Features, ',');
|
||
|
||
llvm::stable_sort(Features);
|
||
|
||
for (auto Feat : Features) {
|
||
Feat.consume_front("+");
|
||
Out << "_" << Feat;
|
||
}
|
||
}
|
||
|
||
void RISCVABIInfo::computeInfo(CGFunctionInfo &FI) const {
|
||
unsigned ABIVLen;
|
||
switch (FI.getExtInfo().getCC()) {
|
||
default:
|
||
ABIVLen = 0;
|
||
break;
|
||
#define CC_VLS_CASE(ABI_VLEN) \
|
||
case CallingConv::CC_RISCVVLSCall_##ABI_VLEN: \
|
||
ABIVLen = ABI_VLEN; \
|
||
break;
|
||
CC_VLS_CASE(32)
|
||
CC_VLS_CASE(64)
|
||
CC_VLS_CASE(128)
|
||
CC_VLS_CASE(256)
|
||
CC_VLS_CASE(512)
|
||
CC_VLS_CASE(1024)
|
||
CC_VLS_CASE(2048)
|
||
CC_VLS_CASE(4096)
|
||
CC_VLS_CASE(8192)
|
||
CC_VLS_CASE(16384)
|
||
CC_VLS_CASE(32768)
|
||
CC_VLS_CASE(65536)
|
||
#undef CC_VLS_CASE
|
||
}
|
||
QualType RetTy = FI.getReturnType();
|
||
if (!getCXXABI().classifyReturnType(FI))
|
||
FI.getReturnInfo() = classifyReturnType(RetTy, ABIVLen);
|
||
|
||
// IsRetIndirect is true if classifyArgumentType indicated the value should
|
||
// be passed indirect, or if the type size is a scalar greater than 2*XLen
|
||
// and not a complex type with elements <= FLen. e.g. fp128 is passed direct
|
||
// in LLVM IR, relying on the backend lowering code to rewrite the argument
|
||
// list and pass indirectly on RV32.
|
||
bool IsRetIndirect = FI.getReturnInfo().getKind() == ABIArgInfo::Indirect;
|
||
if (!IsRetIndirect && RetTy->isScalarType() &&
|
||
getContext().getTypeSize(RetTy) > (2 * XLen)) {
|
||
if (RetTy->isComplexType() && FLen) {
|
||
QualType EltTy = RetTy->castAs<ComplexType>()->getElementType();
|
||
IsRetIndirect = getContext().getTypeSize(EltTy) > FLen;
|
||
} else {
|
||
// This is a normal scalar > 2*XLen, such as fp128 on RV32.
|
||
IsRetIndirect = true;
|
||
}
|
||
}
|
||
|
||
int ArgGPRsLeft = IsRetIndirect ? NumArgGPRs - 1 : NumArgGPRs;
|
||
int ArgFPRsLeft = NumArgFPRs;
|
||
int NumFixedArgs = FI.getNumRequiredArgs();
|
||
|
||
int ArgNum = 0;
|
||
for (auto &ArgInfo : FI.arguments()) {
|
||
bool IsFixed = ArgNum < NumFixedArgs;
|
||
ArgInfo.info = classifyArgumentType(ArgInfo.type, IsFixed, ArgGPRsLeft,
|
||
ArgFPRsLeft, ABIVLen);
|
||
ArgNum++;
|
||
}
|
||
}
|
||
|
||
// Returns true if the struct is a potential candidate for the floating point
|
||
// calling convention. If this function returns true, the caller is
|
||
// responsible for checking that if there is only a single field then that
|
||
// field is a float.
|
||
bool RISCVABIInfo::detectFPCCEligibleStructHelper(QualType Ty, CharUnits CurOff,
|
||
llvm::Type *&Field1Ty,
|
||
CharUnits &Field1Off,
|
||
llvm::Type *&Field2Ty,
|
||
CharUnits &Field2Off) const {
|
||
bool IsInt = Ty->isIntegralOrEnumerationType();
|
||
bool IsFloat = Ty->isRealFloatingType();
|
||
|
||
if (IsInt || IsFloat) {
|
||
uint64_t Size = getContext().getTypeSize(Ty);
|
||
if (IsInt && Size > XLen)
|
||
return false;
|
||
// Can't be eligible if larger than the FP registers. Handling of half
|
||
// precision values has been specified in the ABI, so don't block those.
|
||
if (IsFloat && Size > FLen)
|
||
return false;
|
||
// Can't be eligible if an integer type was already found (int+int pairs
|
||
// are not eligible).
|
||
if (IsInt && Field1Ty && Field1Ty->isIntegerTy())
|
||
return false;
|
||
if (!Field1Ty) {
|
||
Field1Ty = CGT.ConvertType(Ty);
|
||
Field1Off = CurOff;
|
||
return true;
|
||
}
|
||
if (!Field2Ty) {
|
||
Field2Ty = CGT.ConvertType(Ty);
|
||
Field2Off = CurOff;
|
||
return true;
|
||
}
|
||
return false;
|
||
}
|
||
|
||
if (auto CTy = Ty->getAs<ComplexType>()) {
|
||
if (Field1Ty)
|
||
return false;
|
||
QualType EltTy = CTy->getElementType();
|
||
if (getContext().getTypeSize(EltTy) > FLen)
|
||
return false;
|
||
Field1Ty = CGT.ConvertType(EltTy);
|
||
Field1Off = CurOff;
|
||
Field2Ty = Field1Ty;
|
||
Field2Off = Field1Off + getContext().getTypeSizeInChars(EltTy);
|
||
return true;
|
||
}
|
||
|
||
if (const ConstantArrayType *ATy = getContext().getAsConstantArrayType(Ty)) {
|
||
uint64_t ArraySize = ATy->getZExtSize();
|
||
QualType EltTy = ATy->getElementType();
|
||
// Non-zero-length arrays of empty records make the struct ineligible for
|
||
// the FP calling convention in C++.
|
||
if (const auto *RTy = EltTy->getAs<RecordType>()) {
|
||
if (ArraySize != 0 && isa<CXXRecordDecl>(RTy->getDecl()) &&
|
||
isEmptyRecord(getContext(), EltTy, true, true))
|
||
return false;
|
||
}
|
||
CharUnits EltSize = getContext().getTypeSizeInChars(EltTy);
|
||
for (uint64_t i = 0; i < ArraySize; ++i) {
|
||
bool Ret = detectFPCCEligibleStructHelper(EltTy, CurOff, Field1Ty,
|
||
Field1Off, Field2Ty, Field2Off);
|
||
if (!Ret)
|
||
return false;
|
||
CurOff += EltSize;
|
||
}
|
||
return true;
|
||
}
|
||
|
||
if (const auto *RTy = Ty->getAs<RecordType>()) {
|
||
// Structures with either a non-trivial destructor or a non-trivial
|
||
// copy constructor are not eligible for the FP calling convention.
|
||
if (getRecordArgABI(Ty, CGT.getCXXABI()))
|
||
return false;
|
||
if (isEmptyRecord(getContext(), Ty, true, true))
|
||
return true;
|
||
const RecordDecl *RD = RTy->getDecl();
|
||
// Unions aren't eligible unless they're empty (which is caught above).
|
||
if (RD->isUnion())
|
||
return false;
|
||
const ASTRecordLayout &Layout = getContext().getASTRecordLayout(RD);
|
||
// If this is a C++ record, check the bases first.
|
||
if (const CXXRecordDecl *CXXRD = dyn_cast<CXXRecordDecl>(RD)) {
|
||
for (const CXXBaseSpecifier &B : CXXRD->bases()) {
|
||
const auto *BDecl =
|
||
cast<CXXRecordDecl>(B.getType()->castAs<RecordType>()->getDecl());
|
||
CharUnits BaseOff = Layout.getBaseClassOffset(BDecl);
|
||
bool Ret = detectFPCCEligibleStructHelper(B.getType(), CurOff + BaseOff,
|
||
Field1Ty, Field1Off, Field2Ty,
|
||
Field2Off);
|
||
if (!Ret)
|
||
return false;
|
||
}
|
||
}
|
||
int ZeroWidthBitFieldCount = 0;
|
||
for (const FieldDecl *FD : RD->fields()) {
|
||
uint64_t FieldOffInBits = Layout.getFieldOffset(FD->getFieldIndex());
|
||
QualType QTy = FD->getType();
|
||
if (FD->isBitField()) {
|
||
unsigned BitWidth = FD->getBitWidthValue();
|
||
// Allow a bitfield with a type greater than XLen as long as the
|
||
// bitwidth is XLen or less.
|
||
if (getContext().getTypeSize(QTy) > XLen && BitWidth <= XLen)
|
||
QTy = getContext().getIntTypeForBitwidth(XLen, false);
|
||
if (BitWidth == 0) {
|
||
ZeroWidthBitFieldCount++;
|
||
continue;
|
||
}
|
||
}
|
||
|
||
bool Ret = detectFPCCEligibleStructHelper(
|
||
QTy, CurOff + getContext().toCharUnitsFromBits(FieldOffInBits),
|
||
Field1Ty, Field1Off, Field2Ty, Field2Off);
|
||
if (!Ret)
|
||
return false;
|
||
|
||
// As a quirk of the ABI, zero-width bitfields aren't ignored for fp+fp
|
||
// or int+fp structs, but are ignored for a struct with an fp field and
|
||
// any number of zero-width bitfields.
|
||
if (Field2Ty && ZeroWidthBitFieldCount > 0)
|
||
return false;
|
||
}
|
||
return Field1Ty != nullptr;
|
||
}
|
||
|
||
return false;
|
||
}
|
||
|
||
// Determine if a struct is eligible for passing according to the floating
|
||
// point calling convention (i.e., when flattened it contains a single fp
|
||
// value, fp+fp, or int+fp of appropriate size). If so, NeededArgFPRs and
|
||
// NeededArgGPRs are incremented appropriately.
|
||
bool RISCVABIInfo::detectFPCCEligibleStruct(QualType Ty, llvm::Type *&Field1Ty,
|
||
CharUnits &Field1Off,
|
||
llvm::Type *&Field2Ty,
|
||
CharUnits &Field2Off,
|
||
int &NeededArgGPRs,
|
||
int &NeededArgFPRs) const {
|
||
Field1Ty = nullptr;
|
||
Field2Ty = nullptr;
|
||
NeededArgGPRs = 0;
|
||
NeededArgFPRs = 0;
|
||
bool IsCandidate = detectFPCCEligibleStructHelper(
|
||
Ty, CharUnits::Zero(), Field1Ty, Field1Off, Field2Ty, Field2Off);
|
||
if (!Field1Ty)
|
||
return false;
|
||
// Not really a candidate if we have a single int but no float.
|
||
if (Field1Ty && !Field2Ty && !Field1Ty->isFloatingPointTy())
|
||
return false;
|
||
if (!IsCandidate)
|
||
return false;
|
||
if (Field1Ty && Field1Ty->isFloatingPointTy())
|
||
NeededArgFPRs++;
|
||
else if (Field1Ty)
|
||
NeededArgGPRs++;
|
||
if (Field2Ty && Field2Ty->isFloatingPointTy())
|
||
NeededArgFPRs++;
|
||
else if (Field2Ty)
|
||
NeededArgGPRs++;
|
||
return true;
|
||
}
|
||
|
||
// Call getCoerceAndExpand for the two-element flattened struct described by
|
||
// Field1Ty, Field1Off, Field2Ty, Field2Off. This method will create an
|
||
// appropriate coerceToType and unpaddedCoerceToType.
|
||
ABIArgInfo RISCVABIInfo::coerceAndExpandFPCCEligibleStruct(
|
||
llvm::Type *Field1Ty, CharUnits Field1Off, llvm::Type *Field2Ty,
|
||
CharUnits Field2Off) const {
|
||
SmallVector<llvm::Type *, 3> CoerceElts;
|
||
SmallVector<llvm::Type *, 2> UnpaddedCoerceElts;
|
||
if (!Field1Off.isZero())
|
||
CoerceElts.push_back(llvm::ArrayType::get(
|
||
llvm::Type::getInt8Ty(getVMContext()), Field1Off.getQuantity()));
|
||
|
||
CoerceElts.push_back(Field1Ty);
|
||
UnpaddedCoerceElts.push_back(Field1Ty);
|
||
|
||
if (!Field2Ty) {
|
||
return ABIArgInfo::getCoerceAndExpand(
|
||
llvm::StructType::get(getVMContext(), CoerceElts, !Field1Off.isZero()),
|
||
UnpaddedCoerceElts[0]);
|
||
}
|
||
|
||
CharUnits Field2Align =
|
||
CharUnits::fromQuantity(getDataLayout().getABITypeAlign(Field2Ty));
|
||
CharUnits Field1End = Field1Off +
|
||
CharUnits::fromQuantity(getDataLayout().getTypeStoreSize(Field1Ty));
|
||
CharUnits Field2OffNoPadNoPack = Field1End.alignTo(Field2Align);
|
||
|
||
CharUnits Padding = CharUnits::Zero();
|
||
if (Field2Off > Field2OffNoPadNoPack)
|
||
Padding = Field2Off - Field2OffNoPadNoPack;
|
||
else if (Field2Off != Field2Align && Field2Off > Field1End)
|
||
Padding = Field2Off - Field1End;
|
||
|
||
bool IsPacked = !Field2Off.isMultipleOf(Field2Align);
|
||
|
||
if (!Padding.isZero())
|
||
CoerceElts.push_back(llvm::ArrayType::get(
|
||
llvm::Type::getInt8Ty(getVMContext()), Padding.getQuantity()));
|
||
|
||
CoerceElts.push_back(Field2Ty);
|
||
UnpaddedCoerceElts.push_back(Field2Ty);
|
||
|
||
auto CoerceToType =
|
||
llvm::StructType::get(getVMContext(), CoerceElts, IsPacked);
|
||
auto UnpaddedCoerceToType =
|
||
llvm::StructType::get(getVMContext(), UnpaddedCoerceElts, IsPacked);
|
||
|
||
return ABIArgInfo::getCoerceAndExpand(CoerceToType, UnpaddedCoerceToType);
|
||
}
|
||
|
||
bool RISCVABIInfo::detectVLSCCEligibleStruct(QualType Ty, unsigned ABIVLen,
|
||
llvm::Type *&VLSType) const {
|
||
// No riscv_vls_cc attribute.
|
||
if (ABIVLen == 0)
|
||
return false;
|
||
|
||
// Legal struct for VLS calling convention should fulfill following rules:
|
||
// 1. Struct element should be either "homogeneous fixed-length vectors" or "a
|
||
// fixed-length vector array".
|
||
// 2. Number of struct elements or array elements should be greater or equal
|
||
// to 1 and less or equal to 8
|
||
// 3. Total number of vector registers needed should not exceed 8.
|
||
//
|
||
// Examples: Assume ABI_VLEN = 128.
|
||
// These are legal structs:
|
||
// a. Structs with 1~8 "same" fixed-length vectors, e.g.
|
||
// struct {
|
||
// __attribute__((vector_size(16))) int a;
|
||
// __attribute__((vector_size(16))) int b;
|
||
// }
|
||
//
|
||
// b. Structs with "single" fixed-length vector array with lengh 1~8, e.g.
|
||
// struct {
|
||
// __attribute__((vector_size(16))) int a[3];
|
||
// }
|
||
// These are illegal structs:
|
||
// a. Structs with 9 fixed-length vectors, e.g.
|
||
// struct {
|
||
// __attribute__((vector_size(16))) int a;
|
||
// __attribute__((vector_size(16))) int b;
|
||
// __attribute__((vector_size(16))) int c;
|
||
// __attribute__((vector_size(16))) int d;
|
||
// __attribute__((vector_size(16))) int e;
|
||
// __attribute__((vector_size(16))) int f;
|
||
// __attribute__((vector_size(16))) int g;
|
||
// __attribute__((vector_size(16))) int h;
|
||
// __attribute__((vector_size(16))) int i;
|
||
// }
|
||
//
|
||
// b. Structs with "multiple" fixed-length vector array, e.g.
|
||
// struct {
|
||
// __attribute__((vector_size(16))) int a[2];
|
||
// __attribute__((vector_size(16))) int b[2];
|
||
// }
|
||
//
|
||
// c. Vector registers needed exceeds 8, e.g.
|
||
// struct {
|
||
// // Registers needed for single fixed-length element:
|
||
// // 64 * 8 / ABI_VLEN = 4
|
||
// __attribute__((vector_size(64))) int a;
|
||
// __attribute__((vector_size(64))) int b;
|
||
// __attribute__((vector_size(64))) int c;
|
||
// __attribute__((vector_size(64))) int d;
|
||
// }
|
||
//
|
||
// Struct of 1 fixed-length vector is passed as a scalable vector.
|
||
// Struct of >1 fixed-length vectors are passed as vector tuple.
|
||
// Struct of 1 array of fixed-length vectors is passed as a scalable vector.
|
||
// Otherwise, pass the struct indirectly.
|
||
|
||
if (llvm::StructType *STy = dyn_cast<llvm::StructType>(CGT.ConvertType(Ty))) {
|
||
unsigned NumElts = STy->getStructNumElements();
|
||
if (NumElts > 8)
|
||
return false;
|
||
|
||
auto *FirstEltTy = STy->getElementType(0);
|
||
if (!STy->containsHomogeneousTypes())
|
||
return false;
|
||
|
||
// Check structure of fixed-length vectors and turn them into vector tuple
|
||
// type if legal.
|
||
if (auto *FixedVecTy = dyn_cast<llvm::FixedVectorType>(FirstEltTy)) {
|
||
if (NumElts == 1) {
|
||
// Handle single fixed-length vector.
|
||
VLSType = llvm::ScalableVectorType::get(
|
||
FixedVecTy->getElementType(),
|
||
llvm::divideCeil(FixedVecTy->getNumElements() *
|
||
llvm::RISCV::RVVBitsPerBlock,
|
||
ABIVLen));
|
||
// Check registers needed <= 8.
|
||
return llvm::divideCeil(
|
||
FixedVecTy->getNumElements() *
|
||
FixedVecTy->getElementType()->getScalarSizeInBits(),
|
||
ABIVLen) <= 8;
|
||
}
|
||
// LMUL
|
||
// = fixed-length vector size / ABIVLen
|
||
// = 8 * I8EltCount / RVVBitsPerBlock
|
||
// =>
|
||
// I8EltCount
|
||
// = (fixed-length vector size * RVVBitsPerBlock) / (ABIVLen * 8)
|
||
unsigned I8EltCount = llvm::divideCeil(
|
||
FixedVecTy->getNumElements() *
|
||
FixedVecTy->getElementType()->getScalarSizeInBits() *
|
||
llvm::RISCV::RVVBitsPerBlock,
|
||
ABIVLen * 8);
|
||
VLSType = llvm::TargetExtType::get(
|
||
getVMContext(), "riscv.vector.tuple",
|
||
llvm::ScalableVectorType::get(llvm::Type::getInt8Ty(getVMContext()),
|
||
I8EltCount),
|
||
NumElts);
|
||
// Check registers needed <= 8.
|
||
return NumElts *
|
||
llvm::divideCeil(
|
||
FixedVecTy->getNumElements() *
|
||
FixedVecTy->getElementType()->getScalarSizeInBits(),
|
||
ABIVLen) <=
|
||
8;
|
||
}
|
||
|
||
// If elements are not fixed-length vectors, it should be an array.
|
||
if (NumElts != 1)
|
||
return false;
|
||
|
||
// Check array of fixed-length vector and turn it into scalable vector type
|
||
// if legal.
|
||
if (auto *ArrTy = dyn_cast<llvm::ArrayType>(FirstEltTy)) {
|
||
unsigned NumArrElt = ArrTy->getNumElements();
|
||
if (NumArrElt > 8)
|
||
return false;
|
||
|
||
auto *ArrEltTy = dyn_cast<llvm::FixedVectorType>(ArrTy->getElementType());
|
||
if (!ArrEltTy)
|
||
return false;
|
||
|
||
// LMUL
|
||
// = NumArrElt * fixed-length vector size / ABIVLen
|
||
// = fixed-length vector elt size * ScalVecNumElts / RVVBitsPerBlock
|
||
// =>
|
||
// ScalVecNumElts
|
||
// = (NumArrElt * fixed-length vector size * RVVBitsPerBlock) /
|
||
// (ABIVLen * fixed-length vector elt size)
|
||
// = NumArrElt * num fixed-length vector elt * RVVBitsPerBlock /
|
||
// ABIVLen
|
||
unsigned ScalVecNumElts = llvm::divideCeil(
|
||
NumArrElt * ArrEltTy->getNumElements() * llvm::RISCV::RVVBitsPerBlock,
|
||
ABIVLen);
|
||
VLSType = llvm::ScalableVectorType::get(ArrEltTy->getElementType(),
|
||
ScalVecNumElts);
|
||
// Check registers needed <= 8.
|
||
return llvm::divideCeil(
|
||
ScalVecNumElts *
|
||
ArrEltTy->getElementType()->getScalarSizeInBits(),
|
||
llvm::RISCV::RVVBitsPerBlock) <= 8;
|
||
}
|
||
}
|
||
return false;
|
||
}
|
||
|
||
// Fixed-length RVV vectors are represented as scalable vectors in function
|
||
// args/return and must be coerced from fixed vectors.
|
||
ABIArgInfo RISCVABIInfo::coerceVLSVector(QualType Ty, unsigned ABIVLen) const {
|
||
assert(Ty->isVectorType() && "expected vector type!");
|
||
|
||
const auto *VT = Ty->castAs<VectorType>();
|
||
assert(VT->getElementType()->isBuiltinType() && "expected builtin type!");
|
||
|
||
auto VScale = getContext().getTargetInfo().getVScaleRange(
|
||
getContext().getLangOpts(), false);
|
||
|
||
unsigned NumElts = VT->getNumElements();
|
||
llvm::Type *EltType = llvm::Type::getInt1Ty(getVMContext());
|
||
switch (VT->getVectorKind()) {
|
||
case VectorKind::RVVFixedLengthMask_1:
|
||
break;
|
||
case VectorKind::RVVFixedLengthMask_2:
|
||
NumElts *= 2;
|
||
break;
|
||
case VectorKind::RVVFixedLengthMask_4:
|
||
NumElts *= 4;
|
||
break;
|
||
case VectorKind::RVVFixedLengthMask:
|
||
NumElts *= 8;
|
||
break;
|
||
default:
|
||
assert((VT->getVectorKind() == VectorKind::Generic ||
|
||
VT->getVectorKind() == VectorKind::RVVFixedLengthData) &&
|
||
"Unexpected vector kind");
|
||
EltType = CGT.ConvertType(VT->getElementType());
|
||
}
|
||
|
||
llvm::ScalableVectorType *ResType;
|
||
|
||
if (ABIVLen == 0) {
|
||
// The MinNumElts is simplified from equation:
|
||
// NumElts / VScale =
|
||
// (EltSize * NumElts / (VScale * RVVBitsPerBlock))
|
||
// * (RVVBitsPerBlock / EltSize)
|
||
ResType = llvm::ScalableVectorType::get(EltType, NumElts / VScale->first);
|
||
} else {
|
||
// Check registers needed <= 8.
|
||
if ((EltType->getScalarSizeInBits() * NumElts / ABIVLen) > 8)
|
||
return getNaturalAlignIndirect(
|
||
Ty, /*AddrSpace=*/getDataLayout().getAllocaAddrSpace(),
|
||
/*ByVal=*/false);
|
||
|
||
// Generic vector
|
||
// The number of elements needs to be at least 1.
|
||
ResType = llvm::ScalableVectorType::get(
|
||
EltType,
|
||
llvm::divideCeil(NumElts * llvm::RISCV::RVVBitsPerBlock, ABIVLen));
|
||
|
||
// If the corresponding extension is not supported, just make it an i8
|
||
// vector with same LMUL.
|
||
const TargetInfo &TI = getContext().getTargetInfo();
|
||
if ((EltType->isHalfTy() && !TI.hasFeature("zvfhmin")) ||
|
||
(EltType->isBFloatTy() && !TI.hasFeature("zvfbfmin")) ||
|
||
(EltType->isFloatTy() && !TI.hasFeature("zve32f")) ||
|
||
(EltType->isDoubleTy() && !TI.hasFeature("zve64d")) ||
|
||
(EltType->isIntegerTy(64) && !TI.hasFeature("zve64x")) ||
|
||
EltType->isIntegerTy(128)) {
|
||
// The number of elements needs to be at least 1.
|
||
ResType = llvm::ScalableVectorType::get(
|
||
llvm::Type::getInt8Ty(getVMContext()),
|
||
llvm::divideCeil(EltType->getScalarSizeInBits() * NumElts *
|
||
llvm::RISCV::RVVBitsPerBlock,
|
||
8 * ABIVLen));
|
||
}
|
||
}
|
||
|
||
return ABIArgInfo::getDirect(ResType);
|
||
}
|
||
|
||
ABIArgInfo RISCVABIInfo::classifyArgumentType(QualType Ty, bool IsFixed,
|
||
int &ArgGPRsLeft,
|
||
int &ArgFPRsLeft,
|
||
unsigned ABIVLen) const {
|
||
assert(ArgGPRsLeft <= NumArgGPRs && "Arg GPR tracking underflow");
|
||
Ty = useFirstFieldIfTransparentUnion(Ty);
|
||
|
||
// Structures with either a non-trivial destructor or a non-trivial
|
||
// copy constructor are always passed indirectly.
|
||
if (CGCXXABI::RecordArgABI RAA = getRecordArgABI(Ty, getCXXABI())) {
|
||
if (ArgGPRsLeft)
|
||
ArgGPRsLeft -= 1;
|
||
return getNaturalAlignIndirect(
|
||
Ty, /*AddrSpace=*/getDataLayout().getAllocaAddrSpace(),
|
||
/*ByVal=*/RAA == CGCXXABI::RAA_DirectInMemory);
|
||
}
|
||
|
||
uint64_t Size = getContext().getTypeSize(Ty);
|
||
|
||
// Ignore empty structs/unions whose size is zero. According to the calling
|
||
// convention empty structs/unions are required to be sized types in C++.
|
||
if (isEmptyRecord(getContext(), Ty, true) && Size == 0)
|
||
return ABIArgInfo::getIgnore();
|
||
|
||
// Pass floating point values via FPRs if possible.
|
||
if (IsFixed && Ty->isFloatingType() && !Ty->isComplexType() &&
|
||
FLen >= Size && ArgFPRsLeft) {
|
||
ArgFPRsLeft--;
|
||
return ABIArgInfo::getDirect();
|
||
}
|
||
|
||
// Complex types for the hard float ABI must be passed direct rather than
|
||
// using CoerceAndExpand.
|
||
if (IsFixed && Ty->isComplexType() && FLen && ArgFPRsLeft >= 2) {
|
||
QualType EltTy = Ty->castAs<ComplexType>()->getElementType();
|
||
if (getContext().getTypeSize(EltTy) <= FLen) {
|
||
ArgFPRsLeft -= 2;
|
||
return ABIArgInfo::getDirect();
|
||
}
|
||
}
|
||
|
||
if (IsFixed && FLen && Ty->isStructureOrClassType()) {
|
||
llvm::Type *Field1Ty = nullptr;
|
||
llvm::Type *Field2Ty = nullptr;
|
||
CharUnits Field1Off = CharUnits::Zero();
|
||
CharUnits Field2Off = CharUnits::Zero();
|
||
int NeededArgGPRs = 0;
|
||
int NeededArgFPRs = 0;
|
||
bool IsCandidate =
|
||
detectFPCCEligibleStruct(Ty, Field1Ty, Field1Off, Field2Ty, Field2Off,
|
||
NeededArgGPRs, NeededArgFPRs);
|
||
if (IsCandidate && NeededArgGPRs <= ArgGPRsLeft &&
|
||
NeededArgFPRs <= ArgFPRsLeft) {
|
||
ArgGPRsLeft -= NeededArgGPRs;
|
||
ArgFPRsLeft -= NeededArgFPRs;
|
||
return coerceAndExpandFPCCEligibleStruct(Field1Ty, Field1Off, Field2Ty,
|
||
Field2Off);
|
||
}
|
||
}
|
||
|
||
if (IsFixed && Ty->isStructureOrClassType()) {
|
||
llvm::Type *VLSType = nullptr;
|
||
if (detectVLSCCEligibleStruct(Ty, ABIVLen, VLSType))
|
||
return ABIArgInfo::getDirect(VLSType);
|
||
}
|
||
|
||
uint64_t NeededAlign = getContext().getTypeAlign(Ty);
|
||
// Determine the number of GPRs needed to pass the current argument
|
||
// according to the ABI. 2*XLen-aligned varargs are passed in "aligned"
|
||
// register pairs, so may consume 3 registers.
|
||
// TODO: To be compatible with GCC's behaviors, we don't align registers
|
||
// currently if we are using ILP32E calling convention. This behavior may be
|
||
// changed when RV32E/ILP32E is ratified.
|
||
int NeededArgGPRs = 1;
|
||
if (!IsFixed && NeededAlign == 2 * XLen)
|
||
NeededArgGPRs = 2 + (EABI && XLen == 32 ? 0 : (ArgGPRsLeft % 2));
|
||
else if (Size > XLen && Size <= 2 * XLen)
|
||
NeededArgGPRs = 2;
|
||
|
||
if (NeededArgGPRs > ArgGPRsLeft) {
|
||
NeededArgGPRs = ArgGPRsLeft;
|
||
}
|
||
|
||
ArgGPRsLeft -= NeededArgGPRs;
|
||
|
||
if (!isAggregateTypeForABI(Ty) && !Ty->isVectorType()) {
|
||
// Treat an enum type as its underlying type.
|
||
if (const EnumType *EnumTy = Ty->getAs<EnumType>())
|
||
Ty = EnumTy->getDecl()->getIntegerType();
|
||
|
||
// All integral types are promoted to XLen width
|
||
if (Size < XLen && Ty->isIntegralOrEnumerationType()) {
|
||
return extendType(Ty, CGT.ConvertType(Ty));
|
||
}
|
||
|
||
if (const auto *EIT = Ty->getAs<BitIntType>()) {
|
||
if (EIT->getNumBits() < XLen)
|
||
return extendType(Ty, CGT.ConvertType(Ty));
|
||
if (EIT->getNumBits() > 128 ||
|
||
(!getContext().getTargetInfo().hasInt128Type() &&
|
||
EIT->getNumBits() > 64))
|
||
return getNaturalAlignIndirect(
|
||
Ty, /*AddrSpace=*/getDataLayout().getAllocaAddrSpace(),
|
||
/*ByVal=*/false);
|
||
}
|
||
|
||
return ABIArgInfo::getDirect();
|
||
}
|
||
|
||
// TODO: _BitInt is not handled yet in VLS calling convention since _BitInt
|
||
// ABI is also not merged yet in RISC-V:
|
||
// https://github.com/riscv-non-isa/riscv-elf-psabi-doc/pull/419
|
||
if (const VectorType *VT = Ty->getAs<VectorType>();
|
||
VT && !VT->getElementType()->isBitIntType()) {
|
||
if (VT->getVectorKind() == VectorKind::RVVFixedLengthData ||
|
||
VT->getVectorKind() == VectorKind::RVVFixedLengthMask ||
|
||
VT->getVectorKind() == VectorKind::RVVFixedLengthMask_1 ||
|
||
VT->getVectorKind() == VectorKind::RVVFixedLengthMask_2 ||
|
||
VT->getVectorKind() == VectorKind::RVVFixedLengthMask_4)
|
||
return coerceVLSVector(Ty);
|
||
if (VT->getVectorKind() == VectorKind::Generic && ABIVLen != 0)
|
||
// Generic vector without riscv_vls_cc should fall through and pass by
|
||
// reference.
|
||
return coerceVLSVector(Ty, ABIVLen);
|
||
}
|
||
|
||
// Aggregates which are <= 2*XLen will be passed in registers if possible,
|
||
// so coerce to integers.
|
||
if (Size <= 2 * XLen) {
|
||
unsigned Alignment = getContext().getTypeAlign(Ty);
|
||
|
||
// Use a single XLen int if possible, 2*XLen if 2*XLen alignment is
|
||
// required, and a 2-element XLen array if only XLen alignment is required.
|
||
if (Size <= XLen) {
|
||
return ABIArgInfo::getDirect(
|
||
llvm::IntegerType::get(getVMContext(), XLen));
|
||
} else if (Alignment == 2 * XLen) {
|
||
return ABIArgInfo::getDirect(
|
||
llvm::IntegerType::get(getVMContext(), 2 * XLen));
|
||
} else {
|
||
return ABIArgInfo::getDirect(llvm::ArrayType::get(
|
||
llvm::IntegerType::get(getVMContext(), XLen), 2));
|
||
}
|
||
}
|
||
return getNaturalAlignIndirect(
|
||
Ty, /*AddrSpace=*/getDataLayout().getAllocaAddrSpace(),
|
||
/*ByVal=*/false);
|
||
}
|
||
|
||
ABIArgInfo RISCVABIInfo::classifyReturnType(QualType RetTy,
|
||
unsigned ABIVLen) const {
|
||
if (RetTy->isVoidType())
|
||
return ABIArgInfo::getIgnore();
|
||
|
||
int ArgGPRsLeft = 2;
|
||
int ArgFPRsLeft = FLen ? 2 : 0;
|
||
|
||
// The rules for return and argument types are the same, so defer to
|
||
// classifyArgumentType.
|
||
return classifyArgumentType(RetTy, /*IsFixed=*/true, ArgGPRsLeft, ArgFPRsLeft,
|
||
ABIVLen);
|
||
}
|
||
|
||
RValue RISCVABIInfo::EmitVAArg(CodeGenFunction &CGF, Address VAListAddr,
|
||
QualType Ty, AggValueSlot Slot) const {
|
||
CharUnits SlotSize = CharUnits::fromQuantity(XLen / 8);
|
||
|
||
// Empty records are ignored for parameter passing purposes.
|
||
if (isEmptyRecord(getContext(), Ty, true))
|
||
return Slot.asRValue();
|
||
|
||
auto TInfo = getContext().getTypeInfoInChars(Ty);
|
||
|
||
// TODO: To be compatible with GCC's behaviors, we force arguments with
|
||
// 2×XLEN-bit alignment and size at most 2×XLEN bits like `long long`,
|
||
// `unsigned long long` and `double` to have 4-byte alignment. This
|
||
// behavior may be changed when RV32E/ILP32E is ratified.
|
||
if (EABI && XLen == 32)
|
||
TInfo.Align = std::min(TInfo.Align, CharUnits::fromQuantity(4));
|
||
|
||
// Arguments bigger than 2*Xlen bytes are passed indirectly.
|
||
bool IsIndirect = TInfo.Width > 2 * SlotSize;
|
||
|
||
return emitVoidPtrVAArg(CGF, VAListAddr, Ty, IsIndirect, TInfo, SlotSize,
|
||
/*AllowHigherAlign=*/true, Slot);
|
||
}
|
||
|
||
ABIArgInfo RISCVABIInfo::extendType(QualType Ty, llvm::Type *CoerceTy) const {
|
||
int TySize = getContext().getTypeSize(Ty);
|
||
// RV64 ABI requires unsigned 32 bit integers to be sign extended.
|
||
if (XLen == 64 && Ty->isUnsignedIntegerOrEnumerationType() && TySize == 32)
|
||
return ABIArgInfo::getSignExtend(Ty, CoerceTy);
|
||
return ABIArgInfo::getExtend(Ty, CoerceTy);
|
||
}
|
||
|
||
namespace {
|
||
class RISCVTargetCodeGenInfo : public TargetCodeGenInfo {
|
||
public:
|
||
RISCVTargetCodeGenInfo(CodeGen::CodeGenTypes &CGT, unsigned XLen,
|
||
unsigned FLen, bool EABI)
|
||
: TargetCodeGenInfo(
|
||
std::make_unique<RISCVABIInfo>(CGT, XLen, FLen, EABI)) {
|
||
SwiftInfo =
|
||
std::make_unique<SwiftABIInfo>(CGT, /*SwiftErrorInRegister=*/false);
|
||
}
|
||
|
||
void setTargetAttributes(const Decl *D, llvm::GlobalValue *GV,
|
||
CodeGen::CodeGenModule &CGM) const override {
|
||
const auto *FD = dyn_cast_or_null<FunctionDecl>(D);
|
||
if (!FD) return;
|
||
|
||
auto *Fn = cast<llvm::Function>(GV);
|
||
|
||
if (CGM.getCodeGenOpts().CFProtectionReturn)
|
||
Fn->addFnAttr("hw-shadow-stack");
|
||
|
||
const auto *Attr = FD->getAttr<RISCVInterruptAttr>();
|
||
if (!Attr)
|
||
return;
|
||
|
||
StringRef Kind = "machine";
|
||
bool HasSiFiveCLICPreemptible = false;
|
||
bool HasSiFiveCLICStackSwap = false;
|
||
for (RISCVInterruptAttr::InterruptType type : Attr->interrupt()) {
|
||
switch (type) {
|
||
case RISCVInterruptAttr::machine:
|
||
// Do not update `Kind` because `Kind` is already "machine", or the
|
||
// kinds also contains SiFive types which need to be applied.
|
||
break;
|
||
case RISCVInterruptAttr::supervisor:
|
||
Kind = "supervisor";
|
||
break;
|
||
case RISCVInterruptAttr::qcinest:
|
||
Kind = "qci-nest";
|
||
break;
|
||
case RISCVInterruptAttr::qcinonest:
|
||
Kind = "qci-nonest";
|
||
break;
|
||
// There are three different LLVM IR attribute values for SiFive CLIC
|
||
// interrupt kinds, one for each kind and one extra for their combination.
|
||
case RISCVInterruptAttr::SiFiveCLICPreemptible: {
|
||
HasSiFiveCLICPreemptible = true;
|
||
Kind = HasSiFiveCLICStackSwap ? "SiFive-CLIC-preemptible-stack-swap"
|
||
: "SiFive-CLIC-preemptible";
|
||
break;
|
||
}
|
||
case RISCVInterruptAttr::SiFiveCLICStackSwap: {
|
||
HasSiFiveCLICStackSwap = true;
|
||
Kind = HasSiFiveCLICPreemptible ? "SiFive-CLIC-preemptible-stack-swap"
|
||
: "SiFive-CLIC-stack-swap";
|
||
break;
|
||
}
|
||
}
|
||
}
|
||
|
||
Fn->addFnAttr("interrupt", Kind);
|
||
}
|
||
};
|
||
} // namespace
|
||
|
||
std::unique_ptr<TargetCodeGenInfo>
|
||
CodeGen::createRISCVTargetCodeGenInfo(CodeGenModule &CGM, unsigned XLen,
|
||
unsigned FLen, bool EABI) {
|
||
return std::make_unique<RISCVTargetCodeGenInfo>(CGM.getTypes(), XLen, FLen,
|
||
EABI);
|
||
}
|