This patch disallows the use of the -maix-small-local-exec-tls and -fno-data-sections options within clang, and also disallows the use of the aix-small-local-exec-tls attribute with the -data-sections=false option in llc. This is because having data sections off when using the aix-small-local-exec-tls feature is not ideal for performance. As the small-local-exec-tls region is a limited resource, this space should not used for variables that may be replaced. Note, that on AIX, data sections is turned on by default, so this patch makes it so that a diagnostic is emitted when users explicitly turn off data sections while using the aix-small-local-exec-tls feature.
221 lines
7.6 KiB
C++
221 lines
7.6 KiB
C++
//===-- PowerPCSubtarget.cpp - PPC Subtarget Information ------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file implements the PPC specific subclass of TargetSubtargetInfo.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "PPCSubtarget.h"
|
|
#include "GISel/PPCCallLowering.h"
|
|
#include "GISel/PPCLegalizerInfo.h"
|
|
#include "GISel/PPCRegisterBankInfo.h"
|
|
#include "PPC.h"
|
|
#include "PPCRegisterInfo.h"
|
|
#include "PPCTargetMachine.h"
|
|
#include "llvm/CodeGen/GlobalISel/InstructionSelect.h"
|
|
#include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
#include "llvm/CodeGen/MachineScheduler.h"
|
|
#include "llvm/IR/Attributes.h"
|
|
#include "llvm/IR/Function.h"
|
|
#include "llvm/IR/GlobalValue.h"
|
|
#include "llvm/MC/TargetRegistry.h"
|
|
#include "llvm/Support/CommandLine.h"
|
|
#include "llvm/Target/TargetMachine.h"
|
|
#include <cstdlib>
|
|
|
|
using namespace llvm;
|
|
|
|
#define DEBUG_TYPE "ppc-subtarget"
|
|
|
|
#define GET_SUBTARGETINFO_TARGET_DESC
|
|
#define GET_SUBTARGETINFO_CTOR
|
|
#include "PPCGenSubtargetInfo.inc"
|
|
|
|
static cl::opt<bool>
|
|
UseSubRegLiveness("ppc-track-subreg-liveness",
|
|
cl::desc("Enable subregister liveness tracking for PPC"),
|
|
cl::init(true), cl::Hidden);
|
|
|
|
static cl::opt<bool>
|
|
EnableMachinePipeliner("ppc-enable-pipeliner",
|
|
cl::desc("Enable Machine Pipeliner for PPC"),
|
|
cl::init(false), cl::Hidden);
|
|
|
|
PPCSubtarget &PPCSubtarget::initializeSubtargetDependencies(StringRef CPU,
|
|
StringRef TuneCPU,
|
|
StringRef FS) {
|
|
initializeEnvironment();
|
|
initSubtargetFeatures(CPU, TuneCPU, FS);
|
|
return *this;
|
|
}
|
|
|
|
PPCSubtarget::PPCSubtarget(const Triple &TT, const std::string &CPU,
|
|
const std::string &TuneCPU, const std::string &FS,
|
|
const PPCTargetMachine &TM)
|
|
: PPCGenSubtargetInfo(TT, CPU, TuneCPU, FS), TargetTriple(TT),
|
|
IsPPC64(TargetTriple.getArch() == Triple::ppc64 ||
|
|
TargetTriple.getArch() == Triple::ppc64le),
|
|
TM(TM), FrameLowering(initializeSubtargetDependencies(CPU, TuneCPU, FS)),
|
|
InstrInfo(*this), TLInfo(TM, *this) {
|
|
CallLoweringInfo.reset(new PPCCallLowering(*getTargetLowering()));
|
|
Legalizer.reset(new PPCLegalizerInfo(*this));
|
|
auto *RBI = new PPCRegisterBankInfo(*getRegisterInfo());
|
|
RegBankInfo.reset(RBI);
|
|
|
|
InstSelector.reset(createPPCInstructionSelector(
|
|
*static_cast<const PPCTargetMachine *>(&TM), *this, *RBI));
|
|
}
|
|
|
|
void PPCSubtarget::initializeEnvironment() {
|
|
StackAlignment = Align(16);
|
|
CPUDirective = PPC::DIR_NONE;
|
|
HasPOPCNTD = POPCNTD_Unavailable;
|
|
}
|
|
|
|
void PPCSubtarget::initSubtargetFeatures(StringRef CPU, StringRef TuneCPU,
|
|
StringRef FS) {
|
|
// Determine default and user specified characteristics
|
|
std::string CPUName = std::string(CPU);
|
|
if (CPUName.empty() || CPU == "generic") {
|
|
// If cross-compiling with -march=ppc64le without -mcpu
|
|
if (TargetTriple.getArch() == Triple::ppc64le)
|
|
CPUName = "ppc64le";
|
|
else if (TargetTriple.getSubArch() == Triple::PPCSubArch_spe)
|
|
CPUName = "e500";
|
|
else
|
|
CPUName = "generic";
|
|
}
|
|
|
|
// Determine the CPU to schedule for.
|
|
if (TuneCPU.empty()) TuneCPU = CPUName;
|
|
|
|
// Initialize scheduling itinerary for the specified CPU.
|
|
InstrItins = getInstrItineraryForCPU(CPUName);
|
|
|
|
// Parse features string.
|
|
ParseSubtargetFeatures(CPUName, TuneCPU, FS);
|
|
|
|
// If the user requested use of 64-bit regs, but the cpu selected doesn't
|
|
// support it, ignore.
|
|
if (IsPPC64 && has64BitSupport())
|
|
Use64BitRegs = true;
|
|
|
|
if (TargetTriple.isPPC32SecurePlt())
|
|
IsSecurePlt = true;
|
|
|
|
if (HasSPE && IsPPC64)
|
|
report_fatal_error( "SPE is only supported for 32-bit targets.\n", false);
|
|
if (HasSPE && (HasAltivec || HasVSX || HasFPU))
|
|
report_fatal_error(
|
|
"SPE and traditional floating point cannot both be enabled.\n", false);
|
|
|
|
// If not SPE, set standard FPU
|
|
if (!HasSPE)
|
|
HasFPU = true;
|
|
|
|
StackAlignment = getPlatformStackAlignment();
|
|
|
|
// Determine endianness.
|
|
IsLittleEndian = TM.isLittleEndian();
|
|
|
|
if (HasAIXSmallLocalExecTLS) {
|
|
if (!TargetTriple.isOSAIX() || !IsPPC64)
|
|
report_fatal_error(
|
|
"The aix-small-local-exec-tls attribute is only supported on AIX in "
|
|
"64-bit mode.\n",
|
|
false);
|
|
// The aix-small-local-exec-tls attribute should only be used with
|
|
// -data-sections, as having data sections turned off with this option
|
|
// is not ideal for performance. Moreover, the small-local-exec-tls region
|
|
// is a limited resource, and should not be used for variables that may
|
|
// be replaced.
|
|
if (!TM.getDataSections())
|
|
report_fatal_error(
|
|
"The aix-small-local-exec-tls attribute can only be specified with "
|
|
"-data-sections.\n",
|
|
false);
|
|
}
|
|
}
|
|
|
|
bool PPCSubtarget::enableMachineScheduler() const { return true; }
|
|
|
|
bool PPCSubtarget::enableMachinePipeliner() const {
|
|
return getSchedModel().hasInstrSchedModel() && EnableMachinePipeliner;
|
|
}
|
|
|
|
bool PPCSubtarget::useDFAforSMS() const { return false; }
|
|
|
|
// This overrides the PostRAScheduler bit in the SchedModel for each CPU.
|
|
bool PPCSubtarget::enablePostRAScheduler() const { return true; }
|
|
|
|
PPCGenSubtargetInfo::AntiDepBreakMode PPCSubtarget::getAntiDepBreakMode() const {
|
|
return TargetSubtargetInfo::ANTIDEP_ALL;
|
|
}
|
|
|
|
void PPCSubtarget::getCriticalPathRCs(RegClassVector &CriticalPathRCs) const {
|
|
CriticalPathRCs.clear();
|
|
CriticalPathRCs.push_back(isPPC64() ?
|
|
&PPC::G8RCRegClass : &PPC::GPRCRegClass);
|
|
}
|
|
|
|
void PPCSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,
|
|
unsigned NumRegionInstrs) const {
|
|
// The GenericScheduler that we use defaults to scheduling bottom up only.
|
|
// We want to schedule from both the top and the bottom and so we set
|
|
// OnlyBottomUp to false.
|
|
// We want to do bi-directional scheduling since it provides a more balanced
|
|
// schedule leading to better performance.
|
|
Policy.OnlyBottomUp = false;
|
|
// Spilling is generally expensive on all PPC cores, so always enable
|
|
// register-pressure tracking.
|
|
Policy.ShouldTrackPressure = true;
|
|
}
|
|
|
|
bool PPCSubtarget::useAA() const {
|
|
return true;
|
|
}
|
|
|
|
bool PPCSubtarget::enableSubRegLiveness() const {
|
|
return UseSubRegLiveness;
|
|
}
|
|
|
|
bool PPCSubtarget::isGVIndirectSymbol(const GlobalValue *GV) const {
|
|
// Large code model always uses the TOC even for local symbols.
|
|
if (TM.getCodeModel() == CodeModel::Large)
|
|
return true;
|
|
if (TM.shouldAssumeDSOLocal(*GV->getParent(), GV))
|
|
return false;
|
|
return true;
|
|
}
|
|
|
|
bool PPCSubtarget::isELFv2ABI() const { return TM.isELFv2ABI(); }
|
|
bool PPCSubtarget::isPPC64() const { return TM.isPPC64(); }
|
|
|
|
bool PPCSubtarget::isUsingPCRelativeCalls() const {
|
|
return isPPC64() && hasPCRelativeMemops() && isELFv2ABI() &&
|
|
CodeModel::Medium == getTargetMachine().getCodeModel();
|
|
}
|
|
|
|
// GlobalISEL
|
|
const CallLowering *PPCSubtarget::getCallLowering() const {
|
|
return CallLoweringInfo.get();
|
|
}
|
|
|
|
const RegisterBankInfo *PPCSubtarget::getRegBankInfo() const {
|
|
return RegBankInfo.get();
|
|
}
|
|
|
|
const LegalizerInfo *PPCSubtarget::getLegalizerInfo() const {
|
|
return Legalizer.get();
|
|
}
|
|
|
|
InstructionSelector *PPCSubtarget::getInstructionSelector() const {
|
|
return InstSelector.get();
|
|
}
|