PPCSubtarget.cpp revision 302408
1//===-- PowerPCSubtarget.cpp - PPC Subtarget Information ------------------===// 2// 3// The LLVM Compiler Infrastructure 4// 5// This file is distributed under the University of Illinois Open Source 6// License. See LICENSE.TXT for details. 7// 8//===----------------------------------------------------------------------===// 9// 10// This file implements the PPC specific subclass of TargetSubtargetInfo. 11// 12//===----------------------------------------------------------------------===// 13 14#include "PPCSubtarget.h" 15#include "PPC.h" 16#include "PPCRegisterInfo.h" 17#include "PPCTargetMachine.h" 18#include "llvm/CodeGen/MachineFunction.h" 19#include "llvm/CodeGen/MachineScheduler.h" 20#include "llvm/IR/Attributes.h" 21#include "llvm/IR/Function.h" 22#include "llvm/IR/GlobalValue.h" 23#include "llvm/Support/CommandLine.h" 24#include "llvm/Support/TargetRegistry.h" 25#include "llvm/Target/TargetMachine.h" 26#include <cstdlib> 27 28using namespace llvm; 29 30#define DEBUG_TYPE "ppc-subtarget" 31 32#define GET_SUBTARGETINFO_TARGET_DESC 33#define GET_SUBTARGETINFO_CTOR 34#include "PPCGenSubtargetInfo.inc" 35 36static cl::opt<bool> UseSubRegLiveness("ppc-track-subreg-liveness", 37cl::desc("Enable subregister liveness tracking for PPC"), cl::Hidden); 38 39static cl::opt<bool> QPXStackUnaligned("qpx-stack-unaligned", 40 cl::desc("Even when QPX is enabled the stack is not 32-byte aligned"), 41 cl::Hidden); 42 43PPCSubtarget &PPCSubtarget::initializeSubtargetDependencies(StringRef CPU, 44 StringRef FS) { 45 initializeEnvironment(); 46 initSubtargetFeatures(CPU, FS); 47 return *this; 48} 49 50PPCSubtarget::PPCSubtarget(const Triple &TT, const std::string &CPU, 51 const std::string &FS, const PPCTargetMachine &TM) 52 : PPCGenSubtargetInfo(TT, CPU, FS), TargetTriple(TT), 53 IsPPC64(TargetTriple.getArch() == Triple::ppc64 || 54 TargetTriple.getArch() == Triple::ppc64le), 55 TM(TM), FrameLowering(initializeSubtargetDependencies(CPU, FS)), 56 InstrInfo(*this), TLInfo(TM, *this) {} 57 58void PPCSubtarget::initializeEnvironment() { 59 StackAlignment = 16; 60 DarwinDirective = PPC::DIR_NONE; 61 HasMFOCRF = false; 62 Has64BitSupport = false; 63 Use64BitRegs = false; 64 UseCRBits = false; 65 UseSoftFloat = false; 66 HasAltivec = false; 67 HasSPE = false; 68 HasQPX = false; 69 HasVSX = false; 70 HasP8Vector = false; 71 HasP8Altivec = false; 72 HasP8Crypto = false; 73 HasFCPSGN = false; 74 HasFSQRT = false; 75 HasFRE = false; 76 HasFRES = false; 77 HasFRSQRTE = false; 78 HasFRSQRTES = false; 79 HasRecipPrec = false; 80 HasSTFIWX = false; 81 HasLFIWAX = false; 82 HasFPRND = false; 83 HasFPCVT = false; 84 HasISEL = false; 85 HasPOPCNTD = false; 86 HasBPERMD = false; 87 HasExtDiv = false; 88 HasCMPB = false; 89 HasLDBRX = false; 90 IsBookE = false; 91 HasOnlyMSYNC = false; 92 IsPPC4xx = false; 93 IsPPC6xx = false; 94 IsE500 = false; 95 FeatureMFTB = false; 96 DeprecatedDST = false; 97 HasLazyResolverStubs = false; 98 HasICBT = false; 99 HasInvariantFunctionDescriptors = false; 100 HasPartwordAtomics = false; 101 HasDirectMove = false; 102 IsQPXStackUnaligned = false; 103 HasHTM = false; 104 HasFusion = false; 105 HasFloat128 = false; 106} 107 108void PPCSubtarget::initSubtargetFeatures(StringRef CPU, StringRef FS) { 109 // Determine default and user specified characteristics 110 std::string CPUName = CPU; 111 if (CPUName.empty()) { 112 // If cross-compiling with -march=ppc64le without -mcpu 113 if (TargetTriple.getArch() == Triple::ppc64le) 114 CPUName = "ppc64le"; 115 else 116 CPUName = "generic"; 117 } 118 119 // Initialize scheduling itinerary for the specified CPU. 120 InstrItins = getInstrItineraryForCPU(CPUName); 121 122 // Parse features string. 123 ParseSubtargetFeatures(CPUName, FS); 124 125 // If the user requested use of 64-bit regs, but the cpu selected doesn't 126 // support it, ignore. 127 if (IsPPC64 && has64BitSupport()) 128 Use64BitRegs = true; 129 130 // Set up darwin-specific properties. 131 if (isDarwin()) 132 HasLazyResolverStubs = true; 133 134 // QPX requires a 32-byte aligned stack. Note that we need to do this if 135 // we're compiling for a BG/Q system regardless of whether or not QPX 136 // is enabled because external functions will assume this alignment. 137 IsQPXStackUnaligned = QPXStackUnaligned; 138 StackAlignment = getPlatformStackAlignment(); 139 140 // Determine endianness. 141 // FIXME: Part of the TargetMachine. 142 IsLittleEndian = (TargetTriple.getArch() == Triple::ppc64le); 143} 144 145/// hasLazyResolverStub - Return true if accesses to the specified global have 146/// to go through a dyld lazy resolution stub. This means that an extra load 147/// is required to get the address of the global. 148bool PPCSubtarget::hasLazyResolverStub(const GlobalValue *GV) const { 149 // We never have stubs if HasLazyResolverStubs=false or if in static mode. 150 if (!HasLazyResolverStubs || TM.getRelocationModel() == Reloc::Static) 151 return false; 152 bool isDecl = GV->isDeclaration(); 153 if (GV->hasHiddenVisibility() && !isDecl && !GV->hasCommonLinkage()) 154 return false; 155 return GV->hasWeakLinkage() || GV->hasLinkOnceLinkage() || 156 GV->hasCommonLinkage() || isDecl; 157} 158 159// Embedded cores need aggressive scheduling (and some others also benefit). 160static bool needsAggressiveScheduling(unsigned Directive) { 161 switch (Directive) { 162 default: return false; 163 case PPC::DIR_440: 164 case PPC::DIR_A2: 165 case PPC::DIR_E500mc: 166 case PPC::DIR_E5500: 167 case PPC::DIR_PWR7: 168 case PPC::DIR_PWR8: 169 return true; 170 } 171} 172 173bool PPCSubtarget::enableMachineScheduler() const { 174 // Enable MI scheduling for the embedded cores. 175 // FIXME: Enable this for all cores (some additional modeling 176 // may be necessary). 177 return needsAggressiveScheduling(DarwinDirective); 178} 179 180// This overrides the PostRAScheduler bit in the SchedModel for each CPU. 181bool PPCSubtarget::enablePostRAScheduler() const { return true; } 182 183PPCGenSubtargetInfo::AntiDepBreakMode PPCSubtarget::getAntiDepBreakMode() const { 184 return TargetSubtargetInfo::ANTIDEP_ALL; 185} 186 187void PPCSubtarget::getCriticalPathRCs(RegClassVector &CriticalPathRCs) const { 188 CriticalPathRCs.clear(); 189 CriticalPathRCs.push_back(isPPC64() ? 190 &PPC::G8RCRegClass : &PPC::GPRCRegClass); 191} 192 193void PPCSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy, 194 MachineInstr *begin, 195 MachineInstr *end, 196 unsigned NumRegionInstrs) const { 197 if (needsAggressiveScheduling(DarwinDirective)) { 198 Policy.OnlyTopDown = false; 199 Policy.OnlyBottomUp = false; 200 } 201 202 // Spilling is generally expensive on all PPC cores, so always enable 203 // register-pressure tracking. 204 Policy.ShouldTrackPressure = true; 205} 206 207bool PPCSubtarget::useAA() const { 208 // Use AA during code generation for the embedded cores. 209 return needsAggressiveScheduling(DarwinDirective); 210} 211 212bool PPCSubtarget::enableSubRegLiveness() const { 213 return UseSubRegLiveness; 214} 215 216unsigned char PPCSubtarget::classifyGlobalReference( 217 const GlobalValue *GV) const { 218 // Note that currently we don't generate non-pic references. 219 // If a caller wants that, this will have to be updated. 220 221 // Large code model always uses the TOC even for local symbols. 222 if (TM.getCodeModel() == CodeModel::Large) 223 return PPCII::MO_PIC_FLAG | PPCII::MO_NLP_FLAG; 224 225 unsigned char flags = PPCII::MO_PIC_FLAG; 226 227 // Only if the relocation mode is PIC do we have to worry about 228 // interposition. In all other cases we can use a slightly looser standard to 229 // decide how to access the symbol. 230 if (TM.getRelocationModel() == Reloc::PIC_) { 231 // If it's local, or it's non-default, it can't be interposed. 232 if (!GV->hasLocalLinkage() && 233 GV->hasDefaultVisibility()) { 234 flags |= PPCII::MO_NLP_FLAG; 235 } 236 return flags; 237 } 238 239 if (GV->isStrongDefinitionForLinker()) 240 return flags; 241 return flags | PPCII::MO_NLP_FLAG; 242} 243 244bool PPCSubtarget::isELFv2ABI() const { return TM.isELFv2ABI(); } 245bool PPCSubtarget::isPPC64() const { return TM.isPPC64(); } 246