SystemZFrameLowering.cpp revision 263508
1//===-- SystemZFrameLowering.cpp - Frame lowering for SystemZ -------------===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include "SystemZFrameLowering.h"
11#include "SystemZCallingConv.h"
12#include "SystemZInstrBuilder.h"
13#include "SystemZMachineFunctionInfo.h"
14#include "SystemZTargetMachine.h"
15#include "llvm/CodeGen/MachineModuleInfo.h"
16#include "llvm/CodeGen/MachineRegisterInfo.h"
17#include "llvm/CodeGen/RegisterScavenging.h"
18#include "llvm/IR/Function.h"
19
20using namespace llvm;
21
22namespace {
23  // The ABI-defined register save slots, relative to the incoming stack
24  // pointer.
25  static const TargetFrameLowering::SpillSlot SpillOffsetTable[] = {
26    { SystemZ::R2D,  0x10 },
27    { SystemZ::R3D,  0x18 },
28    { SystemZ::R4D,  0x20 },
29    { SystemZ::R5D,  0x28 },
30    { SystemZ::R6D,  0x30 },
31    { SystemZ::R7D,  0x38 },
32    { SystemZ::R8D,  0x40 },
33    { SystemZ::R9D,  0x48 },
34    { SystemZ::R10D, 0x50 },
35    { SystemZ::R11D, 0x58 },
36    { SystemZ::R12D, 0x60 },
37    { SystemZ::R13D, 0x68 },
38    { SystemZ::R14D, 0x70 },
39    { SystemZ::R15D, 0x78 },
40    { SystemZ::F0D,  0x80 },
41    { SystemZ::F2D,  0x88 },
42    { SystemZ::F4D,  0x90 },
43    { SystemZ::F6D,  0x98 }
44  };
45}
46
47SystemZFrameLowering::SystemZFrameLowering(const SystemZTargetMachine &tm,
48                                           const SystemZSubtarget &sti)
49  : TargetFrameLowering(TargetFrameLowering::StackGrowsDown, 8,
50                        -SystemZMC::CallFrameSize, 8),
51    TM(tm), STI(sti) {
52  // Create a mapping from register number to save slot offset.
53  RegSpillOffsets.grow(SystemZ::NUM_TARGET_REGS);
54  for (unsigned I = 0, E = array_lengthof(SpillOffsetTable); I != E; ++I)
55    RegSpillOffsets[SpillOffsetTable[I].Reg] = SpillOffsetTable[I].Offset;
56}
57
58const TargetFrameLowering::SpillSlot *
59SystemZFrameLowering::getCalleeSavedSpillSlots(unsigned &NumEntries) const {
60  NumEntries = array_lengthof(SpillOffsetTable);
61  return SpillOffsetTable;
62}
63
64void SystemZFrameLowering::
65processFunctionBeforeCalleeSavedScan(MachineFunction &MF,
66                                     RegScavenger *RS) const {
67  MachineFrameInfo *MFFrame = MF.getFrameInfo();
68  MachineRegisterInfo &MRI = MF.getRegInfo();
69  const TargetRegisterInfo *TRI = MF.getTarget().getRegisterInfo();
70  bool HasFP = hasFP(MF);
71  SystemZMachineFunctionInfo *MFI = MF.getInfo<SystemZMachineFunctionInfo>();
72  bool IsVarArg = MF.getFunction()->isVarArg();
73
74  // va_start stores incoming FPR varargs in the normal way, but delegates
75  // the saving of incoming GPR varargs to spillCalleeSavedRegisters().
76  // Record these pending uses, which typically include the call-saved
77  // argument register R6D.
78  if (IsVarArg)
79    for (unsigned I = MFI->getVarArgsFirstGPR(); I < SystemZ::NumArgGPRs; ++I)
80      MRI.setPhysRegUsed(SystemZ::ArgGPRs[I]);
81
82  // If the function requires a frame pointer, record that the hard
83  // frame pointer will be clobbered.
84  if (HasFP)
85    MRI.setPhysRegUsed(SystemZ::R11D);
86
87  // If the function calls other functions, record that the return
88  // address register will be clobbered.
89  if (MFFrame->hasCalls())
90    MRI.setPhysRegUsed(SystemZ::R14D);
91
92  // If we are saving GPRs other than the stack pointer, we might as well
93  // save and restore the stack pointer at the same time, via STMG and LMG.
94  // This allows the deallocation to be done by the LMG, rather than needing
95  // a separate %r15 addition.
96  const uint16_t *CSRegs = TRI->getCalleeSavedRegs(&MF);
97  for (unsigned I = 0; CSRegs[I]; ++I) {
98    unsigned Reg = CSRegs[I];
99    if (SystemZ::GR64BitRegClass.contains(Reg) && MRI.isPhysRegUsed(Reg)) {
100      MRI.setPhysRegUsed(SystemZ::R15D);
101      break;
102    }
103  }
104}
105
106// Add GPR64 to the save instruction being built by MIB, which is in basic
107// block MBB.  IsImplicit says whether this is an explicit operand to the
108// instruction, or an implicit one that comes between the explicit start
109// and end registers.
110static void addSavedGPR(MachineBasicBlock &MBB, MachineInstrBuilder &MIB,
111                        const SystemZTargetMachine &TM,
112                        unsigned GPR64, bool IsImplicit) {
113  const SystemZRegisterInfo *RI = TM.getRegisterInfo();
114  unsigned GPR32 = RI->getSubReg(GPR64, SystemZ::subreg_l32);
115  bool IsLive = MBB.isLiveIn(GPR64) || MBB.isLiveIn(GPR32);
116  if (!IsLive || !IsImplicit) {
117    MIB.addReg(GPR64, getImplRegState(IsImplicit) | getKillRegState(!IsLive));
118    if (!IsLive)
119      MBB.addLiveIn(GPR64);
120  }
121}
122
123bool SystemZFrameLowering::
124spillCalleeSavedRegisters(MachineBasicBlock &MBB,
125                          MachineBasicBlock::iterator MBBI,
126                          const std::vector<CalleeSavedInfo> &CSI,
127                          const TargetRegisterInfo *TRI) const {
128  if (CSI.empty())
129    return false;
130
131  MachineFunction &MF = *MBB.getParent();
132  const TargetInstrInfo *TII = MF.getTarget().getInstrInfo();
133  SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
134  bool IsVarArg = MF.getFunction()->isVarArg();
135  DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
136
137  // Scan the call-saved GPRs and find the bounds of the register spill area.
138  unsigned LowGPR = 0;
139  unsigned HighGPR = SystemZ::R15D;
140  unsigned StartOffset = -1U;
141  for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
142    unsigned Reg = CSI[I].getReg();
143    if (SystemZ::GR64BitRegClass.contains(Reg)) {
144      unsigned Offset = RegSpillOffsets[Reg];
145      assert(Offset && "Unexpected GPR save");
146      if (StartOffset > Offset) {
147        LowGPR = Reg;
148        StartOffset = Offset;
149      }
150    }
151  }
152
153  // Save the range of call-saved registers, for use by the epilogue inserter.
154  ZFI->setLowSavedGPR(LowGPR);
155  ZFI->setHighSavedGPR(HighGPR);
156
157  // Include the GPR varargs, if any.  R6D is call-saved, so would
158  // be included by the loop above, but we also need to handle the
159  // call-clobbered argument registers.
160  if (IsVarArg) {
161    unsigned FirstGPR = ZFI->getVarArgsFirstGPR();
162    if (FirstGPR < SystemZ::NumArgGPRs) {
163      unsigned Reg = SystemZ::ArgGPRs[FirstGPR];
164      unsigned Offset = RegSpillOffsets[Reg];
165      if (StartOffset > Offset) {
166        LowGPR = Reg; StartOffset = Offset;
167      }
168    }
169  }
170
171  // Save GPRs
172  if (LowGPR) {
173    assert(LowGPR != HighGPR && "Should be saving %r15 and something else");
174
175    // Build an STMG instruction.
176    MachineInstrBuilder MIB = BuildMI(MBB, MBBI, DL, TII->get(SystemZ::STMG));
177
178    // Add the explicit register operands.
179    addSavedGPR(MBB, MIB, TM, LowGPR, false);
180    addSavedGPR(MBB, MIB, TM, HighGPR, false);
181
182    // Add the address.
183    MIB.addReg(SystemZ::R15D).addImm(StartOffset);
184
185    // Make sure all call-saved GPRs are included as operands and are
186    // marked as live on entry.
187    for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
188      unsigned Reg = CSI[I].getReg();
189      if (SystemZ::GR64BitRegClass.contains(Reg))
190        addSavedGPR(MBB, MIB, TM, Reg, true);
191    }
192
193    // ...likewise GPR varargs.
194    if (IsVarArg)
195      for (unsigned I = ZFI->getVarArgsFirstGPR(); I < SystemZ::NumArgGPRs; ++I)
196        addSavedGPR(MBB, MIB, TM, SystemZ::ArgGPRs[I], true);
197  }
198
199  // Save FPRs in the normal TargetInstrInfo way.
200  for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
201    unsigned Reg = CSI[I].getReg();
202    if (SystemZ::FP64BitRegClass.contains(Reg)) {
203      MBB.addLiveIn(Reg);
204      TII->storeRegToStackSlot(MBB, MBBI, Reg, true, CSI[I].getFrameIdx(),
205                               &SystemZ::FP64BitRegClass, TRI);
206    }
207  }
208
209  return true;
210}
211
212bool SystemZFrameLowering::
213restoreCalleeSavedRegisters(MachineBasicBlock &MBB,
214                            MachineBasicBlock::iterator MBBI,
215                            const std::vector<CalleeSavedInfo> &CSI,
216                            const TargetRegisterInfo *TRI) const {
217  if (CSI.empty())
218    return false;
219
220  MachineFunction &MF = *MBB.getParent();
221  const TargetInstrInfo *TII = MF.getTarget().getInstrInfo();
222  SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
223  bool HasFP = hasFP(MF);
224  DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
225
226  // Restore FPRs in the normal TargetInstrInfo way.
227  for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
228    unsigned Reg = CSI[I].getReg();
229    if (SystemZ::FP64BitRegClass.contains(Reg))
230      TII->loadRegFromStackSlot(MBB, MBBI, Reg, CSI[I].getFrameIdx(),
231                                &SystemZ::FP64BitRegClass, TRI);
232  }
233
234  // Restore call-saved GPRs (but not call-clobbered varargs, which at
235  // this point might hold return values).
236  unsigned LowGPR = ZFI->getLowSavedGPR();
237  unsigned HighGPR = ZFI->getHighSavedGPR();
238  unsigned StartOffset = RegSpillOffsets[LowGPR];
239  if (LowGPR) {
240    // If we saved any of %r2-%r5 as varargs, we should also be saving
241    // and restoring %r6.  If we're saving %r6 or above, we should be
242    // restoring it too.
243    assert(LowGPR != HighGPR && "Should be loading %r15 and something else");
244
245    // Build an LMG instruction.
246    MachineInstrBuilder MIB = BuildMI(MBB, MBBI, DL, TII->get(SystemZ::LMG));
247
248    // Add the explicit register operands.
249    MIB.addReg(LowGPR, RegState::Define);
250    MIB.addReg(HighGPR, RegState::Define);
251
252    // Add the address.
253    MIB.addReg(HasFP ? SystemZ::R11D : SystemZ::R15D);
254    MIB.addImm(StartOffset);
255
256    // Do a second scan adding regs as being defined by instruction
257    for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
258      unsigned Reg = CSI[I].getReg();
259      if (Reg != LowGPR && Reg != HighGPR)
260        MIB.addReg(Reg, RegState::ImplicitDefine);
261    }
262  }
263
264  return true;
265}
266
267void SystemZFrameLowering::
268processFunctionBeforeFrameFinalized(MachineFunction &MF,
269                                    RegScavenger *RS) const {
270  MachineFrameInfo *MFFrame = MF.getFrameInfo();
271  uint64_t MaxReach = (MFFrame->estimateStackSize(MF) +
272                       SystemZMC::CallFrameSize * 2);
273  if (!isUInt<12>(MaxReach)) {
274    // We may need register scavenging slots if some parts of the frame
275    // are outside the reach of an unsigned 12-bit displacement.
276    // Create 2 for the case where both addresses in an MVC are
277    // out of range.
278    RS->addScavengingFrameIndex(MFFrame->CreateStackObject(8, 8, false));
279    RS->addScavengingFrameIndex(MFFrame->CreateStackObject(8, 8, false));
280  }
281}
282
283// Emit instructions before MBBI (in MBB) to add NumBytes to Reg.
284static void emitIncrement(MachineBasicBlock &MBB,
285                          MachineBasicBlock::iterator &MBBI,
286                          const DebugLoc &DL,
287                          unsigned Reg, int64_t NumBytes,
288                          const TargetInstrInfo *TII) {
289  while (NumBytes) {
290    unsigned Opcode;
291    int64_t ThisVal = NumBytes;
292    if (isInt<16>(NumBytes))
293      Opcode = SystemZ::AGHI;
294    else {
295      Opcode = SystemZ::AGFI;
296      // Make sure we maintain 8-byte stack alignment.
297      int64_t MinVal = -int64_t(1) << 31;
298      int64_t MaxVal = (int64_t(1) << 31) - 8;
299      if (ThisVal < MinVal)
300        ThisVal = MinVal;
301      else if (ThisVal > MaxVal)
302        ThisVal = MaxVal;
303    }
304    MachineInstr *MI = BuildMI(MBB, MBBI, DL, TII->get(Opcode), Reg)
305      .addReg(Reg).addImm(ThisVal);
306    // The CC implicit def is dead.
307    MI->getOperand(3).setIsDead();
308    NumBytes -= ThisVal;
309  }
310}
311
312void SystemZFrameLowering::emitPrologue(MachineFunction &MF) const {
313  MachineBasicBlock &MBB = MF.front();
314  MachineFrameInfo *MFFrame = MF.getFrameInfo();
315  const SystemZInstrInfo *ZII =
316    static_cast<const SystemZInstrInfo*>(MF.getTarget().getInstrInfo());
317  SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
318  MachineBasicBlock::iterator MBBI = MBB.begin();
319  MachineModuleInfo &MMI = MF.getMMI();
320  const MCRegisterInfo *MRI = MMI.getContext().getRegisterInfo();
321  const std::vector<CalleeSavedInfo> &CSI = MFFrame->getCalleeSavedInfo();
322  bool HasFP = hasFP(MF);
323  DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
324
325  // The current offset of the stack pointer from the CFA.
326  int64_t SPOffsetFromCFA = -SystemZMC::CFAOffsetFromInitialSP;
327
328  if (ZFI->getLowSavedGPR()) {
329    // Skip over the GPR saves.
330    if (MBBI != MBB.end() && MBBI->getOpcode() == SystemZ::STMG)
331      ++MBBI;
332    else
333      llvm_unreachable("Couldn't skip over GPR saves");
334
335    // Add CFI for the GPR saves.
336    MCSymbol *GPRSaveLabel = MMI.getContext().CreateTempSymbol();
337    BuildMI(MBB, MBBI, DL,
338            ZII->get(TargetOpcode::PROLOG_LABEL)).addSym(GPRSaveLabel);
339    for (std::vector<CalleeSavedInfo>::const_iterator
340           I = CSI.begin(), E = CSI.end(); I != E; ++I) {
341      unsigned Reg = I->getReg();
342      if (SystemZ::GR64BitRegClass.contains(Reg)) {
343        int64_t Offset = SPOffsetFromCFA + RegSpillOffsets[Reg];
344        MMI.addFrameInst(MCCFIInstruction::createOffset(
345            GPRSaveLabel, MRI->getDwarfRegNum(Reg, true), Offset));
346      }
347    }
348  }
349
350  uint64_t StackSize = getAllocatedStackSize(MF);
351  if (StackSize) {
352    // Allocate StackSize bytes.
353    int64_t Delta = -int64_t(StackSize);
354    emitIncrement(MBB, MBBI, DL, SystemZ::R15D, Delta, ZII);
355
356    // Add CFI for the allocation.
357    MCSymbol *AdjustSPLabel = MMI.getContext().CreateTempSymbol();
358    BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::PROLOG_LABEL))
359      .addSym(AdjustSPLabel);
360    MMI.addFrameInst(MCCFIInstruction::createDefCfaOffset(
361        AdjustSPLabel, SPOffsetFromCFA + Delta));
362    SPOffsetFromCFA += Delta;
363  }
364
365  if (HasFP) {
366    // Copy the base of the frame to R11.
367    BuildMI(MBB, MBBI, DL, ZII->get(SystemZ::LGR), SystemZ::R11D)
368      .addReg(SystemZ::R15D);
369
370    // Add CFI for the new frame location.
371    MCSymbol *SetFPLabel = MMI.getContext().CreateTempSymbol();
372    BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::PROLOG_LABEL))
373      .addSym(SetFPLabel);
374    unsigned HardFP = MRI->getDwarfRegNum(SystemZ::R11D, true);
375    MMI.addFrameInst(
376        MCCFIInstruction::createDefCfaRegister(SetFPLabel, HardFP));
377
378    // Mark the FramePtr as live at the beginning of every block except
379    // the entry block.  (We'll have marked R11 as live on entry when
380    // saving the GPRs.)
381    for (MachineFunction::iterator
382           I = llvm::next(MF.begin()), E = MF.end(); I != E; ++I)
383      I->addLiveIn(SystemZ::R11D);
384  }
385
386  // Skip over the FPR saves.
387  MCSymbol *FPRSaveLabel = 0;
388  for (std::vector<CalleeSavedInfo>::const_iterator
389         I = CSI.begin(), E = CSI.end(); I != E; ++I) {
390    unsigned Reg = I->getReg();
391    if (SystemZ::FP64BitRegClass.contains(Reg)) {
392      if (MBBI != MBB.end() &&
393          (MBBI->getOpcode() == SystemZ::STD ||
394           MBBI->getOpcode() == SystemZ::STDY))
395        ++MBBI;
396      else
397        llvm_unreachable("Couldn't skip over FPR save");
398
399      // Add CFI for the this save.
400      if (!FPRSaveLabel)
401        FPRSaveLabel = MMI.getContext().CreateTempSymbol();
402      unsigned Reg = MRI->getDwarfRegNum(I->getReg(), true);
403      int64_t Offset = getFrameIndexOffset(MF, I->getFrameIdx());
404      MMI.addFrameInst(MCCFIInstruction::createOffset(
405          FPRSaveLabel, Reg, SPOffsetFromCFA + Offset));
406    }
407  }
408  // Complete the CFI for the FPR saves, modelling them as taking effect
409  // after the last save.
410  if (FPRSaveLabel)
411    BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::PROLOG_LABEL))
412      .addSym(FPRSaveLabel);
413}
414
415void SystemZFrameLowering::emitEpilogue(MachineFunction &MF,
416                                        MachineBasicBlock &MBB) const {
417  MachineBasicBlock::iterator MBBI = MBB.getLastNonDebugInstr();
418  const SystemZInstrInfo *ZII =
419    static_cast<const SystemZInstrInfo*>(MF.getTarget().getInstrInfo());
420  SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
421
422  // Skip the return instruction.
423  assert(MBBI->isReturn() && "Can only insert epilogue into returning blocks");
424
425  uint64_t StackSize = getAllocatedStackSize(MF);
426  if (ZFI->getLowSavedGPR()) {
427    --MBBI;
428    unsigned Opcode = MBBI->getOpcode();
429    if (Opcode != SystemZ::LMG)
430      llvm_unreachable("Expected to see callee-save register restore code");
431
432    unsigned AddrOpNo = 2;
433    DebugLoc DL = MBBI->getDebugLoc();
434    uint64_t Offset = StackSize + MBBI->getOperand(AddrOpNo + 1).getImm();
435    unsigned NewOpcode = ZII->getOpcodeForOffset(Opcode, Offset);
436
437    // If the offset is too large, use the largest stack-aligned offset
438    // and add the rest to the base register (the stack or frame pointer).
439    if (!NewOpcode) {
440      uint64_t NumBytes = Offset - 0x7fff8;
441      emitIncrement(MBB, MBBI, DL, MBBI->getOperand(AddrOpNo).getReg(),
442                    NumBytes, ZII);
443      Offset -= NumBytes;
444      NewOpcode = ZII->getOpcodeForOffset(Opcode, Offset);
445      assert(NewOpcode && "No restore instruction available");
446    }
447
448    MBBI->setDesc(ZII->get(NewOpcode));
449    MBBI->getOperand(AddrOpNo + 1).ChangeToImmediate(Offset);
450  } else if (StackSize) {
451    DebugLoc DL = MBBI->getDebugLoc();
452    emitIncrement(MBB, MBBI, DL, SystemZ::R15D, StackSize, ZII);
453  }
454}
455
456bool SystemZFrameLowering::hasFP(const MachineFunction &MF) const {
457  return (MF.getTarget().Options.DisableFramePointerElim(MF) ||
458          MF.getFrameInfo()->hasVarSizedObjects() ||
459          MF.getInfo<SystemZMachineFunctionInfo>()->getManipulatesSP());
460}
461
462int SystemZFrameLowering::getFrameIndexOffset(const MachineFunction &MF,
463                                              int FI) const {
464  const MachineFrameInfo *MFFrame = MF.getFrameInfo();
465
466  // Start with the offset of FI from the top of the caller-allocated frame
467  // (i.e. the top of the 160 bytes allocated by the caller).  This initial
468  // offset is therefore negative.
469  int64_t Offset = (MFFrame->getObjectOffset(FI) +
470                    MFFrame->getOffsetAdjustment());
471
472  // Make the offset relative to the incoming stack pointer.
473  Offset -= getOffsetOfLocalArea();
474
475  // Make the offset relative to the bottom of the frame.
476  Offset += getAllocatedStackSize(MF);
477
478  return Offset;
479}
480
481uint64_t SystemZFrameLowering::
482getAllocatedStackSize(const MachineFunction &MF) const {
483  const MachineFrameInfo *MFFrame = MF.getFrameInfo();
484
485  // Start with the size of the local variables and spill slots.
486  uint64_t StackSize = MFFrame->getStackSize();
487
488  // We need to allocate the ABI-defined 160-byte base area whenever
489  // we allocate stack space for our own use and whenever we call another
490  // function.
491  if (StackSize || MFFrame->hasVarSizedObjects() || MFFrame->hasCalls())
492    StackSize += SystemZMC::CallFrameSize;
493
494  return StackSize;
495}
496
497bool
498SystemZFrameLowering::hasReservedCallFrame(const MachineFunction &MF) const {
499  // The ABI requires us to allocate 160 bytes of stack space for the callee,
500  // with any outgoing stack arguments being placed above that.  It seems
501  // better to make that area a permanent feature of the frame even if
502  // we're using a frame pointer.
503  return true;
504}
505
506void SystemZFrameLowering::
507eliminateCallFramePseudoInstr(MachineFunction &MF,
508                              MachineBasicBlock &MBB,
509                              MachineBasicBlock::iterator MI) const {
510  switch (MI->getOpcode()) {
511  case SystemZ::ADJCALLSTACKDOWN:
512  case SystemZ::ADJCALLSTACKUP:
513    assert(hasReservedCallFrame(MF) &&
514           "ADJSTACKDOWN and ADJSTACKUP should be no-ops");
515    MBB.erase(MI);
516    break;
517
518  default:
519    llvm_unreachable("Unexpected call frame instruction");
520  }
521}
522