Home | History | Annotate | Line # | Download | only in SystemZ
      1 //===-- SystemZFrameLowering.cpp - Frame lowering for SystemZ -------------===//
      2 //
      3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
      4 // See https://llvm.org/LICENSE.txt for license information.
      5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
      6 //
      7 //===----------------------------------------------------------------------===//
      8 
      9 #include "SystemZFrameLowering.h"
     10 #include "SystemZCallingConv.h"
     11 #include "SystemZInstrBuilder.h"
     12 #include "SystemZInstrInfo.h"
     13 #include "SystemZMachineFunctionInfo.h"
     14 #include "SystemZRegisterInfo.h"
     15 #include "SystemZSubtarget.h"
     16 #include "llvm/CodeGen/MachineModuleInfo.h"
     17 #include "llvm/CodeGen/MachineRegisterInfo.h"
     18 #include "llvm/CodeGen/RegisterScavenging.h"
     19 #include "llvm/IR/Function.h"
     20 #include "llvm/Target/TargetMachine.h"
     21 
     22 using namespace llvm;
     23 
     24 namespace {
     25 // The ABI-defined register save slots, relative to the CFA (i.e.
     26 // incoming stack pointer + SystemZMC::ELFCallFrameSize).
     27 static const TargetFrameLowering::SpillSlot SpillOffsetTable[] = {
     28   { SystemZ::R2D,  0x10 },
     29   { SystemZ::R3D,  0x18 },
     30   { SystemZ::R4D,  0x20 },
     31   { SystemZ::R5D,  0x28 },
     32   { SystemZ::R6D,  0x30 },
     33   { SystemZ::R7D,  0x38 },
     34   { SystemZ::R8D,  0x40 },
     35   { SystemZ::R9D,  0x48 },
     36   { SystemZ::R10D, 0x50 },
     37   { SystemZ::R11D, 0x58 },
     38   { SystemZ::R12D, 0x60 },
     39   { SystemZ::R13D, 0x68 },
     40   { SystemZ::R14D, 0x70 },
     41   { SystemZ::R15D, 0x78 },
     42   { SystemZ::F0D,  0x80 },
     43   { SystemZ::F2D,  0x88 },
     44   { SystemZ::F4D,  0x90 },
     45   { SystemZ::F6D,  0x98 }
     46 };
     47 } // end anonymous namespace
     48 
     49 SystemZFrameLowering::SystemZFrameLowering()
     50     : TargetFrameLowering(TargetFrameLowering::StackGrowsDown, Align(8),
     51                           0, Align(8), false /* StackRealignable */),
     52       RegSpillOffsets(0) {
     53   // Due to the SystemZ ABI, the DWARF CFA (Canonical Frame Address) is not
     54   // equal to the incoming stack pointer, but to incoming stack pointer plus
     55   // 160.  Instead of using a Local Area Offset, the Register save area will
     56   // be occupied by fixed frame objects, and all offsets are actually
     57   // relative to CFA.
     58 
     59   // Create a mapping from register number to save slot offset.
     60   // These offsets are relative to the start of the register save area.
     61   RegSpillOffsets.grow(SystemZ::NUM_TARGET_REGS);
     62   for (unsigned I = 0, E = array_lengthof(SpillOffsetTable); I != E; ++I)
     63     RegSpillOffsets[SpillOffsetTable[I].Reg] = SpillOffsetTable[I].Offset;
     64 }
     65 
     66 bool SystemZFrameLowering::
     67 assignCalleeSavedSpillSlots(MachineFunction &MF,
     68                             const TargetRegisterInfo *TRI,
     69                             std::vector<CalleeSavedInfo> &CSI) const {
     70   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
     71   MachineFrameInfo &MFFrame = MF.getFrameInfo();
     72   bool IsVarArg = MF.getFunction().isVarArg();
     73   if (CSI.empty())
     74     return true; // Early exit if no callee saved registers are modified!
     75 
     76   unsigned LowGPR = 0;
     77   unsigned HighGPR = SystemZ::R15D;
     78   int StartSPOffset = SystemZMC::ELFCallFrameSize;
     79   for (auto &CS : CSI) {
     80     unsigned Reg = CS.getReg();
     81     int Offset = getRegSpillOffset(MF, Reg);
     82     if (Offset) {
     83       if (SystemZ::GR64BitRegClass.contains(Reg) && StartSPOffset > Offset) {
     84         LowGPR = Reg;
     85         StartSPOffset = Offset;
     86       }
     87       Offset -= SystemZMC::ELFCallFrameSize;
     88       int FrameIdx = MFFrame.CreateFixedSpillStackObject(8, Offset);
     89       CS.setFrameIdx(FrameIdx);
     90     } else
     91       CS.setFrameIdx(INT32_MAX);
     92   }
     93 
     94   // Save the range of call-saved registers, for use by the
     95   // prologue/epilogue inserters.
     96   ZFI->setRestoreGPRRegs(LowGPR, HighGPR, StartSPOffset);
     97   if (IsVarArg) {
     98     // Also save the GPR varargs, if any.  R6D is call-saved, so would
     99     // already be included, but we also need to handle the call-clobbered
    100     // argument registers.
    101     unsigned FirstGPR = ZFI->getVarArgsFirstGPR();
    102     if (FirstGPR < SystemZ::ELFNumArgGPRs) {
    103       unsigned Reg = SystemZ::ELFArgGPRs[FirstGPR];
    104       int Offset = getRegSpillOffset(MF, Reg);
    105       if (StartSPOffset > Offset) {
    106         LowGPR = Reg; StartSPOffset = Offset;
    107       }
    108     }
    109   }
    110   ZFI->setSpillGPRRegs(LowGPR, HighGPR, StartSPOffset);
    111 
    112   // Create fixed stack objects for the remaining registers.
    113   int CurrOffset = -SystemZMC::ELFCallFrameSize;
    114   if (usePackedStack(MF))
    115     CurrOffset += StartSPOffset;
    116 
    117   for (auto &CS : CSI) {
    118     if (CS.getFrameIdx() != INT32_MAX)
    119       continue;
    120     unsigned Reg = CS.getReg();
    121     const TargetRegisterClass *RC = TRI->getMinimalPhysRegClass(Reg);
    122     unsigned Size = TRI->getSpillSize(*RC);
    123     CurrOffset -= Size;
    124     assert(CurrOffset % 8 == 0 &&
    125            "8-byte alignment required for for all register save slots");
    126     int FrameIdx = MFFrame.CreateFixedSpillStackObject(Size, CurrOffset);
    127     CS.setFrameIdx(FrameIdx);
    128   }
    129 
    130   return true;
    131 }
    132 
    133 void SystemZFrameLowering::determineCalleeSaves(MachineFunction &MF,
    134                                                 BitVector &SavedRegs,
    135                                                 RegScavenger *RS) const {
    136   TargetFrameLowering::determineCalleeSaves(MF, SavedRegs, RS);
    137 
    138   MachineFrameInfo &MFFrame = MF.getFrameInfo();
    139   const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
    140   bool HasFP = hasFP(MF);
    141   SystemZMachineFunctionInfo *MFI = MF.getInfo<SystemZMachineFunctionInfo>();
    142   bool IsVarArg = MF.getFunction().isVarArg();
    143 
    144   // va_start stores incoming FPR varargs in the normal way, but delegates
    145   // the saving of incoming GPR varargs to spillCalleeSavedRegisters().
    146   // Record these pending uses, which typically include the call-saved
    147   // argument register R6D.
    148   if (IsVarArg)
    149     for (unsigned I = MFI->getVarArgsFirstGPR(); I < SystemZ::ELFNumArgGPRs; ++I)
    150       SavedRegs.set(SystemZ::ELFArgGPRs[I]);
    151 
    152   // If there are any landing pads, entering them will modify r6/r7.
    153   if (!MF.getLandingPads().empty()) {
    154     SavedRegs.set(SystemZ::R6D);
    155     SavedRegs.set(SystemZ::R7D);
    156   }
    157 
    158   // If the function requires a frame pointer, record that the hard
    159   // frame pointer will be clobbered.
    160   if (HasFP)
    161     SavedRegs.set(SystemZ::R11D);
    162 
    163   // If the function calls other functions, record that the return
    164   // address register will be clobbered.
    165   if (MFFrame.hasCalls())
    166     SavedRegs.set(SystemZ::R14D);
    167 
    168   // If we are saving GPRs other than the stack pointer, we might as well
    169   // save and restore the stack pointer at the same time, via STMG and LMG.
    170   // This allows the deallocation to be done by the LMG, rather than needing
    171   // a separate %r15 addition.
    172   const MCPhysReg *CSRegs = TRI->getCalleeSavedRegs(&MF);
    173   for (unsigned I = 0; CSRegs[I]; ++I) {
    174     unsigned Reg = CSRegs[I];
    175     if (SystemZ::GR64BitRegClass.contains(Reg) && SavedRegs.test(Reg)) {
    176       SavedRegs.set(SystemZ::R15D);
    177       break;
    178     }
    179   }
    180 }
    181 
    182 // Add GPR64 to the save instruction being built by MIB, which is in basic
    183 // block MBB.  IsImplicit says whether this is an explicit operand to the
    184 // instruction, or an implicit one that comes between the explicit start
    185 // and end registers.
    186 static void addSavedGPR(MachineBasicBlock &MBB, MachineInstrBuilder &MIB,
    187                         unsigned GPR64, bool IsImplicit) {
    188   const TargetRegisterInfo *RI =
    189       MBB.getParent()->getSubtarget().getRegisterInfo();
    190   Register GPR32 = RI->getSubReg(GPR64, SystemZ::subreg_l32);
    191   bool IsLive = MBB.isLiveIn(GPR64) || MBB.isLiveIn(GPR32);
    192   if (!IsLive || !IsImplicit) {
    193     MIB.addReg(GPR64, getImplRegState(IsImplicit) | getKillRegState(!IsLive));
    194     if (!IsLive)
    195       MBB.addLiveIn(GPR64);
    196   }
    197 }
    198 
    199 bool SystemZFrameLowering::spillCalleeSavedRegisters(
    200     MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI,
    201     ArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const {
    202   if (CSI.empty())
    203     return false;
    204 
    205   MachineFunction &MF = *MBB.getParent();
    206   const TargetInstrInfo *TII = MF.getSubtarget().getInstrInfo();
    207   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
    208   bool IsVarArg = MF.getFunction().isVarArg();
    209   DebugLoc DL;
    210 
    211   // Save GPRs
    212   SystemZ::GPRRegs SpillGPRs = ZFI->getSpillGPRRegs();
    213   if (SpillGPRs.LowGPR) {
    214     assert(SpillGPRs.LowGPR != SpillGPRs.HighGPR &&
    215            "Should be saving %r15 and something else");
    216 
    217     // Build an STMG instruction.
    218     MachineInstrBuilder MIB = BuildMI(MBB, MBBI, DL, TII->get(SystemZ::STMG));
    219 
    220     // Add the explicit register operands.
    221     addSavedGPR(MBB, MIB, SpillGPRs.LowGPR, false);
    222     addSavedGPR(MBB, MIB, SpillGPRs.HighGPR, false);
    223 
    224     // Add the address.
    225     MIB.addReg(SystemZ::R15D).addImm(SpillGPRs.GPROffset);
    226 
    227     // Make sure all call-saved GPRs are included as operands and are
    228     // marked as live on entry.
    229     for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
    230       unsigned Reg = CSI[I].getReg();
    231       if (SystemZ::GR64BitRegClass.contains(Reg))
    232         addSavedGPR(MBB, MIB, Reg, true);
    233     }
    234 
    235     // ...likewise GPR varargs.
    236     if (IsVarArg)
    237       for (unsigned I = ZFI->getVarArgsFirstGPR(); I < SystemZ::ELFNumArgGPRs; ++I)
    238         addSavedGPR(MBB, MIB, SystemZ::ELFArgGPRs[I], true);
    239   }
    240 
    241   // Save FPRs/VRs in the normal TargetInstrInfo way.
    242   for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
    243     unsigned Reg = CSI[I].getReg();
    244     if (SystemZ::FP64BitRegClass.contains(Reg)) {
    245       MBB.addLiveIn(Reg);
    246       TII->storeRegToStackSlot(MBB, MBBI, Reg, true, CSI[I].getFrameIdx(),
    247                                &SystemZ::FP64BitRegClass, TRI);
    248     }
    249     if (SystemZ::VR128BitRegClass.contains(Reg)) {
    250       MBB.addLiveIn(Reg);
    251       TII->storeRegToStackSlot(MBB, MBBI, Reg, true, CSI[I].getFrameIdx(),
    252                                &SystemZ::VR128BitRegClass, TRI);
    253     }
    254   }
    255 
    256   return true;
    257 }
    258 
    259 bool SystemZFrameLowering::restoreCalleeSavedRegisters(
    260     MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI,
    261     MutableArrayRef<CalleeSavedInfo> CSI, const TargetRegisterInfo *TRI) const {
    262   if (CSI.empty())
    263     return false;
    264 
    265   MachineFunction &MF = *MBB.getParent();
    266   const TargetInstrInfo *TII = MF.getSubtarget().getInstrInfo();
    267   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
    268   bool HasFP = hasFP(MF);
    269   DebugLoc DL = MBBI != MBB.end() ? MBBI->getDebugLoc() : DebugLoc();
    270 
    271   // Restore FPRs/VRs in the normal TargetInstrInfo way.
    272   for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
    273     unsigned Reg = CSI[I].getReg();
    274     if (SystemZ::FP64BitRegClass.contains(Reg))
    275       TII->loadRegFromStackSlot(MBB, MBBI, Reg, CSI[I].getFrameIdx(),
    276                                 &SystemZ::FP64BitRegClass, TRI);
    277     if (SystemZ::VR128BitRegClass.contains(Reg))
    278       TII->loadRegFromStackSlot(MBB, MBBI, Reg, CSI[I].getFrameIdx(),
    279                                 &SystemZ::VR128BitRegClass, TRI);
    280   }
    281 
    282   // Restore call-saved GPRs (but not call-clobbered varargs, which at
    283   // this point might hold return values).
    284   SystemZ::GPRRegs RestoreGPRs = ZFI->getRestoreGPRRegs();
    285   if (RestoreGPRs.LowGPR) {
    286     // If we saved any of %r2-%r5 as varargs, we should also be saving
    287     // and restoring %r6.  If we're saving %r6 or above, we should be
    288     // restoring it too.
    289     assert(RestoreGPRs.LowGPR != RestoreGPRs.HighGPR &&
    290            "Should be loading %r15 and something else");
    291 
    292     // Build an LMG instruction.
    293     MachineInstrBuilder MIB = BuildMI(MBB, MBBI, DL, TII->get(SystemZ::LMG));
    294 
    295     // Add the explicit register operands.
    296     MIB.addReg(RestoreGPRs.LowGPR, RegState::Define);
    297     MIB.addReg(RestoreGPRs.HighGPR, RegState::Define);
    298 
    299     // Add the address.
    300     MIB.addReg(HasFP ? SystemZ::R11D : SystemZ::R15D);
    301     MIB.addImm(RestoreGPRs.GPROffset);
    302 
    303     // Do a second scan adding regs as being defined by instruction
    304     for (unsigned I = 0, E = CSI.size(); I != E; ++I) {
    305       unsigned Reg = CSI[I].getReg();
    306       if (Reg != RestoreGPRs.LowGPR && Reg != RestoreGPRs.HighGPR &&
    307           SystemZ::GR64BitRegClass.contains(Reg))
    308         MIB.addReg(Reg, RegState::ImplicitDefine);
    309     }
    310   }
    311 
    312   return true;
    313 }
    314 
    315 void SystemZFrameLowering::
    316 processFunctionBeforeFrameFinalized(MachineFunction &MF,
    317                                     RegScavenger *RS) const {
    318   MachineFrameInfo &MFFrame = MF.getFrameInfo();
    319   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
    320   MachineRegisterInfo *MRI = &MF.getRegInfo();
    321   bool BackChain = MF.getFunction().hasFnAttribute("backchain");
    322 
    323   if (!usePackedStack(MF) || BackChain)
    324     // Create the incoming register save area.
    325     getOrCreateFramePointerSaveIndex(MF);
    326 
    327   // Get the size of our stack frame to be allocated ...
    328   uint64_t StackSize = (MFFrame.estimateStackSize(MF) +
    329                         SystemZMC::ELFCallFrameSize);
    330   // ... and the maximum offset we may need to reach into the
    331   // caller's frame to access the save area or stack arguments.
    332   int64_t MaxArgOffset = 0;
    333   for (int I = MFFrame.getObjectIndexBegin(); I != 0; ++I)
    334     if (MFFrame.getObjectOffset(I) >= 0) {
    335       int64_t ArgOffset = MFFrame.getObjectOffset(I) +
    336                           MFFrame.getObjectSize(I);
    337       MaxArgOffset = std::max(MaxArgOffset, ArgOffset);
    338     }
    339 
    340   uint64_t MaxReach = StackSize + MaxArgOffset;
    341   if (!isUInt<12>(MaxReach)) {
    342     // We may need register scavenging slots if some parts of the frame
    343     // are outside the reach of an unsigned 12-bit displacement.
    344     // Create 2 for the case where both addresses in an MVC are
    345     // out of range.
    346     RS->addScavengingFrameIndex(MFFrame.CreateStackObject(8, Align(8), false));
    347     RS->addScavengingFrameIndex(MFFrame.CreateStackObject(8, Align(8), false));
    348   }
    349 
    350   // If R6 is used as an argument register it is still callee saved. If it in
    351   // this case is not clobbered (and restored) it should never be marked as
    352   // killed.
    353   if (MF.front().isLiveIn(SystemZ::R6D) &&
    354       ZFI->getRestoreGPRRegs().LowGPR != SystemZ::R6D)
    355     for (auto &MO : MRI->use_nodbg_operands(SystemZ::R6D))
    356       MO.setIsKill(false);
    357 }
    358 
    359 // Emit instructions before MBBI (in MBB) to add NumBytes to Reg.
    360 static void emitIncrement(MachineBasicBlock &MBB,
    361                           MachineBasicBlock::iterator &MBBI, const DebugLoc &DL,
    362                           Register Reg, int64_t NumBytes,
    363                           const TargetInstrInfo *TII) {
    364   while (NumBytes) {
    365     unsigned Opcode;
    366     int64_t ThisVal = NumBytes;
    367     if (isInt<16>(NumBytes))
    368       Opcode = SystemZ::AGHI;
    369     else {
    370       Opcode = SystemZ::AGFI;
    371       // Make sure we maintain 8-byte stack alignment.
    372       int64_t MinVal = -uint64_t(1) << 31;
    373       int64_t MaxVal = (int64_t(1) << 31) - 8;
    374       if (ThisVal < MinVal)
    375         ThisVal = MinVal;
    376       else if (ThisVal > MaxVal)
    377         ThisVal = MaxVal;
    378     }
    379     MachineInstr *MI = BuildMI(MBB, MBBI, DL, TII->get(Opcode), Reg)
    380       .addReg(Reg).addImm(ThisVal);
    381     // The CC implicit def is dead.
    382     MI->getOperand(3).setIsDead();
    383     NumBytes -= ThisVal;
    384   }
    385 }
    386 
    387 // Add CFI for the new CFA offset.
    388 static void buildCFAOffs(MachineBasicBlock &MBB,
    389                          MachineBasicBlock::iterator MBBI,
    390                          const DebugLoc &DL, int Offset,
    391                          const SystemZInstrInfo *ZII) {
    392   unsigned CFIIndex = MBB.getParent()->addFrameInst(
    393     MCCFIInstruction::cfiDefCfaOffset(nullptr, -Offset));
    394   BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::CFI_INSTRUCTION))
    395     .addCFIIndex(CFIIndex);
    396 }
    397 
    398 // Add CFI for the new frame location.
    399 static void buildDefCFAReg(MachineBasicBlock &MBB,
    400                            MachineBasicBlock::iterator MBBI,
    401                            const DebugLoc &DL, unsigned Reg,
    402                            const SystemZInstrInfo *ZII) {
    403   MachineFunction &MF = *MBB.getParent();
    404   MachineModuleInfo &MMI = MF.getMMI();
    405   const MCRegisterInfo *MRI = MMI.getContext().getRegisterInfo();
    406   unsigned RegNum = MRI->getDwarfRegNum(Reg, true);
    407   unsigned CFIIndex = MF.addFrameInst(
    408                         MCCFIInstruction::createDefCfaRegister(nullptr, RegNum));
    409   BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::CFI_INSTRUCTION))
    410     .addCFIIndex(CFIIndex);
    411 }
    412 
    413 void SystemZFrameLowering::emitPrologue(MachineFunction &MF,
    414                                         MachineBasicBlock &MBB) const {
    415   assert(&MF.front() == &MBB && "Shrink-wrapping not yet supported");
    416   const SystemZSubtarget &STI = MF.getSubtarget<SystemZSubtarget>();
    417   const SystemZTargetLowering &TLI = *STI.getTargetLowering();
    418   MachineFrameInfo &MFFrame = MF.getFrameInfo();
    419   auto *ZII = static_cast<const SystemZInstrInfo *>(STI.getInstrInfo());
    420   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
    421   MachineBasicBlock::iterator MBBI = MBB.begin();
    422   MachineModuleInfo &MMI = MF.getMMI();
    423   const MCRegisterInfo *MRI = MMI.getContext().getRegisterInfo();
    424   const std::vector<CalleeSavedInfo> &CSI = MFFrame.getCalleeSavedInfo();
    425   bool HasFP = hasFP(MF);
    426 
    427   // In GHC calling convention C stack space, including the ABI-defined
    428   // 160-byte base area, is (de)allocated by GHC itself.  This stack space may
    429   // be used by LLVM as spill slots for the tail recursive GHC functions.  Thus
    430   // do not allocate stack space here, too.
    431   if (MF.getFunction().getCallingConv() == CallingConv::GHC) {
    432     if (MFFrame.getStackSize() > 2048 * sizeof(long)) {
    433       report_fatal_error(
    434           "Pre allocated stack space for GHC function is too small");
    435     }
    436     if (HasFP) {
    437       report_fatal_error(
    438           "In GHC calling convention a frame pointer is not supported");
    439     }
    440     MFFrame.setStackSize(MFFrame.getStackSize() + SystemZMC::ELFCallFrameSize);
    441     return;
    442   }
    443 
    444   // Debug location must be unknown since the first debug location is used
    445   // to determine the end of the prologue.
    446   DebugLoc DL;
    447 
    448   // The current offset of the stack pointer from the CFA.
    449   int64_t SPOffsetFromCFA = -SystemZMC::ELFCFAOffsetFromInitialSP;
    450 
    451   if (ZFI->getSpillGPRRegs().LowGPR) {
    452     // Skip over the GPR saves.
    453     if (MBBI != MBB.end() && MBBI->getOpcode() == SystemZ::STMG)
    454       ++MBBI;
    455     else
    456       llvm_unreachable("Couldn't skip over GPR saves");
    457 
    458     // Add CFI for the GPR saves.
    459     for (auto &Save : CSI) {
    460       unsigned Reg = Save.getReg();
    461       if (SystemZ::GR64BitRegClass.contains(Reg)) {
    462         int FI = Save.getFrameIdx();
    463         int64_t Offset = MFFrame.getObjectOffset(FI);
    464         unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createOffset(
    465             nullptr, MRI->getDwarfRegNum(Reg, true), Offset));
    466         BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::CFI_INSTRUCTION))
    467             .addCFIIndex(CFIIndex);
    468       }
    469     }
    470   }
    471 
    472   uint64_t StackSize = MFFrame.getStackSize();
    473   // We need to allocate the ABI-defined 160-byte base area whenever
    474   // we allocate stack space for our own use and whenever we call another
    475   // function.
    476   bool HasStackObject = false;
    477   for (unsigned i = 0, e = MFFrame.getObjectIndexEnd(); i != e; ++i)
    478     if (!MFFrame.isDeadObjectIndex(i)) {
    479       HasStackObject = true;
    480       break;
    481     }
    482   if (HasStackObject || MFFrame.hasCalls())
    483     StackSize += SystemZMC::ELFCallFrameSize;
    484   // Don't allocate the incoming reg save area.
    485   StackSize = StackSize > SystemZMC::ELFCallFrameSize
    486                   ? StackSize - SystemZMC::ELFCallFrameSize
    487                   : 0;
    488   MFFrame.setStackSize(StackSize);
    489 
    490   if (StackSize) {
    491     // Allocate StackSize bytes.
    492     int64_t Delta = -int64_t(StackSize);
    493     const unsigned ProbeSize = TLI.getStackProbeSize(MF);
    494     bool FreeProbe = (ZFI->getSpillGPRRegs().GPROffset &&
    495            (ZFI->getSpillGPRRegs().GPROffset + StackSize) < ProbeSize);
    496     if (!FreeProbe &&
    497         MF.getSubtarget().getTargetLowering()->hasInlineStackProbe(MF)) {
    498       // Stack probing may involve looping, but splitting the prologue block
    499       // is not possible at this point since it would invalidate the
    500       // SaveBlocks / RestoreBlocks sets of PEI in the single block function
    501       // case. Build a pseudo to be handled later by inlineStackProbe().
    502       BuildMI(MBB, MBBI, DL, ZII->get(SystemZ::PROBED_STACKALLOC))
    503         .addImm(StackSize);
    504     }
    505     else {
    506       bool StoreBackchain = MF.getFunction().hasFnAttribute("backchain");
    507       // If we need backchain, save current stack pointer.  R1 is free at
    508       // this point.
    509       if (StoreBackchain)
    510         BuildMI(MBB, MBBI, DL, ZII->get(SystemZ::LGR))
    511           .addReg(SystemZ::R1D, RegState::Define).addReg(SystemZ::R15D);
    512       emitIncrement(MBB, MBBI, DL, SystemZ::R15D, Delta, ZII);
    513       buildCFAOffs(MBB, MBBI, DL, SPOffsetFromCFA + Delta, ZII);
    514       if (StoreBackchain)
    515         BuildMI(MBB, MBBI, DL, ZII->get(SystemZ::STG))
    516           .addReg(SystemZ::R1D, RegState::Kill).addReg(SystemZ::R15D)
    517           .addImm(getBackchainOffset(MF)).addReg(0);
    518     }
    519     SPOffsetFromCFA += Delta;
    520   }
    521 
    522   if (HasFP) {
    523     // Copy the base of the frame to R11.
    524     BuildMI(MBB, MBBI, DL, ZII->get(SystemZ::LGR), SystemZ::R11D)
    525       .addReg(SystemZ::R15D);
    526 
    527     // Add CFI for the new frame location.
    528     buildDefCFAReg(MBB, MBBI, DL, SystemZ::R11D, ZII);
    529 
    530     // Mark the FramePtr as live at the beginning of every block except
    531     // the entry block.  (We'll have marked R11 as live on entry when
    532     // saving the GPRs.)
    533     for (auto I = std::next(MF.begin()), E = MF.end(); I != E; ++I)
    534       I->addLiveIn(SystemZ::R11D);
    535   }
    536 
    537   // Skip over the FPR/VR saves.
    538   SmallVector<unsigned, 8> CFIIndexes;
    539   for (auto &Save : CSI) {
    540     unsigned Reg = Save.getReg();
    541     if (SystemZ::FP64BitRegClass.contains(Reg)) {
    542       if (MBBI != MBB.end() &&
    543           (MBBI->getOpcode() == SystemZ::STD ||
    544            MBBI->getOpcode() == SystemZ::STDY))
    545         ++MBBI;
    546       else
    547         llvm_unreachable("Couldn't skip over FPR save");
    548     } else if (SystemZ::VR128BitRegClass.contains(Reg)) {
    549       if (MBBI != MBB.end() &&
    550           MBBI->getOpcode() == SystemZ::VST)
    551         ++MBBI;
    552       else
    553         llvm_unreachable("Couldn't skip over VR save");
    554     } else
    555       continue;
    556 
    557     // Add CFI for the this save.
    558     unsigned DwarfReg = MRI->getDwarfRegNum(Reg, true);
    559     Register IgnoredFrameReg;
    560     int64_t Offset =
    561         getFrameIndexReference(MF, Save.getFrameIdx(), IgnoredFrameReg)
    562             .getFixed();
    563 
    564     unsigned CFIIndex = MF.addFrameInst(MCCFIInstruction::createOffset(
    565           nullptr, DwarfReg, SPOffsetFromCFA + Offset));
    566     CFIIndexes.push_back(CFIIndex);
    567   }
    568   // Complete the CFI for the FPR/VR saves, modelling them as taking effect
    569   // after the last save.
    570   for (auto CFIIndex : CFIIndexes) {
    571     BuildMI(MBB, MBBI, DL, ZII->get(TargetOpcode::CFI_INSTRUCTION))
    572         .addCFIIndex(CFIIndex);
    573   }
    574 }
    575 
    576 void SystemZFrameLowering::emitEpilogue(MachineFunction &MF,
    577                                         MachineBasicBlock &MBB) const {
    578   MachineBasicBlock::iterator MBBI = MBB.getLastNonDebugInstr();
    579   auto *ZII =
    580       static_cast<const SystemZInstrInfo *>(MF.getSubtarget().getInstrInfo());
    581   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
    582   MachineFrameInfo &MFFrame = MF.getFrameInfo();
    583 
    584   // See SystemZFrameLowering::emitPrologue
    585   if (MF.getFunction().getCallingConv() == CallingConv::GHC)
    586     return;
    587 
    588   // Skip the return instruction.
    589   assert(MBBI->isReturn() && "Can only insert epilogue into returning blocks");
    590 
    591   uint64_t StackSize = MFFrame.getStackSize();
    592   if (ZFI->getRestoreGPRRegs().LowGPR) {
    593     --MBBI;
    594     unsigned Opcode = MBBI->getOpcode();
    595     if (Opcode != SystemZ::LMG)
    596       llvm_unreachable("Expected to see callee-save register restore code");
    597 
    598     unsigned AddrOpNo = 2;
    599     DebugLoc DL = MBBI->getDebugLoc();
    600     uint64_t Offset = StackSize + MBBI->getOperand(AddrOpNo + 1).getImm();
    601     unsigned NewOpcode = ZII->getOpcodeForOffset(Opcode, Offset);
    602 
    603     // If the offset is too large, use the largest stack-aligned offset
    604     // and add the rest to the base register (the stack or frame pointer).
    605     if (!NewOpcode) {
    606       uint64_t NumBytes = Offset - 0x7fff8;
    607       emitIncrement(MBB, MBBI, DL, MBBI->getOperand(AddrOpNo).getReg(),
    608                     NumBytes, ZII);
    609       Offset -= NumBytes;
    610       NewOpcode = ZII->getOpcodeForOffset(Opcode, Offset);
    611       assert(NewOpcode && "No restore instruction available");
    612     }
    613 
    614     MBBI->setDesc(ZII->get(NewOpcode));
    615     MBBI->getOperand(AddrOpNo + 1).ChangeToImmediate(Offset);
    616   } else if (StackSize) {
    617     DebugLoc DL = MBBI->getDebugLoc();
    618     emitIncrement(MBB, MBBI, DL, SystemZ::R15D, StackSize, ZII);
    619   }
    620 }
    621 
    622 void SystemZFrameLowering::inlineStackProbe(MachineFunction &MF,
    623                                             MachineBasicBlock &PrologMBB) const {
    624   auto *ZII =
    625     static_cast<const SystemZInstrInfo *>(MF.getSubtarget().getInstrInfo());
    626   const SystemZSubtarget &STI = MF.getSubtarget<SystemZSubtarget>();
    627   const SystemZTargetLowering &TLI = *STI.getTargetLowering();
    628 
    629   MachineInstr *StackAllocMI = nullptr;
    630   for (MachineInstr &MI : PrologMBB)
    631     if (MI.getOpcode() == SystemZ::PROBED_STACKALLOC) {
    632       StackAllocMI = &MI;
    633       break;
    634     }
    635   if (StackAllocMI == nullptr)
    636     return;
    637   uint64_t StackSize = StackAllocMI->getOperand(0).getImm();
    638   const unsigned ProbeSize = TLI.getStackProbeSize(MF);
    639   uint64_t NumFullBlocks = StackSize / ProbeSize;
    640   uint64_t Residual = StackSize % ProbeSize;
    641   int64_t SPOffsetFromCFA = -SystemZMC::ELFCFAOffsetFromInitialSP;
    642   MachineBasicBlock *MBB = &PrologMBB;
    643   MachineBasicBlock::iterator MBBI = StackAllocMI;
    644   const DebugLoc DL = StackAllocMI->getDebugLoc();
    645 
    646   // Allocate a block of Size bytes on the stack and probe it.
    647   auto allocateAndProbe = [&](MachineBasicBlock &InsMBB,
    648                               MachineBasicBlock::iterator InsPt, unsigned Size,
    649                               bool EmitCFI) -> void {
    650     emitIncrement(InsMBB, InsPt, DL, SystemZ::R15D, -int64_t(Size), ZII);
    651     if (EmitCFI) {
    652       SPOffsetFromCFA -= Size;
    653       buildCFAOffs(InsMBB, InsPt, DL, SPOffsetFromCFA, ZII);
    654     }
    655     // Probe by means of a volatile compare.
    656     MachineMemOperand *MMO = MF.getMachineMemOperand(MachinePointerInfo(),
    657       MachineMemOperand::MOVolatile | MachineMemOperand::MOLoad, 8, Align(1));
    658     BuildMI(InsMBB, InsPt, DL, ZII->get(SystemZ::CG))
    659       .addReg(SystemZ::R0D, RegState::Undef)
    660       .addReg(SystemZ::R15D).addImm(Size - 8).addReg(0)
    661       .addMemOperand(MMO);
    662   };
    663 
    664   bool StoreBackchain = MF.getFunction().hasFnAttribute("backchain");
    665   if (StoreBackchain)
    666     BuildMI(*MBB, MBBI, DL, ZII->get(SystemZ::LGR))
    667       .addReg(SystemZ::R1D, RegState::Define).addReg(SystemZ::R15D);
    668 
    669   MachineBasicBlock *DoneMBB = nullptr;
    670   MachineBasicBlock *LoopMBB = nullptr;
    671   if (NumFullBlocks < 3) {
    672     // Emit unrolled probe statements.
    673     for (unsigned int i = 0; i < NumFullBlocks; i++)
    674       allocateAndProbe(*MBB, MBBI, ProbeSize, true/*EmitCFI*/);
    675   } else {
    676     // Emit a loop probing the pages.
    677     uint64_t LoopAlloc = ProbeSize * NumFullBlocks;
    678     SPOffsetFromCFA -= LoopAlloc;
    679 
    680     // Use R0D to hold the exit value.
    681     BuildMI(*MBB, MBBI, DL, ZII->get(SystemZ::LGR), SystemZ::R0D)
    682       .addReg(SystemZ::R15D);
    683     buildDefCFAReg(*MBB, MBBI, DL, SystemZ::R0D, ZII);
    684     emitIncrement(*MBB, MBBI, DL, SystemZ::R0D, -int64_t(LoopAlloc), ZII);
    685     buildCFAOffs(*MBB, MBBI, DL, -int64_t(SystemZMC::ELFCallFrameSize + LoopAlloc),
    686                  ZII);
    687 
    688     DoneMBB = SystemZ::splitBlockBefore(MBBI, MBB);
    689     LoopMBB = SystemZ::emitBlockAfter(MBB);
    690     MBB->addSuccessor(LoopMBB);
    691     LoopMBB->addSuccessor(LoopMBB);
    692     LoopMBB->addSuccessor(DoneMBB);
    693 
    694     MBB = LoopMBB;
    695     allocateAndProbe(*MBB, MBB->end(), ProbeSize, false/*EmitCFI*/);
    696     BuildMI(*MBB, MBB->end(), DL, ZII->get(SystemZ::CLGR))
    697       .addReg(SystemZ::R15D).addReg(SystemZ::R0D);
    698     BuildMI(*MBB, MBB->end(), DL, ZII->get(SystemZ::BRC))
    699       .addImm(SystemZ::CCMASK_ICMP).addImm(SystemZ::CCMASK_CMP_GT).addMBB(MBB);
    700 
    701     MBB = DoneMBB;
    702     MBBI = DoneMBB->begin();
    703     buildDefCFAReg(*MBB, MBBI, DL, SystemZ::R15D, ZII);
    704   }
    705 
    706   if (Residual)
    707     allocateAndProbe(*MBB, MBBI, Residual, true/*EmitCFI*/);
    708 
    709   if (StoreBackchain)
    710     BuildMI(*MBB, MBBI, DL, ZII->get(SystemZ::STG))
    711       .addReg(SystemZ::R1D, RegState::Kill).addReg(SystemZ::R15D)
    712       .addImm(getBackchainOffset(MF)).addReg(0);
    713 
    714   StackAllocMI->eraseFromParent();
    715   if (DoneMBB != nullptr) {
    716     // Compute the live-in lists for the new blocks.
    717     recomputeLiveIns(*DoneMBB);
    718     recomputeLiveIns(*LoopMBB);
    719   }
    720 }
    721 
    722 bool SystemZFrameLowering::hasFP(const MachineFunction &MF) const {
    723   return (MF.getTarget().Options.DisableFramePointerElim(MF) ||
    724           MF.getFrameInfo().hasVarSizedObjects() ||
    725           MF.getInfo<SystemZMachineFunctionInfo>()->getManipulatesSP());
    726 }
    727 
    728 bool
    729 SystemZFrameLowering::hasReservedCallFrame(const MachineFunction &MF) const {
    730   // The ABI requires us to allocate 160 bytes of stack space for the callee,
    731   // with any outgoing stack arguments being placed above that.  It seems
    732   // better to make that area a permanent feature of the frame even if
    733   // we're using a frame pointer.
    734   return true;
    735 }
    736 
    737 StackOffset
    738 SystemZFrameLowering::getFrameIndexReference(const MachineFunction &MF, int FI,
    739                                              Register &FrameReg) const {
    740   // Our incoming SP is actually SystemZMC::ELFCallFrameSize below the CFA, so
    741   // add that difference here.
    742   StackOffset Offset =
    743       TargetFrameLowering::getFrameIndexReference(MF, FI, FrameReg);
    744   return Offset + StackOffset::getFixed(SystemZMC::ELFCallFrameSize);
    745 }
    746 
    747 MachineBasicBlock::iterator SystemZFrameLowering::
    748 eliminateCallFramePseudoInstr(MachineFunction &MF,
    749                               MachineBasicBlock &MBB,
    750                               MachineBasicBlock::iterator MI) const {
    751   switch (MI->getOpcode()) {
    752   case SystemZ::ADJCALLSTACKDOWN:
    753   case SystemZ::ADJCALLSTACKUP:
    754     assert(hasReservedCallFrame(MF) &&
    755            "ADJSTACKDOWN and ADJSTACKUP should be no-ops");
    756     return MBB.erase(MI);
    757     break;
    758 
    759   default:
    760     llvm_unreachable("Unexpected call frame instruction");
    761   }
    762 }
    763 
    764 unsigned SystemZFrameLowering::getRegSpillOffset(MachineFunction &MF,
    765                                                  Register Reg) const {
    766   bool IsVarArg = MF.getFunction().isVarArg();
    767   bool BackChain = MF.getFunction().hasFnAttribute("backchain");
    768   bool SoftFloat = MF.getSubtarget<SystemZSubtarget>().hasSoftFloat();
    769   unsigned Offset = RegSpillOffsets[Reg];
    770   if (usePackedStack(MF) && !(IsVarArg && !SoftFloat)) {
    771     if (SystemZ::GR64BitRegClass.contains(Reg))
    772       // Put all GPRs at the top of the Register save area with packed
    773       // stack. Make room for the backchain if needed.
    774       Offset += BackChain ? 24 : 32;
    775     else
    776       Offset = 0;
    777   }
    778   return Offset;
    779 }
    780 
    781 int SystemZFrameLowering::
    782 getOrCreateFramePointerSaveIndex(MachineFunction &MF) const {
    783   SystemZMachineFunctionInfo *ZFI = MF.getInfo<SystemZMachineFunctionInfo>();
    784   int FI = ZFI->getFramePointerSaveIndex();
    785   if (!FI) {
    786     MachineFrameInfo &MFFrame = MF.getFrameInfo();
    787     int Offset = getBackchainOffset(MF) - SystemZMC::ELFCallFrameSize;
    788     FI = MFFrame.CreateFixedObject(8, Offset, false);
    789     ZFI->setFramePointerSaveIndex(FI);
    790   }
    791   return FI;
    792 }
    793 
    794 bool SystemZFrameLowering::usePackedStack(MachineFunction &MF) const {
    795   bool HasPackedStackAttr = MF.getFunction().hasFnAttribute("packed-stack");
    796   bool BackChain = MF.getFunction().hasFnAttribute("backchain");
    797   bool SoftFloat = MF.getSubtarget<SystemZSubtarget>().hasSoftFloat();
    798   if (HasPackedStackAttr && BackChain && !SoftFloat)
    799     report_fatal_error("packed-stack + backchain + hard-float is unsupported.");
    800   bool CallConv = MF.getFunction().getCallingConv() != CallingConv::GHC;
    801   return HasPackedStackAttr && CallConv;
    802 }
    803