Target/Sparc/LeonPasses.cpp

303231Sdim//===------ LeonPasses.cpp - Define passes specific to LEON ---------------===//
303231Sdim//
303231Sdim//                     The LLVM Compiler Infrastructure
303231Sdim//
303231Sdim// This file is distributed under the University of Illinois Open Source
303231Sdim// License. See LICENSE.TXT for details.
303231Sdim//
303231Sdim//===----------------------------------------------------------------------===//
303231Sdim//
303231Sdim//
303231Sdim//===----------------------------------------------------------------------===//
303231Sdim
303231Sdim#include "LeonPasses.h"
303231Sdim#include "llvm/CodeGen/ISDOpcodes.h"
303231Sdim#include "llvm/CodeGen/MachineFunction.h"
303231Sdim#include "llvm/CodeGen/MachineInstr.h"
303231Sdim#include "llvm/CodeGen/MachineInstrBuilder.h"
303231Sdim#include "llvm/CodeGen/MachineRegisterInfo.h"
314564Sdim#include "llvm/IR/DiagnosticInfo.h"
303231Sdim#include "llvm/IR/LLVMContext.h"
303231Sdim#include "llvm/Support/raw_ostream.h"
303231Sdimusing namespace llvm;
303231Sdim
303231SdimLEONMachineFunctionPass::LEONMachineFunctionPass(char &ID)
303231Sdim    : MachineFunctionPass(ID) {}
303231Sdim
303231Sdimint LEONMachineFunctionPass::GetRegIndexForOperand(MachineInstr &MI,
303231Sdim                                                   int OperandIndex) {
303231Sdim  if (MI.getNumOperands() > 0) {
303231Sdim    if (OperandIndex == LAST_OPERAND) {
303231Sdim      OperandIndex = MI.getNumOperands() - 1;
303231Sdim    }
303231Sdim
303231Sdim    if (MI.getNumOperands() > (unsigned)OperandIndex &&
303231Sdim        MI.getOperand(OperandIndex).isReg()) {
303231Sdim      return (int)MI.getOperand(OperandIndex).getReg();
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  static int NotFoundIndex = -10;
303231Sdim  // Return a different number each time to avoid any comparisons between the
303231Sdim  // values returned.
303231Sdim  NotFoundIndex -= 10;
303231Sdim  return NotFoundIndex;
303231Sdim}
303231Sdim
303231Sdim// finds a new free FP register
303231Sdim// checks also the AllocatedRegisters vector
303231Sdimint LEONMachineFunctionPass::getUnusedFPRegister(MachineRegisterInfo &MRI) {
303231Sdim  for (int RegisterIndex = SP::F0; RegisterIndex <= SP::F31; ++RegisterIndex) {
303231Sdim    if (!MRI.isPhysRegUsed(RegisterIndex) &&
314564Sdim        !is_contained(UsedRegisters, RegisterIndex)) {
303231Sdim      return RegisterIndex;
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  return -1;
303231Sdim}
303231Sdim
303231Sdim//*****************************************************************************
303231Sdim//**** InsertNOPLoad pass
303231Sdim//*****************************************************************************
// This pass fixes the incorrectly working Load instructions that exist for
// some earlier versions of the LEON processor line. NOP instructions must
// be inserted after the load instruction to ensure that the Load instruction
// behaves as expected for these processors.
303231Sdim//
303231Sdim// This pass inserts a NOP after any LD or LDF instruction.
303231Sdim//
303231Sdimchar InsertNOPLoad::ID = 0;
303231Sdim
321369SdimInsertNOPLoad::InsertNOPLoad() : LEONMachineFunctionPass(ID) {}
303231Sdim
303231Sdimbool InsertNOPLoad::runOnMachineFunction(MachineFunction &MF) {
303231Sdim  Subtarget = &MF.getSubtarget<SparcSubtarget>();
303231Sdim  const TargetInstrInfo &TII = *Subtarget->getInstrInfo();
303231Sdim  DebugLoc DL = DebugLoc();
303231Sdim
303231Sdim  bool Modified = false;
303231Sdim  for (auto MFI = MF.begin(), E = MF.end(); MFI != E; ++MFI) {
303231Sdim    MachineBasicBlock &MBB = *MFI;
303231Sdim    for (auto MBBI = MBB.begin(), E = MBB.end(); MBBI != E; ++MBBI) {
303231Sdim      MachineInstr &MI = *MBBI;
303231Sdim      unsigned Opcode = MI.getOpcode();
303231Sdim      if (Opcode >= SP::LDDArr && Opcode <= SP::LDrr) {
303231Sdim        MachineBasicBlock::iterator NMBBI = std::next(MBBI);
303231Sdim        BuildMI(MBB, NMBBI, DL, TII.get(SP::NOP));
303231Sdim        Modified = true;
303231Sdim      }
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  return Modified;
303231Sdim}
303231Sdim
303231Sdim//*****************************************************************************
303231Sdim//**** FixFSMULD pass
303231Sdim//*****************************************************************************
303231Sdim// This pass fixes the incorrectly working FSMULD instruction that exists for
303231Sdim// some earlier versions of the LEON processor line.
303231Sdim//
303231Sdim// The pass should convert the FSMULD operands to double precision in scratch
303231Sdim// registers, then calculate the result with the FMULD instruction. Therefore,
303231Sdim// the pass should replace operations of the form:
303231Sdim// fsmuld %f20,%f21,%f8
303231Sdim// with the sequence:
303231Sdim// fstod %f20,%f0
303231Sdim// fstod %f21,%f2
303231Sdim// fmuld %f0,%f2,%f8
303231Sdim//
303231Sdimchar FixFSMULD::ID = 0;
303231Sdim
321369SdimFixFSMULD::FixFSMULD() : LEONMachineFunctionPass(ID) {}
303231Sdim
303231Sdimbool FixFSMULD::runOnMachineFunction(MachineFunction &MF) {
303231Sdim  Subtarget = &MF.getSubtarget<SparcSubtarget>();
303231Sdim  const TargetInstrInfo &TII = *Subtarget->getInstrInfo();
303231Sdim  DebugLoc DL = DebugLoc();
303231Sdim
303231Sdim  bool Modified = false;
303231Sdim  for (auto MFI = MF.begin(), E = MF.end(); MFI != E; ++MFI) {
303231Sdim    MachineBasicBlock &MBB = *MFI;
303231Sdim    for (auto MBBI = MBB.begin(), E = MBB.end(); MBBI != E; ++MBBI) {
303231Sdim
303231Sdim      MachineInstr &MI = *MBBI;
303231Sdim      unsigned Opcode = MI.getOpcode();
303231Sdim
303231Sdim      const int UNASSIGNED_INDEX = -1;
303231Sdim      int Reg1Index = UNASSIGNED_INDEX;
303231Sdim      int Reg2Index = UNASSIGNED_INDEX;
303231Sdim      int Reg3Index = UNASSIGNED_INDEX;
303231Sdim
303231Sdim      if (Opcode == SP::FSMULD && MI.getNumOperands() == 3) {
303231Sdim        // take the registers from fsmuld %f20,%f21,%f8
303231Sdim        Reg1Index = MI.getOperand(0).getReg();
303231Sdim        Reg2Index = MI.getOperand(1).getReg();
303231Sdim        Reg3Index = MI.getOperand(2).getReg();
303231Sdim      }
303231Sdim
303231Sdim      if (Reg1Index != UNASSIGNED_INDEX && Reg2Index != UNASSIGNED_INDEX &&
303231Sdim          Reg3Index != UNASSIGNED_INDEX) {
303231Sdim        clearUsedRegisterList();
303231Sdim        MachineBasicBlock::iterator NMBBI = std::next(MBBI);
303231Sdim        // Whatever Reg3Index is hasn't been used yet, so we need to reserve it.
303231Sdim        markRegisterUsed(Reg3Index);
303231Sdim        const int ScratchReg1Index = getUnusedFPRegister(MF.getRegInfo());
303231Sdim        markRegisterUsed(ScratchReg1Index);
303231Sdim        const int ScratchReg2Index = getUnusedFPRegister(MF.getRegInfo());
303231Sdim        markRegisterUsed(ScratchReg2Index);
303231Sdim
303231Sdim        if (ScratchReg1Index == UNASSIGNED_INDEX ||
303231Sdim            ScratchReg2Index == UNASSIGNED_INDEX) {
303231Sdim          errs() << "Cannot allocate free scratch registers for the FixFSMULD "
303231Sdim                    "pass."
303231Sdim                 << "\n";
303231Sdim        } else {
303231Sdim          // create fstod %f20,%f0
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::FSTOD))
303231Sdim              .addReg(ScratchReg1Index)
303231Sdim              .addReg(Reg1Index);
303231Sdim
303231Sdim          // create fstod %f21,%f2
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::FSTOD))
303231Sdim              .addReg(ScratchReg2Index)
303231Sdim              .addReg(Reg2Index);
303231Sdim
303231Sdim          // create fmuld %f0,%f2,%f8
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::FMULD))
303231Sdim              .addReg(Reg3Index)
303231Sdim              .addReg(ScratchReg1Index)
303231Sdim              .addReg(ScratchReg2Index);
303231Sdim
303231Sdim          MI.eraseFromParent();
303231Sdim          MBBI = NMBBI;
303231Sdim
303231Sdim          Modified = true;
303231Sdim        }
303231Sdim      }
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  return Modified;
303231Sdim}
303231Sdim
303231Sdim//*****************************************************************************
303231Sdim//**** ReplaceFMULS pass
303231Sdim//*****************************************************************************
303231Sdim// This pass fixes the incorrectly working FMULS instruction that exists for
303231Sdim// some earlier versions of the LEON processor line.
303231Sdim//
303231Sdim// This pass converts the FMULS operands to double precision in scratch
303231Sdim// registers, then calculates the result with the FMULD instruction.
303231Sdim// The pass should replace operations of the form:
303231Sdim// fmuls %f20,%f21,%f8
303231Sdim// with the sequence:
303231Sdim// fstod %f20,%f0
303231Sdim// fstod %f21,%f2
303231Sdim// fmuld %f0,%f2,%f8
303231Sdim//
303231Sdimchar ReplaceFMULS::ID = 0;
303231Sdim
321369SdimReplaceFMULS::ReplaceFMULS() : LEONMachineFunctionPass(ID) {}
303231Sdim
303231Sdimbool ReplaceFMULS::runOnMachineFunction(MachineFunction &MF) {
303231Sdim  Subtarget = &MF.getSubtarget<SparcSubtarget>();
303231Sdim  const TargetInstrInfo &TII = *Subtarget->getInstrInfo();
303231Sdim  DebugLoc DL = DebugLoc();
303231Sdim
303231Sdim  bool Modified = false;
303231Sdim  for (auto MFI = MF.begin(), E = MF.end(); MFI != E; ++MFI) {
303231Sdim    MachineBasicBlock &MBB = *MFI;
303231Sdim    for (auto MBBI = MBB.begin(), E = MBB.end(); MBBI != E; ++MBBI) {
303231Sdim      MachineInstr &MI = *MBBI;
303231Sdim      unsigned Opcode = MI.getOpcode();
303231Sdim
303231Sdim      const int UNASSIGNED_INDEX = -1;
303231Sdim      int Reg1Index = UNASSIGNED_INDEX;
303231Sdim      int Reg2Index = UNASSIGNED_INDEX;
303231Sdim      int Reg3Index = UNASSIGNED_INDEX;
303231Sdim
303231Sdim      if (Opcode == SP::FMULS && MI.getNumOperands() == 3) {
303231Sdim        // take the registers from fmuls %f20,%f21,%f8
303231Sdim        Reg1Index = MI.getOperand(0).getReg();
303231Sdim        Reg2Index = MI.getOperand(1).getReg();
303231Sdim        Reg3Index = MI.getOperand(2).getReg();
303231Sdim      }
303231Sdim
303231Sdim      if (Reg1Index != UNASSIGNED_INDEX && Reg2Index != UNASSIGNED_INDEX &&
303231Sdim          Reg3Index != UNASSIGNED_INDEX) {
303231Sdim        clearUsedRegisterList();
303231Sdim        MachineBasicBlock::iterator NMBBI = std::next(MBBI);
303231Sdim        // Whatever Reg3Index is hasn't been used yet, so we need to reserve it.
303231Sdim        markRegisterUsed(Reg3Index);
303231Sdim        const int ScratchReg1Index = getUnusedFPRegister(MF.getRegInfo());
303231Sdim        markRegisterUsed(ScratchReg1Index);
303231Sdim        const int ScratchReg2Index = getUnusedFPRegister(MF.getRegInfo());
303231Sdim        markRegisterUsed(ScratchReg2Index);
303231Sdim
303231Sdim        if (ScratchReg1Index == UNASSIGNED_INDEX ||
303231Sdim            ScratchReg2Index == UNASSIGNED_INDEX) {
303231Sdim          errs() << "Cannot allocate free scratch registers for the "
303231Sdim                    "ReplaceFMULS pass."
303231Sdim                 << "\n";
303231Sdim        } else {
303231Sdim          // create fstod %f20,%f0
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::FSTOD))
303231Sdim              .addReg(ScratchReg1Index)
303231Sdim              .addReg(Reg1Index);
303231Sdim
303231Sdim          // create fstod %f21,%f2
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::FSTOD))
303231Sdim              .addReg(ScratchReg2Index)
303231Sdim              .addReg(Reg2Index);
303231Sdim
303231Sdim          // create fmuld %f0,%f2,%f8
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::FMULD))
303231Sdim              .addReg(Reg3Index)
303231Sdim              .addReg(ScratchReg1Index)
303231Sdim              .addReg(ScratchReg2Index);
303231Sdim
303231Sdim          MI.eraseFromParent();
303231Sdim          MBBI = NMBBI;
303231Sdim
303231Sdim          Modified = true;
303231Sdim        }
303231Sdim      }
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  return Modified;
303231Sdim}
303231Sdim
303231Sdim
303231Sdim//*****************************************************************************
314564Sdim//**** DetectRoundChange pass
303231Sdim//*****************************************************************************
314564Sdim// To prevent any explicit change of the default rounding mode, this pass
314564Sdim// detects any call of the fesetround function.
314564Sdim// A warning is generated to ensure the user knows this has happened.
303231Sdim//
314564Sdim// Detects an erratum in UT699 LEON 3 processor
303231Sdim
314564Sdimchar DetectRoundChange::ID = 0;
303231Sdim
321369SdimDetectRoundChange::DetectRoundChange() : LEONMachineFunctionPass(ID) {}
303231Sdim
314564Sdimbool DetectRoundChange::runOnMachineFunction(MachineFunction &MF) {
303231Sdim  Subtarget = &MF.getSubtarget<SparcSubtarget>();
303231Sdim
303231Sdim  bool Modified = false;
303231Sdim  for (auto MFI = MF.begin(), E = MF.end(); MFI != E; ++MFI) {
303231Sdim    MachineBasicBlock &MBB = *MFI;
303231Sdim    for (auto MBBI = MBB.begin(), E = MBB.end(); MBBI != E; ++MBBI) {
303231Sdim      MachineInstr &MI = *MBBI;
303231Sdim      unsigned Opcode = MI.getOpcode();
303231Sdim      if (Opcode == SP::CALL && MI.getNumOperands() > 0) {
303231Sdim        MachineOperand &MO = MI.getOperand(0);
303231Sdim
303231Sdim        if (MO.isGlobal()) {
303231Sdim          StringRef FuncName = MO.getGlobal()->getName();
303231Sdim          if (FuncName.compare_lower("fesetround") == 0) {
314564Sdim            errs() << "Error: You are using the detectroundchange "
314564Sdim                      "option to detect rounding changes that will "
314564Sdim                      "cause LEON errata. The only way to fix this "
314564Sdim                      "is to remove the call to fesetround from "
314564Sdim                      "the source code.\n";
303231Sdim          }
303231Sdim        }
303231Sdim      }
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  return Modified;
303231Sdim}
314564Sdim
303231Sdim//*****************************************************************************
314564Sdim//**** FixAllFDIVSQRT pass
303231Sdim//*****************************************************************************
// This pass fixes the incorrectly working FDIVx and FSQRTx instructions that
// exist for some earlier versions of the LEON processor line. Five NOP
// instructions need to be inserted after these instructions to ensure the
// correct result is placed in the destination registers before they are used.
// (As implemented below, the pass emits five NOPs before and 28 NOPs after
// each affected instruction.)
303231Sdim//
314564Sdim// This pass implements two fixes:
314564Sdim//  1) fixing the FSQRTS and FSQRTD instructions.
314564Sdim//  2) fixing the FDIVS and FDIVD instructions.
314564Sdim//
// FSQRTS and FDIVS are converted to FSQRTD and FDIVD respectively earlier in
// the pipeline when this option is enabled, so this pass needs only to deal
// with the changes that still need implementing for the "double" versions
// of these instructions.
314564Sdim//
314564Sdimchar FixAllFDIVSQRT::ID = 0;
303231Sdim
321369SdimFixAllFDIVSQRT::FixAllFDIVSQRT() : LEONMachineFunctionPass(ID) {}
303231Sdim
314564Sdimbool FixAllFDIVSQRT::runOnMachineFunction(MachineFunction &MF) {
303231Sdim  Subtarget = &MF.getSubtarget<SparcSubtarget>();
303231Sdim  const TargetInstrInfo &TII = *Subtarget->getInstrInfo();
303231Sdim  DebugLoc DL = DebugLoc();
303231Sdim
303231Sdim  bool Modified = false;
303231Sdim  for (auto MFI = MF.begin(), E = MF.end(); MFI != E; ++MFI) {
303231Sdim    MachineBasicBlock &MBB = *MFI;
303231Sdim    for (auto MBBI = MBB.begin(), E = MBB.end(); MBBI != E; ++MBBI) {
303231Sdim      MachineInstr &MI = *MBBI;
303231Sdim      unsigned Opcode = MI.getOpcode();
303231Sdim
314564Sdim      // Note: FDIVS and FSQRTS cannot be generated when this erratum fix is
314564Sdim      // switched on so we don't need to check for them here. They will
314564Sdim      // already have been converted to FSQRTD or FDIVD earlier in the
314564Sdim      // pipeline.
314564Sdim      if (Opcode == SP::FSQRTD || Opcode == SP::FDIVD) {
314564Sdim        for (int InsertedCount = 0; InsertedCount < 5; InsertedCount++)
303231Sdim          BuildMI(MBB, MBBI, DL, TII.get(SP::NOP));
303231Sdim
314564Sdim        MachineBasicBlock::iterator NMBBI = std::next(MBBI);
314564Sdim        for (int InsertedCount = 0; InsertedCount < 28; InsertedCount++)
314564Sdim          BuildMI(MBB, NMBBI, DL, TII.get(SP::NOP));
303231Sdim
314564Sdim        Modified = true;
303231Sdim      }
303231Sdim    }
303231Sdim  }
303231Sdim
303231Sdim  return Modified;
303231Sdim}