When optimising for code size at the expense of performance, it is often worth saving and restoring some of r0-r3, if IPRA will be able to take advantage of them. This doesn't cost any extra code size if we already have a PUSH/POP pair, and increases the number of available registers across any calls to the function. We already have an optimisation which tries fold the subtract/add of the SP into the PUSH/POP by using extra registers, which somewhat conflicts with this. I've made the new optimisation less aggressive in cases where the existing one is likely to trigger, which gives better results than either of these optimisations by themselves. Differential revision: https://reviews.llvm.org/D69936
98 lines
4.0 KiB
C++
98 lines
4.0 KiB
C++
//===- ARMTargetFrameLowering.h - Define frame lowering for ARM -*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_TARGET_ARM_ARMFRAMELOWERING_H
|
|
#define LLVM_LIB_TARGET_ARM_ARMFRAMELOWERING_H
|
|
|
|
#include "llvm/CodeGen/MachineBasicBlock.h"
|
|
#include "llvm/CodeGen/TargetFrameLowering.h"
|
|
#include <vector>
|
|
|
|
namespace llvm {
|
|
|
|
class ARMSubtarget;
|
|
class CalleeSavedInfo;
|
|
class MachineFunction;
|
|
|
|
class ARMFrameLowering : public TargetFrameLowering {
|
|
protected:
|
|
const ARMSubtarget &STI;
|
|
|
|
public:
|
|
explicit ARMFrameLowering(const ARMSubtarget &sti);
|
|
|
|
/// emitProlog/emitEpilog - These methods insert prolog and epilog code into
|
|
/// the function.
|
|
void emitPrologue(MachineFunction &MF, MachineBasicBlock &MBB) const override;
|
|
void emitEpilogue(MachineFunction &MF, MachineBasicBlock &MBB) const override;
|
|
|
|
bool spillCalleeSavedRegisters(MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator MI,
|
|
ArrayRef<CalleeSavedInfo> CSI,
|
|
const TargetRegisterInfo *TRI) const override;
|
|
|
|
bool
|
|
restoreCalleeSavedRegisters(MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator MI,
|
|
MutableArrayRef<CalleeSavedInfo> CSI,
|
|
const TargetRegisterInfo *TRI) const override;
|
|
|
|
bool keepFramePointer(const MachineFunction &MF) const override;
|
|
|
|
bool enableCalleeSaveSkip(const MachineFunction &MF) const override;
|
|
|
|
bool hasFP(const MachineFunction &MF) const override;
|
|
bool hasReservedCallFrame(const MachineFunction &MF) const override;
|
|
bool canSimplifyCallFramePseudos(const MachineFunction &MF) const override;
|
|
int getFrameIndexReference(const MachineFunction &MF, int FI,
|
|
unsigned &FrameReg) const override;
|
|
int ResolveFrameIndexReference(const MachineFunction &MF, int FI,
|
|
unsigned &FrameReg, int SPAdj) const;
|
|
|
|
void getCalleeSaves(const MachineFunction &MF,
|
|
BitVector &SavedRegs) const override;
|
|
void findRegDefsOutsideSaveRestore(MachineFunction &MF,
|
|
BitVector &Regs) const;
|
|
unsigned spillExtraRegsForIPRA(MachineFunction &MF, BitVector &SavedRegs,
|
|
bool HasFPRegSaves) const;
|
|
void determineCalleeSaves(MachineFunction &MF, BitVector &SavedRegs,
|
|
RegScavenger *RS) const override;
|
|
|
|
void adjustForSegmentedStacks(MachineFunction &MF,
|
|
MachineBasicBlock &MBB) const override;
|
|
|
|
/// Returns true if the target will correctly handle shrink wrapping.
|
|
bool enableShrinkWrapping(const MachineFunction &MF) const override;
|
|
|
|
bool isProfitableForNoCSROpt(const Function &F) const override {
|
|
// The no-CSR optimisation is bad for code size on ARM, because we can save
|
|
// many registers with a single PUSH/POP pair.
|
|
return false;
|
|
}
|
|
|
|
private:
|
|
void emitPushInst(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI,
|
|
ArrayRef<CalleeSavedInfo> CSI, unsigned StmOpc,
|
|
unsigned StrOpc, bool NoGap, bool (*Func)(unsigned, bool),
|
|
unsigned NumAlignedDPRCS2Regs, unsigned MIFlags = 0) const;
|
|
void emitPopInst(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI,
|
|
MutableArrayRef<CalleeSavedInfo> CSI, unsigned LdmOpc,
|
|
unsigned LdrOpc, bool isVarArg, bool NoGap,
|
|
bool (*Func)(unsigned, bool),
|
|
unsigned NumAlignedDPRCS2Regs) const;
|
|
|
|
MachineBasicBlock::iterator
|
|
eliminateCallFramePseudoInstr(MachineFunction &MF,
|
|
MachineBasicBlock &MBB,
|
|
MachineBasicBlock::iterator MI) const override;
|
|
};
|
|
|
|
} // end namespace llvm
|
|
|
|
#endif // LLVM_LIB_TARGET_ARM_ARMFRAMELOWERING_H
|