To reduce the register pressure during allocation, when the allocator spills a virtual register that corresponds to a whole wave mode operation, the spill loads and restores should be activated for all lanes by temporarily flipping all bits in exec register to one just before the spills. It is not implemented in the compiler as of today and this patch enables the necessary support. This is a pre-patch before the SGPR spill to virtual VGPR lanes that would eventually causes the whole wave register spills during allocation. Reviewed By: arsenm, cdevadas Differential Revision: https://reviews.llvm.org/D143759
152 lines
5.3 KiB
C++
152 lines
5.3 KiB
C++
//===-- AMDGPUTargetMachine.h - AMDGPU TargetMachine Interface --*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
/// \file
|
|
/// The AMDGPU TargetMachine interface definition for hw codegen targets.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETMACHINE_H
|
|
#define LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETMACHINE_H
|
|
|
|
#include "GCNSubtarget.h"
|
|
#include "llvm/CodeGen/TargetPassConfig.h"
|
|
#include "llvm/Target/TargetMachine.h"
|
|
#include <optional>
|
|
#include <utility>
|
|
|
|
namespace llvm {
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// AMDGPU Target Machine (R600+)
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
class AMDGPUTargetMachine : public LLVMTargetMachine {
|
|
protected:
|
|
std::unique_ptr<TargetLoweringObjectFile> TLOF;
|
|
|
|
StringRef getGPUName(const Function &F) const;
|
|
StringRef getFeatureString(const Function &F) const;
|
|
|
|
public:
|
|
static bool EnableLateStructurizeCFG;
|
|
static bool EnableFunctionCalls;
|
|
static bool EnableLowerModuleLDS;
|
|
|
|
AMDGPUTargetMachine(const Target &T, const Triple &TT, StringRef CPU,
|
|
StringRef FS, TargetOptions Options,
|
|
std::optional<Reloc::Model> RM,
|
|
std::optional<CodeModel::Model> CM, CodeGenOpt::Level OL);
|
|
~AMDGPUTargetMachine() override;
|
|
|
|
const TargetSubtargetInfo *getSubtargetImpl() const;
|
|
const TargetSubtargetInfo *getSubtargetImpl(const Function &) const override = 0;
|
|
|
|
TargetLoweringObjectFile *getObjFileLowering() const override {
|
|
return TLOF.get();
|
|
}
|
|
|
|
void registerPassBuilderCallbacks(PassBuilder &PB) override;
|
|
void registerDefaultAliasAnalyses(AAManager &) override;
|
|
|
|
/// Get the integer value of a null pointer in the given address space.
|
|
static int64_t getNullPointerValue(unsigned AddrSpace);
|
|
|
|
bool isNoopAddrSpaceCast(unsigned SrcAS, unsigned DestAS) const override;
|
|
|
|
unsigned getAssumedAddrSpace(const Value *V) const override;
|
|
|
|
std::pair<const Value *, unsigned>
|
|
getPredicatedAddrSpace(const Value *V) const override;
|
|
|
|
unsigned getAddressSpaceForPseudoSourceKind(unsigned Kind) const override;
|
|
};
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// GCN Target Machine (SI+)
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
class GCNTargetMachine final : public AMDGPUTargetMachine {
|
|
private:
|
|
mutable StringMap<std::unique_ptr<GCNSubtarget>> SubtargetMap;
|
|
|
|
public:
|
|
GCNTargetMachine(const Target &T, const Triple &TT, StringRef CPU,
|
|
StringRef FS, TargetOptions Options,
|
|
std::optional<Reloc::Model> RM,
|
|
std::optional<CodeModel::Model> CM, CodeGenOpt::Level OL,
|
|
bool JIT);
|
|
|
|
TargetPassConfig *createPassConfig(PassManagerBase &PM) override;
|
|
|
|
const TargetSubtargetInfo *getSubtargetImpl(const Function &) const override;
|
|
|
|
TargetTransformInfo getTargetTransformInfo(const Function &F) const override;
|
|
|
|
bool useIPRA() const override {
|
|
return true;
|
|
}
|
|
|
|
void registerMachineRegisterInfoCallback(MachineFunction &MF) const override;
|
|
|
|
MachineFunctionInfo *
|
|
createMachineFunctionInfo(BumpPtrAllocator &Allocator, const Function &F,
|
|
const TargetSubtargetInfo *STI) const override;
|
|
|
|
yaml::MachineFunctionInfo *createDefaultFuncInfoYAML() const override;
|
|
yaml::MachineFunctionInfo *
|
|
convertFuncInfoToYAML(const MachineFunction &MF) const override;
|
|
bool parseMachineFunctionInfo(const yaml::MachineFunctionInfo &,
|
|
PerFunctionMIParsingState &PFS,
|
|
SMDiagnostic &Error,
|
|
SMRange &SourceRange) const override;
|
|
};
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
// AMDGPU Pass Setup
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
class AMDGPUPassConfig : public TargetPassConfig {
|
|
public:
|
|
AMDGPUPassConfig(LLVMTargetMachine &TM, PassManagerBase &PM);
|
|
|
|
AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
|
|
return getTM<AMDGPUTargetMachine>();
|
|
}
|
|
|
|
ScheduleDAGInstrs *
|
|
createMachineScheduler(MachineSchedContext *C) const override;
|
|
|
|
void addEarlyCSEOrGVNPass();
|
|
void addStraightLineScalarOptimizationPasses();
|
|
void addIRPasses() override;
|
|
void addCodeGenPrepare() override;
|
|
bool addPreISel() override;
|
|
bool addInstSelector() override;
|
|
bool addGCPasses() override;
|
|
|
|
std::unique_ptr<CSEConfigBase> getCSEConfig() const override;
|
|
|
|
/// Check if a pass is enabled given \p Opt option. The option always
|
|
/// overrides defaults if explicitly used. Otherwise its default will
|
|
/// be used given that a pass shall work at an optimization \p Level
|
|
/// minimum.
|
|
bool isPassEnabled(const cl::opt<bool> &Opt,
|
|
CodeGenOpt::Level Level = CodeGenOpt::Default) const {
|
|
if (Opt.getNumOccurrences())
|
|
return Opt;
|
|
if (TM->getOptLevel() < Level)
|
|
return false;
|
|
return Opt;
|
|
}
|
|
};
|
|
|
|
} // end namespace llvm
|
|
|
|
#endif // LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETMACHINE_H
|