I was wrong last patch. I viewed the `Visited` set purely as a possible recursion deterrent where functions calling a callee multiple times are handled elsewhere. This doesn't consider cases where a function is called multiple times by different callers still part of the same call graph. New test shows the aforementioned case. Reapplies #111004, fixes #115562.
125 lines
4.5 KiB
C++
125 lines
4.5 KiB
C++
//===- AMDGPUMCExpr.h - AMDGPU specific MC expression classes ---*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#ifndef LLVM_LIB_TARGET_AMDGPU_MCTARGETDESC_AMDGPUMCEXPR_H
|
|
#define LLVM_LIB_TARGET_AMDGPU_MCTARGETDESC_AMDGPUMCEXPR_H
|
|
|
|
#include "llvm/ADT/ArrayRef.h"
|
|
#include "llvm/MC/MCExpr.h"
|
|
|
|
namespace llvm {
|
|
|
|
class Function;
|
|
class GCNSubtarget;
|
|
|
|
/// AMDGPU target specific MCExpr operations.
|
|
///
|
|
/// Takes in a minimum of 1 argument to be used with an operation. The supported
|
|
/// operations are:
|
|
/// - (bitwise) or
|
|
/// - max
|
|
///
|
|
/// \note If the 'or'/'max' operations are provided only a single argument, the
|
|
/// operation will act as a no-op and simply resolve as the provided argument.
|
|
///
|
|
class AMDGPUMCExpr : public MCTargetExpr {
|
|
public:
|
|
enum VariantKind {
|
|
AGVK_None,
|
|
AGVK_Or,
|
|
AGVK_Max,
|
|
AGVK_ExtraSGPRs,
|
|
AGVK_TotalNumVGPRs,
|
|
AGVK_AlignTo,
|
|
AGVK_Occupancy
|
|
};
|
|
|
|
private:
|
|
VariantKind Kind;
|
|
MCContext &Ctx;
|
|
const MCExpr **RawArgs;
|
|
ArrayRef<const MCExpr *> Args;
|
|
|
|
AMDGPUMCExpr(VariantKind Kind, ArrayRef<const MCExpr *> Args, MCContext &Ctx);
|
|
~AMDGPUMCExpr();
|
|
|
|
bool evaluateExtraSGPRs(MCValue &Res, const MCAssembler *Asm,
|
|
const MCFixup *Fixup) const;
|
|
bool evaluateTotalNumVGPR(MCValue &Res, const MCAssembler *Asm,
|
|
const MCFixup *Fixup) const;
|
|
bool evaluateAlignTo(MCValue &Res, const MCAssembler *Asm,
|
|
const MCFixup *Fixup) const;
|
|
bool evaluateOccupancy(MCValue &Res, const MCAssembler *Asm,
|
|
const MCFixup *Fixup) const;
|
|
|
|
public:
|
|
static const AMDGPUMCExpr *
|
|
create(VariantKind Kind, ArrayRef<const MCExpr *> Args, MCContext &Ctx);
|
|
|
|
static const AMDGPUMCExpr *createOr(ArrayRef<const MCExpr *> Args,
|
|
MCContext &Ctx) {
|
|
return create(VariantKind::AGVK_Or, Args, Ctx);
|
|
}
|
|
|
|
static const AMDGPUMCExpr *createMax(ArrayRef<const MCExpr *> Args,
|
|
MCContext &Ctx) {
|
|
return create(VariantKind::AGVK_Max, Args, Ctx);
|
|
}
|
|
|
|
static const AMDGPUMCExpr *createExtraSGPRs(const MCExpr *VCCUsed,
|
|
const MCExpr *FlatScrUsed,
|
|
bool XNACKUsed, MCContext &Ctx);
|
|
|
|
static const AMDGPUMCExpr *createTotalNumVGPR(const MCExpr *NumAGPR,
|
|
const MCExpr *NumVGPR,
|
|
MCContext &Ctx);
|
|
|
|
static const AMDGPUMCExpr *
|
|
createAlignTo(const MCExpr *Value, const MCExpr *Align, MCContext &Ctx) {
|
|
return create(VariantKind::AGVK_AlignTo, {Value, Align}, Ctx);
|
|
}
|
|
|
|
static const AMDGPUMCExpr *createOccupancy(unsigned InitOcc,
|
|
const MCExpr *NumSGPRs,
|
|
const MCExpr *NumVGPRs,
|
|
const GCNSubtarget &STM,
|
|
MCContext &Ctx);
|
|
|
|
ArrayRef<const MCExpr *> getArgs() const { return Args; }
|
|
VariantKind getKind() const { return Kind; }
|
|
const MCExpr *getSubExpr(size_t Index) const;
|
|
|
|
void printImpl(raw_ostream &OS, const MCAsmInfo *MAI) const override;
|
|
bool evaluateAsRelocatableImpl(MCValue &Res, const MCAssembler *Asm,
|
|
const MCFixup *Fixup) const override;
|
|
bool isSymbolUsedInExpression(const MCSymbol *Sym) const override;
|
|
void visitUsedExpr(MCStreamer &Streamer) const override;
|
|
MCFragment *findAssociatedFragment() const override;
|
|
void fixELFSymbolsInTLSFixups(MCAssembler &) const override{};
|
|
|
|
static bool classof(const MCExpr *E) {
|
|
return E->getKind() == MCExpr::Target;
|
|
}
|
|
};
|
|
|
|
namespace AMDGPU {
|
|
// Tries to leverage KnownBits for MCExprs to reduce and limit any composed
|
|
// MCExprs printing. E.g., for an expression such as
|
|
// ((unevaluatable_sym | 1) & 1) won't evaluate due to unevaluatable_sym and
|
|
// would verbosely print the full expression; however, KnownBits should deduce
|
|
// the value to be 1. Particularly useful for AMDGPU metadata MCExprs.
|
|
void printAMDGPUMCExpr(const MCExpr *Expr, raw_ostream &OS,
|
|
const MCAsmInfo *MAI);
|
|
|
|
const MCExpr *foldAMDGPUMCExpr(const MCExpr *Expr, MCContext &Ctx);
|
|
|
|
} // end namespace AMDGPU
|
|
} // end namespace llvm
|
|
|
|
#endif // LLVM_LIB_TARGET_AMDGPU_MCTARGETDESC_AMDGPUMCEXPR_H
|