doxygen/AMDGPUMCExpr_8cpp_source.html

//===- AMDGPUMCExpr.cpp - AMDGPU specific MC expression classes -----------===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//


#include "AMDGPUMCExpr.h"

#include "Utils/AMDGPUBaseInfo.h"

#include "llvm/MC/MCAsmInfo.h"

#include "llvm/MC/MCAssembler.h"

#include "llvm/MC/MCContext.h"

#include "llvm/MC/MCStreamer.h"

#include "llvm/MC/MCSubtargetInfo.h"

#include "llvm/MC/MCSymbol.h"

#include "llvm/MC/MCValue.h"

#include "llvm/Support/AMDHSAKernelDescriptor.h"

#include "llvm/Support/KnownBits.h"

#include "llvm/Support/MathExtras.h"

#include "llvm/Support/raw_ostream.h"

#include <functional>

#include <optional>


using namespace llvm;

using namespace llvm::AMDGPU;


/// Builds a target expression of kind \p Kind over the operands in \p Args.
///
/// The operand pointers are copied into storage obtained from \p Ctx, and the
/// member ArrayRef is pointed at that copy.
AMDGPUMCExpr::AMDGPUMCExpr(VariantKind Kind, ArrayRef<const MCExpr *> Args,
                           MCContext &Ctx)
    : Kind(Kind), Ctx(Ctx) {
  assert(Args.size() >= 1 && "Needs a minimum of one expression.");
  assert(Kind != AGVK_None && "Cannot construct AMDGPUMCExpr of kind none.");

  // The operand array is obtained through the same allocation mechanism as
  // the object itself so both end up in the same memory. Allocating it on the
  // heap through standard allocation (e.g., SmallVector's grow) results in an
  // asan failure.
  const size_t NumOperands = Args.size();
  void *Storage = Ctx.allocate(sizeof(const MCExpr *) * NumOperands);
  RawArgs = static_cast<const MCExpr **>(Storage);
  llvm::uninitialized_copy(Args, RawArgs);
  this->Args = ArrayRef<const MCExpr *>(RawArgs, NumOperands);
}


/// Hands the operand array allocated in the constructor back to the context.
AMDGPUMCExpr::~AMDGPUMCExpr() {
  Ctx.deallocate(RawArgs);
}


/// Factory: placement-allocates a new AMDGPUMCExpr of kind \p Kind with
/// operands \p Args inside \p Ctx and returns it.
const AMDGPUMCExpr *AMDGPUMCExpr::create(VariantKind Kind,
                                         ArrayRef<const MCExpr *> Args,
                                         MCContext &Ctx) {
  const AMDGPUMCExpr *Node = new (Ctx) AMDGPUMCExpr(Kind, Args, Ctx);
  return Node;
}


/// Returns the operand at position \p Index. \p Index must be smaller than
/// the number of operands (checked by assertion only).
const MCExpr *AMDGPUMCExpr::getSubExpr(size_t Index) const {
  assert(Index < Args.size() && "Indexing out of bounds AMDGPUMCExpr sub-expr");
  const MCExpr *Operand = Args[Index];
  return Operand;
}


/// Prints the expression as `<name>(<arg0>, <arg1>, ...)`, where `<name>` is
/// the textual spelling of the expression kind and every operand is printed
/// through \p MAI.
void AMDGPUMCExpr::printImpl(raw_ostream &OS, const MCAsmInfo *MAI) const {
  // Spelling of the kind, including the opening parenthesis.
  const char *Opening = nullptr;
  switch (Kind) {
  default:
    llvm_unreachable("Unknown AMDGPUMCExpr kind.");
  case AGVK_Or:
    Opening = "or(";
    break;
  case AGVK_Max:
    Opening = "max(";
    break;
  case AGVK_Min:
    Opening = "min(";
    break;
  case AGVK_ExtraSGPRs:
    Opening = "extrasgprs(";
    break;
  case AGVK_TotalNumVGPRs:
    Opening = "totalnumvgprs(";
    break;
  case AGVK_AlignTo:
    Opening = "alignto(";
    break;
  case AGVK_Occupancy:
    Opening = "occupancy(";
    break;
  case AGVK_InstPrefSize:
    Opening = "instprefsize(";
    break;
  case AGVK_Lit:
    Opening = "lit(";
    break;
  case AGVK_Lit64:
    Opening = "lit64(";
    break;
  }
  OS << Opening;

  // Operands are separated by ", "; no separator before the first one.
  bool NeedSeparator = false;
  for (const MCExpr *Operand : Args) {
    if (NeedSeparator)
      OS << ", ";
    MAI->printExpr(OS, *Operand);
    NeedSeparator = true;
  }
  OS << ')';
}


/// Applies the two-operand reduction selected by \p Kind to \p Arg1 and
/// \p Arg2: bitwise or for AGVK_Or, signed minimum for AGVK_Min and signed
/// maximum for AGVK_Max. Any other kind is unreachable.
static int64_t op(AMDGPUMCExpr::VariantKind Kind, int64_t Arg1, int64_t Arg2) {
  switch (Kind) {
  case AMDGPUMCExpr::AGVK_Or:
    return Arg1 | Arg2;
  case AMDGPUMCExpr::AGVK_Min:
    return std::min(Arg1, Arg2);
  case AMDGPUMCExpr::AGVK_Max:
    return std::max(Arg1, Arg2);
  default:
    llvm_unreachable("Unknown AMDGPUMCExpr kind.");
  }
}


/// Evaluates every expression in \p Exprs to an absolute constant and stores
/// the i-th result through the i-th reference in \p Vals.
///
/// \returns true only if \p Exprs and \p Vals have the same length and every
/// expression evaluated to an absolute value. On failure, references that
/// were already processed keep the value written to them; the remaining ones
/// are left untouched.
static bool
evaluateMCExprs(ArrayRef<const MCExpr *> Exprs, const MCAssembler *Asm,
                std::initializer_list<std::reference_wrapper<uint64_t>> Vals) {
  // The constructor of AMDGPUMCExpr only guarantees "at least one operand", so
  // an operand-count mismatch is reachable. Report it as an evaluation failure
  // instead of relying solely on zip_equal's length check, which would
  // otherwise be the only thing standing between a short operand list and a
  // "successful" evaluation that never wrote some of the outputs.
  if (Exprs.size() != Vals.size())
    return false;

  return llvm::all_of(llvm::zip_equal(Exprs, Vals), [&](const auto &Pair) {
    auto [Expr, ValRef] = Pair;
    uint64_t &Val = ValRef.get();
    MCValue MCVal;
    // Only fully resolved (absolute) values are acceptable here.
    if (!Expr->evaluateAsRelocatable(MCVal, Asm) || !MCVal.isAbsolute())
      return false;
    Val = MCVal.getConstant();
    return true;
  });
}


/// Evaluates an `extrasgprs` expression. The three operands are read, in
/// order, as the VCC-used, flat-scratch-used and XNACK-used flags (non-zero
/// means "used") and forwarded to IsaInfo::getNumExtraSGPRs for the context's
/// subtarget.
///
/// \returns false if any operand is not an absolute constant.
bool AMDGPUMCExpr::evaluateExtraSGPRs(MCValue &Res,
                                      const MCAssembler *Asm) const {
  const MCSubtargetInfo &STI = *Ctx.getSubtargetInfo();

  uint64_t VCCFlag = 0;
  uint64_t FlatScrFlag = 0;
  uint64_t XNACKFlag = 0;
  const bool AllAbsolute =
      evaluateMCExprs(Args, Asm, {VCCFlag, FlatScrFlag, XNACKFlag});
  if (!AllAbsolute)
    return false;

  const uint64_t NumExtra = IsaInfo::getNumExtraSGPRs(
      STI, VCCFlag != 0, FlatScrFlag != 0, XNACKFlag != 0);
  Res = MCValue::get(NumExtra);
  return true;
}


/// Evaluates a `totalnumvgprs` expression over its two operands, read in
/// order as the AGPR count and the VGPR count.
///
/// On a GFX90A subtarget with a non-zero AGPR count the result is the VGPR
/// count aligned up to 4 plus the AGPR count; otherwise it is the larger of
/// the two counts.
///
/// \returns false if either operand is not an absolute constant.
bool AMDGPUMCExpr::evaluateTotalNumVGPR(MCValue &Res,
                                        const MCAssembler *Asm) const {
  const MCSubtargetInfo &STI = *Ctx.getSubtargetInfo();
  const bool IsGFX90A = AMDGPU::isGFX90A(STI);

  uint64_t AGPRCount = 0;
  uint64_t VGPRCount = 0;
  if (!evaluateMCExprs(Args, Asm, {AGPRCount, VGPRCount}))
    return false;

  uint64_t Combined;
  if (IsGFX90A && AGPRCount != 0)
    Combined = alignTo(VGPRCount, 4) + AGPRCount;
  else
    Combined = std::max(VGPRCount, AGPRCount);

  Res = MCValue::get(Combined);
  return true;
}


/// Evaluates an `alignto` expression: the first operand rounded up to the
/// next multiple of the second operand.
///
/// \returns false if either operand is not an absolute constant, or if the
/// alignment operand evaluates to zero (rounding to a multiple of zero is
/// undefined, so the expression is treated as unevaluable).
bool AMDGPUMCExpr::evaluateAlignTo(MCValue &Res, const MCAssembler *Asm) const {
  uint64_t Value = 0, Align = 0;
  if (!evaluateMCExprs(Args, Asm, {Value, Align}))
    return false;

  // alignTo() requires a non-zero alignment; a zero here would otherwise trip
  // its assertion or divide by zero.
  if (Align == 0)
    return false;

  Res = MCValue::get(alignTo(Value, Align));
  return true;
}


/// Evaluates an `occupancy` expression.
///
/// Operands, in order: MaxWaves, Granule, TargetTotalNumVGPRs, Generation,
/// InitOccupancy (these five are expected to be known constants), followed by
/// NumSGPRs and NumVGPRs. The result starts at InitOccupancy and is lowered
/// to the SGPR-limited and VGPR-limited occupancy whenever the respective
/// register count is non-zero.
///
/// \returns false if fewer than seven operands are present or if any operand
/// is not an absolute constant.
bool AMDGPUMCExpr::evaluateOccupancy(MCValue &Res,
                                     const MCAssembler *Asm) const {
  constexpr size_t NumFixedArgs = 5;
  constexpr size_t NumRegArgs = 2;

  // The constructor only guarantees one operand; slicing below needs seven.
  if (Args.size() < NumFixedArgs + NumRegArgs)
    return false;

  uint64_t InitOccupancy = 0, MaxWaves = 0, Granule = 0,
           TargetTotalNumVGPRs = 0, Generation = 0, NumSGPRs = 0, NumVGPRs = 0;

  bool Success = evaluateMCExprs(
      Args.slice(0, NumFixedArgs), Asm,
      {MaxWaves, Granule, TargetTotalNumVGPRs, Generation, InitOccupancy});

  assert(Success && "Arguments 1 to 5 for Occupancy should be known constants");

  if (!Success || !evaluateMCExprs(Args.slice(NumFixedArgs, NumRegArgs), Asm,
                                   {NumSGPRs, NumVGPRs}))
    return false;

  unsigned Occupancy = InitOccupancy;
  // A register count of zero places no additional limit on occupancy.
  if (NumSGPRs)
    Occupancy = std::min(
        Occupancy, IsaInfo::getOccupancyWithNumSGPRs(
                       NumSGPRs, MaxWaves,
                       static_cast<AMDGPUSubtarget::Generation>(Generation)));
  if (NumVGPRs)
    Occupancy = std::min(Occupancy,
                         IsaInfo::getNumWavesPerEUWithNumVGPRs(
                             NumVGPRs, Granule, MaxWaves, TargetTotalNumVGPRs));

  Res = MCValue::get(Occupancy);
  return true;
}


/// Returns the bit width of the inst_pref_size field for \p STI: the GFX12+
/// width on GFX12-and-later subtargets, the GFX11 width otherwise.
static unsigned getInstPrefSizeFieldWidth(const MCSubtargetInfo &STI) {
  const bool IsGFX12OrLater = AMDGPU::isGFX12Plus(STI);
  return IsGFX12OrLater
             ? amdhsa::COMPUTE_PGM_RSRC3_GFX12_PLUS_INST_PREF_SIZE_WIDTH
             : amdhsa::COMPUTE_PGM_RSRC3_GFX11_INST_PREF_SIZE_WIDTH;
}


/// Evaluates an `instprefsize` expression: the operand (a code size in bytes)
/// is converted to a number of instruction cache lines, rounding up, and
/// clamped to the largest value that fits in the subtarget's inst_pref_size
/// field.
///
/// \returns false if the operand is not an absolute constant.
bool AMDGPUMCExpr::evaluateInstPrefSize(MCValue &Res,
                                        const MCAssembler *Asm) const {
  uint64_t CodeBytes = 0;
  const bool Evaluated = evaluateMCExprs(Args, Asm, {CodeBytes});
  if (!Evaluated)
    return false;

  const MCSubtargetInfo &STI = *Ctx.getSubtargetInfo();
  unsigned FieldWidth = getInstPrefSizeFieldWidth(STI);
  unsigned LineBytes = AMDGPU::IsaInfo::getInstCacheLineSize(STI);

  // Largest value representable in a FieldWidth-bit field.
  uint64_t FieldMax = (1u << FieldWidth) - 1;
  uint64_t CodeLines = divideCeil(CodeBytes, LineBytes);

  Res = MCValue::get(std::min(CodeLines, FieldMax));
  return true;
}


bool AMDGPUMCExpr::isSymbolUsedInExpression(const MCSymbol *Sym,

                                            const MCExpr *E) {

  switch (E->getKind()) {

  case MCExpr::Constant:

    return false;

  case MCExpr::Unary:

    return isSymbolUsedInExpression(

        Sym, static_cast<const MCUnaryExpr *>(E)->getSubExpr());

  case MCExpr::Binary: {

    const MCBinaryExpr *BE = static_cast<const MCBinaryExpr *>(E);

    return isSymbolUsedInExpression(Sym, BE->getLHS()) ||

           isSymbolUsedInExpression(Sym, BE->getRHS());

  }

  case MCExpr::SymbolRef: {

    const MCSymbol &S = static_cast<const MCSymbolRefExpr *>(E)->getSymbol();

    if (S.isVariable())

      return isSymbolUsedInExpression(Sym, S.getVariableValue());

    return &S == Sym;

  }

  case MCExpr::Specifier:

  case MCExpr::Target: {

    auto *TE = static_cast<const AMDGPUMCExpr *>(E);

    for (const MCExpr *E : TE->getArgs())

      if (isSymbolUsedInExpression(Sym, E))

        return true;

    return false;

  }

  }

  llvm_unreachable("Unknown expr kind!");

}


/// Evaluates this expression into \p Res.
///
/// Kinds with dedicated semantics are dispatched to their evaluate* helper;
/// `lit`/`lit64` evaluate to their single operand. The remaining kinds are
/// reduced left to right with op() over all operands, each of which must be
/// an absolute constant.
///
/// \returns false if the expression cannot be evaluated.
bool AMDGPUMCExpr::evaluateAsRelocatableImpl(MCValue &Res,
                                             const MCAssembler *Asm) const {
  switch (Kind) {
  case AGVK_ExtraSGPRs:
    return evaluateExtraSGPRs(Res, Asm);
  case AGVK_AlignTo:
    return evaluateAlignTo(Res, Asm);
  case AGVK_TotalNumVGPRs:
    return evaluateTotalNumVGPR(Res, Asm);
  case AGVK_Occupancy:
    return evaluateOccupancy(Res, Asm);
  case AGVK_InstPrefSize:
    return evaluateInstPrefSize(Res, Asm);
  case AGVK_Lit:
  case AGVK_Lit64:
    return Args[0]->evaluateAsRelocatable(Res, Asm);
  default:
    // Reduction kinds are handled by the loop below.
    break;
  }

  std::optional<int64_t> Accumulated;
  for (const MCExpr *Operand : Args) {
    MCValue OperandVal;
    const bool Evaluated = Operand->evaluateAsRelocatable(OperandVal, Asm);
    if (!Evaluated || !OperandVal.isAbsolute())
      return false;

    // The first operand seeds the accumulator and is then combined with
    // itself, exactly like every later operand is combined with the running
    // value.
    const int64_t Constant = OperandVal.getConstant();
    Accumulated = op(Kind, Accumulated.value_or(Constant), Constant);
  }

  Res = MCValue::get(*Accumulated);
  return true;
}


/// Forwards every operand of this expression, in order, to
/// \p Streamer's visitUsedExpr.
void AMDGPUMCExpr::visitUsedExpr(MCStreamer &Streamer) const {
  for (size_t Idx = 0, NumOperands = Args.size(); Idx != NumOperands; ++Idx) {
    const MCExpr &Operand = *Args[Idx];
    Streamer.visitUsedExpr(Operand);
  }
}


/// Returns the fragment associated with the first operand that has one, or
/// nullptr if no operand is associated with a fragment.
MCFragment *AMDGPUMCExpr::findAssociatedFragment() const {
  for (const MCExpr *Arg : Args) {
    // Query each operand once; the lookup walks the operand's whole subtree,
    // so asking a second time just to return the result is wasted work.
    if (MCFragment *Frag = Arg->findAssociatedFragment())
      return Frag;
  }
  return nullptr;
}


/// Creates an `extrasgprs` expression so that the number of extra SGPRs can
/// be resolved later, in case \p VCCUsed or \p FlatScrUsed are not yet
/// resolvable but are needed by further MCExprs. Derived from the
/// implementation of IsaInfo::getNumExtraSGPRs in AMDGPUBaseInfo.cpp.
///
/// \p XNACKUsed is already known and is embedded as a constant operand.
const AMDGPUMCExpr *AMDGPUMCExpr::createExtraSGPRs(const MCExpr *VCCUsed,
                                                   const MCExpr *FlatScrUsed,
                                                   bool XNACKUsed,
                                                   MCContext &Ctx) {
  const MCExpr *Operands[] = {VCCUsed, FlatScrUsed,
                              MCConstantExpr::create(XNACKUsed, Ctx)};
  return create(AGVK_ExtraSGPRs, Operands, Ctx);
}


/// Creates a `totalnumvgprs` expression whose operands are, in order,
/// \p NumAGPR and \p NumVGPR.
const AMDGPUMCExpr *AMDGPUMCExpr::createTotalNumVGPR(const MCExpr *NumAGPR,
                                                     const MCExpr *NumVGPR,
                                                     MCContext &Ctx) {
  const MCExpr *Operands[] = {NumAGPR, NumVGPR};
  return create(AGVK_TotalNumVGPRs, Operands, Ctx);
}


/// Creates an `instprefsize` expression over the single operand
/// \p CodeSizeBytes.
const AMDGPUMCExpr *
AMDGPUMCExpr::createInstPrefSize(const MCExpr *CodeSizeBytes, MCContext &Ctx) {
  const MCExpr *Operands[] = {CodeSizeBytes};
  return create(AGVK_InstPrefSize, Operands, Ctx);
}


/// Creates a `lit` or `lit64` expression (selected by \p Lit, which must be
/// one of those two modifiers) wrapping the constant \p Value. The constant
/// is created with hexadecimal printing enabled.
const AMDGPUMCExpr *AMDGPUMCExpr::createLit(LitModifier Lit, int64_t Value,
                                            MCContext &Ctx) {
  assert(Lit == LitModifier::Lit || Lit == LitModifier::Lit64);

  VariantKind LitKind = VariantKind::AGVK_Lit64;
  if (Lit == LitModifier::Lit)
    LitKind = VariantKind::AGVK_Lit;

  const MCExpr *Immediate =
      MCConstantExpr::create(Value, Ctx, /*PrintInHex=*/true);
  return create(LitKind, {Immediate}, Ctx);
}


/// Converts an optional boolean into 64-bit KnownBits: a known `true` becomes
/// the constant 1, a known `false` the constant 0, and an unknown result a
/// single unknown bit zero-extended to 64 bits.
static KnownBits fromOptionalToKnownBits(std::optional<bool> CompareResult) {
  constexpr unsigned BitWidth = 64;

  if (!CompareResult.has_value())
    return KnownBits(/*BitWidth=*/1).zext(BitWidth);

  return KnownBits::makeConstant(APInt(BitWidth, *CompareResult ? 1 : 0));
}


/// Associates an expression node with the KnownBits computed for it.
using KnownBitsMap = DenseMap<const MCExpr *, KnownBits>;

// Forward declaration: the per-kind helpers below recurse through this entry
// point. Depth is the current recursion depth and defaults to 0 for the
// top-level call.
static void knownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM,

                               unsigned Depth = 0);


static void binaryOpKnownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM,

                                       unsigned Depth) {

  static constexpr unsigned BitWidth = 64;

  const MCBinaryExpr *BExpr = cast<MCBinaryExpr>(Expr);

  const MCExpr *LHS = BExpr->getLHS();

  const MCExpr *RHS = BExpr->getRHS();


  knownBitsMapHelper(LHS, KBM, Depth + 1);

  knownBitsMapHelper(RHS, KBM, Depth + 1);

  KnownBits LHSKnown = KBM[LHS];

  KnownBits RHSKnown = KBM[RHS];


  switch (BExpr->getOpcode()) {

  default:

    KBM[Expr] = KnownBits(BitWidth);

    return;

  case MCBinaryExpr::Opcode::Add:

    KBM[Expr] = KnownBits::add(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::And:

    KBM[Expr] = LHSKnown & RHSKnown;

    return;

  case MCBinaryExpr::Opcode::Div:

    KBM[Expr] = KnownBits::sdiv(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::EQ: {

    std::optional<bool> CompareRes = KnownBits::eq(LHSKnown, RHSKnown);

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::NE: {

    std::optional<bool> CompareRes = KnownBits::ne(LHSKnown, RHSKnown);

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::GT: {

    std::optional<bool> CompareRes = KnownBits::sgt(LHSKnown, RHSKnown);

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::GTE: {

    std::optional<bool> CompareRes = KnownBits::sge(LHSKnown, RHSKnown);

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::LAnd: {

    std::optional<bool> CompareRes;

    const APInt False(BitWidth, 0);

    std::optional<bool> LHSBool =

        KnownBits::ne(LHSKnown, KnownBits::makeConstant(False));

    std::optional<bool> RHSBool =

        KnownBits::ne(RHSKnown, KnownBits::makeConstant(False));

    if (LHSBool && RHSBool)

      CompareRes = *LHSBool && *RHSBool;

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::LOr: {

    const APInt False(BitWidth, 0);

    KnownBits Bits = LHSKnown | RHSKnown;

    std::optional<bool> CompareRes =

        KnownBits::ne(Bits, KnownBits::makeConstant(False));

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::LT: {

    std::optional<bool> CompareRes = KnownBits::slt(LHSKnown, RHSKnown);

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::LTE: {

    std::optional<bool> CompareRes = KnownBits::sle(LHSKnown, RHSKnown);

    KBM[Expr] = fromOptionalToKnownBits(CompareRes);

    return;

  }

  case MCBinaryExpr::Opcode::Mod:

    KBM[Expr] = KnownBits::srem(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::Mul:

    KBM[Expr] = KnownBits::mul(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::Or:

    KBM[Expr] = LHSKnown | RHSKnown;

    return;

  case MCBinaryExpr::Opcode::Shl:

    KBM[Expr] = KnownBits::shl(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::AShr:

    KBM[Expr] = KnownBits::ashr(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::LShr:

    KBM[Expr] = KnownBits::lshr(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::Sub:

    KBM[Expr] = KnownBits::sub(LHSKnown, RHSKnown);

    return;

  case MCBinaryExpr::Opcode::Xor:

    KBM[Expr] = LHSKnown ^ RHSKnown;

    return;

  }

}


static void unaryOpKnownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM,

                                      unsigned Depth) {

  static constexpr unsigned BitWidth = 64;

  const MCUnaryExpr *UExpr = cast<MCUnaryExpr>(Expr);

  knownBitsMapHelper(UExpr->getSubExpr(), KBM, Depth + 1);

  KnownBits KB = KBM[UExpr->getSubExpr()];


  switch (UExpr->getOpcode()) {

  default:

    KBM[Expr] = KnownBits(BitWidth);

    return;

  case MCUnaryExpr::Opcode::Minus: {

    KB.makeNegative();

    KBM[Expr] = std::move(KB);

    return;

  }

  case MCUnaryExpr::Opcode::Not: {

    KnownBits AllOnes(BitWidth);

    AllOnes.setAllOnes();

    KBM[Expr] = KB ^ AllOnes;

    return;

  }

  case MCUnaryExpr::Opcode::Plus: {

    KB.makeNonNegative();

    KBM[Expr] = std::move(KB);

    return;

  }

  }

}


static void targetOpKnownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM,

                                       unsigned Depth) {

  static constexpr unsigned BitWidth = 64;

  const AMDGPUMCExpr *AGVK = cast<AMDGPUMCExpr>(Expr);


  switch (AGVK->getKind()) {

  default:

    KBM[Expr] = KnownBits(BitWidth);

    return;

  case AMDGPUMCExpr::VariantKind::AGVK_Or: {

    knownBitsMapHelper(AGVK->getSubExpr(0), KBM, Depth + 1);

    KnownBits KB = KBM[AGVK->getSubExpr(0)];

    for (const MCExpr *Arg : AGVK->getArgs()) {

      knownBitsMapHelper(Arg, KBM, Depth + 1);

      KB |= KBM[Arg];

    }

    KBM[Expr] = std::move(KB);

    return;

  }

  case AMDGPUMCExpr::VariantKind::AGVK_Max: {

    knownBitsMapHelper(AGVK->getSubExpr(0), KBM, Depth + 1);

    KnownBits KB = KBM[AGVK->getSubExpr(0)];

    for (const MCExpr *Arg : AGVK->getArgs()) {

      knownBitsMapHelper(Arg, KBM, Depth + 1);

      KB = KnownBits::smax(KB, KBM[Arg]);

    }

    KBM[Expr] = std::move(KB);

    return;

  }

  case AMDGPUMCExpr::VariantKind::AGVK_Min: {

    knownBitsMapHelper(AGVK->getSubExpr(0), KBM, Depth + 1);

    KnownBits KB = KBM[AGVK->getSubExpr(0)];

    for (const MCExpr *Arg : AGVK->getArgs()) {

      knownBitsMapHelper(Arg, KBM, Depth + 1);

      KB = KnownBits::smin(KB, KBM[Arg]);

    }

    KBM[Expr] = std::move(KB);

    return;

  }

  case AMDGPUMCExpr::VariantKind::AGVK_ExtraSGPRs:

  case AMDGPUMCExpr::VariantKind::AGVK_TotalNumVGPRs:

  case AMDGPUMCExpr::VariantKind::AGVK_AlignTo:

  case AMDGPUMCExpr::VariantKind::AGVK_Occupancy:

  case AMDGPUMCExpr::VariantKind::AGVK_InstPrefSize:

  case AMDGPUMCExpr::VariantKind::AGVK_Lit:

  case AMDGPUMCExpr::VariantKind::AGVK_Lit64: {

    int64_t Val;

    if (AGVK->evaluateAsAbsolute(Val)) {

      APInt APValue(BitWidth, Val);

      KBM[Expr] = KnownBits::makeConstant(APValue);

      return;

    }

    if (AGVK->getKind() == AMDGPUMCExpr::VariantKind::AGVK_InstPrefSize) {

      // The result is clamped to (1 << FieldWidth) - 1, so upper bits are

      // known zero. FieldWidth is derived from the subtarget.

      const MCSubtargetInfo *STI = AGVK->getCtx().getSubtargetInfo();

      unsigned FieldWidth = getInstPrefSizeFieldWidth(*STI);

      KnownBits KB(BitWidth);

      KB.Zero.setBitsFrom(FieldWidth);

      KBM[Expr] = KB;

      return;

    }

    KBM[Expr] = KnownBits(BitWidth);

    return;

  }

  }

}


static void knownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM,

                               unsigned Depth) {

  static constexpr unsigned BitWidth = 64;


  int64_t Val;

  if (Expr->evaluateAsAbsolute(Val)) {

    APInt APValue(BitWidth, Val, /*isSigned=*/true);

    KBM[Expr] = KnownBits::makeConstant(APValue);

    return;

  }


  if (Depth == 16) {

    KBM[Expr] = KnownBits(BitWidth);

    return;

  }


  switch (Expr->getKind()) {

  case MCExpr::ExprKind::Binary: {

    binaryOpKnownBitsMapHelper(Expr, KBM, Depth);

    return;

  }

  case MCExpr::ExprKind::Constant: {

    const MCConstantExpr *CE = cast<MCConstantExpr>(Expr);

    APInt APValue(BitWidth, CE->getValue(), /*isSigned=*/true);

    KBM[Expr] = KnownBits::makeConstant(APValue);

    return;

  }

  case MCExpr::ExprKind::SymbolRef: {

    const MCSymbolRefExpr *RExpr = cast<MCSymbolRefExpr>(Expr);

    const MCSymbol &Sym = RExpr->getSymbol();

    if (!Sym.isVariable()) {

      KBM[Expr] = KnownBits(BitWidth);

      return;

    }


    // Variable value retrieval is not for actual use but only for knownbits

    // analysis.

    const MCExpr *SymVal = Sym.getVariableValue();

    knownBitsMapHelper(SymVal, KBM, Depth + 1);


    // Explicitly copy-construct so that there exists a local KnownBits in case

    // KBM[SymVal] gets invalidated after a potential growth through KBM[Expr].

    KBM[Expr] = KnownBits(KBM[SymVal]);

    return;

  }

  case MCExpr::ExprKind::Unary: {

    unaryOpKnownBitsMapHelper(Expr, KBM, Depth);

    return;

  }

  case MCExpr::ExprKind::Target: {

    targetOpKnownBitsMapHelper(Expr, KBM, Depth);

    return;

  case MCExpr::Specifier:

    llvm_unreachable("unused by this backend");

  }

  }

}


/// Attempts to simplify \p Expr using the known bits recorded in \p KBM and
/// returns the simplified expression, or \p Expr itself when nothing changed.
///
/// Expressions without an entry in \p KBM and constant expressions are
/// returned unchanged. A non-unary expression whose known bits form a
/// constant, or which evaluates to an absolute value, is replaced by a
/// constant expression. Binary expressions additionally have identity
/// operands removed (x - 0, x + 0, x | 0, x * 1, shifts by 0) and absorbing
/// operands applied (0 shifted by anything, x & 0). Otherwise the operands of
/// binary, unary and target expressions are folded recursively and the node
/// is rebuilt in \p Ctx only if an operand changed.
static const MCExpr *tryFoldHelper(const MCExpr *Expr, KnownBitsMap &KBM,

                                   MCContext &Ctx) {

  if (!KBM.count(Expr))

    return Expr;


  // True iff KB is fully known and equal to Value.
  auto ValueCheckKnownBits = [](KnownBits &KB, unsigned Value) -> bool {

    if (!KB.isConstant())

      return false;


    return Value == KB.getConstant();

  };


  if (Expr->getKind() == MCExpr::ExprKind::Constant)

    return Expr;


  // Resolving unary operations to constants may make the value harder to read.

  // For example, `~62` becomes `-63`; a bit mask is arguably less clear when

  // it is represented through a negative number.

  if (Expr->getKind() != MCExpr::ExprKind::Unary) {

    if (KBM[Expr].isConstant()) {

      APInt ConstVal = KBM[Expr].getConstant();

      return MCConstantExpr::create(ConstVal.getSExtValue(), Ctx);

    }


    int64_t EvalValue;

    if (Expr->evaluateAsAbsolute(EvalValue))

      return MCConstantExpr::create(EvalValue, Ctx);

  }


  switch (Expr->getKind()) {

  default:

    return Expr;

  case MCExpr::ExprKind::Binary: {

    const MCBinaryExpr *BExpr = cast<MCBinaryExpr>(Expr);

    const MCExpr *LHS = BExpr->getLHS();

    const MCExpr *RHS = BExpr->getRHS();


    // Opcode-specific shortcuts. A `break` falls through to the generic
    // operand folding after the switch.
    switch (BExpr->getOpcode()) {

    default:

      return Expr;

    case MCBinaryExpr::Opcode::Sub: {

      // x - 0 => x
      if (ValueCheckKnownBits(KBM[RHS], 0))

        return tryFoldHelper(LHS, KBM, Ctx);

      break;

    }

    case MCBinaryExpr::Opcode::Add:

    case MCBinaryExpr::Opcode::Or: {

      // 0 op x => x and x op 0 => x
      if (ValueCheckKnownBits(KBM[LHS], 0))

        return tryFoldHelper(RHS, KBM, Ctx);

      if (ValueCheckKnownBits(KBM[RHS], 0))

        return tryFoldHelper(LHS, KBM, Ctx);

      break;

    }

    case MCBinaryExpr::Opcode::Mul: {

      // 1 * x => x and x * 1 => x
      if (ValueCheckKnownBits(KBM[LHS], 1))

        return tryFoldHelper(RHS, KBM, Ctx);

      if (ValueCheckKnownBits(KBM[RHS], 1))

        return tryFoldHelper(LHS, KBM, Ctx);

      break;

    }

    case MCBinaryExpr::Opcode::Shl:

    case MCBinaryExpr::Opcode::AShr:

    case MCBinaryExpr::Opcode::LShr: {

      // x shift 0 => x and 0 shift x => 0
      if (ValueCheckKnownBits(KBM[RHS], 0))

        return tryFoldHelper(LHS, KBM, Ctx);

      if (ValueCheckKnownBits(KBM[LHS], 0))

        return MCConstantExpr::create(0, Ctx);

      break;

    }

    case MCBinaryExpr::Opcode::And: {

      // 0 & x => 0 and x & 0 => 0
      if (ValueCheckKnownBits(KBM[LHS], 0) || ValueCheckKnownBits(KBM[RHS], 0))

        return MCConstantExpr::create(0, Ctx);

      break;

    }

    }

    // No shortcut applied: fold both operands and rebuild the node only if
    // at least one of them changed.
    const MCExpr *NewLHS = tryFoldHelper(LHS, KBM, Ctx);

    const MCExpr *NewRHS = tryFoldHelper(RHS, KBM, Ctx);

    if (NewLHS != LHS || NewRHS != RHS)

      return MCBinaryExpr::create(BExpr->getOpcode(), NewLHS, NewRHS, Ctx,

                                  BExpr->getLoc());

    return Expr;

  }

  case MCExpr::ExprKind::Unary: {

    // The unary operator itself is kept; only its operand is folded.
    const MCUnaryExpr *UExpr = cast<MCUnaryExpr>(Expr);

    const MCExpr *SubExpr = UExpr->getSubExpr();

    const MCExpr *NewSubExpr = tryFoldHelper(SubExpr, KBM, Ctx);

    if (SubExpr != NewSubExpr)

      return MCUnaryExpr::create(UExpr->getOpcode(), NewSubExpr, Ctx,

                                 UExpr->getLoc());

    return Expr;

  }

  case MCExpr::ExprKind::Target: {

    // Fold every operand; a new target expression of the same kind is
    // created only if at least one operand changed.
    const AMDGPUMCExpr *AGVK = cast<AMDGPUMCExpr>(Expr);

    SmallVector<const MCExpr *, 8> NewArgs;

    bool Changed = false;

    for (const MCExpr *Arg : AGVK->getArgs()) {

      const MCExpr *NewArg = tryFoldHelper(Arg, KBM, Ctx);

      NewArgs.push_back(NewArg);

      Changed |= Arg != NewArg;

    }

    return Changed ? AMDGPUMCExpr::create(AGVK->getKind(), NewArgs, Ctx) : Expr;

  }

  }

  return Expr;

}


/// Simplifies \p Expr: known bits are computed for the expression tree and
/// then used by tryFoldHelper to fold it. Returns the folded expression,
/// which is \p Expr itself when nothing could be simplified.
const MCExpr *llvm::AMDGPU::foldAMDGPUMCExpr(const MCExpr *Expr,
                                             MCContext &Ctx) {
  KnownBitsMap KnownBitsByExpr;
  knownBitsMapHelper(Expr, KnownBitsByExpr);
  return tryFoldHelper(Expr, KnownBitsByExpr, Ctx);
}


/// Prints \p Expr to \p OS: as a plain decimal integer when it evaluates to
/// an absolute value, and through \p MAI's expression printer otherwise.
void llvm::AMDGPU::printAMDGPUMCExpr(const MCExpr *Expr, raw_ostream &OS,
                                     const MCAsmInfo *MAI) {
  int64_t Absolute;
  if (!Expr->evaluateAsAbsolute(Absolute)) {
    MAI->printExpr(OS, *Expr);
    return;
  }

  OS << Absolute;
}


bool AMDGPU::isLitExpr(const MCExpr *Expr) {

  const auto *E = dyn_cast<AMDGPUMCExpr>(Expr);

  return E && (E->getKind() == AMDGPUMCExpr::AGVK_Lit ||

               E->getKind() == AMDGPUMCExpr::AGVK_Lit64);

}


/// Returns the constant wrapped by the `lit`/`lit64` expression \p Expr.
/// \p Expr must satisfy isLitExpr() and its first operand must be a constant
/// expression.
int64_t AMDGPU::getLitValue(const MCExpr *Expr) {
  assert(isLitExpr(Expr));
  const auto *LitExpr = cast<AMDGPUMCExpr>(Expr);
  const auto *Immediate = cast<MCConstantExpr>(LitExpr->getArgs()[0]);
  return Immediate->getValue();
}


/// Returns the variant kind of \p Expr when it is an AMDGPUMCExpr, and
/// AGVK_None for any other expression.
AMDGPUMCExpr::VariantKind AMDGPU::getExprKind(const MCExpr *Expr) {
  if (const auto *Target = dyn_cast<AMDGPUMCExpr>(Expr))
    return Target->getKind();
  return AMDGPUMCExpr::AGVK_None;
}


assert
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")

AMDGPUBaseInfo.h

isConstant
static bool isConstant(const MachineInstr &MI)
Definition AMDGPUInstructionSelector.cpp:3088

targetOpKnownBitsMapHelper
static void targetOpKnownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM, unsigned Depth)
Definition AMDGPUMCExpr.cpp:478

unaryOpKnownBitsMapHelper
static void unaryOpKnownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM, unsigned Depth)
Definition AMDGPUMCExpr.cpp:448

fromOptionalToKnownBits
static KnownBits fromOptionalToKnownBits(std::optional< bool > CompareResult)
Definition AMDGPUMCExpr.cpp:329

binaryOpKnownBitsMapHelper
static void binaryOpKnownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM, unsigned Depth)
Definition AMDGPUMCExpr.cpp:346

tryFoldHelper
static const MCExpr * tryFoldHelper(const MCExpr *Expr, KnownBitsMap &KBM, MCContext &Ctx)
Definition AMDGPUMCExpr.cpp:604

knownBitsMapHelper
static void knownBitsMapHelper(const MCExpr *Expr, KnownBitsMap &KBM, unsigned Depth=0)
Definition AMDGPUMCExpr.cpp:546

evaluateMCExprs
static bool evaluateMCExprs(ArrayRef< const MCExpr * > Exprs, const MCAssembler *Asm, std::initializer_list< std::reference_wrapper< uint64_t > > Vals)
Definition AMDGPUMCExpr.cpp:115

getInstPrefSizeFieldWidth
static unsigned getInstPrefSizeFieldWidth(const MCSubtargetInfo &STI)
Get the inst_pref_size field width for the given subtarget.
Definition AMDGPUMCExpr.cpp:197

KnownBitsMap
DenseMap< const MCExpr *, KnownBits > KnownBitsMap
Definition AMDGPUMCExpr.cpp:342

AMDGPUMCExpr.h

AMDHSAKernelDescriptor.h
AMDHSA kernel descriptor definitions.

op
#define op(i)

KnownBits.h

MCAsmInfo.h

MCAssembler.h

MCContext.h

MCStreamer.h

MCSubtargetInfo.h

MCSymbol.h

MCValue.h

MathExtras.h

CacheLineSize
static cl::opt< unsigned > CacheLineSize("cache-line-size", cl::init(0), cl::Hidden, cl::desc("Use this to override the target cache line size when " "specified by the user."))

RHS
Value * RHS
Definition X86PartialReduction.cpp:81

LHS
Value * LHS
Definition X86PartialReduction.cpp:80

NewExpr
Definition ItaniumDemangle.h:2142

llvm::AMDGPUMCExpr
AMDGPU target specific MCExpr operations.
Definition AMDGPUMCExpr.h:33

llvm::AMDGPUMCExpr::getArgs
ArrayRef< const MCExpr * > getArgs() const
Definition AMDGPUMCExpr.h:118

llvm::AMDGPUMCExpr::findAssociatedFragment
MCFragment * findAssociatedFragment() const override
Definition AMDGPUMCExpr.cpp:288

llvm::AMDGPUMCExpr::createInstPrefSize
static const AMDGPUMCExpr * createInstPrefSize(const MCExpr *CodeSizeBytes, MCContext &Ctx)
Create an expression for instruction prefetch size computation: min(divideCeil(CodeSizeBytes,...
Definition AMDGPUMCExpr.cpp:317

llvm::AMDGPUMCExpr::visitUsedExpr
void visitUsedExpr(MCStreamer &Streamer) const override
Definition AMDGPUMCExpr.cpp:283

llvm::AMDGPUMCExpr::createTotalNumVGPR
static const AMDGPUMCExpr * createTotalNumVGPR(const MCExpr *NumAGPR, const MCExpr *NumVGPR, MCContext &Ctx)
Definition AMDGPUMCExpr.cpp:310

llvm::AMDGPUMCExpr::createLit
static const AMDGPUMCExpr * createLit(LitModifier Lit, int64_t Value, MCContext &Ctx)
Definition AMDGPUMCExpr.cpp:321

llvm::AMDGPUMCExpr::create
static const AMDGPUMCExpr * create(VariantKind Kind, ArrayRef< const MCExpr * > Args, MCContext &Ctx)
Definition AMDGPUMCExpr.cpp:47

llvm::AMDGPUMCExpr::evaluateAsRelocatableImpl
bool evaluateAsRelocatableImpl(MCValue &Res, const MCAssembler *Asm) const override
Definition AMDGPUMCExpr.cpp:248

llvm::AMDGPUMCExpr::getCtx
MCContext & getCtx() const
Definition AMDGPUMCExpr.h:120

llvm::AMDGPUMCExpr::createExtraSGPRs
static const AMDGPUMCExpr * createExtraSGPRs(const MCExpr *VCCUsed, const MCExpr *FlatScrUsed, bool XNACKUsed, MCContext &Ctx)
Allow delayed MCExpr resolve of ExtraSGPRs (in case VCCUsed or FlatScrUsed are unresolvable but neede...
Definition AMDGPUMCExpr.cpp:300

llvm::AMDGPUMCExpr::getSubExpr
const MCExpr * getSubExpr(size_t Index) const
Definition AMDGPUMCExpr.cpp:53

llvm::AMDGPUMCExpr::VariantKind
VariantKind
Definition AMDGPUMCExpr.h:35

llvm::AMDGPUMCExpr::AGVK_InstPrefSize
@ AGVK_InstPrefSize
Definition AMDGPUMCExpr.h:43

llvm::AMDGPUMCExpr::AGVK_Occupancy
@ AGVK_Occupancy
Definition AMDGPUMCExpr.h:42

llvm::AMDGPUMCExpr::AGVK_AlignTo
@ AGVK_AlignTo
Definition AMDGPUMCExpr.h:41

llvm::AMDGPUMCExpr::AGVK_Or
@ AGVK_Or
Definition AMDGPUMCExpr.h:37

llvm::AMDGPUMCExpr::AGVK_TotalNumVGPRs
@ AGVK_TotalNumVGPRs
Definition AMDGPUMCExpr.h:40

llvm::AMDGPUMCExpr::AGVK_ExtraSGPRs
@ AGVK_ExtraSGPRs
Definition AMDGPUMCExpr.h:39

llvm::AMDGPUMCExpr::AGVK_Lit64
@ AGVK_Lit64
Definition AMDGPUMCExpr.h:45

llvm::AMDGPUMCExpr::AGVK_Lit
@ AGVK_Lit
Definition AMDGPUMCExpr.h:44

llvm::AMDGPUMCExpr::AGVK_Max
@ AGVK_Max
Definition AMDGPUMCExpr.h:38

llvm::AMDGPUMCExpr::AGVK_Min
@ AGVK_Min
Definition AMDGPUMCExpr.h:46

llvm::AMDGPUMCExpr::AGVK_None
@ AGVK_None
Definition AMDGPUMCExpr.h:36

llvm::AMDGPUMCExpr::printImpl
void printImpl(raw_ostream &OS, const MCAsmInfo *MAI) const override
Definition AMDGPUMCExpr.cpp:58

llvm::AMDGPUMCExpr::getKind
VariantKind getKind() const
Definition AMDGPUMCExpr.h:119

llvm::AMDGPUMCExpr::isSymbolUsedInExpression
static bool isSymbolUsedInExpression(const MCSymbol *Sym, const MCExpr *E)
Definition AMDGPUMCExpr.cpp:217

llvm::AMDGPUSubtarget::Generation
Generation
Definition AMDGPUSubtarget.h:32

llvm::APInt
Class for arbitrary precision integers.
Definition APInt.h:78

llvm::APInt::setBitsFrom
void setBitsFrom(unsigned loBit)
Set the top bits starting from loBit.
Definition APInt.h:1408

llvm::APInt::getSExtValue
int64_t getSExtValue() const
Get sign extended value.
Definition APInt.h:1585

llvm::ArrayRef
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40

llvm::DenseMapBase::count
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition DenseMap.h:221

llvm::DenseMap
Definition DenseMap.h:834

llvm::MCAsmInfo
This class is intended to be used as a base class for asm properties and features specific to the tar...
Definition MCAsmInfo.h:66

llvm::MCAsmInfo::printExpr
void printExpr(raw_ostream &, const MCExpr &) const
Definition MCAsmInfo.cpp:133

llvm::MCAssembler
Definition MCAssembler.h:46

llvm::MCBinaryExpr
Binary assembler expressions.
Definition MCExpr.h:299

llvm::MCBinaryExpr::getLHS
const MCExpr * getLHS() const
Get the left-hand side expression of the binary operator.
Definition MCExpr.h:446

llvm::MCBinaryExpr::getRHS
const MCExpr * getRHS() const
Get the right-hand side expression of the binary operator.
Definition MCExpr.h:449

llvm::MCBinaryExpr::getOpcode
Opcode getOpcode() const
Get the kind of this binary expression.
Definition MCExpr.h:443

llvm::MCBinaryExpr::create
static LLVM_ABI const MCBinaryExpr * create(Opcode Op, const MCExpr *LHS, const MCExpr *RHS, MCContext &Ctx, SMLoc Loc=SMLoc())
Definition MCExpr.cpp:201

llvm::MCBinaryExpr::Div
@ Div
Signed division.
Definition MCExpr.h:304

llvm::MCBinaryExpr::Shl
@ Shl
Shift left.
Definition MCExpr.h:321

llvm::MCBinaryExpr::AShr
@ AShr
Arithmetic shift right.
Definition MCExpr.h:322

llvm::MCBinaryExpr::LShr
@ LShr
Logical shift right.
Definition MCExpr.h:323

llvm::MCBinaryExpr::GTE
@ GTE
Signed greater than or equal comparison (result is either 0 or some target-specific non-zero value).
Definition MCExpr.h:308

llvm::MCBinaryExpr::EQ
@ EQ
Equality comparison.
Definition MCExpr.h:305

llvm::MCBinaryExpr::Sub
@ Sub
Subtraction.
Definition MCExpr.h:324

llvm::MCBinaryExpr::Mul
@ Mul
Multiplication.
Definition MCExpr.h:317

llvm::MCBinaryExpr::GT
@ GT
Signed greater than comparison (result is either 0 or some target-specific non-zero value).
Definition MCExpr.h:306

llvm::MCBinaryExpr::Mod
@ Mod
Signed remainder.
Definition MCExpr.h:316

llvm::MCBinaryExpr::And
@ And
Bitwise and.
Definition MCExpr.h:303

llvm::MCBinaryExpr::Or
@ Or
Bitwise or.
Definition MCExpr.h:319

llvm::MCBinaryExpr::Xor
@ Xor
Bitwise exclusive or.
Definition MCExpr.h:325

llvm::MCBinaryExpr::LAnd
@ LAnd
Logical and.
Definition MCExpr.h:310

llvm::MCBinaryExpr::LOr
@ LOr
Logical or.
Definition MCExpr.h:311

llvm::MCBinaryExpr::LT
@ LT
Signed less than comparison (result is either 0 or some target-specific non-zero value).
Definition MCExpr.h:312

llvm::MCBinaryExpr::Add
@ Add
Addition.
Definition MCExpr.h:302

llvm::MCBinaryExpr::LTE
@ LTE
Signed less than or equal comparison (result is either 0 or some target-specific non-zero value).
Definition MCExpr.h:314

llvm::MCBinaryExpr::NE
@ NE
Inequality comparison.
Definition MCExpr.h:318

llvm::MCConstantExpr
Definition MCExpr.h:142

llvm::MCConstantExpr::create
static LLVM_ABI const MCConstantExpr * create(int64_t Value, MCContext &Ctx, bool PrintInHex=false, unsigned SizeInBytes=0)
Definition MCExpr.cpp:212

llvm::MCContext
Context object for machine code objects.
Definition MCContext.h:83

llvm::MCContext::getSubtargetInfo
const MCSubtargetInfo * getSubtargetInfo() const
Definition MCContext.h:415

llvm::MCExpr
Base class for the full range of assembler expressions which are needed for parsing.
Definition MCExpr.h:34

llvm::MCExpr::Unary
@ Unary
Unary expressions.
Definition MCExpr.h:44

llvm::MCExpr::Constant
@ Constant
Constant expressions.
Definition MCExpr.h:42

llvm::MCExpr::SymbolRef
@ SymbolRef
References to labels and assigned expressions.
Definition MCExpr.h:43

llvm::MCExpr::Target
@ Target
Target specific expression.
Definition MCExpr.h:46

llvm::MCExpr::Specifier
@ Specifier
Expression with a relocation specifier.
Definition MCExpr.h:45

llvm::MCExpr::Binary
@ Binary
Binary expressions.
Definition MCExpr.h:41

llvm::MCExpr::evaluateAsAbsolute
LLVM_ABI bool evaluateAsAbsolute(int64_t &Res) const
Try to evaluate the expression to an absolute value.
Definition MCExpr.cpp:238

llvm::MCExpr::getKind
ExprKind getKind() const
Definition MCExpr.h:85

llvm::MCExpr::getLoc
SMLoc getLoc() const
Definition MCExpr.h:86

llvm::MCFragment
Definition MCSection.h:45

llvm::MCStreamer
Streaming machine code generation interface.
Definition MCStreamer.h:222

llvm::MCStreamer::visitUsedExpr
void visitUsedExpr(const MCExpr &Expr)
Definition MCStreamer.cpp:1241

llvm::MCSubtargetInfo
Generic base class for all target subtargets.
Definition MCSubtargetInfo.h:77

llvm::MCSymbolRefExpr
Represent a reference to a symbol from inside an expression.
Definition MCExpr.h:190

llvm::MCSymbolRefExpr::getSymbol
const MCSymbol & getSymbol() const
Definition MCExpr.h:227

llvm::MCSymbol
MCSymbol - Instances of this class represent a symbol name in the MC file, and MCSymbols are created and uniqued by the MCContext class.
Definition MCSymbol.h:42

llvm::MCSymbol::isVariable
bool isVariable() const
isVariable - Check if this is a variable symbol.
Definition MCSymbol.h:267

llvm::MCSymbol::getVariableValue
const MCExpr * getVariableValue() const
Get the expression of the variable symbol.
Definition MCSymbol.h:270

llvm::MCUnaryExpr
Unary assembler expressions.
Definition MCExpr.h:243

llvm::MCUnaryExpr::getOpcode
Opcode getOpcode() const
Get the kind of this unary expression.
Definition MCExpr.h:286

llvm::MCUnaryExpr::create
static LLVM_ABI const MCUnaryExpr * create(Opcode Op, const MCExpr *Expr, MCContext &Ctx, SMLoc Loc=SMLoc())
Definition MCExpr.cpp:207

llvm::MCUnaryExpr::Minus
@ Minus
Unary minus.
Definition MCExpr.h:247

llvm::MCUnaryExpr::Plus
@ Plus
Unary plus.
Definition MCExpr.h:249

llvm::MCUnaryExpr::Not
@ Not
Bitwise negation.
Definition MCExpr.h:248

llvm::MCUnaryExpr::getSubExpr
const MCExpr * getSubExpr() const
Get the child of this unary expression.
Definition MCExpr.h:289

llvm::MCValue
Definition MCValue.h:30

llvm::MCValue::get
static MCValue get(const MCSymbol *SymA, const MCSymbol *SymB=nullptr, int64_t Val=0, uint32_t Specifier=0)
Definition MCValue.h:56

llvm::MCValue::getConstant
int64_t getConstant() const
Definition MCValue.h:44

llvm::MCValue::isAbsolute
bool isAbsolute() const
Is this an absolute (as opposed to relocatable) value.
Definition MCValue.h:54

llvm::SmallVectorTemplateBase::push_back
void push_back(const T &Elt)
Definition SmallVector.h:423

llvm::SmallVector
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Definition SmallVector.h:1225

llvm::Value
LLVM Value Representation.
Definition Value.h:75

llvm::raw_ostream
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53

uint64_t

Changed
Changed
Definition ObjCARCOpts.cpp:2366

llvm_unreachable
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
Definition ErrorHandling.h:164

llvm::AMDGPU::HSAMD::Kernel::Arg::Key::Align
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
Definition AMDGPUMetadata.h:183

llvm::AMDGPU::HSAMD::Kernel::CodeProps::Key::NumVGPRs
constexpr char NumVGPRs[]
Key for Kernel::CodeProps::Metadata::mNumVGPRs.
Definition AMDGPUMetadata.h:262

llvm::AMDGPU::HSAMD::Kernel::CodeProps::Key::NumSGPRs
constexpr char NumSGPRs[]
Key for Kernel::CodeProps::Metadata::mNumSGPRs.
Definition AMDGPUMetadata.h:260

llvm::AMDGPU::HSAMD::Kernel::Key::Args
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
Definition AMDGPUMetadata.h:396

llvm::AMDGPU::IsaInfo::getNumWavesPerEUWithNumVGPRs
unsigned getNumWavesPerEUWithNumVGPRs(const MCSubtargetInfo &STI, unsigned NumVGPRs, unsigned DynamicVGPRBlockSize)
Definition AMDGPUBaseInfo.cpp:1484

llvm::AMDGPU::IsaInfo::getInstCacheLineSize
unsigned getInstCacheLineSize(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:1203

llvm::AMDGPU::IsaInfo::getNumExtraSGPRs
unsigned getNumExtraSGPRs(const MCSubtargetInfo &STI, bool VCCUsed, bool FlatScrUsed, bool XNACKUsed)
Definition AMDGPUBaseInfo.cpp:1371

llvm::AMDGPU::IsaInfo::getOccupancyWithNumSGPRs
unsigned getOccupancyWithNumSGPRs(unsigned SGPRs, unsigned MaxWaves, AMDGPUSubtarget::Generation Gen)
Definition AMDGPUBaseInfo.cpp:1501

llvm::AMDGPU
Definition AMDGPUMetadataVerifier.h:34

llvm::AMDGPU::isLitExpr
LLVM_READONLY bool isLitExpr(const MCExpr *Expr)
Definition AMDGPUMCExpr.cpp:730

llvm::AMDGPU::printAMDGPUMCExpr
void printAMDGPUMCExpr(const MCExpr *Expr, raw_ostream &OS, const MCAsmInfo *MAI)
Definition AMDGPUMCExpr.cpp:719

llvm::AMDGPU::isGFX12Plus
bool isGFX12Plus(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2647

llvm::AMDGPU::isGFX90A
bool isGFX90A(const MCSubtargetInfo &STI)
Definition AMDGPUBaseInfo.cpp:2703

llvm::AMDGPU::getExprKind
LLVM_READONLY AMDGPUMCExpr::VariantKind getExprKind(const MCExpr *Expr)
Definition AMDGPUMCExpr.cpp:742

llvm::AMDGPU::getLitValue
LLVM_READONLY int64_t getLitValue(const MCExpr *Expr)
Definition AMDGPUMCExpr.cpp:736

llvm::AMDGPU::foldAMDGPUMCExpr
const MCExpr * foldAMDGPUMCExpr(const MCExpr *Expr, MCContext &Ctx)
Definition AMDGPUMCExpr.cpp:710

llvm
Top-level namespace containing the LLVM libraries' public classes and functions.
Definition FunctionInfo.h:25

llvm::Value
FunctionAddr VTableAddr Value
Definition InstrProf.h:137

llvm::all_of
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1738

llvm::zip_equal
detail::zippy< detail::zip_first, T, U, Args... > zip_equal(T &&t, U &&u, Args &&...args)
zip iterator that assumes that all iteratees have the same length.
Definition STLExtras.h:840

llvm::Depth
@ Depth
Definition SIMachineScheduler.h:36

llvm::dyn_cast
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643

llvm::uninitialized_copy
auto uninitialized_copy(R &&Src, IterTy Dst)
Definition STLExtras.h:2110

llvm::LitModifier
LitModifier
Definition AMDGPUMCExpr.h:19

llvm::LitModifier::Lit64
@ Lit64
Definition AMDGPUMCExpr.h:19

llvm::LitModifier::Lit
@ Lit
Definition AMDGPUMCExpr.h:19

llvm::alignTo
constexpr uint64_t alignTo(uint64_t Size, Align A)
Returns a multiple of A needed to store Size bytes.
Definition Alignment.h:144

llvm::WaitForUnlockResult::Success
@ Success
The lock was released successfully.
Definition AdvisoryLock.h:20

llvm::divideCeil
constexpr T divideCeil(U Numerator, V Denominator)
Returns the integer ceil(Numerator / Denominator).
Definition MathExtras.h:394

llvm::ArrayRef
ArrayRef(const T &OneElt) -> ArrayRef< T >

llvm::BitWidth
constexpr unsigned BitWidth
Definition BitmaskEnum.h:219

llvm::cast
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559

llvm::fltNanEncoding::AllOnes
@ AllOnes
Definition APFloat.h:987

llvm::TensorType::Total
@ Total
Definition TensorSpec.h:59

raw_ostream.h

llvm::KnownBits
Definition KnownBits.h:24

llvm::KnownBits::makeConstant
static KnownBits makeConstant(const APInt &C)
Create known bits from a known constant.
Definition KnownBits.h:315

llvm::KnownBits::eq
static LLVM_ABI std::optional< bool > eq(const KnownBits &LHS, const KnownBits &RHS)
Determine if these known bits always give the same ICMP_EQ result.
Definition KnownBits.cpp:645

llvm::KnownBits::smax
static LLVM_ABI KnownBits smax(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for smax(LHS, RHS).
Definition KnownBits.cpp:333

llvm::KnownBits::makeNonNegative
void makeNonNegative()
Make this value non-negative.
Definition KnownBits.h:125

llvm::KnownBits::ashr
static LLVM_ABI KnownBits ashr(const KnownBits &LHS, const KnownBits &RHS, bool ShAmtNonZero=false, bool Exact=false)
Compute known bits for ashr(LHS, RHS).
Definition KnownBits.cpp:547

llvm::KnownBits::ne
static LLVM_ABI std::optional< bool > ne(const KnownBits &LHS, const KnownBits &RHS)
Determine if these known bits always give the same ICMP_NE result.
Definition KnownBits.cpp:653

llvm::KnownBits::makeNegative
void makeNegative()
Make this value negative.
Definition KnownBits.h:120

llvm::KnownBits::sge
static LLVM_ABI std::optional< bool > sge(const KnownBits &LHS, const KnownBits &RHS)
Determine if these known bits always give the same ICMP_SGE result.
Definition KnownBits.cpp:693

llvm::KnownBits::zext
KnownBits zext(unsigned BitWidth) const
Return known bits for a zero extension of the value we're tracking.
Definition KnownBits.h:176

llvm::KnownBits::isConstant
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54

llvm::KnownBits::add
static KnownBits add(const KnownBits &LHS, const KnownBits &RHS, bool NSW=false, bool NUW=false, bool SelfAdd=false)
Compute known bits resulting from addition of LHS and RHS.
Definition KnownBits.h:361

llvm::KnownBits::lshr
static LLVM_ABI KnownBits lshr(const KnownBits &LHS, const KnownBits &RHS, bool ShAmtNonZero=false, bool Exact=false)
Compute known bits for lshr(LHS, RHS).
Definition KnownBits.cpp:491

llvm::KnownBits::smin
static LLVM_ABI KnownBits smin(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for smin(LHS, RHS).
Definition KnownBits.cpp:337

llvm::KnownBits::srem
static LLVM_ABI KnownBits srem(const KnownBits &LHS, const KnownBits &RHS)
Compute known bits for srem(LHS, RHS).
Definition KnownBits.cpp:1269

llvm::KnownBits::slt
static LLVM_ABI std::optional< bool > slt(const KnownBits &LHS, const KnownBits &RHS)
Determine if these known bits always give the same ICMP_SLT result.
Definition KnownBits.cpp:699

llvm::KnownBits::sdiv
static LLVM_ABI KnownBits sdiv(const KnownBits &LHS, const KnownBits &RHS, bool Exact=false)
Compute known bits for sdiv(LHS, RHS).
Definition KnownBits.cpp:1156

llvm::KnownBits::sub
static KnownBits sub(const KnownBits &LHS, const KnownBits &RHS, bool NSW=false, bool NUW=false)
Compute known bits resulting from subtraction of LHS and RHS.
Definition KnownBits.h:376

llvm::KnownBits::mul
static LLVM_ABI KnownBits mul(const KnownBits &LHS, const KnownBits &RHS, bool NoUndefSelfMultiply=false)
Compute known bits resulting from multiplying LHS and RHS.
Definition KnownBits.cpp:1001

llvm::KnownBits::Zero
APInt Zero
Definition KnownBits.h:25

llvm::KnownBits::sle
static LLVM_ABI std::optional< bool > sle(const KnownBits &LHS, const KnownBits &RHS)
Determine if these known bits always give the same ICMP_SLE result.
Definition KnownBits.cpp:703

llvm::KnownBits::sgt
static LLVM_ABI std::optional< bool > sgt(const KnownBits &LHS, const KnownBits &RHS)
Determine if these known bits always give the same ICMP_SGT result.
Definition KnownBits.cpp:683

llvm::KnownBits::shl
static LLVM_ABI KnownBits shl(const KnownBits &LHS, const KnownBits &RHS, bool NUW=false, bool NSW=false, bool ShAmtNonZero=false)
Compute known bits for shl(LHS, RHS).
Definition KnownBits.cpp:407

llvm::KnownBits::getConstant
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:58