LLVM 23.0.0git
IRTranslator.cpp
Go to the documentation of this file.
1//===- llvm/CodeGen/GlobalISel/IRTranslator.cpp - IRTranslator ---*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8/// \file
9/// This file implements the IRTranslator class.
10//===----------------------------------------------------------------------===//
11
14#include "llvm/ADT/STLExtras.h"
15#include "llvm/ADT/ScopeExit.h"
20#include "llvm/Analysis/Loads.h"
50#include "llvm/IR/BasicBlock.h"
51#include "llvm/IR/CFG.h"
52#include "llvm/IR/Constant.h"
53#include "llvm/IR/Constants.h"
54#include "llvm/IR/DataLayout.h"
57#include "llvm/IR/Function.h"
59#include "llvm/IR/InlineAsm.h"
60#include "llvm/IR/InstrTypes.h"
63#include "llvm/IR/Intrinsics.h"
64#include "llvm/IR/IntrinsicsAMDGPU.h"
65#include "llvm/IR/LLVMContext.h"
66#include "llvm/IR/Metadata.h"
68#include "llvm/IR/Statepoint.h"
69#include "llvm/IR/Type.h"
70#include "llvm/IR/User.h"
71#include "llvm/IR/Value.h"
73#include "llvm/MC/MCContext.h"
74#include "llvm/Pass.h"
77#include "llvm/Support/Debug.h"
84#include <algorithm>
85#include <cassert>
86#include <cstdint>
87#include <iterator>
88#include <optional>
89#include <string>
90#include <utility>
91#include <vector>
92
93#define DEBUG_TYPE "irtranslator"
94
95using namespace llvm;
96
97static cl::opt<bool>
98 EnableCSEInIRTranslator("enable-cse-in-irtranslator",
99 cl::desc("Should enable CSE in irtranslator"),
100 cl::Optional, cl::init(false));
101char IRTranslator::ID = 0;
102
103INITIALIZE_PASS_BEGIN(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
104 false, false)
110INITIALIZE_PASS_END(IRTranslator, DEBUG_TYPE, "IRTranslator LLVM IR -> MI",
112
116 MF.getProperties().setFailedISel();
117 bool IsGlobalISelAbortEnabled =
118 MF.getTarget().Options.GlobalISelAbort == GlobalISelAbortMode::Enable;
119
120 // Print the function name explicitly if we don't have a debug location (which
121 // makes the diagnostic less useful) or if we're going to emit a raw error.
122 if (!R.getLocation().isValid() || IsGlobalISelAbortEnabled)
123 R << (" (in function: " + MF.getName() + ")").str();
124
125 if (IsGlobalISelAbortEnabled)
126 report_fatal_error(Twine(R.getMsg()));
127 else
128 ORE.emit(R);
129}
130
132 : MachineFunctionPass(ID), OptLevel(optlevel) {}
133
134#ifndef NDEBUG
135namespace {
136/// Verify that every instruction created has the same DILocation as the
137/// instruction being translated.
138class DILocationVerifier : public GISelChangeObserver {
139 const Instruction *CurrInst = nullptr;
140
141public:
142 DILocationVerifier() = default;
143 ~DILocationVerifier() override = default;
144
145 const Instruction *getCurrentInst() const { return CurrInst; }
146 void setCurrentInst(const Instruction *Inst) { CurrInst = Inst; }
147
148 void erasingInstr(MachineInstr &MI) override {}
149 void changingInstr(MachineInstr &MI) override {}
150 void changedInstr(MachineInstr &MI) override {}
151
152 void createdInstr(MachineInstr &MI) override {
153 assert(getCurrentInst() && "Inserted instruction without a current MI");
154
155 // Only print the check message if we're actually checking it.
156#ifndef NDEBUG
157 LLVM_DEBUG(dbgs() << "Checking DILocation from " << *CurrInst
158 << " was copied to " << MI);
159#endif
160 // We allow insts in the entry block to have no debug loc because
161 // they could have originated from constants, and we don't want a jumpy
162 // debug experience.
163 assert((CurrInst->getDebugLoc() == MI.getDebugLoc() ||
164 (MI.getParent()->isEntryBlock() && !MI.getDebugLoc()) ||
165 (MI.isDebugInstr())) &&
166 "Line info was not transferred to all instructions");
167 }
168};
169} // namespace
170#endif // ifndef NDEBUG
171
172
189
190IRTranslator::ValueToVRegInfo::VRegListT &
191IRTranslator::allocateVRegs(const Value &Val) {
192 auto VRegsIt = VMap.findVRegs(Val);
193 if (VRegsIt != VMap.vregs_end())
194 return *VRegsIt->second;
195 auto *Regs = VMap.getVRegs(Val);
196 auto *Offsets = VMap.getOffsets(Val);
197 SmallVector<LLT, 4> SplitTys;
198 computeValueLLTs(*DL, *Val.getType(), SplitTys,
199 Offsets->empty() ? Offsets : nullptr);
200 for (unsigned i = 0; i < SplitTys.size(); ++i)
201 Regs->push_back(0);
202 return *Regs;
203}
204
205ArrayRef<Register> IRTranslator::getOrCreateVRegs(const Value &Val) {
206 auto VRegsIt = VMap.findVRegs(Val);
207 if (VRegsIt != VMap.vregs_end())
208 return *VRegsIt->second;
209
210 if (Val.getType()->isVoidTy())
211 return *VMap.getVRegs(Val);
212
213 // Create entry for this type.
214 auto *VRegs = VMap.getVRegs(Val);
215 auto *Offsets = VMap.getOffsets(Val);
216
217 if (!Val.getType()->isTokenTy())
218 assert(Val.getType()->isSized() &&
219 "Don't know how to create an empty vreg");
220
221 // Fast-path values that lower to a single vreg.
222 if (!Val.getType()->isAggregateType()) {
223 LLT Ty = getLLTForType(*Val.getType(), *DL);
224 if (Offsets->empty())
225 Offsets->push_back(0);
226 VRegs->push_back(MRI->createGenericVirtualRegister(Ty));
227 if (isa<Constant>(Val)) {
228 bool Success = translate(cast<Constant>(Val), VRegs->front());
229 if (!Success) {
230 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
232 &MF->getFunction().getEntryBlock());
233 R << "unable to translate constant: " << ore::NV("Type", Val.getType());
234 reportTranslationError(*MF, *ORE, R);
235 }
236 }
237 return *VRegs;
238 }
239
240 SmallVector<LLT, 4> SplitTys;
241 computeValueLLTs(*DL, *Val.getType(), SplitTys,
242 Offsets->empty() ? Offsets : nullptr);
243
244 if (!isa<Constant>(Val)) {
245 for (auto Ty : SplitTys)
246 VRegs->push_back(MRI->createGenericVirtualRegister(Ty));
247 return *VRegs;
248 }
249
250 // UndefValue, ConstantAggregateZero
251 auto &C = cast<Constant>(Val);
252 unsigned Idx = 0;
253 while (auto Elt = C.getAggregateElement(Idx++)) {
254 auto EltRegs = getOrCreateVRegs(*Elt);
255 llvm::append_range(*VRegs, EltRegs);
256 }
257
258 return *VRegs;
259}
260
261int IRTranslator::getOrCreateFrameIndex(const AllocaInst &AI) {
262 auto [MapEntry, Inserted] = FrameIndices.try_emplace(&AI);
263 if (!Inserted)
264 return MapEntry->second;
265
266 TypeSize TySize = AI.getAllocationSize(*DL).value_or(TypeSize::getZero());
267 uint64_t Size = TySize.getKnownMinValue();
268
269 // Always allocate at least one byte.
270 Size = std::max<uint64_t>(Size, 1u);
271
272 int &FI = MapEntry->second;
273 FI = MF->getFrameInfo().CreateStackObject(Size, AI.getAlign(), false, &AI);
274
275 // Scalable vectors and structures that contain scalable vectors may
276 // need a special StackID to distinguish them from other (fixed size)
277 // stack objects.
278 if (TySize.isScalable()) {
279 auto StackID =
280 MF->getSubtarget().getFrameLowering()->getStackIDForScalableVectors();
281 MF->getFrameInfo().setStackID(FI, StackID);
282 }
283
284 return FI;
285}
286
287Align IRTranslator::getMemOpAlign(const Instruction &I) {
288 if (const StoreInst *SI = dyn_cast<StoreInst>(&I))
289 return SI->getAlign();
290 if (const LoadInst *LI = dyn_cast<LoadInst>(&I))
291 return LI->getAlign();
292 if (const AtomicCmpXchgInst *AI = dyn_cast<AtomicCmpXchgInst>(&I))
293 return AI->getAlign();
294 if (const AtomicRMWInst *AI = dyn_cast<AtomicRMWInst>(&I))
295 return AI->getAlign();
296
297 OptimizationRemarkMissed R("gisel-irtranslator", "", &I);
298 R << "unable to translate memop: " << ore::NV("Opcode", &I);
299 reportTranslationError(*MF, *ORE, R);
300 return Align(1);
301}
302
303MachineBasicBlock &IRTranslator::getMBB(const BasicBlock &BB) {
304 MachineBasicBlock *MBB = FuncInfo.getMBB(&BB);
305 assert(MBB && "BasicBlock was not encountered before");
306 return *MBB;
307}
308
309void IRTranslator::addMachineCFGPred(CFGEdge Edge, MachineBasicBlock *NewPred) {
310 assert(NewPred && "new predecessor must be a real MachineBasicBlock");
311 MachinePreds[Edge].push_back(NewPred);
312}
313
314bool IRTranslator::translateBinaryOp(unsigned Opcode, const User &U,
315 MachineIRBuilder &MIRBuilder) {
316 if (!mayTranslateUserTypes(U))
317 return false;
318
319 // Get or create a virtual register for each value.
320 // Unless the value is a Constant => loadimm cst?
321 // or inline constant each time?
322 // Creation of a virtual register needs to have a size.
323 Register Op0 = getOrCreateVReg(*U.getOperand(0));
324 Register Op1 = getOrCreateVReg(*U.getOperand(1));
325 Register Res = getOrCreateVReg(U);
326 uint32_t Flags = 0;
327 if (isa<Instruction>(U)) {
328 const Instruction &I = cast<Instruction>(U);
330 }
331
332 MIRBuilder.buildInstr(Opcode, {Res}, {Op0, Op1}, Flags);
333 return true;
334}
335
336bool IRTranslator::translateUnaryOp(unsigned Opcode, const User &U,
337 MachineIRBuilder &MIRBuilder) {
338 if (!mayTranslateUserTypes(U))
339 return false;
340
341 Register Op0 = getOrCreateVReg(*U.getOperand(0));
342 Register Res = getOrCreateVReg(U);
343 uint32_t Flags = 0;
344 if (isa<Instruction>(U)) {
345 const Instruction &I = cast<Instruction>(U);
347 }
348 MIRBuilder.buildInstr(Opcode, {Res}, {Op0}, Flags);
349 return true;
350}
351
352bool IRTranslator::translateFNeg(const User &U, MachineIRBuilder &MIRBuilder) {
353 return translateUnaryOp(TargetOpcode::G_FNEG, U, MIRBuilder);
354}
355
356bool IRTranslator::translateCompare(const User &U,
357 MachineIRBuilder &MIRBuilder) {
358 if (!mayTranslateUserTypes(U))
359 return false;
360
361 auto *CI = cast<CmpInst>(&U);
362 Register Op0 = getOrCreateVReg(*U.getOperand(0));
363 Register Op1 = getOrCreateVReg(*U.getOperand(1));
364 Register Res = getOrCreateVReg(U);
365 CmpInst::Predicate Pred = CI->getPredicate();
367 if (CmpInst::isIntPredicate(Pred))
368 MIRBuilder.buildICmp(Pred, Res, Op0, Op1, Flags);
369 else if (Pred == CmpInst::FCMP_FALSE)
370 MIRBuilder.buildCopy(
371 Res, getOrCreateVReg(*Constant::getNullValue(U.getType())));
372 else if (Pred == CmpInst::FCMP_TRUE)
373 MIRBuilder.buildCopy(
374 Res, getOrCreateVReg(*Constant::getAllOnesValue(U.getType())));
375 else
376 MIRBuilder.buildFCmp(Pred, Res, Op0, Op1, Flags);
377
378 return true;
379}
380
381bool IRTranslator::translateRet(const User &U, MachineIRBuilder &MIRBuilder) {
382 const ReturnInst &RI = cast<ReturnInst>(U);
383 const Value *Ret = RI.getReturnValue();
384 if (Ret && DL->getTypeStoreSize(Ret->getType()).isZero())
385 Ret = nullptr;
386
387 ArrayRef<Register> VRegs;
388 if (Ret)
389 VRegs = getOrCreateVRegs(*Ret);
390
391 Register SwiftErrorVReg = 0;
392 if (CLI->supportSwiftError() && SwiftError.getFunctionArg()) {
393 SwiftErrorVReg = SwiftError.getOrCreateVRegUseAt(
394 &RI, &MIRBuilder.getMBB(), SwiftError.getFunctionArg());
395 }
396
397 // The target may mess up with the insertion point, but
398 // this is not important as a return is the last instruction
399 // of the block anyway.
400 return CLI->lowerReturn(MIRBuilder, Ret, VRegs, FuncInfo, SwiftErrorVReg);
401}
402
403void IRTranslator::emitBranchForMergedCondition(
405 MachineBasicBlock *CurBB, MachineBasicBlock *SwitchBB,
406 BranchProbability TProb, BranchProbability FProb, bool InvertCond) {
407 // If the leaf of the tree is a comparison, merge the condition into
408 // the caseblock.
409 if (const CmpInst *BOp = dyn_cast<CmpInst>(Cond)) {
410 CmpInst::Predicate Condition;
411 if (const ICmpInst *IC = dyn_cast<ICmpInst>(Cond)) {
412 Condition = InvertCond ? IC->getInversePredicate() : IC->getPredicate();
413 } else {
414 const FCmpInst *FC = cast<FCmpInst>(Cond);
415 Condition = InvertCond ? FC->getInversePredicate() : FC->getPredicate();
416 }
417
418 SwitchCG::CaseBlock CB(Condition, false, BOp->getOperand(0),
419 BOp->getOperand(1), nullptr, TBB, FBB, CurBB,
420 CurBuilder->getDebugLoc(), TProb, FProb);
421 SL->SwitchCases.push_back(CB);
422 return;
423 }
424
425 // Create a CaseBlock record representing this branch.
427 SwitchCG::CaseBlock CB(
428 Pred, false, Cond, ConstantInt::getTrue(MF->getFunction().getContext()),
429 nullptr, TBB, FBB, CurBB, CurBuilder->getDebugLoc(), TProb, FProb);
430 SL->SwitchCases.push_back(CB);
431}
432
433static bool isValInBlock(const Value *V, const BasicBlock *BB) {
434 if (const Instruction *I = dyn_cast<Instruction>(V))
435 return I->getParent() == BB;
436 return true;
437}
438
439void IRTranslator::findMergedConditions(
441 MachineBasicBlock *CurBB, MachineBasicBlock *SwitchBB,
443 BranchProbability FProb, bool InvertCond) {
444 using namespace PatternMatch;
445 assert((Opc == Instruction::And || Opc == Instruction::Or) &&
446 "Expected Opc to be AND/OR");
447 // Skip over not part of the tree and remember to invert op and operands at
448 // next level.
449 Value *NotCond;
450 if (match(Cond, m_OneUse(m_Not(m_Value(NotCond)))) &&
451 isValInBlock(NotCond, CurBB->getBasicBlock())) {
452 findMergedConditions(NotCond, TBB, FBB, CurBB, SwitchBB, Opc, TProb, FProb,
453 !InvertCond);
454 return;
455 }
456
458 const Value *BOpOp0, *BOpOp1;
459 // Compute the effective opcode for Cond, taking into account whether it needs
460 // to be inverted, e.g.
461 // and (not (or A, B)), C
462 // gets lowered as
463 // and (and (not A, not B), C)
465 if (BOp) {
466 BOpc = match(BOp, m_LogicalAnd(m_Value(BOpOp0), m_Value(BOpOp1)))
467 ? Instruction::And
468 : (match(BOp, m_LogicalOr(m_Value(BOpOp0), m_Value(BOpOp1)))
469 ? Instruction::Or
471 if (InvertCond) {
472 if (BOpc == Instruction::And)
473 BOpc = Instruction::Or;
474 else if (BOpc == Instruction::Or)
475 BOpc = Instruction::And;
476 }
477 }
478
479 // If this node is not part of the or/and tree, emit it as a branch.
480 // Note that all nodes in the tree should have same opcode.
481 bool BOpIsInOrAndTree = BOpc && BOpc == Opc && BOp->hasOneUse();
482 if (!BOpIsInOrAndTree || BOp->getParent() != CurBB->getBasicBlock() ||
483 !isValInBlock(BOpOp0, CurBB->getBasicBlock()) ||
484 !isValInBlock(BOpOp1, CurBB->getBasicBlock())) {
485 emitBranchForMergedCondition(Cond, TBB, FBB, CurBB, SwitchBB, TProb, FProb,
486 InvertCond);
487 return;
488 }
489
490 // Create TmpBB after CurBB.
491 MachineFunction::iterator BBI(CurBB);
492 MachineBasicBlock *TmpBB =
493 MF->CreateMachineBasicBlock(CurBB->getBasicBlock());
494 CurBB->getParent()->insert(++BBI, TmpBB);
495
496 if (Opc == Instruction::Or) {
497 // Codegen X | Y as:
498 // BB1:
499 // jmp_if_X TBB
500 // jmp TmpBB
501 // TmpBB:
502 // jmp_if_Y TBB
503 // jmp FBB
504 //
505
506 // We have flexibility in setting Prob for BB1 and Prob for TmpBB.
507 // The requirement is that
508 // TrueProb for BB1 + (FalseProb for BB1 * TrueProb for TmpBB)
509 // = TrueProb for original BB.
510 // Assuming the original probabilities are A and B, one choice is to set
511 // BB1's probabilities to A/2 and A/2+B, and set TmpBB's probabilities to
512 // A/(1+B) and 2B/(1+B). This choice assumes that
513 // TrueProb for BB1 == FalseProb for BB1 * TrueProb for TmpBB.
514 // Another choice is to assume TrueProb for BB1 equals to TrueProb for
515 // TmpBB, but the math is more complicated.
516
517 auto NewTrueProb = TProb / 2;
518 auto NewFalseProb = TProb / 2 + FProb;
519 // Emit the LHS condition.
520 findMergedConditions(BOpOp0, TBB, TmpBB, CurBB, SwitchBB, Opc, NewTrueProb,
521 NewFalseProb, InvertCond);
522
523 // Normalize A/2 and B to get A/(1+B) and 2B/(1+B).
524 SmallVector<BranchProbability, 2> Probs{TProb / 2, FProb};
526 // Emit the RHS condition into TmpBB.
527 findMergedConditions(BOpOp1, TBB, FBB, TmpBB, SwitchBB, Opc, Probs[0],
528 Probs[1], InvertCond);
529 } else {
530 assert(Opc == Instruction::And && "Unknown merge op!");
531 // Codegen X & Y as:
532 // BB1:
533 // jmp_if_X TmpBB
534 // jmp FBB
535 // TmpBB:
536 // jmp_if_Y TBB
537 // jmp FBB
538 //
539 // This requires creation of TmpBB after CurBB.
540
541 // We have flexibility in setting Prob for BB1 and Prob for TmpBB.
542 // The requirement is that
543 // FalseProb for BB1 + (TrueProb for BB1 * FalseProb for TmpBB)
544 // = FalseProb for original BB.
545 // Assuming the original probabilities are A and B, one choice is to set
546 // BB1's probabilities to A+B/2 and B/2, and set TmpBB's probabilities to
547 // 2A/(1+A) and B/(1+A). This choice assumes that FalseProb for BB1 ==
548 // TrueProb for BB1 * FalseProb for TmpBB.
549
550 auto NewTrueProb = TProb + FProb / 2;
551 auto NewFalseProb = FProb / 2;
552 // Emit the LHS condition.
553 findMergedConditions(BOpOp0, TmpBB, FBB, CurBB, SwitchBB, Opc, NewTrueProb,
554 NewFalseProb, InvertCond);
555
556 // Normalize A and B/2 to get 2A/(1+A) and B/(1+A).
557 SmallVector<BranchProbability, 2> Probs{TProb, FProb / 2};
559 // Emit the RHS condition into TmpBB.
560 findMergedConditions(BOpOp1, TBB, FBB, TmpBB, SwitchBB, Opc, Probs[0],
561 Probs[1], InvertCond);
562 }
563}
564
565bool IRTranslator::shouldEmitAsBranches(
566 const std::vector<SwitchCG::CaseBlock> &Cases) {
567 // For multiple cases, it's better to emit as branches.
568 if (Cases.size() != 2)
569 return true;
570
571 // If this is two comparisons of the same values or'd or and'd together, they
572 // will get folded into a single comparison, so don't emit two blocks.
573 if ((Cases[0].CmpLHS == Cases[1].CmpLHS &&
574 Cases[0].CmpRHS == Cases[1].CmpRHS) ||
575 (Cases[0].CmpRHS == Cases[1].CmpLHS &&
576 Cases[0].CmpLHS == Cases[1].CmpRHS)) {
577 return false;
578 }
579
580 // Handle: (X != null) | (Y != null) --> (X|Y) != 0
581 // Handle: (X == null) & (Y == null) --> (X|Y) == 0
582 if (Cases[0].CmpRHS == Cases[1].CmpRHS &&
583 Cases[0].PredInfo.Pred == Cases[1].PredInfo.Pred &&
584 isa<Constant>(Cases[0].CmpRHS) &&
585 cast<Constant>(Cases[0].CmpRHS)->isNullValue()) {
586 if (Cases[0].PredInfo.Pred == CmpInst::ICMP_EQ &&
587 Cases[0].TrueBB == Cases[1].ThisBB)
588 return false;
589 if (Cases[0].PredInfo.Pred == CmpInst::ICMP_NE &&
590 Cases[0].FalseBB == Cases[1].ThisBB)
591 return false;
592 }
593
594 return true;
595}
596
597bool IRTranslator::translateUncondBr(const User &U,
598 MachineIRBuilder &MIRBuilder) {
599 const UncondBrInst &BrInst = cast<UncondBrInst>(U);
600 auto &CurMBB = MIRBuilder.getMBB();
601 auto *Succ0MBB = &getMBB(*BrInst.getSuccessor(0));
602
603 // If the unconditional target is the layout successor, fallthrough.
604 if (OptLevel == CodeGenOptLevel::None || !CurMBB.isLayoutSuccessor(Succ0MBB))
605 MIRBuilder.buildBr(*Succ0MBB);
606
607 // Link successors.
608 for (const BasicBlock *Succ : successors(&BrInst))
609 CurMBB.addSuccessor(&getMBB(*Succ));
610 return true;
611}
612
613bool IRTranslator::translateCondBr(const User &U,
614 MachineIRBuilder &MIRBuilder) {
615 const CondBrInst &BrInst = cast<CondBrInst>(U);
616 auto &CurMBB = MIRBuilder.getMBB();
617 auto *Succ0MBB = &getMBB(*BrInst.getSuccessor(0));
618
619 // If this condition is one of the special cases we handle, do special stuff
620 // now.
621 const Value *CondVal = BrInst.getCondition();
622 MachineBasicBlock *Succ1MBB = &getMBB(*BrInst.getSuccessor(1));
623
624 // If this is a series of conditions that are or'd or and'd together, emit
625 // this as a sequence of branches instead of setcc's with and/or operations.
626 // As long as jumps are not expensive (exceptions for multi-use logic ops,
627 // unpredictable branches, and vector extracts because those jumps are likely
628 // expensive for any target), this should improve performance.
629 // For example, instead of something like:
630 // cmp A, B
631 // C = seteq
632 // cmp D, E
633 // F = setle
634 // or C, F
635 // jnz foo
636 // Emit:
637 // cmp A, B
638 // je foo
639 // cmp D, E
640 // jle foo
641 using namespace PatternMatch;
642 const Instruction *CondI = dyn_cast<Instruction>(CondVal);
643 if (!TLI->isJumpExpensive() && CondI && CondI->hasOneUse() &&
644 !BrInst.hasMetadata(LLVMContext::MD_unpredictable)) {
646 Value *Vec;
647 const Value *BOp0, *BOp1;
648 if (match(CondI, m_LogicalAnd(m_Value(BOp0), m_Value(BOp1))))
649 Opcode = Instruction::And;
650 else if (match(CondI, m_LogicalOr(m_Value(BOp0), m_Value(BOp1))))
651 Opcode = Instruction::Or;
652
653 if (Opcode && !(match(BOp0, m_ExtractElt(m_Value(Vec), m_Value())) &&
654 match(BOp1, m_ExtractElt(m_Specific(Vec), m_Value())))) {
655 findMergedConditions(CondI, Succ0MBB, Succ1MBB, &CurMBB, &CurMBB, Opcode,
656 getEdgeProbability(&CurMBB, Succ0MBB),
657 getEdgeProbability(&CurMBB, Succ1MBB),
658 /*InvertCond=*/false);
659 assert(SL->SwitchCases[0].ThisBB == &CurMBB && "Unexpected lowering!");
660
661 // Allow some cases to be rejected.
662 if (shouldEmitAsBranches(SL->SwitchCases)) {
663 // Emit the branch for this block.
664 emitSwitchCase(SL->SwitchCases[0], &CurMBB, *CurBuilder);
665 SL->SwitchCases.erase(SL->SwitchCases.begin());
666 return true;
667 }
668
669 // Okay, we decided not to do this, remove any inserted MBB's and clear
670 // SwitchCases.
671 for (unsigned I = 1, E = SL->SwitchCases.size(); I != E; ++I)
672 MF->erase(SL->SwitchCases[I].ThisBB);
673
674 SL->SwitchCases.clear();
675 }
676 }
677
678 // Create a CaseBlock record representing this branch.
679 SwitchCG::CaseBlock CB(CmpInst::ICMP_EQ, false, CondVal,
680 ConstantInt::getTrue(MF->getFunction().getContext()),
681 nullptr, Succ0MBB, Succ1MBB, &CurMBB,
682 CurBuilder->getDebugLoc());
683
684 // Use emitSwitchCase to actually insert the fast branch sequence for this
685 // cond branch.
686 emitSwitchCase(CB, &CurMBB, *CurBuilder);
687 return true;
688}
689
690void IRTranslator::addSuccessorWithProb(MachineBasicBlock *Src,
692 BranchProbability Prob) {
693 if (!FuncInfo.BPI) {
694 Src->addSuccessorWithoutProb(Dst);
695 return;
696 }
697 if (Prob.isUnknown())
698 Prob = getEdgeProbability(Src, Dst);
699 Src->addSuccessor(Dst, Prob);
700}
701
703IRTranslator::getEdgeProbability(const MachineBasicBlock *Src,
704 const MachineBasicBlock *Dst) const {
705 const BasicBlock *SrcBB = Src->getBasicBlock();
706 const BasicBlock *DstBB = Dst->getBasicBlock();
707 if (!FuncInfo.BPI) {
708 // If BPI is not available, set the default probability as 1 / N, where N is
709 // the number of successors.
710 auto SuccSize = std::max<uint32_t>(succ_size(SrcBB), 1);
711 return BranchProbability(1, SuccSize);
712 }
713 return FuncInfo.BPI->getEdgeProbability(SrcBB, DstBB);
714}
715
716bool IRTranslator::translateSwitch(const User &U, MachineIRBuilder &MIB) {
717 using namespace SwitchCG;
718 // Extract cases from the switch.
719 const SwitchInst &SI = cast<SwitchInst>(U);
720 BranchProbabilityInfo *BPI = FuncInfo.BPI;
721 CaseClusterVector Clusters;
722 Clusters.reserve(SI.getNumCases());
723 for (const auto &I : SI.cases()) {
724 MachineBasicBlock *Succ = &getMBB(*I.getCaseSuccessor());
725 assert(Succ && "Could not find successor mbb in mapping");
726 const ConstantInt *CaseVal = I.getCaseValue();
727 BranchProbability Prob =
728 BPI ? BPI->getEdgeProbability(SI.getParent(), I.getSuccessorIndex())
729 : BranchProbability(1, SI.getNumCases() + 1);
730 Clusters.push_back(CaseCluster::range(CaseVal, CaseVal, Succ, Prob));
731 }
732
733 MachineBasicBlock *DefaultMBB = &getMBB(*SI.getDefaultDest());
734
735 // Cluster adjacent cases with the same destination. We do this at all
736 // optimization levels because it's cheap to do and will make codegen faster
737 // if there are many clusters.
738 sortAndRangeify(Clusters);
739
740 MachineBasicBlock *SwitchMBB = &getMBB(*SI.getParent());
741
742 // If there is only the default destination, jump there directly.
743 if (Clusters.empty()) {
744 SwitchMBB->addSuccessor(DefaultMBB);
745 if (DefaultMBB != SwitchMBB->getNextNode())
746 MIB.buildBr(*DefaultMBB);
747 return true;
748 }
749
750 SL->findJumpTables(Clusters, &SI, std::nullopt, DefaultMBB, nullptr, nullptr);
751 SL->findBitTestClusters(Clusters, &SI);
752
753 LLVM_DEBUG({
754 dbgs() << "Case clusters: ";
755 for (const CaseCluster &C : Clusters) {
756 if (C.Kind == CC_JumpTable)
757 dbgs() << "JT:";
758 if (C.Kind == CC_BitTests)
759 dbgs() << "BT:";
760
761 C.Low->getValue().print(dbgs(), true);
762 if (C.Low != C.High) {
763 dbgs() << '-';
764 C.High->getValue().print(dbgs(), true);
765 }
766 dbgs() << ' ';
767 }
768 dbgs() << '\n';
769 });
770
771 assert(!Clusters.empty());
772 SwitchWorkList WorkList;
773 CaseClusterIt First = Clusters.begin();
774 CaseClusterIt Last = Clusters.end() - 1;
775 auto DefaultProb = getEdgeProbability(SwitchMBB, DefaultMBB);
776 WorkList.push_back({SwitchMBB, First, Last, nullptr, nullptr, DefaultProb});
777
778 while (!WorkList.empty()) {
779 SwitchWorkListItem W = WorkList.pop_back_val();
780
781 unsigned NumClusters = W.LastCluster - W.FirstCluster + 1;
782 // For optimized builds, lower large range as a balanced binary tree.
783 if (NumClusters > 3 &&
784 MF->getTarget().getOptLevel() != CodeGenOptLevel::None &&
785 !DefaultMBB->getParent()->getFunction().hasMinSize()) {
786 splitWorkItem(WorkList, W, SI.getCondition(), SwitchMBB, MIB);
787 continue;
788 }
789
790 if (!lowerSwitchWorkItem(W, SI.getCondition(), SwitchMBB, DefaultMBB, MIB))
791 return false;
792 }
793 return true;
794}
795
796void IRTranslator::splitWorkItem(SwitchCG::SwitchWorkList &WorkList,
798 Value *Cond, MachineBasicBlock *SwitchMBB,
799 MachineIRBuilder &MIB) {
800 using namespace SwitchCG;
801 assert(W.FirstCluster->Low->getValue().slt(W.LastCluster->Low->getValue()) &&
802 "Clusters not sorted?");
803 assert(W.LastCluster - W.FirstCluster + 1 >= 2 && "Too small to split!");
804
805 auto [LastLeft, FirstRight, LeftProb, RightProb] =
806 SL->computeSplitWorkItemInfo(W);
807
808 // Use the first element on the right as pivot since we will make less-than
809 // comparisons against it.
810 CaseClusterIt PivotCluster = FirstRight;
811 assert(PivotCluster > W.FirstCluster);
812 assert(PivotCluster <= W.LastCluster);
813
814 CaseClusterIt FirstLeft = W.FirstCluster;
815 CaseClusterIt LastRight = W.LastCluster;
816
817 const ConstantInt *Pivot = PivotCluster->Low;
818
819 // New blocks will be inserted immediately after the current one.
821 ++BBI;
822
823 // We will branch to the LHS if Value < Pivot. If LHS is a single cluster,
824 // we can branch to its destination directly if it's squeezed exactly in
825 // between the known lower bound and Pivot - 1.
826 MachineBasicBlock *LeftMBB;
827 if (FirstLeft == LastLeft && FirstLeft->Kind == CC_Range &&
828 FirstLeft->Low == W.GE &&
829 (FirstLeft->High->getValue() + 1LL) == Pivot->getValue()) {
830 LeftMBB = FirstLeft->MBB;
831 } else {
832 LeftMBB = FuncInfo.MF->CreateMachineBasicBlock(W.MBB->getBasicBlock());
833 FuncInfo.MF->insert(BBI, LeftMBB);
834 WorkList.push_back(
835 {LeftMBB, FirstLeft, LastLeft, W.GE, Pivot, W.DefaultProb / 2});
836 }
837
838 // Similarly, we will branch to the RHS if Value >= Pivot. If RHS is a
839 // single cluster, RHS.Low == Pivot, and we can branch to its destination
840 // directly if RHS.High equals the current upper bound.
841 MachineBasicBlock *RightMBB;
842 if (FirstRight == LastRight && FirstRight->Kind == CC_Range && W.LT &&
843 (FirstRight->High->getValue() + 1ULL) == W.LT->getValue()) {
844 RightMBB = FirstRight->MBB;
845 } else {
846 RightMBB = FuncInfo.MF->CreateMachineBasicBlock(W.MBB->getBasicBlock());
847 FuncInfo.MF->insert(BBI, RightMBB);
848 WorkList.push_back(
849 {RightMBB, FirstRight, LastRight, Pivot, W.LT, W.DefaultProb / 2});
850 }
851
852 // Create the CaseBlock record that will be used to lower the branch.
853 CaseBlock CB(ICmpInst::Predicate::ICMP_SLT, false, Cond, Pivot, nullptr,
854 LeftMBB, RightMBB, W.MBB, MIB.getDebugLoc(), LeftProb,
855 RightProb);
856
857 if (W.MBB == SwitchMBB)
858 emitSwitchCase(CB, SwitchMBB, MIB);
859 else
860 SL->SwitchCases.push_back(CB);
861}
862
863void IRTranslator::emitJumpTable(SwitchCG::JumpTable &JT,
865 // Emit the code for the jump table
866 assert(JT.Reg && "Should lower JT Header first!");
867 MachineIRBuilder MIB(*MBB->getParent());
868 MIB.setMBB(*MBB);
869 MIB.setDebugLoc(CurBuilder->getDebugLoc());
870
871 Type *PtrIRTy = PointerType::getUnqual(MF->getFunction().getContext());
872 const LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
873
874 auto Table = MIB.buildJumpTable(PtrTy, JT.JTI);
875 MIB.buildBrJT(Table.getReg(0), JT.JTI, JT.Reg);
876}
877
878bool IRTranslator::emitJumpTableHeader(SwitchCG::JumpTable &JT,
880 MachineBasicBlock *HeaderBB) {
881 MachineIRBuilder MIB(*HeaderBB->getParent());
882 MIB.setMBB(*HeaderBB);
883 MIB.setDebugLoc(CurBuilder->getDebugLoc());
884
885 const Value &SValue = *JTH.SValue;
886 // Subtract the lowest switch case value from the value being switched on.
887 const LLT SwitchTy = getLLTForType(*SValue.getType(), *DL);
888 Register SwitchOpReg = getOrCreateVReg(SValue);
889 auto FirstCst = MIB.buildConstant(SwitchTy, JTH.First);
890 auto Sub = MIB.buildSub({SwitchTy}, SwitchOpReg, FirstCst);
891
892 // This value may be smaller or larger than the target's pointer type, and
893 // therefore require extension or truncating.
894 auto *PtrIRTy = PointerType::getUnqual(SValue.getContext());
895 const LLT PtrScalarTy = LLT::integer(DL->getTypeSizeInBits(PtrIRTy));
896 Sub = MIB.buildZExtOrTrunc(PtrScalarTy, Sub);
897
898 JT.Reg = Sub.getReg(0);
899
900 if (JTH.FallthroughUnreachable) {
901 if (JT.MBB != HeaderBB->getNextNode())
902 MIB.buildBr(*JT.MBB);
903 return true;
904 }
905
906 // Emit the range check for the jump table, and branch to the default block
907 // for the switch statement if the value being switched on exceeds the
908 // largest case in the switch.
909 auto Cst = getOrCreateVReg(
910 *ConstantInt::get(SValue.getType(), JTH.Last - JTH.First));
911 Cst = MIB.buildZExtOrTrunc(PtrScalarTy, Cst).getReg(0);
912 auto Cmp = MIB.buildICmp(CmpInst::ICMP_UGT, LLT::integer(1), Sub, Cst);
913
914 auto BrCond = MIB.buildBrCond(Cmp.getReg(0), *JT.Default);
915
916 // Avoid emitting unnecessary branches to the next block.
917 if (JT.MBB != HeaderBB->getNextNode())
918 BrCond = MIB.buildBr(*JT.MBB);
919 return true;
920}
921
922void IRTranslator::emitSwitchCase(SwitchCG::CaseBlock &CB,
923 MachineBasicBlock *SwitchBB,
924 MachineIRBuilder &MIB) {
925 Register CondLHS = getOrCreateVReg(*CB.CmpLHS);
927 DebugLoc OldDbgLoc = MIB.getDebugLoc();
928 MIB.setDebugLoc(CB.DbgLoc);
929 MIB.setMBB(*CB.ThisBB);
930
931 if (CB.PredInfo.NoCmp) {
932 // Branch or fall through to TrueBB.
933 addSuccessorWithProb(CB.ThisBB, CB.TrueBB, CB.TrueProb);
934 addMachineCFGPred({SwitchBB->getBasicBlock(), CB.TrueBB->getBasicBlock()},
935 CB.ThisBB);
937 if (CB.TrueBB != CB.ThisBB->getNextNode())
938 MIB.buildBr(*CB.TrueBB);
939 MIB.setDebugLoc(OldDbgLoc);
940 return;
941 }
942
943 const LLT i1Ty = LLT::integer(1);
944 // Build the compare.
945 if (!CB.CmpMHS) {
946 const auto *CI = dyn_cast<ConstantInt>(CB.CmpRHS);
947 // For conditional branch lowering, we might try to do something silly like
948 // emit an G_ICMP to compare an existing G_ICMP i1 result with true. If so,
949 // just re-use the existing condition vreg.
950 if (MRI->getType(CondLHS).getSizeInBits() == 1 && CI && CI->isOne() &&
952 Cond = CondLHS;
953 } else {
954 Register CondRHS = getOrCreateVReg(*CB.CmpRHS);
956 Cond =
957 MIB.buildFCmp(CB.PredInfo.Pred, i1Ty, CondLHS, CondRHS).getReg(0);
958 else
959 Cond =
960 MIB.buildICmp(CB.PredInfo.Pred, i1Ty, CondLHS, CondRHS).getReg(0);
961 }
962 } else {
964 "Can only handle SLE ranges");
965
966 const APInt& Low = cast<ConstantInt>(CB.CmpLHS)->getValue();
967 const APInt& High = cast<ConstantInt>(CB.CmpRHS)->getValue();
968
969 Register CmpOpReg = getOrCreateVReg(*CB.CmpMHS);
970 if (cast<ConstantInt>(CB.CmpLHS)->isMinValue(true)) {
971 Register CondRHS = getOrCreateVReg(*CB.CmpRHS);
972 Cond =
973 MIB.buildICmp(CmpInst::ICMP_SLE, i1Ty, CmpOpReg, CondRHS).getReg(0);
974 } else {
975 const LLT CmpTy = MRI->getType(CmpOpReg);
976 auto Sub = MIB.buildSub({CmpTy}, CmpOpReg, CondLHS);
977 auto Diff = MIB.buildConstant(CmpTy, High - Low);
978 Cond = MIB.buildICmp(CmpInst::ICMP_ULE, i1Ty, Sub, Diff).getReg(0);
979 }
980 }
981
982 // Update successor info
983 addSuccessorWithProb(CB.ThisBB, CB.TrueBB, CB.TrueProb);
984
985 addMachineCFGPred({SwitchBB->getBasicBlock(), CB.TrueBB->getBasicBlock()},
986 CB.ThisBB);
987
988 // TrueBB and FalseBB are always different unless the incoming IR is
989 // degenerate. This only happens when running llc on weird IR.
990 if (CB.TrueBB != CB.FalseBB)
991 addSuccessorWithProb(CB.ThisBB, CB.FalseBB, CB.FalseProb);
993
994 addMachineCFGPred({SwitchBB->getBasicBlock(), CB.FalseBB->getBasicBlock()},
995 CB.ThisBB);
996
997 MIB.buildBrCond(Cond, *CB.TrueBB);
998 MIB.buildBr(*CB.FalseBB);
999 MIB.setDebugLoc(OldDbgLoc);
1000}
1001
1002bool IRTranslator::lowerJumpTableWorkItem(SwitchCG::SwitchWorkListItem W,
1003 MachineBasicBlock *SwitchMBB,
1004 MachineBasicBlock *CurMBB,
1005 MachineBasicBlock *DefaultMBB,
1006 MachineIRBuilder &MIB,
1008 BranchProbability UnhandledProbs,
1010 MachineBasicBlock *Fallthrough,
1011 bool FallthroughUnreachable) {
1012 using namespace SwitchCG;
1013 MachineFunction *CurMF = SwitchMBB->getParent();
1014 // FIXME: Optimize away range check based on pivot comparisons.
1015 JumpTableHeader *JTH = &SL->JTCases[I->JTCasesIndex].first;
1016 SwitchCG::JumpTable *JT = &SL->JTCases[I->JTCasesIndex].second;
1017 BranchProbability DefaultProb = W.DefaultProb;
1018
1019 // The jump block hasn't been inserted yet; insert it here.
1020 MachineBasicBlock *JumpMBB = JT->MBB;
1021 CurMF->insert(BBI, JumpMBB);
1022
1023 // Since the jump table block is separate from the switch block, we need
1024 // to keep track of it as a machine predecessor to the default block,
1025 // otherwise we lose the phi edges.
1026 addMachineCFGPred({SwitchMBB->getBasicBlock(), DefaultMBB->getBasicBlock()},
1027 CurMBB);
1028 addMachineCFGPred({SwitchMBB->getBasicBlock(), DefaultMBB->getBasicBlock()},
1029 JumpMBB);
1030
1031 auto JumpProb = I->Prob;
1032 auto FallthroughProb = UnhandledProbs;
1033
1034 // If the default statement is a target of the jump table, we evenly
1035 // distribute the default probability to successors of CurMBB. Also
1036 // update the probability on the edge from JumpMBB to Fallthrough.
1037 for (MachineBasicBlock::succ_iterator SI = JumpMBB->succ_begin(),
1038 SE = JumpMBB->succ_end();
1039 SI != SE; ++SI) {
1040 if (*SI == DefaultMBB) {
1041 JumpProb += DefaultProb / 2;
1042 FallthroughProb -= DefaultProb / 2;
1043 JumpMBB->setSuccProbability(SI, DefaultProb / 2);
1044 JumpMBB->normalizeSuccProbs();
1045 } else {
1046 // Also record edges from the jump table block to it's successors.
1047 addMachineCFGPred({SwitchMBB->getBasicBlock(), (*SI)->getBasicBlock()},
1048 JumpMBB);
1049 }
1050 }
1051
1052 if (FallthroughUnreachable)
1053 JTH->FallthroughUnreachable = true;
1054
1055 if (!JTH->FallthroughUnreachable)
1056 addSuccessorWithProb(CurMBB, Fallthrough, FallthroughProb);
1057 addSuccessorWithProb(CurMBB, JumpMBB, JumpProb);
1058 CurMBB->normalizeSuccProbs();
1059
1060 // The jump table header will be inserted in our current block, do the
1061 // range check, and fall through to our fallthrough block.
1062 JTH->HeaderBB = CurMBB;
1063 JT->Default = Fallthrough; // FIXME: Move Default to JumpTableHeader.
1064
1065 // If we're in the right place, emit the jump table header right now.
1066 if (CurMBB == SwitchMBB) {
1067 if (!emitJumpTableHeader(*JT, *JTH, CurMBB))
1068 return false;
1069 JTH->Emitted = true;
1070 }
1071 return true;
1072}
1073bool IRTranslator::lowerSwitchRangeWorkItem(SwitchCG::CaseClusterIt I,
1074 Value *Cond,
1075 MachineBasicBlock *Fallthrough,
1076 bool FallthroughUnreachable,
1077 BranchProbability UnhandledProbs,
1078 MachineBasicBlock *CurMBB,
1079 MachineIRBuilder &MIB,
1080 MachineBasicBlock *SwitchMBB) {
1081 using namespace SwitchCG;
1082 const Value *RHS, *LHS, *MHS;
1083 CmpInst::Predicate Pred;
1084 if (I->Low == I->High) {
1085 // Check Cond == I->Low.
1086 Pred = CmpInst::ICMP_EQ;
1087 LHS = Cond;
1088 RHS = I->Low;
1089 MHS = nullptr;
1090 } else {
1091 // Check I->Low <= Cond <= I->High.
1092 Pred = CmpInst::ICMP_SLE;
1093 LHS = I->Low;
1094 MHS = Cond;
1095 RHS = I->High;
1096 }
1097
1098 // If Fallthrough is unreachable, fold away the comparison.
1099 // The false probability is the sum of all unhandled cases.
1100 CaseBlock CB(Pred, FallthroughUnreachable, LHS, RHS, MHS, I->MBB, Fallthrough,
1101 CurMBB, MIB.getDebugLoc(), I->Prob, UnhandledProbs);
1102
1103 emitSwitchCase(CB, SwitchMBB, MIB);
1104 return true;
1105}
1106
1107void IRTranslator::emitBitTestHeader(SwitchCG::BitTestBlock &B,
1108 MachineBasicBlock *SwitchBB) {
1109 MachineIRBuilder &MIB = *CurBuilder;
1110 MIB.setMBB(*SwitchBB);
1111
1112 // Subtract the minimum value.
1113 Register SwitchOpReg = getOrCreateVReg(*B.SValue);
1114
1115 LLT SwitchOpTy = MRI->getType(SwitchOpReg);
1116 Register MinValReg = MIB.buildConstant(SwitchOpTy, B.First).getReg(0);
1117 auto RangeSub = MIB.buildSub(SwitchOpTy, SwitchOpReg, MinValReg);
1118
1119 Type *PtrIRTy = PointerType::getUnqual(MF->getFunction().getContext());
1120 const LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
1121
1122 LLT MaskTy = SwitchOpTy;
1123 if (MaskTy.getSizeInBits() > PtrTy.getSizeInBits() ||
1125 MaskTy = LLT::integer(PtrTy.getSizeInBits());
1126 else {
1127 // Ensure that the type will fit the mask value.
1128 for (const SwitchCG::BitTestCase &Case : B.Cases) {
1129 if (!isUIntN(SwitchOpTy.getSizeInBits(), Case.Mask)) {
1130 // Switch table case range are encoded into series of masks.
1131 // Just use pointer type, it's guaranteed to fit.
1132 MaskTy = LLT::integer(PtrTy.getSizeInBits());
1133 break;
1134 }
1135 }
1136 }
1137 Register SubReg = RangeSub.getReg(0);
1138 if (SwitchOpTy != MaskTy)
1139 SubReg = MIB.buildZExtOrTrunc(MaskTy, SubReg).getReg(0);
1140
1141 B.RegVT = getMVTForLLT(MaskTy);
1142 B.Reg = SubReg;
1143
1144 MachineBasicBlock *MBB = B.Cases[0].ThisBB;
1145
1146 if (!B.FallthroughUnreachable)
1147 addSuccessorWithProb(SwitchBB, B.Default, B.DefaultProb);
1148 addSuccessorWithProb(SwitchBB, MBB, B.Prob);
1149
1150 SwitchBB->normalizeSuccProbs();
1151
1152 if (!B.FallthroughUnreachable) {
1153 // Conditional branch to the default block.
1154 auto RangeCst = MIB.buildConstant(SwitchOpTy, B.Range);
1155 auto RangeCmp = MIB.buildICmp(CmpInst::Predicate::ICMP_UGT, LLT::integer(1),
1156 RangeSub, RangeCst);
1157 MIB.buildBrCond(RangeCmp, *B.Default);
1158 }
1159
1160 // Avoid emitting unnecessary branches to the next block.
1161 if (MBB != SwitchBB->getNextNode())
1162 MIB.buildBr(*MBB);
1163}
1164
1165void IRTranslator::emitBitTestCase(SwitchCG::BitTestBlock &BB,
1166 MachineBasicBlock *NextMBB,
1167 BranchProbability BranchProbToNext,
1169 MachineBasicBlock *SwitchBB) {
1170 MachineIRBuilder &MIB = *CurBuilder;
1171 MIB.setMBB(*SwitchBB);
1172
1173 LLT SwitchTy = getLLTForMVT(BB.RegVT);
1174 Register Cmp;
1175 unsigned PopCount = llvm::popcount(B.Mask);
1176 if (PopCount == 1) {
1177 // Testing for a single bit; just compare the shift count with what it
1178 // would need to be to shift a 1 bit in that position.
1179 auto MaskTrailingZeros =
1180 MIB.buildConstant(SwitchTy, llvm::countr_zero(B.Mask));
1182 MaskTrailingZeros)
1183 .getReg(0);
1184 } else if (PopCount == BB.Range) {
1185 // There is only one zero bit in the range, test for it directly.
1186 auto MaskTrailingOnes =
1187 MIB.buildConstant(SwitchTy, llvm::countr_one(B.Mask));
1188 Cmp =
1189 MIB.buildICmp(CmpInst::ICMP_NE, LLT::integer(1), Reg, MaskTrailingOnes)
1190 .getReg(0);
1191 } else {
1192 // Make desired shift.
1193 auto CstOne = MIB.buildConstant(SwitchTy, 1);
1194 auto SwitchVal = MIB.buildShl(SwitchTy, CstOne, Reg);
1195
1196 // Emit bit tests and jumps.
1197 auto CstMask = MIB.buildConstant(SwitchTy, B.Mask);
1198 auto AndOp = MIB.buildAnd(SwitchTy, SwitchVal, CstMask);
1199 auto CstZero = MIB.buildConstant(SwitchTy, 0);
1200 Cmp = MIB.buildICmp(CmpInst::ICMP_NE, LLT::integer(1), AndOp, CstZero)
1201 .getReg(0);
1202 }
1203
1204 // The branch probability from SwitchBB to B.TargetBB is B.ExtraProb.
1205 addSuccessorWithProb(SwitchBB, B.TargetBB, B.ExtraProb);
1206 // The branch probability from SwitchBB to NextMBB is BranchProbToNext.
1207 addSuccessorWithProb(SwitchBB, NextMBB, BranchProbToNext);
1208 // It is not guaranteed that the sum of B.ExtraProb and BranchProbToNext is
1209 // one as they are relative probabilities (and thus work more like weights),
1210 // and hence we need to normalize them to let the sum of them become one.
1211 SwitchBB->normalizeSuccProbs();
1212
1213 // Record the fact that the IR edge from the header to the bit test target
1214 // will go through our new block. Neeeded for PHIs to have nodes added.
1215 addMachineCFGPred({BB.Parent->getBasicBlock(), B.TargetBB->getBasicBlock()},
1216 SwitchBB);
1217
1218 MIB.buildBrCond(Cmp, *B.TargetBB);
1219
1220 // Avoid emitting unnecessary branches to the next block.
1221 if (NextMBB != SwitchBB->getNextNode())
1222 MIB.buildBr(*NextMBB);
1223}
1224
1225bool IRTranslator::lowerBitTestWorkItem(
1227 MachineBasicBlock *CurMBB, MachineBasicBlock *DefaultMBB,
1229 BranchProbability DefaultProb, BranchProbability UnhandledProbs,
1231 bool FallthroughUnreachable) {
1232 using namespace SwitchCG;
1233 MachineFunction *CurMF = SwitchMBB->getParent();
1234 // FIXME: Optimize away range check based on pivot comparisons.
1235 BitTestBlock *BTB = &SL->BitTestCases[I->BTCasesIndex];
1236 // The bit test blocks haven't been inserted yet; insert them here.
1237 for (BitTestCase &BTC : BTB->Cases)
1238 CurMF->insert(BBI, BTC.ThisBB);
1239
1240 // Fill in fields of the BitTestBlock.
1241 BTB->Parent = CurMBB;
1242 BTB->Default = Fallthrough;
1243
1244 BTB->DefaultProb = UnhandledProbs;
1245 // If the cases in bit test don't form a contiguous range, we evenly
1246 // distribute the probability on the edge to Fallthrough to two
1247 // successors of CurMBB.
1248 if (!BTB->ContiguousRange) {
1249 BTB->Prob += DefaultProb / 2;
1250 BTB->DefaultProb -= DefaultProb / 2;
1251 }
1252
1253 if (FallthroughUnreachable)
1254 BTB->FallthroughUnreachable = true;
1255
1256 // If we're in the right place, emit the bit test header right now.
1257 if (CurMBB == SwitchMBB) {
1258 emitBitTestHeader(*BTB, SwitchMBB);
1259 BTB->Emitted = true;
1260 }
1261 return true;
1262}
1263
1264bool IRTranslator::lowerSwitchWorkItem(SwitchCG::SwitchWorkListItem W,
1265 Value *Cond,
1266 MachineBasicBlock *SwitchMBB,
1267 MachineBasicBlock *DefaultMBB,
1268 MachineIRBuilder &MIB) {
1269 using namespace SwitchCG;
1270 MachineFunction *CurMF = FuncInfo.MF;
1271 MachineBasicBlock *NextMBB = nullptr;
1273 if (++BBI != FuncInfo.MF->end())
1274 NextMBB = &*BBI;
1275
1276 if (EnableOpts) {
1277 // Here, we order cases by probability so the most likely case will be
1278 // checked first. However, two clusters can have the same probability in
1279 // which case their relative ordering is non-deterministic. So we use Low
1280 // as a tie-breaker as clusters are guaranteed to never overlap.
1281 llvm::sort(W.FirstCluster, W.LastCluster + 1,
1282 [](const CaseCluster &a, const CaseCluster &b) {
1283 return a.Prob != b.Prob
1284 ? a.Prob > b.Prob
1285 : a.Low->getValue().slt(b.Low->getValue());
1286 });
1287
1288 // Rearrange the case blocks so that the last one falls through if possible
1289 // without changing the order of probabilities.
1290 for (CaseClusterIt I = W.LastCluster; I > W.FirstCluster;) {
1291 --I;
1292 if (I->Prob > W.LastCluster->Prob)
1293 break;
1294 if (I->Kind == CC_Range && I->MBB == NextMBB) {
1295 std::swap(*I, *W.LastCluster);
1296 break;
1297 }
1298 }
1299 }
1300
1301 // Compute total probability.
1302 BranchProbability DefaultProb = W.DefaultProb;
1303 BranchProbability UnhandledProbs = DefaultProb;
1304 for (CaseClusterIt I = W.FirstCluster; I <= W.LastCluster; ++I)
1305 UnhandledProbs += I->Prob;
1306
1307 MachineBasicBlock *CurMBB = W.MBB;
1308 for (CaseClusterIt I = W.FirstCluster, E = W.LastCluster; I <= E; ++I) {
1309 bool FallthroughUnreachable = false;
1310 MachineBasicBlock *Fallthrough;
1311 if (I == W.LastCluster) {
1312 // For the last cluster, fall through to the default destination.
1313 Fallthrough = DefaultMBB;
1314 FallthroughUnreachable = isa<UnreachableInst>(
1315 DefaultMBB->getBasicBlock()->getFirstNonPHIOrDbg());
1316 } else {
1317 Fallthrough = CurMF->CreateMachineBasicBlock(CurMBB->getBasicBlock());
1318 CurMF->insert(BBI, Fallthrough);
1319 }
1320 UnhandledProbs -= I->Prob;
1321
1322 switch (I->Kind) {
1323 case CC_BitTests: {
1324 if (!lowerBitTestWorkItem(W, SwitchMBB, CurMBB, DefaultMBB, MIB, BBI,
1325 DefaultProb, UnhandledProbs, I, Fallthrough,
1326 FallthroughUnreachable)) {
1327 LLVM_DEBUG(dbgs() << "Failed to lower bit test for switch");
1328 return false;
1329 }
1330 break;
1331 }
1332
1333 case CC_JumpTable: {
1334 if (!lowerJumpTableWorkItem(W, SwitchMBB, CurMBB, DefaultMBB, MIB, BBI,
1335 UnhandledProbs, I, Fallthrough,
1336 FallthroughUnreachable)) {
1337 LLVM_DEBUG(dbgs() << "Failed to lower jump table");
1338 return false;
1339 }
1340 break;
1341 }
1342 case CC_Range: {
1343 if (!lowerSwitchRangeWorkItem(I, Cond, Fallthrough,
1344 FallthroughUnreachable, UnhandledProbs,
1345 CurMBB, MIB, SwitchMBB)) {
1346 LLVM_DEBUG(dbgs() << "Failed to lower switch range");
1347 return false;
1348 }
1349 break;
1350 }
1351 }
1352 CurMBB = Fallthrough;
1353 }
1354
1355 return true;
1356}
1357
1358bool IRTranslator::translateIndirectBr(const User &U,
1359 MachineIRBuilder &MIRBuilder) {
1360 const IndirectBrInst &BrInst = cast<IndirectBrInst>(U);
1361
1362 const Register Tgt = getOrCreateVReg(*BrInst.getAddress());
1363 MIRBuilder.buildBrIndirect(Tgt);
1364
1365 // Link successors.
1366 SmallPtrSet<const BasicBlock *, 32> AddedSuccessors;
1367 MachineBasicBlock &CurBB = MIRBuilder.getMBB();
1368 for (const BasicBlock *Succ : successors(&BrInst)) {
1369 // It's legal for indirectbr instructions to have duplicate blocks in the
1370 // destination list. We don't allow this in MIR. Skip anything that's
1371 // already a successor.
1372 if (!AddedSuccessors.insert(Succ).second)
1373 continue;
1374 CurBB.addSuccessor(&getMBB(*Succ));
1375 }
1376
1377 return true;
1378}
1379
1380static bool isSwiftError(const Value *V) {
1381 if (auto Arg = dyn_cast<Argument>(V))
1382 return Arg->hasSwiftErrorAttr();
1383 if (auto AI = dyn_cast<AllocaInst>(V))
1384 return AI->isSwiftError();
1385 return false;
1386}
1387
1388bool IRTranslator::translateLoad(const User &U, MachineIRBuilder &MIRBuilder) {
1389 const LoadInst &LI = cast<LoadInst>(U);
1390 TypeSize StoreSize = DL->getTypeStoreSize(LI.getType());
1391 if (StoreSize.isZero())
1392 return true;
1393
1394 ArrayRef<Register> Regs = getOrCreateVRegs(LI);
1395 Register Base = getOrCreateVReg(*LI.getPointerOperand());
1396 AAMDNodes AAInfo = LI.getAAMetadata();
1397
1398 const Value *Ptr = LI.getPointerOperand();
1399
1400 if (CLI->supportSwiftError() && isSwiftError(Ptr)) {
1401 assert(Regs.size() == 1 && "swifterror should be single pointer");
1402 Register VReg =
1403 SwiftError.getOrCreateVRegUseAt(&LI, &MIRBuilder.getMBB(), Ptr);
1404 MIRBuilder.buildCopy(Regs[0], VReg);
1405 return true;
1406 }
1407
1409 TLI->getLoadMemOperandFlags(LI, *DL, AC, LibInfo, OptLevel);
1410 if (AA && !(Flags & MachineMemOperand::MOInvariant)) {
1411 if (AA->pointsToConstantMemory(
1412 MemoryLocation(Ptr, LocationSize::precise(StoreSize), AAInfo))) {
1414 }
1415 }
1416
1417 // Fast-path the common single-register load.
1418 if (Regs.size() == 1) {
1419 auto *MMO = MF->getMachineMemOperand(
1420 MachinePointerInfo(LI.getPointerOperand()), Flags,
1421 MRI->getType(Regs[0]), getMemOpAlign(LI), AAInfo,
1422 LI.getMetadata(LLVMContext::MD_range), LI.getSyncScopeID(),
1423 LI.getOrdering());
1424 MIRBuilder.buildLoad(Regs[0], Base, *MMO);
1425 return true;
1426 }
1427
1428 ArrayRef<uint64_t> Offsets = *VMap.getOffsets(LI);
1429 Type *OffsetIRTy = DL->getIndexType(Ptr->getType());
1430 LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1431 for (unsigned i = 0; i < Regs.size(); ++i) {
1432 Register Addr;
1433 MIRBuilder.materializeObjectPtrOffset(Addr, Base, OffsetTy, Offsets[i]);
1434
1435 MachinePointerInfo Ptr(LI.getPointerOperand(), Offsets[i]);
1436 Align BaseAlign = getMemOpAlign(LI);
1437 auto *MMO = MF->getMachineMemOperand(Ptr, Flags, MRI->getType(Regs[i]),
1438 commonAlignment(BaseAlign, Offsets[i]),
1439 AAInfo, nullptr, LI.getSyncScopeID(),
1440 LI.getOrdering());
1441 MIRBuilder.buildLoad(Regs[i], Addr, *MMO);
1442 }
1443
1444 return true;
1445}
1446
1447bool IRTranslator::translateStore(const User &U, MachineIRBuilder &MIRBuilder) {
1448 const StoreInst &SI = cast<StoreInst>(U);
1449 if (DL->getTypeStoreSize(SI.getValueOperand()->getType()).isZero())
1450 return true;
1451
1452 ArrayRef<Register> Vals = getOrCreateVRegs(*SI.getValueOperand());
1453 Register Base = getOrCreateVReg(*SI.getPointerOperand());
1454
1455 if (CLI->supportSwiftError() && isSwiftError(SI.getPointerOperand())) {
1456 assert(Vals.size() == 1 && "swifterror should be single pointer");
1457
1458 Register VReg = SwiftError.getOrCreateVRegDefAt(&SI, &MIRBuilder.getMBB(),
1459 SI.getPointerOperand());
1460 MIRBuilder.buildCopy(VReg, Vals[0]);
1461 return true;
1462 }
1463
1464 MachineMemOperand::Flags Flags = TLI->getStoreMemOperandFlags(SI, *DL);
1465 // Fast-path the common single-register store.
1466 if (Vals.size() == 1) {
1467 auto *MMO = MF->getMachineMemOperand(
1468 MachinePointerInfo(SI.getPointerOperand()), Flags,
1469 MRI->getType(Vals[0]), getMemOpAlign(SI), SI.getAAMetadata(), nullptr,
1470 SI.getSyncScopeID(), SI.getOrdering());
1471 MIRBuilder.buildStore(Vals[0], Base, *MMO);
1472 return true;
1473 }
1474
1475 ArrayRef<uint64_t> Offsets = *VMap.getOffsets(*SI.getValueOperand());
1476 Type *OffsetIRTy = DL->getIndexType(SI.getPointerOperandType());
1477 LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1478 for (unsigned i = 0; i < Vals.size(); ++i) {
1479 Register Addr;
1480 MIRBuilder.materializeObjectPtrOffset(Addr, Base, OffsetTy, Offsets[i]);
1481
1482 MachinePointerInfo Ptr(SI.getPointerOperand(), Offsets[i]);
1483 Align BaseAlign = getMemOpAlign(SI);
1484 auto *MMO = MF->getMachineMemOperand(Ptr, Flags, MRI->getType(Vals[i]),
1485 commonAlignment(BaseAlign, Offsets[i]),
1486 SI.getAAMetadata(), nullptr,
1487 SI.getSyncScopeID(), SI.getOrdering());
1488 MIRBuilder.buildStore(Vals[i], Addr, *MMO);
1489 }
1490 return true;
1491}
1492
1494 const Value *Src = U.getOperand(0);
1495 Type *Int32Ty = Type::getInt32Ty(U.getContext());
1496
1497 // getIndexedOffsetInType is designed for GEPs, so the first index is the
1498 // usual array element rather than looking into the actual aggregate.
1500 Indices.push_back(ConstantInt::get(Int32Ty, 0));
1501
1502 if (const ExtractValueInst *EVI = dyn_cast<ExtractValueInst>(&U)) {
1503 for (auto Idx : EVI->indices())
1504 Indices.push_back(ConstantInt::get(Int32Ty, Idx));
1505 } else if (const InsertValueInst *IVI = dyn_cast<InsertValueInst>(&U)) {
1506 for (auto Idx : IVI->indices())
1507 Indices.push_back(ConstantInt::get(Int32Ty, Idx));
1508 } else {
1509 llvm::append_range(Indices, drop_begin(U.operands()));
1510 }
1511
1512 return static_cast<uint64_t>(
1513 DL.getIndexedOffsetInType(Src->getType(), Indices));
1514}
1515
1516bool IRTranslator::translateExtractValue(const User &U,
1517 MachineIRBuilder &MIRBuilder) {
1518 const Value *Src = U.getOperand(0);
1519 uint64_t Offset = getOffsetFromIndices(U, *DL);
1520 ArrayRef<Register> SrcRegs = getOrCreateVRegs(*Src);
1521 ArrayRef<uint64_t> Offsets = *VMap.getOffsets(*Src);
1522 unsigned Idx = llvm::lower_bound(Offsets, Offset) - Offsets.begin();
1523 auto &DstRegs = allocateVRegs(U);
1524
1525 for (unsigned i = 0; i < DstRegs.size(); ++i)
1526 DstRegs[i] = SrcRegs[Idx++];
1527
1528 return true;
1529}
1530
1531bool IRTranslator::translateInsertValue(const User &U,
1532 MachineIRBuilder &MIRBuilder) {
1533 const Value *Src = U.getOperand(0);
1534 uint64_t Offset = getOffsetFromIndices(U, *DL);
1535 auto &DstRegs = allocateVRegs(U);
1536 ArrayRef<uint64_t> DstOffsets = *VMap.getOffsets(U);
1537 ArrayRef<Register> SrcRegs = getOrCreateVRegs(*Src);
1538 ArrayRef<Register> InsertedRegs = getOrCreateVRegs(*U.getOperand(1));
1539 auto *InsertedIt = InsertedRegs.begin();
1540
1541 for (unsigned i = 0; i < DstRegs.size(); ++i) {
1542 if (DstOffsets[i] >= Offset && InsertedIt != InsertedRegs.end())
1543 DstRegs[i] = *InsertedIt++;
1544 else
1545 DstRegs[i] = SrcRegs[i];
1546 }
1547
1548 return true;
1549}
1550
1551bool IRTranslator::translateSelect(const User &U,
1552 MachineIRBuilder &MIRBuilder) {
1553 Register Tst = getOrCreateVReg(*U.getOperand(0));
1554 ArrayRef<Register> ResRegs = getOrCreateVRegs(U);
1555 ArrayRef<Register> Op0Regs = getOrCreateVRegs(*U.getOperand(1));
1556 ArrayRef<Register> Op1Regs = getOrCreateVRegs(*U.getOperand(2));
1557
1558 uint32_t Flags = 0;
1559 if (const SelectInst *SI = dyn_cast<SelectInst>(&U))
1561
1562 for (unsigned i = 0; i < ResRegs.size(); ++i) {
1563 MIRBuilder.buildSelect(ResRegs[i], Tst, Op0Regs[i], Op1Regs[i], Flags);
1564 }
1565
1566 return true;
1567}
1568
1569bool IRTranslator::translateCopy(const User &U, const Value &V,
1570 MachineIRBuilder &MIRBuilder) {
1571 Register Src = getOrCreateVReg(V);
1572 auto &Regs = *VMap.getVRegs(U);
1573 if (Regs.empty()) {
1574 Regs.push_back(Src);
1575 VMap.getOffsets(U)->push_back(0);
1576 } else {
1577 // If we already assigned a vreg for this instruction, we can't change that.
1578 // Emit a copy to satisfy the users we already emitted.
1579 MIRBuilder.buildCopy(Regs[0], Src);
1580 }
1581 return true;
1582}
1583
1584bool IRTranslator::translateBitCast(const User &U,
1585 MachineIRBuilder &MIRBuilder) {
1586 Type *SrcTy = U.getOperand(0)->getType();
1587 Type *DstTy = U.getType();
1588
1589 // If we're bitcasting to the source type, we can reuse the source vreg.
1590 if (getLLTForType(*SrcTy, *DL) == getLLTForType(*DstTy, *DL)) {
1591 // If the source is a ConstantInt then it was probably created by
1592 // ConstantHoisting and we should leave it alone.
1593 if (isa<ConstantInt>(U.getOperand(0)))
1594 return translateCast(TargetOpcode::G_CONSTANT_FOLD_BARRIER, U,
1595 MIRBuilder);
1596 return translateCopy(U, *U.getOperand(0), MIRBuilder);
1597 }
1598
1599 // Only the scalar byte<->ptr crossing is redirected to G_INTTOPTR/G_PTRTOINT,
1600 // which is the well-typed MIR shape for that boundary. Vector byte<->ptr
1601 // (e.g. <N x b32> -> ptr produced by mixed-type load coalescing) and other
1602 // legacy ptr/non-ptr IR bitcasts (AMDGPU iN<->p3 kernarg packing, etc.)
1603 // keep their historical G_BITCAST lowering — G_INTTOPTR has no vector-src
1604 // -> scalar-ptr form, and downstream passes already handle G_BITCAST.
1605 if (DstTy->isPointerTy() && SrcTy->isByteTy())
1606 return translateCast(TargetOpcode::G_INTTOPTR, U, MIRBuilder);
1607 if (SrcTy->isPointerTy() && DstTy->isByteTy())
1608 return translateCast(TargetOpcode::G_PTRTOINT, U, MIRBuilder);
1609
1610 return translateCast(TargetOpcode::G_BITCAST, U, MIRBuilder);
1611}
1612
1613bool IRTranslator::translateCast(unsigned Opcode, const User &U,
1614 MachineIRBuilder &MIRBuilder) {
1615 if (!mayTranslateUserTypes(U))
1616 return false;
1617
1618 uint32_t Flags = 0;
1619 if (const Instruction *I = dyn_cast<Instruction>(&U))
1621
1622 Register Op = getOrCreateVReg(*U.getOperand(0));
1623 Register Res = getOrCreateVReg(U);
1624 MIRBuilder.buildInstr(Opcode, {Res}, {Op}, Flags);
1625 return true;
1626}
1627
1628bool IRTranslator::translateGetElementPtr(const User &U,
1629 MachineIRBuilder &MIRBuilder) {
1630 Value &Op0 = *U.getOperand(0);
1631 Register BaseReg = getOrCreateVReg(Op0);
1632 Type *PtrIRTy = Op0.getType();
1633 LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
1634 Type *OffsetIRTy = DL->getIndexType(PtrIRTy);
1635 LLT OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1636
1637 uint32_t PtrAddFlags = 0;
1638 // Each PtrAdd generated to implement the GEP inherits its nuw, nusw, inbounds
1639 // flags.
1640 if (const Instruction *I = dyn_cast<Instruction>(&U))
1642
1643 auto PtrAddFlagsWithConst = [&](int64_t Offset) {
1644 // For nusw/inbounds GEP with an offset that is nonnegative when interpreted
1645 // as signed, assume there is no unsigned overflow.
1646 if (Offset >= 0 && (PtrAddFlags & MachineInstr::MIFlag::NoUSWrap))
1647 return PtrAddFlags | MachineInstr::MIFlag::NoUWrap;
1648 return PtrAddFlags;
1649 };
1650
1651 // Normalize Vector GEP - all scalar operands should be converted to the
1652 // splat vector.
1653 unsigned VectorWidth = 0;
1654
1655 // True if we should use a splat vector; using VectorWidth alone is not
1656 // sufficient.
1657 bool WantSplatVector = false;
1658 if (auto *VT = dyn_cast<VectorType>(U.getType())) {
1659 VectorWidth = cast<FixedVectorType>(VT)->getNumElements();
1660 // We don't produce 1 x N vectors; those are treated as scalars.
1661 WantSplatVector = VectorWidth > 1;
1662 }
1663
1664 // We might need to splat the base pointer into a vector if the offsets
1665 // are vectors.
1666 if (WantSplatVector && !PtrTy.isVector()) {
1667 BaseReg = MIRBuilder
1668 .buildSplatBuildVector(LLT::fixed_vector(VectorWidth, PtrTy),
1669 BaseReg)
1670 .getReg(0);
1671 PtrIRTy = FixedVectorType::get(PtrIRTy, VectorWidth);
1672 PtrTy = getLLTForType(*PtrIRTy, *DL);
1673 OffsetIRTy = DL->getIndexType(PtrIRTy);
1674 OffsetTy = getLLTForType(*OffsetIRTy, *DL);
1675 }
1676
1677 int64_t Offset = 0;
1678 for (gep_type_iterator GTI = gep_type_begin(&U), E = gep_type_end(&U);
1679 GTI != E; ++GTI) {
1680 const Value *Idx = GTI.getOperand();
1681 if (StructType *StTy = GTI.getStructTypeOrNull()) {
1682 unsigned Field = cast<Constant>(Idx)->getUniqueInteger().getZExtValue();
1683 Offset += DL->getStructLayout(StTy)->getElementOffset(Field);
1684 continue;
1685 } else {
1686 uint64_t ElementSize = GTI.getSequentialElementStride(*DL);
1687
1688 // If this is a scalar constant or a splat vector of constants,
1689 // handle it quickly.
1690 if (const auto *CI = dyn_cast<ConstantInt>(Idx)) {
1691 if (std::optional<int64_t> Val = CI->getValue().trySExtValue()) {
1692 Offset += ElementSize * *Val;
1693 continue;
1694 }
1695 }
1696
1697 if (Offset != 0) {
1698 auto OffsetMIB = MIRBuilder.buildConstant({OffsetTy}, Offset);
1699 BaseReg = MIRBuilder
1700 .buildPtrAdd(PtrTy, BaseReg, OffsetMIB.getReg(0),
1701 PtrAddFlagsWithConst(Offset))
1702 .getReg(0);
1703 Offset = 0;
1704 }
1705
1706 Register IdxReg = getOrCreateVReg(*Idx);
1707 LLT IdxTy = MRI->getType(IdxReg);
1708 if (IdxTy != OffsetTy) {
1709 if (!IdxTy.isVector() && WantSplatVector) {
1710 IdxReg = MIRBuilder
1712 IdxReg)
1713 .getReg(0);
1714 }
1715
1716 IdxReg = MIRBuilder.buildSExtOrTrunc(OffsetTy, IdxReg).getReg(0);
1717 }
1718
1719 // N = N + Idx * ElementSize;
1720 // Avoid doing it for ElementSize of 1.
1721 Register GepOffsetReg;
1722 if (ElementSize != 1) {
1723 auto ElementSizeMIB = MIRBuilder.buildConstant(
1724 getLLTForType(*OffsetIRTy, *DL), ElementSize);
1725
1726 // The multiplication is NUW if the GEP is NUW and NSW if the GEP is
1727 // NUSW.
1728 uint32_t ScaleFlags = PtrAddFlags & MachineInstr::MIFlag::NoUWrap;
1729 if (PtrAddFlags & MachineInstr::MIFlag::NoUSWrap)
1730 ScaleFlags |= MachineInstr::MIFlag::NoSWrap;
1731
1732 GepOffsetReg =
1733 MIRBuilder.buildMul(OffsetTy, IdxReg, ElementSizeMIB, ScaleFlags)
1734 .getReg(0);
1735 } else {
1736 GepOffsetReg = IdxReg;
1737 }
1738
1739 BaseReg =
1740 MIRBuilder.buildPtrAdd(PtrTy, BaseReg, GepOffsetReg, PtrAddFlags)
1741 .getReg(0);
1742 }
1743 }
1744
1745 if (Offset != 0) {
1746 auto OffsetMIB =
1747 MIRBuilder.buildConstant(OffsetTy, Offset);
1748
1749 MIRBuilder.buildPtrAdd(getOrCreateVReg(U), BaseReg, OffsetMIB.getReg(0),
1750 PtrAddFlagsWithConst(Offset));
1751 return true;
1752 }
1753
1754 MIRBuilder.buildCopy(getOrCreateVReg(U), BaseReg);
1755 return true;
1756}
1757
1758bool IRTranslator::translateMemFunc(const CallInst &CI,
1759 MachineIRBuilder &MIRBuilder,
1760 unsigned Opcode) {
1761 const Value *SrcPtr = CI.getArgOperand(1);
1762 // If the source is undef, then just emit a nop.
1763 if (isa<UndefValue>(SrcPtr))
1764 return true;
1765
1767
1768 unsigned MinPtrSize = UINT_MAX;
1769 for (auto AI = CI.arg_begin(), AE = CI.arg_end(); std::next(AI) != AE; ++AI) {
1770 Register SrcReg = getOrCreateVReg(**AI);
1771 LLT SrcTy = MRI->getType(SrcReg);
1772 if (SrcTy.isPointer())
1773 MinPtrSize = std::min<unsigned>(SrcTy.getSizeInBits(), MinPtrSize);
1774 SrcRegs.push_back(SrcReg);
1775 }
1776
1777 LLT SizeTy = LLT::integer(MinPtrSize);
1778
1779 // The size operand should be the minimum of the pointer sizes.
1780 Register &SizeOpReg = SrcRegs[SrcRegs.size() - 1];
1781 if (MRI->getType(SizeOpReg) != SizeTy)
1782 SizeOpReg = MIRBuilder.buildZExtOrTrunc(SizeTy, SizeOpReg).getReg(0);
1783
1784 auto ICall = MIRBuilder.buildInstr(Opcode);
1785 for (Register SrcReg : SrcRegs)
1786 ICall.addUse(SrcReg);
1787
1788 Align DstAlign;
1789 Align SrcAlign;
1790 unsigned IsVol =
1791 cast<ConstantInt>(CI.getArgOperand(CI.arg_size() - 1))->getZExtValue();
1792
1793 ConstantInt *CopySize = nullptr;
1794
1795 if (auto *MCI = dyn_cast<MemCpyInst>(&CI)) {
1796 DstAlign = MCI->getDestAlign().valueOrOne();
1797 SrcAlign = MCI->getSourceAlign().valueOrOne();
1798 CopySize = dyn_cast<ConstantInt>(MCI->getArgOperand(2));
1799 } else if (auto *MMI = dyn_cast<MemMoveInst>(&CI)) {
1800 DstAlign = MMI->getDestAlign().valueOrOne();
1801 SrcAlign = MMI->getSourceAlign().valueOrOne();
1802 CopySize = dyn_cast<ConstantInt>(MMI->getArgOperand(2));
1803 } else {
1804 auto *MSI = cast<MemSetInst>(&CI);
1805 DstAlign = MSI->getDestAlign().valueOrOne();
1806 }
1807
1808 if (Opcode != TargetOpcode::G_MEMCPY_INLINE) {
1809 // We need to propagate the tail call flag from the IR inst as an argument.
1810 // Otherwise, we have to pessimize and assume later that we cannot tail call
1811 // any memory intrinsics.
1812 ICall.addImm(CI.isTailCall() ? 1 : 0);
1813 }
1814
1815 // Create mem operands to store the alignment and volatile info.
1818 if (IsVol) {
1819 LoadFlags |= MachineMemOperand::MOVolatile;
1820 StoreFlags |= MachineMemOperand::MOVolatile;
1821 }
1822
1823 AAMDNodes AAInfo = CI.getAAMetadata();
1824 if (AA && CopySize &&
1825 AA->pointsToConstantMemory(MemoryLocation(
1826 SrcPtr, LocationSize::precise(CopySize->getZExtValue()), AAInfo))) {
1827 LoadFlags |= MachineMemOperand::MOInvariant;
1828
1829 // FIXME: pointsToConstantMemory probably does not imply dereferenceable,
1830 // but the previous usage implied it did. Probably should check
1831 // isDereferenceableAndAlignedPointer.
1833 }
1834
1835 ICall.addMemOperand(
1836 MF->getMachineMemOperand(MachinePointerInfo(CI.getArgOperand(0)),
1837 StoreFlags, 1, DstAlign, AAInfo));
1838 if (Opcode != TargetOpcode::G_MEMSET)
1839 ICall.addMemOperand(MF->getMachineMemOperand(
1840 MachinePointerInfo(SrcPtr), LoadFlags, 1, SrcAlign, AAInfo));
1841
1842 return true;
1843}
1844
1845bool IRTranslator::translateTrap(const CallInst &CI,
1846 MachineIRBuilder &MIRBuilder,
1847 unsigned Opcode) {
1848 StringRef TrapFuncName =
1849 CI.getAttributes().getFnAttr("trap-func-name").getValueAsString();
1850 if (TrapFuncName.empty()) {
1851 if (Opcode == TargetOpcode::G_UBSANTRAP) {
1852 uint64_t Code = cast<ConstantInt>(CI.getOperand(0))->getZExtValue();
1853 MIRBuilder.buildInstr(Opcode, {}, ArrayRef<llvm::SrcOp>{Code});
1854 } else {
1855 MIRBuilder.buildInstr(Opcode);
1856 }
1857 return true;
1858 }
1859
1860 CallLowering::CallLoweringInfo Info;
1861 if (Opcode == TargetOpcode::G_UBSANTRAP)
1862 Info.OrigArgs.push_back({getOrCreateVRegs(*CI.getArgOperand(0)),
1863 CI.getArgOperand(0)->getType(), 0});
1864
1865 Info.Callee = MachineOperand::CreateES(TrapFuncName.data());
1866 Info.CB = &CI;
1867 Info.OrigRet = {Register(), Type::getVoidTy(CI.getContext()), 0};
1868 return CLI->lowerCall(MIRBuilder, Info);
1869}
1870
1871bool IRTranslator::translateVectorInterleave2Intrinsic(
1872 const CallInst &CI, MachineIRBuilder &MIRBuilder) {
1873 assert(CI.getIntrinsicID() == Intrinsic::vector_interleave2 &&
1874 "This function can only be called on the interleave2 intrinsic!");
1875 // Canonicalize interleave2 to G_SHUFFLE_VECTOR (similar to SelectionDAG).
1876 Register Op0 = getOrCreateVReg(*CI.getOperand(0));
1877 Register Op1 = getOrCreateVReg(*CI.getOperand(1));
1878 Register Res = getOrCreateVReg(CI);
1879
1880 LLT OpTy = MRI->getType(Op0);
1881 MIRBuilder.buildShuffleVector(Res, Op0, Op1,
1883
1884 return true;
1885}
1886
1887bool IRTranslator::translateVectorDeinterleave2Intrinsic(
1888 const CallInst &CI, MachineIRBuilder &MIRBuilder) {
1889 assert(CI.getIntrinsicID() == Intrinsic::vector_deinterleave2 &&
1890 "This function can only be called on the deinterleave2 intrinsic!");
1891 // Canonicalize deinterleave2 to shuffles that extract sub-vectors (similar to
1892 // SelectionDAG).
1893 Register Op = getOrCreateVReg(*CI.getOperand(0));
1894 auto Undef = MIRBuilder.buildUndef(MRI->getType(Op));
1895 ArrayRef<Register> Res = getOrCreateVRegs(CI);
1896
1897 LLT ResTy = MRI->getType(Res[0]);
1898 MIRBuilder.buildShuffleVector(Res[0], Op, Undef,
1899 createStrideMask(0, 2, ResTy.getNumElements()));
1900 MIRBuilder.buildShuffleVector(Res[1], Op, Undef,
1901 createStrideMask(1, 2, ResTy.getNumElements()));
1902
1903 return true;
1904}
1905
1906void IRTranslator::getStackGuard(Register DstReg,
1907 MachineIRBuilder &MIRBuilder) {
1908 Value *Global =
1909 TLI->getSDagStackGuard(*MF->getFunction().getParent(), *Libcalls);
1910 if (!Global) {
1911 LLVMContext &Ctx = MIRBuilder.getContext();
1912 Ctx.diagnose(DiagnosticInfoGeneric("unable to lower stackguard"));
1913 MIRBuilder.buildUndef(DstReg);
1914 return;
1915 }
1916
1917 const TargetRegisterInfo *TRI = MF->getSubtarget().getRegisterInfo();
1918 MRI->setRegClass(DstReg, TRI->getPointerRegClass());
1919 auto MIB =
1920 MIRBuilder.buildInstr(TargetOpcode::LOAD_STACK_GUARD, {DstReg}, {});
1921
1922 unsigned AddrSpace = Global->getType()->getPointerAddressSpace();
1923 LLT PtrTy = LLT::pointer(AddrSpace, DL->getPointerSizeInBits(AddrSpace));
1924
1925 MachinePointerInfo MPInfo(Global);
1928 MachineMemOperand *MemRef = MF->getMachineMemOperand(
1929 MPInfo, Flags, PtrTy, DL->getPointerABIAlignment(AddrSpace));
1930 MIB.setMemRefs({MemRef});
1931}
1932
1933bool IRTranslator::translateOverflowIntrinsic(const CallInst &CI, unsigned Op,
1934 MachineIRBuilder &MIRBuilder) {
1935 ArrayRef<Register> ResRegs = getOrCreateVRegs(CI);
1936 MIRBuilder.buildInstr(
1937 Op, {ResRegs[0], ResRegs[1]},
1938 {getOrCreateVReg(*CI.getOperand(0)), getOrCreateVReg(*CI.getOperand(1))});
1939
1940 return true;
1941}
1942
1943bool IRTranslator::translateFixedPointIntrinsic(unsigned Op, const CallInst &CI,
1944 MachineIRBuilder &MIRBuilder) {
1945 Register Dst = getOrCreateVReg(CI);
1946 Register Src0 = getOrCreateVReg(*CI.getOperand(0));
1947 Register Src1 = getOrCreateVReg(*CI.getOperand(1));
1948 uint64_t Scale = cast<ConstantInt>(CI.getOperand(2))->getZExtValue();
1949 MIRBuilder.buildInstr(Op, {Dst}, { Src0, Src1, Scale });
1950 return true;
1951}
1952
1953unsigned IRTranslator::getSimpleIntrinsicOpcode(Intrinsic::ID ID) {
1954 switch (ID) {
1955 default:
1956 break;
1957 case Intrinsic::acos:
1958 return TargetOpcode::G_FACOS;
1959 case Intrinsic::asin:
1960 return TargetOpcode::G_FASIN;
1961 case Intrinsic::atan:
1962 return TargetOpcode::G_FATAN;
1963 case Intrinsic::atan2:
1964 return TargetOpcode::G_FATAN2;
1965 case Intrinsic::bswap:
1966 return TargetOpcode::G_BSWAP;
1967 case Intrinsic::bitreverse:
1968 return TargetOpcode::G_BITREVERSE;
1969 case Intrinsic::fshl:
1970 return TargetOpcode::G_FSHL;
1971 case Intrinsic::fshr:
1972 return TargetOpcode::G_FSHR;
1973 case Intrinsic::ceil:
1974 return TargetOpcode::G_FCEIL;
1975 case Intrinsic::cos:
1976 return TargetOpcode::G_FCOS;
1977 case Intrinsic::cosh:
1978 return TargetOpcode::G_FCOSH;
1979 case Intrinsic::ctpop:
1980 return TargetOpcode::G_CTPOP;
1981 case Intrinsic::exp:
1982 return TargetOpcode::G_FEXP;
1983 case Intrinsic::exp2:
1984 return TargetOpcode::G_FEXP2;
1985 case Intrinsic::exp10:
1986 return TargetOpcode::G_FEXP10;
1987 case Intrinsic::fabs:
1988 return TargetOpcode::G_FABS;
1989 case Intrinsic::copysign:
1990 return TargetOpcode::G_FCOPYSIGN;
1991 case Intrinsic::minnum:
1992 return TargetOpcode::G_FMINNUM;
1993 case Intrinsic::maxnum:
1994 return TargetOpcode::G_FMAXNUM;
1995 case Intrinsic::minimum:
1996 return TargetOpcode::G_FMINIMUM;
1997 case Intrinsic::maximum:
1998 return TargetOpcode::G_FMAXIMUM;
1999 case Intrinsic::minimumnum:
2000 return TargetOpcode::G_FMINIMUMNUM;
2001 case Intrinsic::maximumnum:
2002 return TargetOpcode::G_FMAXIMUMNUM;
2003 case Intrinsic::canonicalize:
2004 return TargetOpcode::G_FCANONICALIZE;
2005 case Intrinsic::floor:
2006 return TargetOpcode::G_FFLOOR;
2007 case Intrinsic::fma:
2008 return TargetOpcode::G_FMA;
2009 case Intrinsic::log:
2010 return TargetOpcode::G_FLOG;
2011 case Intrinsic::log2:
2012 return TargetOpcode::G_FLOG2;
2013 case Intrinsic::log10:
2014 return TargetOpcode::G_FLOG10;
2015 case Intrinsic::ldexp:
2016 return TargetOpcode::G_FLDEXP;
2017 case Intrinsic::nearbyint:
2018 return TargetOpcode::G_FNEARBYINT;
2019 case Intrinsic::pow:
2020 return TargetOpcode::G_FPOW;
2021 case Intrinsic::powi:
2022 return TargetOpcode::G_FPOWI;
2023 case Intrinsic::rint:
2024 return TargetOpcode::G_FRINT;
2025 case Intrinsic::round:
2026 return TargetOpcode::G_INTRINSIC_ROUND;
2027 case Intrinsic::roundeven:
2028 return TargetOpcode::G_INTRINSIC_ROUNDEVEN;
2029 case Intrinsic::sin:
2030 return TargetOpcode::G_FSIN;
2031 case Intrinsic::sinh:
2032 return TargetOpcode::G_FSINH;
2033 case Intrinsic::sqrt:
2034 return TargetOpcode::G_FSQRT;
2035 case Intrinsic::tan:
2036 return TargetOpcode::G_FTAN;
2037 case Intrinsic::tanh:
2038 return TargetOpcode::G_FTANH;
2039 case Intrinsic::trunc:
2040 return TargetOpcode::G_INTRINSIC_TRUNC;
2041 case Intrinsic::readcyclecounter:
2042 return TargetOpcode::G_READCYCLECOUNTER;
2043 case Intrinsic::readsteadycounter:
2044 return TargetOpcode::G_READSTEADYCOUNTER;
2045 case Intrinsic::ptrmask:
2046 return TargetOpcode::G_PTRMASK;
2047 case Intrinsic::lrint:
2048 return TargetOpcode::G_INTRINSIC_LRINT;
2049 case Intrinsic::llrint:
2050 return TargetOpcode::G_INTRINSIC_LLRINT;
2051 // FADD/FMUL require checking the FMF, so are handled elsewhere.
2052 case Intrinsic::vector_reduce_fmin:
2053 return TargetOpcode::G_VECREDUCE_FMIN;
2054 case Intrinsic::vector_reduce_fmax:
2055 return TargetOpcode::G_VECREDUCE_FMAX;
2056 case Intrinsic::vector_reduce_fminimum:
2057 return TargetOpcode::G_VECREDUCE_FMINIMUM;
2058 case Intrinsic::vector_reduce_fmaximum:
2059 return TargetOpcode::G_VECREDUCE_FMAXIMUM;
2060 case Intrinsic::vector_reduce_add:
2061 return TargetOpcode::G_VECREDUCE_ADD;
2062 case Intrinsic::vector_reduce_mul:
2063 return TargetOpcode::G_VECREDUCE_MUL;
2064 case Intrinsic::vector_reduce_and:
2065 return TargetOpcode::G_VECREDUCE_AND;
2066 case Intrinsic::vector_reduce_or:
2067 return TargetOpcode::G_VECREDUCE_OR;
2068 case Intrinsic::vector_reduce_xor:
2069 return TargetOpcode::G_VECREDUCE_XOR;
2070 case Intrinsic::vector_reduce_smax:
2071 return TargetOpcode::G_VECREDUCE_SMAX;
2072 case Intrinsic::vector_reduce_smin:
2073 return TargetOpcode::G_VECREDUCE_SMIN;
2074 case Intrinsic::vector_reduce_umax:
2075 return TargetOpcode::G_VECREDUCE_UMAX;
2076 case Intrinsic::vector_reduce_umin:
2077 return TargetOpcode::G_VECREDUCE_UMIN;
2078 case Intrinsic::experimental_vector_compress:
2079 return TargetOpcode::G_VECTOR_COMPRESS;
2080 case Intrinsic::lround:
2081 return TargetOpcode::G_LROUND;
2082 case Intrinsic::llround:
2083 return TargetOpcode::G_LLROUND;
2084 case Intrinsic::get_fpenv:
2085 return TargetOpcode::G_GET_FPENV;
2086 case Intrinsic::get_fpmode:
2087 return TargetOpcode::G_GET_FPMODE;
2088 }
2090}
2091
2092bool IRTranslator::translateSimpleIntrinsic(const CallInst &CI,
2094 MachineIRBuilder &MIRBuilder) {
2095
2096 unsigned Op = getSimpleIntrinsicOpcode(ID);
2097
2098 // Is this a simple intrinsic?
2100 return false;
2101
2102 // Yes. Let's translate it.
2104 for (const auto &Arg : CI.args())
2105 VRegs.push_back(getOrCreateVReg(*Arg));
2106
2107 MIRBuilder.buildInstr(Op, {getOrCreateVReg(CI)}, VRegs,
2109 return true;
2110}
2111
2112// TODO: Include ConstainedOps.def when all strict instructions are defined.
2114 switch (ID) {
2115 case Intrinsic::experimental_constrained_fadd:
2116 return TargetOpcode::G_STRICT_FADD;
2117 case Intrinsic::experimental_constrained_fsub:
2118 return TargetOpcode::G_STRICT_FSUB;
2119 case Intrinsic::experimental_constrained_fmul:
2120 return TargetOpcode::G_STRICT_FMUL;
2121 case Intrinsic::experimental_constrained_fdiv:
2122 return TargetOpcode::G_STRICT_FDIV;
2123 case Intrinsic::experimental_constrained_frem:
2124 return TargetOpcode::G_STRICT_FREM;
2125 case Intrinsic::experimental_constrained_fma:
2126 return TargetOpcode::G_STRICT_FMA;
2127 case Intrinsic::experimental_constrained_sqrt:
2128 return TargetOpcode::G_STRICT_FSQRT;
2129 case Intrinsic::experimental_constrained_ldexp:
2130 return TargetOpcode::G_STRICT_FLDEXP;
2131 case Intrinsic::experimental_constrained_fcmp:
2132 return TargetOpcode::G_STRICT_FCMP;
2133 case Intrinsic::experimental_constrained_fcmps:
2134 return TargetOpcode::G_STRICT_FCMPS;
2135 default:
2136 return 0;
2137 }
2138}
2139
2140bool IRTranslator::translateConstrainedFPIntrinsic(
2141 const ConstrainedFPIntrinsic &FPI, MachineIRBuilder &MIRBuilder) {
2143
2144 unsigned Opcode = getConstrainedOpcode(FPI.getIntrinsicID());
2145 if (!Opcode)
2146 return false;
2147
2151
2152 if (Opcode == TargetOpcode::G_STRICT_FCMP ||
2153 Opcode == TargetOpcode::G_STRICT_FCMPS) {
2154 auto *FPCmp = cast<ConstrainedFPCmpIntrinsic>(&FPI);
2155 Register Operand0 = getOrCreateVReg(*FPCmp->getArgOperand(0));
2156 Register Operand1 = getOrCreateVReg(*FPCmp->getArgOperand(1));
2157 Register Result = getOrCreateVReg(FPI);
2158 MIRBuilder.buildInstr(Opcode, {Result}, {}, Flags)
2159 .addPredicate(FPCmp->getPredicate())
2160 .addUse(Operand0)
2161 .addUse(Operand1);
2162 return true;
2163 }
2164
2166 for (unsigned I = 0, E = FPI.getNonMetadataArgCount(); I != E; ++I)
2167 VRegs.push_back(getOrCreateVReg(*FPI.getArgOperand(I)));
2168
2169 MIRBuilder.buildInstr(Opcode, {getOrCreateVReg(FPI)}, VRegs, Flags);
2170 return true;
2171}
2172
2173std::optional<MCRegister> IRTranslator::getArgPhysReg(Argument &Arg) {
2174 auto VRegs = getOrCreateVRegs(Arg);
2175 if (VRegs.size() != 1)
2176 return std::nullopt;
2177
2178 // Arguments are lowered as a copy of a livein physical register.
2179 auto *VRegDef = MF->getRegInfo().getVRegDef(VRegs[0]);
2180 if (!VRegDef || !VRegDef->isCopy())
2181 return std::nullopt;
2182 return VRegDef->getOperand(1).getReg().asMCReg();
2183}
2184
2185bool IRTranslator::translateIfEntryValueArgument(bool isDeclare, Value *Val,
2186 const DILocalVariable *Var,
2187 const DIExpression *Expr,
2188 const DebugLoc &DL,
2189 MachineIRBuilder &MIRBuilder) {
2190 auto *Arg = dyn_cast<Argument>(Val);
2191 if (!Arg)
2192 return false;
2193
2194 if (!Expr->isEntryValue())
2195 return false;
2196
2197 std::optional<MCRegister> PhysReg = getArgPhysReg(*Arg);
2198 if (!PhysReg) {
2199 LLVM_DEBUG(dbgs() << "Dropping dbg." << (isDeclare ? "declare" : "value")
2200 << ": expression is entry_value but "
2201 << "couldn't find a physical register\n");
2202 LLVM_DEBUG(dbgs() << *Var << "\n");
2203 return true;
2204 }
2205
2206 if (isDeclare) {
2207 // Append an op deref to account for the fact that this is a dbg_declare.
2208 Expr = DIExpression::append(Expr, dwarf::DW_OP_deref);
2209 MF->setVariableDbgInfo(Var, Expr, *PhysReg, DL);
2210 } else {
2211 MIRBuilder.buildDirectDbgValue(*PhysReg, Var, Expr);
2212 }
2213
2214 return true;
2215}
2216
2218 switch (ID) {
2219 default:
2220 llvm_unreachable("Unexpected intrinsic");
2221 case Intrinsic::experimental_convergence_anchor:
2222 return TargetOpcode::CONVERGENCECTRL_ANCHOR;
2223 case Intrinsic::experimental_convergence_entry:
2224 return TargetOpcode::CONVERGENCECTRL_ENTRY;
2225 case Intrinsic::experimental_convergence_loop:
2226 return TargetOpcode::CONVERGENCECTRL_LOOP;
2227 }
2228}
2229
2230bool IRTranslator::translateConvergenceControlIntrinsic(
2231 const CallInst &CI, Intrinsic::ID ID, MachineIRBuilder &MIRBuilder) {
2232 MachineInstrBuilder MIB = MIRBuilder.buildInstr(getConvOpcode(ID));
2233 Register OutputReg = getOrCreateConvergenceTokenVReg(CI);
2234 MIB.addDef(OutputReg);
2235
2236 if (ID == Intrinsic::experimental_convergence_loop) {
2238 assert(Bundle && "Expected a convergence control token.");
2239 Register InputReg =
2240 getOrCreateConvergenceTokenVReg(*Bundle->Inputs[0].get());
2241 MIB.addUse(InputReg);
2242 }
2243
2244 return true;
2245}
2246
2247bool IRTranslator::translateKnownIntrinsic(const CallInst &CI, Intrinsic::ID ID,
2248 MachineIRBuilder &MIRBuilder) {
2249 if (auto *MI = dyn_cast<AnyMemIntrinsic>(&CI)) {
2250 if (ORE->enabled()) {
2251 if (MemoryOpRemark::canHandle(MI, *LibInfo)) {
2252 MemoryOpRemark R(*ORE, "gisel-irtranslator-memsize", *DL, *LibInfo);
2253 R.visit(MI);
2254 }
2255 }
2256 }
2257
2258 // If this is a simple intrinsic (that is, we just need to add a def of
2259 // a vreg, and uses for each arg operand, then translate it.
2260 if (translateSimpleIntrinsic(CI, ID, MIRBuilder))
2261 return true;
2262
2263 switch (ID) {
2264 default:
2265 break;
2266 case Intrinsic::lifetime_start:
2267 case Intrinsic::lifetime_end: {
2268 // No stack colouring in O0, discard region information.
2269 if (MF->getTarget().getOptLevel() == CodeGenOptLevel::None ||
2270 MF->getFunction().hasOptNone())
2271 return true;
2272
2273 unsigned Op = ID == Intrinsic::lifetime_start ? TargetOpcode::LIFETIME_START
2274 : TargetOpcode::LIFETIME_END;
2275
2276 const AllocaInst *AI = dyn_cast<AllocaInst>(CI.getArgOperand(0));
2277 if (!AI || !AI->isStaticAlloca())
2278 return true;
2279
2280 MIRBuilder.buildInstr(Op).addFrameIndex(getOrCreateFrameIndex(*AI));
2281 return true;
2282 }
2283 case Intrinsic::fake_use: {
2285 for (const auto &Arg : CI.args())
2286 llvm::append_range(VRegs, getOrCreateVRegs(*Arg));
2287 MIRBuilder.buildInstr(TargetOpcode::FAKE_USE, {}, VRegs);
2288 MF->setHasFakeUses(true);
2289 return true;
2290 }
2291 case Intrinsic::dbg_declare: {
2292 const DbgDeclareInst &DI = cast<DbgDeclareInst>(CI);
2293 assert(DI.getVariable() && "Missing variable");
2294 translateDbgDeclareRecord(DI.getAddress(), DI.hasArgList(), DI.getVariable(),
2295 DI.getExpression(), DI.getDebugLoc(), MIRBuilder);
2296 return true;
2297 }
2298 case Intrinsic::dbg_label: {
2299 const DbgLabelInst &DI = cast<DbgLabelInst>(CI);
2300 assert(DI.getLabel() && "Missing label");
2301
2303 MIRBuilder.getDebugLoc()) &&
2304 "Expected inlined-at fields to agree");
2305
2306 MIRBuilder.buildDbgLabel(DI.getLabel());
2307 return true;
2308 }
2309 case Intrinsic::vaend:
2310 // No target I know of cares about va_end. Certainly no in-tree target
2311 // does. Simplest intrinsic ever!
2312 return true;
2313 case Intrinsic::vastart: {
2314 Value *Ptr = CI.getArgOperand(0);
2315 unsigned ListSize = TLI->getVaListSizeInBits(*DL) / 8;
2316 Align Alignment = getKnownAlignment(Ptr, *DL);
2317
2318 MIRBuilder.buildInstr(TargetOpcode::G_VASTART, {}, {getOrCreateVReg(*Ptr)})
2319 .addMemOperand(MF->getMachineMemOperand(MachinePointerInfo(Ptr),
2321 ListSize, Alignment));
2322 return true;
2323 }
2324 case Intrinsic::dbg_assign:
2325 // A dbg.assign is a dbg.value with more information about stack locations,
2326 // typically produced during optimisation of variables with leaked
2327 // addresses. We can treat it like a normal dbg_value intrinsic here; to
2328 // benefit from the full analysis of stack/SSA locations, GlobalISel would
2329 // need to register for and use the AssignmentTrackingAnalysis pass.
2330 [[fallthrough]];
2331 case Intrinsic::dbg_value: {
2332 // This form of DBG_VALUE is target-independent.
2333 const DbgValueInst &DI = cast<DbgValueInst>(CI);
2334 translateDbgValueRecord(DI.getValue(), DI.hasArgList(), DI.getVariable(),
2335 DI.getExpression(), DI.getDebugLoc(), MIRBuilder);
2336 return true;
2337 }
2338 case Intrinsic::uadd_with_overflow:
2339 return translateOverflowIntrinsic(CI, TargetOpcode::G_UADDO, MIRBuilder);
2340 case Intrinsic::sadd_with_overflow:
2341 return translateOverflowIntrinsic(CI, TargetOpcode::G_SADDO, MIRBuilder);
2342 case Intrinsic::usub_with_overflow:
2343 return translateOverflowIntrinsic(CI, TargetOpcode::G_USUBO, MIRBuilder);
2344 case Intrinsic::ssub_with_overflow:
2345 return translateOverflowIntrinsic(CI, TargetOpcode::G_SSUBO, MIRBuilder);
2346 case Intrinsic::umul_with_overflow:
2347 return translateOverflowIntrinsic(CI, TargetOpcode::G_UMULO, MIRBuilder);
2348 case Intrinsic::smul_with_overflow:
2349 return translateOverflowIntrinsic(CI, TargetOpcode::G_SMULO, MIRBuilder);
2350 case Intrinsic::uadd_sat:
2351 return translateBinaryOp(TargetOpcode::G_UADDSAT, CI, MIRBuilder);
2352 case Intrinsic::sadd_sat:
2353 return translateBinaryOp(TargetOpcode::G_SADDSAT, CI, MIRBuilder);
2354 case Intrinsic::usub_sat:
2355 return translateBinaryOp(TargetOpcode::G_USUBSAT, CI, MIRBuilder);
2356 case Intrinsic::ssub_sat:
2357 return translateBinaryOp(TargetOpcode::G_SSUBSAT, CI, MIRBuilder);
2358 case Intrinsic::ushl_sat:
2359 return translateBinaryOp(TargetOpcode::G_USHLSAT, CI, MIRBuilder);
2360 case Intrinsic::sshl_sat:
2361 return translateBinaryOp(TargetOpcode::G_SSHLSAT, CI, MIRBuilder);
2362 case Intrinsic::umin:
2363 return translateBinaryOp(TargetOpcode::G_UMIN, CI, MIRBuilder);
2364 case Intrinsic::umax:
2365 return translateBinaryOp(TargetOpcode::G_UMAX, CI, MIRBuilder);
2366 case Intrinsic::smin:
2367 return translateBinaryOp(TargetOpcode::G_SMIN, CI, MIRBuilder);
2368 case Intrinsic::smax:
2369 return translateBinaryOp(TargetOpcode::G_SMAX, CI, MIRBuilder);
2370 case Intrinsic::abs:
2371 // TODO: Preserve "int min is poison" arg in GMIR?
2372 return translateUnaryOp(TargetOpcode::G_ABS, CI, MIRBuilder);
2373 case Intrinsic::smul_fix:
2374 return translateFixedPointIntrinsic(TargetOpcode::G_SMULFIX, CI, MIRBuilder);
2375 case Intrinsic::umul_fix:
2376 return translateFixedPointIntrinsic(TargetOpcode::G_UMULFIX, CI, MIRBuilder);
2377 case Intrinsic::smul_fix_sat:
2378 return translateFixedPointIntrinsic(TargetOpcode::G_SMULFIXSAT, CI, MIRBuilder);
2379 case Intrinsic::umul_fix_sat:
2380 return translateFixedPointIntrinsic(TargetOpcode::G_UMULFIXSAT, CI, MIRBuilder);
2381 case Intrinsic::sdiv_fix:
2382 return translateFixedPointIntrinsic(TargetOpcode::G_SDIVFIX, CI, MIRBuilder);
2383 case Intrinsic::udiv_fix:
2384 return translateFixedPointIntrinsic(TargetOpcode::G_UDIVFIX, CI, MIRBuilder);
2385 case Intrinsic::sdiv_fix_sat:
2386 return translateFixedPointIntrinsic(TargetOpcode::G_SDIVFIXSAT, CI, MIRBuilder);
2387 case Intrinsic::udiv_fix_sat:
2388 return translateFixedPointIntrinsic(TargetOpcode::G_UDIVFIXSAT, CI, MIRBuilder);
2389 case Intrinsic::fmuladd: {
2390 const TargetMachine &TM = MF->getTarget();
2391 Register Dst = getOrCreateVReg(CI);
2392 Register Op0 = getOrCreateVReg(*CI.getArgOperand(0));
2393 Register Op1 = getOrCreateVReg(*CI.getArgOperand(1));
2394 Register Op2 = getOrCreateVReg(*CI.getArgOperand(2));
2396 TLI->isFMAFasterThanFMulAndFAdd(*MF,
2397 TLI->getValueType(*DL, CI.getType()))) {
2398 // TODO: Revisit this to see if we should move this part of the
2399 // lowering to the combiner.
2400 MIRBuilder.buildFMA(Dst, Op0, Op1, Op2,
2402 } else {
2403 LLT Ty = getLLTForType(*CI.getType(), *DL);
2404 auto FMul = MIRBuilder.buildFMul(
2405 Ty, Op0, Op1, MachineInstr::copyFlagsFromInstruction(CI));
2406 MIRBuilder.buildFAdd(Dst, FMul, Op2,
2408 }
2409 return true;
2410 }
2411 case Intrinsic::frexp: {
2412 ArrayRef<Register> VRegs = getOrCreateVRegs(CI);
2413 MIRBuilder.buildFFrexp(VRegs[0], VRegs[1],
2414 getOrCreateVReg(*CI.getArgOperand(0)),
2416 return true;
2417 }
2418 case Intrinsic::modf: {
2419 ArrayRef<Register> VRegs = getOrCreateVRegs(CI);
2420 MIRBuilder.buildModf(VRegs[0], VRegs[1],
2421 getOrCreateVReg(*CI.getArgOperand(0)),
2423 return true;
2424 }
2425 case Intrinsic::sincos: {
2426 ArrayRef<Register> VRegs = getOrCreateVRegs(CI);
2427 MIRBuilder.buildFSincos(VRegs[0], VRegs[1],
2428 getOrCreateVReg(*CI.getArgOperand(0)),
2430 return true;
2431 }
2432 case Intrinsic::fptosi_sat:
2433 MIRBuilder.buildFPTOSI_SAT(getOrCreateVReg(CI),
2434 getOrCreateVReg(*CI.getArgOperand(0)));
2435 return true;
2436 case Intrinsic::fptoui_sat:
2437 MIRBuilder.buildFPTOUI_SAT(getOrCreateVReg(CI),
2438 getOrCreateVReg(*CI.getArgOperand(0)));
2439 return true;
2440 case Intrinsic::memcpy_inline:
2441 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMCPY_INLINE);
2442 case Intrinsic::memcpy:
2443 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMCPY);
2444 case Intrinsic::memmove:
2445 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMMOVE);
2446 case Intrinsic::memset:
2447 return translateMemFunc(CI, MIRBuilder, TargetOpcode::G_MEMSET);
2448 case Intrinsic::eh_typeid_for: {
2449 GlobalValue *GV = ExtractTypeInfo(CI.getArgOperand(0));
2450 Register Reg = getOrCreateVReg(CI);
2451 unsigned TypeID = MF->getTypeIDFor(GV);
2452 MIRBuilder.buildConstant(Reg, TypeID);
2453 return true;
2454 }
2455 case Intrinsic::objectsize:
2456 llvm_unreachable("llvm.objectsize.* should have been lowered already");
2457
2458 case Intrinsic::is_constant:
2459 llvm_unreachable("llvm.is.constant.* should have been lowered already");
2460
2461 case Intrinsic::stackguard:
2462 getStackGuard(getOrCreateVReg(CI), MIRBuilder);
2463 return true;
2464 case Intrinsic::stackprotector: {
2465 LLT PtrTy = getLLTForType(*CI.getArgOperand(0)->getType(), *DL);
2466 Register GuardVal;
2467 if (TLI->useLoadStackGuardNode(*CI.getModule())) {
2468 GuardVal = MRI->createGenericVirtualRegister(PtrTy);
2469 getStackGuard(GuardVal, MIRBuilder);
2470 } else
2471 GuardVal = getOrCreateVReg(*CI.getArgOperand(0)); // The guard's value.
2472
2473 AllocaInst *Slot = cast<AllocaInst>(CI.getArgOperand(1));
2474 int FI = getOrCreateFrameIndex(*Slot);
2475 MF->getFrameInfo().setStackProtectorIndex(FI);
2476
2477 MIRBuilder.buildStore(
2478 GuardVal, getOrCreateVReg(*Slot),
2479 *MF->getMachineMemOperand(MachinePointerInfo::getFixedStack(*MF, FI),
2482 PtrTy, Align(8)));
2483 return true;
2484 }
2485 case Intrinsic::stacksave: {
2486 MIRBuilder.buildInstr(TargetOpcode::G_STACKSAVE, {getOrCreateVReg(CI)}, {});
2487 return true;
2488 }
2489 case Intrinsic::stackrestore: {
2490 MIRBuilder.buildInstr(TargetOpcode::G_STACKRESTORE, {},
2491 {getOrCreateVReg(*CI.getArgOperand(0))});
2492 return true;
2493 }
2494 case Intrinsic::cttz:
2495 case Intrinsic::ctlz: {
2496 ConstantInt *Cst = cast<ConstantInt>(CI.getArgOperand(1));
2497 bool isTrailing = ID == Intrinsic::cttz;
2498 unsigned Opcode = isTrailing ? Cst->isZero()
2499 ? TargetOpcode::G_CTTZ
2500 : TargetOpcode::G_CTTZ_ZERO_POISON
2501 : Cst->isZero() ? TargetOpcode::G_CTLZ
2502 : TargetOpcode::G_CTLZ_ZERO_POISON;
2503 MIRBuilder.buildInstr(Opcode, {getOrCreateVReg(CI)},
2504 {getOrCreateVReg(*CI.getArgOperand(0))});
2505 return true;
2506 }
2507 case Intrinsic::invariant_start: {
2508 MIRBuilder.buildUndef(getOrCreateVReg(CI));
2509 return true;
2510 }
2511 case Intrinsic::invariant_end:
2512 return true;
2513 case Intrinsic::expect:
2514 case Intrinsic::expect_with_probability:
2515 case Intrinsic::annotation:
2516 case Intrinsic::ptr_annotation:
2517 case Intrinsic::launder_invariant_group:
2518 case Intrinsic::strip_invariant_group: {
2519 // Drop the intrinsic, but forward the value.
2520 MIRBuilder.buildCopy(getOrCreateVReg(CI),
2521 getOrCreateVReg(*CI.getArgOperand(0)));
2522 return true;
2523 }
2524 case Intrinsic::assume:
2525 case Intrinsic::experimental_noalias_scope_decl:
2526 case Intrinsic::var_annotation:
2527 case Intrinsic::sideeffect:
2528 // Discard annotate attributes, assumptions, and artificial side-effects.
2529 return true;
2530 case Intrinsic::read_volatile_register:
2531 case Intrinsic::read_register: {
2532 Value *Arg = CI.getArgOperand(0);
2533 MIRBuilder
2534 .buildInstr(TargetOpcode::G_READ_REGISTER, {getOrCreateVReg(CI)}, {})
2535 .addMetadata(cast<MDNode>(cast<MetadataAsValue>(Arg)->getMetadata()));
2536 return true;
2537 }
2538 case Intrinsic::write_register: {
2539 Value *Arg = CI.getArgOperand(0);
2540 MIRBuilder.buildInstr(TargetOpcode::G_WRITE_REGISTER)
2541 .addMetadata(cast<MDNode>(cast<MetadataAsValue>(Arg)->getMetadata()))
2542 .addUse(getOrCreateVReg(*CI.getArgOperand(1)));
2543 return true;
2544 }
2545 case Intrinsic::localescape: {
2546 MachineBasicBlock &EntryMBB = MF->front();
2547 StringRef EscapedName = GlobalValue::dropLLVMManglingEscape(MF->getName());
2548
2549 // Directly emit some LOCAL_ESCAPE machine instrs. Label assignment emission
2550 // is the same on all targets.
2551 for (unsigned Idx = 0, E = CI.arg_size(); Idx < E; ++Idx) {
2552 Value *Arg = CI.getArgOperand(Idx)->stripPointerCasts();
2553 if (isa<ConstantPointerNull>(Arg))
2554 continue; // Skip null pointers. They represent a hole in index space.
2555
2556 int FI = getOrCreateFrameIndex(*cast<AllocaInst>(Arg));
2557 MCSymbol *FrameAllocSym =
2558 MF->getContext().getOrCreateFrameAllocSymbol(EscapedName, Idx);
2559
2560 // This should be inserted at the start of the entry block.
2561 auto LocalEscape =
2562 MIRBuilder.buildInstrNoInsert(TargetOpcode::LOCAL_ESCAPE)
2563 .addSym(FrameAllocSym)
2564 .addFrameIndex(FI);
2565
2566 EntryMBB.insert(EntryMBB.begin(), LocalEscape);
2567 }
2568
2569 return true;
2570 }
2571 case Intrinsic::vector_reduce_fadd:
2572 case Intrinsic::vector_reduce_fmul: {
2573 // Need to check for the reassoc flag to decide whether we want a
2574 // sequential reduction opcode or not.
2575 Register Dst = getOrCreateVReg(CI);
2576 Register ScalarSrc = getOrCreateVReg(*CI.getArgOperand(0));
2577 Register VecSrc = getOrCreateVReg(*CI.getArgOperand(1));
2578 unsigned Opc = 0;
2579 if (!CI.hasAllowReassoc()) {
2580 // The sequential ordering case.
2581 Opc = ID == Intrinsic::vector_reduce_fadd
2582 ? TargetOpcode::G_VECREDUCE_SEQ_FADD
2583 : TargetOpcode::G_VECREDUCE_SEQ_FMUL;
2584 if (!MRI->getType(VecSrc).isVector())
2585 Opc = ID == Intrinsic::vector_reduce_fadd ? TargetOpcode::G_FADD
2586 : TargetOpcode::G_FMUL;
2587 MIRBuilder.buildInstr(Opc, {Dst}, {ScalarSrc, VecSrc},
2589 return true;
2590 }
2591 // We split the operation into a separate G_FADD/G_FMUL + the reduce,
2592 // since the associativity doesn't matter.
2593 unsigned ScalarOpc;
2594 if (ID == Intrinsic::vector_reduce_fadd) {
2595 Opc = TargetOpcode::G_VECREDUCE_FADD;
2596 ScalarOpc = TargetOpcode::G_FADD;
2597 } else {
2598 Opc = TargetOpcode::G_VECREDUCE_FMUL;
2599 ScalarOpc = TargetOpcode::G_FMUL;
2600 }
2601 LLT DstTy = MRI->getType(Dst);
2602 auto Rdx = MIRBuilder.buildInstr(
2603 Opc, {DstTy}, {VecSrc}, MachineInstr::copyFlagsFromInstruction(CI));
2604 MIRBuilder.buildInstr(ScalarOpc, {Dst}, {ScalarSrc, Rdx},
2606
2607 return true;
2608 }
2609 case Intrinsic::trap:
2610 return translateTrap(CI, MIRBuilder, TargetOpcode::G_TRAP);
2611 case Intrinsic::debugtrap:
2612 return translateTrap(CI, MIRBuilder, TargetOpcode::G_DEBUGTRAP);
2613 case Intrinsic::ubsantrap:
2614 return translateTrap(CI, MIRBuilder, TargetOpcode::G_UBSANTRAP);
2615 case Intrinsic::allow_runtime_check:
2616 case Intrinsic::allow_ubsan_check:
2617 MIRBuilder.buildCopy(getOrCreateVReg(CI),
2618 getOrCreateVReg(*ConstantInt::getTrue(CI.getType())));
2619 return true;
2620 case Intrinsic::amdgcn_cs_chain:
2621 case Intrinsic::amdgcn_call_whole_wave:
2622 return translateCallBase(CI, MIRBuilder);
2623 case Intrinsic::fptrunc_round: {
2625
2626 // Convert the metadata argument to a constant integer
2627 Metadata *MD = cast<MetadataAsValue>(CI.getArgOperand(1))->getMetadata();
2628 std::optional<RoundingMode> RoundMode =
2629 convertStrToRoundingMode(cast<MDString>(MD)->getString());
2630
2631 // Add the Rounding mode as an integer
2632 MIRBuilder
2633 .buildInstr(TargetOpcode::G_INTRINSIC_FPTRUNC_ROUND,
2634 {getOrCreateVReg(CI)},
2635 {getOrCreateVReg(*CI.getArgOperand(0))}, Flags)
2636 .addImm((int)*RoundMode);
2637
2638 return true;
2639 }
2640 case Intrinsic::is_fpclass: {
2641 Value *FpValue = CI.getOperand(0);
2642 ConstantInt *TestMaskValue = cast<ConstantInt>(CI.getOperand(1));
2643
2644 MIRBuilder
2645 .buildInstr(TargetOpcode::G_IS_FPCLASS, {getOrCreateVReg(CI)},
2646 {getOrCreateVReg(*FpValue)})
2647 .addImm(TestMaskValue->getZExtValue());
2648
2649 return true;
2650 }
2651 case Intrinsic::set_fpenv: {
2652 Value *FPEnv = CI.getOperand(0);
2653 MIRBuilder.buildSetFPEnv(getOrCreateVReg(*FPEnv));
2654 return true;
2655 }
2656 case Intrinsic::reset_fpenv:
2657 MIRBuilder.buildResetFPEnv();
2658 return true;
2659 case Intrinsic::set_fpmode: {
2660 Value *FPState = CI.getOperand(0);
2661 MIRBuilder.buildSetFPMode(getOrCreateVReg(*FPState));
2662 return true;
2663 }
2664 case Intrinsic::reset_fpmode:
2665 MIRBuilder.buildResetFPMode();
2666 return true;
2667 case Intrinsic::get_rounding:
2668 MIRBuilder.buildGetRounding(getOrCreateVReg(CI));
2669 return true;
2670 case Intrinsic::set_rounding:
2671 MIRBuilder.buildSetRounding(getOrCreateVReg(*CI.getOperand(0)));
2672 return true;
2673 case Intrinsic::vscale: {
2674 MIRBuilder.buildVScale(getOrCreateVReg(CI), 1);
2675 return true;
2676 }
2677 case Intrinsic::scmp:
2678 MIRBuilder.buildSCmp(getOrCreateVReg(CI),
2679 getOrCreateVReg(*CI.getOperand(0)),
2680 getOrCreateVReg(*CI.getOperand(1)));
2681 return true;
2682 case Intrinsic::ucmp:
2683 MIRBuilder.buildUCmp(getOrCreateVReg(CI),
2684 getOrCreateVReg(*CI.getOperand(0)),
2685 getOrCreateVReg(*CI.getOperand(1)));
2686 return true;
2687 case Intrinsic::vector_extract:
2688 return translateExtractVector(CI, MIRBuilder);
2689 case Intrinsic::vector_insert:
2690 return translateInsertVector(CI, MIRBuilder);
2691 case Intrinsic::stepvector: {
2692 MIRBuilder.buildStepVector(getOrCreateVReg(CI), 1);
2693 return true;
2694 }
2695 case Intrinsic::prefetch: {
2696 Value *Addr = CI.getOperand(0);
2697 unsigned RW = cast<ConstantInt>(CI.getOperand(1))->getZExtValue();
2698 unsigned Locality = cast<ConstantInt>(CI.getOperand(2))->getZExtValue();
2699 unsigned CacheType = cast<ConstantInt>(CI.getOperand(3))->getZExtValue();
2700
2702 auto &MMO = *MF->getMachineMemOperand(MachinePointerInfo(Addr), Flags,
2703 LLT(), Align());
2704
2705 MIRBuilder.buildPrefetch(getOrCreateVReg(*Addr), RW, Locality, CacheType,
2706 MMO);
2707
2708 return true;
2709 }
2710
2711 case Intrinsic::vector_interleave2:
2712 case Intrinsic::vector_deinterleave2: {
2713 // Both intrinsics have at least one operand.
2714 Value *Op0 = CI.getOperand(0);
2715 LLT ResTy = getLLTForType(*Op0->getType(), MIRBuilder.getDataLayout());
2716 if (!ResTy.isFixedVector())
2717 return false;
2718
2719 if (CI.getIntrinsicID() == Intrinsic::vector_interleave2)
2720 return translateVectorInterleave2Intrinsic(CI, MIRBuilder);
2721
2722 return translateVectorDeinterleave2Intrinsic(CI, MIRBuilder);
2723 }
2724
2725#define INSTRUCTION(NAME, NARG, ROUND_MODE, INTRINSIC) \
2726 case Intrinsic::INTRINSIC:
2727#include "llvm/IR/ConstrainedOps.def"
2728 return translateConstrainedFPIntrinsic(cast<ConstrainedFPIntrinsic>(CI),
2729 MIRBuilder);
2730 case Intrinsic::experimental_convergence_anchor:
2731 case Intrinsic::experimental_convergence_entry:
2732 case Intrinsic::experimental_convergence_loop:
2733 return translateConvergenceControlIntrinsic(CI, ID, MIRBuilder);
2734 case Intrinsic::reloc_none: {
2735 Metadata *MD = cast<MetadataAsValue>(CI.getArgOperand(0))->getMetadata();
2736 StringRef SymbolName = cast<MDString>(MD)->getString();
2737 MIRBuilder.buildInstr(TargetOpcode::RELOC_NONE)
2739 return true;
2740 }
2741 }
2742 return false;
2743}
2744
2745bool IRTranslator::translateInlineAsm(const CallBase &CB,
2746 MachineIRBuilder &MIRBuilder) {
2747 if (!mayTranslateUserTypes(CB))
2748 return false;
2749
2750 const InlineAsmLowering *ALI = MF->getSubtarget().getInlineAsmLowering();
2751
2752 if (!ALI) {
2753 LLVM_DEBUG(
2754 dbgs() << "Inline asm lowering is not supported for this target yet\n");
2755 return false;
2756 }
2757
2758 return ALI->lowerInlineAsm(
2759 MIRBuilder, CB, [&](const Value &Val) { return getOrCreateVRegs(Val); });
2760}
2761
2762bool IRTranslator::translateCallBase(const CallBase &CB,
2763 MachineIRBuilder &MIRBuilder) {
2764 ArrayRef<Register> Res = getOrCreateVRegs(CB);
2765
2767 Register SwiftInVReg = 0;
2768 Register SwiftErrorVReg = 0;
2769 for (const auto &Arg : CB.args()) {
2770 if (CLI->supportSwiftError() && isSwiftError(Arg)) {
2771 assert(SwiftInVReg == 0 && "Expected only one swift error argument");
2772 LLT Ty = getLLTForType(*Arg->getType(), *DL);
2773 SwiftInVReg = MRI->createGenericVirtualRegister(Ty);
2774 MIRBuilder.buildCopy(SwiftInVReg, SwiftError.getOrCreateVRegUseAt(
2775 &CB, &MIRBuilder.getMBB(), Arg));
2776 Args.emplace_back(ArrayRef(SwiftInVReg));
2777 SwiftErrorVReg =
2778 SwiftError.getOrCreateVRegDefAt(&CB, &MIRBuilder.getMBB(), Arg);
2779 continue;
2780 }
2781 Args.push_back(getOrCreateVRegs(*Arg));
2782 }
2783
2784 if (auto *CI = dyn_cast<CallInst>(&CB)) {
2785 if (ORE->enabled()) {
2786 if (MemoryOpRemark::canHandle(CI, *LibInfo)) {
2787 MemoryOpRemark R(*ORE, "gisel-irtranslator-memsize", *DL, *LibInfo);
2788 R.visit(CI);
2789 }
2790 }
2791 }
2792
2793 std::optional<CallLowering::PtrAuthInfo> PAI;
2794 if (auto Bundle = CB.getOperandBundle(LLVMContext::OB_ptrauth)) {
2795 // Functions should never be ptrauth-called directly.
2796 assert(!CB.getCalledFunction() && "invalid direct ptrauth call");
2797
2798 const Value *Key = Bundle->Inputs[0];
2799 const Value *Discriminator = Bundle->Inputs[1];
2800
2801 // Look through ptrauth constants to try to eliminate the matching bundle
2802 // and turn this into a direct call with no ptrauth.
2803 // CallLowering will use the raw pointer if it doesn't find the PAI.
2804 const auto *CalleeCPA = dyn_cast<ConstantPtrAuth>(CB.getCalledOperand());
2805 if (!CalleeCPA || !isa<Function>(CalleeCPA->getPointer()) ||
2806 !CalleeCPA->isKnownCompatibleWith(Key, Discriminator, *DL)) {
2807 // If we can't make it direct, package the bundle into PAI.
2808 Register DiscReg = getOrCreateVReg(*Discriminator);
2809 PAI = CallLowering::PtrAuthInfo{cast<ConstantInt>(Key)->getZExtValue(),
2810 DiscReg};
2811 }
2812 }
2813
2814 Register ConvergenceCtrlToken = 0;
2815 if (auto Bundle = CB.getOperandBundle(LLVMContext::OB_convergencectrl)) {
2816 const auto &Token = *Bundle->Inputs[0].get();
2817 ConvergenceCtrlToken = getOrCreateConvergenceTokenVReg(Token);
2818 }
2819
2820 // We don't set HasCalls on MFI here yet because call lowering may decide to
2821 // optimize into tail calls. Instead, we defer that to selection where a final
2822 // scan is done to check if any instructions are calls.
2823 bool Success = CLI->lowerCall(
2824 MIRBuilder, CB, Res, Args, SwiftErrorVReg, PAI, ConvergenceCtrlToken,
2825 [&]() { return getOrCreateVReg(*CB.getCalledOperand()); });
2826
2827 // Check if we just inserted a tail call.
2828 if (Success) {
2829 assert(!HasTailCall && "Can't tail call return twice from block?");
2830 const TargetInstrInfo *TII = MF->getSubtarget().getInstrInfo();
2831 HasTailCall = TII->isTailCall(*std::prev(MIRBuilder.getInsertPt()));
2832 }
2833
2834 return Success;
2835}
2836
2837bool IRTranslator::translateCall(const User &U, MachineIRBuilder &MIRBuilder) {
2838 if (!mayTranslateUserTypes(U))
2839 return false;
2840
2841 const CallInst &CI = cast<CallInst>(U);
2842 const Function *F = CI.getCalledFunction();
2843
2844 // FIXME: support Windows dllimport function calls and calls through
2845 // weak symbols.
2846 if (F && (F->hasDLLImportStorageClass() ||
2847 (MF->getTarget().getTargetTriple().isOSWindows() &&
2848 F->hasExternalWeakLinkage())))
2849 return false;
2850
2851 // FIXME: support control flow guard targets.
2853 return false;
2854
2855 // FIXME: support statepoints and related.
2857 return false;
2858
2859 if (CI.isInlineAsm())
2860 return translateInlineAsm(CI, MIRBuilder);
2861
2862 Intrinsic::ID ID = F ? F->getIntrinsicID() : Intrinsic::not_intrinsic;
2863 if (!F || ID == Intrinsic::not_intrinsic) {
2864 if (translateCallBase(CI, MIRBuilder)) {
2865 diagnoseDontCall(CI);
2866 return true;
2867 }
2868 return false;
2869 }
2870
2871 assert(ID != Intrinsic::not_intrinsic && "unknown intrinsic");
2872
2873 if (translateKnownIntrinsic(CI, ID, MIRBuilder))
2874 return true;
2875
2877 TLI->getTgtMemIntrinsic(Infos, CI, *MF, ID);
2878
2879 return translateIntrinsic(CI, ID, MIRBuilder, Infos);
2880}
2881
2882/// Translate a call or callbr to an intrinsic.
2883bool IRTranslator::translateIntrinsic(
2884 const CallBase &CB, Intrinsic::ID ID, MachineIRBuilder &MIRBuilder,
2885 ArrayRef<TargetLowering::IntrinsicInfo> TgtMemIntrinsicInfos) {
2886 ArrayRef<Register> ResultRegs;
2887 if (!CB.getType()->isVoidTy())
2888 ResultRegs = getOrCreateVRegs(CB);
2889
2890 // Ignore the callsite attributes. Backend code is most likely not expecting
2891 // an intrinsic to sometimes have side effects and sometimes not.
2892 MachineInstrBuilder MIB = MIRBuilder.buildIntrinsic(ID, ResultRegs);
2893 if (isa<FPMathOperator>(CB))
2894 MIB->copyIRFlags(CB);
2895
2896 for (const auto &Arg : enumerate(CB.args())) {
2897 // If this is required to be an immediate, don't materialize it in a
2898 // register.
2899 if (CB.paramHasAttr(Arg.index(), Attribute::ImmArg)) {
2900 if (ConstantInt *CI = dyn_cast<ConstantInt>(Arg.value())) {
2901 // imm arguments are more convenient than cimm (and realistically
2902 // probably sufficient), so use them.
2903 assert(CI->getBitWidth() <= 64 &&
2904 "large intrinsic immediates not handled");
2905 MIB.addImm(CI->getSExtValue());
2906 } else {
2907 MIB.addFPImm(cast<ConstantFP>(Arg.value()));
2908 }
2909 } else if (auto *MDVal = dyn_cast<MetadataAsValue>(Arg.value())) {
2910 auto *MD = MDVal->getMetadata();
2911 auto *MDN = dyn_cast<MDNode>(MD);
2912 if (!MDN) {
2913 if (auto *ConstMD = dyn_cast<ConstantAsMetadata>(MD))
2914 MDN = MDNode::get(MF->getFunction().getContext(), ConstMD);
2915 else // This was probably an MDString.
2916 return false;
2917 }
2918 MIB.addMetadata(MDN);
2919 } else {
2920 ArrayRef<Register> VRegs = getOrCreateVRegs(*Arg.value());
2921 if (VRegs.size() > 1)
2922 return false;
2923 MIB.addUse(VRegs[0]);
2924 }
2925 }
2926
2927 // Add MachineMemOperands for each memory access described by the target.
2928 for (const auto &Info : TgtMemIntrinsicInfos) {
2929 Align Alignment = Info.align.value_or(
2930 DL->getABITypeAlign(Info.memVT.getTypeForEVT(CB.getContext())));
2931 LLT MemTy = Info.memVT.isSimple()
2932 ? getLLTForMVT(Info.memVT.getSimpleVT())
2933 : LLT::scalar(Info.memVT.getStoreSizeInBits());
2934
2935 // TODO: We currently just fallback to address space 0 if
2936 // getTgtMemIntrinsic didn't yield anything useful.
2937 MachinePointerInfo MPI;
2938 if (Info.ptrVal) {
2939 MPI = MachinePointerInfo(Info.ptrVal, Info.offset);
2940 } else if (Info.fallbackAddressSpace) {
2941 MPI = MachinePointerInfo(*Info.fallbackAddressSpace);
2942 }
2943 MIB.addMemOperand(MF->getMachineMemOperand(
2944 MPI, Info.flags, MemTy, Alignment, CB.getAAMetadata(),
2945 /*Ranges=*/nullptr, Info.ssid, Info.order, Info.failureOrder));
2946 }
2947
2948 if (CB.isConvergent()) {
2949 if (auto Bundle = CB.getOperandBundle(LLVMContext::OB_convergencectrl)) {
2950 auto *Token = Bundle->Inputs[0].get();
2951 Register TokenReg = getOrCreateVReg(*Token);
2952 MIB.addUse(TokenReg, RegState::Implicit);
2953 }
2954 }
2955
2957 MIB->setDeactivationSymbol(*MF, Bundle->Inputs[0].get());
2958
2959 return true;
2960}
2961
2962bool IRTranslator::findUnwindDestinations(
2963 const BasicBlock *EHPadBB,
2964 BranchProbability Prob,
2965 SmallVectorImpl<std::pair<MachineBasicBlock *, BranchProbability>>
2966 &UnwindDests) {
2968 EHPadBB->getParent()->getFunction().getPersonalityFn());
2969 bool IsMSVCCXX = Personality == EHPersonality::MSVC_CXX;
2970 bool IsCoreCLR = Personality == EHPersonality::CoreCLR;
2971 bool IsWasmCXX = Personality == EHPersonality::Wasm_CXX;
2972 bool IsSEH = isAsynchronousEHPersonality(Personality);
2973
2974 if (IsWasmCXX) {
2975 // Ignore this for now.
2976 return false;
2977 }
2978
2979 while (EHPadBB) {
2981 BasicBlock *NewEHPadBB = nullptr;
2982 if (isa<LandingPadInst>(Pad)) {
2983 // Stop on landingpads. They are not funclets.
2984 UnwindDests.emplace_back(&getMBB(*EHPadBB), Prob);
2985 break;
2986 }
2987 if (isa<CleanupPadInst>(Pad)) {
2988 // Stop on cleanup pads. Cleanups are always funclet entries for all known
2989 // personalities.
2990 UnwindDests.emplace_back(&getMBB(*EHPadBB), Prob);
2991 UnwindDests.back().first->setIsEHScopeEntry();
2992 UnwindDests.back().first->setIsEHFuncletEntry();
2993 break;
2994 }
2995 if (auto *CatchSwitch = dyn_cast<CatchSwitchInst>(Pad)) {
2996 // Add the catchpad handlers to the possible destinations.
2997 for (const BasicBlock *CatchPadBB : CatchSwitch->handlers()) {
2998 UnwindDests.emplace_back(&getMBB(*CatchPadBB), Prob);
2999 // For MSVC++ and the CLR, catchblocks are funclets and need prologues.
3000 if (IsMSVCCXX || IsCoreCLR)
3001 UnwindDests.back().first->setIsEHFuncletEntry();
3002 if (!IsSEH)
3003 UnwindDests.back().first->setIsEHScopeEntry();
3004 }
3005 NewEHPadBB = CatchSwitch->getUnwindDest();
3006 } else {
3007 continue;
3008 }
3009
3010 BranchProbabilityInfo *BPI = FuncInfo.BPI;
3011 if (BPI && NewEHPadBB)
3012 Prob *= BPI->getEdgeProbability(EHPadBB, NewEHPadBB);
3013 EHPadBB = NewEHPadBB;
3014 }
3015 return true;
3016}
3017
3018bool IRTranslator::translateInvoke(const User &U,
3019 MachineIRBuilder &MIRBuilder) {
3020 const InvokeInst &I = cast<InvokeInst>(U);
3021 MCContext &Context = MF->getContext();
3022
3023 const BasicBlock *ReturnBB = I.getSuccessor(0);
3024 const BasicBlock *EHPadBB = I.getSuccessor(1);
3025
3026 const Function *Fn = I.getCalledFunction();
3027
3028 // FIXME: support invoking patchpoint and statepoint intrinsics.
3029 if (Fn && Fn->isIntrinsic())
3030 return false;
3031
3032 // FIXME: support whatever these are.
3033 if (I.hasDeoptState())
3034 return false;
3035
3036 // FIXME: support control flow guard targets.
3037 if (I.countOperandBundlesOfType(LLVMContext::OB_cfguardtarget))
3038 return false;
3039
3040 // FIXME: support Windows exception handling.
3041 if (!isa<LandingPadInst>(EHPadBB->getFirstNonPHIIt()))
3042 return false;
3043
3044 // FIXME: support Windows dllimport function calls and calls through
3045 // weak symbols.
3046 if (Fn && (Fn->hasDLLImportStorageClass() ||
3047 (MF->getTarget().getTargetTriple().isOSWindows() &&
3048 Fn->hasExternalWeakLinkage())))
3049 return false;
3050
3051 bool LowerInlineAsm = I.isInlineAsm();
3052 bool NeedEHLabel = true;
3053
3054 // Emit the actual call, bracketed by EH_LABELs so that the MF knows about
3055 // the region covered by the try.
3056 MCSymbol *BeginSymbol = nullptr;
3057 if (NeedEHLabel) {
3058 MIRBuilder.buildInstr(TargetOpcode::G_INVOKE_REGION_START);
3059 BeginSymbol = Context.createTempSymbol();
3060 MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(BeginSymbol);
3061 }
3062
3063 if (LowerInlineAsm) {
3064 if (!translateInlineAsm(I, MIRBuilder))
3065 return false;
3066 } else if (!translateCallBase(I, MIRBuilder))
3067 return false;
3068
3069 MCSymbol *EndSymbol = nullptr;
3070 if (NeedEHLabel) {
3071 EndSymbol = Context.createTempSymbol();
3072 MIRBuilder.buildInstr(TargetOpcode::EH_LABEL).addSym(EndSymbol);
3073 }
3074
3076 BranchProbabilityInfo *BPI = FuncInfo.BPI;
3077 MachineBasicBlock *InvokeMBB = &MIRBuilder.getMBB();
3078 BranchProbability EHPadBBProb =
3079 BPI ? BPI->getEdgeProbability(InvokeMBB->getBasicBlock(), EHPadBB)
3081
3082 if (!findUnwindDestinations(EHPadBB, EHPadBBProb, UnwindDests))
3083 return false;
3084
3085 MachineBasicBlock &EHPadMBB = getMBB(*EHPadBB),
3086 &ReturnMBB = getMBB(*ReturnBB);
3087 // Update successor info.
3088 addSuccessorWithProb(InvokeMBB, &ReturnMBB);
3089 for (auto &UnwindDest : UnwindDests) {
3090 UnwindDest.first->setIsEHPad();
3091 addSuccessorWithProb(InvokeMBB, UnwindDest.first, UnwindDest.second);
3092 }
3093 InvokeMBB->normalizeSuccProbs();
3094
3095 if (NeedEHLabel) {
3096 assert(BeginSymbol && "Expected a begin symbol!");
3097 assert(EndSymbol && "Expected an end symbol!");
3098 MF->addInvoke(&EHPadMBB, BeginSymbol, EndSymbol);
3099 }
3100
3101 MIRBuilder.buildBr(ReturnMBB);
3102 return true;
3103}
3104
3105/// The intrinsics currently supported by callbr are implicit control flow
3106/// intrinsics such as amdgcn.kill.
3107bool IRTranslator::translateCallBr(const User &U,
3108 MachineIRBuilder &MIRBuilder) {
3109 if (!mayTranslateUserTypes(U))
3110 return false; // see translateCall
3111
3112 const CallBrInst &I = cast<CallBrInst>(U);
3113 MachineBasicBlock *CallBrMBB = &MIRBuilder.getMBB();
3114
3115 Intrinsic::ID IID = I.getIntrinsicID();
3116 if (I.isInlineAsm()) {
3117 // FIXME: inline asm is not yet supported for callbr in GlobalISel. As soon
3118 // as we add support, we need to handle the indirect asm targets, see
3119 // SelectionDAGBuilder::visitCallBr().
3120 return false;
3121 }
3122 if (!translateIntrinsic(I, IID, MIRBuilder))
3123 return false;
3124
3125 // Retrieve successors.
3126 SmallPtrSet<BasicBlock *, 8> Dests = {I.getDefaultDest()};
3127 MachineBasicBlock *Return = &getMBB(*I.getDefaultDest());
3128
3129 // Update successor info.
3130 addSuccessorWithProb(CallBrMBB, Return, BranchProbability::getOne());
3131
3132 // Add indirect targets as successors. For intrinsic callbr, these represent
3133 // implicit control flow (e.g., the "kill" path for amdgcn.kill). We mark them
3134 // with setIsInlineAsmBrIndirectTarget so the machine verifier accepts them as
3135 // valid successors, even though they're not from inline asm.
3136 for (BasicBlock *Dest : I.getIndirectDests()) {
3137 MachineBasicBlock &Target = getMBB(*Dest);
3138 Target.setIsInlineAsmBrIndirectTarget();
3139 Target.setLabelMustBeEmitted();
3140 // Don't add duplicate machine successors.
3141 if (Dests.insert(Dest).second)
3142 addSuccessorWithProb(CallBrMBB, &Target, BranchProbability::getZero());
3143 }
3144
3145 CallBrMBB->normalizeSuccProbs();
3146
3147 // Drop into default successor.
3148 MIRBuilder.buildBr(*Return);
3149
3150 return true;
3151}
3152
3153bool IRTranslator::translateLandingPad(const User &U,
3154 MachineIRBuilder &MIRBuilder) {
3155 const LandingPadInst &LP = cast<LandingPadInst>(U);
3156
3157 MachineBasicBlock &MBB = MIRBuilder.getMBB();
3158
3159 MBB.setIsEHPad();
3160
3161 // If there aren't registers to copy the values into (e.g., during SjLj
3162 // exceptions), then don't bother.
3163 const Constant *PersonalityFn = MF->getFunction().getPersonalityFn();
3164 if (TLI->getExceptionPointerRegister(PersonalityFn) == 0 &&
3165 TLI->getExceptionSelectorRegister(PersonalityFn) == 0)
3166 return true;
3167
3168 // If landingpad's return type is token type, we don't create DAG nodes
3169 // for its exception pointer and selector value. The extraction of exception
3170 // pointer or selector value from token type landingpads is not currently
3171 // supported.
3172 if (LP.getType()->isTokenTy())
3173 return true;
3174
3175 // Add a label to mark the beginning of the landing pad. Deletion of the
3176 // landing pad can thus be detected via the MachineModuleInfo.
3177 MIRBuilder.buildInstr(TargetOpcode::EH_LABEL)
3178 .addSym(MF->addLandingPad(&MBB));
3179
3180 // If the unwinder does not preserve all registers, ensure that the
3181 // function marks the clobbered registers as used.
3182 const TargetRegisterInfo &TRI = *MF->getSubtarget().getRegisterInfo();
3183 if (auto *RegMask = TRI.getCustomEHPadPreservedMask(*MF))
3184 MF->getRegInfo().addPhysRegsUsedFromRegMask(RegMask);
3185
3186 LLT Ty = getLLTForType(*LP.getType(), *DL);
3187 Register Undef = MRI->createGenericVirtualRegister(Ty);
3188 MIRBuilder.buildUndef(Undef);
3189
3191 for (Type *Ty : cast<StructType>(LP.getType())->elements())
3192 Tys.push_back(getLLTForType(*Ty, *DL));
3193 assert(Tys.size() == 2 && "Only two-valued landingpads are supported");
3194
3195 // Mark exception register as live in.
3196 Register ExceptionReg = TLI->getExceptionPointerRegister(PersonalityFn);
3197 if (!ExceptionReg)
3198 return false;
3199
3200 MBB.addLiveIn(ExceptionReg);
3201 ArrayRef<Register> ResRegs = getOrCreateVRegs(LP);
3202 MIRBuilder.buildCopy(ResRegs[0], ExceptionReg);
3203
3204 Register SelectorReg = TLI->getExceptionSelectorRegister(PersonalityFn);
3205 if (!SelectorReg)
3206 return false;
3207
3208 MBB.addLiveIn(SelectorReg);
3209 Register PtrVReg = MRI->createGenericVirtualRegister(Tys[0]);
3210 MIRBuilder.buildCopy(PtrVReg, SelectorReg);
3211 MIRBuilder.buildCast(ResRegs[1], PtrVReg);
3212
3213 return true;
3214}
3215
3216bool IRTranslator::translateAlloca(const User &U,
3217 MachineIRBuilder &MIRBuilder) {
3218 auto &AI = cast<AllocaInst>(U);
3219
3220 if (AI.isSwiftError())
3221 return true;
3222
3223 if (AI.isStaticAlloca()) {
3224 Register Res = getOrCreateVReg(AI);
3225 int FI = getOrCreateFrameIndex(AI);
3226 MIRBuilder.buildFrameIndex(Res, FI);
3227 return true;
3228 }
3229
3230 // FIXME: support stack probing for Windows.
3231 if (MF->getTarget().getTargetTriple().isOSWindows())
3232 return false;
3233
3234 // Now we're in the harder dynamic case.
3235 Register NumElts = getOrCreateVReg(*AI.getArraySize());
3236 Type *IntPtrIRTy = DL->getIntPtrType(AI.getType());
3237 LLT IntPtrTy = getLLTForType(*IntPtrIRTy, *DL);
3238 if (MRI->getType(NumElts) != IntPtrTy) {
3239 Register ExtElts = MRI->createGenericVirtualRegister(IntPtrTy);
3240 MIRBuilder.buildZExtOrTrunc(ExtElts, NumElts);
3241 NumElts = ExtElts;
3242 }
3243
3244 Type *Ty = AI.getAllocatedType();
3245 TypeSize TySize = DL->getTypeAllocSize(Ty);
3246
3247 Register AllocSize = MRI->createGenericVirtualRegister(IntPtrTy);
3248 Register TySizeReg;
3249 if (TySize.isScalable()) {
3250 // For scalable types, use vscale * min_value
3251 TySizeReg = MRI->createGenericVirtualRegister(IntPtrTy);
3252 MIRBuilder.buildVScale(TySizeReg, TySize.getKnownMinValue());
3253 } else {
3254 // For fixed types, use a constant
3255 TySizeReg =
3256 getOrCreateVReg(*ConstantInt::get(IntPtrIRTy, TySize.getFixedValue()));
3257 }
3258 MIRBuilder.buildMul(AllocSize, NumElts, TySizeReg);
3259
3260 // Round the size of the allocation up to the stack alignment size
3261 // by add SA-1 to the size. This doesn't overflow because we're computing
3262 // an address inside an alloca.
3263 Align StackAlign = MF->getSubtarget().getFrameLowering()->getStackAlign();
3264 auto SAMinusOne = MIRBuilder.buildConstant(IntPtrTy, StackAlign.value() - 1);
3265 auto AllocAdd = MIRBuilder.buildAdd(IntPtrTy, AllocSize, SAMinusOne,
3267 auto AlignCst =
3268 MIRBuilder.buildConstant(IntPtrTy, ~(uint64_t)(StackAlign.value() - 1));
3269 auto AlignedAlloc = MIRBuilder.buildAnd(IntPtrTy, AllocAdd, AlignCst);
3270
3271 Align Alignment = AI.getAlign();
3272 if (Alignment <= StackAlign)
3273 Alignment = Align(1);
3274 MIRBuilder.buildDynStackAlloc(getOrCreateVReg(AI), AlignedAlloc, Alignment);
3275
3276 MF->getFrameInfo().CreateVariableSizedObject(Alignment, &AI);
3277 assert(MF->getFrameInfo().hasVarSizedObjects());
3278 return true;
3279}
3280
3281bool IRTranslator::translateVAArg(const User &U, MachineIRBuilder &MIRBuilder) {
3282 // FIXME: We may need more info about the type. Because of how LLT works,
3283 // we're completely discarding the i64/double distinction here (amongst
3284 // others). Fortunately the ABIs I know of where that matters don't use va_arg
3285 // anyway but that's not guaranteed.
3286 MIRBuilder.buildInstr(TargetOpcode::G_VAARG, {getOrCreateVReg(U)},
3287 {getOrCreateVReg(*U.getOperand(0)),
3288 DL->getABITypeAlign(U.getType()).value()});
3289 return true;
3290}
3291
3292bool IRTranslator::translateUnreachable(const User &U,
3293 MachineIRBuilder &MIRBuilder) {
3294 auto &UI = cast<UnreachableInst>(U);
3295 if (!UI.shouldLowerToTrap(MF->getTarget().Options.TrapUnreachable,
3296 MF->getTarget().Options.NoTrapAfterNoreturn))
3297 return true;
3298
3299 MIRBuilder.buildTrap();
3300 return true;
3301}
3302
3303bool IRTranslator::translateInsertElement(const User &U,
3304 MachineIRBuilder &MIRBuilder) {
3305 // If it is a <1 x Ty> vector, use the scalar as it is
3306 // not a legal vector type in LLT.
3307 if (auto *FVT = dyn_cast<FixedVectorType>(U.getType());
3308 FVT && FVT->getNumElements() == 1)
3309 return translateCopy(U, *U.getOperand(1), MIRBuilder);
3310
3311 Register Res = getOrCreateVReg(U);
3312 Register Val = getOrCreateVReg(*U.getOperand(0));
3313 Register Elt = getOrCreateVReg(*U.getOperand(1));
3314 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3315 Register Idx;
3316 if (auto *CI = dyn_cast<ConstantInt>(U.getOperand(2))) {
3317 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3318 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3319 auto *NewIdxCI = ConstantInt::get(CI->getContext(), NewIdx);
3320 Idx = getOrCreateVReg(*NewIdxCI);
3321 }
3322 }
3323 if (!Idx)
3324 Idx = getOrCreateVReg(*U.getOperand(2));
3325 if (MRI->getType(Idx).getSizeInBits() != PreferredVecIdxWidth) {
3326 const LLT VecIdxTy =
3327 MRI->getType(Idx).changeElementSize(PreferredVecIdxWidth);
3328 Idx = MIRBuilder.buildZExtOrTrunc(VecIdxTy, Idx).getReg(0);
3329 }
3330 MIRBuilder.buildInsertVectorElement(Res, Val, Elt, Idx);
3331 return true;
3332}
3333
3334bool IRTranslator::translateInsertVector(const User &U,
3335 MachineIRBuilder &MIRBuilder) {
3336 Register Dst = getOrCreateVReg(U);
3337 Register Vec = getOrCreateVReg(*U.getOperand(0));
3338 Register Elt = getOrCreateVReg(*U.getOperand(1));
3339
3340 ConstantInt *CI = cast<ConstantInt>(U.getOperand(2));
3341 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3342
3343 // Resize Index to preferred index width.
3344 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3345 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3346 CI = ConstantInt::get(CI->getContext(), NewIdx);
3347 }
3348
3349 // If it is a <1 x Ty> vector, we have to use other means.
3350 if (auto *ResultType = dyn_cast<FixedVectorType>(U.getOperand(1)->getType());
3351 ResultType && ResultType->getNumElements() == 1) {
3352 if (auto *InputType = dyn_cast<FixedVectorType>(U.getOperand(0)->getType());
3353 InputType && InputType->getNumElements() == 1) {
3354 // We are inserting an illegal fixed vector into an illegal
3355 // fixed vector, use the scalar as it is not a legal vector type
3356 // in LLT.
3357 return translateCopy(U, *U.getOperand(0), MIRBuilder);
3358 }
3359 if (isa<FixedVectorType>(U.getOperand(0)->getType())) {
3360 // We are inserting an illegal fixed vector into a legal fixed
3361 // vector, use the scalar as it is not a legal vector type in
3362 // LLT.
3363 Register Idx = getOrCreateVReg(*CI);
3364 MIRBuilder.buildInsertVectorElement(Dst, Vec, Elt, Idx);
3365 return true;
3366 }
3367 if (isa<ScalableVectorType>(U.getOperand(0)->getType())) {
3368 // We are inserting an illegal fixed vector into a scalable
3369 // vector, use a scalar element insert.
3370 LLT VecIdxTy = LLT::scalar(PreferredVecIdxWidth);
3371 Register Idx = getOrCreateVReg(*CI);
3372 auto ScaledIndex = MIRBuilder.buildMul(
3373 VecIdxTy, MIRBuilder.buildVScale(VecIdxTy, 1), Idx);
3374 MIRBuilder.buildInsertVectorElement(Dst, Vec, Elt, ScaledIndex);
3375 return true;
3376 }
3377 }
3378
3379 MIRBuilder.buildInsertSubvector(
3380 getOrCreateVReg(U), getOrCreateVReg(*U.getOperand(0)),
3381 getOrCreateVReg(*U.getOperand(1)), CI->getZExtValue());
3382 return true;
3383}
3384
3385bool IRTranslator::translateExtractElement(const User &U,
3386 MachineIRBuilder &MIRBuilder) {
3387 // If it is a <1 x Ty> vector, use the scalar as it is
3388 // not a legal vector type in LLT.
3389 if (const FixedVectorType *FVT =
3390 dyn_cast<FixedVectorType>(U.getOperand(0)->getType()))
3391 if (FVT->getNumElements() == 1)
3392 return translateCopy(U, *U.getOperand(0), MIRBuilder);
3393
3394 Register Res = getOrCreateVReg(U);
3395 Register Val = getOrCreateVReg(*U.getOperand(0));
3396 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3397 Register Idx;
3398 if (auto *CI = dyn_cast<ConstantInt>(U.getOperand(1))) {
3399 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3400 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3401 auto *NewIdxCI = ConstantInt::get(CI->getContext(), NewIdx);
3402 Idx = getOrCreateVReg(*NewIdxCI);
3403 }
3404 }
3405 if (!Idx)
3406 Idx = getOrCreateVReg(*U.getOperand(1));
3407 if (MRI->getType(Idx).getSizeInBits() != PreferredVecIdxWidth) {
3408 const LLT VecIdxTy =
3409 MRI->getType(Idx).changeElementSize(PreferredVecIdxWidth);
3410 Idx = MIRBuilder.buildZExtOrTrunc(VecIdxTy, Idx).getReg(0);
3411 }
3412 MIRBuilder.buildExtractVectorElement(Res, Val, Idx);
3413 return true;
3414}
3415
3416bool IRTranslator::translateExtractVector(const User &U,
3417 MachineIRBuilder &MIRBuilder) {
3418 Register Res = getOrCreateVReg(U);
3419 Register Vec = getOrCreateVReg(*U.getOperand(0));
3420 ConstantInt *CI = cast<ConstantInt>(U.getOperand(1));
3421 unsigned PreferredVecIdxWidth = TLI->getVectorIdxWidth(*DL);
3422
3423 // Resize Index to preferred index width.
3424 if (CI->getBitWidth() != PreferredVecIdxWidth) {
3425 APInt NewIdx = CI->getValue().zextOrTrunc(PreferredVecIdxWidth);
3426 CI = ConstantInt::get(CI->getContext(), NewIdx);
3427 }
3428
3429 // If it is a <1 x Ty> vector, we have to use other means.
3430 if (auto *ResultType = dyn_cast<FixedVectorType>(U.getType());
3431 ResultType && ResultType->getNumElements() == 1) {
3432 if (auto *InputType = dyn_cast<FixedVectorType>(U.getOperand(0)->getType());
3433 InputType && InputType->getNumElements() == 1) {
3434 // We are extracting an illegal fixed vector from an illegal fixed vector,
3435 // use the scalar as it is not a legal vector type in LLT.
3436 return translateCopy(U, *U.getOperand(0), MIRBuilder);
3437 }
3438 if (isa<FixedVectorType>(U.getOperand(0)->getType())) {
3439 // We are extracting an illegal fixed vector from a legal fixed
3440 // vector, use the scalar as it is not a legal vector type in
3441 // LLT.
3442 Register Idx = getOrCreateVReg(*CI);
3443 MIRBuilder.buildExtractVectorElement(Res, Vec, Idx);
3444 return true;
3445 }
3446 if (isa<ScalableVectorType>(U.getOperand(0)->getType())) {
3447 // We are extracting an illegal fixed vector from a scalable
3448 // vector, use a scalar element extract.
3449 LLT VecIdxTy = LLT::scalar(PreferredVecIdxWidth);
3450 Register Idx = getOrCreateVReg(*CI);
3451 auto ScaledIndex = MIRBuilder.buildMul(
3452 VecIdxTy, MIRBuilder.buildVScale(VecIdxTy, 1), Idx);
3453 MIRBuilder.buildExtractVectorElement(Res, Vec, ScaledIndex);
3454 return true;
3455 }
3456 }
3457
3458 MIRBuilder.buildExtractSubvector(getOrCreateVReg(U),
3459 getOrCreateVReg(*U.getOperand(0)),
3460 CI->getZExtValue());
3461 return true;
3462}
3463
3464bool IRTranslator::translateShuffleVector(const User &U,
3465 MachineIRBuilder &MIRBuilder) {
3466 // A ShuffleVector that operates on scalable vectors is a splat vector where
3467 // the value of the splat vector is the 0th element of the first operand,
3468 // since the index mask operand is the zeroinitializer (undef and
3469 // poison are treated as zeroinitializer here).
3470 if (U.getOperand(0)->getType()->isScalableTy()) {
3471 Register Val = getOrCreateVReg(*U.getOperand(0));
3472 auto SplatVal = MIRBuilder.buildExtractVectorElementConstant(
3473 MRI->getType(Val).getElementType(), Val, 0);
3474 MIRBuilder.buildSplatVector(getOrCreateVReg(U), SplatVal);
3475 return true;
3476 }
3477
3478 ArrayRef<int> Mask;
3479 if (auto *SVI = dyn_cast<ShuffleVectorInst>(&U))
3480 Mask = SVI->getShuffleMask();
3481 else
3482 Mask = cast<ConstantExpr>(U).getShuffleMask();
3483
3484 // As GISel does not represent <1 x > vectors as a separate type from scalars,
3485 // we transform shuffle_vector with a scalar output to an
3486 // ExtractVectorElement. If the input type is also scalar it becomes a Copy.
3487 unsigned DstElts = cast<FixedVectorType>(U.getType())->getNumElements();
3488 unsigned SrcElts =
3489 cast<FixedVectorType>(U.getOperand(0)->getType())->getNumElements();
3490 if (DstElts == 1) {
3491 unsigned M = Mask[0];
3492 if (SrcElts == 1) {
3493 if (M == 0 || M == 1)
3494 return translateCopy(U, *U.getOperand(M), MIRBuilder);
3495 MIRBuilder.buildUndef(getOrCreateVReg(U));
3496 } else {
3497 Register Dst = getOrCreateVReg(U);
3498 if (M < SrcElts) {
3500 Dst, getOrCreateVReg(*U.getOperand(0)), M);
3501 } else if (M < SrcElts * 2) {
3503 Dst, getOrCreateVReg(*U.getOperand(1)), M - SrcElts);
3504 } else {
3505 MIRBuilder.buildUndef(Dst);
3506 }
3507 }
3508 return true;
3509 }
3510
3511 // A single element src is transformed to a build_vector.
3512 if (SrcElts == 1) {
3515 for (int M : Mask) {
3516 LLT SrcTy = getLLTForType(*U.getOperand(0)->getType(), *DL);
3517 if (M == 0 || M == 1) {
3518 Ops.push_back(getOrCreateVReg(*U.getOperand(M)));
3519 } else {
3520 if (!Undef.isValid()) {
3521 Undef = MRI->createGenericVirtualRegister(SrcTy);
3522 MIRBuilder.buildUndef(Undef);
3523 }
3524 Ops.push_back(Undef);
3525 }
3526 }
3527 MIRBuilder.buildBuildVector(getOrCreateVReg(U), Ops);
3528 return true;
3529 }
3530
3531 ArrayRef<int> MaskAlloc = MF->allocateShuffleMask(Mask);
3532 MIRBuilder
3533 .buildInstr(TargetOpcode::G_SHUFFLE_VECTOR, {getOrCreateVReg(U)},
3534 {getOrCreateVReg(*U.getOperand(0)),
3535 getOrCreateVReg(*U.getOperand(1))})
3536 .addShuffleMask(MaskAlloc);
3537 return true;
3538}
3539
3540bool IRTranslator::translatePHI(const User &U, MachineIRBuilder &MIRBuilder) {
3541 const PHINode &PI = cast<PHINode>(U);
3542
3543 SmallVector<MachineInstr *, 4> Insts;
3544 for (auto Reg : getOrCreateVRegs(PI)) {
3545 auto MIB = MIRBuilder.buildInstr(TargetOpcode::G_PHI, {Reg}, {});
3546 Insts.push_back(MIB.getInstr());
3547 }
3548
3549 PendingPHIs.emplace_back(&PI, std::move(Insts));
3550 return true;
3551}
3552
3553bool IRTranslator::translateAtomicCmpXchg(const User &U,
3554 MachineIRBuilder &MIRBuilder) {
3555 const AtomicCmpXchgInst &I = cast<AtomicCmpXchgInst>(U);
3556
3557 auto Flags = TLI->getAtomicMemOperandFlags(I, *DL);
3558
3559 auto Res = getOrCreateVRegs(I);
3560 Register OldValRes = Res[0];
3561 Register SuccessRes = Res[1];
3562 Register Addr = getOrCreateVReg(*I.getPointerOperand());
3563 Register Cmp = getOrCreateVReg(*I.getCompareOperand());
3564 Register NewVal = getOrCreateVReg(*I.getNewValOperand());
3565
3567 OldValRes, SuccessRes, Addr, Cmp, NewVal,
3568 *MF->getMachineMemOperand(
3569 MachinePointerInfo(I.getPointerOperand()), Flags, MRI->getType(Cmp),
3570 getMemOpAlign(I), I.getAAMetadata(), nullptr, I.getSyncScopeID(),
3571 I.getSuccessOrdering(), I.getFailureOrdering()));
3572 return true;
3573}
3574
3575bool IRTranslator::translateAtomicRMW(const User &U,
3576 MachineIRBuilder &MIRBuilder) {
3577 if (!mayTranslateUserTypes(U))
3578 return false;
3579
3580 const AtomicRMWInst &I = cast<AtomicRMWInst>(U);
3581 auto Flags = TLI->getAtomicMemOperandFlags(I, *DL);
3582
3583 Register Res = getOrCreateVReg(I);
3584 Register Addr = getOrCreateVReg(*I.getPointerOperand());
3585 Register Val = getOrCreateVReg(*I.getValOperand());
3586
3587 unsigned Opcode = 0;
3588 switch (I.getOperation()) {
3589 default:
3590 return false;
3592 Opcode = TargetOpcode::G_ATOMICRMW_XCHG;
3593 break;
3594 case AtomicRMWInst::Add:
3595 Opcode = TargetOpcode::G_ATOMICRMW_ADD;
3596 break;
3597 case AtomicRMWInst::Sub:
3598 Opcode = TargetOpcode::G_ATOMICRMW_SUB;
3599 break;
3600 case AtomicRMWInst::And:
3601 Opcode = TargetOpcode::G_ATOMICRMW_AND;
3602 break;
3604 Opcode = TargetOpcode::G_ATOMICRMW_NAND;
3605 break;
3606 case AtomicRMWInst::Or:
3607 Opcode = TargetOpcode::G_ATOMICRMW_OR;
3608 break;
3609 case AtomicRMWInst::Xor:
3610 Opcode = TargetOpcode::G_ATOMICRMW_XOR;
3611 break;
3612 case AtomicRMWInst::Max:
3613 Opcode = TargetOpcode::G_ATOMICRMW_MAX;
3614 break;
3615 case AtomicRMWInst::Min:
3616 Opcode = TargetOpcode::G_ATOMICRMW_MIN;
3617 break;
3619 Opcode = TargetOpcode::G_ATOMICRMW_UMAX;
3620 break;
3622 Opcode = TargetOpcode::G_ATOMICRMW_UMIN;
3623 break;
3625 Opcode = TargetOpcode::G_ATOMICRMW_FADD;
3626 break;
3628 Opcode = TargetOpcode::G_ATOMICRMW_FSUB;
3629 break;
3631 Opcode = TargetOpcode::G_ATOMICRMW_FMAX;
3632 break;
3634 Opcode = TargetOpcode::G_ATOMICRMW_FMIN;
3635 break;
3637 Opcode = TargetOpcode::G_ATOMICRMW_FMAXIMUM;
3638 break;
3640 Opcode = TargetOpcode::G_ATOMICRMW_FMINIMUM;
3641 break;
3643 Opcode = TargetOpcode::G_ATOMICRMW_FMAXIMUMNUM;
3644 break;
3646 Opcode = TargetOpcode::G_ATOMICRMW_FMINIMUMNUM;
3647 break;
3649 Opcode = TargetOpcode::G_ATOMICRMW_UINC_WRAP;
3650 break;
3652 Opcode = TargetOpcode::G_ATOMICRMW_UDEC_WRAP;
3653 break;
3655 Opcode = TargetOpcode::G_ATOMICRMW_USUB_COND;
3656 break;
3658 Opcode = TargetOpcode::G_ATOMICRMW_USUB_SAT;
3659 break;
3660 }
3661
3662 MIRBuilder.buildAtomicRMW(
3663 Opcode, Res, Addr, Val,
3664 *MF->getMachineMemOperand(MachinePointerInfo(I.getPointerOperand()),
3665 Flags, MRI->getType(Val), getMemOpAlign(I),
3666 I.getAAMetadata(), nullptr, I.getSyncScopeID(),
3667 I.getOrdering()));
3668 return true;
3669}
3670
3671bool IRTranslator::translateFence(const User &U,
3672 MachineIRBuilder &MIRBuilder) {
3673 const FenceInst &Fence = cast<FenceInst>(U);
3674 MIRBuilder.buildFence(static_cast<unsigned>(Fence.getOrdering()),
3675 Fence.getSyncScopeID());
3676 return true;
3677}
3678
3679bool IRTranslator::translateFreeze(const User &U,
3680 MachineIRBuilder &MIRBuilder) {
3681 const ArrayRef<Register> DstRegs = getOrCreateVRegs(U);
3682 const ArrayRef<Register> SrcRegs = getOrCreateVRegs(*U.getOperand(0));
3683
3684 assert(DstRegs.size() == SrcRegs.size() &&
3685 "Freeze with different source and destination type?");
3686
3687 for (unsigned I = 0; I < DstRegs.size(); ++I) {
3688 MIRBuilder.buildFreeze(DstRegs[I], SrcRegs[I]);
3689 }
3690
3691 return true;
3692}
3693
3694void IRTranslator::finishPendingPhis() {
3695#ifndef NDEBUG
3696 DILocationVerifier Verifier;
3697 GISelObserverWrapper WrapperObserver(&Verifier);
3698 RAIIMFObsDelInstaller ObsInstall(*MF, WrapperObserver);
3699#endif // ifndef NDEBUG
3700 for (auto &Phi : PendingPHIs) {
3701 const PHINode *PI = Phi.first;
3702 if (PI->getType()->isEmptyTy())
3703 continue;
3704 ArrayRef<MachineInstr *> ComponentPHIs = Phi.second;
3705 MachineBasicBlock *PhiMBB = ComponentPHIs[0]->getParent();
3706 EntryBuilder->setDebugLoc(PI->getDebugLoc());
3707#ifndef NDEBUG
3708 Verifier.setCurrentInst(PI);
3709#endif // ifndef NDEBUG
3710
3711 SmallPtrSet<const MachineBasicBlock *, 16> SeenPreds;
3712 for (unsigned i = 0; i < PI->getNumIncomingValues(); ++i) {
3713 auto IRPred = PI->getIncomingBlock(i);
3714 ArrayRef<Register> ValRegs = getOrCreateVRegs(*PI->getIncomingValue(i));
3715 for (auto *Pred : getMachinePredBBs({IRPred, PI->getParent()})) {
3716 if (SeenPreds.count(Pred) || !PhiMBB->isPredecessor(Pred))
3717 continue;
3718 SeenPreds.insert(Pred);
3719 for (unsigned j = 0; j < ValRegs.size(); ++j) {
3720 MachineInstrBuilder MIB(*MF, ComponentPHIs[j]);
3721 MIB.addUse(ValRegs[j]);
3722 MIB.addMBB(Pred);
3723 }
3724 }
3725 }
3726 }
3727}
3728
3729void IRTranslator::translateDbgValueRecord(Value *V, bool HasArgList,
3730 const DILocalVariable *Variable,
3731 const DIExpression *Expression,
3732 const DebugLoc &DL,
3733 MachineIRBuilder &MIRBuilder) {
3734 assert(Variable->isValidLocationForIntrinsic(DL) &&
3735 "Expected inlined-at fields to agree");
3736 // Act as if we're handling a debug intrinsic.
3737 MIRBuilder.setDebugLoc(DL);
3738
3739 if (!V || HasArgList) {
3740 // DI cannot produce a valid DBG_VALUE, so produce an undef DBG_VALUE to
3741 // terminate any prior location.
3742 MIRBuilder.buildIndirectDbgValue(0, Variable, Expression);
3743 return;
3744 }
3745
3746 if (const auto *CI = dyn_cast<Constant>(V)) {
3747 MIRBuilder.buildConstDbgValue(*CI, Variable, Expression);
3748 return;
3749 }
3750
3751 if (auto *AI = dyn_cast<AllocaInst>(V);
3752 AI && AI->isStaticAlloca() && Expression->startsWithDeref()) {
3753 // If the value is an alloca and the expression starts with a
3754 // dereference, track a stack slot instead of a register, as registers
3755 // may be clobbered.
3756 auto ExprOperands = Expression->getElements();
3757 auto *ExprDerefRemoved =
3758 DIExpression::get(AI->getContext(), ExprOperands.drop_front());
3759 MIRBuilder.buildFIDbgValue(getOrCreateFrameIndex(*AI), Variable,
3760 ExprDerefRemoved);
3761 return;
3762 }
3763 if (translateIfEntryValueArgument(false, V, Variable, Expression, DL,
3764 MIRBuilder))
3765 return;
3766 for (Register Reg : getOrCreateVRegs(*V)) {
3767 // FIXME: This does not handle register-indirect values at offset 0. The
3768 // direct/indirect thing shouldn't really be handled by something as
3769 // implicit as reg+noreg vs reg+imm in the first place, but it seems
3770 // pretty baked in right now.
3771 MIRBuilder.buildDirectDbgValue(Reg, Variable, Expression);
3772 }
3773}
3774
3775void IRTranslator::translateDbgDeclareRecord(Value *Address, bool HasArgList,
3776 const DILocalVariable *Variable,
3777 const DIExpression *Expression,
3778 const DebugLoc &DL,
3779 MachineIRBuilder &MIRBuilder) {
3780 if (!Address || isa<UndefValue>(Address)) {
3781 LLVM_DEBUG(dbgs() << "Dropping debug info for " << *Variable << "\n");
3782 return;
3783 }
3784
3785 assert(Variable->isValidLocationForIntrinsic(DL) &&
3786 "Expected inlined-at fields to agree");
3787 auto AI = dyn_cast<AllocaInst>(Address);
3788 if (AI && AI->isStaticAlloca()) {
3789 // Static allocas are tracked at the MF level, no need for DBG_VALUE
3790 // instructions (in fact, they get ignored if they *do* exist).
3791 MF->setVariableDbgInfo(Variable, Expression,
3792 getOrCreateFrameIndex(*AI), DL);
3793 return;
3794 }
3795
3796 if (translateIfEntryValueArgument(true, Address, Variable,
3797 Expression, DL,
3798 MIRBuilder))
3799 return;
3800
3801 // A dbg.declare describes the address of a source variable, so lower it
3802 // into an indirect DBG_VALUE.
3803 MIRBuilder.setDebugLoc(DL);
3804 MIRBuilder.buildIndirectDbgValue(getOrCreateVReg(*Address), Variable,
3805 Expression);
3806}
3807
3808void IRTranslator::translateDbgInfo(const Instruction &Inst,
3809 MachineIRBuilder &MIRBuilder) {
3810 for (DbgRecord &DR : Inst.getDbgRecordRange()) {
3811 if (DbgLabelRecord *DLR = dyn_cast<DbgLabelRecord>(&DR)) {
3812 MIRBuilder.setDebugLoc(DLR->getDebugLoc());
3813 assert(DLR->getLabel() && "Missing label");
3814 assert(DLR->getLabel()->isValidLocationForIntrinsic(
3815 MIRBuilder.getDebugLoc()) &&
3816 "Expected inlined-at fields to agree");
3817 MIRBuilder.buildDbgLabel(DLR->getLabel());
3818 continue;
3819 }
3820 DbgVariableRecord &DVR = cast<DbgVariableRecord>(DR);
3821 const DILocalVariable *Variable = DVR.getVariable();
3822 const DIExpression *Expression = DVR.getExpression();
3823 Value *V = DVR.getVariableLocationOp(0);
3824 if (DVR.isDbgDeclare())
3825 translateDbgDeclareRecord(V, DVR.hasArgList(), Variable, Expression,
3826 DVR.getDebugLoc(), MIRBuilder);
3827 else
3828 translateDbgValueRecord(V, DVR.hasArgList(), Variable, Expression,
3829 DVR.getDebugLoc(), MIRBuilder);
3830 }
3831}
3832
3833bool IRTranslator::translate(const Instruction &Inst) {
3834 CurBuilder->setDebugLoc(Inst.getDebugLoc());
3835 CurBuilder->setPCSections(Inst.getMetadata(LLVMContext::MD_pcsections));
3836 CurBuilder->setMMRAMetadata(Inst.getMetadata(LLVMContext::MD_mmra));
3837
3838 if (TLI->fallBackToDAGISel(Inst))
3839 return false;
3840
3841 switch (Inst.getOpcode()) {
3842#define HANDLE_INST(NUM, OPCODE, CLASS) \
3843 case Instruction::OPCODE: \
3844 return translate##OPCODE(Inst, *CurBuilder.get());
3845#include "llvm/IR/Instruction.def"
3846 default:
3847 return false;
3848 }
3849}
3850
3851bool IRTranslator::translate(const Constant &C, Register Reg) {
3852 // We only emit constants into the entry block from here. To prevent jumpy
3853 // debug behaviour remove debug line.
3854 if (auto CurrInstDL = CurBuilder->getDL())
3855 EntryBuilder->setDebugLoc(DebugLoc());
3856
3857 if (auto CI = dyn_cast<ConstantInt>(&C)) {
3858 // buildConstant expects a to-be-splatted scalar ConstantInt.
3859 if (isa<VectorType>(CI->getType()))
3860 CI = ConstantInt::get(CI->getContext(), CI->getValue());
3861 EntryBuilder->buildConstant(Reg, *CI);
3862 } else if (auto CB = dyn_cast<ConstantByte>(&C)) {
3863 // Byte constants share G_CONSTANT with integers; the destination Reg's
3864 // LLT (an integer LLT, see getLLTForType) determines vector splatting.
3865 EntryBuilder->buildConstant(Reg, CB->getValue());
3866 } else if (auto CF = dyn_cast<ConstantFP>(&C)) {
3867 // buildFConstant expects a to-be-splatted scalar ConstantFP.
3868 if (isa<VectorType>(CF->getType()))
3869 CF = ConstantFP::get(CF->getContext(), CF->getValue());
3870 EntryBuilder->buildFConstant(Reg, *CF);
3871 } else if (isa<UndefValue>(C))
3872 EntryBuilder->buildUndef(Reg);
3873 else if (isa<ConstantPointerNull>(C))
3874 EntryBuilder->buildConstant(Reg, 0);
3875 else if (auto GV = dyn_cast<GlobalValue>(&C))
3876 EntryBuilder->buildGlobalValue(Reg, GV);
3877 else if (auto CPA = dyn_cast<ConstantPtrAuth>(&C)) {
3878 Register Addr = getOrCreateVReg(*CPA->getPointer());
3879 Register AddrDisc = getOrCreateVReg(*CPA->getAddrDiscriminator());
3880 EntryBuilder->buildConstantPtrAuth(Reg, CPA, Addr, AddrDisc);
3881 } else if (auto CAZ = dyn_cast<ConstantAggregateZero>(&C)) {
3882 Constant &Elt = *CAZ->getElementValue(0u);
3883 if (isa<ScalableVectorType>(CAZ->getType())) {
3884 EntryBuilder->buildSplatVector(Reg, getOrCreateVReg(Elt));
3885 return true;
3886 }
3887 // Return the scalar if it is a <1 x Ty> vector.
3888 unsigned NumElts = CAZ->getElementCount().getFixedValue();
3889 if (NumElts == 1)
3890 return translateCopy(C, Elt, *EntryBuilder);
3891 // All elements are zero so we can just use the first one.
3892 EntryBuilder->buildSplatBuildVector(Reg, getOrCreateVReg(Elt));
3893 } else if (auto CV = dyn_cast<ConstantDataVector>(&C)) {
3894 // Return the scalar if it is a <1 x Ty> vector.
3895 if (CV->getNumElements() == 1)
3896 return translateCopy(C, *CV->getElementAsConstant(0), *EntryBuilder);
3898 for (unsigned i = 0; i < CV->getNumElements(); ++i) {
3899 Constant &Elt = *CV->getElementAsConstant(i);
3900 Ops.push_back(getOrCreateVReg(Elt));
3901 }
3902 EntryBuilder->buildBuildVector(Reg, Ops);
3903 } else if (auto CE = dyn_cast<ConstantExpr>(&C)) {
3904 switch(CE->getOpcode()) {
3905#define HANDLE_INST(NUM, OPCODE, CLASS) \
3906 case Instruction::OPCODE: \
3907 return translate##OPCODE(*CE, *EntryBuilder.get());
3908#include "llvm/IR/Instruction.def"
3909 default:
3910 return false;
3911 }
3912 } else if (auto CV = dyn_cast<ConstantVector>(&C)) {
3913 if (CV->getNumOperands() == 1)
3914 return translateCopy(C, *CV->getOperand(0), *EntryBuilder);
3916 for (unsigned i = 0; i < CV->getNumOperands(); ++i) {
3917 Ops.push_back(getOrCreateVReg(*CV->getOperand(i)));
3918 }
3919 EntryBuilder->buildBuildVector(Reg, Ops);
3920 } else if (auto *BA = dyn_cast<BlockAddress>(&C)) {
3921 EntryBuilder->buildBlockAddress(Reg, BA);
3922 } else
3923 return false;
3924
3925 return true;
3926}
3927
3928bool IRTranslator::mayTranslateUserTypes(const User &U) const {
3929 const TargetMachine &TM = TLI->getTargetMachine();
3930 if (LLT::getUseExtended())
3931 return true;
3932
3933 // BF16 cannot currently be represented by default LLT. To avoid miscompiles
3934 // we prevent any instructions using them by default in all targets that do
3935 // not explicitly enable it via LLT::setUseExtended(true).
3936 // SPIRV target is exception.
3937 return TM.getTargetTriple().isSPIRV() ||
3938 (!U.getType()->getScalarType()->isBFloatTy() &&
3939 !any_of(U.operands(), [](Value *V) {
3940 return V->getType()->getScalarType()->isBFloatTy();
3941 }));
3942}
3943
3944bool IRTranslator::finalizeBasicBlock(const BasicBlock &BB,
3946 for (auto &BTB : SL->BitTestCases) {
3947 // Emit header first, if it wasn't already emitted.
3948 if (!BTB.Emitted)
3949 emitBitTestHeader(BTB, BTB.Parent);
3950
3951 BranchProbability UnhandledProb = BTB.Prob;
3952 for (unsigned j = 0, ej = BTB.Cases.size(); j != ej; ++j) {
3953 UnhandledProb -= BTB.Cases[j].ExtraProb;
3954 // Set the current basic block to the mbb we wish to insert the code into
3955 MachineBasicBlock *MBB = BTB.Cases[j].ThisBB;
3956 // If all cases cover a contiguous range, it is not necessary to jump to
3957 // the default block after the last bit test fails. This is because the
3958 // range check during bit test header creation has guaranteed that every
3959 // case here doesn't go outside the range. In this case, there is no need
3960 // to perform the last bit test, as it will always be true. Instead, make
3961 // the second-to-last bit-test fall through to the target of the last bit
3962 // test, and delete the last bit test.
3963
3964 MachineBasicBlock *NextMBB;
3965 if ((BTB.ContiguousRange || BTB.FallthroughUnreachable) && j + 2 == ej) {
3966 // Second-to-last bit-test with contiguous range: fall through to the
3967 // target of the final bit test.
3968 NextMBB = BTB.Cases[j + 1].TargetBB;
3969 } else if (j + 1 == ej) {
3970 // For the last bit test, fall through to Default.
3971 NextMBB = BTB.Default;
3972 } else {
3973 // Otherwise, fall through to the next bit test.
3974 NextMBB = BTB.Cases[j + 1].ThisBB;
3975 }
3976
3977 emitBitTestCase(BTB, NextMBB, UnhandledProb, BTB.Reg, BTB.Cases[j], MBB);
3978
3979 if ((BTB.ContiguousRange || BTB.FallthroughUnreachable) && j + 2 == ej) {
3980 // We need to record the replacement phi edge here that normally
3981 // happens in emitBitTestCase before we delete the case, otherwise the
3982 // phi edge will be lost.
3983 addMachineCFGPred({BTB.Parent->getBasicBlock(),
3984 BTB.Cases[ej - 1].TargetBB->getBasicBlock()},
3985 MBB);
3986 // Since we're not going to use the final bit test, remove it.
3987 BTB.Cases.pop_back();
3988 break;
3989 }
3990 }
3991 // This is "default" BB. We have two jumps to it. From "header" BB and from
3992 // last "case" BB, unless the latter was skipped.
3993 CFGEdge HeaderToDefaultEdge = {BTB.Parent->getBasicBlock(),
3994 BTB.Default->getBasicBlock()};
3995 addMachineCFGPred(HeaderToDefaultEdge, BTB.Parent);
3996 if (!BTB.ContiguousRange) {
3997 addMachineCFGPred(HeaderToDefaultEdge, BTB.Cases.back().ThisBB);
3998 }
3999 }
4000 SL->BitTestCases.clear();
4001
4002 for (auto &JTCase : SL->JTCases) {
4003 // Emit header first, if it wasn't already emitted.
4004 if (!JTCase.first.Emitted)
4005 emitJumpTableHeader(JTCase.second, JTCase.first, JTCase.first.HeaderBB);
4006
4007 emitJumpTable(JTCase.second, JTCase.second.MBB);
4008 }
4009 SL->JTCases.clear();
4010
4011 for (auto &SwCase : SL->SwitchCases)
4012 emitSwitchCase(SwCase, &CurBuilder->getMBB(), *CurBuilder);
4013 SL->SwitchCases.clear();
4014
4015 // Check if we need to generate stack-protector guard checks.
4016 StackProtector &SP = getAnalysis<StackProtector>();
4017 if (SP.shouldEmitSDCheck(BB)) {
4018 bool FunctionBasedInstrumentation =
4019 TLI->getSSPStackGuardCheck(*MF->getFunction().getParent(), *Libcalls);
4020 SPDescriptor.initialize(&BB, &MBB, FunctionBasedInstrumentation);
4021 }
4022 // Handle stack protector.
4023 if (SPDescriptor.shouldEmitFunctionBasedCheckStackProtector()) {
4024 LLVM_DEBUG(dbgs() << "Unimplemented stack protector case\n");
4025 return false;
4026 } else if (SPDescriptor.shouldEmitStackProtector()) {
4027 MachineBasicBlock *ParentMBB = SPDescriptor.getParentMBB();
4028 MachineBasicBlock *SuccessMBB = SPDescriptor.getSuccessMBB();
4029
4030 // Find the split point to split the parent mbb. At the same time copy all
4031 // physical registers used in the tail of parent mbb into virtual registers
4032 // before the split point and back into physical registers after the split
4033 // point. This prevents us needing to deal with Live-ins and many other
4034 // register allocation issues caused by us splitting the parent mbb. The
4035 // register allocator will clean up said virtual copies later on.
4037 ParentMBB, *MF->getSubtarget().getInstrInfo());
4038
4039 // Splice the terminator of ParentMBB into SuccessMBB.
4040 SuccessMBB->splice(SuccessMBB->end(), ParentMBB, SplitPoint,
4041 ParentMBB->end());
4042
4043 // Add compare/jump on neq/jump to the parent BB.
4044 if (!emitSPDescriptorParent(SPDescriptor, ParentMBB))
4045 return false;
4046
4047 // CodeGen Failure MBB if we have not codegened it yet.
4048 MachineBasicBlock *FailureMBB = SPDescriptor.getFailureMBB();
4049 if (FailureMBB->empty()) {
4050 if (!emitSPDescriptorFailure(SPDescriptor, FailureMBB))
4051 return false;
4052 }
4053
4054 // Clear the Per-BB State.
4055 SPDescriptor.resetPerBBState();
4056 }
4057 return true;
4058}
4059
4060bool IRTranslator::emitSPDescriptorParent(StackProtectorDescriptor &SPD,
4061 MachineBasicBlock *ParentBB) {
4062 CurBuilder->setInsertPt(*ParentBB, ParentBB->end());
4063 // First create the loads to the guard/stack slot for the comparison.
4064 Type *PtrIRTy = PointerType::getUnqual(MF->getFunction().getContext());
4065 const LLT PtrTy = getLLTForType(*PtrIRTy, *DL);
4066 LLT PtrMemTy = getLLTForMVT(TLI->getPointerMemTy(*DL));
4067
4068 MachineFrameInfo &MFI = ParentBB->getParent()->getFrameInfo();
4069 int FI = MFI.getStackProtectorIndex();
4070
4071 Register Guard;
4072 Register StackSlotPtr = CurBuilder->buildFrameIndex(PtrTy, FI).getReg(0);
4073 const Module &M = *ParentBB->getParent()->getFunction().getParent();
4074 Align Align = DL->getPrefTypeAlign(PointerType::getUnqual(M.getContext()));
4075
4076 // Generate code to load the content of the guard slot.
4077 Register GuardVal =
4078 CurBuilder
4079 ->buildLoad(PtrMemTy, StackSlotPtr,
4080 MachinePointerInfo::getFixedStack(*MF, FI), Align,
4082 .getReg(0);
4083
4084 if (TLI->useStackGuardXorFP()) {
4085 LLVM_DEBUG(dbgs() << "Stack protector xor'ing with FP not yet implemented");
4086 return false;
4087 }
4088
4089 // Retrieve guard check function, nullptr if instrumentation is inlined.
4090 if (const Function *GuardCheckFn = TLI->getSSPStackGuardCheck(M, *Libcalls)) {
4091 // This path is currently untestable on GlobalISel, since the only platform
4092 // that needs this seems to be Windows, and we fall back on that currently.
4093 // The code still lives here in case that changes.
4094 // Silence warning about unused variable until the code below that uses
4095 // 'GuardCheckFn' is enabled.
4096 (void)GuardCheckFn;
4097 return false;
4098#if 0
4099 // The target provides a guard check function to validate the guard value.
4100 // Generate a call to that function with the content of the guard slot as
4101 // argument.
4102 FunctionType *FnTy = GuardCheckFn->getFunctionType();
4103 assert(FnTy->getNumParams() == 1 && "Invalid function signature");
4104 ISD::ArgFlagsTy Flags;
4105 if (GuardCheckFn->hasAttribute(1, Attribute::AttrKind::InReg))
4106 Flags.setInReg();
4107 CallLowering::ArgInfo GuardArgInfo(
4108 {GuardVal, FnTy->getParamType(0), {Flags}});
4109
4110 CallLowering::CallLoweringInfo Info;
4111 Info.OrigArgs.push_back(GuardArgInfo);
4112 Info.CallConv = GuardCheckFn->getCallingConv();
4113 Info.Callee = MachineOperand::CreateGA(GuardCheckFn, 0);
4114 Info.OrigRet = {Register(), FnTy->getReturnType()};
4115 if (!CLI->lowerCall(MIRBuilder, Info)) {
4116 LLVM_DEBUG(dbgs() << "Failed to lower call to stack protector check\n");
4117 return false;
4118 }
4119 return true;
4120#endif
4121 }
4122
4123 // If useLoadStackGuardNode returns true, generate LOAD_STACK_GUARD.
4124 // Otherwise, emit a volatile load to retrieve the stack guard value.
4125 if (TLI->useLoadStackGuardNode(*ParentBB->getBasicBlock()->getModule())) {
4126 Guard =
4127 MRI->createGenericVirtualRegister(LLT::scalar(PtrTy.getSizeInBits()));
4128 getStackGuard(Guard, *CurBuilder);
4129 } else {
4130 // TODO: test using android subtarget when we support @llvm.thread.pointer.
4131 const Value *IRGuard = TLI->getSDagStackGuard(M, *Libcalls);
4132 Register GuardPtr = getOrCreateVReg(*IRGuard);
4133
4134 Guard = CurBuilder
4135 ->buildLoad(PtrMemTy, GuardPtr,
4136 MachinePointerInfo::getFixedStack(*MF, FI), Align,
4139 .getReg(0);
4140 }
4141
4142 // Perform the comparison.
4143 auto Cmp =
4144 CurBuilder->buildICmp(CmpInst::ICMP_NE, LLT::integer(1), Guard, GuardVal);
4145 // If the guard/stackslot do not equal, branch to failure MBB.
4146 CurBuilder->buildBrCond(Cmp, *SPD.getFailureMBB());
4147 // Otherwise branch to success MBB.
4148 CurBuilder->buildBr(*SPD.getSuccessMBB());
4149 return true;
4150}
4151
4152bool IRTranslator::emitSPDescriptorFailure(StackProtectorDescriptor &SPD,
4153 MachineBasicBlock *FailureBB) {
4154 const RTLIB::LibcallImpl LibcallImpl =
4155 Libcalls->getLibcallImpl(RTLIB::STACKPROTECTOR_CHECK_FAIL);
4156 if (LibcallImpl == RTLIB::Unsupported)
4157 return false;
4158
4159 CurBuilder->setInsertPt(*FailureBB, FailureBB->end());
4160
4161 CallLowering::CallLoweringInfo Info;
4162 Info.CallConv = Libcalls->getLibcallImplCallingConv(LibcallImpl);
4163
4164 StringRef LibcallName =
4166 Info.Callee = MachineOperand::CreateES(LibcallName.data());
4167 Info.OrigRet = {Register(), Type::getVoidTy(MF->getFunction().getContext()),
4168 0};
4169 if (!CLI->lowerCall(*CurBuilder, Info)) {
4170 LLVM_DEBUG(dbgs() << "Failed to lower call to stack protector fail\n");
4171 return false;
4172 }
4173
4174 // Emit a trap instruction if we are required to do so.
4175 const TargetOptions &TargetOpts = TLI->getTargetMachine().Options;
4176 if (TargetOpts.TrapUnreachable && !TargetOpts.NoTrapAfterNoreturn)
4177 CurBuilder->buildInstr(TargetOpcode::G_TRAP);
4178
4179 return true;
4180}
4181
4182void IRTranslator::finalizeFunction() {
4183 // Release the memory used by the different maps we
4184 // needed during the translation.
4185 PendingPHIs.clear();
4186 VMap.reset();
4187 FrameIndices.clear();
4188 MachinePreds.clear();
4189 // MachineIRBuilder::DebugLoc can outlive the DILocation it holds. Clear it
4190 // to avoid accessing free’d memory (in runOnMachineFunction) and to avoid
4191 // destroying it twice (in ~IRTranslator() and ~LLVMContext())
4192 EntryBuilder.reset();
4193 CurBuilder.reset();
4194 FuncInfo.clear();
4195 SPDescriptor.resetPerFunctionState();
4196}
4197
4198/// Returns true if a BasicBlock \p BB within a variadic function contains a
4199/// variadic musttail call.
4200static bool checkForMustTailInVarArgFn(bool IsVarArg, const BasicBlock &BB) {
4201 if (!IsVarArg)
4202 return false;
4203
4204 // Walk the block backwards, because tail calls usually only appear at the end
4205 // of a block.
4206 return llvm::any_of(llvm::reverse(BB), [](const Instruction &I) {
4207 const auto *CI = dyn_cast<CallInst>(&I);
4208 return CI && CI->isMustTailCall();
4209 });
4210}
4211
4213 MF = &CurMF;
4214 const Function &F = MF->getFunction();
4215 ORE = std::make_unique<OptimizationRemarkEmitter>(&F);
4216 CLI = MF->getSubtarget().getCallLowering();
4217
4218 if (CLI->fallBackToDAGISel(*MF)) {
4219 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4220 F.getSubprogram(), &F.getEntryBlock());
4221 R << "unable to lower function: "
4222 << ore::NV("Prototype", F.getFunctionType());
4223
4224 reportTranslationError(*MF, *ORE, R);
4225 return false;
4226 }
4227
4230 // Set the CSEConfig and run the analysis.
4231 GISelCSEInfo *CSEInfo = nullptr;
4233
4234 bool EnableCSE = EnableCSEInIRTranslator.getNumOccurrences()
4236 : TPC->isGISelCSEEnabled();
4237
4238 const TargetSubtargetInfo &Subtarget = MF->getSubtarget();
4239 TLI = Subtarget.getTargetLowering();
4240
4241 if (EnableCSE) {
4242 EntryBuilder = std::make_unique<CSEMIRBuilder>(CurMF);
4243 CSEInfo = &Wrapper.get(TPC->getCSEConfig());
4244 EntryBuilder->setCSEInfo(CSEInfo);
4245 CurBuilder = std::make_unique<CSEMIRBuilder>(CurMF);
4246 CurBuilder->setCSEInfo(CSEInfo);
4247 } else {
4248 EntryBuilder = std::make_unique<MachineIRBuilder>();
4249 CurBuilder = std::make_unique<MachineIRBuilder>();
4250 }
4251 CLI = Subtarget.getCallLowering();
4252 CurBuilder->setMF(*MF);
4253 EntryBuilder->setMF(*MF);
4254 MRI = &MF->getRegInfo();
4255 DL = &F.getDataLayout();
4256 const TargetMachine &TM = MF->getTarget();
4258 EnableOpts = OptLevel != CodeGenOptLevel::None && !skipFunction(F);
4259 FuncInfo.MF = MF;
4260 if (EnableOpts) {
4261 AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();
4262 FuncInfo.BPI = &getAnalysis<BranchProbabilityInfoWrapperPass>().getBPI();
4263 AC = &getAnalysis<AssumptionCacheTracker>().getAssumptionCache(
4264 MF->getFunction());
4265 } else {
4266 AA = nullptr;
4267 FuncInfo.BPI = nullptr;
4268 AC = nullptr;
4269 }
4270 LibInfo = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F);
4271 Libcalls = &getAnalysis<LibcallLoweringInfoWrapper>().getLibcallLowering(
4272 *F.getParent(), Subtarget);
4273
4274 FuncInfo.CanLowerReturn = CLI->checkReturnTypeForCallConv(*MF);
4275
4276 SL = std::make_unique<GISelSwitchLowering>(this, FuncInfo);
4277 SL->init(*TLI, TM, *DL);
4278
4279 assert(PendingPHIs.empty() && "stale PHIs");
4280
4281 // Targets which want to use big endian can enable it using
4282 // enableBigEndian()
4283 if (!DL->isLittleEndian() && !CLI->enableBigEndian()) {
4284 // Currently we don't properly handle big endian code.
4285 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4286 F.getSubprogram(), &F.getEntryBlock());
4287 R << "unable to translate in big endian mode";
4288 reportTranslationError(*MF, *ORE, R);
4289 return false;
4290 }
4291
4292 // Release the per-function state when we return, whether we succeeded or not.
4293 llvm::scope_exit FinalizeOnReturn([this]() { finalizeFunction(); });
4294
4295 // Setup a separate basic-block for the arguments and constants
4296 MachineBasicBlock *EntryBB = MF->CreateMachineBasicBlock();
4297 MF->push_back(EntryBB);
4298 EntryBuilder->setMBB(*EntryBB);
4299
4300 DebugLoc DbgLoc = F.getEntryBlock().getFirstNonPHIIt()->getDebugLoc();
4301 SwiftError.setFunction(CurMF);
4302 SwiftError.createEntriesInEntryBlock(DbgLoc);
4303
4304 bool IsVarArg = F.isVarArg();
4305 bool HasMustTailInVarArgFn = false;
4306
4307 // Create all blocks, in IR order, to preserve the layout.
4308 FuncInfo.MBBMap.resize(F.getMaxBlockNumber());
4309 for (const BasicBlock &BB: F) {
4310 auto *&MBB = FuncInfo.MBBMap[BB.getNumber()];
4311
4312 MBB = MF->CreateMachineBasicBlock(&BB);
4313 MF->push_back(MBB);
4314
4315 // Only mark the block if the BlockAddress actually has users. The
4316 // hasAddressTaken flag may be stale if the BlockAddress was optimized away
4317 // but the constant still exists in the uniquing table.
4318 if (BB.hasAddressTaken()) {
4319 if (BlockAddress *BA = BlockAddress::lookup(&BB))
4320 if (!BA->hasZeroLiveUses())
4321 MBB->setAddressTakenIRBlock(const_cast<BasicBlock *>(&BB));
4322 }
4323
4324 if (!HasMustTailInVarArgFn)
4325 HasMustTailInVarArgFn = checkForMustTailInVarArgFn(IsVarArg, BB);
4326 }
4327
4328 MF->getFrameInfo().setHasMustTailInVarArgFunc(HasMustTailInVarArgFn);
4329
4330 // Make our arguments/constants entry block fallthrough to the IR entry block.
4331 EntryBB->addSuccessor(&getMBB(F.front()));
4332
4333 // Lower the actual args into this basic block.
4334 SmallVector<ArrayRef<Register>, 8> VRegArgs;
4335 for (const Argument &Arg: F.args()) {
4336 if (DL->getTypeStoreSize(Arg.getType()).isZero())
4337 continue; // Don't handle zero sized types.
4338 ArrayRef<Register> VRegs = getOrCreateVRegs(Arg);
4339 VRegArgs.push_back(VRegs);
4340
4341 if (CLI->supportSwiftError() && Arg.hasSwiftErrorAttr()) {
4342 assert(VRegs.size() == 1 && "Too many vregs for Swift error");
4343 SwiftError.setCurrentVReg(EntryBB, SwiftError.getFunctionArg(), VRegs[0]);
4344 }
4345 }
4346
4347 if (!CLI->lowerFormalArguments(*EntryBuilder, F, VRegArgs, FuncInfo)) {
4348 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4349 F.getSubprogram(), &F.getEntryBlock());
4350 R << "unable to lower arguments: "
4351 << ore::NV("Prototype", F.getFunctionType());
4352 reportTranslationError(*MF, *ORE, R);
4353 return false;
4354 }
4355
4356 // Need to visit defs before uses when translating instructions.
4357 GISelObserverWrapper WrapperObserver;
4358 if (EnableCSE && CSEInfo)
4359 WrapperObserver.addObserver(CSEInfo);
4360 {
4362#ifndef NDEBUG
4363 DILocationVerifier Verifier;
4364 WrapperObserver.addObserver(&Verifier);
4365#endif // ifndef NDEBUG
4366 RAIIMFObsDelInstaller ObsInstall(*MF, WrapperObserver);
4367 for (const BasicBlock *BB : RPOT) {
4368 MachineBasicBlock &MBB = getMBB(*BB);
4369 // Set the insertion point of all the following translations to
4370 // the end of this basic block.
4371 CurBuilder->setMBB(MBB);
4372 HasTailCall = false;
4373 for (const Instruction &Inst : *BB) {
4374 // If we translated a tail call in the last step, then we know
4375 // everything after the call is either a return, or something that is
4376 // handled by the call itself. (E.g. a lifetime marker or assume
4377 // intrinsic.) In this case, we should stop translating the block and
4378 // move on.
4379 if (HasTailCall)
4380 break;
4381#ifndef NDEBUG
4382 Verifier.setCurrentInst(&Inst);
4383#endif // ifndef NDEBUG
4384
4385 // Translate any debug-info attached to the instruction.
4386 translateDbgInfo(Inst, *CurBuilder);
4387
4388 if (translate(Inst))
4389 continue;
4390
4391 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4392 Inst.getDebugLoc(), BB);
4393 R << "unable to translate instruction: " << ore::NV("Opcode", &Inst);
4394
4395 if (ORE->allowExtraAnalysis("gisel-irtranslator")) {
4396 std::string InstStrStorage;
4397 raw_string_ostream InstStr(InstStrStorage);
4398 InstStr << Inst;
4399
4400 R << ": '" << InstStrStorage << "'";
4401 }
4402
4403 reportTranslationError(*MF, *ORE, R);
4404 return false;
4405 }
4406
4407 if (!finalizeBasicBlock(*BB, MBB)) {
4408 OptimizationRemarkMissed R("gisel-irtranslator", "GISelFailure",
4409 BB->getTerminator()->getDebugLoc(), BB);
4410 R << "unable to translate basic block";
4411 reportTranslationError(*MF, *ORE, R);
4412 return false;
4413 }
4414 }
4415#ifndef NDEBUG
4416 WrapperObserver.removeObserver(&Verifier);
4417#endif
4418 }
4419
4420 finishPendingPhis();
4421
4422 SwiftError.propagateVRegs();
4423
4424 // Merge the argument lowering and constants block with its single
4425 // successor, the LLVM-IR entry block. We want the basic block to
4426 // be maximal.
4427 assert(EntryBB->succ_size() == 1 &&
4428 "Custom BB used for lowering should have only one successor");
4429 // Get the successor of the current entry block.
4430 MachineBasicBlock &NewEntryBB = **EntryBB->succ_begin();
4431 assert(NewEntryBB.pred_size() == 1 &&
4432 "LLVM-IR entry block has a predecessor!?");
4433 // Move all the instruction from the current entry block to the
4434 // new entry block.
4435 NewEntryBB.splice(NewEntryBB.begin(), EntryBB, EntryBB->begin(),
4436 EntryBB->end());
4437
4438 // Update the live-in information for the new entry block.
4439 for (const MachineBasicBlock::RegisterMaskPair &LiveIn : EntryBB->liveins())
4440 NewEntryBB.addLiveIn(LiveIn);
4441 NewEntryBB.sortUniqueLiveIns();
4442
4443 // Get rid of the now empty basic block.
4444 EntryBB->removeSuccessor(&NewEntryBB);
4445 MF->remove(EntryBB);
4446 MF->deleteMachineBasicBlock(EntryBB);
4447
4448 assert(&MF->front() == &NewEntryBB &&
4449 "New entry wasn't next in the list of basic block!");
4450
4451 // Initialize stack protector information.
4453 SP.copyToMachineFrameInfo(MF->getFrameInfo());
4454
4455 return false;
4456}
#define Success
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
amdgpu aa AMDGPU Address space based Alias Analysis Wrapper
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
Provides analysis for continuously CSEing during GISel passes.
This file implements a version of MachineIRBuilder which CSEs insts within a MachineBasicBlock.
This file describes how to lower LLVM calls to machine code calls.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
dxil translate DXIL Translate Metadata
This contains common code to allow clients to notify changes to machine instr.
#define DEBUG_TYPE
const HexagonInstrInfo * TII
static bool checkForMustTailInVarArgFn(bool IsVarArg, const BasicBlock &BB)
Returns true if a BasicBlock BB within a variadic function contains a variadic musttail call.
static unsigned getConvOpcode(Intrinsic::ID ID)
static uint64_t getOffsetFromIndices(const User &U, const DataLayout &DL)
static unsigned getConstrainedOpcode(Intrinsic::ID ID)
IRTranslator LLVM IR MI
IRTranslator LLVM IR static false void reportTranslationError(MachineFunction &MF, OptimizationRemarkEmitter &ORE, OptimizationRemarkMissed &R)
static cl::opt< bool > EnableCSEInIRTranslator("enable-cse-in-irtranslator", cl::desc("Should enable CSE in irtranslator"), cl::Optional, cl::init(false))
static bool isValInBlock(const Value *V, const BasicBlock *BB)
static bool isSwiftError(const Value *V)
This file declares the IRTranslator pass.
This file provides various utilities for inspecting and working with the control flow graph in LLVM I...
This file describes how to lower LLVM inline asm to machine code INLINEASM.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
static LVOptions Options
Definition LVOptions.cpp:25
Implement a low-level type suitable for MachineInstr level instruction selection.
Implement a low-level type suitable for MachineInstr level instruction selection.
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
Machine Check Debug Module
This file declares the MachineIRBuilder class.
Register Reg
Register const TargetRegisterInfo * TRI
Promote Memory to Register
Definition Mem2Reg.cpp:110
This file contains the declarations for metadata subclasses.
Type::TypeID TypeID
uint64_t High
OptimizedStructLayoutField Field
if(PassOpts->AAPipeline)
#define INITIALIZE_PASS_DEPENDENCY(depName)
Definition PassSupport.h:42
#define INITIALIZE_PASS_END(passName, arg, name, cfg, analysis)
Definition PassSupport.h:44
#define INITIALIZE_PASS_BEGIN(passName, arg, name, cfg, analysis)
Definition PassSupport.h:39
This file builds on the ADT/GraphTraits.h file to build a generic graph post order iterator.
const SmallVectorImpl< MachineOperand > MachineBasicBlock * TBB
const SmallVectorImpl< MachineOperand > & Cond
std::pair< BasicBlock *, BasicBlock * > Edge
This file contains some templates that are useful if you are working with the STL at all.
verify safepoint Safepoint IR Verifier
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file defines the SmallVector class.
#define LLVM_DEBUG(...)
Definition Debug.h:119
This file describes how to lower LLVM code to machine code.
Target-Independent Code Generator Pass Configuration Options pass.
Value * RHS
Value * LHS
A wrapper pass to provide the legacy pass manager access to a suitably prepared AAResults object.
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1076
an instruction to allocate memory on the stack
bool isSwiftError() const
Return true if this alloca is used as a swifterror argument to a call.
LLVM_ABI bool isStaticAlloca() const
Return true if this alloca is in the entry block of the function and is a constant size.
Align getAlign() const
Return the alignment of the memory that is being allocated by the instruction.
PointerType * getType() const
Overload to return most specific pointer type.
Type * getAllocatedType() const
Return the type that is being allocated by the instruction.
LLVM_ABI std::optional< TypeSize > getAllocationSize(const DataLayout &DL) const
Get allocation size in bytes.
const Value * getArraySize() const
Get the number of elements allocated.
Represent the analysis usage information of a pass.
AnalysisUsage & addRequired()
AnalysisUsage & addPreserved()
Add the specified Pass class to the set of analyses preserved by this pass.
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
iterator end() const
Definition ArrayRef.h:130
size_t size() const
Get the array size.
Definition ArrayRef.h:141
iterator begin() const
Definition ArrayRef.h:129
bool empty() const
Check if the array is empty.
Definition ArrayRef.h:136
An immutable pass that tracks lazily created AssumptionCache objects.
@ Add
*p = old + v
@ FAdd
*p = old + v
@ USubCond
Subtract only if no unsigned overflow.
@ FMinimum
*p = minimum(old, v) minimum matches the behavior of llvm.minimum.
@ Min
*p = old <signed v ? old : v
@ Sub
*p = old - v
@ And
*p = old & v
@ Xor
*p = old ^ v
@ USubSat
*p = usub.sat(old, v) usub.sat matches the behavior of llvm.usub.sat.
@ FMaximum
*p = maximum(old, v) maximum matches the behavior of llvm.maximum.
@ FSub
*p = old - v
@ UIncWrap
Increment one up to a maximum value.
@ Max
*p = old >signed v ? old : v
@ UMin
*p = old <unsigned v ? old : v
@ FMin
*p = minnum(old, v) minnum matches the behavior of llvm.minnum.
@ UMax
*p = old >unsigned v ? old : v
@ FMaximumNum
*p = maximumnum(old, v) maximumnum matches the behavior of llvm.maximumnum.
@ FMax
*p = maxnum(old, v) maxnum matches the behavior of llvm.maxnum.
@ UDecWrap
Decrement one until a minimum value or zero.
@ FMinimumNum
*p = minimumnum(old, v) minimumnum matches the behavior of llvm.minimumnum.
@ Nand
*p = ~(old & v)
LLVM Basic Block Representation.
Definition BasicBlock.h:62
unsigned getNumber() const
Definition BasicBlock.h:95
const Function * getParent() const
Return the enclosing method, or null if none.
Definition BasicBlock.h:213
bool hasAddressTaken() const
Returns true if there are any uses of this basic block other than direct branches,...
Definition BasicBlock.h:687
LLVM_ABI InstListType::const_iterator getFirstNonPHIIt() const
Returns an iterator to the first instruction in this block that is not a PHINode instruction.
InstListType::const_iterator const_iterator
Definition BasicBlock.h:171
LLVM_ABI InstListType::const_iterator getFirstNonPHIOrDbg(bool SkipPseudoOp=true) const
Returns a pointer to the first instruction in this block that is not a PHINode or a debug intrinsic,...
LLVM_ABI const Module * getModule() const
Return the module owning the function this basic block belongs to, or nullptr if the function does no...
The address of a basic block.
Definition Constants.h:1082
static LLVM_ABI BlockAddress * lookup(const BasicBlock *BB)
Lookup an existing BlockAddress constant for the given BasicBlock.
Legacy analysis pass which computes BlockFrequencyInfo.
Legacy analysis pass which computes BranchProbabilityInfo.
LLVM_ABI BranchProbability getEdgeProbability(const BasicBlock *Src, unsigned IndexInSuccessors) const
Get an edge's probability, relative to other out-edges of the Src.
static BranchProbability getOne()
static BranchProbability getZero()
static void normalizeProbabilities(ProbabilityIter Begin, ProbabilityIter End)
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
bool isInlineAsm() const
Check if this call is an inline asm statement.
std::optional< OperandBundleUse > getOperandBundle(StringRef Name) const
Return an operand bundle by name, if present.
Function * getCalledFunction() const
Returns the function called, or null if this is an indirect function invocation or the function signa...
LLVM_ABI bool paramHasAttr(unsigned ArgNo, Attribute::AttrKind Kind) const
Determine whether the argument or parameter has the given attribute.
User::op_iterator arg_begin()
Return the iterator pointing to the beginning of the argument list.
unsigned countOperandBundlesOfType(StringRef Name) const
Return the number of operand bundles with the tag Name attached to this instruction.
Value * getCalledOperand() const
Value * getArgOperand(unsigned i) const
User::op_iterator arg_end()
Return the iterator pointing to the end of the argument list.
bool isConvergent() const
Determine if the invoke is convergent.
LLVM_ABI Intrinsic::ID getIntrinsicID() const
Returns the intrinsic ID of the intrinsic called or Intrinsic::not_intrinsic if the called function i...
iterator_range< User::op_iterator > args()
Iteration adapter for range-for loops.
unsigned arg_size() const
AttributeList getAttributes() const
Return the attributes for this call.
This class represents a function call, abstracting a target machine's calling convention.
bool isTailCall() const
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
@ FCMP_TRUE
1 1 1 1 Always true (always folded)
Definition InstrTypes.h:757
@ ICMP_SLT
signed less than
Definition InstrTypes.h:769
@ ICMP_SLE
signed less or equal
Definition InstrTypes.h:770
@ ICMP_UGT
unsigned greater than
Definition InstrTypes.h:763
@ ICMP_NE
not equal
Definition InstrTypes.h:762
@ ICMP_ULE
unsigned less or equal
Definition InstrTypes.h:766
@ FCMP_FALSE
0 0 0 0 Always false (always folded)
Definition InstrTypes.h:742
bool isFPPredicate() const
Definition InstrTypes.h:845
bool isIntPredicate() const
Definition InstrTypes.h:846
Value * getCondition() const
BasicBlock * getSuccessor(unsigned i) const
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
bool isZero() const
This is just a convenience method to make client code smaller for a common code.
Definition Constants.h:219
unsigned getBitWidth() const
getBitWidth - Return the scalar bitwidth of this constant.
Definition Constants.h:162
uint64_t getZExtValue() const
Return the constant as a 64-bit unsigned integer value after it has been zero extended as appropriate...
Definition Constants.h:168
const APInt & getValue() const
Return the constant as an APInt value reference.
Definition Constants.h:159
This is an important base class in LLVM.
Definition Constant.h:43
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI unsigned getNonMetadataArgCount() const
DWARF expression.
LLVM_ABI bool isEntryValue() const
Check if the expression consists of exactly one entry value operand.
static LLVM_ABI DIExpression * append(const DIExpression *Expr, ArrayRef< uint64_t > Ops)
Append the opcodes Ops to DIExpr.
LLVM_ABI bool startsWithDeref() const
Return whether the first element a DW_OP_deref.
ArrayRef< uint64_t > getElements() const
bool isValidLocationForIntrinsic(const DILocation *DL) const
Check that a location is valid for this label.
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
Value * getAddress() const
DILabel * getLabel() const
DebugLoc getDebugLoc() const
Value * getValue(unsigned OpIdx=0) const
DILocalVariable * getVariable() const
DIExpression * getExpression() const
LLVM_ABI Value * getVariableLocationOp(unsigned OpIdx) const
DIExpression * getExpression() const
DILocalVariable * getVariable() const
A debug info location.
Definition DebugLoc.h:124
Class representing an expression and its matching format.
This instruction extracts a struct member or array element value from an aggregate value.
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:869
bool skipFunction(const Function &F) const
Optional passes call this function to check whether the pass should be skipped.
Definition Pass.cpp:188
const BasicBlock & getEntryBlock() const
Definition Function.h:809
DISubprogram * getSubprogram() const
Get the attached subprogram.
bool hasMinSize() const
Optimize this function for minimum size (-Oz).
Definition Function.h:711
Constant * getPersonalityFn() const
Get the personality function associated with this function.
const Function & getFunction() const
Definition Function.h:166
bool isIntrinsic() const
isIntrinsic - Returns true if the function's name starts with "llvm.".
Definition Function.h:251
The actual analysis pass wrapper.
Definition CSEInfo.h:242
Simple wrapper that does the following.
Definition CSEInfo.h:212
The CSE Analysis object.
Definition CSEInfo.h:72
Abstract class that contains various methods for clients to notify about changes.
Simple wrapper observer that takes several observers, and calls each one for each event.
void removeObserver(GISelChangeObserver *O)
void addObserver(GISelChangeObserver *O)
static StringRef dropLLVMManglingEscape(StringRef Name)
If the given string begins with the GlobalValue name mangling escape character '\1',...
bool hasExternalWeakLinkage() const
bool hasDLLImportStorageClass() const
Module * getParent()
Get the module that this global value is contained inside of...
bool isTailCall(const MachineInstr &MI) const override
bool runOnMachineFunction(MachineFunction &MF) override
runOnMachineFunction - This method must be overloaded to perform the desired machine code transformat...
IRTranslator(CodeGenOptLevel OptLevel=CodeGenOptLevel::None)
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - This function should be overriden by passes that need analysis information to do t...
bool lowerInlineAsm(MachineIRBuilder &MIRBuilder, const CallBase &CB, std::function< ArrayRef< Register >(const Value &Val)> GetOrCreateVRegs) const
Lower the given inline asm call instruction GetOrCreateVRegs is a callback to materialize a register ...
This instruction inserts a struct field of array element value into an aggregate value.
iterator_range< simple_ilist< DbgRecord >::iterator > getDbgRecordRange() const
Return a range over the DbgRecords attached to this instruction.
const DebugLoc & getDebugLoc() const
Return the debug location for this node as a DebugLoc.
LLVM_ABI const Module * getModule() const
Return the module owning the function this instruction belongs to or nullptr it the function does not...
MDNode * getMetadata(unsigned KindID) const
Get the metadata of given kind attached to this Instruction.
LLVM_ABI AAMDNodes getAAMetadata() const
Returns the AA metadata for this instruction.
unsigned getOpcode() const
Returns a member of one of the enums like Instruction::Add.
LLVM_ABI bool hasAllowReassoc() const LLVM_READONLY
Determine whether the allow-reassociation flag is set.
Intrinsic::ID getIntrinsicID() const
Return the intrinsic ID of this intrinsic.
static bool getUseExtended()
constexpr LLT changeElementType(LLT NewEltTy) const
If this type is a vector, return a vector with the same number of elements but the new element type.
static constexpr LLT scalar(unsigned SizeInBits)
Get a low-level scalar or aggregate "bag of bits".
constexpr uint16_t getNumElements() const
Returns the number of elements in a vector LLT.
constexpr bool isVector() const
static constexpr LLT pointer(unsigned AddressSpace, unsigned SizeInBits)
Get a low-level pointer in the given address space.
constexpr TypeSize getSizeInBits() const
Returns the total size of the type. Must only be called on sized types.
constexpr bool isPointer() const
static constexpr LLT fixed_vector(unsigned NumElements, unsigned ScalarSizeInBits)
Get a low-level fixed-width vector of some number of elements and element width.
constexpr bool isFixedVector() const
Returns true if the LLT is a fixed vector.
static LLT integer(unsigned SizeInBits)
LLT changeElementSize(unsigned NewEltSize) const
If this type is a vector, return a vector with the same number of elements but the new element size.
LLVM_ABI void diagnose(const DiagnosticInfo &DI)
Report a message to the currently installed diagnostic handler.
Value * getPointerOperand()
AtomicOrdering getOrdering() const
Returns the ordering constraint of this load instruction.
SyncScope::ID getSyncScopeID() const
Returns the synchronization scope ID of this load instruction.
static LocationSize precise(uint64_t Value)
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition Metadata.h:1567
void normalizeSuccProbs()
Normalize probabilities of all successors so that the sum of them becomes one.
LLVM_ABI instr_iterator insert(instr_iterator I, MachineInstr *M)
Insert MI into the instruction list before I, possibly inside a bundle.
void push_back(MachineInstr *MI)
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
LLVM_ABI void setSuccProbability(succ_iterator I, BranchProbability Prob)
Set successor probability of a given iterator.
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
SmallVectorImpl< MachineBasicBlock * >::iterator succ_iterator
LLVM_ABI void sortUniqueLiveIns()
Sorts and uniques the LiveIns vector.
LLVM_ABI bool isPredecessor(const MachineBasicBlock *MBB) const
Return true if the specified MBB is a predecessor of this block.
void addLiveIn(MCRegister PhysReg, LaneBitmask LaneMask=LaneBitmask::getAll())
Adds the specified register as a live in.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
void setIsEHPad(bool V=true)
Indicates the block is a landing pad.
int getStackProtectorIndex() const
Return the index for the stack protector object.
void getAnalysisUsage(AnalysisUsage &AU) const override
getAnalysisUsage - Subclasses that override getAnalysisUsage must call this.
MachineFrameInfo & getFrameInfo()
getFrameInfo - Return the frame info object for the current function.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
MachineBasicBlock * CreateMachineBasicBlock(const BasicBlock *BB=nullptr, std::optional< UniqueBBID > BBID=std::nullopt)
CreateMachineInstr - Allocate a new MachineInstr.
void insert(iterator MBBI, MachineBasicBlock *MBB)
Helper class to build MachineInstr.
MachineInstrBuilder buildFPTOUI_SAT(const DstOp &Dst, const SrcOp &Src0)
Build and insert Res = G_FPTOUI_SAT Src0.
MachineInstrBuilder buildFMul(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineInstrBuilder buildFreeze(const DstOp &Dst, const SrcOp &Src)
Build and insert Dst = G_FREEZE Src.
MachineInstrBuilder buildBr(MachineBasicBlock &Dest)
Build and insert G_BR Dest.
MachineInstrBuilder buildModf(const DstOp &Fract, const DstOp &Int, const SrcOp &Src, std::optional< unsigned > Flags=std::nullopt)
Build and insert Fract, Int = G_FMODF Src.
LLVMContext & getContext() const
MachineInstrBuilder buildAdd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_ADD Op0, Op1.
MachineInstrBuilder buildUndef(const DstOp &Res)
Build and insert Res = IMPLICIT_DEF.
MachineInstrBuilder buildResetFPMode()
Build and insert G_RESET_FPMODE.
MachineInstrBuilder buildFPTOSI_SAT(const DstOp &Dst, const SrcOp &Src0)
Build and insert Res = G_FPTOSI_SAT Src0.
MachineInstrBuilder buildUCmp(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1)
Build and insert a Res = G_UCMP Op0, Op1.
MachineInstrBuilder buildJumpTable(const LLT PtrTy, unsigned JTI)
Build and insert Res = G_JUMP_TABLE JTI.
MachineInstrBuilder buildGetRounding(const DstOp &Dst)
Build and insert Dst = G_GET_ROUNDING.
MachineInstrBuilder buildSCmp(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1)
Build and insert a Res = G_SCMP Op0, Op1.
MachineInstrBuilder buildFence(unsigned Ordering, unsigned Scope)
Build and insert G_FENCE Ordering, Scope.
MachineInstrBuilder buildSelect(const DstOp &Res, const SrcOp &Tst, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_SELECT Tst, Op0, Op1.
MachineInstrBuilder buildFMA(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, const SrcOp &Src2, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_FMA Op0, Op1, Op2.
MachineInstrBuilder buildMul(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_MUL Op0, Op1.
MachineInstrBuilder buildInsertSubvector(const DstOp &Res, const SrcOp &Src0, const SrcOp &Src1, unsigned Index)
Build and insert Res = G_INSERT_SUBVECTOR Src0, Src1, Idx.
MachineInstrBuilder buildAnd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1)
Build and insert Res = G_AND Op0, Op1.
MachineInstrBuilder buildCast(const DstOp &Dst, const SrcOp &Src)
Build and insert an appropriate cast between two registers of equal size.
MachineInstrBuilder buildICmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_ICMP Pred, Op0, Op1.
MachineBasicBlock::iterator getInsertPt()
Current insertion point for new instructions.
MachineInstrBuilder buildSExtOrTrunc(const DstOp &Res, const SrcOp &Op)
Build and insert Res = G_SEXT Op, Res = G_TRUNC Op, or Res = COPY Op depending on the differing sizes...
MachineInstrBuilder buildAtomicRMW(unsigned Opcode, const DstOp &OldValRes, const SrcOp &Addr, const SrcOp &Val, MachineMemOperand &MMO)
Build and insert OldValRes<def> = G_ATOMICRMW_<Opcode> Addr, Val, MMO.
MachineInstrBuilder buildSub(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_SUB Op0, Op1.
MachineInstrBuilder buildIntrinsic(Intrinsic::ID ID, ArrayRef< Register > Res, bool HasSideEffects, bool isConvergent)
Build and insert a G_INTRINSIC instruction.
MachineInstrBuilder buildVScale(const DstOp &Res, unsigned MinElts)
Build and insert Res = G_VSCALE MinElts.
MachineInstrBuilder buildSplatBuildVector(const DstOp &Res, const SrcOp &Src)
Build and insert Res = G_BUILD_VECTOR with Src replicated to fill the number of elements.
MachineInstrBuilder buildSetFPMode(const SrcOp &Src)
Build and insert G_SET_FPMODE Src.
MachineInstrBuilder buildIndirectDbgValue(Register Reg, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instruction expressing the fact that the associated Variable lives in me...
MachineInstrBuilder buildBuildVector(const DstOp &Res, ArrayRef< Register > Ops)
Build and insert Res = G_BUILD_VECTOR Op0, ...
MachineInstrBuilder buildConstDbgValue(const Constant &C, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instructions specifying that Variable is given by C (suitably modified b...
MachineInstrBuilder buildBrCond(const SrcOp &Tst, MachineBasicBlock &Dest)
Build and insert G_BRCOND Tst, Dest.
std::optional< MachineInstrBuilder > materializeObjectPtrOffset(Register &Res, Register Op0, const LLT ValueTy, uint64_t Value)
Materialize and insert an instruction with appropriate flags for addressing some offset of an object,...
MachineInstrBuilder buildSetRounding(const SrcOp &Src)
Build and insert G_SET_ROUNDING.
MachineInstrBuilder buildExtractVectorElement(const DstOp &Res, const SrcOp &Val, const SrcOp &Idx)
Build and insert Res = G_EXTRACT_VECTOR_ELT Val, Idx.
MachineInstrBuilder buildLoad(const DstOp &Res, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert Res = G_LOAD Addr, MMO.
MachineInstrBuilder buildPtrAdd(const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_PTR_ADD Op0, Op1.
MachineInstrBuilder buildZExtOrTrunc(const DstOp &Res, const SrcOp &Op)
Build and insert Res = G_ZEXT Op, Res = G_TRUNC Op, or Res = COPY Op depending on the differing sizes...
MachineInstrBuilder buildExtractVectorElementConstant(const DstOp &Res, const SrcOp &Val, const int Idx)
Build and insert Res = G_EXTRACT_VECTOR_ELT Val, Idx.
MachineInstrBuilder buildShl(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
MachineInstrBuilder buildStore(const SrcOp &Val, const SrcOp &Addr, MachineMemOperand &MMO)
Build and insert G_STORE Val, Addr, MMO.
MachineInstrBuilder buildInstr(unsigned Opcode)
Build and insert <empty> = Opcode <empty>.
MachineInstrBuilder buildFrameIndex(const DstOp &Res, int Idx)
Build and insert Res = G_FRAME_INDEX Idx.
MachineInstrBuilder buildDirectDbgValue(Register Reg, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instruction expressing the fact that the associated Variable lives in Re...
MachineInstrBuilder buildDbgLabel(const MDNode *Label)
Build and insert a DBG_LABEL instructions specifying that Label is given.
MachineInstrBuilder buildBrJT(Register TablePtr, unsigned JTI, Register IndexReg)
Build and insert G_BRJT TablePtr, JTI, IndexReg.
MachineInstrBuilder buildDynStackAlloc(const DstOp &Res, const SrcOp &Size, Align Alignment)
Build and insert Res = G_DYN_STACKALLOC Size, Align.
MachineInstrBuilder buildFIDbgValue(int FI, const MDNode *Variable, const MDNode *Expr)
Build and insert a DBG_VALUE instruction expressing the fact that the associated Variable lives in th...
MachineInstrBuilder buildResetFPEnv()
Build and insert G_RESET_FPENV.
void setDebugLoc(const DebugLoc &DL)
Set the debug location to DL for all the next build instructions.
const MachineBasicBlock & getMBB() const
Getter for the basic block we currently build.
MachineInstrBuilder buildInsertVectorElement(const DstOp &Res, const SrcOp &Val, const SrcOp &Elt, const SrcOp &Idx)
Build and insert Res = G_INSERT_VECTOR_ELT Val, Elt, Idx.
MachineInstrBuilder buildAtomicCmpXchgWithSuccess(const DstOp &OldValRes, const DstOp &SuccessRes, const SrcOp &Addr, const SrcOp &CmpVal, const SrcOp &NewVal, MachineMemOperand &MMO)
Build and insert OldValRes<def>, SuccessRes<def> = / G_ATOMIC_CMPXCHG_WITH_SUCCESS Addr,...
void setMBB(MachineBasicBlock &MBB)
Set the insertion point to the end of MBB.
const DebugLoc & getDebugLoc()
Get the current instruction's debug location.
MachineInstrBuilder buildTrap(bool Debug=false)
Build and insert G_TRAP or G_DEBUGTRAP.
MachineInstrBuilder buildFFrexp(const DstOp &Fract, const DstOp &Exp, const SrcOp &Src, std::optional< unsigned > Flags=std::nullopt)
Build and insert Fract, Exp = G_FFREXP Src.
MachineInstrBuilder buildFSincos(const DstOp &Sin, const DstOp &Cos, const SrcOp &Src, std::optional< unsigned > Flags=std::nullopt)
Build and insert Sin, Cos = G_FSINCOS Src.
MachineInstrBuilder buildShuffleVector(const DstOp &Res, const SrcOp &Src1, const SrcOp &Src2, ArrayRef< int > Mask)
Build and insert Res = G_SHUFFLE_VECTOR Src1, Src2, Mask.
MachineInstrBuilder buildInstrNoInsert(unsigned Opcode)
Build but don't insert <empty> = Opcode <empty>.
MachineInstrBuilder buildCopy(const DstOp &Res, const SrcOp &Op)
Build and insert Res = COPY Op.
MachineInstrBuilder buildPrefetch(const SrcOp &Addr, unsigned RW, unsigned Locality, unsigned CacheType, MachineMemOperand &MMO)
Build and insert G_PREFETCH Addr, RW, Locality, CacheType.
MachineInstrBuilder buildExtractSubvector(const DstOp &Res, const SrcOp &Src, unsigned Index)
Build and insert Res = G_EXTRACT_SUBVECTOR Src, Idx0.
const DataLayout & getDataLayout() const
MachineInstrBuilder buildBrIndirect(Register Tgt)
Build and insert G_BRINDIRECT Tgt.
MachineInstrBuilder buildSplatVector(const DstOp &Res, const SrcOp &Val)
Build and insert Res = G_SPLAT_VECTOR Val.
MachineInstrBuilder buildStepVector(const DstOp &Res, unsigned Step)
Build and insert Res = G_STEP_VECTOR Step.
virtual MachineInstrBuilder buildConstant(const DstOp &Res, const ConstantInt &Val)
Build and insert Res = G_CONSTANT Val.
MachineInstrBuilder buildFCmp(CmpInst::Predicate Pred, const DstOp &Res, const SrcOp &Op0, const SrcOp &Op1, std::optional< unsigned > Flags=std::nullopt)
Build and insert a Res = G_FCMP PredOp0, Op1.
MachineInstrBuilder buildFAdd(const DstOp &Dst, const SrcOp &Src0, const SrcOp &Src1, std::optional< unsigned > Flags=std::nullopt)
Build and insert Res = G_FADD Op0, Op1.
MachineInstrBuilder buildSetFPEnv(const SrcOp &Src)
Build and insert G_SET_FPENV Src.
Register getReg(unsigned Idx) const
Get the register for the operand index.
const MachineInstrBuilder & addExternalSymbol(const char *FnName, unsigned TargetFlags=0) const
const MachineInstrBuilder & addUse(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register use operand.
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & addMetadata(const MDNode *MD) const
const MachineInstrBuilder & addSym(MCSymbol *Sym, unsigned char TargetFlags=0) const
const MachineInstrBuilder & addFrameIndex(int Idx) const
const MachineInstrBuilder & addFPImm(const ConstantFP *Val) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
const MachineInstrBuilder & addDef(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a virtual register definition operand.
const MachineInstrBuilder & addMemOperand(MachineMemOperand *MMO) const
MachineInstr * getInstr() const
If conversion operators fail, use this method to get the MachineInstr explicitly.
LLVM_ABI void copyIRFlags(const Instruction &I)
Copy all flags to MachineInst MIFlags.
static LLVM_ABI uint32_t copyFlagsFromInstruction(const Instruction &I)
LLVM_ABI void setDeactivationSymbol(MachineFunction &MF, Value *DS)
void setDebugLoc(DebugLoc DL)
Replace current source information with new such.
Flags
Flags values. These may be or'd together.
@ MOVolatile
The memory access is volatile.
@ MODereferenceable
The memory access is dereferenceable (i.e., doesn't trap).
@ MOLoad
The memory access reads data.
@ MOInvariant
The memory access always returns the same value (or traps).
@ MOStore
The memory access writes data.
static MachineOperand CreateES(const char *SymName, unsigned TargetFlags=0)
static MachineOperand CreateGA(const GlobalValue *GV, int64_t Offset, unsigned TargetFlags=0)
LLVM_ABI Register createGenericVirtualRegister(LLT Ty, StringRef Name="")
Create and return a new generic virtual register with low-level type Ty.
The optimization diagnostic interface.
Diagnostic information for missed-optimization remarks.
BasicBlock * getIncomingBlock(unsigned i) const
Return incoming basic block number i.
Value * getIncomingValue(unsigned i) const
Return incoming value number x.
unsigned getNumIncomingValues() const
Return the number of incoming edges.
AnalysisType & getAnalysis() const
getAnalysis<AnalysisType>() - This function is used by subclasses to get to the analysis information ...
static PointerType * getUnqual(Type *ElementType)
This constructs a pointer to an object of the specified type in the default address space (address sp...
Class to install both of the above.
Wrapper class representing virtual and physical registers.
Definition Register.h:20
Value * getReturnValue() const
Convenience accessor. Returns null if there is no return value.
size_type count(ConstPtrType Ptr) const
count - Return 1 if the specified pointer is in the set, 0 otherwise.
std::pair< iterator, bool > insert(PtrType Ptr)
Inserts Ptr if and only if there is no element in the container equal to Ptr.
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Encapsulates all of the information needed to generate a stack protector check, and signals to isel w...
MachineBasicBlock * getSuccessMBB()
MachineBasicBlock * getFailureMBB()
constexpr bool empty() const
Check if the string is empty.
Definition StringRef.h:141
constexpr const char * data() const
Get a pointer to the start of the string (which may not be null terminated).
Definition StringRef.h:138
Primary interface to the complete machine description for the target machine.
const Triple & getTargetTriple() const
TargetOptions Options
const Target & getTarget() const
void resetTargetOptions(const Function &F) const
Reset the target options based on the function's attributes.
unsigned NoTrapAfterNoreturn
Do not emit a trap instruction for 'unreachable' IR instructions behind noreturn calls,...
unsigned TrapUnreachable
Emit target-specific trap instruction for 'unreachable' IR instructions.
FPOpFusion::FPOpFusionMode AllowFPOpFusion
AllowFPOpFusion - This flag is set by the -fp-contract=xxx option.
Target-Independent Code Generator Pass Configuration Options.
TargetSubtargetInfo - Generic base class for all target subtargets.
virtual const CallLowering * getCallLowering() const
virtual const TargetLowering * getTargetLowering() const
bool isSPIRV() const
Tests whether the target is SPIR-V (32/64-bit/Logical).
Definition Triple.h:891
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
static constexpr TypeSize getZero()
Definition TypeSize.h:349
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
LLVM_ABI bool isEmptyTy() const
Return true if this type is empty, that is, it has no elements or all of its elements are empty.
Definition Type.cpp:180
bool isByteTy() const
True if this is an instance of ByteType.
Definition Type.h:242
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:309
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:282
static LLVM_ABI Type * getVoidTy(LLVMContext &C)
Definition Type.cpp:282
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:326
bool isAggregateType() const
Return true if the type is an aggregate type.
Definition Type.h:319
bool isTokenTy() const
Return true if this is 'token'.
Definition Type.h:236
bool isVoidTy() const
Return true if this is 'void'.
Definition Type.h:141
BasicBlock * getSuccessor(unsigned i=0) const
Value * getOperand(unsigned i) const
Definition User.h:207
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
bool hasOneUse() const
Return true if there is exactly one use of this value.
Definition Value.h:439
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258
LLVM_ABI const Value * stripPointerCasts() const
Strip off pointer casts, all-zero GEPs and address space casts.
Definition Value.cpp:712
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr ScalarTy getKnownMinValue() const
Returns the minimum value this quantity can represent.
Definition TypeSize.h:165
constexpr bool isZero() const
Definition TypeSize.h:153
const ParentTy * getParent() const
Definition ilist_node.h:34
NodeTy * getNextNode()
Get the next node, or nullptr for the list tail.
Definition ilist_node.h:348
A raw_ostream that writes to an std::string.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
constexpr char SymbolName[]
Key for Kernel::Metadata::mSymbolName.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ BasicBlock
Various leaf nodes.
Definition ISDOpcodes.h:81
BinaryOp_match< SrcTy, SpecificConstantMatch, TargetOpcode::G_XOR, true > m_Not(const SrcTy &&Src)
Matches a register not-ed by a G_XOR.
OneUse_match< SubPat > m_OneUse(const SubPat &SP)
bool match(Val *V, const Pattern &P)
specificval_ty m_Specific(const Value *V)
Match if we have a specific specified value.
TwoOps_match< Val_t, Idx_t, Instruction::ExtractElement > m_ExtractElt(const Val_t &Val, const Idx_t &Idx)
Matches ExtractElementInst.
auto m_Value()
Match an arbitrary value and ignore it.
auto m_LogicalOr()
Matches L || R where L and R are arbitrary values.
auto m_LogicalAnd()
Matches L && R where L and R are arbitrary values.
Offsets
Offsets in bytes from the start of the input buffer.
LLVM_ABI void sortAndRangeify(CaseClusterVector &Clusters)
Sort Clusters and merge adjacent cases.
std::vector< CaseCluster > CaseClusterVector
@ CC_Range
A cluster of adjacent case labels with the same destination, or just one case.
@ CC_JumpTable
A cluster of cases suitable for jump table lowering.
@ CC_BitTests
A cluster of cases suitable for bit test lowering.
SmallVector< SwitchWorkListItem, 4 > SwitchWorkList
CaseClusterVector::iterator CaseClusterIt
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:50
initializer< Ty > init(const Ty &Val)
ExceptionBehavior
Exception behavior used for floating point operations.
Definition FPEnv.h:39
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
DiagnosticInfoOptimizationBase::Argument NV
NodeAddr< PhiNode * > Phi
Definition RDFGraph.h:390
NodeAddr< CodeNode * > Code
Definition RDFGraph.h:388
friend class Instruction
Iterator for Instructions in a `BasicBlock.
Definition BasicBlock.h:73
BaseReg
Stack frame base register. Bit 0 of FREInfo.Info.
Definition SFrame.h:77
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:315
@ Low
Lower the current thread's priority such that it does not affect foreground tasks significantly.
Definition Threading.h:280
@ Offset
Definition DWP.cpp:558
FunctionAddr VTableAddr Value
Definition InstrProf.h:137
@ Implicit
Not emitted register (e.g. carry, or temporary result).
@ Undef
Value of the register doesn't matter.
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2553
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
int countr_one(T Value)
Count the number of ones from the least significant bit to the first zero bit.
Definition bit.h:315
FunctionAddr VTableAddr uintptr_t uintptr_t Int32Ty
Definition InstrProf.h:328
LLVM_ABI void diagnoseDontCall(const CallInst &CI)
auto successors(const MachineBasicBlock *BB)
LLVM_ABI MVT getMVTForLLT(LLT Ty)
Get a rough equivalent of an MVT for a given LLT.
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
Definition STLExtras.h:2207
constexpr bool isUIntN(unsigned N, uint64_t x)
Checks if an unsigned integer fits into the given (dynamic) bit width.
Definition MathExtras.h:243
gep_type_iterator gep_type_end(const User *GEP)
LLVM_ABI MachineBasicBlock::iterator findSplitPointForStackProtector(MachineBasicBlock *BB, const TargetInstrInfo &TII)
Find the split point at which to splice the end of BB into its success stack protector check machine ...
LLVM_ABI LLT getLLTForMVT(MVT Ty)
Get a rough equivalent of an LLT for a given MVT.
constexpr int popcount(T Value) noexcept
Count the number of set bits in a value.
Definition bit.h:156
int countr_zero(T Val)
Count number of 0's from the least significant bit to the most stopping at the first 1.
Definition bit.h:204
Align getKnownAlignment(Value *V, const DataLayout &DL, const Instruction *CxtI=nullptr, AssumptionCache *AC=nullptr, const DominatorTree *DT=nullptr)
Try to infer an alignment for the specified pointer.
Definition Local.h:252
constexpr bool has_single_bit(T Value) noexcept
Definition bit.h:149
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1745
LLVM_ABI llvm::SmallVector< int, 16 > createStrideMask(unsigned Start, unsigned Stride, unsigned VF)
Create a stride shuffle mask.
auto reverse(ContainerTy &&C)
Definition STLExtras.h:407
void sort(IteratorTy Start, IteratorTy End)
Definition STLExtras.h:1635
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:209
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
generic_gep_type_iterator<> gep_type_iterator
auto succ_size(const MachineBasicBlock *BB)
LLVM_ABI EHPersonality classifyEHPersonality(const Value *Pers)
See if the given exception handling personality function is one that we understand.
CodeGenOptLevel
Code generation optimization level.
Definition CodeGen.h:82
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
@ Success
The lock was released successfully.
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
@ Global
Append to llvm.global_dtors.
@ First
Helpers to iterate all locations in the MemoryEffectsBase class.
Definition ModRef.h:74
LLVM_ABI void getSelectionDAGFallbackAnalysisUsage(AnalysisUsage &AU)
Modify analysis usage so it preserves passes required for the SelectionDAG fallback.
Definition Utils.cpp:1147
auto lower_bound(R &&Range, T &&Value)
Provide wrappers to std::lower_bound which take ranges instead of having to pass begin/end explicitly...
Definition STLExtras.h:2051
LLVM_ABI llvm::SmallVector< int, 16 > createInterleaveMask(unsigned VF, unsigned NumVecs)
Create an interleave shuffle mask.
@ FMul
Product of floats.
@ Sub
Subtraction of integers.
DWARFExpression::Operation Op
ArrayRef(const T &OneElt) -> ArrayRef< T >
bool isAsynchronousEHPersonality(EHPersonality Pers)
Returns true if this personality function catches asynchronous exceptions.
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
LLVM_ABI std::optional< RoundingMode > convertStrToRoundingMode(StringRef)
Returns a valid RoundingMode enumerator when given a string that is valid as input in constrained int...
Definition FPEnv.cpp:25
gep_type_iterator gep_type_begin(const User *GEP)
LLVM_ABI void computeValueLLTs(const DataLayout &DL, Type &Ty, SmallVectorImpl< LLT > &ValueLLTs, SmallVectorImpl< TypeSize > *Offsets=nullptr, TypeSize StartingOffset=TypeSize::getZero())
computeValueLLTs - Given an LLVM IR type, compute a sequence of LLTs that represent all the individua...
Definition Analysis.cpp:153
LLVM_ABI GlobalValue * ExtractTypeInfo(Value *V)
ExtractTypeInfo - Returns the type info, possibly bitcast, encoded in V.
Definition Analysis.cpp:181
Align commonAlignment(Align A, uint64_t Offset)
Returns the alignment that satisfies both alignments.
Definition Alignment.h:201
LLVM_ABI LLT getLLTForType(Type &Ty, const DataLayout &DL)
Construct a low-level type based on an LLVM type.
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:863
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
constexpr uint64_t value() const
This is a hole in the type system and should not be abused.
Definition Alignment.h:77
Pair of physical register and lane mask.
static LLVM_ABI MachinePointerInfo getFixedStack(MachineFunction &MF, int FI, int64_t Offset=0)
Return a MachinePointerInfo record that refers to the specified FrameIndex.
static bool canHandle(const Instruction *I, const TargetLibraryInfo &TLI)
static StringRef getLibcallImplName(RTLIB::LibcallImpl CallImpl)
Get the libcall routine name for the specified libcall implementation.
This structure is used to communicate between SelectionDAGBuilder and SDISel for the code generation ...
Register Reg
The virtual register containing the index of the jump table entry to jump to.
MachineBasicBlock * Default
The MBB of the default bb, which is a successor of the range check MBB.
unsigned JTI
The JumpTableIndex for this jump table in the function.
MachineBasicBlock * MBB
The MBB into which to emit the code for the indirect jump.