37#define DEBUG_TYPE "x86-fixup-inst-tuning"
39STATISTIC(NumInstChanges,
"Number of instructions changes");
42class X86FixupInstTuningImpl {
60 X86FixupInstTuningLegacy() : MachineFunctionPass(ID) {}
62 StringRef getPassName()
const override {
return "X86 Fixup Inst Tuning"; }
64 bool runOnMachineFunction(MachineFunction &MF)
override;
65 bool processInstruction(MachineFunction &MF, MachineBasicBlock &
MBB,
69 MachineFunctionProperties getRequiredProperties()
const override {
70 return MachineFunctionProperties().setNoVRegs();
75char X86FixupInstTuningLegacy ::ID = 0;
80 return new X86FixupInstTuningLegacy();
85 if (NewVal.has_value() && CurVal.has_value() && *NewVal != *CurVal)
86 return *NewVal < *CurVal;
91bool X86FixupInstTuningImpl::processInstruction(
94 MachineInstr &
MI = *
I;
95 unsigned Opc =
MI.getOpcode();
96 unsigned NumOperands =
MI.getDesc().getNumOperands();
99 auto GetInstTput = [&](
unsigned Opcode) -> std::optional<double> {
102 *ST, *(
SM->getSchedClassDesc(
TII->get(Opcode).getSchedClass())));
105 auto GetInstLat = [&](
unsigned Opcode) -> std::optional<double> {
108 *ST, *(
SM->getSchedClassDesc(
TII->get(Opcode).getSchedClass())));
111 auto GetInstSize = [&](
unsigned Opcode) -> std::optional<unsigned> {
118 auto NewOpcPreferable = [&](
unsigned NewOpc,
119 bool ReplaceInTie =
true) ->
bool {
120 std::optional<bool> Res;
121 if (
SM->hasInstrSchedModel()) {
145 auto ProcessVPERMILPDri = [&](
unsigned NewOpc) ->
bool {
146 if (!NewOpcPreferable(NewOpc))
150 unsigned MaskImm =
MI.getOperand(NumOperands - 1).getImm();
151 MI.removeOperand(NumOperands - 1);
152 MI.addOperand(
MI.getOperand(NumOperands - 2));
153 MI.setDesc(
TII->get(NewOpc));
164 auto ProcessVPERMILPSri = [&](
unsigned NewOpc) ->
bool {
165 if (!NewOpcPreferable(NewOpc))
169 unsigned MaskImm =
MI.getOperand(NumOperands - 1).getImm();
170 MI.removeOperand(NumOperands - 1);
171 MI.addOperand(
MI.getOperand(NumOperands - 2));
172 MI.setDesc(
TII->get(NewOpc));
182 auto ProcessVPERMILPSmi = [&](
unsigned NewOpc) ->
bool {
186 !NewOpcPreferable(NewOpc,
false))
190 MI.setDesc(
TII->get(NewOpc));
210 auto ProcessUNPCK = [&](
unsigned NewOpc,
unsigned MaskImm) ->
bool {
211 if (!NewOpcPreferable(NewOpc,
false))
215 MI.setDesc(
TII->get(NewOpc));
222 auto ProcessUNPCKToIntDomain = [&](
unsigned NewOpc) ->
bool {
227 !NewOpcPreferable(NewOpc,
false))
231 MI.setDesc(
TII->get(NewOpc));
237 auto ProcessUNPCKLPDrr = [&](
unsigned NewOpcIntDomain,
238 unsigned NewOpc) ->
bool {
239 if (ProcessUNPCKToIntDomain(NewOpcIntDomain))
241 return ProcessUNPCK(NewOpc, 0x00);
243 auto ProcessUNPCKHPDrr = [&](
unsigned NewOpcIntDomain,
244 unsigned NewOpc) ->
bool {
245 if (ProcessUNPCKToIntDomain(NewOpcIntDomain))
247 return ProcessUNPCK(NewOpc, 0xff);
250 auto ProcessUNPCKPDrm = [&](
unsigned NewOpcIntDomain) ->
bool {
251 return ProcessUNPCKToIntDomain(NewOpcIntDomain);
254 auto ProcessUNPCKPS = [&](
unsigned NewOpc) ->
bool {
255 return ProcessUNPCKToIntDomain(NewOpc);
260 auto ProcessVPERM2x128ToVINSERT128 = [&](
unsigned InsertOpc) ->
bool {
261 unsigned PermImm =
MI.getOperand(NumOperands - 1).getImm();
263 if (PermImm != 0x20 || !NewOpcPreferable(InsertOpc))
265 Register RHSRegYMM =
MI.getOperand(NumOperands - 2).getReg();
266 Register RHSRegXMM =
TRI->getSubReg(RHSRegYMM, X86::sub_xmm);
269 MI.setDesc(
TII->get(InsertOpc));
270 MI.removeOperand(NumOperands - 1);
271 MI.removeOperand(NumOperands - 2);
283 auto ProcessBLENDWToBLENDD = [&](
unsigned MovOpc,
unsigned NumElts) ->
bool {
284 if (!ST->
hasAVX2() || !NewOpcPreferable(MovOpc))
288 APInt(8,
MI.getOperand(NumOperands - 1).getImm(),
false,
296 MI.setDesc(
TII->get(MovOpc));
297 MI.removeOperand(NumOperands - 1);
304 auto ProcessBLENDToMOV = [&](
unsigned MovOpc,
unsigned Mask,
305 unsigned MovImm) ->
bool {
306 if ((
MI.getOperand(NumOperands - 1).getImm() & Mask) != MovImm)
308 if (!OptSize && !NewOpcPreferable(MovOpc))
312 MI.setDesc(
TII->get(MovOpc));
313 MI.removeOperand(NumOperands - 1);
320 auto ProcessShiftLeftToAdd = [&](
unsigned AddOpc) ->
bool {
321 if (
MI.getOperand(NumOperands - 1).getImm() != 1)
323 if (!NewOpcPreferable(AddOpc,
true))
327 MI.setDesc(
TII->get(AddOpc));
328 MI.removeOperand(NumOperands - 1);
329 MI.addOperand(
MI.getOperand(NumOperands - 2));
341 auto ProcessVPERMQToVINSERT128 = [&](
unsigned NewOpc) ->
bool {
342 if (
MI.getOperand(NumOperands - 1).getImm() != 0x44)
344 if (!NewOpcPreferable(NewOpc,
false))
349 Register XmmReg =
TRI->getSubReg(SrcReg, X86::sub_xmm);
355 MI.setDesc(
TII->get(NewOpc));
357 MI.removeOperand(NumOperands - 1);
370 case X86::BLENDPDrri:
371 return ProcessBLENDToMOV(X86::MOVSDrr, 0x3, 0x1);
372 case X86::VBLENDPDrri:
373 return ProcessBLENDToMOV(X86::VMOVSDrr, 0x3, 0x1);
375 case X86::BLENDPSrri:
376 return ProcessBLENDToMOV(X86::MOVSSrr, 0xF, 0x1) ||
377 ProcessBLENDToMOV(X86::MOVSDrr, 0xF, 0x3);
378 case X86::VBLENDPSrri:
379 return ProcessBLENDToMOV(X86::VMOVSSrr, 0xF, 0x1) ||
380 ProcessBLENDToMOV(X86::VMOVSDrr, 0xF, 0x3);
382 case X86::VPBLENDWrri:
386 return ProcessBLENDWToBLENDD(X86::VPBLENDDrri, 4);
388 case X86::VPERM2F128rri:
389 return ProcessVPERM2x128ToVINSERT128(X86::VINSERTF128rri);
390 case X86::VPERM2I128rri:
391 return ProcessVPERM2x128ToVINSERT128(X86::VINSERTI128rri);
393 case X86::VPERMILPDri:
394 return ProcessVPERMILPDri(X86::VSHUFPDrri);
395 case X86::VPERMILPDYri:
396 return ProcessVPERMILPDri(X86::VSHUFPDYrri);
397 case X86::VPERMILPDZ128ri:
398 return ProcessVPERMILPDri(X86::VSHUFPDZ128rri);
399 case X86::VPERMILPDZ256ri:
400 return ProcessVPERMILPDri(X86::VSHUFPDZ256rri);
401 case X86::VPERMILPDZri:
402 return ProcessVPERMILPDri(X86::VSHUFPDZrri);
403 case X86::VPERMILPDZ128rikz:
404 return ProcessVPERMILPDri(X86::VSHUFPDZ128rrikz);
405 case X86::VPERMILPDZ256rikz:
406 return ProcessVPERMILPDri(X86::VSHUFPDZ256rrikz);
407 case X86::VPERMILPDZrikz:
408 return ProcessVPERMILPDri(X86::VSHUFPDZrrikz);
409 case X86::VPERMILPDZ128rik:
410 return ProcessVPERMILPDri(X86::VSHUFPDZ128rrik);
411 case X86::VPERMILPDZ256rik:
412 return ProcessVPERMILPDri(X86::VSHUFPDZ256rrik);
413 case X86::VPERMILPDZrik:
414 return ProcessVPERMILPDri(X86::VSHUFPDZrrik);
416 case X86::VPERMILPSri:
417 return ProcessVPERMILPSri(X86::VSHUFPSrri);
418 case X86::VPERMILPSYri:
419 return ProcessVPERMILPSri(X86::VSHUFPSYrri);
420 case X86::VPERMILPSZ128ri:
421 return ProcessVPERMILPSri(X86::VSHUFPSZ128rri);
422 case X86::VPERMILPSZ256ri:
423 return ProcessVPERMILPSri(X86::VSHUFPSZ256rri);
424 case X86::VPERMILPSZri:
425 return ProcessVPERMILPSri(X86::VSHUFPSZrri);
426 case X86::VPERMILPSZ128rikz:
427 return ProcessVPERMILPSri(X86::VSHUFPSZ128rrikz);
428 case X86::VPERMILPSZ256rikz:
429 return ProcessVPERMILPSri(X86::VSHUFPSZ256rrikz);
430 case X86::VPERMILPSZrikz:
431 return ProcessVPERMILPSri(X86::VSHUFPSZrrikz);
432 case X86::VPERMILPSZ128rik:
433 return ProcessVPERMILPSri(X86::VSHUFPSZ128rrik);
434 case X86::VPERMILPSZ256rik:
435 return ProcessVPERMILPSri(X86::VSHUFPSZ256rrik);
436 case X86::VPERMILPSZrik:
437 return ProcessVPERMILPSri(X86::VSHUFPSZrrik);
438 case X86::VPERMILPSmi:
439 return ProcessVPERMILPSmi(X86::VPSHUFDmi);
440 case X86::VPERMILPSYmi:
443 return ST->
hasAVX2() ? ProcessVPERMILPSmi(X86::VPSHUFDYmi) :
false;
444 case X86::VPERMILPSZ128mi:
445 return ProcessVPERMILPSmi(X86::VPSHUFDZ128mi);
446 case X86::VPERMILPSZ256mi:
447 return ProcessVPERMILPSmi(X86::VPSHUFDZ256mi);
448 case X86::VPERMILPSZmi:
449 return ProcessVPERMILPSmi(X86::VPSHUFDZmi);
450 case X86::VPERMILPSZ128mikz:
451 return ProcessVPERMILPSmi(X86::VPSHUFDZ128mikz);
452 case X86::VPERMILPSZ256mikz:
453 return ProcessVPERMILPSmi(X86::VPSHUFDZ256mikz);
454 case X86::VPERMILPSZmikz:
455 return ProcessVPERMILPSmi(X86::VPSHUFDZmikz);
456 case X86::VPERMILPSZ128mik:
457 return ProcessVPERMILPSmi(X86::VPSHUFDZ128mik);
458 case X86::VPERMILPSZ256mik:
459 return ProcessVPERMILPSmi(X86::VPSHUFDZ256mik);
460 case X86::VPERMILPSZmik:
461 return ProcessVPERMILPSmi(X86::VPSHUFDZmik);
463 return ProcessVPERMQToVINSERT128(X86::VINSERTI128rri);
464 case X86::VPERMPDYri:
465 return ProcessVPERMQToVINSERT128(X86::VINSERTF128rri);
467 case X86::UNPCKLPDrr:
468 return ProcessUNPCKLPDrr(X86::PUNPCKLQDQrr, X86::SHUFPDrri);
469 case X86::VMOVLHPSrr:
470 case X86::VUNPCKLPDrr:
471 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQrr, X86::VSHUFPDrri);
472 case X86::VUNPCKLPDYrr:
473 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQYrr, X86::VSHUFPDYrri);
475 case X86::VMOVLHPSZrr:
476 case X86::VUNPCKLPDZ128rr:
477 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZ128rr, X86::VSHUFPDZ128rri);
478 case X86::VUNPCKLPDZ256rr:
479 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZ256rr, X86::VSHUFPDZ256rri);
480 case X86::VUNPCKLPDZrr:
481 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZrr, X86::VSHUFPDZrri);
482 case X86::VUNPCKLPDZ128rrk:
483 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZ128rrk, X86::VSHUFPDZ128rrik);
484 case X86::VUNPCKLPDZ256rrk:
485 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZ256rrk, X86::VSHUFPDZ256rrik);
486 case X86::VUNPCKLPDZrrk:
487 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZrrk, X86::VSHUFPDZrrik);
488 case X86::VUNPCKLPDZ128rrkz:
489 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZ128rrkz, X86::VSHUFPDZ128rrikz);
490 case X86::VUNPCKLPDZ256rrkz:
491 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZ256rrkz, X86::VSHUFPDZ256rrikz);
492 case X86::VUNPCKLPDZrrkz:
493 return ProcessUNPCKLPDrr(X86::VPUNPCKLQDQZrrkz, X86::VSHUFPDZrrikz);
494 case X86::UNPCKHPDrr:
495 return ProcessUNPCKHPDrr(X86::PUNPCKHQDQrr, X86::SHUFPDrri);
496 case X86::VUNPCKHPDrr:
497 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQrr, X86::VSHUFPDrri);
498 case X86::VUNPCKHPDYrr:
499 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQYrr, X86::VSHUFPDYrri);
500 case X86::VUNPCKHPDZ128rr:
501 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZ128rr, X86::VSHUFPDZ128rri);
502 case X86::VUNPCKHPDZ256rr:
503 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZ256rr, X86::VSHUFPDZ256rri);
504 case X86::VUNPCKHPDZrr:
505 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZrr, X86::VSHUFPDZrri);
506 case X86::VUNPCKHPDZ128rrk:
507 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZ128rrk, X86::VSHUFPDZ128rrik);
508 case X86::VUNPCKHPDZ256rrk:
509 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZ256rrk, X86::VSHUFPDZ256rrik);
510 case X86::VUNPCKHPDZrrk:
511 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZrrk, X86::VSHUFPDZrrik);
512 case X86::VUNPCKHPDZ128rrkz:
513 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZ128rrkz, X86::VSHUFPDZ128rrikz);
514 case X86::VUNPCKHPDZ256rrkz:
515 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZ256rrkz, X86::VSHUFPDZ256rrikz);
516 case X86::VUNPCKHPDZrrkz:
517 return ProcessUNPCKHPDrr(X86::VPUNPCKHQDQZrrkz, X86::VSHUFPDZrrikz);
518 case X86::UNPCKLPDrm:
519 return ProcessUNPCKPDrm(X86::PUNPCKLQDQrm);
520 case X86::VUNPCKLPDrm:
521 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQrm);
522 case X86::VUNPCKLPDYrm:
523 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQYrm);
524 case X86::VUNPCKLPDZ128rm:
525 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZ128rm);
526 case X86::VUNPCKLPDZ256rm:
527 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZ256rm);
528 case X86::VUNPCKLPDZrm:
529 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZrm);
530 case X86::VUNPCKLPDZ128rmk:
531 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZ128rmk);
532 case X86::VUNPCKLPDZ256rmk:
533 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZ256rmk);
534 case X86::VUNPCKLPDZrmk:
535 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZrmk);
536 case X86::VUNPCKLPDZ128rmkz:
537 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZ128rmkz);
538 case X86::VUNPCKLPDZ256rmkz:
539 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZ256rmkz);
540 case X86::VUNPCKLPDZrmkz:
541 return ProcessUNPCKPDrm(X86::VPUNPCKLQDQZrmkz);
542 case X86::UNPCKHPDrm:
543 return ProcessUNPCKPDrm(X86::PUNPCKHQDQrm);
544 case X86::VUNPCKHPDrm:
545 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQrm);
546 case X86::VUNPCKHPDYrm:
547 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQYrm);
548 case X86::VUNPCKHPDZ128rm:
549 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZ128rm);
550 case X86::VUNPCKHPDZ256rm:
551 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZ256rm);
552 case X86::VUNPCKHPDZrm:
553 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZrm);
554 case X86::VUNPCKHPDZ128rmk:
555 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZ128rmk);
556 case X86::VUNPCKHPDZ256rmk:
557 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZ256rmk);
558 case X86::VUNPCKHPDZrmk:
559 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZrmk);
560 case X86::VUNPCKHPDZ128rmkz:
561 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZ128rmkz);
562 case X86::VUNPCKHPDZ256rmkz:
563 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZ256rmkz);
564 case X86::VUNPCKHPDZrmkz:
565 return ProcessUNPCKPDrm(X86::VPUNPCKHQDQZrmkz);
567 case X86::UNPCKLPSrr:
568 return ProcessUNPCKPS(X86::PUNPCKLDQrr);
569 case X86::VUNPCKLPSrr:
570 return ProcessUNPCKPS(X86::VPUNPCKLDQrr);
571 case X86::VUNPCKLPSYrr:
572 return ProcessUNPCKPS(X86::VPUNPCKLDQYrr);
573 case X86::VUNPCKLPSZ128rr:
574 return ProcessUNPCKPS(X86::VPUNPCKLDQZ128rr);
575 case X86::VUNPCKLPSZ256rr:
576 return ProcessUNPCKPS(X86::VPUNPCKLDQZ256rr);
577 case X86::VUNPCKLPSZrr:
578 return ProcessUNPCKPS(X86::VPUNPCKLDQZrr);
579 case X86::VUNPCKLPSZ128rrk:
580 return ProcessUNPCKPS(X86::VPUNPCKLDQZ128rrk);
581 case X86::VUNPCKLPSZ256rrk:
582 return ProcessUNPCKPS(X86::VPUNPCKLDQZ256rrk);
583 case X86::VUNPCKLPSZrrk:
584 return ProcessUNPCKPS(X86::VPUNPCKLDQZrrk);
585 case X86::VUNPCKLPSZ128rrkz:
586 return ProcessUNPCKPS(X86::VPUNPCKLDQZ128rrkz);
587 case X86::VUNPCKLPSZ256rrkz:
588 return ProcessUNPCKPS(X86::VPUNPCKLDQZ256rrkz);
589 case X86::VUNPCKLPSZrrkz:
590 return ProcessUNPCKPS(X86::VPUNPCKLDQZrrkz);
591 case X86::UNPCKHPSrr:
592 return ProcessUNPCKPS(X86::PUNPCKHDQrr);
593 case X86::VUNPCKHPSrr:
594 return ProcessUNPCKPS(X86::VPUNPCKHDQrr);
595 case X86::VUNPCKHPSYrr:
596 return ProcessUNPCKPS(X86::VPUNPCKHDQYrr);
597 case X86::VUNPCKHPSZ128rr:
598 return ProcessUNPCKPS(X86::VPUNPCKHDQZ128rr);
599 case X86::VUNPCKHPSZ256rr:
600 return ProcessUNPCKPS(X86::VPUNPCKHDQZ256rr);
601 case X86::VUNPCKHPSZrr:
602 return ProcessUNPCKPS(X86::VPUNPCKHDQZrr);
603 case X86::VUNPCKHPSZ128rrk:
604 return ProcessUNPCKPS(X86::VPUNPCKHDQZ128rrk);
605 case X86::VUNPCKHPSZ256rrk:
606 return ProcessUNPCKPS(X86::VPUNPCKHDQZ256rrk);
607 case X86::VUNPCKHPSZrrk:
608 return ProcessUNPCKPS(X86::VPUNPCKHDQZrrk);
609 case X86::VUNPCKHPSZ128rrkz:
610 return ProcessUNPCKPS(X86::VPUNPCKHDQZ128rrkz);
611 case X86::VUNPCKHPSZ256rrkz:
612 return ProcessUNPCKPS(X86::VPUNPCKHDQZ256rrkz);
613 case X86::VUNPCKHPSZrrkz:
614 return ProcessUNPCKPS(X86::VPUNPCKHDQZrrkz);
615 case X86::UNPCKLPSrm:
616 return ProcessUNPCKPS(X86::PUNPCKLDQrm);
617 case X86::VUNPCKLPSrm:
618 return ProcessUNPCKPS(X86::VPUNPCKLDQrm);
619 case X86::VUNPCKLPSYrm:
620 return ProcessUNPCKPS(X86::VPUNPCKLDQYrm);
621 case X86::VUNPCKLPSZ128rm:
622 return ProcessUNPCKPS(X86::VPUNPCKLDQZ128rm);
623 case X86::VUNPCKLPSZ256rm:
624 return ProcessUNPCKPS(X86::VPUNPCKLDQZ256rm);
625 case X86::VUNPCKLPSZrm:
626 return ProcessUNPCKPS(X86::VPUNPCKLDQZrm);
627 case X86::VUNPCKLPSZ128rmk:
628 return ProcessUNPCKPS(X86::VPUNPCKLDQZ128rmk);
629 case X86::VUNPCKLPSZ256rmk:
630 return ProcessUNPCKPS(X86::VPUNPCKLDQZ256rmk);
631 case X86::VUNPCKLPSZrmk:
632 return ProcessUNPCKPS(X86::VPUNPCKLDQZrmk);
633 case X86::VUNPCKLPSZ128rmkz:
634 return ProcessUNPCKPS(X86::VPUNPCKLDQZ128rmkz);
635 case X86::VUNPCKLPSZ256rmkz:
636 return ProcessUNPCKPS(X86::VPUNPCKLDQZ256rmkz);
637 case X86::VUNPCKLPSZrmkz:
638 return ProcessUNPCKPS(X86::VPUNPCKLDQZrmkz);
639 case X86::UNPCKHPSrm:
640 return ProcessUNPCKPS(X86::PUNPCKHDQrm);
641 case X86::VUNPCKHPSrm:
642 return ProcessUNPCKPS(X86::VPUNPCKHDQrm);
643 case X86::VUNPCKHPSYrm:
644 return ProcessUNPCKPS(X86::VPUNPCKHDQYrm);
645 case X86::VUNPCKHPSZ128rm:
646 return ProcessUNPCKPS(X86::VPUNPCKHDQZ128rm);
647 case X86::VUNPCKHPSZ256rm:
648 return ProcessUNPCKPS(X86::VPUNPCKHDQZ256rm);
649 case X86::VUNPCKHPSZrm:
650 return ProcessUNPCKPS(X86::VPUNPCKHDQZrm);
651 case X86::VUNPCKHPSZ128rmk:
652 return ProcessUNPCKPS(X86::VPUNPCKHDQZ128rmk);
653 case X86::VUNPCKHPSZ256rmk:
654 return ProcessUNPCKPS(X86::VPUNPCKHDQZ256rmk);
655 case X86::VUNPCKHPSZrmk:
656 return ProcessUNPCKPS(X86::VPUNPCKHDQZrmk);
657 case X86::VUNPCKHPSZ128rmkz:
658 return ProcessUNPCKPS(X86::VPUNPCKHDQZ128rmkz);
659 case X86::VUNPCKHPSZ256rmkz:
660 return ProcessUNPCKPS(X86::VPUNPCKHDQZ256rmkz);
661 case X86::VUNPCKHPSZrmkz:
662 return ProcessUNPCKPS(X86::VPUNPCKHDQZrmkz);
665 return ProcessShiftLeftToAdd(X86::PADDWrr);
667 return ProcessShiftLeftToAdd(X86::VPADDWrr);
669 return ProcessShiftLeftToAdd(X86::VPADDWYrr);
670 case X86::VPSLLWZ128ri:
671 return ProcessShiftLeftToAdd(X86::VPADDWZ128rr);
672 case X86::VPSLLWZ256ri:
673 return ProcessShiftLeftToAdd(X86::VPADDWZ256rr);
675 return ProcessShiftLeftToAdd(X86::VPADDWZrr);
677 return ProcessShiftLeftToAdd(X86::PADDDrr);
679 return ProcessShiftLeftToAdd(X86::VPADDDrr);
681 return ProcessShiftLeftToAdd(X86::VPADDDYrr);
682 case X86::VPSLLDZ128ri:
683 return ProcessShiftLeftToAdd(X86::VPADDDZ128rr);
684 case X86::VPSLLDZ256ri:
685 return ProcessShiftLeftToAdd(X86::VPADDDZ256rr);
687 return ProcessShiftLeftToAdd(X86::VPADDDZrr);
689 return ProcessShiftLeftToAdd(X86::PADDQrr);
691 return ProcessShiftLeftToAdd(X86::VPADDQrr);
693 return ProcessShiftLeftToAdd(X86::VPADDQYrr);
694 case X86::VPSLLQZ128ri:
695 return ProcessShiftLeftToAdd(X86::VPADDQZ128rr);
696 case X86::VPSLLQZ256ri:
697 return ProcessShiftLeftToAdd(X86::VPADDQZ256rr);
699 return ProcessShiftLeftToAdd(X86::VPADDQZrr);
706bool X86FixupInstTuningImpl::runOnMachineFunction(MachineFunction &MF) {
712 SM = &ST->getSchedModel();
714 for (MachineBasicBlock &
MBB : MF) {
716 if (processInstruction(MF,
MBB,
I)) {
726bool X86FixupInstTuningLegacy::runOnMachineFunction(MachineFunction &MF) {
727 X86FixupInstTuningImpl Impl;
728 return Impl.runOnMachineFunction(MF);
734 X86FixupInstTuningImpl Impl;
735 return Impl.runOnMachineFunction(MF)
Function Alias Analysis false
const HexagonInstrInfo * TII
Register const TargetRegisterInfo * TRI
Promote Memory to Register
static constexpr unsigned SM(unsigned Version)
#define INITIALIZE_PASS(passName, arg, name, cfg, analysis)
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
#define STATISTIC(VARNAME, DESC)
static std::optional< bool > CmpOptionals(T NewVal, T CurVal)
uint64_t getZExtValue() const
Get zero extended value.
static LLVM_ABI APInt getSplat(unsigned NewLen, const APInt &V)
Return a value containing V broadcasted over NewLen bits.
Represents analyses that only rely on functions' control flow.
FunctionPass class - This class is used to implement most global optimizations.
bool hasOptSize() const
Optimize this function for size (-Os) or minimum size (-Oz).
unsigned getSize(const MachineInstr &MI) const
MachineInstrBundleIterator< MachineInstr > iterator
MachineFunctionPass - This class adapts the FunctionPass interface to allow convenient creation of pa...
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
Function & getFunction()
Return the LLVM function that this machine code represents.
static MachineOperand CreateImm(int64_t Val)
static MachineOperand CreateReg(Register Reg, bool isDef, bool isImp=false, bool isKill=false, bool isDead=false, bool isUndef=false, bool isEarlyClobber=false, unsigned SubReg=0, bool isDebug=false, bool isInternalRead=false, bool isRenamable=false)
static PreservedAnalyses all()
Construct a special preserved set that preserves all passes.
PreservedAnalyses & preserveSet()
Mark an analysis set as preserved.
PreservedAnalyses run(MachineFunction &MF, MachineFunctionAnalysisManager &MFAM)
bool hasNoDomainDelayShuffle() const
const X86InstrInfo * getInstrInfo() const override
const X86RegisterInfo * getRegisterInfo() const override
Pass manager infrastructure for declaring and invalidating analyses.
LLVM_ABI APInt ScaleBitMask(const APInt &A, unsigned NewBitWidth, bool MatchAllBits=false)
Splat/Merge neighboring bits to widen/narrow the bitmask represented by.
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
This is an optimization pass for GlobalISel generic memory operations.
AnalysisManager< MachineFunction > MachineFunctionAnalysisManager
LLVM_ABI PreservedAnalyses getMachineFunctionPassPreservedAnalyses()
Returns the minimum set of Analyses that all machine function passes must preserve.
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
FunctionPass * createX86FixupInstTuningLegacyPass()
Machine model for scheduling, bundling, and heuristics.
static LLVM_ABI int computeInstrLatency(const MCSubtargetInfo &STI, const MCSchedClassDesc &SCDesc)
Returns the latency value for the scheduling class.
static LLVM_ABI double getReciprocalThroughput(const MCSubtargetInfo &STI, const MCSchedClassDesc &SCDesc)