Home | History | Annotate | Download | only in Hexagon
      1 //===-- HexagonPeephole.cpp - Hexagon Peephole Optimiztions ---------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 // This peephole pass optimizes in the following cases.
      9 // 1. Optimizes redundant sign extends for the following case
     10 //    Transform the following pattern
     11 //    %vreg170<def> = SXTW %vreg166
     12 //    ...
     13 //    %vreg176<def> = COPY %vreg170:subreg_loreg
     14 //
     15 //    Into
     16 //    %vreg176<def> = COPY vreg166
     17 //
     18 //  2. Optimizes redundant negation of predicates.
     19 //     %vreg15<def> = CMPGTrr %vreg6, %vreg2
     20 //     ...
     21 //     %vreg16<def> = NOT_p %vreg15<kill>
     22 //     ...
     23 //     JMP_c %vreg16<kill>, <BB#1>, %PC<imp-def,dead>
     24 //
     25 //     Into
     26 //     %vreg15<def> = CMPGTrr %vreg6, %vreg2;
     27 //     ...
     28 //     JMP_cNot %vreg15<kill>, <BB#1>, %PC<imp-def,dead>;
     29 //
     30 // Note: The peephole pass makes the instrucstions like
     31 // %vreg170<def> = SXTW %vreg166 or %vreg16<def> = NOT_p %vreg15<kill>
     32 // redundant and relies on some form of dead removal instructions, like
     33 // DCE or DIE to actually eliminate them.
     34 
     35 
     36 //===----------------------------------------------------------------------===//
     37 
     38 #include "Hexagon.h"
     39 #include "HexagonTargetMachine.h"
     40 #include "llvm/ADT/DenseMap.h"
     41 #include "llvm/ADT/Statistic.h"
     42 #include "llvm/CodeGen/MachineFunction.h"
     43 #include "llvm/CodeGen/MachineFunctionPass.h"
     44 #include "llvm/CodeGen/MachineInstrBuilder.h"
     45 #include "llvm/CodeGen/MachineRegisterInfo.h"
     46 #include "llvm/CodeGen/Passes.h"
     47 #include "llvm/IR/Constants.h"
     48 #include "llvm/PassSupport.h"
     49 #include "llvm/Support/CommandLine.h"
     50 #include "llvm/Support/Debug.h"
     51 #include "llvm/Support/raw_ostream.h"
     52 #include "llvm/Target/TargetInstrInfo.h"
     53 #include "llvm/Target/TargetMachine.h"
     54 #include "llvm/Target/TargetRegisterInfo.h"
     55 #include <algorithm>
     56 
     57 using namespace llvm;
     58 
     59 #define DEBUG_TYPE "hexagon-peephole"
     60 
     61 static cl::opt<bool> DisableHexagonPeephole("disable-hexagon-peephole",
     62     cl::Hidden, cl::ZeroOrMore, cl::init(false),
     63     cl::desc("Disable Peephole Optimization"));
     64 
     65 static cl::opt<bool> DisablePNotP("disable-hexagon-pnotp",
     66     cl::Hidden, cl::ZeroOrMore, cl::init(false),
     67     cl::desc("Disable Optimization of PNotP"));
     68 
     69 static cl::opt<bool> DisableOptSZExt("disable-hexagon-optszext",
     70     cl::Hidden, cl::ZeroOrMore, cl::init(false),
     71     cl::desc("Disable Optimization of Sign/Zero Extends"));
     72 
     73 static cl::opt<bool> DisableOptExtTo64("disable-hexagon-opt-ext-to-64",
     74     cl::Hidden, cl::ZeroOrMore, cl::init(false),
     75     cl::desc("Disable Optimization of extensions to i64."));
     76 
     77 namespace llvm {
     78   FunctionPass *createHexagonPeephole();
     79   void initializeHexagonPeepholePass(PassRegistry&);
     80 }
     81 
     82 namespace {
     83   struct HexagonPeephole : public MachineFunctionPass {
     84     const HexagonInstrInfo    *QII;
     85     const HexagonRegisterInfo *QRI;
     86     const MachineRegisterInfo *MRI;
     87 
     88   public:
     89     static char ID;
     90     HexagonPeephole() : MachineFunctionPass(ID) {
     91       initializeHexagonPeepholePass(*PassRegistry::getPassRegistry());
     92     }
     93 
     94     bool runOnMachineFunction(MachineFunction &MF) override;
     95 
     96     const char *getPassName() const override {
     97       return "Hexagon optimize redundant zero and size extends";
     98     }
     99 
    100     void getAnalysisUsage(AnalysisUsage &AU) const override {
    101       MachineFunctionPass::getAnalysisUsage(AU);
    102     }
    103 
    104   private:
    105     void ChangeOpInto(MachineOperand &Dst, MachineOperand &Src);
    106   };
    107 }
    108 
    109 char HexagonPeephole::ID = 0;
    110 
    111 INITIALIZE_PASS(HexagonPeephole, "hexagon-peephole", "Hexagon Peephole",
    112                 false, false)
    113 
    114 bool HexagonPeephole::runOnMachineFunction(MachineFunction &MF) {
    115   QII = static_cast<const HexagonInstrInfo *>(MF.getSubtarget().getInstrInfo());
    116   QRI = MF.getSubtarget<HexagonSubtarget>().getRegisterInfo();
    117   MRI = &MF.getRegInfo();
    118 
    119   DenseMap<unsigned, unsigned> PeepholeMap;
    120   DenseMap<unsigned, std::pair<unsigned, unsigned> > PeepholeDoubleRegsMap;
    121 
    122   if (DisableHexagonPeephole) return false;
    123 
    124   // Loop over all of the basic blocks.
    125   for (MachineFunction::iterator MBBb = MF.begin(), MBBe = MF.end();
    126        MBBb != MBBe; ++MBBb) {
    127     MachineBasicBlock *MBB = &*MBBb;
    128     PeepholeMap.clear();
    129     PeepholeDoubleRegsMap.clear();
    130 
    131     // Traverse the basic block.
    132     for (MachineBasicBlock::iterator MII = MBB->begin(); MII != MBB->end();
    133                                      ++MII) {
    134       MachineInstr *MI = MII;
    135       // Look for sign extends:
    136       // %vreg170<def> = SXTW %vreg166
    137       if (!DisableOptSZExt && MI->getOpcode() == Hexagon::A2_sxtw) {
    138         assert (MI->getNumOperands() == 2);
    139         MachineOperand &Dst = MI->getOperand(0);
    140         MachineOperand &Src  = MI->getOperand(1);
    141         unsigned DstReg = Dst.getReg();
    142         unsigned SrcReg = Src.getReg();
    143         // Just handle virtual registers.
    144         if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
    145             TargetRegisterInfo::isVirtualRegister(SrcReg)) {
    146           // Map the following:
    147           // %vreg170<def> = SXTW %vreg166
    148           // PeepholeMap[170] = vreg166
    149           PeepholeMap[DstReg] = SrcReg;
    150         }
    151       }
    152 
    153       // Look for  %vreg170<def> = COMBINE_ir_V4 (0, %vreg169)
    154       // %vreg170:DoublRegs, %vreg169:IntRegs
    155       if (!DisableOptExtTo64 &&
    156           MI->getOpcode () == Hexagon::A4_combineir) {
    157         assert (MI->getNumOperands() == 3);
    158         MachineOperand &Dst = MI->getOperand(0);
    159         MachineOperand &Src1 = MI->getOperand(1);
    160         MachineOperand &Src2 = MI->getOperand(2);
    161         if (Src1.getImm() != 0)
    162           continue;
    163         unsigned DstReg = Dst.getReg();
    164         unsigned SrcReg = Src2.getReg();
    165         PeepholeMap[DstReg] = SrcReg;
    166       }
    167 
    168       // Look for this sequence below
    169       // %vregDoubleReg1 = LSRd_ri %vregDoubleReg0, 32
    170       // %vregIntReg = COPY %vregDoubleReg1:subreg_loreg.
    171       // and convert into
    172       // %vregIntReg = COPY %vregDoubleReg0:subreg_hireg.
    173       if (MI->getOpcode() == Hexagon::S2_lsr_i_p) {
    174         assert(MI->getNumOperands() == 3);
    175         MachineOperand &Dst = MI->getOperand(0);
    176         MachineOperand &Src1 = MI->getOperand(1);
    177         MachineOperand &Src2 = MI->getOperand(2);
    178         if (Src2.getImm() != 32)
    179           continue;
    180         unsigned DstReg = Dst.getReg();
    181         unsigned SrcReg = Src1.getReg();
    182         PeepholeDoubleRegsMap[DstReg] =
    183           std::make_pair(*&SrcReg, Hexagon::subreg_hireg);
    184       }
    185 
    186       // Look for P=NOT(P).
    187       if (!DisablePNotP &&
    188           (MI->getOpcode() == Hexagon::C2_not)) {
    189         assert (MI->getNumOperands() == 2);
    190         MachineOperand &Dst = MI->getOperand(0);
    191         MachineOperand &Src  = MI->getOperand(1);
    192         unsigned DstReg = Dst.getReg();
    193         unsigned SrcReg = Src.getReg();
    194         // Just handle virtual registers.
    195         if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
    196             TargetRegisterInfo::isVirtualRegister(SrcReg)) {
    197           // Map the following:
    198           // %vreg170<def> = NOT_xx %vreg166
    199           // PeepholeMap[170] = vreg166
    200           PeepholeMap[DstReg] = SrcReg;
    201         }
    202       }
    203 
    204       // Look for copy:
    205       // %vreg176<def> = COPY %vreg170:subreg_loreg
    206       if (!DisableOptSZExt && MI->isCopy()) {
    207         assert (MI->getNumOperands() == 2);
    208         MachineOperand &Dst = MI->getOperand(0);
    209         MachineOperand &Src  = MI->getOperand(1);
    210 
    211         // Make sure we are copying the lower 32 bits.
    212         if (Src.getSubReg() != Hexagon::subreg_loreg)
    213           continue;
    214 
    215         unsigned DstReg = Dst.getReg();
    216         unsigned SrcReg = Src.getReg();
    217         if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
    218             TargetRegisterInfo::isVirtualRegister(SrcReg)) {
    219           // Try to find in the map.
    220           if (unsigned PeepholeSrc = PeepholeMap.lookup(SrcReg)) {
    221             // Change the 1st operand.
    222             MI->RemoveOperand(1);
    223             MI->addOperand(MachineOperand::CreateReg(PeepholeSrc, false));
    224           } else  {
    225             DenseMap<unsigned, std::pair<unsigned, unsigned> >::iterator DI =
    226               PeepholeDoubleRegsMap.find(SrcReg);
    227             if (DI != PeepholeDoubleRegsMap.end()) {
    228               std::pair<unsigned,unsigned> PeepholeSrc = DI->second;
    229               MI->RemoveOperand(1);
    230               MI->addOperand(MachineOperand::CreateReg(PeepholeSrc.first,
    231                                                        false /*isDef*/,
    232                                                        false /*isImp*/,
    233                                                        false /*isKill*/,
    234                                                        false /*isDead*/,
    235                                                        false /*isUndef*/,
    236                                                        false /*isEarlyClobber*/,
    237                                                        PeepholeSrc.second));
    238             }
    239           }
    240         }
    241       }
    242 
    243       // Look for Predicated instructions.
    244       if (!DisablePNotP) {
    245         bool Done = false;
    246         if (QII->isPredicated(MI)) {
    247           MachineOperand &Op0 = MI->getOperand(0);
    248           unsigned Reg0 = Op0.getReg();
    249           const TargetRegisterClass *RC0 = MRI->getRegClass(Reg0);
    250           if (RC0->getID() == Hexagon::PredRegsRegClassID) {
    251             // Handle instructions that have a prediate register in op0
    252             // (most cases of predicable instructions).
    253             if (TargetRegisterInfo::isVirtualRegister(Reg0)) {
    254               // Try to find in the map.
    255               if (unsigned PeepholeSrc = PeepholeMap.lookup(Reg0)) {
    256                 // Change the 1st operand and, flip the opcode.
    257                 MI->getOperand(0).setReg(PeepholeSrc);
    258                 int NewOp = QII->getInvertedPredicatedOpcode(MI->getOpcode());
    259                 MI->setDesc(QII->get(NewOp));
    260                 Done = true;
    261               }
    262             }
    263           }
    264         }
    265 
    266         if (!Done) {
    267           // Handle special instructions.
    268           unsigned Op = MI->getOpcode();
    269           unsigned NewOp = 0;
    270           unsigned PR = 1, S1 = 2, S2 = 3;   // Operand indices.
    271 
    272           switch (Op) {
    273             case Hexagon::C2_mux:
    274             case Hexagon::C2_muxii:
    275               NewOp = Op;
    276               break;
    277             case Hexagon::C2_muxri:
    278               NewOp = Hexagon::C2_muxir;
    279               break;
    280             case Hexagon::C2_muxir:
    281               NewOp = Hexagon::C2_muxri;
    282               break;
    283           }
    284           if (NewOp) {
    285             unsigned PSrc = MI->getOperand(PR).getReg();
    286             if (unsigned POrig = PeepholeMap.lookup(PSrc)) {
    287               MI->getOperand(PR).setReg(POrig);
    288               MI->setDesc(QII->get(NewOp));
    289               // Swap operands S1 and S2.
    290               MachineOperand Op1 = MI->getOperand(S1);
    291               MachineOperand Op2 = MI->getOperand(S2);
    292               ChangeOpInto(MI->getOperand(S1), Op2);
    293               ChangeOpInto(MI->getOperand(S2), Op1);
    294             }
    295           } // if (NewOp)
    296         } // if (!Done)
    297 
    298       } // if (!DisablePNotP)
    299 
    300     } // Instruction
    301   } // Basic Block
    302   return true;
    303 }
    304 
    305 void HexagonPeephole::ChangeOpInto(MachineOperand &Dst, MachineOperand &Src) {
    306   assert (&Dst != &Src && "Cannot duplicate into itself");
    307   switch (Dst.getType()) {
    308     case MachineOperand::MO_Register:
    309       if (Src.isReg()) {
    310         Dst.setReg(Src.getReg());
    311       } else if (Src.isImm()) {
    312         Dst.ChangeToImmediate(Src.getImm());
    313       } else {
    314         llvm_unreachable("Unexpected src operand type");
    315       }
    316       break;
    317 
    318     case MachineOperand::MO_Immediate:
    319       if (Src.isImm()) {
    320         Dst.setImm(Src.getImm());
    321       } else if (Src.isReg()) {
    322         Dst.ChangeToRegister(Src.getReg(), Src.isDef(), Src.isImplicit(),
    323                              Src.isKill(), Src.isDead(), Src.isUndef(),
    324                              Src.isDebug());
    325       } else {
    326         llvm_unreachable("Unexpected src operand type");
    327       }
    328       break;
    329 
    330     default:
    331       llvm_unreachable("Unexpected dst operand type");
    332       break;
    333   }
    334 }
    335 
    336 FunctionPass *llvm::createHexagonPeephole() {
    337   return new HexagonPeephole();
    338 }
    339