Home | History | Annotate | Download | only in Hexagon
      1 //===-- HexagonPeephole.cpp - Hexagon Peephole Optimizations --------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 // This peephole pass optimizes in the following cases.
      9 // 1. Optimizes redundant sign extends for the following case
     10 //    Transform the following pattern
     11 //    %vreg170<def> = SXTW %vreg166
     12 //    ...
     13 //    %vreg176<def> = COPY %vreg170:subreg_loreg
     14 //
     15 //    Into
     16 //    %vreg176<def> = COPY %vreg166
     17 //
     18 //  2. Optimizes redundant negation of predicates.
     19 //     %vreg15<def> = CMPGTrr %vreg6, %vreg2
     20 //     ...
     21 //     %vreg16<def> = NOT_p %vreg15<kill>
     22 //     ...
     23 //     JMP_c %vreg16<kill>, <BB#1>, %PC<imp-def,dead>
     24 //
     25 //     Into
     26 //     %vreg15<def> = CMPGTrr %vreg6, %vreg2;
     27 //     ...
     28 //     JMP_cNot %vreg15<kill>, <BB#1>, %PC<imp-def,dead>;
     29 //
     30 // Note: The peephole pass makes instructions like
     31 // %vreg170<def> = SXTW %vreg166 or %vreg16<def> = NOT_p %vreg15<kill>
     32 // redundant and relies on some form of dead instruction removal, like
     33 // DCE or DIE, to actually eliminate them.
     34 
     35 
     36 //===----------------------------------------------------------------------===//
     37 
     38 #include "Hexagon.h"
     39 #include "HexagonTargetMachine.h"
     40 #include "llvm/ADT/DenseMap.h"
     41 #include "llvm/ADT/Statistic.h"
     42 #include "llvm/CodeGen/MachineFunction.h"
     43 #include "llvm/CodeGen/MachineFunctionPass.h"
     44 #include "llvm/CodeGen/MachineInstrBuilder.h"
     45 #include "llvm/CodeGen/MachineRegisterInfo.h"
     46 #include "llvm/CodeGen/Passes.h"
     47 #include "llvm/IR/Constants.h"
     48 #include "llvm/PassSupport.h"
     49 #include "llvm/Support/CommandLine.h"
     50 #include "llvm/Support/Debug.h"
     51 #include "llvm/Support/raw_ostream.h"
     52 #include "llvm/Target/TargetInstrInfo.h"
     53 #include "llvm/Target/TargetMachine.h"
     54 #include "llvm/Target/TargetRegisterInfo.h"
     55 #include <algorithm>
     56 
     57 using namespace llvm;
     58 
     59 #define DEBUG_TYPE "hexagon-peephole"
     60 
     61 static cl::opt<bool> DisableHexagonPeephole("disable-hexagon-peephole",
     62     cl::Hidden, cl::ZeroOrMore, cl::init(false),
     63     cl::desc("Disable Peephole Optimization"));
     64 
     65 static cl::opt<bool> DisablePNotP("disable-hexagon-pnotp",
     66     cl::Hidden, cl::ZeroOrMore, cl::init(false),
     67     cl::desc("Disable Optimization of PNotP"));
     68 
     69 static cl::opt<bool> DisableOptSZExt("disable-hexagon-optszext",
     70     cl::Hidden, cl::ZeroOrMore, cl::init(true),
     71     cl::desc("Disable Optimization of Sign/Zero Extends"));
     72 
     73 static cl::opt<bool> DisableOptExtTo64("disable-hexagon-opt-ext-to-64",
     74     cl::Hidden, cl::ZeroOrMore, cl::init(true),
     75     cl::desc("Disable Optimization of extensions to i64."));
     76 
     77 namespace llvm {
     78   FunctionPass *createHexagonPeephole();
     79   void initializeHexagonPeepholePass(PassRegistry&);
     80 }
     81 
     82 namespace {
     83   struct HexagonPeephole : public MachineFunctionPass {
     84     const HexagonInstrInfo    *QII;
     85     const HexagonRegisterInfo *QRI;
     86     const MachineRegisterInfo *MRI;
     87 
     88   public:
     89     static char ID;
     90     HexagonPeephole() : MachineFunctionPass(ID) {
     91       initializeHexagonPeepholePass(*PassRegistry::getPassRegistry());
     92     }
     93 
     94     bool runOnMachineFunction(MachineFunction &MF) override;
     95 
     96     const char *getPassName() const override {
     97       return "Hexagon optimize redundant zero and size extends";
     98     }
     99 
    100     void getAnalysisUsage(AnalysisUsage &AU) const override {
    101       MachineFunctionPass::getAnalysisUsage(AU);
    102     }
    103 
    104   private:
    105     void ChangeOpInto(MachineOperand &Dst, MachineOperand &Src);
    106   };
    107 }
    108 
    109 char HexagonPeephole::ID = 0;
    110 
    111 INITIALIZE_PASS(HexagonPeephole, "hexagon-peephole", "Hexagon Peephole",
    112                 false, false)
    113 
    114 bool HexagonPeephole::runOnMachineFunction(MachineFunction &MF) {
    115   if (skipFunction(*MF.getFunction()))
    116     return false;
    117 
    118   QII = static_cast<const HexagonInstrInfo *>(MF.getSubtarget().getInstrInfo());
    119   QRI = MF.getSubtarget<HexagonSubtarget>().getRegisterInfo();
    120   MRI = &MF.getRegInfo();
    121 
    122   DenseMap<unsigned, unsigned> PeepholeMap;
    123   DenseMap<unsigned, std::pair<unsigned, unsigned> > PeepholeDoubleRegsMap;
    124 
    125   if (DisableHexagonPeephole) return false;
    126 
    127   // Loop over all of the basic blocks.
    128   for (MachineFunction::iterator MBBb = MF.begin(), MBBe = MF.end();
    129        MBBb != MBBe; ++MBBb) {
    130     MachineBasicBlock *MBB = &*MBBb;
    131     PeepholeMap.clear();
    132     PeepholeDoubleRegsMap.clear();
    133 
    134     // Traverse the basic block.
    135     for (MachineInstr &MI : *MBB) {
    136       // Look for sign extends:
    137       // %vreg170<def> = SXTW %vreg166
    138       if (!DisableOptSZExt && MI.getOpcode() == Hexagon::A2_sxtw) {
    139         assert(MI.getNumOperands() == 2);
    140         MachineOperand &Dst = MI.getOperand(0);
    141         MachineOperand &Src = MI.getOperand(1);
    142         unsigned DstReg = Dst.getReg();
    143         unsigned SrcReg = Src.getReg();
    144         // Just handle virtual registers.
    145         if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
    146             TargetRegisterInfo::isVirtualRegister(SrcReg)) {
    147           // Map the following:
    148           // %vreg170<def> = SXTW %vreg166
    149           // PeepholeMap[170] = vreg166
    150           PeepholeMap[DstReg] = SrcReg;
    151         }
    152       }
    153 
    154       // Look for  %vreg170<def> = COMBINE_ir_V4 (0, %vreg169)
    155       // %vreg170:DoublRegs, %vreg169:IntRegs
    156       if (!DisableOptExtTo64 && MI.getOpcode() == Hexagon::A4_combineir) {
    157         assert(MI.getNumOperands() == 3);
    158         MachineOperand &Dst = MI.getOperand(0);
    159         MachineOperand &Src1 = MI.getOperand(1);
    160         MachineOperand &Src2 = MI.getOperand(2);
    161         if (Src1.getImm() != 0)
    162           continue;
    163         unsigned DstReg = Dst.getReg();
    164         unsigned SrcReg = Src2.getReg();
    165         PeepholeMap[DstReg] = SrcReg;
    166       }
    167 
    168       // Look for this sequence below
    169       // %vregDoubleReg1 = LSRd_ri %vregDoubleReg0, 32
    170       // %vregIntReg = COPY %vregDoubleReg1:subreg_loreg.
    171       // and convert into
    172       // %vregIntReg = COPY %vregDoubleReg0:subreg_hireg.
    173       if (MI.getOpcode() == Hexagon::S2_lsr_i_p) {
    174         assert(MI.getNumOperands() == 3);
    175         MachineOperand &Dst = MI.getOperand(0);
    176         MachineOperand &Src1 = MI.getOperand(1);
    177         MachineOperand &Src2 = MI.getOperand(2);
    178         if (Src2.getImm() != 32)
    179           continue;
    180         unsigned DstReg = Dst.getReg();
    181         unsigned SrcReg = Src1.getReg();
    182         PeepholeDoubleRegsMap[DstReg] =
    183           std::make_pair(*&SrcReg, Hexagon::subreg_hireg);
    184       }
    185 
    186       // Look for P=NOT(P).
    187       if (!DisablePNotP && MI.getOpcode() == Hexagon::C2_not) {
    188         assert(MI.getNumOperands() == 2);
    189         MachineOperand &Dst = MI.getOperand(0);
    190         MachineOperand &Src = MI.getOperand(1);
    191         unsigned DstReg = Dst.getReg();
    192         unsigned SrcReg = Src.getReg();
    193         // Just handle virtual registers.
    194         if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
    195             TargetRegisterInfo::isVirtualRegister(SrcReg)) {
    196           // Map the following:
    197           // %vreg170<def> = NOT_xx %vreg166
    198           // PeepholeMap[170] = vreg166
    199           PeepholeMap[DstReg] = SrcReg;
    200         }
    201       }
    202 
    203       // Look for copy:
    204       // %vreg176<def> = COPY %vreg170:subreg_loreg
    205       if (!DisableOptSZExt && MI.isCopy()) {
    206         assert(MI.getNumOperands() == 2);
    207         MachineOperand &Dst = MI.getOperand(0);
    208         MachineOperand &Src = MI.getOperand(1);
    209 
    210         // Make sure we are copying the lower 32 bits.
    211         if (Src.getSubReg() != Hexagon::subreg_loreg)
    212           continue;
    213 
    214         unsigned DstReg = Dst.getReg();
    215         unsigned SrcReg = Src.getReg();
    216         if (TargetRegisterInfo::isVirtualRegister(DstReg) &&
    217             TargetRegisterInfo::isVirtualRegister(SrcReg)) {
    218           // Try to find in the map.
    219           if (unsigned PeepholeSrc = PeepholeMap.lookup(SrcReg)) {
    220             // Change the 1st operand.
    221             MI.RemoveOperand(1);
    222             MI.addOperand(MachineOperand::CreateReg(PeepholeSrc, false));
    223           } else  {
    224             DenseMap<unsigned, std::pair<unsigned, unsigned> >::iterator DI =
    225               PeepholeDoubleRegsMap.find(SrcReg);
    226             if (DI != PeepholeDoubleRegsMap.end()) {
    227               std::pair<unsigned,unsigned> PeepholeSrc = DI->second;
    228               MI.RemoveOperand(1);
    229               MI.addOperand(MachineOperand::CreateReg(
    230                   PeepholeSrc.first, false /*isDef*/, false /*isImp*/,
    231                   false /*isKill*/, false /*isDead*/, false /*isUndef*/,
    232                   false /*isEarlyClobber*/, PeepholeSrc.second));
    233             }
    234           }
    235         }
    236       }
    237 
    238       // Look for Predicated instructions.
    239       if (!DisablePNotP) {
    240         bool Done = false;
    241         if (QII->isPredicated(MI)) {
    242           MachineOperand &Op0 = MI.getOperand(0);
    243           unsigned Reg0 = Op0.getReg();
    244           const TargetRegisterClass *RC0 = MRI->getRegClass(Reg0);
    245           if (RC0->getID() == Hexagon::PredRegsRegClassID) {
    246             // Handle instructions that have a prediate register in op0
    247             // (most cases of predicable instructions).
    248             if (TargetRegisterInfo::isVirtualRegister(Reg0)) {
    249               // Try to find in the map.
    250               if (unsigned PeepholeSrc = PeepholeMap.lookup(Reg0)) {
    251                 // Change the 1st operand and, flip the opcode.
    252                 MI.getOperand(0).setReg(PeepholeSrc);
    253                 int NewOp = QII->getInvertedPredicatedOpcode(MI.getOpcode());
    254                 MI.setDesc(QII->get(NewOp));
    255                 Done = true;
    256               }
    257             }
    258           }
    259         }
    260 
    261         if (!Done) {
    262           // Handle special instructions.
    263           unsigned Op = MI.getOpcode();
    264           unsigned NewOp = 0;
    265           unsigned PR = 1, S1 = 2, S2 = 3;   // Operand indices.
    266 
    267           switch (Op) {
    268             case Hexagon::C2_mux:
    269             case Hexagon::C2_muxii:
    270               NewOp = Op;
    271               break;
    272             case Hexagon::C2_muxri:
    273               NewOp = Hexagon::C2_muxir;
    274               break;
    275             case Hexagon::C2_muxir:
    276               NewOp = Hexagon::C2_muxri;
    277               break;
    278           }
    279           if (NewOp) {
    280             unsigned PSrc = MI.getOperand(PR).getReg();
    281             if (unsigned POrig = PeepholeMap.lookup(PSrc)) {
    282               MI.getOperand(PR).setReg(POrig);
    283               MI.setDesc(QII->get(NewOp));
    284               // Swap operands S1 and S2.
    285               MachineOperand Op1 = MI.getOperand(S1);
    286               MachineOperand Op2 = MI.getOperand(S2);
    287               ChangeOpInto(MI.getOperand(S1), Op2);
    288               ChangeOpInto(MI.getOperand(S2), Op1);
    289             }
    290           } // if (NewOp)
    291         } // if (!Done)
    292 
    293       } // if (!DisablePNotP)
    294 
    295     } // Instruction
    296   } // Basic Block
    297   return true;
    298 }
    299 
    300 void HexagonPeephole::ChangeOpInto(MachineOperand &Dst, MachineOperand &Src) {
    301   assert (&Dst != &Src && "Cannot duplicate into itself");
    302   switch (Dst.getType()) {
    303     case MachineOperand::MO_Register:
    304       if (Src.isReg()) {
    305         Dst.setReg(Src.getReg());
    306         Dst.setSubReg(Src.getSubReg());
    307       } else if (Src.isImm()) {
    308         Dst.ChangeToImmediate(Src.getImm());
    309       } else {
    310         llvm_unreachable("Unexpected src operand type");
    311       }
    312       break;
    313 
    314     case MachineOperand::MO_Immediate:
    315       if (Src.isImm()) {
    316         Dst.setImm(Src.getImm());
    317       } else if (Src.isReg()) {
    318         Dst.ChangeToRegister(Src.getReg(), Src.isDef(), Src.isImplicit(),
    319                              Src.isKill(), Src.isDead(), Src.isUndef(),
    320                              Src.isDebug());
    321         Dst.setSubReg(Src.getSubReg());
    322       } else {
    323         llvm_unreachable("Unexpected src operand type");
    324       }
    325       break;
    326 
    327     default:
    328       llvm_unreachable("Unexpected dst operand type");
    329       break;
    330   }
    331 }
    332 
    333 FunctionPass *llvm::createHexagonPeephole() {
    334   return new HexagonPeephole();
    335 }
    336