Home | History | Annotate | Download | only in ARM
      1 //===-- ARMExpandPseudoInsts.cpp - Expand pseudo instructions -------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This file contains a pass that expands pseudo instructions into target
     11 // instructions to allow proper scheduling, if-conversion, and other late
     12 // optimizations. This pass should be run after register allocation but before
     13 // the post-regalloc scheduling pass.
     14 //
     15 //===----------------------------------------------------------------------===//
     16 
     17 #define DEBUG_TYPE "arm-pseudo"
     18 #include "ARM.h"
     19 #include "ARMBaseInstrInfo.h"
     20 #include "ARMBaseRegisterInfo.h"
     21 #include "ARMMachineFunctionInfo.h"
     22 #include "MCTargetDesc/ARMAddressingModes.h"
     23 #include "llvm/CodeGen/MachineFrameInfo.h"
     24 #include "llvm/CodeGen/MachineFunctionPass.h"
     25 #include "llvm/CodeGen/MachineInstrBuilder.h"
     26 #include "llvm/Target/TargetFrameLowering.h"
     27 #include "llvm/Target/TargetRegisterInfo.h"
     28 #include "llvm/Support/CommandLine.h"
     29 #include "llvm/Support/raw_ostream.h" // FIXME: for debug only. remove!
     30 using namespace llvm;
     31 
     32 static cl::opt<bool>
     33 VerifyARMPseudo("verify-arm-pseudo-expand", cl::Hidden,
     34                 cl::desc("Verify machine code after expanding ARM pseudos"));
     35 
     36 namespace {
     37   class ARMExpandPseudo : public MachineFunctionPass {
     38   public:
     39     static char ID;
     40     ARMExpandPseudo() : MachineFunctionPass(ID) {}
     41 
     42     const ARMBaseInstrInfo *TII;
     43     const TargetRegisterInfo *TRI;
     44     const ARMSubtarget *STI;
     45     ARMFunctionInfo *AFI;
     46 
     47     virtual bool runOnMachineFunction(MachineFunction &Fn);
     48 
     49     virtual const char *getPassName() const {
     50       return "ARM pseudo instruction expansion pass";
     51     }
     52 
     53   private:
     54     void TransferImpOps(MachineInstr &OldMI,
     55                         MachineInstrBuilder &UseMI, MachineInstrBuilder &DefMI);
     56     bool ExpandMI(MachineBasicBlock &MBB,
     57                   MachineBasicBlock::iterator MBBI);
     58     bool ExpandMBB(MachineBasicBlock &MBB);
     59     void ExpandVLD(MachineBasicBlock::iterator &MBBI);
     60     void ExpandVST(MachineBasicBlock::iterator &MBBI);
     61     void ExpandLaneOp(MachineBasicBlock::iterator &MBBI);
     62     void ExpandVTBL(MachineBasicBlock::iterator &MBBI,
     63                     unsigned Opc, bool IsExt);
     64     void ExpandMOV32BitImm(MachineBasicBlock &MBB,
     65                            MachineBasicBlock::iterator &MBBI);
     66   };
     67   char ARMExpandPseudo::ID = 0;
     68 }
     69 
     70 /// TransferImpOps - Transfer implicit operands on the pseudo instruction to
     71 /// the instructions created from the expansion.
     72 void ARMExpandPseudo::TransferImpOps(MachineInstr &OldMI,
     73                                      MachineInstrBuilder &UseMI,
     74                                      MachineInstrBuilder &DefMI) {
     75   const MCInstrDesc &Desc = OldMI.getDesc();
     76   for (unsigned i = Desc.getNumOperands(), e = OldMI.getNumOperands();
     77        i != e; ++i) {
     78     const MachineOperand &MO = OldMI.getOperand(i);
     79     assert(MO.isReg() && MO.getReg());
     80     if (MO.isUse())
     81       UseMI.addOperand(MO);
     82     else
     83       DefMI.addOperand(MO);
     84   }
     85 }
     86 
     87 namespace {
     88   // Constants for register spacing in NEON load/store instructions.
     89   // For quad-register load-lane and store-lane pseudo instructors, the
     90   // spacing is initially assumed to be EvenDblSpc, and that is changed to
     91   // OddDblSpc depending on the lane number operand.
     92   enum NEONRegSpacing {
     93     SingleSpc,
     94     EvenDblSpc,
     95     OddDblSpc
     96   };
     97 
     98   // Entries for NEON load/store information table.  The table is sorted by
     99   // PseudoOpc for fast binary-search lookups.
    100   struct NEONLdStTableEntry {
    101     uint16_t PseudoOpc;
    102     uint16_t RealOpc;
    103     bool IsLoad;
    104     bool isUpdating;
    105     bool hasWritebackOperand;
    106     NEONRegSpacing RegSpacing;
    107     unsigned char NumRegs; // D registers loaded or stored
    108     unsigned char RegElts; // elements per D register; used for lane ops
    109     // FIXME: Temporary flag to denote whether the real instruction takes
    110     // a single register (like the encoding) or all of the registers in
    111     // the list (like the asm syntax and the isel DAG). When all definitions
    112     // are converted to take only the single encoded register, this will
    113     // go away.
    114     bool copyAllListRegs;
    115 
    116     // Comparison methods for binary search of the table.
    117     bool operator<(const NEONLdStTableEntry &TE) const {
    118       return PseudoOpc < TE.PseudoOpc;
    119     }
    120     friend bool operator<(const NEONLdStTableEntry &TE, unsigned PseudoOpc) {
    121       return TE.PseudoOpc < PseudoOpc;
    122     }
    123     friend bool LLVM_ATTRIBUTE_UNUSED operator<(unsigned PseudoOpc,
    124                                                 const NEONLdStTableEntry &TE) {
    125       return PseudoOpc < TE.PseudoOpc;
    126     }
    127   };
    128 }
    129 
    130 static const NEONLdStTableEntry NEONLdStTable[] = {
    131 { ARM::VLD1LNq16Pseudo,     ARM::VLD1LNd16,     true, false, false, EvenDblSpc, 1, 4 ,true},
    132 { ARM::VLD1LNq16Pseudo_UPD, ARM::VLD1LNd16_UPD, true, true, true,  EvenDblSpc, 1, 4 ,true},
    133 { ARM::VLD1LNq32Pseudo,     ARM::VLD1LNd32,     true, false, false, EvenDblSpc, 1, 2 ,true},
    134 { ARM::VLD1LNq32Pseudo_UPD, ARM::VLD1LNd32_UPD, true, true, true,  EvenDblSpc, 1, 2 ,true},
    135 { ARM::VLD1LNq8Pseudo,      ARM::VLD1LNd8,      true, false, false, EvenDblSpc, 1, 8 ,true},
    136 { ARM::VLD1LNq8Pseudo_UPD,  ARM::VLD1LNd8_UPD, true, true, true,  EvenDblSpc, 1, 8 ,true},
    137 
    138 { ARM::VLD1d64QPseudo,      ARM::VLD1d64Q,     true,  false, false, SingleSpc,  4, 1 ,false},
    139 { ARM::VLD1d64TPseudo,      ARM::VLD1d64T,     true,  false, false, SingleSpc,  3, 1 ,false},
    140 
    141 { ARM::VLD2LNd16Pseudo,     ARM::VLD2LNd16,     true, false, false, SingleSpc,  2, 4 ,true},
    142 { ARM::VLD2LNd16Pseudo_UPD, ARM::VLD2LNd16_UPD, true, true, true,  SingleSpc,  2, 4 ,true},
    143 { ARM::VLD2LNd32Pseudo,     ARM::VLD2LNd32,     true, false, false, SingleSpc,  2, 2 ,true},
    144 { ARM::VLD2LNd32Pseudo_UPD, ARM::VLD2LNd32_UPD, true, true, true,  SingleSpc,  2, 2 ,true},
    145 { ARM::VLD2LNd8Pseudo,      ARM::VLD2LNd8,      true, false, false, SingleSpc,  2, 8 ,true},
    146 { ARM::VLD2LNd8Pseudo_UPD,  ARM::VLD2LNd8_UPD, true, true, true,  SingleSpc,  2, 8 ,true},
    147 { ARM::VLD2LNq16Pseudo,     ARM::VLD2LNq16,     true, false, false, EvenDblSpc, 2, 4 ,true},
    148 { ARM::VLD2LNq16Pseudo_UPD, ARM::VLD2LNq16_UPD, true, true, true,  EvenDblSpc, 2, 4 ,true},
    149 { ARM::VLD2LNq32Pseudo,     ARM::VLD2LNq32,     true, false, false, EvenDblSpc, 2, 2 ,true},
    150 { ARM::VLD2LNq32Pseudo_UPD, ARM::VLD2LNq32_UPD, true, true, true,  EvenDblSpc, 2, 2 ,true},
    151 
    152 { ARM::VLD2q16Pseudo,       ARM::VLD2q16,      true,  false, false, SingleSpc,  4, 4 ,false},
    153 { ARM::VLD2q16PseudoWB_fixed,   ARM::VLD2q16wb_fixed, true, true, false,  SingleSpc,  4, 4 ,false},
    154 { ARM::VLD2q16PseudoWB_register,   ARM::VLD2q16wb_register, true, true, true,  SingleSpc,  4, 4 ,false},
    155 { ARM::VLD2q32Pseudo,       ARM::VLD2q32,      true,  false, false, SingleSpc,  4, 2 ,false},
    156 { ARM::VLD2q32PseudoWB_fixed,   ARM::VLD2q32wb_fixed, true, true, false,  SingleSpc,  4, 2 ,false},
    157 { ARM::VLD2q32PseudoWB_register,   ARM::VLD2q32wb_register, true, true, true,  SingleSpc,  4, 2 ,false},
    158 { ARM::VLD2q8Pseudo,        ARM::VLD2q8,       true,  false, false, SingleSpc,  4, 8 ,false},
    159 { ARM::VLD2q8PseudoWB_fixed,    ARM::VLD2q8wb_fixed, true, true, false,  SingleSpc,  4, 8 ,false},
    160 { ARM::VLD2q8PseudoWB_register,    ARM::VLD2q8wb_register, true, true, true,  SingleSpc,  4, 8 ,false},
    161 
    162 { ARM::VLD3DUPd16Pseudo,     ARM::VLD3DUPd16,     true, false, false, SingleSpc, 3, 4,true},
    163 { ARM::VLD3DUPd16Pseudo_UPD, ARM::VLD3DUPd16_UPD, true, true, true,  SingleSpc, 3, 4,true},
    164 { ARM::VLD3DUPd32Pseudo,     ARM::VLD3DUPd32,     true, false, false, SingleSpc, 3, 2,true},
    165 { ARM::VLD3DUPd32Pseudo_UPD, ARM::VLD3DUPd32_UPD, true, true, true,  SingleSpc, 3, 2,true},
    166 { ARM::VLD3DUPd8Pseudo,      ARM::VLD3DUPd8,      true, false, false, SingleSpc, 3, 8,true},
    167 { ARM::VLD3DUPd8Pseudo_UPD,  ARM::VLD3DUPd8_UPD, true, true, true,  SingleSpc, 3, 8,true},
    168 
    169 { ARM::VLD3LNd16Pseudo,     ARM::VLD3LNd16,     true, false, false, SingleSpc,  3, 4 ,true},
    170 { ARM::VLD3LNd16Pseudo_UPD, ARM::VLD3LNd16_UPD, true, true, true,  SingleSpc,  3, 4 ,true},
    171 { ARM::VLD3LNd32Pseudo,     ARM::VLD3LNd32,     true, false, false, SingleSpc,  3, 2 ,true},
    172 { ARM::VLD3LNd32Pseudo_UPD, ARM::VLD3LNd32_UPD, true, true, true,  SingleSpc,  3, 2 ,true},
    173 { ARM::VLD3LNd8Pseudo,      ARM::VLD3LNd8,      true, false, false, SingleSpc,  3, 8 ,true},
    174 { ARM::VLD3LNd8Pseudo_UPD,  ARM::VLD3LNd8_UPD, true, true, true,  SingleSpc,  3, 8 ,true},
    175 { ARM::VLD3LNq16Pseudo,     ARM::VLD3LNq16,     true, false, false, EvenDblSpc, 3, 4 ,true},
    176 { ARM::VLD3LNq16Pseudo_UPD, ARM::VLD3LNq16_UPD, true, true, true,  EvenDblSpc, 3, 4 ,true},
    177 { ARM::VLD3LNq32Pseudo,     ARM::VLD3LNq32,     true, false, false, EvenDblSpc, 3, 2 ,true},
    178 { ARM::VLD3LNq32Pseudo_UPD, ARM::VLD3LNq32_UPD, true, true, true,  EvenDblSpc, 3, 2 ,true},
    179 
    180 { ARM::VLD3d16Pseudo,       ARM::VLD3d16,      true,  false, false, SingleSpc,  3, 4 ,true},
    181 { ARM::VLD3d16Pseudo_UPD,   ARM::VLD3d16_UPD, true, true, true,  SingleSpc,  3, 4 ,true},
    182 { ARM::VLD3d32Pseudo,       ARM::VLD3d32,      true,  false, false, SingleSpc,  3, 2 ,true},
    183 { ARM::VLD3d32Pseudo_UPD,   ARM::VLD3d32_UPD, true, true, true,  SingleSpc,  3, 2 ,true},
    184 { ARM::VLD3d8Pseudo,        ARM::VLD3d8,       true,  false, false, SingleSpc,  3, 8 ,true},
    185 { ARM::VLD3d8Pseudo_UPD,    ARM::VLD3d8_UPD, true, true, true,  SingleSpc,  3, 8 ,true},
    186 
    187 { ARM::VLD3q16Pseudo_UPD,    ARM::VLD3q16_UPD, true, true, true,  EvenDblSpc, 3, 4 ,true},
    188 { ARM::VLD3q16oddPseudo,     ARM::VLD3q16,     true,  false, false, OddDblSpc,  3, 4 ,true},
    189 { ARM::VLD3q16oddPseudo_UPD, ARM::VLD3q16_UPD, true, true, true,  OddDblSpc,  3, 4 ,true},
    190 { ARM::VLD3q32Pseudo_UPD,    ARM::VLD3q32_UPD, true, true, true,  EvenDblSpc, 3, 2 ,true},
    191 { ARM::VLD3q32oddPseudo,     ARM::VLD3q32,     true,  false, false, OddDblSpc,  3, 2 ,true},
    192 { ARM::VLD3q32oddPseudo_UPD, ARM::VLD3q32_UPD, true, true, true,  OddDblSpc,  3, 2 ,true},
    193 { ARM::VLD3q8Pseudo_UPD,     ARM::VLD3q8_UPD, true, true, true,  EvenDblSpc, 3, 8 ,true},
    194 { ARM::VLD3q8oddPseudo,      ARM::VLD3q8,      true,  false, false, OddDblSpc,  3, 8 ,true},
    195 { ARM::VLD3q8oddPseudo_UPD,  ARM::VLD3q8_UPD, true, true, true,  OddDblSpc,  3, 8 ,true},
    196 
    197 { ARM::VLD4DUPd16Pseudo,     ARM::VLD4DUPd16,     true, false, false, SingleSpc, 4, 4,true},
    198 { ARM::VLD4DUPd16Pseudo_UPD, ARM::VLD4DUPd16_UPD, true, true, true,  SingleSpc, 4, 4,true},
    199 { ARM::VLD4DUPd32Pseudo,     ARM::VLD4DUPd32,     true, false, false, SingleSpc, 4, 2,true},
    200 { ARM::VLD4DUPd32Pseudo_UPD, ARM::VLD4DUPd32_UPD, true, true, true,  SingleSpc, 4, 2,true},
    201 { ARM::VLD4DUPd8Pseudo,      ARM::VLD4DUPd8,      true, false, false, SingleSpc, 4, 8,true},
    202 { ARM::VLD4DUPd8Pseudo_UPD,  ARM::VLD4DUPd8_UPD, true, true, true,  SingleSpc, 4, 8,true},
    203 
    204 { ARM::VLD4LNd16Pseudo,     ARM::VLD4LNd16,     true, false, false, SingleSpc,  4, 4 ,true},
    205 { ARM::VLD4LNd16Pseudo_UPD, ARM::VLD4LNd16_UPD, true, true, true,  SingleSpc,  4, 4 ,true},
    206 { ARM::VLD4LNd32Pseudo,     ARM::VLD4LNd32,     true, false, false, SingleSpc,  4, 2 ,true},
    207 { ARM::VLD4LNd32Pseudo_UPD, ARM::VLD4LNd32_UPD, true, true, true,  SingleSpc,  4, 2 ,true},
    208 { ARM::VLD4LNd8Pseudo,      ARM::VLD4LNd8,      true, false, false, SingleSpc,  4, 8 ,true},
    209 { ARM::VLD4LNd8Pseudo_UPD,  ARM::VLD4LNd8_UPD, true, true, true,  SingleSpc,  4, 8 ,true},
    210 { ARM::VLD4LNq16Pseudo,     ARM::VLD4LNq16,     true, false, false, EvenDblSpc, 4, 4 ,true},
    211 { ARM::VLD4LNq16Pseudo_UPD, ARM::VLD4LNq16_UPD, true, true, true,  EvenDblSpc, 4, 4 ,true},
    212 { ARM::VLD4LNq32Pseudo,     ARM::VLD4LNq32,     true, false, false, EvenDblSpc, 4, 2 ,true},
    213 { ARM::VLD4LNq32Pseudo_UPD, ARM::VLD4LNq32_UPD, true, true, true,  EvenDblSpc, 4, 2 ,true},
    214 
    215 { ARM::VLD4d16Pseudo,       ARM::VLD4d16,      true,  false, false, SingleSpc,  4, 4 ,true},
    216 { ARM::VLD4d16Pseudo_UPD,   ARM::VLD4d16_UPD, true, true, true,  SingleSpc,  4, 4 ,true},
    217 { ARM::VLD4d32Pseudo,       ARM::VLD4d32,      true,  false, false, SingleSpc,  4, 2 ,true},
    218 { ARM::VLD4d32Pseudo_UPD,   ARM::VLD4d32_UPD, true, true, true,  SingleSpc,  4, 2 ,true},
    219 { ARM::VLD4d8Pseudo,        ARM::VLD4d8,       true,  false, false, SingleSpc,  4, 8 ,true},
    220 { ARM::VLD4d8Pseudo_UPD,    ARM::VLD4d8_UPD, true, true, true,  SingleSpc,  4, 8 ,true},
    221 
    222 { ARM::VLD4q16Pseudo_UPD,    ARM::VLD4q16_UPD, true, true, true,  EvenDblSpc, 4, 4 ,true},
    223 { ARM::VLD4q16oddPseudo,     ARM::VLD4q16,     true,  false, false, OddDblSpc,  4, 4 ,true},
    224 { ARM::VLD4q16oddPseudo_UPD, ARM::VLD4q16_UPD, true, true, true,  OddDblSpc,  4, 4 ,true},
    225 { ARM::VLD4q32Pseudo_UPD,    ARM::VLD4q32_UPD, true, true, true,  EvenDblSpc, 4, 2 ,true},
    226 { ARM::VLD4q32oddPseudo,     ARM::VLD4q32,     true,  false, false, OddDblSpc,  4, 2 ,true},
    227 { ARM::VLD4q32oddPseudo_UPD, ARM::VLD4q32_UPD, true, true, true,  OddDblSpc,  4, 2 ,true},
    228 { ARM::VLD4q8Pseudo_UPD,     ARM::VLD4q8_UPD, true, true, true,  EvenDblSpc, 4, 8 ,true},
    229 { ARM::VLD4q8oddPseudo,      ARM::VLD4q8,      true,  false, false, OddDblSpc,  4, 8 ,true},
    230 { ARM::VLD4q8oddPseudo_UPD,  ARM::VLD4q8_UPD, true, true, true,  OddDblSpc,  4, 8 ,true},
    231 
    232 { ARM::VST1LNq16Pseudo,     ARM::VST1LNd16,    false, false, false, EvenDblSpc, 1, 4 ,true},
    233 { ARM::VST1LNq16Pseudo_UPD, ARM::VST1LNd16_UPD, false, true, true,  EvenDblSpc, 1, 4 ,true},
    234 { ARM::VST1LNq32Pseudo,     ARM::VST1LNd32,    false, false, false, EvenDblSpc, 1, 2 ,true},
    235 { ARM::VST1LNq32Pseudo_UPD, ARM::VST1LNd32_UPD, false, true, true,  EvenDblSpc, 1, 2 ,true},
    236 { ARM::VST1LNq8Pseudo,      ARM::VST1LNd8,     false, false, false, EvenDblSpc, 1, 8 ,true},
    237 { ARM::VST1LNq8Pseudo_UPD,  ARM::VST1LNd8_UPD, false, true, true,  EvenDblSpc, 1, 8 ,true},
    238 
    239 { ARM::VST1d64QPseudo,      ARM::VST1d64Q,     false, false, false, SingleSpc,  4, 1 ,false},
    240 { ARM::VST1d64QPseudoWB_fixed,  ARM::VST1d64Qwb_fixed, false, true, false,  SingleSpc,  4, 1 ,false},
    241 { ARM::VST1d64QPseudoWB_register, ARM::VST1d64Qwb_register, false, true, true,  SingleSpc,  4, 1 ,false},
    242 { ARM::VST1d64TPseudo,      ARM::VST1d64T,     false, false, false, SingleSpc,  3, 1 ,false},
    243 { ARM::VST1d64TPseudoWB_fixed,  ARM::VST1d64Twb_fixed, false, true, false,  SingleSpc,  3, 1 ,false},
    244 { ARM::VST1d64TPseudoWB_register,  ARM::VST1d64Twb_register, false, true, true,  SingleSpc,  3, 1 ,false},
    245 
    246 { ARM::VST2LNd16Pseudo,     ARM::VST2LNd16,     false, false, false, SingleSpc, 2, 4 ,true},
    247 { ARM::VST2LNd16Pseudo_UPD, ARM::VST2LNd16_UPD, false, true, true,  SingleSpc, 2, 4 ,true},
    248 { ARM::VST2LNd32Pseudo,     ARM::VST2LNd32,     false, false, false, SingleSpc, 2, 2 ,true},
    249 { ARM::VST2LNd32Pseudo_UPD, ARM::VST2LNd32_UPD, false, true, true,  SingleSpc, 2, 2 ,true},
    250 { ARM::VST2LNd8Pseudo,      ARM::VST2LNd8,      false, false, false, SingleSpc, 2, 8 ,true},
    251 { ARM::VST2LNd8Pseudo_UPD,  ARM::VST2LNd8_UPD, false, true, true,  SingleSpc, 2, 8 ,true},
    252 { ARM::VST2LNq16Pseudo,     ARM::VST2LNq16,     false, false, false, EvenDblSpc, 2, 4,true},
    253 { ARM::VST2LNq16Pseudo_UPD, ARM::VST2LNq16_UPD, false, true, true,  EvenDblSpc, 2, 4,true},
    254 { ARM::VST2LNq32Pseudo,     ARM::VST2LNq32,     false, false, false, EvenDblSpc, 2, 2,true},
    255 { ARM::VST2LNq32Pseudo_UPD, ARM::VST2LNq32_UPD, false, true, true,  EvenDblSpc, 2, 2,true},
    256 
    257 { ARM::VST2q16Pseudo,       ARM::VST2q16,      false, false, false, SingleSpc,  4, 4 ,false},
    258 { ARM::VST2q16PseudoWB_fixed,   ARM::VST2q16wb_fixed, false, true, false,  SingleSpc,  4, 4 ,false},
    259 { ARM::VST2q16PseudoWB_register,   ARM::VST2q16wb_register, false, true, true,  SingleSpc,  4, 4 ,false},
    260 { ARM::VST2q32Pseudo,       ARM::VST2q32,      false, false, false, SingleSpc,  4, 2 ,false},
    261 { ARM::VST2q32PseudoWB_fixed,   ARM::VST2q32wb_fixed, false, true, false,  SingleSpc,  4, 2 ,false},
    262 { ARM::VST2q32PseudoWB_register,   ARM::VST2q32wb_register, false, true, true,  SingleSpc,  4, 2 ,false},
    263 { ARM::VST2q8Pseudo,        ARM::VST2q8,       false, false, false, SingleSpc,  4, 8 ,false},
    264 { ARM::VST2q8PseudoWB_fixed,    ARM::VST2q8wb_fixed, false, true, false,  SingleSpc,  4, 8 ,false},
    265 { ARM::VST2q8PseudoWB_register,    ARM::VST2q8wb_register, false, true, true,  SingleSpc,  4, 8 ,false},
    266 
    267 { ARM::VST3LNd16Pseudo,     ARM::VST3LNd16,     false, false, false, SingleSpc, 3, 4 ,true},
    268 { ARM::VST3LNd16Pseudo_UPD, ARM::VST3LNd16_UPD, false, true, true,  SingleSpc, 3, 4 ,true},
    269 { ARM::VST3LNd32Pseudo,     ARM::VST3LNd32,     false, false, false, SingleSpc, 3, 2 ,true},
    270 { ARM::VST3LNd32Pseudo_UPD, ARM::VST3LNd32_UPD, false, true, true,  SingleSpc, 3, 2 ,true},
    271 { ARM::VST3LNd8Pseudo,      ARM::VST3LNd8,      false, false, false, SingleSpc, 3, 8 ,true},
    272 { ARM::VST3LNd8Pseudo_UPD,  ARM::VST3LNd8_UPD, false, true, true,  SingleSpc, 3, 8 ,true},
    273 { ARM::VST3LNq16Pseudo,     ARM::VST3LNq16,     false, false, false, EvenDblSpc, 3, 4,true},
    274 { ARM::VST3LNq16Pseudo_UPD, ARM::VST3LNq16_UPD, false, true, true,  EvenDblSpc, 3, 4,true},
    275 { ARM::VST3LNq32Pseudo,     ARM::VST3LNq32,     false, false, false, EvenDblSpc, 3, 2,true},
    276 { ARM::VST3LNq32Pseudo_UPD, ARM::VST3LNq32_UPD, false, true, true,  EvenDblSpc, 3, 2,true},
    277 
    278 { ARM::VST3d16Pseudo,       ARM::VST3d16,      false, false, false, SingleSpc,  3, 4 ,true},
    279 { ARM::VST3d16Pseudo_UPD,   ARM::VST3d16_UPD, false, true, true,  SingleSpc,  3, 4 ,true},
    280 { ARM::VST3d32Pseudo,       ARM::VST3d32,      false, false, false, SingleSpc,  3, 2 ,true},
    281 { ARM::VST3d32Pseudo_UPD,   ARM::VST3d32_UPD, false, true, true,  SingleSpc,  3, 2 ,true},
    282 { ARM::VST3d8Pseudo,        ARM::VST3d8,       false, false, false, SingleSpc,  3, 8 ,true},
    283 { ARM::VST3d8Pseudo_UPD,    ARM::VST3d8_UPD, false, true, true,  SingleSpc,  3, 8 ,true},
    284 
    285 { ARM::VST3q16Pseudo_UPD,    ARM::VST3q16_UPD, false, true, true,  EvenDblSpc, 3, 4 ,true},
    286 { ARM::VST3q16oddPseudo,     ARM::VST3q16,     false, false, false, OddDblSpc,  3, 4 ,true},
    287 { ARM::VST3q16oddPseudo_UPD, ARM::VST3q16_UPD, false, true, true,  OddDblSpc,  3, 4 ,true},
    288 { ARM::VST3q32Pseudo_UPD,    ARM::VST3q32_UPD, false, true, true,  EvenDblSpc, 3, 2 ,true},
    289 { ARM::VST3q32oddPseudo,     ARM::VST3q32,     false, false, false, OddDblSpc,  3, 2 ,true},
    290 { ARM::VST3q32oddPseudo_UPD, ARM::VST3q32_UPD, false, true, true,  OddDblSpc,  3, 2 ,true},
    291 { ARM::VST3q8Pseudo_UPD,     ARM::VST3q8_UPD, false, true, true,  EvenDblSpc, 3, 8 ,true},
    292 { ARM::VST3q8oddPseudo,      ARM::VST3q8,      false, false, false, OddDblSpc,  3, 8 ,true},
    293 { ARM::VST3q8oddPseudo_UPD,  ARM::VST3q8_UPD, false, true, true,  OddDblSpc,  3, 8 ,true},
    294 
    295 { ARM::VST4LNd16Pseudo,     ARM::VST4LNd16,     false, false, false, SingleSpc, 4, 4 ,true},
    296 { ARM::VST4LNd16Pseudo_UPD, ARM::VST4LNd16_UPD, false, true, true,  SingleSpc, 4, 4 ,true},
    297 { ARM::VST4LNd32Pseudo,     ARM::VST4LNd32,     false, false, false, SingleSpc, 4, 2 ,true},
    298 { ARM::VST4LNd32Pseudo_UPD, ARM::VST4LNd32_UPD, false, true, true,  SingleSpc, 4, 2 ,true},
    299 { ARM::VST4LNd8Pseudo,      ARM::VST4LNd8,      false, false, false, SingleSpc, 4, 8 ,true},
    300 { ARM::VST4LNd8Pseudo_UPD,  ARM::VST4LNd8_UPD, false, true, true,  SingleSpc, 4, 8 ,true},
    301 { ARM::VST4LNq16Pseudo,     ARM::VST4LNq16,     false, false, false, EvenDblSpc, 4, 4,true},
    302 { ARM::VST4LNq16Pseudo_UPD, ARM::VST4LNq16_UPD, false, true, true,  EvenDblSpc, 4, 4,true},
    303 { ARM::VST4LNq32Pseudo,     ARM::VST4LNq32,     false, false, false, EvenDblSpc, 4, 2,true},
    304 { ARM::VST4LNq32Pseudo_UPD, ARM::VST4LNq32_UPD, false, true, true,  EvenDblSpc, 4, 2,true},
    305 
    306 { ARM::VST4d16Pseudo,       ARM::VST4d16,      false, false, false, SingleSpc,  4, 4 ,true},
    307 { ARM::VST4d16Pseudo_UPD,   ARM::VST4d16_UPD, false, true, true,  SingleSpc,  4, 4 ,true},
    308 { ARM::VST4d32Pseudo,       ARM::VST4d32,      false, false, false, SingleSpc,  4, 2 ,true},
    309 { ARM::VST4d32Pseudo_UPD,   ARM::VST4d32_UPD, false, true, true,  SingleSpc,  4, 2 ,true},
    310 { ARM::VST4d8Pseudo,        ARM::VST4d8,       false, false, false, SingleSpc,  4, 8 ,true},
    311 { ARM::VST4d8Pseudo_UPD,    ARM::VST4d8_UPD, false, true, true,  SingleSpc,  4, 8 ,true},
    312 
    313 { ARM::VST4q16Pseudo_UPD,    ARM::VST4q16_UPD, false, true, true,  EvenDblSpc, 4, 4 ,true},
    314 { ARM::VST4q16oddPseudo,     ARM::VST4q16,     false, false, false, OddDblSpc,  4, 4 ,true},
    315 { ARM::VST4q16oddPseudo_UPD, ARM::VST4q16_UPD, false, true, true,  OddDblSpc,  4, 4 ,true},
    316 { ARM::VST4q32Pseudo_UPD,    ARM::VST4q32_UPD, false, true, true,  EvenDblSpc, 4, 2 ,true},
    317 { ARM::VST4q32oddPseudo,     ARM::VST4q32,     false, false, false, OddDblSpc,  4, 2 ,true},
    318 { ARM::VST4q32oddPseudo_UPD, ARM::VST4q32_UPD, false, true, true,  OddDblSpc,  4, 2 ,true},
    319 { ARM::VST4q8Pseudo_UPD,     ARM::VST4q8_UPD, false, true, true,  EvenDblSpc, 4, 8 ,true},
    320 { ARM::VST4q8oddPseudo,      ARM::VST4q8,      false, false, false, OddDblSpc,  4, 8 ,true},
    321 { ARM::VST4q8oddPseudo_UPD,  ARM::VST4q8_UPD, false, true, true,  OddDblSpc,  4, 8 ,true}
    322 };
    323 
    324 /// LookupNEONLdSt - Search the NEONLdStTable for information about a NEON
    325 /// load or store pseudo instruction.
    326 static const NEONLdStTableEntry *LookupNEONLdSt(unsigned Opcode) {
    327   const unsigned NumEntries = array_lengthof(NEONLdStTable);
    328 
    329 #ifndef NDEBUG
    330   // Make sure the table is sorted.
    331   static bool TableChecked = false;
    332   if (!TableChecked) {
    333     for (unsigned i = 0; i != NumEntries-1; ++i)
    334       assert(NEONLdStTable[i] < NEONLdStTable[i+1] &&
    335              "NEONLdStTable is not sorted!");
    336     TableChecked = true;
    337   }
    338 #endif
    339 
    340   const NEONLdStTableEntry *I =
    341     std::lower_bound(NEONLdStTable, NEONLdStTable + NumEntries, Opcode);
    342   if (I != NEONLdStTable + NumEntries && I->PseudoOpc == Opcode)
    343     return I;
    344   return NULL;
    345 }
    346 
    347 /// GetDSubRegs - Get 4 D subregisters of a Q, QQ, or QQQQ register,
    348 /// corresponding to the specified register spacing.  Not all of the results
    349 /// are necessarily valid, e.g., a Q register only has 2 D subregisters.
    350 static void GetDSubRegs(unsigned Reg, NEONRegSpacing RegSpc,
    351                         const TargetRegisterInfo *TRI, unsigned &D0,
    352                         unsigned &D1, unsigned &D2, unsigned &D3) {
    353   if (RegSpc == SingleSpc) {
    354     D0 = TRI->getSubReg(Reg, ARM::dsub_0);
    355     D1 = TRI->getSubReg(Reg, ARM::dsub_1);
    356     D2 = TRI->getSubReg(Reg, ARM::dsub_2);
    357     D3 = TRI->getSubReg(Reg, ARM::dsub_3);
    358   } else if (RegSpc == EvenDblSpc) {
    359     D0 = TRI->getSubReg(Reg, ARM::dsub_0);
    360     D1 = TRI->getSubReg(Reg, ARM::dsub_2);
    361     D2 = TRI->getSubReg(Reg, ARM::dsub_4);
    362     D3 = TRI->getSubReg(Reg, ARM::dsub_6);
    363   } else {
    364     assert(RegSpc == OddDblSpc && "unknown register spacing");
    365     D0 = TRI->getSubReg(Reg, ARM::dsub_1);
    366     D1 = TRI->getSubReg(Reg, ARM::dsub_3);
    367     D2 = TRI->getSubReg(Reg, ARM::dsub_5);
    368     D3 = TRI->getSubReg(Reg, ARM::dsub_7);
    369   }
    370 }
    371 
    372 /// ExpandVLD - Translate VLD pseudo instructions with Q, QQ or QQQQ register
    373 /// operands to real VLD instructions with D register operands.
    374 void ARMExpandPseudo::ExpandVLD(MachineBasicBlock::iterator &MBBI) {
    375   MachineInstr &MI = *MBBI;
    376   MachineBasicBlock &MBB = *MI.getParent();
    377 
    378   const NEONLdStTableEntry *TableEntry = LookupNEONLdSt(MI.getOpcode());
    379   assert(TableEntry && TableEntry->IsLoad && "NEONLdStTable lookup failed");
    380   NEONRegSpacing RegSpc = TableEntry->RegSpacing;
    381   unsigned NumRegs = TableEntry->NumRegs;
    382 
    383   MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    384                                     TII->get(TableEntry->RealOpc));
    385   unsigned OpIdx = 0;
    386 
    387   bool DstIsDead = MI.getOperand(OpIdx).isDead();
    388   unsigned DstReg = MI.getOperand(OpIdx++).getReg();
    389   unsigned D0, D1, D2, D3;
    390   GetDSubRegs(DstReg, RegSpc, TRI, D0, D1, D2, D3);
    391   MIB.addReg(D0, RegState::Define | getDeadRegState(DstIsDead));
    392   if (NumRegs > 1 && TableEntry->copyAllListRegs)
    393     MIB.addReg(D1, RegState::Define | getDeadRegState(DstIsDead));
    394   if (NumRegs > 2 && TableEntry->copyAllListRegs)
    395     MIB.addReg(D2, RegState::Define | getDeadRegState(DstIsDead));
    396   if (NumRegs > 3 && TableEntry->copyAllListRegs)
    397     MIB.addReg(D3, RegState::Define | getDeadRegState(DstIsDead));
    398 
    399   if (TableEntry->isUpdating)
    400     MIB.addOperand(MI.getOperand(OpIdx++));
    401 
    402   // Copy the addrmode6 operands.
    403   MIB.addOperand(MI.getOperand(OpIdx++));
    404   MIB.addOperand(MI.getOperand(OpIdx++));
    405   // Copy the am6offset operand.
    406   if (TableEntry->hasWritebackOperand)
    407     MIB.addOperand(MI.getOperand(OpIdx++));
    408 
    409   // For an instruction writing double-spaced subregs, the pseudo instruction
    410   // has an extra operand that is a use of the super-register.  Record the
    411   // operand index and skip over it.
    412   unsigned SrcOpIdx = 0;
    413   if (RegSpc == EvenDblSpc || RegSpc == OddDblSpc)
    414     SrcOpIdx = OpIdx++;
    415 
    416   // Copy the predicate operands.
    417   MIB.addOperand(MI.getOperand(OpIdx++));
    418   MIB.addOperand(MI.getOperand(OpIdx++));
    419 
    420   // Copy the super-register source operand used for double-spaced subregs over
    421   // to the new instruction as an implicit operand.
    422   if (SrcOpIdx != 0) {
    423     MachineOperand MO = MI.getOperand(SrcOpIdx);
    424     MO.setImplicit(true);
    425     MIB.addOperand(MO);
    426   }
    427   // Add an implicit def for the super-register.
    428   MIB.addReg(DstReg, RegState::ImplicitDefine | getDeadRegState(DstIsDead));
    429   TransferImpOps(MI, MIB, MIB);
    430 
    431   // Transfer memoperands.
    432   MIB->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    433 
    434   MI.eraseFromParent();
    435 }
    436 
    437 /// ExpandVST - Translate VST pseudo instructions with Q, QQ or QQQQ register
    438 /// operands to real VST instructions with D register operands.
    439 void ARMExpandPseudo::ExpandVST(MachineBasicBlock::iterator &MBBI) {
    440   MachineInstr &MI = *MBBI;
    441   MachineBasicBlock &MBB = *MI.getParent();
    442 
    443   const NEONLdStTableEntry *TableEntry = LookupNEONLdSt(MI.getOpcode());
    444   assert(TableEntry && !TableEntry->IsLoad && "NEONLdStTable lookup failed");
    445   NEONRegSpacing RegSpc = TableEntry->RegSpacing;
    446   unsigned NumRegs = TableEntry->NumRegs;
    447 
    448   MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    449                                     TII->get(TableEntry->RealOpc));
    450   unsigned OpIdx = 0;
    451   if (TableEntry->isUpdating)
    452     MIB.addOperand(MI.getOperand(OpIdx++));
    453 
    454   // Copy the addrmode6 operands.
    455   MIB.addOperand(MI.getOperand(OpIdx++));
    456   MIB.addOperand(MI.getOperand(OpIdx++));
    457   // Copy the am6offset operand.
    458   if (TableEntry->hasWritebackOperand)
    459     MIB.addOperand(MI.getOperand(OpIdx++));
    460 
    461   bool SrcIsKill = MI.getOperand(OpIdx).isKill();
    462   bool SrcIsUndef = MI.getOperand(OpIdx).isUndef();
    463   unsigned SrcReg = MI.getOperand(OpIdx++).getReg();
    464   unsigned D0, D1, D2, D3;
    465   GetDSubRegs(SrcReg, RegSpc, TRI, D0, D1, D2, D3);
    466   MIB.addReg(D0, getUndefRegState(SrcIsUndef));
    467   if (NumRegs > 1 && TableEntry->copyAllListRegs)
    468     MIB.addReg(D1, getUndefRegState(SrcIsUndef));
    469   if (NumRegs > 2 && TableEntry->copyAllListRegs)
    470     MIB.addReg(D2, getUndefRegState(SrcIsUndef));
    471   if (NumRegs > 3 && TableEntry->copyAllListRegs)
    472     MIB.addReg(D3, getUndefRegState(SrcIsUndef));
    473 
    474   // Copy the predicate operands.
    475   MIB.addOperand(MI.getOperand(OpIdx++));
    476   MIB.addOperand(MI.getOperand(OpIdx++));
    477 
    478   if (SrcIsKill && !SrcIsUndef) // Add an implicit kill for the super-reg.
    479     MIB->addRegisterKilled(SrcReg, TRI, true);
    480   TransferImpOps(MI, MIB, MIB);
    481 
    482   // Transfer memoperands.
    483   MIB->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    484 
    485   MI.eraseFromParent();
    486 }
    487 
    488 /// ExpandLaneOp - Translate VLD*LN and VST*LN instructions with Q, QQ or QQQQ
    489 /// register operands to real instructions with D register operands.
    490 void ARMExpandPseudo::ExpandLaneOp(MachineBasicBlock::iterator &MBBI) {
    491   MachineInstr &MI = *MBBI;
    492   MachineBasicBlock &MBB = *MI.getParent();
    493 
    494   const NEONLdStTableEntry *TableEntry = LookupNEONLdSt(MI.getOpcode());
    495   assert(TableEntry && "NEONLdStTable lookup failed");
    496   NEONRegSpacing RegSpc = TableEntry->RegSpacing;
    497   unsigned NumRegs = TableEntry->NumRegs;
    498   unsigned RegElts = TableEntry->RegElts;
    499 
    500   MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    501                                     TII->get(TableEntry->RealOpc));
    502   unsigned OpIdx = 0;
    503   // The lane operand is always the 3rd from last operand, before the 2
    504   // predicate operands.
    505   unsigned Lane = MI.getOperand(MI.getDesc().getNumOperands() - 3).getImm();
    506 
    507   // Adjust the lane and spacing as needed for Q registers.
    508   assert(RegSpc != OddDblSpc && "unexpected register spacing for VLD/VST-lane");
    509   if (RegSpc == EvenDblSpc && Lane >= RegElts) {
    510     RegSpc = OddDblSpc;
    511     Lane -= RegElts;
    512   }
    513   assert(Lane < RegElts && "out of range lane for VLD/VST-lane");
    514 
    515   unsigned D0 = 0, D1 = 0, D2 = 0, D3 = 0;
    516   unsigned DstReg = 0;
    517   bool DstIsDead = false;
    518   if (TableEntry->IsLoad) {
    519     DstIsDead = MI.getOperand(OpIdx).isDead();
    520     DstReg = MI.getOperand(OpIdx++).getReg();
    521     GetDSubRegs(DstReg, RegSpc, TRI, D0, D1, D2, D3);
    522     MIB.addReg(D0, RegState::Define | getDeadRegState(DstIsDead));
    523     if (NumRegs > 1)
    524       MIB.addReg(D1, RegState::Define | getDeadRegState(DstIsDead));
    525     if (NumRegs > 2)
    526       MIB.addReg(D2, RegState::Define | getDeadRegState(DstIsDead));
    527     if (NumRegs > 3)
    528       MIB.addReg(D3, RegState::Define | getDeadRegState(DstIsDead));
    529   }
    530 
    531   if (TableEntry->isUpdating)
    532     MIB.addOperand(MI.getOperand(OpIdx++));
    533 
    534   // Copy the addrmode6 operands.
    535   MIB.addOperand(MI.getOperand(OpIdx++));
    536   MIB.addOperand(MI.getOperand(OpIdx++));
    537   // Copy the am6offset operand.
    538   if (TableEntry->hasWritebackOperand)
    539     MIB.addOperand(MI.getOperand(OpIdx++));
    540 
    541   // Grab the super-register source.
    542   MachineOperand MO = MI.getOperand(OpIdx++);
    543   if (!TableEntry->IsLoad)
    544     GetDSubRegs(MO.getReg(), RegSpc, TRI, D0, D1, D2, D3);
    545 
    546   // Add the subregs as sources of the new instruction.
    547   unsigned SrcFlags = (getUndefRegState(MO.isUndef()) |
    548                        getKillRegState(MO.isKill()));
    549   MIB.addReg(D0, SrcFlags);
    550   if (NumRegs > 1)
    551     MIB.addReg(D1, SrcFlags);
    552   if (NumRegs > 2)
    553     MIB.addReg(D2, SrcFlags);
    554   if (NumRegs > 3)
    555     MIB.addReg(D3, SrcFlags);
    556 
    557   // Add the lane number operand.
    558   MIB.addImm(Lane);
    559   OpIdx += 1;
    560 
    561   // Copy the predicate operands.
    562   MIB.addOperand(MI.getOperand(OpIdx++));
    563   MIB.addOperand(MI.getOperand(OpIdx++));
    564 
    565   // Copy the super-register source to be an implicit source.
    566   MO.setImplicit(true);
    567   MIB.addOperand(MO);
    568   if (TableEntry->IsLoad)
    569     // Add an implicit def for the super-register.
    570     MIB.addReg(DstReg, RegState::ImplicitDefine | getDeadRegState(DstIsDead));
    571   TransferImpOps(MI, MIB, MIB);
    572   // Transfer memoperands.
    573   MIB->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    574   MI.eraseFromParent();
    575 }
    576 
    577 /// ExpandVTBL - Translate VTBL and VTBX pseudo instructions with Q or QQ
    578 /// register operands to real instructions with D register operands.
    579 void ARMExpandPseudo::ExpandVTBL(MachineBasicBlock::iterator &MBBI,
    580                                  unsigned Opc, bool IsExt) {
    581   MachineInstr &MI = *MBBI;
    582   MachineBasicBlock &MBB = *MI.getParent();
    583 
    584   MachineInstrBuilder MIB = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(Opc));
    585   unsigned OpIdx = 0;
    586 
    587   // Transfer the destination register operand.
    588   MIB.addOperand(MI.getOperand(OpIdx++));
    589   if (IsExt)
    590     MIB.addOperand(MI.getOperand(OpIdx++));
    591 
    592   bool SrcIsKill = MI.getOperand(OpIdx).isKill();
    593   unsigned SrcReg = MI.getOperand(OpIdx++).getReg();
    594   unsigned D0, D1, D2, D3;
    595   GetDSubRegs(SrcReg, SingleSpc, TRI, D0, D1, D2, D3);
    596   MIB.addReg(D0);
    597 
    598   // Copy the other source register operand.
    599   MIB.addOperand(MI.getOperand(OpIdx++));
    600 
    601   // Copy the predicate operands.
    602   MIB.addOperand(MI.getOperand(OpIdx++));
    603   MIB.addOperand(MI.getOperand(OpIdx++));
    604 
    605   if (SrcIsKill)  // Add an implicit kill for the super-reg.
    606     MIB->addRegisterKilled(SrcReg, TRI, true);
    607   TransferImpOps(MI, MIB, MIB);
    608   MI.eraseFromParent();
    609 }
    610 
    611 void ARMExpandPseudo::ExpandMOV32BitImm(MachineBasicBlock &MBB,
    612                                         MachineBasicBlock::iterator &MBBI) {
    613   MachineInstr &MI = *MBBI;
    614   unsigned Opcode = MI.getOpcode();
    615   unsigned PredReg = 0;
    616   ARMCC::CondCodes Pred = getInstrPredicate(&MI, PredReg);
    617   unsigned DstReg = MI.getOperand(0).getReg();
    618   bool DstIsDead = MI.getOperand(0).isDead();
    619   bool isCC = Opcode == ARM::MOVCCi32imm || Opcode == ARM::t2MOVCCi32imm;
    620   const MachineOperand &MO = MI.getOperand(isCC ? 2 : 1);
    621   MachineInstrBuilder LO16, HI16;
    622 
    623   if (!STI->hasV6T2Ops() &&
    624       (Opcode == ARM::MOVi32imm || Opcode == ARM::MOVCCi32imm)) {
    625     // Expand into a movi + orr.
    626     LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVi), DstReg);
    627     HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::ORRri))
    628       .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead))
    629       .addReg(DstReg);
    630 
    631     assert (MO.isImm() && "MOVi32imm w/ non-immediate source operand!");
    632     unsigned ImmVal = (unsigned)MO.getImm();
    633     unsigned SOImmValV1 = ARM_AM::getSOImmTwoPartFirst(ImmVal);
    634     unsigned SOImmValV2 = ARM_AM::getSOImmTwoPartSecond(ImmVal);
    635     LO16 = LO16.addImm(SOImmValV1);
    636     HI16 = HI16.addImm(SOImmValV2);
    637     LO16->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    638     HI16->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    639     LO16.addImm(Pred).addReg(PredReg).addReg(0);
    640     HI16.addImm(Pred).addReg(PredReg).addReg(0);
    641     TransferImpOps(MI, LO16, HI16);
    642     MI.eraseFromParent();
    643     return;
    644   }
    645 
    646   unsigned LO16Opc = 0;
    647   unsigned HI16Opc = 0;
    648   if (Opcode == ARM::t2MOVi32imm || Opcode == ARM::t2MOVCCi32imm) {
    649     LO16Opc = ARM::t2MOVi16;
    650     HI16Opc = ARM::t2MOVTi16;
    651   } else {
    652     LO16Opc = ARM::MOVi16;
    653     HI16Opc = ARM::MOVTi16;
    654   }
    655 
    656   LO16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(LO16Opc), DstReg);
    657   HI16 = BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(HI16Opc))
    658     .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead))
    659     .addReg(DstReg);
    660 
    661   if (MO.isImm()) {
    662     unsigned Imm = MO.getImm();
    663     unsigned Lo16 = Imm & 0xffff;
    664     unsigned Hi16 = (Imm >> 16) & 0xffff;
    665     LO16 = LO16.addImm(Lo16);
    666     HI16 = HI16.addImm(Hi16);
    667   } else {
    668     const GlobalValue *GV = MO.getGlobal();
    669     unsigned TF = MO.getTargetFlags();
    670     LO16 = LO16.addGlobalAddress(GV, MO.getOffset(), TF | ARMII::MO_LO16);
    671     HI16 = HI16.addGlobalAddress(GV, MO.getOffset(), TF | ARMII::MO_HI16);
    672   }
    673 
    674   LO16->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    675   HI16->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    676   LO16.addImm(Pred).addReg(PredReg);
    677   HI16.addImm(Pred).addReg(PredReg);
    678 
    679   TransferImpOps(MI, LO16, HI16);
    680   MI.eraseFromParent();
    681 }
    682 
    683 bool ARMExpandPseudo::ExpandMI(MachineBasicBlock &MBB,
    684                                MachineBasicBlock::iterator MBBI) {
    685   MachineInstr &MI = *MBBI;
    686   unsigned Opcode = MI.getOpcode();
    687   switch (Opcode) {
    688     default:
    689       return false;
    690     case ARM::VMOVScc:
    691     case ARM::VMOVDcc: {
    692       unsigned newOpc = Opcode == ARM::VMOVScc ? ARM::VMOVS : ARM::VMOVD;
    693       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(newOpc),
    694               MI.getOperand(1).getReg())
    695         .addReg(MI.getOperand(2).getReg(),
    696                 getKillRegState(MI.getOperand(2).isKill()))
    697         .addImm(MI.getOperand(3).getImm()) // 'pred'
    698         .addReg(MI.getOperand(4).getReg());
    699 
    700       MI.eraseFromParent();
    701       return true;
    702     }
    703     case ARM::t2MOVCCr:
    704     case ARM::MOVCCr: {
    705       unsigned Opc = AFI->isThumbFunction() ? ARM::t2MOVr : ARM::MOVr;
    706       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(Opc),
    707               MI.getOperand(1).getReg())
    708         .addReg(MI.getOperand(2).getReg(),
    709                 getKillRegState(MI.getOperand(2).isKill()))
    710         .addImm(MI.getOperand(3).getImm()) // 'pred'
    711         .addReg(MI.getOperand(4).getReg())
    712         .addReg(0); // 's' bit
    713 
    714       MI.eraseFromParent();
    715       return true;
    716     }
    717     case ARM::MOVCCsi: {
    718       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVsi),
    719               (MI.getOperand(1).getReg()))
    720         .addReg(MI.getOperand(2).getReg(),
    721                 getKillRegState(MI.getOperand(2).isKill()))
    722         .addImm(MI.getOperand(3).getImm())
    723         .addImm(MI.getOperand(4).getImm()) // 'pred'
    724         .addReg(MI.getOperand(5).getReg())
    725         .addReg(0); // 's' bit
    726 
    727       MI.eraseFromParent();
    728       return true;
    729     }
    730 
    731     case ARM::MOVCCsr: {
    732       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVsr),
    733               (MI.getOperand(1).getReg()))
    734         .addReg(MI.getOperand(2).getReg(),
    735                 getKillRegState(MI.getOperand(2).isKill()))
    736         .addReg(MI.getOperand(3).getReg(),
    737                 getKillRegState(MI.getOperand(3).isKill()))
    738         .addImm(MI.getOperand(4).getImm())
    739         .addImm(MI.getOperand(5).getImm()) // 'pred'
    740         .addReg(MI.getOperand(6).getReg())
    741         .addReg(0); // 's' bit
    742 
    743       MI.eraseFromParent();
    744       return true;
    745     }
    746     case ARM::MOVCCi16: {
    747       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVi16),
    748               MI.getOperand(1).getReg())
    749         .addImm(MI.getOperand(2).getImm())
    750         .addImm(MI.getOperand(3).getImm()) // 'pred'
    751         .addReg(MI.getOperand(4).getReg());
    752 
    753       MI.eraseFromParent();
    754       return true;
    755     }
    756     case ARM::t2MOVCCi:
    757     case ARM::MOVCCi: {
    758       unsigned Opc = AFI->isThumbFunction() ? ARM::t2MOVi : ARM::MOVi;
    759       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(Opc),
    760               MI.getOperand(1).getReg())
    761         .addImm(MI.getOperand(2).getImm())
    762         .addImm(MI.getOperand(3).getImm()) // 'pred'
    763         .addReg(MI.getOperand(4).getReg())
    764         .addReg(0); // 's' bit
    765 
    766       MI.eraseFromParent();
    767       return true;
    768     }
    769     case ARM::MVNCCi: {
    770       BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MVNi),
    771               MI.getOperand(1).getReg())
    772         .addImm(MI.getOperand(2).getImm())
    773         .addImm(MI.getOperand(3).getImm()) // 'pred'
    774         .addReg(MI.getOperand(4).getReg())
    775         .addReg(0); // 's' bit
    776 
    777       MI.eraseFromParent();
    778       return true;
    779     }
    780     case ARM::Int_eh_sjlj_dispatchsetup:
    781     case ARM::Int_eh_sjlj_dispatchsetup_nofp:
    782     case ARM::tInt_eh_sjlj_dispatchsetup: {
    783       MachineFunction &MF = *MI.getParent()->getParent();
    784       const ARMBaseInstrInfo *AII =
    785         static_cast<const ARMBaseInstrInfo*>(TII);
    786       const ARMBaseRegisterInfo &RI = AII->getRegisterInfo();
    787       // For functions using a base pointer, we rematerialize it (via the frame
    788       // pointer) here since eh.sjlj.setjmp and eh.sjlj.longjmp don't do it
    789       // for us. Otherwise, expand to nothing.
    790       if (RI.hasBasePointer(MF)) {
    791         int32_t NumBytes = AFI->getFramePtrSpillOffset();
    792         unsigned FramePtr = RI.getFrameRegister(MF);
    793         assert(MF.getTarget().getFrameLowering()->hasFP(MF) &&
    794                "base pointer without frame pointer?");
    795 
    796         if (AFI->isThumb2Function()) {
    797           emitT2RegPlusImmediate(MBB, MBBI, MI.getDebugLoc(), ARM::R6,
    798                                  FramePtr, -NumBytes, ARMCC::AL, 0, *TII);
    799         } else if (AFI->isThumbFunction()) {
    800           emitThumbRegPlusImmediate(MBB, MBBI, MI.getDebugLoc(), ARM::R6,
    801                                     FramePtr, -NumBytes, *TII, RI);
    802         } else {
    803           emitARMRegPlusImmediate(MBB, MBBI, MI.getDebugLoc(), ARM::R6,
    804                                   FramePtr, -NumBytes, ARMCC::AL, 0,
    805                                   *TII);
    806         }
    807         // If there's dynamic realignment, adjust for it.
    808         if (RI.needsStackRealignment(MF)) {
    809           MachineFrameInfo  *MFI = MF.getFrameInfo();
    810           unsigned MaxAlign = MFI->getMaxAlignment();
    811           assert (!AFI->isThumb1OnlyFunction());
    812           // Emit bic r6, r6, MaxAlign
    813           unsigned bicOpc = AFI->isThumbFunction() ?
    814             ARM::t2BICri : ARM::BICri;
    815           AddDefaultCC(AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(),
    816                                               TII->get(bicOpc), ARM::R6)
    817                                       .addReg(ARM::R6, RegState::Kill)
    818                                       .addImm(MaxAlign-1)));
    819         }
    820 
    821       }
    822       MI.eraseFromParent();
    823       return true;
    824     }
    825 
    826     case ARM::MOVsrl_flag:
    827     case ARM::MOVsra_flag: {
    828       // These are just fancy MOVs insructions.
    829       AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(ARM::MOVsi),
    830                              MI.getOperand(0).getReg())
    831                      .addOperand(MI.getOperand(1))
    832                      .addImm(ARM_AM::getSORegOpc((Opcode == ARM::MOVsrl_flag ?
    833                                                   ARM_AM::lsr : ARM_AM::asr),
    834                                                  1)))
    835         .addReg(ARM::CPSR, RegState::Define);
    836       MI.eraseFromParent();
    837       return true;
    838     }
    839     case ARM::RRX: {
    840       // This encodes as "MOVs Rd, Rm, rrx
    841       MachineInstrBuilder MIB =
    842         AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(),TII->get(ARM::MOVsi),
    843                                MI.getOperand(0).getReg())
    844                        .addOperand(MI.getOperand(1))
    845                        .addImm(ARM_AM::getSORegOpc(ARM_AM::rrx, 0)))
    846         .addReg(0);
    847       TransferImpOps(MI, MIB, MIB);
    848       MI.eraseFromParent();
    849       return true;
    850     }
    851     case ARM::tTPsoft:
    852     case ARM::TPsoft: {
    853       MachineInstrBuilder MIB =
    854         BuildMI(MBB, MBBI, MI.getDebugLoc(),
    855                 TII->get(Opcode == ARM::tTPsoft ? ARM::tBL : ARM::BL))
    856         .addExternalSymbol("__aeabi_read_tp", 0);
    857 
    858       MIB->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    859       TransferImpOps(MI, MIB, MIB);
    860       MI.eraseFromParent();
    861       return true;
    862     }
    863     case ARM::tLDRpci_pic:
    864     case ARM::t2LDRpci_pic: {
    865       unsigned NewLdOpc = (Opcode == ARM::tLDRpci_pic)
    866         ? ARM::tLDRpci : ARM::t2LDRpci;
    867       unsigned DstReg = MI.getOperand(0).getReg();
    868       bool DstIsDead = MI.getOperand(0).isDead();
    869       MachineInstrBuilder MIB1 =
    870         AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(),
    871                                TII->get(NewLdOpc), DstReg)
    872                        .addOperand(MI.getOperand(1)));
    873       MIB1->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    874       MachineInstrBuilder MIB2 = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    875                                          TII->get(ARM::tPICADD))
    876         .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead))
    877         .addReg(DstReg)
    878         .addOperand(MI.getOperand(2));
    879       TransferImpOps(MI, MIB1, MIB2);
    880       MI.eraseFromParent();
    881       return true;
    882     }
    883 
    884     case ARM::MOV_ga_dyn:
    885     case ARM::MOV_ga_pcrel:
    886     case ARM::MOV_ga_pcrel_ldr:
    887     case ARM::t2MOV_ga_dyn:
    888     case ARM::t2MOV_ga_pcrel: {
    889       // Expand into movw + movw. Also "add pc" / ldr [pc] in PIC mode.
    890       unsigned LabelId = AFI->createPICLabelUId();
    891       unsigned DstReg = MI.getOperand(0).getReg();
    892       bool DstIsDead = MI.getOperand(0).isDead();
    893       const MachineOperand &MO1 = MI.getOperand(1);
    894       const GlobalValue *GV = MO1.getGlobal();
    895       unsigned TF = MO1.getTargetFlags();
    896       bool isARM = (Opcode != ARM::t2MOV_ga_pcrel && Opcode!=ARM::t2MOV_ga_dyn);
    897       bool isPIC = (Opcode != ARM::MOV_ga_dyn && Opcode != ARM::t2MOV_ga_dyn);
    898       unsigned LO16Opc = isARM ? ARM::MOVi16_ga_pcrel : ARM::t2MOVi16_ga_pcrel;
    899       unsigned HI16Opc = isARM ? ARM::MOVTi16_ga_pcrel :ARM::t2MOVTi16_ga_pcrel;
    900       unsigned LO16TF = isPIC
    901         ? ARMII::MO_LO16_NONLAZY_PIC : ARMII::MO_LO16_NONLAZY;
    902       unsigned HI16TF = isPIC
    903         ? ARMII::MO_HI16_NONLAZY_PIC : ARMII::MO_HI16_NONLAZY;
    904       unsigned PICAddOpc = isARM
    905         ? (Opcode == ARM::MOV_ga_pcrel_ldr ? ARM::PICLDR : ARM::PICADD)
    906         : ARM::tPICADD;
    907       MachineInstrBuilder MIB1 = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    908                                          TII->get(LO16Opc), DstReg)
    909         .addGlobalAddress(GV, MO1.getOffset(), TF | LO16TF)
    910         .addImm(LabelId);
    911       MachineInstrBuilder MIB2 = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    912                                          TII->get(HI16Opc), DstReg)
    913         .addReg(DstReg)
    914         .addGlobalAddress(GV, MO1.getOffset(), TF | HI16TF)
    915         .addImm(LabelId);
    916       if (!isPIC) {
    917         TransferImpOps(MI, MIB1, MIB2);
    918         MI.eraseFromParent();
    919         return true;
    920       }
    921 
    922       MachineInstrBuilder MIB3 = BuildMI(MBB, MBBI, MI.getDebugLoc(),
    923                                          TII->get(PICAddOpc))
    924         .addReg(DstReg, RegState::Define | getDeadRegState(DstIsDead))
    925         .addReg(DstReg).addImm(LabelId);
    926       if (isARM) {
    927         AddDefaultPred(MIB3);
    928         if (Opcode == ARM::MOV_ga_pcrel_ldr)
    929           MIB3->setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    930       }
    931       TransferImpOps(MI, MIB1, MIB3);
    932       MI.eraseFromParent();
    933       return true;
    934     }
    935 
    936     case ARM::MOVi32imm:
    937     case ARM::MOVCCi32imm:
    938     case ARM::t2MOVi32imm:
    939     case ARM::t2MOVCCi32imm:
    940       ExpandMOV32BitImm(MBB, MBBI);
    941       return true;
    942 
    943     case ARM::VLDMQIA: {
    944       unsigned NewOpc = ARM::VLDMDIA;
    945       MachineInstrBuilder MIB =
    946         BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpc));
    947       unsigned OpIdx = 0;
    948 
    949       // Grab the Q register destination.
    950       bool DstIsDead = MI.getOperand(OpIdx).isDead();
    951       unsigned DstReg = MI.getOperand(OpIdx++).getReg();
    952 
    953       // Copy the source register.
    954       MIB.addOperand(MI.getOperand(OpIdx++));
    955 
    956       // Copy the predicate operands.
    957       MIB.addOperand(MI.getOperand(OpIdx++));
    958       MIB.addOperand(MI.getOperand(OpIdx++));
    959 
    960       // Add the destination operands (D subregs).
    961       unsigned D0 = TRI->getSubReg(DstReg, ARM::dsub_0);
    962       unsigned D1 = TRI->getSubReg(DstReg, ARM::dsub_1);
    963       MIB.addReg(D0, RegState::Define | getDeadRegState(DstIsDead))
    964         .addReg(D1, RegState::Define | getDeadRegState(DstIsDead));
    965 
    966       // Add an implicit def for the super-register.
    967       MIB.addReg(DstReg, RegState::ImplicitDefine | getDeadRegState(DstIsDead));
    968       TransferImpOps(MI, MIB, MIB);
    969       MIB.setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
    970       MI.eraseFromParent();
    971       return true;
    972     }
    973 
    974     case ARM::VSTMQIA: {
    975       unsigned NewOpc = ARM::VSTMDIA;
    976       MachineInstrBuilder MIB =
    977         BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpc));
    978       unsigned OpIdx = 0;
    979 
    980       // Grab the Q register source.
    981       bool SrcIsKill = MI.getOperand(OpIdx).isKill();
    982       unsigned SrcReg = MI.getOperand(OpIdx++).getReg();
    983 
    984       // Copy the destination register.
    985       MIB.addOperand(MI.getOperand(OpIdx++));
    986 
    987       // Copy the predicate operands.
    988       MIB.addOperand(MI.getOperand(OpIdx++));
    989       MIB.addOperand(MI.getOperand(OpIdx++));
    990 
    991       // Add the source operands (D subregs).
    992       unsigned D0 = TRI->getSubReg(SrcReg, ARM::dsub_0);
    993       unsigned D1 = TRI->getSubReg(SrcReg, ARM::dsub_1);
    994       MIB.addReg(D0).addReg(D1);
    995 
    996       if (SrcIsKill)      // Add an implicit kill for the Q register.
    997         MIB->addRegisterKilled(SrcReg, TRI, true);
    998 
    999       TransferImpOps(MI, MIB, MIB);
   1000       MIB.setMemRefs(MI.memoperands_begin(), MI.memoperands_end());
   1001       MI.eraseFromParent();
   1002       return true;
   1003     }
   1004     case ARM::VDUPfqf:
   1005     case ARM::VDUPfdf:{
   1006       unsigned NewOpc = Opcode == ARM::VDUPfqf ? ARM::VDUPLN32q :
   1007         ARM::VDUPLN32d;
   1008       MachineInstrBuilder MIB =
   1009         BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpc));
   1010       unsigned OpIdx = 0;
   1011       unsigned SrcReg = MI.getOperand(1).getReg();
   1012       unsigned Lane = TRI->getEncodingValue(SrcReg) & 1;
   1013       unsigned DReg = TRI->getMatchingSuperReg(SrcReg,
   1014                             Lane & 1 ? ARM::ssub_1 : ARM::ssub_0,
   1015                             &ARM::DPR_VFP2RegClass);
   1016       // The lane is [0,1] for the containing DReg superregister.
   1017       // Copy the dst/src register operands.
   1018       MIB.addOperand(MI.getOperand(OpIdx++));
   1019       MIB.addReg(DReg);
   1020       ++OpIdx;
   1021       // Add the lane select operand.
   1022       MIB.addImm(Lane);
   1023       // Add the predicate operands.
   1024       MIB.addOperand(MI.getOperand(OpIdx++));
   1025       MIB.addOperand(MI.getOperand(OpIdx++));
   1026 
   1027       TransferImpOps(MI, MIB, MIB);
   1028       MI.eraseFromParent();
   1029       return true;
   1030     }
   1031 
   1032     case ARM::VLD2q8Pseudo:
   1033     case ARM::VLD2q16Pseudo:
   1034     case ARM::VLD2q32Pseudo:
   1035     case ARM::VLD2q8PseudoWB_fixed:
   1036     case ARM::VLD2q16PseudoWB_fixed:
   1037     case ARM::VLD2q32PseudoWB_fixed:
   1038     case ARM::VLD2q8PseudoWB_register:
   1039     case ARM::VLD2q16PseudoWB_register:
   1040     case ARM::VLD2q32PseudoWB_register:
   1041     case ARM::VLD3d8Pseudo:
   1042     case ARM::VLD3d16Pseudo:
   1043     case ARM::VLD3d32Pseudo:
   1044     case ARM::VLD1d64TPseudo:
   1045     case ARM::VLD3d8Pseudo_UPD:
   1046     case ARM::VLD3d16Pseudo_UPD:
   1047     case ARM::VLD3d32Pseudo_UPD:
   1048     case ARM::VLD3q8Pseudo_UPD:
   1049     case ARM::VLD3q16Pseudo_UPD:
   1050     case ARM::VLD3q32Pseudo_UPD:
   1051     case ARM::VLD3q8oddPseudo:
   1052     case ARM::VLD3q16oddPseudo:
   1053     case ARM::VLD3q32oddPseudo:
   1054     case ARM::VLD3q8oddPseudo_UPD:
   1055     case ARM::VLD3q16oddPseudo_UPD:
   1056     case ARM::VLD3q32oddPseudo_UPD:
   1057     case ARM::VLD4d8Pseudo:
   1058     case ARM::VLD4d16Pseudo:
   1059     case ARM::VLD4d32Pseudo:
   1060     case ARM::VLD1d64QPseudo:
   1061     case ARM::VLD4d8Pseudo_UPD:
   1062     case ARM::VLD4d16Pseudo_UPD:
   1063     case ARM::VLD4d32Pseudo_UPD:
   1064     case ARM::VLD4q8Pseudo_UPD:
   1065     case ARM::VLD4q16Pseudo_UPD:
   1066     case ARM::VLD4q32Pseudo_UPD:
   1067     case ARM::VLD4q8oddPseudo:
   1068     case ARM::VLD4q16oddPseudo:
   1069     case ARM::VLD4q32oddPseudo:
   1070     case ARM::VLD4q8oddPseudo_UPD:
   1071     case ARM::VLD4q16oddPseudo_UPD:
   1072     case ARM::VLD4q32oddPseudo_UPD:
   1073     case ARM::VLD3DUPd8Pseudo:
   1074     case ARM::VLD3DUPd16Pseudo:
   1075     case ARM::VLD3DUPd32Pseudo:
   1076     case ARM::VLD3DUPd8Pseudo_UPD:
   1077     case ARM::VLD3DUPd16Pseudo_UPD:
   1078     case ARM::VLD3DUPd32Pseudo_UPD:
   1079     case ARM::VLD4DUPd8Pseudo:
   1080     case ARM::VLD4DUPd16Pseudo:
   1081     case ARM::VLD4DUPd32Pseudo:
   1082     case ARM::VLD4DUPd8Pseudo_UPD:
   1083     case ARM::VLD4DUPd16Pseudo_UPD:
   1084     case ARM::VLD4DUPd32Pseudo_UPD:
   1085       ExpandVLD(MBBI);
   1086       return true;
   1087 
   1088     case ARM::VST2q8Pseudo:
   1089     case ARM::VST2q16Pseudo:
   1090     case ARM::VST2q32Pseudo:
   1091     case ARM::VST2q8PseudoWB_fixed:
   1092     case ARM::VST2q16PseudoWB_fixed:
   1093     case ARM::VST2q32PseudoWB_fixed:
   1094     case ARM::VST2q8PseudoWB_register:
   1095     case ARM::VST2q16PseudoWB_register:
   1096     case ARM::VST2q32PseudoWB_register:
   1097     case ARM::VST3d8Pseudo:
   1098     case ARM::VST3d16Pseudo:
   1099     case ARM::VST3d32Pseudo:
   1100     case ARM::VST1d64TPseudo:
   1101     case ARM::VST3d8Pseudo_UPD:
   1102     case ARM::VST3d16Pseudo_UPD:
   1103     case ARM::VST3d32Pseudo_UPD:
   1104     case ARM::VST1d64TPseudoWB_fixed:
   1105     case ARM::VST1d64TPseudoWB_register:
   1106     case ARM::VST3q8Pseudo_UPD:
   1107     case ARM::VST3q16Pseudo_UPD:
   1108     case ARM::VST3q32Pseudo_UPD:
   1109     case ARM::VST3q8oddPseudo:
   1110     case ARM::VST3q16oddPseudo:
   1111     case ARM::VST3q32oddPseudo:
   1112     case ARM::VST3q8oddPseudo_UPD:
   1113     case ARM::VST3q16oddPseudo_UPD:
   1114     case ARM::VST3q32oddPseudo_UPD:
   1115     case ARM::VST4d8Pseudo:
   1116     case ARM::VST4d16Pseudo:
   1117     case ARM::VST4d32Pseudo:
   1118     case ARM::VST1d64QPseudo:
   1119     case ARM::VST4d8Pseudo_UPD:
   1120     case ARM::VST4d16Pseudo_UPD:
   1121     case ARM::VST4d32Pseudo_UPD:
   1122     case ARM::VST1d64QPseudoWB_fixed:
   1123     case ARM::VST1d64QPseudoWB_register:
   1124     case ARM::VST4q8Pseudo_UPD:
   1125     case ARM::VST4q16Pseudo_UPD:
   1126     case ARM::VST4q32Pseudo_UPD:
   1127     case ARM::VST4q8oddPseudo:
   1128     case ARM::VST4q16oddPseudo:
   1129     case ARM::VST4q32oddPseudo:
   1130     case ARM::VST4q8oddPseudo_UPD:
   1131     case ARM::VST4q16oddPseudo_UPD:
   1132     case ARM::VST4q32oddPseudo_UPD:
   1133       ExpandVST(MBBI);
   1134       return true;
   1135 
   1136     case ARM::VLD1LNq8Pseudo:
   1137     case ARM::VLD1LNq16Pseudo:
   1138     case ARM::VLD1LNq32Pseudo:
   1139     case ARM::VLD1LNq8Pseudo_UPD:
   1140     case ARM::VLD1LNq16Pseudo_UPD:
   1141     case ARM::VLD1LNq32Pseudo_UPD:
   1142     case ARM::VLD2LNd8Pseudo:
   1143     case ARM::VLD2LNd16Pseudo:
   1144     case ARM::VLD2LNd32Pseudo:
   1145     case ARM::VLD2LNq16Pseudo:
   1146     case ARM::VLD2LNq32Pseudo:
   1147     case ARM::VLD2LNd8Pseudo_UPD:
   1148     case ARM::VLD2LNd16Pseudo_UPD:
   1149     case ARM::VLD2LNd32Pseudo_UPD:
   1150     case ARM::VLD2LNq16Pseudo_UPD:
   1151     case ARM::VLD2LNq32Pseudo_UPD:
   1152     case ARM::VLD3LNd8Pseudo:
   1153     case ARM::VLD3LNd16Pseudo:
   1154     case ARM::VLD3LNd32Pseudo:
   1155     case ARM::VLD3LNq16Pseudo:
   1156     case ARM::VLD3LNq32Pseudo:
   1157     case ARM::VLD3LNd8Pseudo_UPD:
   1158     case ARM::VLD3LNd16Pseudo_UPD:
   1159     case ARM::VLD3LNd32Pseudo_UPD:
   1160     case ARM::VLD3LNq16Pseudo_UPD:
   1161     case ARM::VLD3LNq32Pseudo_UPD:
   1162     case ARM::VLD4LNd8Pseudo:
   1163     case ARM::VLD4LNd16Pseudo:
   1164     case ARM::VLD4LNd32Pseudo:
   1165     case ARM::VLD4LNq16Pseudo:
   1166     case ARM::VLD4LNq32Pseudo:
   1167     case ARM::VLD4LNd8Pseudo_UPD:
   1168     case ARM::VLD4LNd16Pseudo_UPD:
   1169     case ARM::VLD4LNd32Pseudo_UPD:
   1170     case ARM::VLD4LNq16Pseudo_UPD:
   1171     case ARM::VLD4LNq32Pseudo_UPD:
   1172     case ARM::VST1LNq8Pseudo:
   1173     case ARM::VST1LNq16Pseudo:
   1174     case ARM::VST1LNq32Pseudo:
   1175     case ARM::VST1LNq8Pseudo_UPD:
   1176     case ARM::VST1LNq16Pseudo_UPD:
   1177     case ARM::VST1LNq32Pseudo_UPD:
   1178     case ARM::VST2LNd8Pseudo:
   1179     case ARM::VST2LNd16Pseudo:
   1180     case ARM::VST2LNd32Pseudo:
   1181     case ARM::VST2LNq16Pseudo:
   1182     case ARM::VST2LNq32Pseudo:
   1183     case ARM::VST2LNd8Pseudo_UPD:
   1184     case ARM::VST2LNd16Pseudo_UPD:
   1185     case ARM::VST2LNd32Pseudo_UPD:
   1186     case ARM::VST2LNq16Pseudo_UPD:
   1187     case ARM::VST2LNq32Pseudo_UPD:
   1188     case ARM::VST3LNd8Pseudo:
   1189     case ARM::VST3LNd16Pseudo:
   1190     case ARM::VST3LNd32Pseudo:
   1191     case ARM::VST3LNq16Pseudo:
   1192     case ARM::VST3LNq32Pseudo:
   1193     case ARM::VST3LNd8Pseudo_UPD:
   1194     case ARM::VST3LNd16Pseudo_UPD:
   1195     case ARM::VST3LNd32Pseudo_UPD:
   1196     case ARM::VST3LNq16Pseudo_UPD:
   1197     case ARM::VST3LNq32Pseudo_UPD:
   1198     case ARM::VST4LNd8Pseudo:
   1199     case ARM::VST4LNd16Pseudo:
   1200     case ARM::VST4LNd32Pseudo:
   1201     case ARM::VST4LNq16Pseudo:
   1202     case ARM::VST4LNq32Pseudo:
   1203     case ARM::VST4LNd8Pseudo_UPD:
   1204     case ARM::VST4LNd16Pseudo_UPD:
   1205     case ARM::VST4LNd32Pseudo_UPD:
   1206     case ARM::VST4LNq16Pseudo_UPD:
   1207     case ARM::VST4LNq32Pseudo_UPD:
   1208       ExpandLaneOp(MBBI);
   1209       return true;
   1210 
   1211     case ARM::VSETLNi8Q:
   1212     case ARM::VSETLNi16Q: {
   1213       // Expand VSETLNs acting on a Q register to equivalent VSETLNs acting
   1214       // on the respective D register.
   1215 
   1216       unsigned QReg  = MI.getOperand(1).getReg();
   1217       unsigned QLane = MI.getOperand(3).getImm();
   1218 
   1219       unsigned NewOpcode, DLane, DSubReg;
   1220       switch (Opcode) {
   1221       default: llvm_unreachable("Invalid opcode!");
   1222       case ARM::VSETLNi8Q:
   1223         // 4 possible 8-bit lanes per DPR:
   1224         NewOpcode = ARM::VSETLNi8;
   1225         DLane = QLane % 8;
   1226         DSubReg  = (QLane / 8) ? ARM::dsub_1 : ARM::dsub_0;
   1227         break;
   1228       case ARM::VSETLNi16Q:
   1229         // 4 possible 16-bit lanes per DPR.
   1230         NewOpcode = ARM::VSETLNi16;
   1231         DLane = QLane % 4;
   1232         DSubReg  = (QLane / 4) ? ARM::dsub_1 : ARM::dsub_0;
   1233         break;
   1234       }
   1235 
   1236       MachineInstrBuilder MIB =
   1237         BuildMI(MBB, MBBI, MI.getDebugLoc(), TII->get(NewOpcode));
   1238 
   1239       unsigned DReg = TRI->getSubReg(QReg, DSubReg);
   1240 
   1241       MIB.addReg(DReg, RegState::Define); // Output DPR
   1242       MIB.addReg(DReg);                   // Input DPR
   1243       MIB.addOperand(MI.getOperand(2));   // Input GPR
   1244       MIB.addImm(DLane);                  // Lane
   1245 
   1246       // Add the predicate operands.
   1247       MIB.addOperand(MI.getOperand(4));
   1248       MIB.addOperand(MI.getOperand(5));
   1249 
   1250       if (MI.getOperand(1).isKill()) // Add an implicit kill for the Q register.
   1251         MIB->addRegisterKilled(QReg, TRI, true);
   1252       // And an implicit def of the output register (which should always be the
   1253       // same as the input register).
   1254       MIB->addRegisterDefined(QReg, TRI);
   1255 
   1256       TransferImpOps(MI, MIB, MIB);
   1257 
   1258       MI.eraseFromParent();
   1259       return true;
   1260     }
   1261 
   1262     case ARM::VTBL3Pseudo: ExpandVTBL(MBBI, ARM::VTBL3, false); return true;
   1263     case ARM::VTBL4Pseudo: ExpandVTBL(MBBI, ARM::VTBL4, false); return true;
   1264     case ARM::VTBX3Pseudo: ExpandVTBL(MBBI, ARM::VTBX3, true); return true;
   1265     case ARM::VTBX4Pseudo: ExpandVTBL(MBBI, ARM::VTBX4, true); return true;
   1266   }
   1267 }
   1268 
   1269 bool ARMExpandPseudo::ExpandMBB(MachineBasicBlock &MBB) {
   1270   bool Modified = false;
   1271 
   1272   MachineBasicBlock::iterator MBBI = MBB.begin(), E = MBB.end();
   1273   while (MBBI != E) {
   1274     MachineBasicBlock::iterator NMBBI = llvm::next(MBBI);
   1275     Modified |= ExpandMI(MBB, MBBI);
   1276     MBBI = NMBBI;
   1277   }
   1278 
   1279   return Modified;
   1280 }
   1281 
   1282 bool ARMExpandPseudo::runOnMachineFunction(MachineFunction &MF) {
   1283   const TargetMachine &TM = MF.getTarget();
   1284   TII = static_cast<const ARMBaseInstrInfo*>(TM.getInstrInfo());
   1285   TRI = TM.getRegisterInfo();
   1286   STI = &TM.getSubtarget<ARMSubtarget>();
   1287   AFI = MF.getInfo<ARMFunctionInfo>();
   1288 
   1289   bool Modified = false;
   1290   for (MachineFunction::iterator MFI = MF.begin(), E = MF.end(); MFI != E;
   1291        ++MFI)
   1292     Modified |= ExpandMBB(*MFI);
   1293   if (VerifyARMPseudo)
   1294     MF.verify(this, "After expanding ARM pseudo instructions.");
   1295   return Modified;
   1296 }
   1297 
   1298 /// createARMExpandPseudoPass - returns an instance of the pseudo instruction
   1299 /// expansion pass.
   1300 FunctionPass *llvm::createARMExpandPseudoPass() {
   1301   return new ARMExpandPseudo();
   1302 }
   1303