Home | History | Annotate | Download | only in X86
      1 //===-- X86InstrShiftRotate.td - Shift and Rotate Instrs ---*- tablegen -*-===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This file describes the shift and rotate instructions.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 // FIXME: Someone needs to smear multipattern goodness all over this file.
     15 
     16 let Defs = [EFLAGS] in {
     17 
     18 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
     19 let Uses = [CL] in {
     20 def SHL8rCL  : I<0xD2, MRM4r, (outs GR8 :$dst), (ins GR8 :$src1),
     21                  "shl{b}\t{%cl, $dst|$dst, cl}",
     22                  [(set GR8:$dst, (shl GR8:$src1, CL))], IIC_SR>;
     23 def SHL16rCL : I<0xD3, MRM4r, (outs GR16:$dst), (ins GR16:$src1),
     24                  "shl{w}\t{%cl, $dst|$dst, cl}",
     25                  [(set GR16:$dst, (shl GR16:$src1, CL))], IIC_SR>, OpSize16;
     26 def SHL32rCL : I<0xD3, MRM4r, (outs GR32:$dst), (ins GR32:$src1),
     27                  "shl{l}\t{%cl, $dst|$dst, cl}",
     28                  [(set GR32:$dst, (shl GR32:$src1, CL))], IIC_SR>, OpSize32;
     29 def SHL64rCL : RI<0xD3, MRM4r, (outs GR64:$dst), (ins GR64:$src1),
     30                   "shl{q}\t{%cl, $dst|$dst, cl}",
     31                   [(set GR64:$dst, (shl GR64:$src1, CL))], IIC_SR>;
     32 } // Uses = [CL]
     33 
     34 def SHL8ri   : Ii8<0xC0, MRM4r, (outs GR8 :$dst), (ins GR8 :$src1, i8imm:$src2),
     35                    "shl{b}\t{$src2, $dst|$dst, $src2}",
     36                    [(set GR8:$dst, (shl GR8:$src1, (i8 imm:$src2)))], IIC_SR>;
     37 
     38 let isConvertibleToThreeAddress = 1 in {   // Can transform into LEA.
     39 def SHL16ri  : Ii8<0xC1, MRM4r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$src2),
     40                    "shl{w}\t{$src2, $dst|$dst, $src2}",
     41                    [(set GR16:$dst, (shl GR16:$src1, (i8 imm:$src2)))], IIC_SR>,
     42                    OpSize16;
     43 def SHL32ri  : Ii8<0xC1, MRM4r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$src2),
     44                    "shl{l}\t{$src2, $dst|$dst, $src2}",
     45                    [(set GR32:$dst, (shl GR32:$src1, (i8 imm:$src2)))], IIC_SR>,
     46                    OpSize32;
     47 def SHL64ri  : RIi8<0xC1, MRM4r, (outs GR64:$dst),
     48                     (ins GR64:$src1, i8imm:$src2),
     49                     "shl{q}\t{$src2, $dst|$dst, $src2}",
     50                     [(set GR64:$dst, (shl GR64:$src1, (i8 imm:$src2)))],
     51                     IIC_SR>;
     52 
     53 // NOTE: We don't include patterns for shifts of a register by one, because
     54 // 'add reg,reg' is cheaper (and we have a Pat pattern for shift-by-one).
     55 let hasSideEffects = 0 in {
     56 def SHL8r1   : I<0xD0, MRM4r, (outs GR8:$dst), (ins GR8:$src1),
     57                  "shl{b}\t$dst", [], IIC_SR>;
     58 def SHL16r1  : I<0xD1, MRM4r, (outs GR16:$dst), (ins GR16:$src1),
     59                  "shl{w}\t$dst", [], IIC_SR>, OpSize16;
     60 def SHL32r1  : I<0xD1, MRM4r, (outs GR32:$dst), (ins GR32:$src1),
     61                  "shl{l}\t$dst", [], IIC_SR>, OpSize32;
     62 def SHL64r1  : RI<0xD1, MRM4r, (outs GR64:$dst), (ins GR64:$src1),
     63                  "shl{q}\t$dst", [], IIC_SR>;
     64 } // hasSideEffects = 0
     65 } // isConvertibleToThreeAddress = 1
     66 } // Constraints = "$src = $dst", SchedRW
     67 
     68 
     69 let SchedRW = [WriteShiftLd, WriteRMW] in {
     70 // FIXME: Why do we need an explicit "Uses = [CL]" when the instr has a pattern
     71 // using CL?
     72 let Uses = [CL] in {
     73 def SHL8mCL  : I<0xD2, MRM4m, (outs), (ins i8mem :$dst),
     74                  "shl{b}\t{%cl, $dst|$dst, cl}",
     75                  [(store (shl (loadi8 addr:$dst), CL), addr:$dst)], IIC_SR>;
     76 def SHL16mCL : I<0xD3, MRM4m, (outs), (ins i16mem:$dst),
     77                  "shl{w}\t{%cl, $dst|$dst, cl}",
     78                  [(store (shl (loadi16 addr:$dst), CL), addr:$dst)], IIC_SR>,
     79                  OpSize16;
     80 def SHL32mCL : I<0xD3, MRM4m, (outs), (ins i32mem:$dst),
     81                  "shl{l}\t{%cl, $dst|$dst, cl}",
     82                  [(store (shl (loadi32 addr:$dst), CL), addr:$dst)], IIC_SR>,
     83                  OpSize32;
     84 def SHL64mCL : RI<0xD3, MRM4m, (outs), (ins i64mem:$dst),
     85                   "shl{q}\t{%cl, $dst|$dst, cl}",
     86                   [(store (shl (loadi64 addr:$dst), CL), addr:$dst)], IIC_SR>;
     87 }
     88 def SHL8mi   : Ii8<0xC0, MRM4m, (outs), (ins i8mem :$dst, i8imm:$src),
     89                    "shl{b}\t{$src, $dst|$dst, $src}",
     90                 [(store (shl (loadi8 addr:$dst), (i8 imm:$src)), addr:$dst)],
     91                 IIC_SR>;
     92 def SHL16mi  : Ii8<0xC1, MRM4m, (outs), (ins i16mem:$dst, i8imm:$src),
     93                    "shl{w}\t{$src, $dst|$dst, $src}",
     94                [(store (shl (loadi16 addr:$dst), (i8 imm:$src)), addr:$dst)],
     95                IIC_SR>, OpSize16;
     96 def SHL32mi  : Ii8<0xC1, MRM4m, (outs), (ins i32mem:$dst, i8imm:$src),
     97                    "shl{l}\t{$src, $dst|$dst, $src}",
     98                [(store (shl (loadi32 addr:$dst), (i8 imm:$src)), addr:$dst)],
     99                IIC_SR>, OpSize32;
    100 def SHL64mi : RIi8<0xC1, MRM4m, (outs), (ins i64mem:$dst, i8imm:$src),
    101                   "shl{q}\t{$src, $dst|$dst, $src}",
    102                  [(store (shl (loadi64 addr:$dst), (i8 imm:$src)), addr:$dst)],
    103                  IIC_SR>;
    104 
    105 // Shift by 1
    106 def SHL8m1   : I<0xD0, MRM4m, (outs), (ins i8mem :$dst),
    107                  "shl{b}\t$dst",
    108                 [(store (shl (loadi8 addr:$dst), (i8 1)), addr:$dst)],
    109                 IIC_SR>;
    110 def SHL16m1  : I<0xD1, MRM4m, (outs), (ins i16mem:$dst),
    111                  "shl{w}\t$dst",
    112                [(store (shl (loadi16 addr:$dst), (i8 1)), addr:$dst)],
    113                IIC_SR>, OpSize16;
    114 def SHL32m1  : I<0xD1, MRM4m, (outs), (ins i32mem:$dst),
    115                  "shl{l}\t$dst",
    116                [(store (shl (loadi32 addr:$dst), (i8 1)), addr:$dst)],
    117                IIC_SR>, OpSize32;
    118 def SHL64m1 : RI<0xD1, MRM4m, (outs), (ins i64mem:$dst),
    119                   "shl{q}\t$dst",
    120                  [(store (shl (loadi64 addr:$dst), (i8 1)), addr:$dst)],
    121                  IIC_SR>;
    122 } // SchedRW
    123 
    124 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
    125 let Uses = [CL] in {
    126 def SHR8rCL  : I<0xD2, MRM5r, (outs GR8 :$dst), (ins GR8 :$src1),
    127                  "shr{b}\t{%cl, $dst|$dst, cl}",
    128                  [(set GR8:$dst, (srl GR8:$src1, CL))], IIC_SR>;
    129 def SHR16rCL : I<0xD3, MRM5r, (outs GR16:$dst), (ins GR16:$src1),
    130                  "shr{w}\t{%cl, $dst|$dst, cl}",
    131                  [(set GR16:$dst, (srl GR16:$src1, CL))], IIC_SR>, OpSize16;
    132 def SHR32rCL : I<0xD3, MRM5r, (outs GR32:$dst), (ins GR32:$src1),
    133                  "shr{l}\t{%cl, $dst|$dst, cl}",
    134                  [(set GR32:$dst, (srl GR32:$src1, CL))], IIC_SR>, OpSize32;
    135 def SHR64rCL : RI<0xD3, MRM5r, (outs GR64:$dst), (ins GR64:$src1),
    136                   "shr{q}\t{%cl, $dst|$dst, cl}",
    137                   [(set GR64:$dst, (srl GR64:$src1, CL))], IIC_SR>;
    138 }
    139 
    140 def SHR8ri   : Ii8<0xC0, MRM5r, (outs GR8:$dst), (ins GR8:$src1, i8imm:$src2),
    141                    "shr{b}\t{$src2, $dst|$dst, $src2}",
    142                    [(set GR8:$dst, (srl GR8:$src1, (i8 imm:$src2)))], IIC_SR>;
    143 def SHR16ri  : Ii8<0xC1, MRM5r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$src2),
    144                    "shr{w}\t{$src2, $dst|$dst, $src2}",
    145                    [(set GR16:$dst, (srl GR16:$src1, (i8 imm:$src2)))],
    146                    IIC_SR>, OpSize16;
    147 def SHR32ri  : Ii8<0xC1, MRM5r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$src2),
    148                    "shr{l}\t{$src2, $dst|$dst, $src2}",
    149                    [(set GR32:$dst, (srl GR32:$src1, (i8 imm:$src2)))],
    150                    IIC_SR>, OpSize32;
    151 def SHR64ri : RIi8<0xC1, MRM5r, (outs GR64:$dst), (ins GR64:$src1, i8imm:$src2),
    152                   "shr{q}\t{$src2, $dst|$dst, $src2}",
    153                   [(set GR64:$dst, (srl GR64:$src1, (i8 imm:$src2)))], IIC_SR>;
    154 
    155 // Shift right by 1
    156 def SHR8r1   : I<0xD0, MRM5r, (outs GR8:$dst), (ins GR8:$src1),
    157                  "shr{b}\t$dst",
    158                  [(set GR8:$dst, (srl GR8:$src1, (i8 1)))], IIC_SR>;
    159 def SHR16r1  : I<0xD1, MRM5r, (outs GR16:$dst), (ins GR16:$src1),
    160                  "shr{w}\t$dst",
    161                  [(set GR16:$dst, (srl GR16:$src1, (i8 1)))], IIC_SR>, OpSize16;
    162 def SHR32r1  : I<0xD1, MRM5r, (outs GR32:$dst), (ins GR32:$src1),
    163                  "shr{l}\t$dst",
    164                  [(set GR32:$dst, (srl GR32:$src1, (i8 1)))], IIC_SR>, OpSize32;
    165 def SHR64r1  : RI<0xD1, MRM5r, (outs GR64:$dst), (ins GR64:$src1),
    166                  "shr{q}\t$dst",
    167                  [(set GR64:$dst, (srl GR64:$src1, (i8 1)))], IIC_SR>;
    168 } // Constraints = "$src = $dst", SchedRW
    169 
    170 
    171 let SchedRW = [WriteShiftLd, WriteRMW] in {
    172 let Uses = [CL] in {
    173 def SHR8mCL  : I<0xD2, MRM5m, (outs), (ins i8mem :$dst),
    174                  "shr{b}\t{%cl, $dst|$dst, cl}",
    175                  [(store (srl (loadi8 addr:$dst), CL), addr:$dst)], IIC_SR>;
    176 def SHR16mCL : I<0xD3, MRM5m, (outs), (ins i16mem:$dst),
    177                  "shr{w}\t{%cl, $dst|$dst, cl}",
    178                  [(store (srl (loadi16 addr:$dst), CL), addr:$dst)], IIC_SR>,
    179                  OpSize16;
    180 def SHR32mCL : I<0xD3, MRM5m, (outs), (ins i32mem:$dst),
    181                  "shr{l}\t{%cl, $dst|$dst, cl}",
    182                  [(store (srl (loadi32 addr:$dst), CL), addr:$dst)], IIC_SR>,
    183                  OpSize32;
    184 def SHR64mCL : RI<0xD3, MRM5m, (outs), (ins i64mem:$dst),
    185                   "shr{q}\t{%cl, $dst|$dst, cl}",
    186                   [(store (srl (loadi64 addr:$dst), CL), addr:$dst)], IIC_SR>;
    187 }
    188 def SHR8mi   : Ii8<0xC0, MRM5m, (outs), (ins i8mem :$dst, i8imm:$src),
    189                    "shr{b}\t{$src, $dst|$dst, $src}",
    190                 [(store (srl (loadi8 addr:$dst), (i8 imm:$src)), addr:$dst)],
    191                 IIC_SR>;
    192 def SHR16mi  : Ii8<0xC1, MRM5m, (outs), (ins i16mem:$dst, i8imm:$src),
    193                    "shr{w}\t{$src, $dst|$dst, $src}",
    194                [(store (srl (loadi16 addr:$dst), (i8 imm:$src)), addr:$dst)],
    195                IIC_SR>, OpSize16;
    196 def SHR32mi  : Ii8<0xC1, MRM5m, (outs), (ins i32mem:$dst, i8imm:$src),
    197                    "shr{l}\t{$src, $dst|$dst, $src}",
    198                [(store (srl (loadi32 addr:$dst), (i8 imm:$src)), addr:$dst)],
    199                IIC_SR>, OpSize32;
    200 def SHR64mi : RIi8<0xC1, MRM5m, (outs), (ins i64mem:$dst, i8imm:$src),
    201                   "shr{q}\t{$src, $dst|$dst, $src}",
    202                  [(store (srl (loadi64 addr:$dst), (i8 imm:$src)), addr:$dst)],
    203                  IIC_SR>;
    204 
    205 // Shift by 1
    206 def SHR8m1   : I<0xD0, MRM5m, (outs), (ins i8mem :$dst),
    207                  "shr{b}\t$dst",
    208                 [(store (srl (loadi8 addr:$dst), (i8 1)), addr:$dst)],
    209                 IIC_SR>;
    210 def SHR16m1  : I<0xD1, MRM5m, (outs), (ins i16mem:$dst),
    211                  "shr{w}\t$dst",
    212                [(store (srl (loadi16 addr:$dst), (i8 1)), addr:$dst)],
    213                IIC_SR>, OpSize16;
    214 def SHR32m1  : I<0xD1, MRM5m, (outs), (ins i32mem:$dst),
    215                  "shr{l}\t$dst",
    216                [(store (srl (loadi32 addr:$dst), (i8 1)), addr:$dst)],
    217                IIC_SR>, OpSize32;
    218 def SHR64m1 : RI<0xD1, MRM5m, (outs), (ins i64mem:$dst),
    219                   "shr{q}\t$dst",
    220                  [(store (srl (loadi64 addr:$dst), (i8 1)), addr:$dst)],
    221                  IIC_SR>;
    222 } // SchedRW
    223 
    224 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
    225 let Uses = [CL] in {
    226 def SAR8rCL  : I<0xD2, MRM7r, (outs GR8 :$dst), (ins GR8 :$src1),
    227                  "sar{b}\t{%cl, $dst|$dst, cl}",
    228                  [(set GR8:$dst, (sra GR8:$src1, CL))],
    229                  IIC_SR>;
    230 def SAR16rCL : I<0xD3, MRM7r, (outs GR16:$dst), (ins GR16:$src1),
    231                  "sar{w}\t{%cl, $dst|$dst, cl}",
    232                  [(set GR16:$dst, (sra GR16:$src1, CL))],
    233                  IIC_SR>, OpSize16;
    234 def SAR32rCL : I<0xD3, MRM7r, (outs GR32:$dst), (ins GR32:$src1),
    235                  "sar{l}\t{%cl, $dst|$dst, cl}",
    236                  [(set GR32:$dst, (sra GR32:$src1, CL))],
    237                  IIC_SR>, OpSize32;
    238 def SAR64rCL : RI<0xD3, MRM7r, (outs GR64:$dst), (ins GR64:$src1),
    239                  "sar{q}\t{%cl, $dst|$dst, cl}",
    240                  [(set GR64:$dst, (sra GR64:$src1, CL))],
    241                  IIC_SR>;
    242 }
    243 
    244 def SAR8ri   : Ii8<0xC0, MRM7r, (outs GR8 :$dst), (ins GR8 :$src1, i8imm:$src2),
    245                    "sar{b}\t{$src2, $dst|$dst, $src2}",
    246                    [(set GR8:$dst, (sra GR8:$src1, (i8 imm:$src2)))],
    247                    IIC_SR>;
    248 def SAR16ri  : Ii8<0xC1, MRM7r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$src2),
    249                    "sar{w}\t{$src2, $dst|$dst, $src2}",
    250                    [(set GR16:$dst, (sra GR16:$src1, (i8 imm:$src2)))],
    251                    IIC_SR>, OpSize16;
    252 def SAR32ri  : Ii8<0xC1, MRM7r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$src2),
    253                    "sar{l}\t{$src2, $dst|$dst, $src2}",
    254                    [(set GR32:$dst, (sra GR32:$src1, (i8 imm:$src2)))],
    255                    IIC_SR>, OpSize32;
    256 def SAR64ri  : RIi8<0xC1, MRM7r, (outs GR64:$dst),
    257                     (ins GR64:$src1, i8imm:$src2),
    258                     "sar{q}\t{$src2, $dst|$dst, $src2}",
    259                     [(set GR64:$dst, (sra GR64:$src1, (i8 imm:$src2)))],
    260                     IIC_SR>;
    261 
    262 // Shift by 1
    263 def SAR8r1   : I<0xD0, MRM7r, (outs GR8 :$dst), (ins GR8 :$src1),
    264                  "sar{b}\t$dst",
    265                  [(set GR8:$dst, (sra GR8:$src1, (i8 1)))],
    266                  IIC_SR>;
    267 def SAR16r1  : I<0xD1, MRM7r, (outs GR16:$dst), (ins GR16:$src1),
    268                  "sar{w}\t$dst",
    269                  [(set GR16:$dst, (sra GR16:$src1, (i8 1)))],
    270                  IIC_SR>, OpSize16;
    271 def SAR32r1  : I<0xD1, MRM7r, (outs GR32:$dst), (ins GR32:$src1),
    272                  "sar{l}\t$dst",
    273                  [(set GR32:$dst, (sra GR32:$src1, (i8 1)))],
    274                  IIC_SR>, OpSize32;
    275 def SAR64r1  : RI<0xD1, MRM7r, (outs GR64:$dst), (ins GR64:$src1),
    276                  "sar{q}\t$dst",
    277                  [(set GR64:$dst, (sra GR64:$src1, (i8 1)))],
    278                  IIC_SR>;
    279 } // Constraints = "$src = $dst", SchedRW
    280 
    281 
    282 let SchedRW = [WriteShiftLd, WriteRMW] in {
    283 let Uses = [CL] in {
    284 def SAR8mCL  : I<0xD2, MRM7m, (outs), (ins i8mem :$dst),
    285                  "sar{b}\t{%cl, $dst|$dst, cl}",
    286                  [(store (sra (loadi8 addr:$dst), CL), addr:$dst)],
    287                  IIC_SR>;
    288 def SAR16mCL : I<0xD3, MRM7m, (outs), (ins i16mem:$dst),
    289                  "sar{w}\t{%cl, $dst|$dst, cl}",
    290                  [(store (sra (loadi16 addr:$dst), CL), addr:$dst)],
    291                  IIC_SR>, OpSize16;
    292 def SAR32mCL : I<0xD3, MRM7m, (outs), (ins i32mem:$dst), 
    293                  "sar{l}\t{%cl, $dst|$dst, cl}",
    294                  [(store (sra (loadi32 addr:$dst), CL), addr:$dst)],
    295                  IIC_SR>, OpSize32;
    296 def SAR64mCL : RI<0xD3, MRM7m, (outs), (ins i64mem:$dst), 
    297                  "sar{q}\t{%cl, $dst|$dst, cl}",
    298                  [(store (sra (loadi64 addr:$dst), CL), addr:$dst)],
    299                  IIC_SR>;
    300 }
    301 def SAR8mi   : Ii8<0xC0, MRM7m, (outs), (ins i8mem :$dst, i8imm:$src),
    302                    "sar{b}\t{$src, $dst|$dst, $src}",
    303                 [(store (sra (loadi8 addr:$dst), (i8 imm:$src)), addr:$dst)],
    304                 IIC_SR>;
    305 def SAR16mi  : Ii8<0xC1, MRM7m, (outs), (ins i16mem:$dst, i8imm:$src),
    306                    "sar{w}\t{$src, $dst|$dst, $src}",
    307                [(store (sra (loadi16 addr:$dst), (i8 imm:$src)), addr:$dst)],
    308                IIC_SR>, OpSize16;
    309 def SAR32mi  : Ii8<0xC1, MRM7m, (outs), (ins i32mem:$dst, i8imm:$src),
    310                    "sar{l}\t{$src, $dst|$dst, $src}",
    311                [(store (sra (loadi32 addr:$dst), (i8 imm:$src)), addr:$dst)],
    312                IIC_SR>, OpSize32;
    313 def SAR64mi  : RIi8<0xC1, MRM7m, (outs), (ins i64mem:$dst, i8imm:$src),
    314                     "sar{q}\t{$src, $dst|$dst, $src}",
    315                  [(store (sra (loadi64 addr:$dst), (i8 imm:$src)), addr:$dst)],
    316                  IIC_SR>;
    317 
    318 // Shift by 1
    319 def SAR8m1   : I<0xD0, MRM7m, (outs), (ins i8mem :$dst),
    320                  "sar{b}\t$dst",
    321                 [(store (sra (loadi8 addr:$dst), (i8 1)), addr:$dst)],
    322                 IIC_SR>;
    323 def SAR16m1  : I<0xD1, MRM7m, (outs), (ins i16mem:$dst),
    324                  "sar{w}\t$dst",
    325                [(store (sra (loadi16 addr:$dst), (i8 1)), addr:$dst)],
    326                IIC_SR>, OpSize16;
    327 def SAR32m1  : I<0xD1, MRM7m, (outs), (ins i32mem:$dst),
    328                  "sar{l}\t$dst",
    329                [(store (sra (loadi32 addr:$dst), (i8 1)), addr:$dst)],
    330                IIC_SR>, OpSize32;
    331 def SAR64m1 : RI<0xD1, MRM7m, (outs), (ins i64mem:$dst),
    332                   "sar{q}\t$dst",
    333                  [(store (sra (loadi64 addr:$dst), (i8 1)), addr:$dst)],
    334                  IIC_SR>;
    335 } // SchedRW
    336 
    337 //===----------------------------------------------------------------------===//
    338 // Rotate instructions
    339 //===----------------------------------------------------------------------===//
    340 
    341 let hasSideEffects = 0 in {
    342 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
    343 def RCL8r1 : I<0xD0, MRM2r, (outs GR8:$dst), (ins GR8:$src1),
    344                "rcl{b}\t$dst", [], IIC_SR>;
    345 def RCL8ri : Ii8<0xC0, MRM2r, (outs GR8:$dst), (ins GR8:$src1, i8imm:$cnt),
    346                  "rcl{b}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    347 let Uses = [CL] in
    348 def RCL8rCL : I<0xD2, MRM2r, (outs GR8:$dst), (ins GR8:$src1),
    349                 "rcl{b}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    350   
    351 def RCL16r1 : I<0xD1, MRM2r, (outs GR16:$dst), (ins GR16:$src1),
    352                 "rcl{w}\t$dst", [], IIC_SR>, OpSize16;
    353 def RCL16ri : Ii8<0xC1, MRM2r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$cnt),
    354                   "rcl{w}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize16;
    355 let Uses = [CL] in
    356 def RCL16rCL : I<0xD3, MRM2r, (outs GR16:$dst), (ins GR16:$src1),
    357                  "rcl{w}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize16;
    358 
    359 def RCL32r1 : I<0xD1, MRM2r, (outs GR32:$dst), (ins GR32:$src1),
    360                 "rcl{l}\t$dst", [], IIC_SR>, OpSize32;
    361 def RCL32ri : Ii8<0xC1, MRM2r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$cnt),
    362                   "rcl{l}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize32;
    363 let Uses = [CL] in
    364 def RCL32rCL : I<0xD3, MRM2r, (outs GR32:$dst), (ins GR32:$src1),
    365                  "rcl{l}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize32;
    366 
    367 
    368 def RCL64r1 : RI<0xD1, MRM2r, (outs GR64:$dst), (ins GR64:$src1),
    369                  "rcl{q}\t$dst", [], IIC_SR>;
    370 def RCL64ri : RIi8<0xC1, MRM2r, (outs GR64:$dst), (ins GR64:$src1, i8imm:$cnt),
    371                    "rcl{q}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    372 let Uses = [CL] in
    373 def RCL64rCL : RI<0xD3, MRM2r, (outs GR64:$dst), (ins GR64:$src1),
    374                   "rcl{q}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    375 
    376 
    377 def RCR8r1 : I<0xD0, MRM3r, (outs GR8:$dst), (ins GR8:$src1),
    378                "rcr{b}\t$dst", [], IIC_SR>;
    379 def RCR8ri : Ii8<0xC0, MRM3r, (outs GR8:$dst), (ins GR8:$src1, i8imm:$cnt),
    380                  "rcr{b}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    381 let Uses = [CL] in
    382 def RCR8rCL : I<0xD2, MRM3r, (outs GR8:$dst), (ins GR8:$src1),
    383                 "rcr{b}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    384   
    385 def RCR16r1 : I<0xD1, MRM3r, (outs GR16:$dst), (ins GR16:$src1),
    386                 "rcr{w}\t$dst", [], IIC_SR>, OpSize16;
    387 def RCR16ri : Ii8<0xC1, MRM3r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$cnt),
    388                   "rcr{w}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize16;
    389 let Uses = [CL] in
    390 def RCR16rCL : I<0xD3, MRM3r, (outs GR16:$dst), (ins GR16:$src1),
    391                  "rcr{w}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize16;
    392 
    393 def RCR32r1 : I<0xD1, MRM3r, (outs GR32:$dst), (ins GR32:$src1),
    394                 "rcr{l}\t$dst", [], IIC_SR>, OpSize32;
    395 def RCR32ri : Ii8<0xC1, MRM3r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$cnt),
    396                   "rcr{l}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize32;
    397 let Uses = [CL] in
    398 def RCR32rCL : I<0xD3, MRM3r, (outs GR32:$dst), (ins GR32:$src1),
    399                  "rcr{l}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize32;
    400                  
    401 def RCR64r1 : RI<0xD1, MRM3r, (outs GR64:$dst), (ins GR64:$src1),
    402                  "rcr{q}\t$dst", [], IIC_SR>;
    403 def RCR64ri : RIi8<0xC1, MRM3r, (outs GR64:$dst), (ins GR64:$src1, i8imm:$cnt),
    404                    "rcr{q}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    405 let Uses = [CL] in
    406 def RCR64rCL : RI<0xD3, MRM3r, (outs GR64:$dst), (ins GR64:$src1),
    407                   "rcr{q}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    408 
    409 } // Constraints = "$src = $dst"
    410 
    411 let SchedRW = [WriteShiftLd, WriteRMW] in {
    412 def RCL8m1 : I<0xD0, MRM2m, (outs), (ins i8mem:$dst),
    413                "rcl{b}\t$dst", [], IIC_SR>;
    414 def RCL8mi : Ii8<0xC0, MRM2m, (outs), (ins i8mem:$dst, i8imm:$cnt),
    415                  "rcl{b}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    416 def RCL16m1 : I<0xD1, MRM2m, (outs), (ins i16mem:$dst),
    417                 "rcl{w}\t$dst", [], IIC_SR>, OpSize16;
    418 def RCL16mi : Ii8<0xC1, MRM2m, (outs), (ins i16mem:$dst, i8imm:$cnt),
    419                   "rcl{w}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize16;
    420 def RCL32m1 : I<0xD1, MRM2m, (outs), (ins i32mem:$dst),
    421                 "rcl{l}\t$dst", [], IIC_SR>, OpSize32;
    422 def RCL32mi : Ii8<0xC1, MRM2m, (outs), (ins i32mem:$dst, i8imm:$cnt),
    423                   "rcl{l}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize32;
    424 def RCL64m1 : RI<0xD1, MRM2m, (outs), (ins i64mem:$dst),
    425                  "rcl{q}\t$dst", [], IIC_SR>;
    426 def RCL64mi : RIi8<0xC1, MRM2m, (outs), (ins i64mem:$dst, i8imm:$cnt),
    427                    "rcl{q}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    428 
    429 def RCR8m1 : I<0xD0, MRM3m, (outs), (ins i8mem:$dst),
    430                "rcr{b}\t$dst", [], IIC_SR>;
    431 def RCR8mi : Ii8<0xC0, MRM3m, (outs), (ins i8mem:$dst, i8imm:$cnt),
    432                  "rcr{b}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    433 def RCR16m1 : I<0xD1, MRM3m, (outs), (ins i16mem:$dst),
    434                 "rcr{w}\t$dst", [], IIC_SR>, OpSize16;
    435 def RCR16mi : Ii8<0xC1, MRM3m, (outs), (ins i16mem:$dst, i8imm:$cnt),
    436                   "rcr{w}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize16;
    437 def RCR32m1 : I<0xD1, MRM3m, (outs), (ins i32mem:$dst),
    438                 "rcr{l}\t$dst", [], IIC_SR>, OpSize32;
    439 def RCR32mi : Ii8<0xC1, MRM3m, (outs), (ins i32mem:$dst, i8imm:$cnt),
    440                   "rcr{l}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>, OpSize32;
    441 def RCR64m1 : RI<0xD1, MRM3m, (outs), (ins i64mem:$dst),
    442                  "rcr{q}\t$dst", [], IIC_SR>;
    443 def RCR64mi : RIi8<0xC1, MRM3m, (outs), (ins i64mem:$dst, i8imm:$cnt),
    444                    "rcr{q}\t{$cnt, $dst|$dst, $cnt}", [], IIC_SR>;
    445 
    446 let Uses = [CL] in {
    447 def RCL8mCL : I<0xD2, MRM2m, (outs), (ins i8mem:$dst),
    448                 "rcl{b}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    449 def RCL16mCL : I<0xD3, MRM2m, (outs), (ins i16mem:$dst),
    450                  "rcl{w}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize16;
    451 def RCL32mCL : I<0xD3, MRM2m, (outs), (ins i32mem:$dst),
    452                  "rcl{l}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize32;
    453 def RCL64mCL : RI<0xD3, MRM2m, (outs), (ins i64mem:$dst),
    454                   "rcl{q}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    455 
    456 def RCR8mCL : I<0xD2, MRM3m, (outs), (ins i8mem:$dst),
    457                 "rcr{b}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    458 def RCR16mCL : I<0xD3, MRM3m, (outs), (ins i16mem:$dst),
    459                  "rcr{w}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize16;
    460 def RCR32mCL : I<0xD3, MRM3m, (outs), (ins i32mem:$dst),
    461                  "rcr{l}\t{%cl, $dst|$dst, cl}", [], IIC_SR>, OpSize32;
    462 def RCR64mCL : RI<0xD3, MRM3m, (outs), (ins i64mem:$dst),
    463                   "rcr{q}\t{%cl, $dst|$dst, cl}", [], IIC_SR>;
    464 }
    465 } // SchedRW
    466 } // hasSideEffects = 0
    467 
    468 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
    469 // FIXME: provide shorter instructions when imm8 == 1
    470 let Uses = [CL] in {
    471 def ROL8rCL  : I<0xD2, MRM0r, (outs GR8 :$dst), (ins GR8 :$src1),
    472                  "rol{b}\t{%cl, $dst|$dst, cl}",
    473                  [(set GR8:$dst, (rotl GR8:$src1, CL))], IIC_SR>;
    474 def ROL16rCL : I<0xD3, MRM0r, (outs GR16:$dst), (ins GR16:$src1),
    475                  "rol{w}\t{%cl, $dst|$dst, cl}",
    476                  [(set GR16:$dst, (rotl GR16:$src1, CL))], IIC_SR>, OpSize16;
    477 def ROL32rCL : I<0xD3, MRM0r, (outs GR32:$dst), (ins GR32:$src1),
    478                  "rol{l}\t{%cl, $dst|$dst, cl}",
    479                  [(set GR32:$dst, (rotl GR32:$src1, CL))], IIC_SR>, OpSize32;
    480 def ROL64rCL : RI<0xD3, MRM0r, (outs GR64:$dst), (ins GR64:$src1),
    481                   "rol{q}\t{%cl, $dst|$dst, cl}",
    482                   [(set GR64:$dst, (rotl GR64:$src1, CL))], IIC_SR>;
    483 }
    484 
    485 def ROL8ri   : Ii8<0xC0, MRM0r, (outs GR8 :$dst), (ins GR8 :$src1, i8imm:$src2),
    486                    "rol{b}\t{$src2, $dst|$dst, $src2}",
    487                    [(set GR8:$dst, (rotl GR8:$src1, (i8 imm:$src2)))], IIC_SR>;
    488 def ROL16ri  : Ii8<0xC1, MRM0r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$src2),
    489                    "rol{w}\t{$src2, $dst|$dst, $src2}",
    490                    [(set GR16:$dst, (rotl GR16:$src1, (i8 imm:$src2)))],
    491                    IIC_SR>, OpSize16;
    492 def ROL32ri  : Ii8<0xC1, MRM0r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$src2),
    493                    "rol{l}\t{$src2, $dst|$dst, $src2}",
    494                    [(set GR32:$dst, (rotl GR32:$src1, (i8 imm:$src2)))],
    495                    IIC_SR>, OpSize32;
    496 def ROL64ri  : RIi8<0xC1, MRM0r, (outs GR64:$dst), 
    497                     (ins GR64:$src1, i8imm:$src2),
    498                     "rol{q}\t{$src2, $dst|$dst, $src2}",
    499                     [(set GR64:$dst, (rotl GR64:$src1, (i8 imm:$src2)))],
    500                     IIC_SR>;
    501 
    502 // Rotate by 1
    503 def ROL8r1   : I<0xD0, MRM0r, (outs GR8 :$dst), (ins GR8 :$src1),
    504                  "rol{b}\t$dst",
    505                  [(set GR8:$dst, (rotl GR8:$src1, (i8 1)))],
    506                  IIC_SR>;
    507 def ROL16r1  : I<0xD1, MRM0r, (outs GR16:$dst), (ins GR16:$src1),
    508                  "rol{w}\t$dst",
    509                  [(set GR16:$dst, (rotl GR16:$src1, (i8 1)))],
    510                  IIC_SR>, OpSize16;
    511 def ROL32r1  : I<0xD1, MRM0r, (outs GR32:$dst), (ins GR32:$src1),
    512                  "rol{l}\t$dst",
    513                  [(set GR32:$dst, (rotl GR32:$src1, (i8 1)))],
    514                  IIC_SR>, OpSize32;
    515 def ROL64r1  : RI<0xD1, MRM0r, (outs GR64:$dst), (ins GR64:$src1),
    516                   "rol{q}\t$dst",
    517                   [(set GR64:$dst, (rotl GR64:$src1, (i8 1)))],
    518                   IIC_SR>;
    519 } // Constraints = "$src = $dst", SchedRW
    520 
    521 let SchedRW = [WriteShiftLd, WriteRMW] in {
    522 let Uses = [CL] in {
    523 def ROL8mCL  : I<0xD2, MRM0m, (outs), (ins i8mem :$dst),
    524                  "rol{b}\t{%cl, $dst|$dst, cl}",
    525                  [(store (rotl (loadi8 addr:$dst), CL), addr:$dst)],
    526                  IIC_SR>;
    527 def ROL16mCL : I<0xD3, MRM0m, (outs), (ins i16mem:$dst),
    528                  "rol{w}\t{%cl, $dst|$dst, cl}",
    529                  [(store (rotl (loadi16 addr:$dst), CL), addr:$dst)],
    530                  IIC_SR>, OpSize16;
    531 def ROL32mCL : I<0xD3, MRM0m, (outs), (ins i32mem:$dst),
    532                  "rol{l}\t{%cl, $dst|$dst, cl}",
    533                  [(store (rotl (loadi32 addr:$dst), CL), addr:$dst)],
    534                  IIC_SR>, OpSize32;
    535 def ROL64mCL :  RI<0xD3, MRM0m, (outs), (ins i64mem:$dst),
    536                    "rol{q}\t{%cl, $dst|$dst, cl}",
    537                    [(store (rotl (loadi64 addr:$dst), CL), addr:$dst)],
    538                    IIC_SR>;
    539 }
    540 def ROL8mi   : Ii8<0xC0, MRM0m, (outs), (ins i8mem :$dst, i8imm:$src1),
    541                    "rol{b}\t{$src1, $dst|$dst, $src1}",
    542                [(store (rotl (loadi8 addr:$dst), (i8 imm:$src1)), addr:$dst)],
    543                IIC_SR>;
    544 def ROL16mi  : Ii8<0xC1, MRM0m, (outs), (ins i16mem:$dst, i8imm:$src1),
    545                    "rol{w}\t{$src1, $dst|$dst, $src1}",
    546               [(store (rotl (loadi16 addr:$dst), (i8 imm:$src1)), addr:$dst)],
    547               IIC_SR>, OpSize16;
    548 def ROL32mi  : Ii8<0xC1, MRM0m, (outs), (ins i32mem:$dst, i8imm:$src1),
    549                    "rol{l}\t{$src1, $dst|$dst, $src1}",
    550               [(store (rotl (loadi32 addr:$dst), (i8 imm:$src1)), addr:$dst)],
    551               IIC_SR>, OpSize32;
    552 def ROL64mi  : RIi8<0xC1, MRM0m, (outs), (ins i64mem:$dst, i8imm:$src1),
    553                     "rol{q}\t{$src1, $dst|$dst, $src1}",
    554                 [(store (rotl (loadi64 addr:$dst), (i8 imm:$src1)), addr:$dst)],
    555                 IIC_SR>;
    556 
    557 // Rotate by 1
    558 def ROL8m1   : I<0xD0, MRM0m, (outs), (ins i8mem :$dst),
    559                  "rol{b}\t$dst",
    560                [(store (rotl (loadi8 addr:$dst), (i8 1)), addr:$dst)],
    561                IIC_SR>;
    562 def ROL16m1  : I<0xD1, MRM0m, (outs), (ins i16mem:$dst),
    563                  "rol{w}\t$dst",
    564               [(store (rotl (loadi16 addr:$dst), (i8 1)), addr:$dst)],
    565               IIC_SR>, OpSize16;
    566 def ROL32m1  : I<0xD1, MRM0m, (outs), (ins i32mem:$dst),
    567                  "rol{l}\t$dst",
    568               [(store (rotl (loadi32 addr:$dst), (i8 1)), addr:$dst)],
    569               IIC_SR>, OpSize32;
    570 def ROL64m1  : RI<0xD1, MRM0m, (outs), (ins i64mem:$dst),
    571                  "rol{q}\t$dst",
    572                [(store (rotl (loadi64 addr:$dst), (i8 1)), addr:$dst)],
    573                IIC_SR>;
    574 } // SchedRW
    575 
    576 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
    577 let Uses = [CL] in {
    578 def ROR8rCL  : I<0xD2, MRM1r, (outs GR8 :$dst), (ins GR8 :$src1),
    579                  "ror{b}\t{%cl, $dst|$dst, cl}",
    580                  [(set GR8:$dst, (rotr GR8:$src1, CL))], IIC_SR>;
    581 def ROR16rCL : I<0xD3, MRM1r, (outs GR16:$dst), (ins GR16:$src1),
    582                  "ror{w}\t{%cl, $dst|$dst, cl}",
    583                  [(set GR16:$dst, (rotr GR16:$src1, CL))], IIC_SR>, OpSize16;
    584 def ROR32rCL : I<0xD3, MRM1r, (outs GR32:$dst), (ins GR32:$src1),
    585                  "ror{l}\t{%cl, $dst|$dst, cl}",
    586                  [(set GR32:$dst, (rotr GR32:$src1, CL))], IIC_SR>, OpSize32;
    587 def ROR64rCL : RI<0xD3, MRM1r, (outs GR64:$dst), (ins GR64:$src1),
    588                   "ror{q}\t{%cl, $dst|$dst, cl}",
    589                   [(set GR64:$dst, (rotr GR64:$src1, CL))], IIC_SR>;
    590 }
    591 
    592 def ROR8ri   : Ii8<0xC0, MRM1r, (outs GR8 :$dst), (ins GR8 :$src1, i8imm:$src2),
    593                    "ror{b}\t{$src2, $dst|$dst, $src2}",
    594                    [(set GR8:$dst, (rotr GR8:$src1, (i8 imm:$src2)))], IIC_SR>;
    595 def ROR16ri  : Ii8<0xC1, MRM1r, (outs GR16:$dst), (ins GR16:$src1, i8imm:$src2),
    596                    "ror{w}\t{$src2, $dst|$dst, $src2}",
    597                    [(set GR16:$dst, (rotr GR16:$src1, (i8 imm:$src2)))],
    598                    IIC_SR>, OpSize16;
    599 def ROR32ri  : Ii8<0xC1, MRM1r, (outs GR32:$dst), (ins GR32:$src1, i8imm:$src2),
    600                    "ror{l}\t{$src2, $dst|$dst, $src2}",
    601                    [(set GR32:$dst, (rotr GR32:$src1, (i8 imm:$src2)))],
    602                    IIC_SR>, OpSize32;
    603 def ROR64ri  : RIi8<0xC1, MRM1r, (outs GR64:$dst), 
    604                     (ins GR64:$src1, i8imm:$src2),
    605                     "ror{q}\t{$src2, $dst|$dst, $src2}",
    606                     [(set GR64:$dst, (rotr GR64:$src1, (i8 imm:$src2)))],
    607                     IIC_SR>;
    608 
    609 // Rotate by 1
    610 def ROR8r1   : I<0xD0, MRM1r, (outs GR8 :$dst), (ins GR8 :$src1),
    611                  "ror{b}\t$dst",
    612                  [(set GR8:$dst, (rotr GR8:$src1, (i8 1)))],
    613                  IIC_SR>;
    614 def ROR16r1  : I<0xD1, MRM1r, (outs GR16:$dst), (ins GR16:$src1),
    615                  "ror{w}\t$dst",
    616                  [(set GR16:$dst, (rotr GR16:$src1, (i8 1)))],
    617                  IIC_SR>, OpSize16;
    618 def ROR32r1  : I<0xD1, MRM1r, (outs GR32:$dst), (ins GR32:$src1),
    619                  "ror{l}\t$dst",
    620                  [(set GR32:$dst, (rotr GR32:$src1, (i8 1)))],
    621                  IIC_SR>, OpSize32;
    622 def ROR64r1  : RI<0xD1, MRM1r, (outs GR64:$dst), (ins GR64:$src1),
    623                   "ror{q}\t$dst",
    624                   [(set GR64:$dst, (rotr GR64:$src1, (i8 1)))],
    625                   IIC_SR>;
    626 } // Constraints = "$src = $dst", SchedRW
    627 
    628 let SchedRW = [WriteShiftLd, WriteRMW] in {
    629 let Uses = [CL] in {
    630 def ROR8mCL  : I<0xD2, MRM1m, (outs), (ins i8mem :$dst),
    631                  "ror{b}\t{%cl, $dst|$dst, cl}",
    632                  [(store (rotr (loadi8 addr:$dst), CL), addr:$dst)],
    633                  IIC_SR>;
    634 def ROR16mCL : I<0xD3, MRM1m, (outs), (ins i16mem:$dst),
    635                  "ror{w}\t{%cl, $dst|$dst, cl}",
    636                  [(store (rotr (loadi16 addr:$dst), CL), addr:$dst)],
    637                  IIC_SR>, OpSize16;
    638 def ROR32mCL : I<0xD3, MRM1m, (outs), (ins i32mem:$dst), 
    639                  "ror{l}\t{%cl, $dst|$dst, cl}",
    640                  [(store (rotr (loadi32 addr:$dst), CL), addr:$dst)],
    641                  IIC_SR>, OpSize32;
    642 def ROR64mCL : RI<0xD3, MRM1m, (outs), (ins i64mem:$dst), 
    643                   "ror{q}\t{%cl, $dst|$dst, cl}",
    644                   [(store (rotr (loadi64 addr:$dst), CL), addr:$dst)],
    645                   IIC_SR>;
    646 }
    647 def ROR8mi   : Ii8<0xC0, MRM1m, (outs), (ins i8mem :$dst, i8imm:$src),
    648                    "ror{b}\t{$src, $dst|$dst, $src}",
    649                [(store (rotr (loadi8 addr:$dst), (i8 imm:$src)), addr:$dst)],
    650                IIC_SR>;
    651 def ROR16mi  : Ii8<0xC1, MRM1m, (outs), (ins i16mem:$dst, i8imm:$src),
    652                    "ror{w}\t{$src, $dst|$dst, $src}",
    653               [(store (rotr (loadi16 addr:$dst), (i8 imm:$src)), addr:$dst)],
    654               IIC_SR>, OpSize16;
    655 def ROR32mi  : Ii8<0xC1, MRM1m, (outs), (ins i32mem:$dst, i8imm:$src),
    656                    "ror{l}\t{$src, $dst|$dst, $src}",
    657               [(store (rotr (loadi32 addr:$dst), (i8 imm:$src)), addr:$dst)],
    658               IIC_SR>, OpSize32;
    659 def ROR64mi  : RIi8<0xC1, MRM1m, (outs), (ins i64mem:$dst, i8imm:$src),
    660                     "ror{q}\t{$src, $dst|$dst, $src}",
    661                 [(store (rotr (loadi64 addr:$dst), (i8 imm:$src)), addr:$dst)],
    662                 IIC_SR>;
    663 
    664 // Rotate by 1
    665 def ROR8m1   : I<0xD0, MRM1m, (outs), (ins i8mem :$dst),
    666                  "ror{b}\t$dst",
    667                [(store (rotr (loadi8 addr:$dst), (i8 1)), addr:$dst)],
    668                IIC_SR>;
    669 def ROR16m1  : I<0xD1, MRM1m, (outs), (ins i16mem:$dst),
    670                  "ror{w}\t$dst",
    671               [(store (rotr (loadi16 addr:$dst), (i8 1)), addr:$dst)],
    672               IIC_SR>, OpSize16;
    673 def ROR32m1  : I<0xD1, MRM1m, (outs), (ins i32mem:$dst),
    674                  "ror{l}\t$dst",
    675               [(store (rotr (loadi32 addr:$dst), (i8 1)), addr:$dst)],
    676               IIC_SR>, OpSize32;
    677 def ROR64m1  : RI<0xD1, MRM1m, (outs), (ins i64mem:$dst),
    678                  "ror{q}\t$dst",
    679                [(store (rotr (loadi64 addr:$dst), (i8 1)), addr:$dst)],
    680                IIC_SR>;
    681 } // SchedRW
    682 
    683 
    684 //===----------------------------------------------------------------------===//
    685 // Double shift instructions (generalizations of rotate)
    686 //===----------------------------------------------------------------------===//
    687 
    688 let Constraints = "$src1 = $dst", SchedRW = [WriteShift] in {
    689 
    690 let Uses = [CL] in {
    691 def SHLD16rrCL : I<0xA5, MRMDestReg, (outs GR16:$dst), 
    692                    (ins GR16:$src1, GR16:$src2),
    693                    "shld{w}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    694                    [(set GR16:$dst, (X86shld GR16:$src1, GR16:$src2, CL))],
    695                     IIC_SHD16_REG_CL>,
    696                    TB, OpSize16;
    697 def SHRD16rrCL : I<0xAD, MRMDestReg, (outs GR16:$dst), 
    698                    (ins GR16:$src1, GR16:$src2),
    699                    "shrd{w}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    700                    [(set GR16:$dst, (X86shrd GR16:$src1, GR16:$src2, CL))],
    701                     IIC_SHD16_REG_CL>,
    702                    TB, OpSize16;
    703 def SHLD32rrCL : I<0xA5, MRMDestReg, (outs GR32:$dst), 
    704                    (ins GR32:$src1, GR32:$src2),
    705                    "shld{l}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    706                    [(set GR32:$dst, (X86shld GR32:$src1, GR32:$src2, CL))],
    707                     IIC_SHD32_REG_CL>, TB, OpSize32;
    708 def SHRD32rrCL : I<0xAD, MRMDestReg, (outs GR32:$dst),
    709                    (ins GR32:$src1, GR32:$src2),
    710                    "shrd{l}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    711                    [(set GR32:$dst, (X86shrd GR32:$src1, GR32:$src2, CL))],
    712                    IIC_SHD32_REG_CL>, TB, OpSize32;
    713 def SHLD64rrCL : RI<0xA5, MRMDestReg, (outs GR64:$dst), 
    714                     (ins GR64:$src1, GR64:$src2),
    715                     "shld{q}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    716                     [(set GR64:$dst, (X86shld GR64:$src1, GR64:$src2, CL))],
    717                     IIC_SHD64_REG_CL>, 
    718                     TB;
    719 def SHRD64rrCL : RI<0xAD, MRMDestReg, (outs GR64:$dst), 
    720                     (ins GR64:$src1, GR64:$src2),
    721                     "shrd{q}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    722                     [(set GR64:$dst, (X86shrd GR64:$src1, GR64:$src2, CL))],
    723                     IIC_SHD64_REG_CL>, 
    724                     TB;
    725 }
    726 
    727 let isCommutable = 1 in {  // These instructions commute to each other.
    728 def SHLD16rri8 : Ii8<0xA4, MRMDestReg,
    729                      (outs GR16:$dst), 
    730                      (ins GR16:$src1, GR16:$src2, i8imm:$src3),
    731                      "shld{w}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    732                      [(set GR16:$dst, (X86shld GR16:$src1, GR16:$src2,
    733                                       (i8 imm:$src3)))], IIC_SHD16_REG_IM>,
    734                      TB, OpSize16;
    735 def SHRD16rri8 : Ii8<0xAC, MRMDestReg,
    736                      (outs GR16:$dst), 
    737                      (ins GR16:$src1, GR16:$src2, i8imm:$src3),
    738                      "shrd{w}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    739                      [(set GR16:$dst, (X86shrd GR16:$src1, GR16:$src2,
    740                                       (i8 imm:$src3)))], IIC_SHD16_REG_IM>,
    741                      TB, OpSize16;
    742 def SHLD32rri8 : Ii8<0xA4, MRMDestReg,
    743                      (outs GR32:$dst), 
    744                      (ins GR32:$src1, GR32:$src2, i8imm:$src3),
    745                      "shld{l}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    746                      [(set GR32:$dst, (X86shld GR32:$src1, GR32:$src2,
    747                                       (i8 imm:$src3)))], IIC_SHD32_REG_IM>,
    748                  TB, OpSize32;
    749 def SHRD32rri8 : Ii8<0xAC, MRMDestReg,
    750                      (outs GR32:$dst), 
    751                      (ins GR32:$src1, GR32:$src2, i8imm:$src3),
    752                      "shrd{l}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    753                      [(set GR32:$dst, (X86shrd GR32:$src1, GR32:$src2,
    754                                       (i8 imm:$src3)))], IIC_SHD32_REG_IM>,
    755                  TB, OpSize32;
    756 def SHLD64rri8 : RIi8<0xA4, MRMDestReg,
    757                       (outs GR64:$dst), 
    758                       (ins GR64:$src1, GR64:$src2, i8imm:$src3),
    759                       "shld{q}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    760                       [(set GR64:$dst, (X86shld GR64:$src1, GR64:$src2,
    761                                        (i8 imm:$src3)))], IIC_SHD64_REG_IM>,
    762                  TB;
    763 def SHRD64rri8 : RIi8<0xAC, MRMDestReg,
    764                       (outs GR64:$dst), 
    765                       (ins GR64:$src1, GR64:$src2, i8imm:$src3),
    766                       "shrd{q}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    767                       [(set GR64:$dst, (X86shrd GR64:$src1, GR64:$src2,
    768                                        (i8 imm:$src3)))], IIC_SHD64_REG_IM>,
    769                  TB;
    770 }
    771 } // Constraints = "$src = $dst", SchedRW
    772 
    773 let SchedRW = [WriteShiftLd, WriteRMW] in {
    774 let Uses = [CL] in {
    775 def SHLD16mrCL : I<0xA5, MRMDestMem, (outs), (ins i16mem:$dst, GR16:$src2),
    776                    "shld{w}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    777                    [(store (X86shld (loadi16 addr:$dst), GR16:$src2, CL),
    778                      addr:$dst)], IIC_SHD16_MEM_CL>, TB, OpSize16;
    779 def SHRD16mrCL : I<0xAD, MRMDestMem, (outs), (ins i16mem:$dst, GR16:$src2),
    780                   "shrd{w}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    781                   [(store (X86shrd (loadi16 addr:$dst), GR16:$src2, CL),
    782                     addr:$dst)], IIC_SHD16_MEM_CL>, TB, OpSize16;
    783 
    784 def SHLD32mrCL : I<0xA5, MRMDestMem, (outs), (ins i32mem:$dst, GR32:$src2),
    785                    "shld{l}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    786                    [(store (X86shld (loadi32 addr:$dst), GR32:$src2, CL),
    787                      addr:$dst)], IIC_SHD32_MEM_CL>, TB, OpSize32;
    788 def SHRD32mrCL : I<0xAD, MRMDestMem, (outs), (ins i32mem:$dst, GR32:$src2),
    789                   "shrd{l}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    790                   [(store (X86shrd (loadi32 addr:$dst), GR32:$src2, CL),
    791                     addr:$dst)], IIC_SHD32_MEM_CL>, TB, OpSize32;
    792                     
    793 def SHLD64mrCL : RI<0xA5, MRMDestMem, (outs), (ins i64mem:$dst, GR64:$src2),
    794                     "shld{q}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    795                     [(store (X86shld (loadi64 addr:$dst), GR64:$src2, CL),
    796                       addr:$dst)], IIC_SHD64_MEM_CL>, TB;
    797 def SHRD64mrCL : RI<0xAD, MRMDestMem, (outs), (ins i64mem:$dst, GR64:$src2),
    798                     "shrd{q}\t{%cl, $src2, $dst|$dst, $src2, cl}",
    799                     [(store (X86shrd (loadi64 addr:$dst), GR64:$src2, CL),
    800                       addr:$dst)], IIC_SHD64_MEM_CL>, TB;
    801 }
    802 
    803 def SHLD16mri8 : Ii8<0xA4, MRMDestMem,
    804                     (outs), (ins i16mem:$dst, GR16:$src2, i8imm:$src3),
    805                     "shld{w}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    806                     [(store (X86shld (loadi16 addr:$dst), GR16:$src2,
    807                                       (i8 imm:$src3)), addr:$dst)],
    808                                       IIC_SHD16_MEM_IM>,
    809                     TB, OpSize16;
    810 def SHRD16mri8 : Ii8<0xAC, MRMDestMem, 
    811                      (outs), (ins i16mem:$dst, GR16:$src2, i8imm:$src3),
    812                      "shrd{w}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    813                     [(store (X86shrd (loadi16 addr:$dst), GR16:$src2,
    814                                       (i8 imm:$src3)), addr:$dst)],
    815                                       IIC_SHD16_MEM_IM>,
    816                      TB, OpSize16;
    817 
    818 def SHLD32mri8 : Ii8<0xA4, MRMDestMem,
    819                     (outs), (ins i32mem:$dst, GR32:$src2, i8imm:$src3),
    820                     "shld{l}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    821                     [(store (X86shld (loadi32 addr:$dst), GR32:$src2,
    822                                       (i8 imm:$src3)), addr:$dst)],
    823                                       IIC_SHD32_MEM_IM>,
    824                     TB, OpSize32;
    825 def SHRD32mri8 : Ii8<0xAC, MRMDestMem, 
    826                      (outs), (ins i32mem:$dst, GR32:$src2, i8imm:$src3),
    827                      "shrd{l}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    828                      [(store (X86shrd (loadi32 addr:$dst), GR32:$src2,
    829                                        (i8 imm:$src3)), addr:$dst)],
    830                                        IIC_SHD32_MEM_IM>,
    831                      TB, OpSize32;
    832 
    833 def SHLD64mri8 : RIi8<0xA4, MRMDestMem,
    834                       (outs), (ins i64mem:$dst, GR64:$src2, i8imm:$src3),
    835                       "shld{q}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    836                       [(store (X86shld (loadi64 addr:$dst), GR64:$src2,
    837                                        (i8 imm:$src3)), addr:$dst)],
    838                                        IIC_SHD64_MEM_IM>,
    839                  TB;
    840 def SHRD64mri8 : RIi8<0xAC, MRMDestMem, 
    841                       (outs), (ins i64mem:$dst, GR64:$src2, i8imm:$src3),
    842                       "shrd{q}\t{$src3, $src2, $dst|$dst, $src2, $src3}",
    843                       [(store (X86shrd (loadi64 addr:$dst), GR64:$src2,
    844                                        (i8 imm:$src3)), addr:$dst)],
    845                                        IIC_SHD64_MEM_IM>,
    846                  TB;
    847 } // SchedRW
    848 
    849 } // Defs = [EFLAGS]
    850 
    851 def ROT32L2R_imm8  : SDNodeXForm<imm, [{
    852   // Convert a ROTL shamt to a ROTR shamt on 32-bit integer.
    853   return getI8Imm(32 - N->getZExtValue());
    854 }]>;
    855 
    856 def ROT64L2R_imm8  : SDNodeXForm<imm, [{
    857   // Convert a ROTL shamt to a ROTR shamt on 64-bit integer.
    858   return getI8Imm(64 - N->getZExtValue());
    859 }]>;
    860 
    861 multiclass bmi_rotate<string asm, RegisterClass RC, X86MemOperand x86memop> {
    862 let neverHasSideEffects = 1 in {
    863   def ri : Ii8<0xF0, MRMSrcReg, (outs RC:$dst), (ins RC:$src1, i8imm:$src2),
    864                !strconcat(asm, "\t{$src2, $src1, $dst|$dst, $src1, $src2}"),
    865                []>, TAXD, VEX, Sched<[WriteShift]>;
    866   let mayLoad = 1 in
    867   def mi : Ii8<0xF0, MRMSrcMem, (outs RC:$dst),
    868                (ins x86memop:$src1, i8imm:$src2),
    869                !strconcat(asm, "\t{$src2, $src1, $dst|$dst, $src1, $src2}"),
    870                []>, TAXD, VEX, Sched<[WriteShiftLd]>;
    871 }
    872 }
    873 
    874 multiclass bmi_shift<string asm, RegisterClass RC, X86MemOperand x86memop> {
    875 let neverHasSideEffects = 1 in {
    876   def rr : I<0xF7, MRMSrcReg, (outs RC:$dst), (ins RC:$src1, RC:$src2),
    877              !strconcat(asm, "\t{$src2, $src1, $dst|$dst, $src1, $src2}"), []>,
    878              VEX_4VOp3, Sched<[WriteShift]>;
    879   let mayLoad = 1 in
    880   def rm : I<0xF7, MRMSrcMem, (outs RC:$dst), (ins x86memop:$src1, RC:$src2),
    881              !strconcat(asm, "\t{$src2, $src1, $dst|$dst, $src1, $src2}"), []>,
    882              VEX_4VOp3,
    883              Sched<[WriteShiftLd,
    884                     // x86memop:$src1
    885                     ReadDefault, ReadDefault, ReadDefault, ReadDefault,
    886                     ReadDefault,
    887                     // RC:$src1
    888                     ReadAfterLd]>;
    889 }
    890 }
    891 
    892 let Predicates = [HasBMI2] in {
    893   defm RORX32 : bmi_rotate<"rorx{l}", GR32, i32mem>;
    894   defm RORX64 : bmi_rotate<"rorx{q}", GR64, i64mem>, VEX_W;
    895   defm SARX32 : bmi_shift<"sarx{l}", GR32, i32mem>, T8XS;
    896   defm SARX64 : bmi_shift<"sarx{q}", GR64, i64mem>, T8XS, VEX_W;
    897   defm SHRX32 : bmi_shift<"shrx{l}", GR32, i32mem>, T8XD;
    898   defm SHRX64 : bmi_shift<"shrx{q}", GR64, i64mem>, T8XD, VEX_W;
    899   defm SHLX32 : bmi_shift<"shlx{l}", GR32, i32mem>, T8PD;
    900   defm SHLX64 : bmi_shift<"shlx{q}", GR64, i64mem>, T8PD, VEX_W;
    901 
    902   // Prefer RORX which is non-destructive and doesn't update EFLAGS.
    903   let AddedComplexity = 10 in {
    904     def : Pat<(rotl GR32:$src, (i8 imm:$shamt)),
    905               (RORX32ri GR32:$src, (ROT32L2R_imm8 imm:$shamt))>;
    906     def : Pat<(rotl GR64:$src, (i8 imm:$shamt)),
    907               (RORX64ri GR64:$src, (ROT64L2R_imm8 imm:$shamt))>;
    908   }
    909 
    910   def : Pat<(rotl (loadi32 addr:$src), (i8 imm:$shamt)),
    911             (RORX32mi addr:$src, (ROT32L2R_imm8 imm:$shamt))>;
    912   def : Pat<(rotl (loadi64 addr:$src), (i8 imm:$shamt)),
    913             (RORX64mi addr:$src, (ROT64L2R_imm8 imm:$shamt))>;
    914 
    915   // Prefer SARX/SHRX/SHLX over SAR/SHR/SHL with variable shift BUT not
    916   // immedidate shift, i.e. the following code is considered better
    917   //
    918   //  mov %edi, %esi
    919   //  shl $imm, %esi
    920   //  ... %edi, ...
    921   //
    922   // than
    923   //
    924   //  movb $imm, %sil
    925   //  shlx %sil, %edi, %esi
    926   //  ... %edi, ...
    927   //
    928   let AddedComplexity = 1 in {
    929     def : Pat<(sra GR32:$src1, GR8:$src2),
    930               (SARX32rr GR32:$src1,
    931                         (INSERT_SUBREG
    932                           (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    933     def : Pat<(sra GR64:$src1, GR8:$src2),
    934               (SARX64rr GR64:$src1,
    935                         (INSERT_SUBREG
    936                           (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    937 
    938     def : Pat<(srl GR32:$src1, GR8:$src2),
    939               (SHRX32rr GR32:$src1,
    940                         (INSERT_SUBREG
    941                           (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    942     def : Pat<(srl GR64:$src1, GR8:$src2),
    943               (SHRX64rr GR64:$src1,
    944                         (INSERT_SUBREG
    945                           (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    946 
    947     def : Pat<(shl GR32:$src1, GR8:$src2),
    948               (SHLX32rr GR32:$src1,
    949                         (INSERT_SUBREG
    950                           (i32 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    951     def : Pat<(shl GR64:$src1, GR8:$src2),
    952               (SHLX64rr GR64:$src1,
    953                         (INSERT_SUBREG
    954                           (i64 (IMPLICIT_DEF)), GR8:$src2, sub_8bit))>;
    955   }
    956 
    957   // Patterns on SARXrm/SHRXrm/SHLXrm are explicitly omitted to favor
    958   //
    959   //  mov (%ecx), %esi
    960   //  shl $imm, $esi
    961   //
    962   // over
    963   //
    964   //  movb $imm %al
    965   //  shlx %al, (%ecx), %esi
    966   //
    967   // As SARXrr/SHRXrr/SHLXrr is favored on variable shift, the peephole
    968   // optimization will fold them into SARXrm/SHRXrm/SHLXrm if possible.
    969 }
    970