1 //=-HexagonScheduleV60.td - HexagonV60 Scheduling Definitions *- tablegen -*-=// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 10 // CVI pipes from the "Hexagon Multimedia Co-Processor Extensions Arch Spec". 11 def CVI_ST : FuncUnit; 12 def CVI_XLANE : FuncUnit; 13 def CVI_SHIFT : FuncUnit; 14 def CVI_MPY0 : FuncUnit; 15 def CVI_MPY1 : FuncUnit; 16 def CVI_LD : FuncUnit; 17 18 // Combined functional units. 19 def CVI_XLSHF : FuncUnit; 20 def CVI_MPY01 : FuncUnit; 21 def CVI_ALL : FuncUnit; 22 23 // Combined functional unit data. 24 def HexagonComboFuncsV60 : 25 ComboFuncUnits<[ 26 ComboFuncData<CVI_XLSHF , [CVI_XLANE, CVI_SHIFT]>, 27 ComboFuncData<CVI_MPY01 , [CVI_MPY0, CVI_MPY1]>, 28 ComboFuncData<CVI_ALL , [CVI_ST, CVI_XLANE, CVI_SHIFT, 29 CVI_MPY0, CVI_MPY1, CVI_LD]> 30 ]>; 31 32 // Note: When adding additional vector scheduling classes, add the 33 // corresponding methods to the class HexagonInstrInfo. 34 def CVI_VA : InstrItinClass; 35 def CVI_VA_DV : InstrItinClass; 36 def CVI_VX_LONG : InstrItinClass; 37 def CVI_VX_LATE : InstrItinClass; 38 def CVI_VX : InstrItinClass; 39 def CVI_VX_DV_LONG : InstrItinClass; 40 def CVI_VX_DV : InstrItinClass; 41 def CVI_VX_DV_SLOT2 : InstrItinClass; 42 def CVI_VP : InstrItinClass; 43 def CVI_VP_LONG : InstrItinClass; 44 def CVI_VP_VS_EARLY : InstrItinClass; 45 def CVI_VP_VS_LONG_EARLY : InstrItinClass; 46 def CVI_VP_VS_LONG : InstrItinClass; 47 def CVI_VP_VS : InstrItinClass; 48 def CVI_VP_DV : InstrItinClass; 49 def CVI_VS : InstrItinClass; 50 def CVI_VINLANESAT : InstrItinClass; 51 def CVI_VM_LD : InstrItinClass; 52 def CVI_VM_TMP_LD : InstrItinClass; 53 def CVI_VM_CUR_LD : InstrItinClass; 54 def CVI_VM_VP_LDU : InstrItinClass; 55 def CVI_VM_ST : InstrItinClass; 56 def CVI_VM_NEW_ST : InstrItinClass; 57 def CVI_VM_STU : InstrItinClass; 58 def CVI_HIST : InstrItinClass; 59 def CVI_VA_EXT : InstrItinClass; 60 61 // There are four SLOTS (four parallel pipelines) in Hexagon V60 machine. 62 // This file describes that machine information. 63 // 64 // |===========|==================================================| 65 // | PIPELINE | Instruction Classes | 66 // |===========|==================================================| 67 // | SLOT0 | LD ST ALU32 MEMOP NV SYSTEM | 68 // |-----------|--------------------------------------------------| 69 // | SLOT1 | LD ST ALU32 | 70 // |-----------|--------------------------------------------------| 71 // | SLOT2 | XTYPE ALU32 J JR | 72 // |-----------|--------------------------------------------------| 73 // | SLOT3 | XTYPE ALU32 J CR | 74 // |===========|==================================================| 75 // 76 // 77 // In addition to using the above SLOTS, there are also six vector pipelines 78 // in the CVI co-processor in the Hexagon V60 machine. 79 // 80 // |=========| |=========| |=========| |=========| |=========| |=========| 81 // SLOT | CVI_LD | |CVI_MPY3 | |CVI_MPY2 | |CVI_SHIFT| |CVI_XLANE| | CVI_ST | 82 // ==== |=========| |=========| |=========| |=========| |=========| |=========| 83 // S0-3 | | | CVI_VA | | CVI_VA | | CVI_VA | | CVI_VA | | | 84 // S2-3 | | | CVI_VX | | CVI_VX | | | | | | | 85 // S0-3 | | | | | | | | | CVI_VP | | | 86 // S0-3 | | | | | | | CVI_VS | | | | | 87 // S0-1 |(CVI_LD) | | CVI_LD | | CVI_LD | | CVI_LD | | CVI_LD | | | 88 // S0-1 |(C*TMP_LD) | | | | | | | | | | 89 // S01 |(C*_LDU) | | | | | | | | C*_LDU | | | 90 // S0 | | | CVI_ST | | CVI_ST | | CVI_ST | | CVI_ST | |(CVI_ST) | 91 // S0 | | | | | | | | | | |(C*TMP_ST) 92 // S01 | | | | | | | | | VSTU | |(C*_STU) | 93 // |=========| |=========| |=========| |=========| |=========| |=========| 94 // |=====================| |=====================| 95 // | CVI_MPY2 & CVI_MPY3 | |CVI_XLANE & CVI_SHIFT| 96 // |=====================| |=====================| 97 // S0-3 | CVI_VA_DV | | CVI_VA_DV | 98 // S0-3 | | | CVI_VP_DV | 99 // S2-3 | CVI_VX_DV | | | 100 // |=====================| |=====================| 101 // |=====================================================================| 102 // S0-3 | CVI_HIST Histogram | 103 // S0123| CVI_VA_EXT Extract | 104 // |=====================================================================| 105 106 def HexagonItinerariesV60 : 107 ProcessorItineraries<[SLOT0, SLOT1, SLOT2, SLOT3, SLOT_ENDLOOP, 108 CVI_ST, CVI_XLANE, CVI_SHIFT, CVI_MPY0, CVI_MPY1, 109 CVI_LD, CVI_XLSHF, CVI_MPY01, CVI_ALL], [], [ 110 // ALU32 111 InstrItinData<ALU32_2op_tc_1_SLOT0123 , 112 [InstrStage<1, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 113 InstrItinData<ALU32_2op_tc_2early_SLOT0123, 114 [InstrStage<2, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 115 InstrItinData<ALU32_3op_tc_1_SLOT0123 , 116 [InstrStage<1, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 117 InstrItinData<ALU32_3op_tc_2_SLOT0123 , 118 [InstrStage<2, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 119 InstrItinData<ALU32_3op_tc_2early_SLOT0123, 120 [InstrStage<2, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 121 InstrItinData<ALU32_ADDI_tc_1_SLOT0123 , 122 [InstrStage<1, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 123 124 // ALU64 125 InstrItinData<ALU64_tc_1_SLOT23 , [InstrStage<1, [SLOT2, SLOT3]>]>, 126 InstrItinData<ALU64_tc_2_SLOT23 , [InstrStage<2, [SLOT2, SLOT3]>]>, 127 InstrItinData<ALU64_tc_2early_SLOT23, [InstrStage<2, [SLOT2, SLOT3]>]>, 128 InstrItinData<ALU64_tc_3x_SLOT23 , [InstrStage<3, [SLOT2, SLOT3]>]>, 129 130 // CR -> System 131 InstrItinData<CR_tc_2_SLOT3 , [InstrStage<2, [SLOT3]>]>, 132 InstrItinData<CR_tc_2early_SLOT3 , [InstrStage<2, [SLOT3]>]>, 133 InstrItinData<CR_tc_3x_SLOT3 , [InstrStage<3, [SLOT3]>]>, 134 135 // Jump (conditional/unconditional/return etc) 136 InstrItinData<CR_tc_2early_SLOT23, [InstrStage<2, [SLOT2, SLOT3]>]>, 137 InstrItinData<CR_tc_3x_SLOT23 , [InstrStage<3, [SLOT2, SLOT3]>]>, 138 InstrItinData<CJ_tc_1_SLOT23 , [InstrStage<1, [SLOT2, SLOT3]>]>, 139 InstrItinData<CJ_tc_2early_SLOT23, [InstrStage<2, [SLOT2, SLOT3]>]>, 140 InstrItinData<J_tc_2early_SLOT23 , [InstrStage<2, [SLOT2, SLOT3]>]>, 141 InstrItinData<J_tc_2early_CJUMP_UCJUMP_ARCHDEPSLOT , [InstrStage<1, [SLOT2, SLOT3]>]>, 142 143 // JR 144 InstrItinData<J_tc_2early_SLOT2 , [InstrStage<2, [SLOT2]>]>, 145 InstrItinData<J_tc_3stall_SLOT2 , [InstrStage<3, [SLOT2]>]>, 146 147 // Extender 148 InstrItinData<EXTENDER_tc_1_SLOT0123, [InstrStage<1, 149 [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 150 151 // Load 152 InstrItinData<LD_tc_ld_SLOT01 , [InstrStage<3, [SLOT0, SLOT1]>]>, 153 InstrItinData<LD_tc_3or4stall_SLOT0, [InstrStage<4, [SLOT0]>]>, 154 InstrItinData<LD_tc_ld_SLOT0 , [InstrStage<3, [SLOT0]>]>, 155 156 // M 157 InstrItinData<M_tc_1_SLOT23 , [InstrStage<1, [SLOT2, SLOT3]>]>, 158 InstrItinData<M_tc_2_SLOT23 , [InstrStage<2, [SLOT2, SLOT3]>]>, 159 InstrItinData<M_tc_3_SLOT23 , [InstrStage<3, [SLOT2, SLOT3]>]>, 160 InstrItinData<M_tc_3x_SLOT23 , [InstrStage<3, [SLOT2, SLOT3]>]>, 161 InstrItinData<M_tc_3or4x_SLOT23 , [InstrStage<4, [SLOT2, SLOT3]>]>, 162 InstrItinData<M_tc_3stall_SLOT23, [InstrStage<3, [SLOT2, SLOT3]>]>, 163 164 // Store 165 InstrItinData<ST_tc_st_SLOT01 , [InstrStage<1, [SLOT0, SLOT1]>]>, 166 InstrItinData<ST_tc_3stall_SLOT0, [InstrStage<3, [SLOT0]>]>, 167 InstrItinData<ST_tc_ld_SLOT0 , [InstrStage<3, [SLOT0]>]>, 168 InstrItinData<ST_tc_st_SLOT0 , [InstrStage<1, [SLOT0]>]>, 169 170 // Subinsn 171 InstrItinData<SUBINSN_tc_2early_SLOT0, [InstrStage<2, [SLOT0]>]>, 172 InstrItinData<SUBINSN_tc_3stall_SLOT0, [InstrStage<3, [SLOT0]>]>, 173 InstrItinData<SUBINSN_tc_ld_SLOT0 , [InstrStage<3, [SLOT0]>]>, 174 InstrItinData<SUBINSN_tc_1_SLOT01 , [InstrStage<1, [SLOT0, SLOT1]>]>, 175 InstrItinData<SUBINSN_tc_2early_SLOT01, 176 [InstrStage<2, [SLOT0, SLOT1]>]>, 177 InstrItinData<SUBINSN_tc_ld_SLOT01 , [InstrStage<3, [SLOT0, SLOT1]>]>, 178 InstrItinData<SUBINSN_tc_st_SLOT01 , [InstrStage<1, [SLOT0, SLOT1]>]>, 179 180 // S 181 InstrItinData<S_2op_tc_1_SLOT23 , [InstrStage<1, [SLOT2, SLOT3]>]>, 182 InstrItinData<S_2op_tc_2_SLOT23 , [InstrStage<2, [SLOT2, SLOT3]>]>, 183 InstrItinData<S_2op_tc_2early_SLOT23, [InstrStage<2, [SLOT2, SLOT3]>]>, 184 // The S_2op_tc_3x_SLOT23 slots are 4 cycles on v60. 185 InstrItinData<S_2op_tc_3or4x_SLOT23 , [InstrStage<4, [SLOT2, SLOT3]>]>, 186 InstrItinData<S_3op_tc_1_SLOT23 , [InstrStage<1, [SLOT2, SLOT3]>]>, 187 InstrItinData<S_3op_tc_2_SLOT23 , [InstrStage<2, [SLOT2, SLOT3]>]>, 188 InstrItinData<S_3op_tc_2early_SLOT23, [InstrStage<2, [SLOT2, SLOT3]>]>, 189 InstrItinData<S_3op_tc_3_SLOT23 , [InstrStage<3, [SLOT2, SLOT3]>]>, 190 InstrItinData<S_3op_tc_3stall_SLOT23, [InstrStage<3, [SLOT2, SLOT3]>]>, 191 InstrItinData<S_3op_tc_3x_SLOT23 , [InstrStage<3, [SLOT2, SLOT3]>]>, 192 193 // New Value Compare Jump 194 InstrItinData<NCJ_tc_3or4stall_SLOT0, [InstrStage<4, [SLOT0]>]>, 195 196 // Mem ops 197 InstrItinData<V2LDST_tc_st_SLOT0 , [InstrStage<1, [SLOT0]>]>, 198 InstrItinData<V2LDST_tc_ld_SLOT01 , [InstrStage<2, [SLOT0, SLOT1]>]>, 199 InstrItinData<V2LDST_tc_st_SLOT01 , [InstrStage<1, [SLOT0, SLOT1]>]>, 200 InstrItinData<V4LDST_tc_st_SLOT0 , [InstrStage<1, [SLOT0]>]>, 201 InstrItinData<V4LDST_tc_ld_SLOT01 , [InstrStage<3, [SLOT0, SLOT1]>]>, 202 InstrItinData<V4LDST_tc_st_SLOT01 , [InstrStage<1, [SLOT0, SLOT1]>]>, 203 204 // Endloop 205 InstrItinData<J_tc_2early_SLOT0123, [InstrStage<2, [SLOT_ENDLOOP]>]>, 206 207 // Vector 208 InstrItinData<COPROC_VMEM_vtc_long_SLOT01, 209 [InstrStage<3, [SLOT0, SLOT1]>]>, 210 InstrItinData<COPROC_VX_vtc_long_SLOT23 , 211 [InstrStage<3, [SLOT2, SLOT3]>]>, 212 InstrItinData<COPROC_VX_vtc_SLOT23 , 213 [InstrStage<3, [SLOT2, SLOT3]>]>, 214 InstrItinData<MAPPING_tc_1_SLOT0123 , 215 [InstrStage<1, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 216 217 // Duplex and Compound 218 InstrItinData<DUPLEX , [InstrStage<1, [SLOT0]>]>, 219 InstrItinData<COMPOUND_CJ_ARCHDEPSLOT , [InstrStage<1, [SLOT2, SLOT3]>]>, 220 InstrItinData<COMPOUND , [InstrStage<1, [SLOT2, SLOT3]>]>, 221 // Misc 222 InstrItinData<PREFIX , [InstrStage<1, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 223 InstrItinData<PSEUDO , [InstrStage<1, [SLOT0, SLOT1, SLOT2, SLOT3]>]>, 224 InstrItinData<PSEUDOM , [InstrStage<1, [SLOT2, SLOT3], 0>, 225 InstrStage<1, [SLOT2, SLOT3]>]>, 226 227 // Latest CVI spec definitions. 228 InstrItinData<CVI_VA,[InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 229 InstrStage<1, [CVI_XLANE,CVI_SHIFT, 230 CVI_MPY0, CVI_MPY1]>]>, 231 InstrItinData<CVI_VA_DV, 232 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 233 InstrStage<1, [CVI_XLSHF, CVI_MPY01]>]>, 234 InstrItinData<CVI_VX_LONG, [InstrStage<1, [SLOT2, SLOT3], 0>, 235 InstrStage<1, [CVI_MPY0, CVI_MPY1]>]>, 236 InstrItinData<CVI_VX_LATE, [InstrStage<1, [SLOT2, SLOT3], 0>, 237 InstrStage<1, [CVI_MPY0, CVI_MPY1]>]>, 238 InstrItinData<CVI_VX,[InstrStage<1, [SLOT2, SLOT3], 0>, 239 InstrStage<1, [CVI_MPY0, CVI_MPY1]>]>, 240 InstrItinData<CVI_VX_DV_LONG, 241 [InstrStage<1, [SLOT2, SLOT3], 0>, 242 InstrStage<1, [CVI_MPY01]>]>, 243 InstrItinData<CVI_VX_DV, 244 [InstrStage<1, [SLOT2, SLOT3], 0>, 245 InstrStage<1, [CVI_MPY01]>]>, 246 InstrItinData<CVI_VX_DV_SLOT2, 247 [InstrStage<1, [SLOT2], 0>, 248 InstrStage<1, [CVI_MPY01]>]>, 249 InstrItinData<CVI_VP, [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 250 InstrStage<1, [CVI_XLANE]>]>, 251 InstrItinData<CVI_VP_LONG, [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 252 InstrStage<1, [CVI_XLANE]>]>, 253 InstrItinData<CVI_VP_VS_EARLY, 254 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 255 InstrStage<1, [CVI_XLSHF]>]>, 256 InstrItinData<CVI_VP_VS_LONG, 257 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 258 InstrStage<1, [CVI_XLSHF]>]>, 259 InstrItinData<CVI_VP_VS, 260 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 261 InstrStage<1, [CVI_XLSHF]>]>, 262 InstrItinData<CVI_VP_VS_LONG_EARLY, 263 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 264 InstrStage<1, [CVI_XLSHF]>]>, 265 InstrItinData<CVI_VP_DV , [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 266 InstrStage<1, [CVI_XLSHF]>]>, 267 InstrItinData<CVI_VS, 268 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 269 InstrStage<1, [CVI_SHIFT]>]>, 270 InstrItinData<CVI_VINLANESAT, 271 [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 272 InstrStage<1, [CVI_SHIFT]>]>, 273 InstrItinData<CVI_VM_LD , [InstrStage<1, [SLOT0, SLOT1], 0>, 274 InstrStage<1, [CVI_LD], 0>, 275 InstrStage<1, [CVI_XLANE, CVI_SHIFT, 276 CVI_MPY0, CVI_MPY1]>]>, 277 InstrItinData<CVI_VM_TMP_LD,[InstrStage<1,[SLOT0, SLOT1], 0>, 278 InstrStage<1, [CVI_LD]>]>, 279 InstrItinData<CVI_VM_CUR_LD,[InstrStage<1,[SLOT0, SLOT1], 0>, 280 InstrStage<1, [CVI_LD], 0>, 281 InstrStage<1, [CVI_XLANE, CVI_SHIFT, 282 CVI_MPY0, CVI_MPY1]>]>, 283 InstrItinData<CVI_VM_VP_LDU,[InstrStage<1,[SLOT0], 0>, 284 InstrStage<1, [SLOT1], 0>, 285 InstrStage<1, [CVI_LD], 0>, 286 InstrStage<1, [CVI_XLANE]>]>, 287 InstrItinData<CVI_VM_ST , [InstrStage<1, [SLOT0], 0>, 288 InstrStage<1, [CVI_ST], 0>, 289 InstrStage<1, [CVI_XLANE, CVI_SHIFT, 290 CVI_MPY0, CVI_MPY1]>]>, 291 InstrItinData<CVI_VM_NEW_ST,[InstrStage<1,[SLOT0], 0>, 292 InstrStage<1, [CVI_ST]>]>, 293 InstrItinData<CVI_VM_STU , [InstrStage<1, [SLOT0], 0>, 294 InstrStage<1, [SLOT1], 0>, 295 InstrStage<1, [CVI_ST], 0>, 296 InstrStage<1, [CVI_XLANE]>]>, 297 InstrItinData<CVI_HIST , [InstrStage<1, [SLOT0,SLOT1,SLOT2,SLOT3], 0>, 298 InstrStage<1, [CVI_ALL]>]> 299 ]>; 300 301 def HexagonModelV60 : SchedMachineModel { 302 // Max issue per cycle == bundle width. 303 let IssueWidth = 4; 304 let Itineraries = HexagonItinerariesV60; 305 let LoadLatency = 1; 306 let CompleteModel = 0; 307 } 308 309 //===----------------------------------------------------------------------===// 310 // Hexagon V60 Resource Definitions - 311 //===----------------------------------------------------------------------===// 312