1 ; RUN: llc < %s -march=ptx32 -mattr=+ptx20 | FileCheck %s 2 3 define ptx_device i32 @test_tid_x() { 4 ; CHECK: mov.u32 r0, %tid.x; 5 ; CHECK-NEXT: ret; 6 %x = call i32 @llvm.ptx.read.tid.x() 7 ret i32 %x 8 } 9 10 define ptx_device i32 @test_tid_y() { 11 ; CHECK: mov.u32 r0, %tid.y; 12 ; CHECK-NEXT: ret; 13 %x = call i32 @llvm.ptx.read.tid.y() 14 ret i32 %x 15 } 16 17 define ptx_device i32 @test_tid_z() { 18 ; CHECK: mov.u32 r0, %tid.z; 19 ; CHECK-NEXT: ret; 20 %x = call i32 @llvm.ptx.read.tid.z() 21 ret i32 %x 22 } 23 24 define ptx_device i32 @test_tid_w() { 25 ; CHECK: mov.u32 r0, %tid.w; 26 ; CHECK-NEXT: ret; 27 %x = call i32 @llvm.ptx.read.tid.w() 28 ret i32 %x 29 } 30 31 define ptx_device i32 @test_ntid_x() { 32 ; CHECK: mov.u32 r0, %ntid.x; 33 ; CHECK-NEXT: ret; 34 %x = call i32 @llvm.ptx.read.ntid.x() 35 ret i32 %x 36 } 37 38 define ptx_device i32 @test_ntid_y() { 39 ; CHECK: mov.u32 r0, %ntid.y; 40 ; CHECK-NEXT: ret; 41 %x = call i32 @llvm.ptx.read.ntid.y() 42 ret i32 %x 43 } 44 45 define ptx_device i32 @test_ntid_z() { 46 ; CHECK: mov.u32 r0, %ntid.z; 47 ; CHECK-NEXT: ret; 48 %x = call i32 @llvm.ptx.read.ntid.z() 49 ret i32 %x 50 } 51 52 define ptx_device i32 @test_ntid_w() { 53 ; CHECK: mov.u32 r0, %ntid.w; 54 ; CHECK-NEXT: ret; 55 %x = call i32 @llvm.ptx.read.ntid.w() 56 ret i32 %x 57 } 58 59 define ptx_device i32 @test_laneid() { 60 ; CHECK: mov.u32 r0, %laneid; 61 ; CHECK-NEXT: ret; 62 %x = call i32 @llvm.ptx.read.laneid() 63 ret i32 %x 64 } 65 66 define ptx_device i32 @test_warpid() { 67 ; CHECK: mov.u32 r0, %warpid; 68 ; CHECK-NEXT: ret; 69 %x = call i32 @llvm.ptx.read.warpid() 70 ret i32 %x 71 } 72 73 define ptx_device i32 @test_nwarpid() { 74 ; CHECK: mov.u32 r0, %nwarpid; 75 ; CHECK-NEXT: ret; 76 %x = call i32 @llvm.ptx.read.nwarpid() 77 ret i32 %x 78 } 79 80 define ptx_device i32 @test_ctaid_x() { 81 ; CHECK: mov.u32 r0, %ctaid.x; 82 ; CHECK-NEXT: ret; 83 %x = call i32 @llvm.ptx.read.ctaid.x() 84 ret i32 %x 85 } 86 87 define ptx_device i32 @test_ctaid_y() { 88 ; CHECK: mov.u32 r0, %ctaid.y; 89 ; CHECK-NEXT: ret; 90 %x = call i32 @llvm.ptx.read.ctaid.y() 91 ret i32 %x 92 } 93 94 define ptx_device i32 @test_ctaid_z() { 95 ; CHECK: mov.u32 r0, %ctaid.z; 96 ; CHECK-NEXT: ret; 97 %x = call i32 @llvm.ptx.read.ctaid.z() 98 ret i32 %x 99 } 100 101 define ptx_device i32 @test_ctaid_w() { 102 ; CHECK: mov.u32 r0, %ctaid.w; 103 ; CHECK-NEXT: ret; 104 %x = call i32 @llvm.ptx.read.ctaid.w() 105 ret i32 %x 106 } 107 108 define ptx_device i32 @test_nctaid_x() { 109 ; CHECK: mov.u32 r0, %nctaid.x; 110 ; CHECK-NEXT: ret; 111 %x = call i32 @llvm.ptx.read.nctaid.x() 112 ret i32 %x 113 } 114 115 define ptx_device i32 @test_nctaid_y() { 116 ; CHECK: mov.u32 r0, %nctaid.y; 117 ; CHECK-NEXT: ret; 118 %x = call i32 @llvm.ptx.read.nctaid.y() 119 ret i32 %x 120 } 121 122 define ptx_device i32 @test_nctaid_z() { 123 ; CHECK: mov.u32 r0, %nctaid.z; 124 ; CHECK-NEXT: ret; 125 %x = call i32 @llvm.ptx.read.nctaid.z() 126 ret i32 %x 127 } 128 129 define ptx_device i32 @test_nctaid_w() { 130 ; CHECK: mov.u32 r0, %nctaid.w; 131 ; CHECK-NEXT: ret; 132 %x = call i32 @llvm.ptx.read.nctaid.w() 133 ret i32 %x 134 } 135 136 define ptx_device i32 @test_smid() { 137 ; CHECK: mov.u32 r0, %smid; 138 ; CHECK-NEXT: ret; 139 %x = call i32 @llvm.ptx.read.smid() 140 ret i32 %x 141 } 142 143 define ptx_device i32 @test_nsmid() { 144 ; CHECK: mov.u32 r0, %nsmid; 145 ; CHECK-NEXT: ret; 146 %x = call i32 @llvm.ptx.read.nsmid() 147 ret i32 %x 148 } 149 150 define ptx_device i32 @test_gridid() { 151 ; CHECK: mov.u32 r0, %gridid; 152 ; CHECK-NEXT: ret; 153 %x = call i32 @llvm.ptx.read.gridid() 154 ret i32 %x 155 } 156 157 define ptx_device i32 @test_lanemask_eq() { 158 ; CHECK: mov.u32 r0, %lanemask_eq; 159 ; CHECK-NEXT: ret; 160 %x = call i32 @llvm.ptx.read.lanemask.eq() 161 ret i32 %x 162 } 163 164 define ptx_device i32 @test_lanemask_le() { 165 ; CHECK: mov.u32 r0, %lanemask_le; 166 ; CHECK-NEXT: ret; 167 %x = call i32 @llvm.ptx.read.lanemask.le() 168 ret i32 %x 169 } 170 171 define ptx_device i32 @test_lanemask_lt() { 172 ; CHECK: mov.u32 r0, %lanemask_lt; 173 ; CHECK-NEXT: ret; 174 %x = call i32 @llvm.ptx.read.lanemask.lt() 175 ret i32 %x 176 } 177 178 define ptx_device i32 @test_lanemask_ge() { 179 ; CHECK: mov.u32 r0, %lanemask_ge; 180 ; CHECK-NEXT: ret; 181 %x = call i32 @llvm.ptx.read.lanemask.ge() 182 ret i32 %x 183 } 184 185 define ptx_device i32 @test_lanemask_gt() { 186 ; CHECK: mov.u32 r0, %lanemask_gt; 187 ; CHECK-NEXT: ret; 188 %x = call i32 @llvm.ptx.read.lanemask.gt() 189 ret i32 %x 190 } 191 192 define ptx_device i32 @test_clock() { 193 ; CHECK: mov.u32 r0, %clock; 194 ; CHECK-NEXT: ret; 195 %x = call i32 @llvm.ptx.read.clock() 196 ret i32 %x 197 } 198 199 define ptx_device i64 @test_clock64() { 200 ; CHECK: mov.u64 rd0, %clock64; 201 ; CHECK-NEXT: ret; 202 %x = call i64 @llvm.ptx.read.clock64() 203 ret i64 %x 204 } 205 206 define ptx_device i32 @test_pm0() { 207 ; CHECK: mov.u32 r0, %pm0; 208 ; CHECK-NEXT: ret; 209 %x = call i32 @llvm.ptx.read.pm0() 210 ret i32 %x 211 } 212 213 define ptx_device i32 @test_pm1() { 214 ; CHECK: mov.u32 r0, %pm1; 215 ; CHECK-NEXT: ret; 216 %x = call i32 @llvm.ptx.read.pm1() 217 ret i32 %x 218 } 219 220 define ptx_device i32 @test_pm2() { 221 ; CHECK: mov.u32 r0, %pm2; 222 ; CHECK-NEXT: ret; 223 %x = call i32 @llvm.ptx.read.pm2() 224 ret i32 %x 225 } 226 227 define ptx_device i32 @test_pm3() { 228 ; CHECK: mov.u32 r0, %pm3; 229 ; CHECK-NEXT: ret; 230 %x = call i32 @llvm.ptx.read.pm3() 231 ret i32 %x 232 } 233 234 define ptx_device void @test_bar_sync() { 235 ; CHECK: bar.sync 0 236 ; CHECK-NEXT: ret; 237 call void @llvm.ptx.bar.sync(i32 0) 238 ret void 239 } 240 241 declare i32 @llvm.ptx.read.tid.x() 242 declare i32 @llvm.ptx.read.tid.y() 243 declare i32 @llvm.ptx.read.tid.z() 244 declare i32 @llvm.ptx.read.tid.w() 245 declare i32 @llvm.ptx.read.ntid.x() 246 declare i32 @llvm.ptx.read.ntid.y() 247 declare i32 @llvm.ptx.read.ntid.z() 248 declare i32 @llvm.ptx.read.ntid.w() 249 250 declare i32 @llvm.ptx.read.laneid() 251 declare i32 @llvm.ptx.read.warpid() 252 declare i32 @llvm.ptx.read.nwarpid() 253 254 declare i32 @llvm.ptx.read.ctaid.x() 255 declare i32 @llvm.ptx.read.ctaid.y() 256 declare i32 @llvm.ptx.read.ctaid.z() 257 declare i32 @llvm.ptx.read.ctaid.w() 258 declare i32 @llvm.ptx.read.nctaid.x() 259 declare i32 @llvm.ptx.read.nctaid.y() 260 declare i32 @llvm.ptx.read.nctaid.z() 261 declare i32 @llvm.ptx.read.nctaid.w() 262 263 declare i32 @llvm.ptx.read.smid() 264 declare i32 @llvm.ptx.read.nsmid() 265 declare i32 @llvm.ptx.read.gridid() 266 267 declare i32 @llvm.ptx.read.lanemask.eq() 268 declare i32 @llvm.ptx.read.lanemask.le() 269 declare i32 @llvm.ptx.read.lanemask.lt() 270 declare i32 @llvm.ptx.read.lanemask.ge() 271 declare i32 @llvm.ptx.read.lanemask.gt() 272 273 declare i32 @llvm.ptx.read.clock() 274 declare i64 @llvm.ptx.read.clock64() 275 276 declare i32 @llvm.ptx.read.pm0() 277 declare i32 @llvm.ptx.read.pm1() 278 declare i32 @llvm.ptx.read.pm2() 279 declare i32 @llvm.ptx.read.pm3() 280 281 declare void @llvm.ptx.bar.sync(i32 %i) 282