1 /* 2 * Copyright 2010 Christoph Bumiller 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 */ 22 23 #include "pipe/p_defines.h" 24 #include "util/u_framebuffer.h" 25 #include "util/u_helpers.h" 26 #include "util/u_inlines.h" 27 #include "util/u_transfer.h" 28 #include "util/format_srgb.h" 29 30 #include "tgsi/tgsi_parse.h" 31 32 #include "nv50/nv50_stateobj.h" 33 #include "nv50/nv50_context.h" 34 #include "nv50/nv50_query_hw.h" 35 36 #include "nv50/nv50_3d.xml.h" 37 #include "nv50/g80_texture.xml.h" 38 39 #include "nouveau_gldefs.h" 40 41 /* Caveats: 42 * ! pipe_sampler_state.normalized_coords is ignored - rectangle textures will 43 * use non-normalized coordinates, everything else won't 44 * (The relevant bit is in the TIC entry and not the TSC entry.) 45 * 46 * ! pipe_sampler_state.seamless_cube_map is ignored - seamless filtering is 47 * always activated on NVA0 + 48 * (Give me the global bit, otherwise it's not worth the CPU work.) 49 * 50 * ! pipe_sampler_state.border_color is not swizzled according to the texture 51 * swizzle in pipe_sampler_view 52 * (This will be ugly with indirect independent texture/sampler access, 53 * we'd have to emulate the logic in the shader. GL doesn't have that, 54 * D3D doesn't have swizzle, if we knew what we were implementing we'd be 55 * good.) 56 * 57 * ! pipe_rasterizer_state.line_last_pixel is ignored - it is never drawn 58 * 59 * ! pipe_rasterizer_state.flatshade_first also applies to QUADS 60 * (There's a GL query for that, forcing an exception is just ridiculous.) 61 * 62 * ! pipe_rasterizer_state.sprite_coord_enable is masked with 0xff on NVC0 63 * (The hardware only has 8 slots meant for TexCoord and we have to assign 64 * in advance to maintain elegant separate shader objects.) 65 */ 66 67 static inline uint32_t 68 nv50_colormask(unsigned mask) 69 { 70 uint32_t ret = 0; 71 72 if (mask & PIPE_MASK_R) 73 ret |= 0x0001; 74 if (mask & PIPE_MASK_G) 75 ret |= 0x0010; 76 if (mask & PIPE_MASK_B) 77 ret |= 0x0100; 78 if (mask & PIPE_MASK_A) 79 ret |= 0x1000; 80 81 return ret; 82 } 83 84 #define NV50_BLEND_FACTOR_CASE(a, b) \ 85 case PIPE_BLENDFACTOR_##a: return NV50_BLEND_FACTOR_##b 86 87 static inline uint32_t 88 nv50_blend_fac(unsigned factor) 89 { 90 switch (factor) { 91 NV50_BLEND_FACTOR_CASE(ONE, ONE); 92 NV50_BLEND_FACTOR_CASE(SRC_COLOR, SRC_COLOR); 93 NV50_BLEND_FACTOR_CASE(SRC_ALPHA, SRC_ALPHA); 94 NV50_BLEND_FACTOR_CASE(DST_ALPHA, DST_ALPHA); 95 NV50_BLEND_FACTOR_CASE(DST_COLOR, DST_COLOR); 96 NV50_BLEND_FACTOR_CASE(SRC_ALPHA_SATURATE, SRC_ALPHA_SATURATE); 97 NV50_BLEND_FACTOR_CASE(CONST_COLOR, CONSTANT_COLOR); 98 NV50_BLEND_FACTOR_CASE(CONST_ALPHA, CONSTANT_ALPHA); 99 NV50_BLEND_FACTOR_CASE(SRC1_COLOR, SRC1_COLOR); 100 NV50_BLEND_FACTOR_CASE(SRC1_ALPHA, SRC1_ALPHA); 101 NV50_BLEND_FACTOR_CASE(ZERO, ZERO); 102 NV50_BLEND_FACTOR_CASE(INV_SRC_COLOR, ONE_MINUS_SRC_COLOR); 103 NV50_BLEND_FACTOR_CASE(INV_SRC_ALPHA, ONE_MINUS_SRC_ALPHA); 104 NV50_BLEND_FACTOR_CASE(INV_DST_ALPHA, ONE_MINUS_DST_ALPHA); 105 NV50_BLEND_FACTOR_CASE(INV_DST_COLOR, ONE_MINUS_DST_COLOR); 106 NV50_BLEND_FACTOR_CASE(INV_CONST_COLOR, ONE_MINUS_CONSTANT_COLOR); 107 NV50_BLEND_FACTOR_CASE(INV_CONST_ALPHA, ONE_MINUS_CONSTANT_ALPHA); 108 NV50_BLEND_FACTOR_CASE(INV_SRC1_COLOR, ONE_MINUS_SRC1_COLOR); 109 NV50_BLEND_FACTOR_CASE(INV_SRC1_ALPHA, ONE_MINUS_SRC1_ALPHA); 110 default: 111 return NV50_BLEND_FACTOR_ZERO; 112 } 113 } 114 115 static void * 116 nv50_blend_state_create(struct pipe_context *pipe, 117 const struct pipe_blend_state *cso) 118 { 119 struct nv50_blend_stateobj *so = CALLOC_STRUCT(nv50_blend_stateobj); 120 int i; 121 bool emit_common_func = cso->rt[0].blend_enable; 122 uint32_t ms; 123 124 if (nv50_context(pipe)->screen->tesla->oclass >= NVA3_3D_CLASS) { 125 SB_BEGIN_3D(so, BLEND_INDEPENDENT, 1); 126 SB_DATA (so, cso->independent_blend_enable); 127 } 128 129 so->pipe = *cso; 130 131 SB_BEGIN_3D(so, COLOR_MASK_COMMON, 1); 132 SB_DATA (so, !cso->independent_blend_enable); 133 134 SB_BEGIN_3D(so, BLEND_ENABLE_COMMON, 1); 135 SB_DATA (so, !cso->independent_blend_enable); 136 137 if (cso->independent_blend_enable) { 138 SB_BEGIN_3D(so, BLEND_ENABLE(0), 8); 139 for (i = 0; i < 8; ++i) { 140 SB_DATA(so, cso->rt[i].blend_enable); 141 if (cso->rt[i].blend_enable) 142 emit_common_func = true; 143 } 144 145 if (nv50_context(pipe)->screen->tesla->oclass >= NVA3_3D_CLASS) { 146 emit_common_func = false; 147 148 for (i = 0; i < 8; ++i) { 149 if (!cso->rt[i].blend_enable) 150 continue; 151 SB_BEGIN_3D_(so, NVA3_3D_IBLEND_EQUATION_RGB(i), 6); 152 SB_DATA (so, nvgl_blend_eqn(cso->rt[i].rgb_func)); 153 SB_DATA (so, nv50_blend_fac(cso->rt[i].rgb_src_factor)); 154 SB_DATA (so, nv50_blend_fac(cso->rt[i].rgb_dst_factor)); 155 SB_DATA (so, nvgl_blend_eqn(cso->rt[i].alpha_func)); 156 SB_DATA (so, nv50_blend_fac(cso->rt[i].alpha_src_factor)); 157 SB_DATA (so, nv50_blend_fac(cso->rt[i].alpha_dst_factor)); 158 } 159 } 160 } else { 161 SB_BEGIN_3D(so, BLEND_ENABLE(0), 1); 162 SB_DATA (so, cso->rt[0].blend_enable); 163 } 164 165 if (emit_common_func) { 166 SB_BEGIN_3D(so, BLEND_EQUATION_RGB, 5); 167 SB_DATA (so, nvgl_blend_eqn(cso->rt[0].rgb_func)); 168 SB_DATA (so, nv50_blend_fac(cso->rt[0].rgb_src_factor)); 169 SB_DATA (so, nv50_blend_fac(cso->rt[0].rgb_dst_factor)); 170 SB_DATA (so, nvgl_blend_eqn(cso->rt[0].alpha_func)); 171 SB_DATA (so, nv50_blend_fac(cso->rt[0].alpha_src_factor)); 172 SB_BEGIN_3D(so, BLEND_FUNC_DST_ALPHA, 1); 173 SB_DATA (so, nv50_blend_fac(cso->rt[0].alpha_dst_factor)); 174 } 175 176 if (cso->logicop_enable) { 177 SB_BEGIN_3D(so, LOGIC_OP_ENABLE, 2); 178 SB_DATA (so, 1); 179 SB_DATA (so, nvgl_logicop_func(cso->logicop_func)); 180 } else { 181 SB_BEGIN_3D(so, LOGIC_OP_ENABLE, 1); 182 SB_DATA (so, 0); 183 } 184 185 if (cso->independent_blend_enable) { 186 SB_BEGIN_3D(so, COLOR_MASK(0), 8); 187 for (i = 0; i < 8; ++i) 188 SB_DATA(so, nv50_colormask(cso->rt[i].colormask)); 189 } else { 190 SB_BEGIN_3D(so, COLOR_MASK(0), 1); 191 SB_DATA (so, nv50_colormask(cso->rt[0].colormask)); 192 } 193 194 ms = 0; 195 if (cso->alpha_to_coverage) 196 ms |= NV50_3D_MULTISAMPLE_CTRL_ALPHA_TO_COVERAGE; 197 if (cso->alpha_to_one) 198 ms |= NV50_3D_MULTISAMPLE_CTRL_ALPHA_TO_ONE; 199 200 SB_BEGIN_3D(so, MULTISAMPLE_CTRL, 1); 201 SB_DATA (so, ms); 202 203 assert(so->size <= ARRAY_SIZE(so->state)); 204 return so; 205 } 206 207 static void 208 nv50_blend_state_bind(struct pipe_context *pipe, void *hwcso) 209 { 210 struct nv50_context *nv50 = nv50_context(pipe); 211 212 nv50->blend = hwcso; 213 nv50->dirty_3d |= NV50_NEW_3D_BLEND; 214 } 215 216 static void 217 nv50_blend_state_delete(struct pipe_context *pipe, void *hwcso) 218 { 219 FREE(hwcso); 220 } 221 222 /* NOTE: ignoring line_last_pixel */ 223 static void * 224 nv50_rasterizer_state_create(struct pipe_context *pipe, 225 const struct pipe_rasterizer_state *cso) 226 { 227 struct nv50_rasterizer_stateobj *so; 228 uint32_t reg; 229 230 so = CALLOC_STRUCT(nv50_rasterizer_stateobj); 231 if (!so) 232 return NULL; 233 so->pipe = *cso; 234 235 #ifndef NV50_SCISSORS_CLIPPING 236 for (int i = 0; i < NV50_MAX_VIEWPORTS; i++) { 237 SB_BEGIN_3D(so, SCISSOR_ENABLE(i), 1); 238 SB_DATA (so, cso->scissor); 239 } 240 #endif 241 242 SB_BEGIN_3D(so, SHADE_MODEL, 1); 243 SB_DATA (so, cso->flatshade ? NV50_3D_SHADE_MODEL_FLAT : 244 NV50_3D_SHADE_MODEL_SMOOTH); 245 SB_BEGIN_3D(so, PROVOKING_VERTEX_LAST, 1); 246 SB_DATA (so, !cso->flatshade_first); 247 SB_BEGIN_3D(so, VERTEX_TWO_SIDE_ENABLE, 1); 248 SB_DATA (so, cso->light_twoside); 249 250 SB_BEGIN_3D(so, FRAG_COLOR_CLAMP_EN, 1); 251 SB_DATA (so, cso->clamp_fragment_color ? 0x11111111 : 0x00000000); 252 253 SB_BEGIN_3D(so, MULTISAMPLE_ENABLE, 1); 254 SB_DATA (so, cso->multisample); 255 256 SB_BEGIN_3D(so, LINE_WIDTH, 1); 257 SB_DATA (so, fui(cso->line_width)); 258 SB_BEGIN_3D(so, LINE_SMOOTH_ENABLE, 1); 259 SB_DATA (so, cso->line_smooth); 260 261 SB_BEGIN_3D(so, LINE_STIPPLE_ENABLE, 1); 262 if (cso->line_stipple_enable) { 263 SB_DATA (so, 1); 264 SB_BEGIN_3D(so, LINE_STIPPLE, 1); 265 SB_DATA (so, (cso->line_stipple_pattern << 8) | 266 cso->line_stipple_factor); 267 } else { 268 SB_DATA (so, 0); 269 } 270 271 if (!cso->point_size_per_vertex) { 272 SB_BEGIN_3D(so, POINT_SIZE, 1); 273 SB_DATA (so, fui(cso->point_size)); 274 } 275 SB_BEGIN_3D(so, POINT_SPRITE_ENABLE, 1); 276 SB_DATA (so, cso->point_quad_rasterization); 277 SB_BEGIN_3D(so, POINT_SMOOTH_ENABLE, 1); 278 SB_DATA (so, cso->point_smooth); 279 280 SB_BEGIN_3D(so, POLYGON_MODE_FRONT, 3); 281 SB_DATA (so, nvgl_polygon_mode(cso->fill_front)); 282 SB_DATA (so, nvgl_polygon_mode(cso->fill_back)); 283 SB_DATA (so, cso->poly_smooth); 284 285 SB_BEGIN_3D(so, CULL_FACE_ENABLE, 3); 286 SB_DATA (so, cso->cull_face != PIPE_FACE_NONE); 287 SB_DATA (so, cso->front_ccw ? NV50_3D_FRONT_FACE_CCW : 288 NV50_3D_FRONT_FACE_CW); 289 switch (cso->cull_face) { 290 case PIPE_FACE_FRONT_AND_BACK: 291 SB_DATA(so, NV50_3D_CULL_FACE_FRONT_AND_BACK); 292 break; 293 case PIPE_FACE_FRONT: 294 SB_DATA(so, NV50_3D_CULL_FACE_FRONT); 295 break; 296 case PIPE_FACE_BACK: 297 default: 298 SB_DATA(so, NV50_3D_CULL_FACE_BACK); 299 break; 300 } 301 302 SB_BEGIN_3D(so, POLYGON_STIPPLE_ENABLE, 1); 303 SB_DATA (so, cso->poly_stipple_enable); 304 SB_BEGIN_3D(so, POLYGON_OFFSET_POINT_ENABLE, 3); 305 SB_DATA (so, cso->offset_point); 306 SB_DATA (so, cso->offset_line); 307 SB_DATA (so, cso->offset_tri); 308 309 if (cso->offset_point || cso->offset_line || cso->offset_tri) { 310 SB_BEGIN_3D(so, POLYGON_OFFSET_FACTOR, 1); 311 SB_DATA (so, fui(cso->offset_scale)); 312 SB_BEGIN_3D(so, POLYGON_OFFSET_UNITS, 1); 313 SB_DATA (so, fui(cso->offset_units * 2.0f)); 314 SB_BEGIN_3D(so, POLYGON_OFFSET_CLAMP, 1); 315 SB_DATA (so, fui(cso->offset_clamp)); 316 } 317 318 if (cso->depth_clip) { 319 reg = 0; 320 } else { 321 reg = 322 NV50_3D_VIEW_VOLUME_CLIP_CTRL_DEPTH_CLAMP_NEAR | 323 NV50_3D_VIEW_VOLUME_CLIP_CTRL_DEPTH_CLAMP_FAR | 324 NV50_3D_VIEW_VOLUME_CLIP_CTRL_UNK12_UNK1; 325 } 326 #ifndef NV50_SCISSORS_CLIPPING 327 reg |= 328 NV50_3D_VIEW_VOLUME_CLIP_CTRL_UNK7 | 329 NV50_3D_VIEW_VOLUME_CLIP_CTRL_UNK12_UNK1; 330 #endif 331 SB_BEGIN_3D(so, VIEW_VOLUME_CLIP_CTRL, 1); 332 SB_DATA (so, reg); 333 334 SB_BEGIN_3D(so, DEPTH_CLIP_NEGATIVE_Z, 1); 335 SB_DATA (so, cso->clip_halfz); 336 337 SB_BEGIN_3D(so, PIXEL_CENTER_INTEGER, 1); 338 SB_DATA (so, !cso->half_pixel_center); 339 340 assert(so->size <= ARRAY_SIZE(so->state)); 341 return (void *)so; 342 } 343 344 static void 345 nv50_rasterizer_state_bind(struct pipe_context *pipe, void *hwcso) 346 { 347 struct nv50_context *nv50 = nv50_context(pipe); 348 349 nv50->rast = hwcso; 350 nv50->dirty_3d |= NV50_NEW_3D_RASTERIZER; 351 } 352 353 static void 354 nv50_rasterizer_state_delete(struct pipe_context *pipe, void *hwcso) 355 { 356 FREE(hwcso); 357 } 358 359 static void * 360 nv50_zsa_state_create(struct pipe_context *pipe, 361 const struct pipe_depth_stencil_alpha_state *cso) 362 { 363 struct nv50_zsa_stateobj *so = CALLOC_STRUCT(nv50_zsa_stateobj); 364 365 so->pipe = *cso; 366 367 SB_BEGIN_3D(so, DEPTH_WRITE_ENABLE, 1); 368 SB_DATA (so, cso->depth.writemask); 369 SB_BEGIN_3D(so, DEPTH_TEST_ENABLE, 1); 370 if (cso->depth.enabled) { 371 SB_DATA (so, 1); 372 SB_BEGIN_3D(so, DEPTH_TEST_FUNC, 1); 373 SB_DATA (so, nvgl_comparison_op(cso->depth.func)); 374 } else { 375 SB_DATA (so, 0); 376 } 377 378 SB_BEGIN_3D(so, DEPTH_BOUNDS_EN, 1); 379 if (cso->depth.bounds_test) { 380 SB_DATA (so, 1); 381 SB_BEGIN_3D(so, DEPTH_BOUNDS(0), 2); 382 SB_DATA (so, fui(cso->depth.bounds_min)); 383 SB_DATA (so, fui(cso->depth.bounds_max)); 384 } else { 385 SB_DATA (so, 0); 386 } 387 388 if (cso->stencil[0].enabled) { 389 SB_BEGIN_3D(so, STENCIL_ENABLE, 5); 390 SB_DATA (so, 1); 391 SB_DATA (so, nvgl_stencil_op(cso->stencil[0].fail_op)); 392 SB_DATA (so, nvgl_stencil_op(cso->stencil[0].zfail_op)); 393 SB_DATA (so, nvgl_stencil_op(cso->stencil[0].zpass_op)); 394 SB_DATA (so, nvgl_comparison_op(cso->stencil[0].func)); 395 SB_BEGIN_3D(so, STENCIL_FRONT_MASK, 2); 396 SB_DATA (so, cso->stencil[0].writemask); 397 SB_DATA (so, cso->stencil[0].valuemask); 398 } else { 399 SB_BEGIN_3D(so, STENCIL_ENABLE, 1); 400 SB_DATA (so, 0); 401 } 402 403 if (cso->stencil[1].enabled) { 404 assert(cso->stencil[0].enabled); 405 SB_BEGIN_3D(so, STENCIL_TWO_SIDE_ENABLE, 5); 406 SB_DATA (so, 1); 407 SB_DATA (so, nvgl_stencil_op(cso->stencil[1].fail_op)); 408 SB_DATA (so, nvgl_stencil_op(cso->stencil[1].zfail_op)); 409 SB_DATA (so, nvgl_stencil_op(cso->stencil[1].zpass_op)); 410 SB_DATA (so, nvgl_comparison_op(cso->stencil[1].func)); 411 SB_BEGIN_3D(so, STENCIL_BACK_MASK, 2); 412 SB_DATA (so, cso->stencil[1].writemask); 413 SB_DATA (so, cso->stencil[1].valuemask); 414 } else { 415 SB_BEGIN_3D(so, STENCIL_TWO_SIDE_ENABLE, 1); 416 SB_DATA (so, 0); 417 } 418 419 SB_BEGIN_3D(so, ALPHA_TEST_ENABLE, 1); 420 if (cso->alpha.enabled) { 421 SB_DATA (so, 1); 422 SB_BEGIN_3D(so, ALPHA_TEST_REF, 2); 423 SB_DATA (so, fui(cso->alpha.ref_value)); 424 SB_DATA (so, nvgl_comparison_op(cso->alpha.func)); 425 } else { 426 SB_DATA (so, 0); 427 } 428 429 SB_BEGIN_3D(so, CB_ADDR, 1); 430 SB_DATA (so, NV50_CB_AUX_ALPHATEST_OFFSET << (8 - 2) | NV50_CB_AUX); 431 SB_BEGIN_3D(so, CB_DATA(0), 1); 432 SB_DATA (so, fui(cso->alpha.ref_value)); 433 434 assert(so->size <= ARRAY_SIZE(so->state)); 435 return (void *)so; 436 } 437 438 static void 439 nv50_zsa_state_bind(struct pipe_context *pipe, void *hwcso) 440 { 441 struct nv50_context *nv50 = nv50_context(pipe); 442 443 nv50->zsa = hwcso; 444 nv50->dirty_3d |= NV50_NEW_3D_ZSA; 445 } 446 447 static void 448 nv50_zsa_state_delete(struct pipe_context *pipe, void *hwcso) 449 { 450 FREE(hwcso); 451 } 452 453 /* ====================== SAMPLERS AND TEXTURES ================================ 454 */ 455 456 static inline unsigned 457 nv50_tsc_wrap_mode(unsigned wrap) 458 { 459 switch (wrap) { 460 case PIPE_TEX_WRAP_REPEAT: 461 return G80_TSC_WRAP_WRAP; 462 case PIPE_TEX_WRAP_MIRROR_REPEAT: 463 return G80_TSC_WRAP_MIRROR; 464 case PIPE_TEX_WRAP_CLAMP_TO_EDGE: 465 return G80_TSC_WRAP_CLAMP_TO_EDGE; 466 case PIPE_TEX_WRAP_CLAMP_TO_BORDER: 467 return G80_TSC_WRAP_BORDER; 468 case PIPE_TEX_WRAP_CLAMP: 469 return G80_TSC_WRAP_CLAMP_OGL; 470 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE: 471 return G80_TSC_WRAP_MIRROR_ONCE_CLAMP_TO_EDGE; 472 case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER: 473 return G80_TSC_WRAP_MIRROR_ONCE_BORDER; 474 case PIPE_TEX_WRAP_MIRROR_CLAMP: 475 return G80_TSC_WRAP_MIRROR_ONCE_CLAMP_OGL; 476 default: 477 NOUVEAU_ERR("unknown wrap mode: %d\n", wrap); 478 return G80_TSC_WRAP_WRAP; 479 } 480 } 481 482 void * 483 nv50_sampler_state_create(struct pipe_context *pipe, 484 const struct pipe_sampler_state *cso) 485 { 486 struct nv50_tsc_entry *so = MALLOC_STRUCT(nv50_tsc_entry); 487 float f[2]; 488 489 so->id = -1; 490 491 so->tsc[0] = (0x00026000 | 492 (nv50_tsc_wrap_mode(cso->wrap_s) << 0) | 493 (nv50_tsc_wrap_mode(cso->wrap_t) << 3) | 494 (nv50_tsc_wrap_mode(cso->wrap_r) << 6)); 495 496 switch (cso->mag_img_filter) { 497 case PIPE_TEX_FILTER_LINEAR: 498 so->tsc[1] = G80_TSC_1_MAG_FILTER_LINEAR; 499 break; 500 case PIPE_TEX_FILTER_NEAREST: 501 default: 502 so->tsc[1] = G80_TSC_1_MAG_FILTER_NEAREST; 503 break; 504 } 505 506 switch (cso->min_img_filter) { 507 case PIPE_TEX_FILTER_LINEAR: 508 so->tsc[1] |= G80_TSC_1_MIN_FILTER_LINEAR; 509 break; 510 case PIPE_TEX_FILTER_NEAREST: 511 default: 512 so->tsc[1] |= G80_TSC_1_MIN_FILTER_NEAREST; 513 break; 514 } 515 516 switch (cso->min_mip_filter) { 517 case PIPE_TEX_MIPFILTER_LINEAR: 518 so->tsc[1] |= G80_TSC_1_MIP_FILTER_LINEAR; 519 break; 520 case PIPE_TEX_MIPFILTER_NEAREST: 521 so->tsc[1] |= G80_TSC_1_MIP_FILTER_NEAREST; 522 break; 523 case PIPE_TEX_MIPFILTER_NONE: 524 default: 525 so->tsc[1] |= G80_TSC_1_MIP_FILTER_NONE; 526 break; 527 } 528 529 if (nouveau_screen(pipe->screen)->class_3d >= NVE4_3D_CLASS) { 530 if (cso->seamless_cube_map) 531 so->tsc[1] |= GK104_TSC_1_CUBEMAP_INTERFACE_FILTERING; 532 if (!cso->normalized_coords) 533 so->tsc[1] |= GK104_TSC_1_FLOAT_COORD_NORMALIZATION_FORCE_UNNORMALIZED_COORDS; 534 } else { 535 so->seamless_cube_map = cso->seamless_cube_map; 536 } 537 538 if (cso->max_anisotropy >= 16) 539 so->tsc[0] |= (7 << 20); 540 else 541 if (cso->max_anisotropy >= 12) 542 so->tsc[0] |= (6 << 20); 543 else { 544 so->tsc[0] |= (cso->max_anisotropy >> 1) << 20; 545 546 if (cso->max_anisotropy >= 4) 547 so->tsc[1] |= 6 << G80_TSC_1_TRILIN_OPT__SHIFT; 548 else 549 if (cso->max_anisotropy >= 2) 550 so->tsc[1] |= 4 << G80_TSC_1_TRILIN_OPT__SHIFT; 551 } 552 553 if (cso->compare_mode == PIPE_TEX_COMPARE_R_TO_TEXTURE) { 554 /* NOTE: must be deactivated for non-shadow textures */ 555 so->tsc[0] |= (1 << 9); 556 so->tsc[0] |= (nvgl_comparison_op(cso->compare_func) & 0x7) << 10; 557 } 558 559 f[0] = CLAMP(cso->lod_bias, -16.0f, 15.0f); 560 so->tsc[1] |= ((int)(f[0] * 256.0f) & 0x1fff) << 12; 561 562 f[0] = CLAMP(cso->min_lod, 0.0f, 15.0f); 563 f[1] = CLAMP(cso->max_lod, 0.0f, 15.0f); 564 so->tsc[2] = 565 (((int)(f[1] * 256.0f) & 0xfff) << 12) | ((int)(f[0] * 256.0f) & 0xfff); 566 567 so->tsc[2] |= 568 util_format_linear_float_to_srgb_8unorm(cso->border_color.f[0]) << 24; 569 so->tsc[3] = 570 util_format_linear_float_to_srgb_8unorm(cso->border_color.f[1]) << 12; 571 so->tsc[3] |= 572 util_format_linear_float_to_srgb_8unorm(cso->border_color.f[2]) << 20; 573 574 so->tsc[4] = fui(cso->border_color.f[0]); 575 so->tsc[5] = fui(cso->border_color.f[1]); 576 so->tsc[6] = fui(cso->border_color.f[2]); 577 so->tsc[7] = fui(cso->border_color.f[3]); 578 579 return (void *)so; 580 } 581 582 static void 583 nv50_sampler_state_delete(struct pipe_context *pipe, void *hwcso) 584 { 585 unsigned s, i; 586 587 for (s = 0; s < 3; ++s) { 588 assert(nv50_context(pipe)->num_samplers[s] <= PIPE_MAX_SAMPLERS); 589 for (i = 0; i < nv50_context(pipe)->num_samplers[s]; ++i) 590 if (nv50_context(pipe)->samplers[s][i] == hwcso) 591 nv50_context(pipe)->samplers[s][i] = NULL; 592 } 593 594 nv50_screen_tsc_free(nv50_context(pipe)->screen, nv50_tsc_entry(hwcso)); 595 596 FREE(hwcso); 597 } 598 599 static inline void 600 nv50_stage_sampler_states_bind(struct nv50_context *nv50, int s, 601 unsigned nr, void **hwcso) 602 { 603 unsigned i; 604 605 assert(nr <= PIPE_MAX_SAMPLERS); 606 for (i = 0; i < nr; ++i) { 607 struct nv50_tsc_entry *old = nv50->samplers[s][i]; 608 609 nv50->samplers[s][i] = nv50_tsc_entry(hwcso[i]); 610 if (old) 611 nv50_screen_tsc_unlock(nv50->screen, old); 612 } 613 assert(nv50->num_samplers[s] <= PIPE_MAX_SAMPLERS); 614 for (; i < nv50->num_samplers[s]; ++i) { 615 if (nv50->samplers[s][i]) { 616 nv50_screen_tsc_unlock(nv50->screen, nv50->samplers[s][i]); 617 nv50->samplers[s][i] = NULL; 618 } 619 } 620 621 nv50->num_samplers[s] = nr; 622 623 nv50->dirty_3d |= NV50_NEW_3D_SAMPLERS; 624 } 625 626 static void 627 nv50_vp_sampler_states_bind(struct pipe_context *pipe, unsigned nr, void **s) 628 { 629 nv50_stage_sampler_states_bind(nv50_context(pipe), 0, nr, s); 630 } 631 632 static void 633 nv50_fp_sampler_states_bind(struct pipe_context *pipe, unsigned nr, void **s) 634 { 635 nv50_stage_sampler_states_bind(nv50_context(pipe), 2, nr, s); 636 } 637 638 static void 639 nv50_gp_sampler_states_bind(struct pipe_context *pipe, unsigned nr, void **s) 640 { 641 nv50_stage_sampler_states_bind(nv50_context(pipe), 1, nr, s); 642 } 643 644 static void 645 nv50_bind_sampler_states(struct pipe_context *pipe, 646 enum pipe_shader_type shader, unsigned start, 647 unsigned num_samplers, void **samplers) 648 { 649 assert(start == 0); 650 switch (shader) { 651 case PIPE_SHADER_VERTEX: 652 nv50_vp_sampler_states_bind(pipe, num_samplers, samplers); 653 break; 654 case PIPE_SHADER_GEOMETRY: 655 nv50_gp_sampler_states_bind(pipe, num_samplers, samplers); 656 break; 657 case PIPE_SHADER_FRAGMENT: 658 nv50_fp_sampler_states_bind(pipe, num_samplers, samplers); 659 break; 660 default: 661 assert(!"unexpected shader type"); 662 break; 663 } 664 } 665 666 667 668 /* NOTE: only called when not referenced anywhere, won't be bound */ 669 static void 670 nv50_sampler_view_destroy(struct pipe_context *pipe, 671 struct pipe_sampler_view *view) 672 { 673 pipe_resource_reference(&view->texture, NULL); 674 675 nv50_screen_tic_free(nv50_context(pipe)->screen, nv50_tic_entry(view)); 676 677 FREE(nv50_tic_entry(view)); 678 } 679 680 static inline void 681 nv50_stage_set_sampler_views(struct nv50_context *nv50, int s, 682 unsigned nr, 683 struct pipe_sampler_view **views) 684 { 685 unsigned i; 686 687 assert(nr <= PIPE_MAX_SAMPLERS); 688 for (i = 0; i < nr; ++i) { 689 struct nv50_tic_entry *old = nv50_tic_entry(nv50->textures[s][i]); 690 if (old) 691 nv50_screen_tic_unlock(nv50->screen, old); 692 693 if (views[i] && views[i]->texture) { 694 struct pipe_resource *res = views[i]->texture; 695 if (res->target == PIPE_BUFFER && 696 (res->flags & PIPE_RESOURCE_FLAG_MAP_COHERENT)) 697 nv50->textures_coherent[s] |= 1 << i; 698 else 699 nv50->textures_coherent[s] &= ~(1 << i); 700 } else { 701 nv50->textures_coherent[s] &= ~(1 << i); 702 } 703 704 pipe_sampler_view_reference(&nv50->textures[s][i], views[i]); 705 } 706 707 assert(nv50->num_textures[s] <= PIPE_MAX_SAMPLERS); 708 for (i = nr; i < nv50->num_textures[s]; ++i) { 709 struct nv50_tic_entry *old = nv50_tic_entry(nv50->textures[s][i]); 710 if (!old) 711 continue; 712 nv50_screen_tic_unlock(nv50->screen, old); 713 714 pipe_sampler_view_reference(&nv50->textures[s][i], NULL); 715 } 716 717 nv50->num_textures[s] = nr; 718 719 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_TEXTURES); 720 721 nv50->dirty_3d |= NV50_NEW_3D_TEXTURES; 722 } 723 724 static void 725 nv50_set_sampler_views(struct pipe_context *pipe, enum pipe_shader_type shader, 726 unsigned start, unsigned nr, 727 struct pipe_sampler_view **views) 728 { 729 assert(start == 0); 730 switch (shader) { 731 case PIPE_SHADER_VERTEX: 732 nv50_stage_set_sampler_views(nv50_context(pipe), 0, nr, views); 733 break; 734 case PIPE_SHADER_GEOMETRY: 735 nv50_stage_set_sampler_views(nv50_context(pipe), 1, nr, views); 736 break; 737 case PIPE_SHADER_FRAGMENT: 738 nv50_stage_set_sampler_views(nv50_context(pipe), 2, nr, views); 739 break; 740 default: 741 ; 742 } 743 } 744 745 746 747 /* ============================= SHADERS ======================================= 748 */ 749 750 static void * 751 nv50_sp_state_create(struct pipe_context *pipe, 752 const struct pipe_shader_state *cso, unsigned type) 753 { 754 struct nv50_program *prog; 755 756 prog = CALLOC_STRUCT(nv50_program); 757 if (!prog) 758 return NULL; 759 760 prog->type = type; 761 prog->pipe.tokens = tgsi_dup_tokens(cso->tokens); 762 763 if (cso->stream_output.num_outputs) 764 prog->pipe.stream_output = cso->stream_output; 765 766 prog->translated = nv50_program_translate( 767 prog, nv50_context(pipe)->screen->base.device->chipset, 768 &nouveau_context(pipe)->debug); 769 770 return (void *)prog; 771 } 772 773 static void 774 nv50_sp_state_delete(struct pipe_context *pipe, void *hwcso) 775 { 776 struct nv50_program *prog = (struct nv50_program *)hwcso; 777 778 nv50_program_destroy(nv50_context(pipe), prog); 779 780 FREE((void *)prog->pipe.tokens); 781 FREE(prog); 782 } 783 784 static void * 785 nv50_vp_state_create(struct pipe_context *pipe, 786 const struct pipe_shader_state *cso) 787 { 788 return nv50_sp_state_create(pipe, cso, PIPE_SHADER_VERTEX); 789 } 790 791 static void 792 nv50_vp_state_bind(struct pipe_context *pipe, void *hwcso) 793 { 794 struct nv50_context *nv50 = nv50_context(pipe); 795 796 nv50->vertprog = hwcso; 797 nv50->dirty_3d |= NV50_NEW_3D_VERTPROG; 798 } 799 800 static void * 801 nv50_fp_state_create(struct pipe_context *pipe, 802 const struct pipe_shader_state *cso) 803 { 804 return nv50_sp_state_create(pipe, cso, PIPE_SHADER_FRAGMENT); 805 } 806 807 static void 808 nv50_fp_state_bind(struct pipe_context *pipe, void *hwcso) 809 { 810 struct nv50_context *nv50 = nv50_context(pipe); 811 812 nv50->fragprog = hwcso; 813 nv50->dirty_3d |= NV50_NEW_3D_FRAGPROG; 814 } 815 816 static void * 817 nv50_gp_state_create(struct pipe_context *pipe, 818 const struct pipe_shader_state *cso) 819 { 820 return nv50_sp_state_create(pipe, cso, PIPE_SHADER_GEOMETRY); 821 } 822 823 static void 824 nv50_gp_state_bind(struct pipe_context *pipe, void *hwcso) 825 { 826 struct nv50_context *nv50 = nv50_context(pipe); 827 828 nv50->gmtyprog = hwcso; 829 nv50->dirty_3d |= NV50_NEW_3D_GMTYPROG; 830 } 831 832 static void * 833 nv50_cp_state_create(struct pipe_context *pipe, 834 const struct pipe_compute_state *cso) 835 { 836 struct nv50_program *prog; 837 838 prog = CALLOC_STRUCT(nv50_program); 839 if (!prog) 840 return NULL; 841 prog->type = PIPE_SHADER_COMPUTE; 842 843 prog->cp.smem_size = cso->req_local_mem; 844 prog->cp.lmem_size = cso->req_private_mem; 845 prog->parm_size = cso->req_input_mem; 846 847 prog->pipe.tokens = tgsi_dup_tokens((const struct tgsi_token *)cso->prog); 848 849 return (void *)prog; 850 } 851 852 static void 853 nv50_cp_state_bind(struct pipe_context *pipe, void *hwcso) 854 { 855 struct nv50_context *nv50 = nv50_context(pipe); 856 857 nv50->compprog = hwcso; 858 nv50->dirty_cp |= NV50_NEW_CP_PROGRAM; 859 } 860 861 static void 862 nv50_set_constant_buffer(struct pipe_context *pipe, uint shader, uint index, 863 const struct pipe_constant_buffer *cb) 864 { 865 struct nv50_context *nv50 = nv50_context(pipe); 866 struct pipe_resource *res = cb ? cb->buffer : NULL; 867 const unsigned s = nv50_context_shader_stage(shader); 868 const unsigned i = index; 869 870 if (shader == PIPE_SHADER_COMPUTE) 871 return; 872 873 assert(i < NV50_MAX_PIPE_CONSTBUFS); 874 if (nv50->constbuf[s][i].user) 875 nv50->constbuf[s][i].u.buf = NULL; 876 else 877 if (nv50->constbuf[s][i].u.buf) { 878 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_CB(s, i)); 879 nv04_resource(nv50->constbuf[s][i].u.buf)->cb_bindings[s] &= ~(1 << i); 880 } 881 pipe_resource_reference(&nv50->constbuf[s][i].u.buf, res); 882 883 nv50->constbuf[s][i].user = (cb && cb->user_buffer) ? true : false; 884 if (nv50->constbuf[s][i].user) { 885 nv50->constbuf[s][i].u.data = cb->user_buffer; 886 nv50->constbuf[s][i].size = MIN2(cb->buffer_size, 0x10000); 887 nv50->constbuf_valid[s] |= 1 << i; 888 nv50->constbuf_coherent[s] &= ~(1 << i); 889 } else 890 if (res) { 891 nv50->constbuf[s][i].offset = cb->buffer_offset; 892 nv50->constbuf[s][i].size = MIN2(align(cb->buffer_size, 0x100), 0x10000); 893 nv50->constbuf_valid[s] |= 1 << i; 894 if (res->flags & PIPE_RESOURCE_FLAG_MAP_COHERENT) 895 nv50->constbuf_coherent[s] |= 1 << i; 896 else 897 nv50->constbuf_coherent[s] &= ~(1 << i); 898 } else { 899 nv50->constbuf_valid[s] &= ~(1 << i); 900 nv50->constbuf_coherent[s] &= ~(1 << i); 901 } 902 nv50->constbuf_dirty[s] |= 1 << i; 903 904 nv50->dirty_3d |= NV50_NEW_3D_CONSTBUF; 905 } 906 907 /* ============================================================================= 908 */ 909 910 static void 911 nv50_set_blend_color(struct pipe_context *pipe, 912 const struct pipe_blend_color *bcol) 913 { 914 struct nv50_context *nv50 = nv50_context(pipe); 915 916 nv50->blend_colour = *bcol; 917 nv50->dirty_3d |= NV50_NEW_3D_BLEND_COLOUR; 918 } 919 920 static void 921 nv50_set_stencil_ref(struct pipe_context *pipe, 922 const struct pipe_stencil_ref *sr) 923 { 924 struct nv50_context *nv50 = nv50_context(pipe); 925 926 nv50->stencil_ref = *sr; 927 nv50->dirty_3d |= NV50_NEW_3D_STENCIL_REF; 928 } 929 930 static void 931 nv50_set_clip_state(struct pipe_context *pipe, 932 const struct pipe_clip_state *clip) 933 { 934 struct nv50_context *nv50 = nv50_context(pipe); 935 936 memcpy(nv50->clip.ucp, clip->ucp, sizeof(clip->ucp)); 937 938 nv50->dirty_3d |= NV50_NEW_3D_CLIP; 939 } 940 941 static void 942 nv50_set_sample_mask(struct pipe_context *pipe, unsigned sample_mask) 943 { 944 struct nv50_context *nv50 = nv50_context(pipe); 945 946 nv50->sample_mask = sample_mask; 947 nv50->dirty_3d |= NV50_NEW_3D_SAMPLE_MASK; 948 } 949 950 static void 951 nv50_set_min_samples(struct pipe_context *pipe, unsigned min_samples) 952 { 953 struct nv50_context *nv50 = nv50_context(pipe); 954 955 if (nv50->min_samples != min_samples) { 956 nv50->min_samples = min_samples; 957 nv50->dirty_3d |= NV50_NEW_3D_MIN_SAMPLES; 958 } 959 } 960 961 static void 962 nv50_set_framebuffer_state(struct pipe_context *pipe, 963 const struct pipe_framebuffer_state *fb) 964 { 965 struct nv50_context *nv50 = nv50_context(pipe); 966 967 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_FB); 968 969 util_copy_framebuffer_state(&nv50->framebuffer, fb); 970 971 nv50->dirty_3d |= NV50_NEW_3D_FRAMEBUFFER; 972 } 973 974 static void 975 nv50_set_polygon_stipple(struct pipe_context *pipe, 976 const struct pipe_poly_stipple *stipple) 977 { 978 struct nv50_context *nv50 = nv50_context(pipe); 979 980 nv50->stipple = *stipple; 981 nv50->dirty_3d |= NV50_NEW_3D_STIPPLE; 982 } 983 984 static void 985 nv50_set_scissor_states(struct pipe_context *pipe, 986 unsigned start_slot, 987 unsigned num_scissors, 988 const struct pipe_scissor_state *scissor) 989 { 990 struct nv50_context *nv50 = nv50_context(pipe); 991 int i; 992 993 assert(start_slot + num_scissors <= NV50_MAX_VIEWPORTS); 994 for (i = 0; i < num_scissors; i++) { 995 if (!memcmp(&nv50->scissors[start_slot + i], &scissor[i], sizeof(*scissor))) 996 continue; 997 nv50->scissors[start_slot + i] = scissor[i]; 998 nv50->scissors_dirty |= 1 << (start_slot + i); 999 nv50->dirty_3d |= NV50_NEW_3D_SCISSOR; 1000 } 1001 } 1002 1003 static void 1004 nv50_set_viewport_states(struct pipe_context *pipe, 1005 unsigned start_slot, 1006 unsigned num_viewports, 1007 const struct pipe_viewport_state *vpt) 1008 { 1009 struct nv50_context *nv50 = nv50_context(pipe); 1010 int i; 1011 1012 assert(start_slot + num_viewports <= NV50_MAX_VIEWPORTS); 1013 for (i = 0; i < num_viewports; i++) { 1014 if (!memcmp(&nv50->viewports[start_slot + i], &vpt[i], sizeof(*vpt))) 1015 continue; 1016 nv50->viewports[start_slot + i] = vpt[i]; 1017 nv50->viewports_dirty |= 1 << (start_slot + i); 1018 nv50->dirty_3d |= NV50_NEW_3D_VIEWPORT; 1019 } 1020 } 1021 1022 static void 1023 nv50_set_window_rectangles(struct pipe_context *pipe, 1024 boolean include, 1025 unsigned num_rectangles, 1026 const struct pipe_scissor_state *rectangles) 1027 { 1028 struct nv50_context *nv50 = nv50_context(pipe); 1029 1030 nv50->window_rect.inclusive = include; 1031 nv50->window_rect.rects = MIN2(num_rectangles, NV50_MAX_WINDOW_RECTANGLES); 1032 memcpy(nv50->window_rect.rect, rectangles, 1033 sizeof(struct pipe_scissor_state) * nv50->window_rect.rects); 1034 1035 nv50->dirty_3d |= NV50_NEW_3D_WINDOW_RECTS; 1036 } 1037 1038 static void 1039 nv50_set_vertex_buffers(struct pipe_context *pipe, 1040 unsigned start_slot, unsigned count, 1041 const struct pipe_vertex_buffer *vb) 1042 { 1043 struct nv50_context *nv50 = nv50_context(pipe); 1044 unsigned i; 1045 1046 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_VERTEX); 1047 nv50->dirty_3d |= NV50_NEW_3D_ARRAYS; 1048 1049 util_set_vertex_buffers_count(nv50->vtxbuf, &nv50->num_vtxbufs, vb, 1050 start_slot, count); 1051 1052 if (!vb) { 1053 nv50->vbo_user &= ~(((1ull << count) - 1) << start_slot); 1054 nv50->vbo_constant &= ~(((1ull << count) - 1) << start_slot); 1055 nv50->vtxbufs_coherent &= ~(((1ull << count) - 1) << start_slot); 1056 return; 1057 } 1058 1059 for (i = 0; i < count; ++i) { 1060 unsigned dst_index = start_slot + i; 1061 1062 if (!vb[i].buffer && vb[i].user_buffer) { 1063 nv50->vbo_user |= 1 << dst_index; 1064 if (!vb[i].stride) 1065 nv50->vbo_constant |= 1 << dst_index; 1066 else 1067 nv50->vbo_constant &= ~(1 << dst_index); 1068 nv50->vtxbufs_coherent &= ~(1 << dst_index); 1069 } else { 1070 nv50->vbo_user &= ~(1 << dst_index); 1071 nv50->vbo_constant &= ~(1 << dst_index); 1072 1073 if (vb[i].buffer && 1074 vb[i].buffer->flags & PIPE_RESOURCE_FLAG_MAP_COHERENT) 1075 nv50->vtxbufs_coherent |= (1 << dst_index); 1076 else 1077 nv50->vtxbufs_coherent &= ~(1 << dst_index); 1078 } 1079 } 1080 } 1081 1082 static void 1083 nv50_set_index_buffer(struct pipe_context *pipe, 1084 const struct pipe_index_buffer *ib) 1085 { 1086 struct nv50_context *nv50 = nv50_context(pipe); 1087 1088 if (nv50->idxbuf.buffer) 1089 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_INDEX); 1090 1091 if (ib) { 1092 pipe_resource_reference(&nv50->idxbuf.buffer, ib->buffer); 1093 nv50->idxbuf.index_size = ib->index_size; 1094 if (ib->buffer) { 1095 nv50->idxbuf.offset = ib->offset; 1096 BCTX_REFN(nv50->bufctx_3d, 3D_INDEX, nv04_resource(ib->buffer), RD); 1097 } else { 1098 nv50->idxbuf.user_buffer = ib->user_buffer; 1099 } 1100 } else { 1101 pipe_resource_reference(&nv50->idxbuf.buffer, NULL); 1102 } 1103 } 1104 1105 static void 1106 nv50_vertex_state_bind(struct pipe_context *pipe, void *hwcso) 1107 { 1108 struct nv50_context *nv50 = nv50_context(pipe); 1109 1110 nv50->vertex = hwcso; 1111 nv50->dirty_3d |= NV50_NEW_3D_VERTEX; 1112 } 1113 1114 static struct pipe_stream_output_target * 1115 nv50_so_target_create(struct pipe_context *pipe, 1116 struct pipe_resource *res, 1117 unsigned offset, unsigned size) 1118 { 1119 struct nv04_resource *buf = (struct nv04_resource *)res; 1120 struct nv50_so_target *targ = MALLOC_STRUCT(nv50_so_target); 1121 if (!targ) 1122 return NULL; 1123 1124 if (nouveau_context(pipe)->screen->class_3d >= NVA0_3D_CLASS) { 1125 targ->pq = pipe->create_query(pipe, 1126 NVA0_HW_QUERY_STREAM_OUTPUT_BUFFER_OFFSET, 0); 1127 if (!targ->pq) { 1128 FREE(targ); 1129 return NULL; 1130 } 1131 } else { 1132 targ->pq = NULL; 1133 } 1134 targ->clean = true; 1135 1136 targ->pipe.buffer_size = size; 1137 targ->pipe.buffer_offset = offset; 1138 targ->pipe.context = pipe; 1139 targ->pipe.buffer = NULL; 1140 pipe_resource_reference(&targ->pipe.buffer, res); 1141 pipe_reference_init(&targ->pipe.reference, 1); 1142 1143 assert(buf->base.target == PIPE_BUFFER); 1144 util_range_add(&buf->valid_buffer_range, offset, offset + size); 1145 1146 return &targ->pipe; 1147 } 1148 1149 static void 1150 nva0_so_target_save_offset(struct pipe_context *pipe, 1151 struct pipe_stream_output_target *ptarg, 1152 unsigned index, bool serialize) 1153 { 1154 struct nv50_so_target *targ = nv50_so_target(ptarg); 1155 1156 if (serialize) { 1157 struct nouveau_pushbuf *push = nv50_context(pipe)->base.pushbuf; 1158 PUSH_SPACE(push, 2); 1159 BEGIN_NV04(push, SUBC_3D(NV50_GRAPH_SERIALIZE), 1); 1160 PUSH_DATA (push, 0); 1161 } 1162 1163 nv50_query(targ->pq)->index = index; 1164 pipe->end_query(pipe, targ->pq); 1165 } 1166 1167 static void 1168 nv50_so_target_destroy(struct pipe_context *pipe, 1169 struct pipe_stream_output_target *ptarg) 1170 { 1171 struct nv50_so_target *targ = nv50_so_target(ptarg); 1172 if (targ->pq) 1173 pipe->destroy_query(pipe, targ->pq); 1174 pipe_resource_reference(&targ->pipe.buffer, NULL); 1175 FREE(targ); 1176 } 1177 1178 static void 1179 nv50_set_stream_output_targets(struct pipe_context *pipe, 1180 unsigned num_targets, 1181 struct pipe_stream_output_target **targets, 1182 const unsigned *offsets) 1183 { 1184 struct nv50_context *nv50 = nv50_context(pipe); 1185 unsigned i; 1186 bool serialize = true; 1187 const bool can_resume = nv50->screen->base.class_3d >= NVA0_3D_CLASS; 1188 1189 assert(num_targets <= 4); 1190 1191 for (i = 0; i < num_targets; ++i) { 1192 const bool changed = nv50->so_target[i] != targets[i]; 1193 const bool append = (offsets[i] == (unsigned)-1); 1194 if (!changed && append) 1195 continue; 1196 nv50->so_targets_dirty |= 1 << i; 1197 1198 if (can_resume && changed && nv50->so_target[i]) { 1199 nva0_so_target_save_offset(pipe, nv50->so_target[i], i, serialize); 1200 serialize = false; 1201 } 1202 1203 if (targets[i] && !append) 1204 nv50_so_target(targets[i])->clean = true; 1205 1206 pipe_so_target_reference(&nv50->so_target[i], targets[i]); 1207 } 1208 for (; i < nv50->num_so_targets; ++i) { 1209 if (can_resume && nv50->so_target[i]) { 1210 nva0_so_target_save_offset(pipe, nv50->so_target[i], i, serialize); 1211 serialize = false; 1212 } 1213 pipe_so_target_reference(&nv50->so_target[i], NULL); 1214 nv50->so_targets_dirty |= 1 << i; 1215 } 1216 nv50->num_so_targets = num_targets; 1217 1218 if (nv50->so_targets_dirty) { 1219 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_SO); 1220 nv50->dirty_3d |= NV50_NEW_3D_STRMOUT; 1221 } 1222 } 1223 1224 static void 1225 nv50_set_compute_resources(struct pipe_context *pipe, 1226 unsigned start, unsigned nr, 1227 struct pipe_surface **resources) 1228 { 1229 /* TODO: bind surfaces */ 1230 } 1231 1232 static inline void 1233 nv50_set_global_handle(uint32_t *phandle, struct pipe_resource *res) 1234 { 1235 struct nv04_resource *buf = nv04_resource(res); 1236 if (buf) { 1237 uint64_t limit = (buf->address + buf->base.width0) - 1; 1238 if (limit < (1ULL << 32)) { 1239 *phandle = (uint32_t)buf->address; 1240 } else { 1241 NOUVEAU_ERR("Cannot map into TGSI_RESOURCE_GLOBAL: " 1242 "resource not contained within 32-bit address space !\n"); 1243 *phandle = 0; 1244 } 1245 } else { 1246 *phandle = 0; 1247 } 1248 } 1249 1250 static void 1251 nv50_set_global_bindings(struct pipe_context *pipe, 1252 unsigned start, unsigned nr, 1253 struct pipe_resource **resources, 1254 uint32_t **handles) 1255 { 1256 struct nv50_context *nv50 = nv50_context(pipe); 1257 struct pipe_resource **ptr; 1258 unsigned i; 1259 const unsigned end = start + nr; 1260 1261 if (nv50->global_residents.size <= (end * sizeof(struct pipe_resource *))) { 1262 const unsigned old_size = nv50->global_residents.size; 1263 const unsigned req_size = end * sizeof(struct pipe_resource *); 1264 util_dynarray_resize(&nv50->global_residents, req_size); 1265 memset((uint8_t *)nv50->global_residents.data + old_size, 0, 1266 req_size - old_size); 1267 } 1268 1269 if (resources) { 1270 ptr = util_dynarray_element( 1271 &nv50->global_residents, struct pipe_resource *, start); 1272 for (i = 0; i < nr; ++i) { 1273 pipe_resource_reference(&ptr[i], resources[i]); 1274 nv50_set_global_handle(handles[i], resources[i]); 1275 } 1276 } else { 1277 ptr = util_dynarray_element( 1278 &nv50->global_residents, struct pipe_resource *, start); 1279 for (i = 0; i < nr; ++i) 1280 pipe_resource_reference(&ptr[i], NULL); 1281 } 1282 1283 nouveau_bufctx_reset(nv50->bufctx_cp, NV50_BIND_CP_GLOBAL); 1284 1285 nv50->dirty_cp |= NV50_NEW_CP_GLOBALS; 1286 } 1287 1288 void 1289 nv50_init_state_functions(struct nv50_context *nv50) 1290 { 1291 struct pipe_context *pipe = &nv50->base.pipe; 1292 1293 pipe->create_blend_state = nv50_blend_state_create; 1294 pipe->bind_blend_state = nv50_blend_state_bind; 1295 pipe->delete_blend_state = nv50_blend_state_delete; 1296 1297 pipe->create_rasterizer_state = nv50_rasterizer_state_create; 1298 pipe->bind_rasterizer_state = nv50_rasterizer_state_bind; 1299 pipe->delete_rasterizer_state = nv50_rasterizer_state_delete; 1300 1301 pipe->create_depth_stencil_alpha_state = nv50_zsa_state_create; 1302 pipe->bind_depth_stencil_alpha_state = nv50_zsa_state_bind; 1303 pipe->delete_depth_stencil_alpha_state = nv50_zsa_state_delete; 1304 1305 pipe->create_sampler_state = nv50_sampler_state_create; 1306 pipe->delete_sampler_state = nv50_sampler_state_delete; 1307 pipe->bind_sampler_states = nv50_bind_sampler_states; 1308 1309 pipe->create_sampler_view = nv50_create_sampler_view; 1310 pipe->sampler_view_destroy = nv50_sampler_view_destroy; 1311 pipe->set_sampler_views = nv50_set_sampler_views; 1312 1313 pipe->create_vs_state = nv50_vp_state_create; 1314 pipe->create_fs_state = nv50_fp_state_create; 1315 pipe->create_gs_state = nv50_gp_state_create; 1316 pipe->create_compute_state = nv50_cp_state_create; 1317 pipe->bind_vs_state = nv50_vp_state_bind; 1318 pipe->bind_fs_state = nv50_fp_state_bind; 1319 pipe->bind_gs_state = nv50_gp_state_bind; 1320 pipe->bind_compute_state = nv50_cp_state_bind; 1321 pipe->delete_vs_state = nv50_sp_state_delete; 1322 pipe->delete_fs_state = nv50_sp_state_delete; 1323 pipe->delete_gs_state = nv50_sp_state_delete; 1324 pipe->delete_compute_state = nv50_sp_state_delete; 1325 1326 pipe->set_blend_color = nv50_set_blend_color; 1327 pipe->set_stencil_ref = nv50_set_stencil_ref; 1328 pipe->set_clip_state = nv50_set_clip_state; 1329 pipe->set_sample_mask = nv50_set_sample_mask; 1330 pipe->set_min_samples = nv50_set_min_samples; 1331 pipe->set_constant_buffer = nv50_set_constant_buffer; 1332 pipe->set_framebuffer_state = nv50_set_framebuffer_state; 1333 pipe->set_polygon_stipple = nv50_set_polygon_stipple; 1334 pipe->set_scissor_states = nv50_set_scissor_states; 1335 pipe->set_viewport_states = nv50_set_viewport_states; 1336 pipe->set_window_rectangles = nv50_set_window_rectangles; 1337 1338 pipe->create_vertex_elements_state = nv50_vertex_state_create; 1339 pipe->delete_vertex_elements_state = nv50_vertex_state_delete; 1340 pipe->bind_vertex_elements_state = nv50_vertex_state_bind; 1341 1342 pipe->set_vertex_buffers = nv50_set_vertex_buffers; 1343 pipe->set_index_buffer = nv50_set_index_buffer; 1344 1345 pipe->create_stream_output_target = nv50_so_target_create; 1346 pipe->stream_output_target_destroy = nv50_so_target_destroy; 1347 pipe->set_stream_output_targets = nv50_set_stream_output_targets; 1348 1349 pipe->set_global_binding = nv50_set_global_bindings; 1350 pipe->set_compute_resources = nv50_set_compute_resources; 1351 1352 nv50->sample_mask = ~0; 1353 nv50->min_samples = 1; 1354 } 1355