1 /* 2 * Copyright 2010 Christoph Bumiller 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 */ 22 23 #include "pipe/p_defines.h" 24 #include "util/u_framebuffer.h" 25 #include "util/u_upload_mgr.h" 26 27 #include "nv50/nv50_context.h" 28 #include "nv50/nv50_screen.h" 29 #include "nv50/nv50_resource.h" 30 31 static void 32 nv50_flush(struct pipe_context *pipe, 33 struct pipe_fence_handle **fence, 34 unsigned flags) 35 { 36 struct nouveau_screen *screen = nouveau_screen(pipe->screen); 37 38 if (fence) 39 nouveau_fence_ref(screen->fence.current, (struct nouveau_fence **)fence); 40 41 PUSH_KICK(screen->pushbuf); 42 43 nouveau_context_update_frame_stats(nouveau_context(pipe)); 44 } 45 46 static void 47 nv50_texture_barrier(struct pipe_context *pipe, unsigned flags) 48 { 49 struct nouveau_pushbuf *push = nv50_context(pipe)->base.pushbuf; 50 51 BEGIN_NV04(push, SUBC_3D(NV50_GRAPH_SERIALIZE), 1); 52 PUSH_DATA (push, 0); 53 BEGIN_NV04(push, NV50_3D(TEX_CACHE_CTL), 1); 54 PUSH_DATA (push, 0x20); 55 } 56 57 static void 58 nv50_memory_barrier(struct pipe_context *pipe, unsigned flags) 59 { 60 struct nv50_context *nv50 = nv50_context(pipe); 61 int i, s; 62 63 if (flags & PIPE_BARRIER_MAPPED_BUFFER) { 64 for (i = 0; i < nv50->num_vtxbufs; ++i) { 65 if (!nv50->vtxbuf[i].buffer.resource && !nv50->vtxbuf[i].is_user_buffer) 66 continue; 67 if (nv50->vtxbuf[i].buffer.resource->flags & PIPE_RESOURCE_FLAG_MAP_PERSISTENT) 68 nv50->base.vbo_dirty = true; 69 } 70 71 for (s = 0; s < 3 && !nv50->cb_dirty; ++s) { 72 uint32_t valid = nv50->constbuf_valid[s]; 73 74 while (valid && !nv50->cb_dirty) { 75 const unsigned i = ffs(valid) - 1; 76 struct pipe_resource *res; 77 78 valid &= ~(1 << i); 79 if (nv50->constbuf[s][i].user) 80 continue; 81 82 res = nv50->constbuf[s][i].u.buf; 83 if (!res) 84 continue; 85 86 if (res->flags & PIPE_RESOURCE_FLAG_MAP_PERSISTENT) 87 nv50->cb_dirty = true; 88 } 89 } 90 } 91 } 92 93 static void 94 nv50_emit_string_marker(struct pipe_context *pipe, const char *str, int len) 95 { 96 struct nouveau_pushbuf *push = nv50_context(pipe)->base.pushbuf; 97 int string_words = len / 4; 98 int data_words; 99 100 if (len <= 0) 101 return; 102 string_words = MIN2(string_words, NV04_PFIFO_MAX_PACKET_LEN); 103 if (string_words == NV04_PFIFO_MAX_PACKET_LEN) 104 data_words = string_words; 105 else 106 data_words = string_words + !!(len & 3); 107 BEGIN_NI04(push, SUBC_3D(NV04_GRAPH_NOP), data_words); 108 if (string_words) 109 PUSH_DATAp(push, str, string_words); 110 if (string_words != data_words) { 111 int data = 0; 112 memcpy(&data, &str[string_words * 4], len & 3); 113 PUSH_DATA (push, data); 114 } 115 } 116 117 void 118 nv50_default_kick_notify(struct nouveau_pushbuf *push) 119 { 120 struct nv50_screen *screen = push->user_priv; 121 122 if (screen) { 123 nouveau_fence_next(&screen->base); 124 nouveau_fence_update(&screen->base, true); 125 if (screen->cur_ctx) 126 screen->cur_ctx->state.flushed = true; 127 } 128 } 129 130 static void 131 nv50_context_unreference_resources(struct nv50_context *nv50) 132 { 133 unsigned s, i; 134 135 nouveau_bufctx_del(&nv50->bufctx_3d); 136 nouveau_bufctx_del(&nv50->bufctx); 137 nouveau_bufctx_del(&nv50->bufctx_cp); 138 139 util_unreference_framebuffer_state(&nv50->framebuffer); 140 141 assert(nv50->num_vtxbufs <= PIPE_MAX_ATTRIBS); 142 for (i = 0; i < nv50->num_vtxbufs; ++i) 143 pipe_vertex_buffer_unreference(&nv50->vtxbuf[i]); 144 145 for (s = 0; s < 3; ++s) { 146 assert(nv50->num_textures[s] <= PIPE_MAX_SAMPLERS); 147 for (i = 0; i < nv50->num_textures[s]; ++i) 148 pipe_sampler_view_reference(&nv50->textures[s][i], NULL); 149 150 for (i = 0; i < NV50_MAX_PIPE_CONSTBUFS; ++i) 151 if (!nv50->constbuf[s][i].user) 152 pipe_resource_reference(&nv50->constbuf[s][i].u.buf, NULL); 153 } 154 155 for (i = 0; i < nv50->global_residents.size / sizeof(struct pipe_resource *); 156 ++i) { 157 struct pipe_resource **res = util_dynarray_element( 158 &nv50->global_residents, struct pipe_resource *, i); 159 pipe_resource_reference(res, NULL); 160 } 161 util_dynarray_fini(&nv50->global_residents); 162 } 163 164 static void 165 nv50_destroy(struct pipe_context *pipe) 166 { 167 struct nv50_context *nv50 = nv50_context(pipe); 168 169 if (nv50->screen->cur_ctx == nv50) { 170 nv50->screen->cur_ctx = NULL; 171 /* Save off the state in case another context gets created */ 172 nv50->screen->save_state = nv50->state; 173 } 174 175 if (nv50->base.pipe.stream_uploader) 176 u_upload_destroy(nv50->base.pipe.stream_uploader); 177 178 nouveau_pushbuf_bufctx(nv50->base.pushbuf, NULL); 179 nouveau_pushbuf_kick(nv50->base.pushbuf, nv50->base.pushbuf->channel); 180 181 nv50_context_unreference_resources(nv50); 182 183 FREE(nv50->blit); 184 185 nouveau_context_destroy(&nv50->base); 186 } 187 188 static int 189 nv50_invalidate_resource_storage(struct nouveau_context *ctx, 190 struct pipe_resource *res, 191 int ref) 192 { 193 struct nv50_context *nv50 = nv50_context(&ctx->pipe); 194 unsigned bind = res->bind ? res->bind : PIPE_BIND_VERTEX_BUFFER; 195 unsigned s, i; 196 197 if (bind & PIPE_BIND_RENDER_TARGET) { 198 assert(nv50->framebuffer.nr_cbufs <= PIPE_MAX_COLOR_BUFS); 199 for (i = 0; i < nv50->framebuffer.nr_cbufs; ++i) { 200 if (nv50->framebuffer.cbufs[i] && 201 nv50->framebuffer.cbufs[i]->texture == res) { 202 nv50->dirty_3d |= NV50_NEW_3D_FRAMEBUFFER; 203 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_FB); 204 if (!--ref) 205 return ref; 206 } 207 } 208 } 209 if (bind & PIPE_BIND_DEPTH_STENCIL) { 210 if (nv50->framebuffer.zsbuf && 211 nv50->framebuffer.zsbuf->texture == res) { 212 nv50->dirty_3d |= NV50_NEW_3D_FRAMEBUFFER; 213 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_FB); 214 if (!--ref) 215 return ref; 216 } 217 } 218 219 if (bind & (PIPE_BIND_VERTEX_BUFFER | 220 PIPE_BIND_INDEX_BUFFER | 221 PIPE_BIND_CONSTANT_BUFFER | 222 PIPE_BIND_STREAM_OUTPUT | 223 PIPE_BIND_SAMPLER_VIEW)) { 224 225 assert(nv50->num_vtxbufs <= PIPE_MAX_ATTRIBS); 226 for (i = 0; i < nv50->num_vtxbufs; ++i) { 227 if (nv50->vtxbuf[i].buffer.resource == res) { 228 nv50->dirty_3d |= NV50_NEW_3D_ARRAYS; 229 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_VERTEX); 230 if (!--ref) 231 return ref; 232 } 233 } 234 235 for (s = 0; s < 3; ++s) { 236 assert(nv50->num_textures[s] <= PIPE_MAX_SAMPLERS); 237 for (i = 0; i < nv50->num_textures[s]; ++i) { 238 if (nv50->textures[s][i] && 239 nv50->textures[s][i]->texture == res) { 240 nv50->dirty_3d |= NV50_NEW_3D_TEXTURES; 241 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_TEXTURES); 242 if (!--ref) 243 return ref; 244 } 245 } 246 } 247 248 for (s = 0; s < 3; ++s) { 249 for (i = 0; i < NV50_MAX_PIPE_CONSTBUFS; ++i) { 250 if (!(nv50->constbuf_valid[s] & (1 << i))) 251 continue; 252 if (!nv50->constbuf[s][i].user && 253 nv50->constbuf[s][i].u.buf == res) { 254 nv50->dirty_3d |= NV50_NEW_3D_CONSTBUF; 255 nv50->constbuf_dirty[s] |= 1 << i; 256 nouveau_bufctx_reset(nv50->bufctx_3d, NV50_BIND_3D_CB(s, i)); 257 if (!--ref) 258 return ref; 259 } 260 } 261 } 262 } 263 264 return ref; 265 } 266 267 static void 268 nv50_context_get_sample_position(struct pipe_context *, unsigned, unsigned, 269 float *); 270 271 struct pipe_context * 272 nv50_create(struct pipe_screen *pscreen, void *priv, unsigned ctxflags) 273 { 274 struct nv50_screen *screen = nv50_screen(pscreen); 275 struct nv50_context *nv50; 276 struct pipe_context *pipe; 277 int ret; 278 uint32_t flags; 279 280 nv50 = CALLOC_STRUCT(nv50_context); 281 if (!nv50) 282 return NULL; 283 pipe = &nv50->base.pipe; 284 285 if (!nv50_blitctx_create(nv50)) 286 goto out_err; 287 288 nv50->base.pushbuf = screen->base.pushbuf; 289 nv50->base.client = screen->base.client; 290 291 ret = nouveau_bufctx_new(screen->base.client, 2, &nv50->bufctx); 292 if (!ret) 293 ret = nouveau_bufctx_new(screen->base.client, NV50_BIND_3D_COUNT, 294 &nv50->bufctx_3d); 295 if (!ret) 296 ret = nouveau_bufctx_new(screen->base.client, NV50_BIND_CP_COUNT, 297 &nv50->bufctx_cp); 298 if (ret) 299 goto out_err; 300 301 nv50->base.screen = &screen->base; 302 nv50->base.copy_data = nv50_m2mf_copy_linear; 303 nv50->base.push_data = nv50_sifc_linear_u8; 304 nv50->base.push_cb = nv50_cb_push; 305 306 nv50->screen = screen; 307 pipe->screen = pscreen; 308 pipe->priv = priv; 309 pipe->stream_uploader = u_upload_create_default(pipe); 310 if (!pipe->stream_uploader) 311 goto out_err; 312 pipe->const_uploader = pipe->stream_uploader; 313 314 pipe->destroy = nv50_destroy; 315 316 pipe->draw_vbo = nv50_draw_vbo; 317 pipe->clear = nv50_clear; 318 pipe->launch_grid = nv50_launch_grid; 319 320 pipe->flush = nv50_flush; 321 pipe->texture_barrier = nv50_texture_barrier; 322 pipe->memory_barrier = nv50_memory_barrier; 323 pipe->get_sample_position = nv50_context_get_sample_position; 324 pipe->emit_string_marker = nv50_emit_string_marker; 325 326 if (!screen->cur_ctx) { 327 /* Restore the last context's state here, normally handled during 328 * context switch 329 */ 330 nv50->state = screen->save_state; 331 screen->cur_ctx = nv50; 332 nouveau_pushbuf_bufctx(screen->base.pushbuf, nv50->bufctx); 333 } 334 nv50->base.pushbuf->kick_notify = nv50_default_kick_notify; 335 336 nouveau_context_init(&nv50->base); 337 nv50_init_query_functions(nv50); 338 nv50_init_surface_functions(nv50); 339 nv50_init_state_functions(nv50); 340 nv50_init_resource_functions(pipe); 341 342 nv50->base.invalidate_resource_storage = nv50_invalidate_resource_storage; 343 344 if (screen->base.device->chipset < 0x84 || 345 debug_get_bool_option("NOUVEAU_PMPEG", false)) { 346 /* PMPEG */ 347 nouveau_context_init_vdec(&nv50->base); 348 } else if (screen->base.device->chipset < 0x98 || 349 screen->base.device->chipset == 0xa0) { 350 /* VP2 */ 351 pipe->create_video_codec = nv84_create_decoder; 352 pipe->create_video_buffer = nv84_video_buffer_create; 353 } else { 354 /* VP3/4 */ 355 pipe->create_video_codec = nv98_create_decoder; 356 pipe->create_video_buffer = nv98_video_buffer_create; 357 } 358 359 flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_RD; 360 361 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->code); 362 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->uniforms); 363 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->txc); 364 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->stack_bo); 365 if (screen->compute) { 366 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->code); 367 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->txc); 368 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->stack_bo); 369 } 370 371 flags = NOUVEAU_BO_GART | NOUVEAU_BO_WR; 372 373 BCTX_REFN_bo(nv50->bufctx_3d, 3D_SCREEN, flags, screen->fence.bo); 374 BCTX_REFN_bo(nv50->bufctx, FENCE, flags, screen->fence.bo); 375 if (screen->compute) 376 BCTX_REFN_bo(nv50->bufctx_cp, CP_SCREEN, flags, screen->fence.bo); 377 378 nv50->base.scratch.bo_size = 2 << 20; 379 380 util_dynarray_init(&nv50->global_residents, NULL); 381 382 return pipe; 383 384 out_err: 385 if (pipe->stream_uploader) 386 u_upload_destroy(pipe->stream_uploader); 387 if (nv50->bufctx_3d) 388 nouveau_bufctx_del(&nv50->bufctx_3d); 389 if (nv50->bufctx_cp) 390 nouveau_bufctx_del(&nv50->bufctx_cp); 391 if (nv50->bufctx) 392 nouveau_bufctx_del(&nv50->bufctx); 393 FREE(nv50->blit); 394 FREE(nv50); 395 return NULL; 396 } 397 398 void 399 nv50_bufctx_fence(struct nouveau_bufctx *bufctx, bool on_flush) 400 { 401 struct nouveau_list *list = on_flush ? &bufctx->current : &bufctx->pending; 402 struct nouveau_list *it; 403 404 for (it = list->next; it != list; it = it->next) { 405 struct nouveau_bufref *ref = (struct nouveau_bufref *)it; 406 struct nv04_resource *res = ref->priv; 407 if (res) 408 nv50_resource_validate(res, (unsigned)ref->priv_data); 409 } 410 } 411 412 static void 413 nv50_context_get_sample_position(struct pipe_context *pipe, 414 unsigned sample_count, unsigned sample_index, 415 float *xy) 416 { 417 static const uint8_t ms1[1][2] = { { 0x8, 0x8 } }; 418 static const uint8_t ms2[2][2] = { 419 { 0x4, 0x4 }, { 0xc, 0xc } }; /* surface coords (0,0), (1,0) */ 420 static const uint8_t ms4[4][2] = { 421 { 0x6, 0x2 }, { 0xe, 0x6 }, /* (0,0), (1,0) */ 422 { 0x2, 0xa }, { 0xa, 0xe } }; /* (0,1), (1,1) */ 423 static const uint8_t ms8[8][2] = { 424 { 0x1, 0x7 }, { 0x5, 0x3 }, /* (0,0), (1,0) */ 425 { 0x3, 0xd }, { 0x7, 0xb }, /* (0,1), (1,1) */ 426 { 0x9, 0x5 }, { 0xf, 0x1 }, /* (2,0), (3,0) */ 427 { 0xb, 0xf }, { 0xd, 0x9 } }; /* (2,1), (3,1) */ 428 #if 0 429 /* NOTE: there are alternative modes for MS2 and MS8, currently not used */ 430 static const uint8_t ms8_alt[8][2] = { 431 { 0x9, 0x5 }, { 0x7, 0xb }, /* (2,0), (1,1) */ 432 { 0xd, 0x9 }, { 0x5, 0x3 }, /* (3,1), (1,0) */ 433 { 0x3, 0xd }, { 0x1, 0x7 }, /* (0,1), (0,0) */ 434 { 0xb, 0xf }, { 0xf, 0x1 } }; /* (2,1), (3,0) */ 435 #endif 436 437 const uint8_t (*ptr)[2]; 438 439 switch (sample_count) { 440 case 0: 441 case 1: ptr = ms1; break; 442 case 2: ptr = ms2; break; 443 case 4: ptr = ms4; break; 444 case 8: ptr = ms8; break; 445 default: 446 assert(0); 447 return; /* bad sample count -> undefined locations */ 448 } 449 xy[0] = ptr[sample_index][0] * 0.0625f; 450 xy[1] = ptr[sample_index][1] * 0.0625f; 451 } 452