1 /********************************************************** 2 * Copyright 2008-2009 VMware, Inc. All rights reserved. 3 * 4 * Permission is hereby granted, free of charge, to any person 5 * obtaining a copy of this software and associated documentation 6 * files (the "Software"), to deal in the Software without 7 * restriction, including without limitation the rights to use, copy, 8 * modify, merge, publish, distribute, sublicense, and/or sell copies 9 * of the Software, and to permit persons to whom the Software is 10 * furnished to do so, subject to the following conditions: 11 * 12 * The above copyright notice and this permission notice shall be 13 * included in all copies or substantial portions of the Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 22 * SOFTWARE. 23 * 24 **********************************************************/ 25 26 #include "pipe/p_defines.h" 27 #include "util/u_bitmask.h" 28 #include "util/u_format.h" 29 #include "util/u_helpers.h" 30 #include "util/u_inlines.h" 31 #include "util/u_math.h" 32 #include "util/u_memory.h" 33 #include "util/u_transfer.h" 34 #include "tgsi/tgsi_parse.h" 35 36 #include "svga_context.h" 37 #include "svga_cmd.h" 38 #include "svga_format.h" 39 #include "svga_resource_buffer.h" 40 #include "svga_screen.h" 41 42 43 static void svga_set_vertex_buffers(struct pipe_context *pipe, 44 unsigned start_slot, unsigned count, 45 const struct pipe_vertex_buffer *buffers) 46 { 47 struct svga_context *svga = svga_context(pipe); 48 49 util_set_vertex_buffers_count(svga->curr.vb, 50 &svga->curr.num_vertex_buffers, 51 buffers, start_slot, count); 52 53 svga->dirty |= SVGA_NEW_VBUFFER; 54 } 55 56 57 static void svga_set_index_buffer(struct pipe_context *pipe, 58 const struct pipe_index_buffer *ib) 59 { 60 struct svga_context *svga = svga_context(pipe); 61 62 util_set_index_buffer(&svga->curr.ib, ib); 63 } 64 65 66 /** 67 * Does the given vertex attrib format need range adjustment in the VS? 68 * Range adjustment scales and biases values from [0,1] to [-1,1]. 69 * This lets us avoid the swtnl path. 70 */ 71 static boolean 72 attrib_needs_range_adjustment(enum pipe_format format) 73 { 74 switch (format) { 75 case PIPE_FORMAT_R8G8B8_SNORM: 76 return TRUE; 77 default: 78 return FALSE; 79 } 80 } 81 82 83 /** 84 * Given a gallium vertex element format, return the corresponding 85 * SVGA3dDeclType. 86 */ 87 static SVGA3dDeclType 88 translate_vertex_format_to_decltype(enum pipe_format format) 89 { 90 switch (format) { 91 case PIPE_FORMAT_R32_FLOAT: return SVGA3D_DECLTYPE_FLOAT1; 92 case PIPE_FORMAT_R32G32_FLOAT: return SVGA3D_DECLTYPE_FLOAT2; 93 case PIPE_FORMAT_R32G32B32_FLOAT: return SVGA3D_DECLTYPE_FLOAT3; 94 case PIPE_FORMAT_R32G32B32A32_FLOAT: return SVGA3D_DECLTYPE_FLOAT4; 95 case PIPE_FORMAT_B8G8R8A8_UNORM: return SVGA3D_DECLTYPE_D3DCOLOR; 96 case PIPE_FORMAT_R8G8B8A8_USCALED: return SVGA3D_DECLTYPE_UBYTE4; 97 case PIPE_FORMAT_R16G16_SSCALED: return SVGA3D_DECLTYPE_SHORT2; 98 case PIPE_FORMAT_R16G16B16A16_SSCALED: return SVGA3D_DECLTYPE_SHORT4; 99 case PIPE_FORMAT_R8G8B8A8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N; 100 case PIPE_FORMAT_R16G16_SNORM: return SVGA3D_DECLTYPE_SHORT2N; 101 case PIPE_FORMAT_R16G16B16A16_SNORM: return SVGA3D_DECLTYPE_SHORT4N; 102 case PIPE_FORMAT_R16G16_UNORM: return SVGA3D_DECLTYPE_USHORT2N; 103 case PIPE_FORMAT_R16G16B16A16_UNORM: return SVGA3D_DECLTYPE_USHORT4N; 104 case PIPE_FORMAT_R10G10B10X2_USCALED: return SVGA3D_DECLTYPE_UDEC3; 105 case PIPE_FORMAT_R10G10B10X2_SNORM: return SVGA3D_DECLTYPE_DEC3N; 106 case PIPE_FORMAT_R16G16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_2; 107 case PIPE_FORMAT_R16G16B16A16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_4; 108 109 /* See attrib_needs_adjustment() and attrib_needs_w_to_1() above */ 110 case PIPE_FORMAT_R8G8B8_SNORM: return SVGA3D_DECLTYPE_UBYTE4N; 111 112 /* See attrib_needs_w_to_1() above */ 113 case PIPE_FORMAT_R16G16B16_SNORM: return SVGA3D_DECLTYPE_SHORT4N; 114 case PIPE_FORMAT_R16G16B16_UNORM: return SVGA3D_DECLTYPE_USHORT4N; 115 case PIPE_FORMAT_R8G8B8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N; 116 117 default: 118 /* There are many formats without hardware support. This case 119 * will be hit regularly, meaning we'll need swvfetch. 120 */ 121 return SVGA3D_DECLTYPE_MAX; 122 } 123 } 124 125 126 static void 127 define_input_element_object(struct svga_context *svga, 128 struct svga_velems_state *velems) 129 { 130 SVGA3dInputElementDesc elements[PIPE_MAX_ATTRIBS]; 131 enum pipe_error ret; 132 unsigned i; 133 134 assert(velems->count <= PIPE_MAX_ATTRIBS); 135 assert(svga_have_vgpu10(svga)); 136 137 for (i = 0; i < velems->count; i++) { 138 const struct pipe_vertex_element *elem = velems->velem + i; 139 SVGA3dSurfaceFormat svga_format; 140 unsigned vf_flags; 141 142 svga_translate_vertex_format_vgpu10(elem->src_format, 143 &svga_format, &vf_flags); 144 145 velems->decl_type[i] = 146 translate_vertex_format_to_decltype(elem->src_format); 147 elements[i].inputSlot = elem->vertex_buffer_index; 148 elements[i].alignedByteOffset = elem->src_offset; 149 elements[i].format = svga_format; 150 151 if (elem->instance_divisor) { 152 elements[i].inputSlotClass = SVGA3D_INPUT_PER_INSTANCE_DATA; 153 elements[i].instanceDataStepRate = elem->instance_divisor; 154 } 155 else { 156 elements[i].inputSlotClass = SVGA3D_INPUT_PER_VERTEX_DATA; 157 elements[i].instanceDataStepRate = 0; 158 } 159 elements[i].inputRegister = i; 160 161 if (elements[i].format == SVGA3D_FORMAT_INVALID) { 162 velems->need_swvfetch = TRUE; 163 } 164 165 if (util_format_is_pure_integer(elem->src_format)) { 166 velems->attrib_is_pure_int |= (1 << i); 167 } 168 169 if (vf_flags & VF_W_TO_1) { 170 velems->adjust_attrib_w_1 |= (1 << i); 171 } 172 173 if (vf_flags & VF_U_TO_F_CAST) { 174 velems->adjust_attrib_utof |= (1 << i); 175 } 176 else if (vf_flags & VF_I_TO_F_CAST) { 177 velems->adjust_attrib_itof |= (1 << i); 178 } 179 180 if (vf_flags & VF_BGRA) { 181 velems->attrib_is_bgra |= (1 << i); 182 } 183 184 if (vf_flags & VF_PUINT_TO_SNORM) { 185 velems->attrib_puint_to_snorm |= (1 << i); 186 } 187 else if (vf_flags & VF_PUINT_TO_USCALED) { 188 velems->attrib_puint_to_uscaled |= (1 << i); 189 } 190 else if (vf_flags & VF_PUINT_TO_SSCALED) { 191 velems->attrib_puint_to_sscaled |= (1 << i); 192 } 193 } 194 195 velems->id = util_bitmask_add(svga->input_element_object_id_bm); 196 197 ret = SVGA3D_vgpu10_DefineElementLayout(svga->swc, velems->count, 198 velems->id, elements); 199 if (ret != PIPE_OK) { 200 svga_context_flush(svga, NULL); 201 ret = SVGA3D_vgpu10_DefineElementLayout(svga->swc, velems->count, 202 velems->id, elements); 203 assert(ret == PIPE_OK); 204 } 205 } 206 207 208 /** 209 * Translate the vertex element types to SVGA3dDeclType and check 210 * for VS-based vertex attribute adjustments. 211 */ 212 static void 213 translate_vertex_decls(struct svga_context *svga, 214 struct svga_velems_state *velems) 215 { 216 unsigned i; 217 218 assert(!svga_have_vgpu10(svga)); 219 220 for (i = 0; i < velems->count; i++) { 221 const enum pipe_format f = velems->velem[i].src_format; 222 SVGA3dSurfaceFormat svga_format; 223 unsigned vf_flags; 224 225 svga_translate_vertex_format_vgpu10(f, &svga_format, &vf_flags); 226 227 velems->decl_type[i] = translate_vertex_format_to_decltype(f); 228 if (velems->decl_type[i] == SVGA3D_DECLTYPE_MAX) { 229 /* Unsupported format - use software fetch */ 230 velems->need_swvfetch = TRUE; 231 } 232 233 /* Check for VS-based adjustments */ 234 if (attrib_needs_range_adjustment(f)) { 235 velems->adjust_attrib_range |= (1 << i); 236 } 237 238 if (vf_flags & VF_W_TO_1) { 239 velems->adjust_attrib_w_1 |= (1 << i); 240 } 241 } 242 } 243 244 245 static void * 246 svga_create_vertex_elements_state(struct pipe_context *pipe, 247 unsigned count, 248 const struct pipe_vertex_element *attribs) 249 { 250 struct svga_context *svga = svga_context(pipe); 251 struct svga_velems_state *velems; 252 253 assert(count <= PIPE_MAX_ATTRIBS); 254 velems = (struct svga_velems_state *) MALLOC(sizeof(struct svga_velems_state)); 255 if (velems) { 256 velems->count = count; 257 memcpy(velems->velem, attribs, sizeof(*attribs) * count); 258 259 velems->need_swvfetch = FALSE; 260 velems->adjust_attrib_range = 0x0; 261 velems->attrib_is_pure_int = 0x0; 262 velems->adjust_attrib_w_1 = 0x0; 263 velems->adjust_attrib_itof = 0x0; 264 velems->adjust_attrib_utof = 0x0; 265 velems->attrib_is_bgra = 0x0; 266 velems->attrib_puint_to_snorm = 0x0; 267 velems->attrib_puint_to_uscaled = 0x0; 268 velems->attrib_puint_to_sscaled = 0x0; 269 270 if (svga_have_vgpu10(svga)) { 271 define_input_element_object(svga, velems); 272 } 273 else { 274 translate_vertex_decls(svga, velems); 275 } 276 } 277 278 svga->hud.num_vertexelement_objects++; 279 SVGA_STATS_COUNT_INC(svga_screen(svga->pipe.screen)->sws, 280 SVGA_STATS_COUNT_VERTEXELEMENT); 281 282 return velems; 283 } 284 285 286 static void 287 svga_bind_vertex_elements_state(struct pipe_context *pipe, void *state) 288 { 289 struct svga_context *svga = svga_context(pipe); 290 struct svga_velems_state *velems = (struct svga_velems_state *) state; 291 292 svga->curr.velems = velems; 293 svga->dirty |= SVGA_NEW_VELEMENT; 294 } 295 296 297 static void 298 svga_delete_vertex_elements_state(struct pipe_context *pipe, void *state) 299 { 300 struct svga_context *svga = svga_context(pipe); 301 struct svga_velems_state *velems = (struct svga_velems_state *) state; 302 303 if (svga_have_vgpu10(svga)) { 304 enum pipe_error ret; 305 306 svga_hwtnl_flush_retry(svga); 307 308 ret = SVGA3D_vgpu10_DestroyElementLayout(svga->swc, velems->id); 309 if (ret != PIPE_OK) { 310 svga_context_flush(svga, NULL); 311 ret = SVGA3D_vgpu10_DestroyElementLayout(svga->swc, velems->id); 312 assert(ret == PIPE_OK); 313 } 314 315 if (velems->id == svga->state.hw_draw.layout_id) 316 svga->state.hw_draw.layout_id = SVGA3D_INVALID_ID; 317 318 util_bitmask_clear(svga->input_element_object_id_bm, velems->id); 319 velems->id = SVGA3D_INVALID_ID; 320 } 321 322 FREE(velems); 323 svga->hud.num_vertexelement_objects--; 324 } 325 326 void svga_cleanup_vertex_state( struct svga_context *svga ) 327 { 328 unsigned i; 329 330 for (i = 0 ; i < svga->curr.num_vertex_buffers; i++) 331 pipe_resource_reference(&svga->curr.vb[i].buffer, NULL); 332 333 pipe_resource_reference(&svga->state.hw_draw.ib, NULL); 334 335 for (i = 0; i < svga->state.hw_draw.num_vbuffers; i++) 336 pipe_resource_reference(&svga->state.hw_draw.vbuffers[i], NULL); 337 } 338 339 340 void svga_init_vertex_functions( struct svga_context *svga ) 341 { 342 svga->pipe.set_vertex_buffers = svga_set_vertex_buffers; 343 svga->pipe.set_index_buffer = svga_set_index_buffer; 344 svga->pipe.create_vertex_elements_state = svga_create_vertex_elements_state; 345 svga->pipe.bind_vertex_elements_state = svga_bind_vertex_elements_state; 346 svga->pipe.delete_vertex_elements_state = svga_delete_vertex_elements_state; 347 } 348