1 /* 2 * Copyright 2011 Joakim Sindholt <opensource (at) zhasha.com> 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * on the rights to use, copy, modify, merge, publish, distribute, sub 8 * license, and/or sell copies of the Software, and to permit persons to whom 9 * the Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice (including the next 12 * paragraph) shall be included in all copies or substantial portions of the 13 * Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, 19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 21 * USE OR OTHER DEALINGS IN THE SOFTWARE. */ 22 23 #include "nine_helpers.h" 24 #include "nine_shader.h" 25 26 #include "vertexdeclaration9.h" 27 #include "vertexshader9.h" 28 29 #include "device9.h" 30 #include "pipe/p_context.h" 31 #include "cso_cache/cso_context.h" 32 33 #define DBG_CHANNEL DBG_VERTEXSHADER 34 35 HRESULT 36 NineVertexShader9_ctor( struct NineVertexShader9 *This, 37 struct NineUnknownParams *pParams, 38 const DWORD *pFunction, void *cso ) 39 { 40 struct NineDevice9 *device; 41 struct nine_shader_info info; 42 struct pipe_context *pipe; 43 HRESULT hr; 44 unsigned i; 45 46 DBG("This=%p pParams=%p pFunction=%p cso=%p\n", 47 This, pParams, pFunction, cso); 48 49 hr = NineUnknown_ctor(&This->base, pParams); 50 if (FAILED(hr)) 51 return hr; 52 53 if (cso) { 54 This->ff_cso = cso; 55 return D3D_OK; 56 } 57 58 device = This->base.device; 59 60 info.type = PIPE_SHADER_VERTEX; 61 info.byte_code = pFunction; 62 info.const_i_base = NINE_CONST_I_BASE(device->max_vs_const_f) / 16; 63 info.const_b_base = NINE_CONST_B_BASE(device->max_vs_const_f) / 16; 64 info.sampler_mask_shadow = 0x0; 65 info.sampler_ps1xtypes = 0x0; 66 info.fog_enable = 0; 67 info.point_size_min = 0; 68 info.point_size_max = 0; 69 info.swvp_on = !!(device->params.BehaviorFlags & D3DCREATE_SOFTWARE_VERTEXPROCESSING); 70 info.process_vertices = false; 71 72 pipe = nine_context_get_pipe_acquire(device); 73 hr = nine_translate_shader(device, &info, pipe); 74 if (hr == D3DERR_INVALIDCALL && 75 (device->params.BehaviorFlags & D3DCREATE_MIXED_VERTEXPROCESSING)) { 76 /* Retry with a swvp shader. It will require swvp to be on. */ 77 info.swvp_on = true; 78 hr = nine_translate_shader(device, &info, pipe); 79 } 80 nine_context_get_pipe_release(device); 81 if (hr == D3DERR_INVALIDCALL) 82 ERR("Encountered buggy shader\n"); 83 if (FAILED(hr)) 84 return hr; 85 This->byte_code.version = info.version; 86 This->swvp_only = info.swvp_on; 87 88 This->byte_code.tokens = mem_dup(pFunction, info.byte_size); 89 if (!This->byte_code.tokens) 90 return E_OUTOFMEMORY; 91 This->byte_code.size = info.byte_size; 92 93 This->variant.cso = info.cso; 94 This->last_cso = info.cso; 95 This->last_key = (uint32_t) (info.swvp_on << 9); 96 97 This->const_used_size = info.const_used_size; 98 This->lconstf = info.lconstf; 99 This->sampler_mask = info.sampler_mask; 100 This->position_t = info.position_t; 101 This->point_size = info.point_size; 102 103 for (i = 0; i < info.num_inputs && i < ARRAY_SIZE(This->input_map); ++i) 104 This->input_map[i].ndecl = info.input_map[i]; 105 This->num_inputs = i; 106 107 return D3D_OK; 108 } 109 110 void 111 NineVertexShader9_dtor( struct NineVertexShader9 *This ) 112 { 113 DBG("This=%p\n", This); 114 115 if (This->base.device) { 116 struct pipe_context *pipe = nine_context_get_pipe_multithread(This->base.device); 117 struct nine_shader_variant *var = &This->variant; 118 struct nine_shader_variant_so *var_so = &This->variant_so; 119 120 do { 121 if (var->cso) { 122 if (This->base.device->context.cso_shader.vs == var->cso) 123 pipe->bind_vs_state(pipe, NULL); 124 pipe->delete_vs_state(pipe, var->cso); 125 } 126 var = var->next; 127 } while (var); 128 129 while (var_so && var_so->vdecl) { 130 if (var_so->cso) { 131 cso_delete_vertex_shader(This->base.device->cso_sw, var_so->cso ); 132 } 133 var_so = var_so->next; 134 } 135 136 if (This->ff_cso) { 137 if (This->ff_cso == This->base.device->context.cso_shader.vs) 138 pipe->bind_vs_state(pipe, NULL); 139 pipe->delete_vs_state(pipe, This->ff_cso); 140 } 141 } 142 nine_shader_variants_free(&This->variant); 143 nine_shader_variants_so_free(&This->variant_so); 144 145 FREE((void *)This->byte_code.tokens); /* const_cast */ 146 147 FREE(This->lconstf.data); 148 FREE(This->lconstf.ranges); 149 150 NineUnknown_dtor(&This->base); 151 } 152 153 HRESULT NINE_WINAPI 154 NineVertexShader9_GetFunction( struct NineVertexShader9 *This, 155 void *pData, 156 UINT *pSizeOfData ) 157 { 158 user_assert(pSizeOfData, D3DERR_INVALIDCALL); 159 160 if (!pData) { 161 *pSizeOfData = This->byte_code.size; 162 return D3D_OK; 163 } 164 user_assert(*pSizeOfData >= This->byte_code.size, D3DERR_INVALIDCALL); 165 166 memcpy(pData, This->byte_code.tokens, This->byte_code.size); 167 168 return D3D_OK; 169 } 170 171 void * 172 NineVertexShader9_GetVariant( struct NineVertexShader9 *This ) 173 { 174 /* GetVariant is called from nine_context, thus we can 175 * get pipe directly */ 176 struct pipe_context *pipe = This->base.device->context.pipe; 177 void *cso; 178 uint64_t key; 179 180 key = This->next_key; 181 if (key == This->last_key) 182 return This->last_cso; 183 184 cso = nine_shader_variant_get(&This->variant, key); 185 if (!cso) { 186 struct NineDevice9 *device = This->base.device; 187 struct nine_shader_info info; 188 HRESULT hr; 189 190 info.type = PIPE_SHADER_VERTEX; 191 info.const_i_base = NINE_CONST_I_BASE(device->max_vs_const_f) / 16; 192 info.const_b_base = NINE_CONST_B_BASE(device->max_vs_const_f) / 16; 193 info.byte_code = This->byte_code.tokens; 194 info.sampler_mask_shadow = key & 0xf; 195 info.fog_enable = device->context.rs[D3DRS_FOGENABLE]; 196 info.point_size_min = asfloat(device->context.rs[D3DRS_POINTSIZE_MIN]); 197 info.point_size_max = asfloat(device->context.rs[D3DRS_POINTSIZE_MAX]); 198 info.swvp_on = device->context.swvp; 199 info.process_vertices = false; 200 201 hr = nine_translate_shader(This->base.device, &info, pipe); 202 if (FAILED(hr)) 203 return NULL; 204 nine_shader_variant_add(&This->variant, key, info.cso); 205 cso = info.cso; 206 } 207 208 This->last_key = key; 209 This->last_cso = cso; 210 211 return cso; 212 } 213 214 void * 215 NineVertexShader9_GetVariantProcessVertices( struct NineVertexShader9 *This, 216 struct NineVertexDeclaration9 *vdecl_out, 217 struct pipe_stream_output_info *so ) 218 { 219 struct nine_shader_info info; 220 HRESULT hr; 221 void *cso; 222 223 cso = nine_shader_variant_so_get(&This->variant_so, vdecl_out, so); 224 if (cso) 225 return cso; 226 227 info.type = PIPE_SHADER_VERTEX; 228 info.const_i_base = 0; 229 info.const_b_base = 0; 230 info.byte_code = This->byte_code.tokens; 231 info.sampler_mask_shadow = 0; 232 info.fog_enable = false; 233 info.point_size_min = 0; 234 info.point_size_max = 0; 235 info.swvp_on = true; 236 info.vdecl_out = vdecl_out; 237 info.process_vertices = true; 238 hr = nine_translate_shader(This->base.device, &info, This->base.device->pipe_sw); 239 if (FAILED(hr)) 240 return NULL; 241 *so = info.so; 242 nine_shader_variant_so_add(&This->variant_so, vdecl_out, so, info.cso); 243 return info.cso; 244 } 245 246 IDirect3DVertexShader9Vtbl NineVertexShader9_vtable = { 247 (void *)NineUnknown_QueryInterface, 248 (void *)NineUnknown_AddRef, 249 (void *)NineUnknown_Release, 250 (void *)NineUnknown_GetDevice, 251 (void *)NineVertexShader9_GetFunction 252 }; 253 254 static const GUID *NineVertexShader9_IIDs[] = { 255 &IID_IDirect3DVertexShader9, 256 &IID_IUnknown, 257 NULL 258 }; 259 260 HRESULT 261 NineVertexShader9_new( struct NineDevice9 *pDevice, 262 struct NineVertexShader9 **ppOut, 263 const DWORD *pFunction, void *cso ) 264 { 265 NINE_DEVICE_CHILD_NEW(VertexShader9, ppOut, pDevice, pFunction, cso); 266 } 267