1 /* 2 * Copyright 2013 Intel Corporation 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice (including the next 12 * paragraph) shall be included in all copies or substantial portions of the 13 * Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER 21 * DEALINGS IN THE SOFTWARE. 22 */ 23 24 #include "glsl_parser_extras.h" 25 #include "ir.h" 26 #include "ir_uniform.h" 27 #include "linker.h" 28 #include "main/macros.h" 29 30 namespace { 31 /* 32 * Atomic counter uniform as seen by the program. 33 */ 34 struct active_atomic_counter_uniform { 35 unsigned uniform_loc; 36 ir_variable *var; 37 }; 38 39 /* 40 * Atomic counter buffer referenced by the program. There is a one 41 * to one correspondence between these and the objects that can be 42 * queried using glGetActiveAtomicCounterBufferiv(). 43 */ 44 struct active_atomic_buffer { 45 active_atomic_buffer() 46 : uniforms(0), num_uniforms(0), stage_counter_references(), size(0) 47 {} 48 49 ~active_atomic_buffer() 50 { 51 free(uniforms); 52 } 53 54 void push_back(unsigned uniform_loc, ir_variable *var) 55 { 56 active_atomic_counter_uniform *new_uniforms; 57 58 new_uniforms = (active_atomic_counter_uniform *) 59 realloc(uniforms, sizeof(active_atomic_counter_uniform) * 60 (num_uniforms + 1)); 61 62 if (new_uniforms == NULL) { 63 _mesa_error_no_memory(__func__); 64 return; 65 } 66 67 uniforms = new_uniforms; 68 uniforms[num_uniforms].uniform_loc = uniform_loc; 69 uniforms[num_uniforms].var = var; 70 num_uniforms++; 71 } 72 73 active_atomic_counter_uniform *uniforms; 74 unsigned num_uniforms; 75 unsigned stage_counter_references[MESA_SHADER_STAGES]; 76 unsigned size; 77 }; 78 79 int 80 cmp_actives(const void *a, const void *b) 81 { 82 const active_atomic_counter_uniform *const first = (active_atomic_counter_uniform *) a; 83 const active_atomic_counter_uniform *const second = (active_atomic_counter_uniform *) b; 84 85 return int(first->var->data.offset) - int(second->var->data.offset); 86 } 87 88 bool 89 check_atomic_counters_overlap(const ir_variable *x, const ir_variable *y) 90 { 91 return ((x->data.offset >= y->data.offset && 92 x->data.offset < y->data.offset + y->type->atomic_size()) || 93 (y->data.offset >= x->data.offset && 94 y->data.offset < x->data.offset + x->type->atomic_size())); 95 } 96 97 void 98 process_atomic_variable(const glsl_type *t, struct gl_shader_program *prog, 99 unsigned *uniform_loc, ir_variable *var, 100 active_atomic_buffer *const buffers, 101 unsigned *num_buffers, int *offset, 102 const unsigned shader_stage) 103 { 104 /* FIXME: Arrays of arrays get counted separately. For example: 105 * x1[3][3][2] = 9 uniforms, 18 atomic counters 106 * x2[3][2] = 3 uniforms, 6 atomic counters 107 * x3[2] = 1 uniform, 2 atomic counters 108 * 109 * However this code marks all the counters as active even when they 110 * might not be used. 111 */ 112 if (t->is_array() && t->fields.array->is_array()) { 113 for (unsigned i = 0; i < t->length; i++) { 114 process_atomic_variable(t->fields.array, prog, uniform_loc, 115 var, buffers, num_buffers, offset, 116 shader_stage); 117 } 118 } else { 119 active_atomic_buffer *buf = &buffers[var->data.binding]; 120 gl_uniform_storage *const storage = 121 &prog->data->UniformStorage[*uniform_loc]; 122 123 /* If this is the first time the buffer is used, increment 124 * the counter of buffers used. 125 */ 126 if (buf->size == 0) 127 (*num_buffers)++; 128 129 buf->push_back(*uniform_loc, var); 130 131 /* When checking for atomic counters we should count every member in 132 * an array as an atomic counter reference. 133 */ 134 if (t->is_array()) 135 buf->stage_counter_references[shader_stage] += t->length; 136 else 137 buf->stage_counter_references[shader_stage]++; 138 buf->size = MAX2(buf->size, *offset + t->atomic_size()); 139 140 storage->offset = *offset; 141 *offset += t->atomic_size(); 142 143 (*uniform_loc)++; 144 } 145 } 146 147 active_atomic_buffer * 148 find_active_atomic_counters(struct gl_context *ctx, 149 struct gl_shader_program *prog, 150 unsigned *num_buffers) 151 { 152 active_atomic_buffer *const buffers = 153 new active_atomic_buffer[ctx->Const.MaxAtomicBufferBindings]; 154 155 *num_buffers = 0; 156 157 for (unsigned i = 0; i < MESA_SHADER_STAGES; ++i) { 158 struct gl_linked_shader *sh = prog->_LinkedShaders[i]; 159 if (sh == NULL) 160 continue; 161 162 foreach_in_list(ir_instruction, node, sh->ir) { 163 ir_variable *var = node->as_variable(); 164 165 if (var && var->type->contains_atomic()) { 166 int offset = var->data.offset; 167 unsigned uniform_loc = var->data.location; 168 process_atomic_variable(var->type, prog, &uniform_loc, 169 var, buffers, num_buffers, &offset, i); 170 } 171 } 172 } 173 174 for (unsigned i = 0; i < ctx->Const.MaxAtomicBufferBindings; i++) { 175 if (buffers[i].size == 0) 176 continue; 177 178 qsort(buffers[i].uniforms, buffers[i].num_uniforms, 179 sizeof(active_atomic_counter_uniform), 180 cmp_actives); 181 182 for (unsigned j = 1; j < buffers[i].num_uniforms; j++) { 183 /* If an overlapping counter found, it must be a reference to the 184 * same counter from a different shader stage. 185 */ 186 if (check_atomic_counters_overlap(buffers[i].uniforms[j-1].var, 187 buffers[i].uniforms[j].var) 188 && strcmp(buffers[i].uniforms[j-1].var->name, 189 buffers[i].uniforms[j].var->name) != 0) { 190 linker_error(prog, "Atomic counter %s declared at offset %d " 191 "which is already in use.", 192 buffers[i].uniforms[j].var->name, 193 buffers[i].uniforms[j].var->data.offset); 194 } 195 } 196 } 197 return buffers; 198 } 199 } 200 201 void 202 link_assign_atomic_counter_resources(struct gl_context *ctx, 203 struct gl_shader_program *prog) 204 { 205 unsigned num_buffers; 206 unsigned num_atomic_buffers[MESA_SHADER_STAGES] = {}; 207 active_atomic_buffer *abs = 208 find_active_atomic_counters(ctx, prog, &num_buffers); 209 210 prog->data->AtomicBuffers = rzalloc_array(prog->data, gl_active_atomic_buffer, 211 num_buffers); 212 prog->data->NumAtomicBuffers = num_buffers; 213 214 unsigned i = 0; 215 for (unsigned binding = 0; 216 binding < ctx->Const.MaxAtomicBufferBindings; 217 binding++) { 218 219 /* If the binding was not used, skip. 220 */ 221 if (abs[binding].size == 0) 222 continue; 223 224 active_atomic_buffer &ab = abs[binding]; 225 gl_active_atomic_buffer &mab = prog->data->AtomicBuffers[i]; 226 227 /* Assign buffer-specific fields. */ 228 mab.Binding = binding; 229 mab.MinimumSize = ab.size; 230 mab.Uniforms = rzalloc_array(prog->data->AtomicBuffers, GLuint, 231 ab.num_uniforms); 232 mab.NumUniforms = ab.num_uniforms; 233 234 /* Assign counter-specific fields. */ 235 for (unsigned j = 0; j < ab.num_uniforms; j++) { 236 ir_variable *const var = ab.uniforms[j].var; 237 gl_uniform_storage *const storage = 238 &prog->data->UniformStorage[ab.uniforms[j].uniform_loc]; 239 240 mab.Uniforms[j] = ab.uniforms[j].uniform_loc; 241 if (!var->data.explicit_binding) 242 var->data.binding = i; 243 244 storage->atomic_buffer_index = i; 245 storage->offset = var->data.offset; 246 storage->array_stride = (var->type->is_array() ? 247 var->type->without_array()->atomic_size() : 0); 248 if (!var->type->is_matrix()) 249 storage->matrix_stride = 0; 250 } 251 252 /* Assign stage-specific fields. */ 253 for (unsigned j = 0; j < MESA_SHADER_STAGES; ++j) { 254 if (ab.stage_counter_references[j]) { 255 mab.StageReferences[j] = GL_TRUE; 256 num_atomic_buffers[j]++; 257 } else { 258 mab.StageReferences[j] = GL_FALSE; 259 } 260 } 261 262 i++; 263 } 264 265 /* Store a list pointers to atomic buffers per stage and store the index 266 * to the intra-stage buffer list in uniform storage. 267 */ 268 for (unsigned j = 0; j < MESA_SHADER_STAGES; ++j) { 269 if (prog->_LinkedShaders[j] && num_atomic_buffers[j] > 0) { 270 struct gl_program *gl_prog = prog->_LinkedShaders[j]->Program; 271 gl_prog->info.num_abos = num_atomic_buffers[j]; 272 gl_prog->sh.AtomicBuffers = 273 rzalloc_array(gl_prog, gl_active_atomic_buffer *, 274 num_atomic_buffers[j]); 275 276 unsigned intra_stage_idx = 0; 277 for (unsigned i = 0; i < num_buffers; i++) { 278 struct gl_active_atomic_buffer *atomic_buffer = 279 &prog->data->AtomicBuffers[i]; 280 if (atomic_buffer->StageReferences[j]) { 281 gl_prog->sh.AtomicBuffers[intra_stage_idx] = atomic_buffer; 282 283 for (unsigned u = 0; u < atomic_buffer->NumUniforms; u++) { 284 prog->data->UniformStorage[atomic_buffer->Uniforms[u]].opaque[j].index = 285 intra_stage_idx; 286 prog->data->UniformStorage[atomic_buffer->Uniforms[u]].opaque[j].active = 287 true; 288 } 289 290 intra_stage_idx++; 291 } 292 } 293 } 294 } 295 296 delete [] abs; 297 assert(i == num_buffers); 298 } 299 300 void 301 link_check_atomic_counter_resources(struct gl_context *ctx, 302 struct gl_shader_program *prog) 303 { 304 unsigned num_buffers; 305 active_atomic_buffer *const abs = 306 find_active_atomic_counters(ctx, prog, &num_buffers); 307 unsigned atomic_counters[MESA_SHADER_STAGES] = {}; 308 unsigned atomic_buffers[MESA_SHADER_STAGES] = {}; 309 unsigned total_atomic_counters = 0; 310 unsigned total_atomic_buffers = 0; 311 312 /* Sum the required resources. Note that this counts buffers and 313 * counters referenced by several shader stages multiple times 314 * against the combined limit -- That's the behavior the spec 315 * requires. 316 */ 317 for (unsigned i = 0; i < ctx->Const.MaxAtomicBufferBindings; i++) { 318 if (abs[i].size == 0) 319 continue; 320 321 for (unsigned j = 0; j < MESA_SHADER_STAGES; ++j) { 322 const unsigned n = abs[i].stage_counter_references[j]; 323 324 if (n) { 325 atomic_counters[j] += n; 326 total_atomic_counters += n; 327 atomic_buffers[j]++; 328 total_atomic_buffers++; 329 } 330 } 331 } 332 333 /* Check that they are within the supported limits. */ 334 for (unsigned i = 0; i < MESA_SHADER_STAGES; i++) { 335 if (atomic_counters[i] > ctx->Const.Program[i].MaxAtomicCounters) 336 linker_error(prog, "Too many %s shader atomic counters", 337 _mesa_shader_stage_to_string(i)); 338 339 if (atomic_buffers[i] > ctx->Const.Program[i].MaxAtomicBuffers) 340 linker_error(prog, "Too many %s shader atomic counter buffers", 341 _mesa_shader_stage_to_string(i)); 342 } 343 344 if (total_atomic_counters > ctx->Const.MaxCombinedAtomicCounters) 345 linker_error(prog, "Too many combined atomic counters"); 346 347 if (total_atomic_buffers > ctx->Const.MaxCombinedAtomicBuffers) 348 linker_error(prog, "Too many combined atomic buffers"); 349 350 delete [] abs; 351 } 352