1 /*
2 * Copyright © 2018 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "nir.h"
25 #include "linker_util.h"
26 #include "gl_nir_linker.h"
27 #include "compiler/glsl/ir_uniform.h" /* for gl_uniform_storage */
28 #include "main/context.h"
29
/**
 * This file does the common linking of GLSL atomic counter uniforms using
 * NIR, instead of GLSL IR as its counterpart glsl/link_uniforms.cpp does.
 */
34
35 struct active_atomic_counter_uniform {
36 unsigned loc;
37 nir_variable *var;
38 };
39
40 struct active_atomic_buffer {
41 struct active_atomic_counter_uniform *uniforms;
42 unsigned num_uniforms;
43 unsigned uniform_buffer_size;
44 unsigned stage_counter_references[MESA_SHADER_STAGES];
45 unsigned size;
46 };
47
48 static void
add_atomic_counter(const void * ctx,struct active_atomic_buffer * buffer,unsigned uniform_loc,nir_variable * var)49 add_atomic_counter(const void *ctx,
50 struct active_atomic_buffer *buffer,
51 unsigned uniform_loc,
52 nir_variable *var)
53 {
54 if (buffer->num_uniforms >= buffer->uniform_buffer_size) {
55 if (buffer->uniform_buffer_size == 0)
56 buffer->uniform_buffer_size = 1;
57 else
58 buffer->uniform_buffer_size *= 2;
59 buffer->uniforms = reralloc(ctx,
60 buffer->uniforms,
61 struct active_atomic_counter_uniform,
62 buffer->uniform_buffer_size);
63 }
64
65 struct active_atomic_counter_uniform *uniform =
66 buffer->uniforms + buffer->num_uniforms;
67 uniform->loc = uniform_loc;
68 uniform->var = var;
69 buffer->num_uniforms++;
70 }
71
72 static void
process_atomic_variable(const struct glsl_type * t,struct gl_shader_program * prog,unsigned * uniform_loc,nir_variable * var,struct active_atomic_buffer * buffers,unsigned * num_buffers,int * offset,unsigned shader_stage)73 process_atomic_variable(const struct glsl_type *t,
74 struct gl_shader_program *prog,
75 unsigned *uniform_loc,
76 nir_variable *var,
77 struct active_atomic_buffer *buffers,
78 unsigned *num_buffers,
79 int *offset,
80 unsigned shader_stage)
81 {
82 /* FIXME: Arrays of arrays get counted separately. For example:
83 * x1[3][3][2] = 9 uniforms, 18 atomic counters
84 * x2[3][2] = 3 uniforms, 6 atomic counters
85 * x3[2] = 1 uniform, 2 atomic counters
86 *
87 * However this code marks all the counters as active even when they
88 * might not be used.
89 */
90 if (glsl_type_is_array(t) &&
91 glsl_type_is_array(glsl_get_array_element(t))) {
92 for (unsigned i = 0; i < glsl_get_length(t); i++) {
93 process_atomic_variable(glsl_get_array_element(t),
94 prog,
95 uniform_loc,
96 var,
97 buffers, num_buffers,
98 offset,
99 shader_stage);
100 }
101 } else {
102 struct active_atomic_buffer *buf = buffers + var->data.binding;
103 struct gl_uniform_storage *const storage =
104 &prog->data->UniformStorage[*uniform_loc];
105
106 /* If this is the first time the buffer is used, increment
107 * the counter of buffers used.
108 */
109 if (buf->size == 0)
110 (*num_buffers)++;
111
112 add_atomic_counter(buffers, /* ctx */
113 buf,
114 *uniform_loc,
115 var);
116
117 /* When checking for atomic counters we should count every member in
118 * an array as an atomic counter reference.
119 */
120 if (glsl_type_is_array(t))
121 buf->stage_counter_references[shader_stage] += glsl_get_length(t);
122 else
123 buf->stage_counter_references[shader_stage]++;
124 buf->size = MAX2(buf->size, *offset + glsl_atomic_size(t));
125
126 storage->offset = *offset;
127 *offset += glsl_atomic_size(t);
128
129 (*uniform_loc)++;
130 }
131 }
132
133 static struct active_atomic_buffer *
find_active_atomic_counters(struct gl_context * ctx,struct gl_shader_program * prog,unsigned * num_buffers)134 find_active_atomic_counters(struct gl_context *ctx,
135 struct gl_shader_program *prog,
136 unsigned *num_buffers)
137 {
138 struct active_atomic_buffer *buffers =
139 rzalloc_array(NULL, /* ctx */
140 struct active_atomic_buffer,
141 ctx->Const.MaxAtomicBufferBindings);
142 *num_buffers = 0;
143
144 for (unsigned i = 0; i < MESA_SHADER_STAGES; ++i) {
145 struct gl_linked_shader *sh = prog->_LinkedShaders[i];
146 if (sh == NULL)
147 continue;
148
149 nir_shader *nir = sh->Program->nir;
150
151 nir_foreach_uniform_variable(var, nir) {
152 if (!glsl_contains_atomic(var->type))
153 continue;
154
155 int offset = var->data.offset;
156 unsigned uniform_loc = var->data.location;
157
158 process_atomic_variable(var->type,
159 prog,
160 &uniform_loc,
161 var,
162 buffers,
163 num_buffers,
164 &offset,
165 i);
166 }
167 }
168
169 return buffers;
170 }
171
172 static bool
check_atomic_counters_overlap(const nir_variable * x,const nir_variable * y)173 check_atomic_counters_overlap(const nir_variable *x, const nir_variable *y)
174 {
175 return ((x->data.offset >= y->data.offset &&
176 x->data.offset < y->data.offset + glsl_atomic_size(y->type)) ||
177 (y->data.offset >= x->data.offset &&
178 y->data.offset < x->data.offset + glsl_atomic_size(x->type)));
179 }
180
181 static int
cmp_active_counter_offsets(const void * a,const void * b)182 cmp_active_counter_offsets(const void *a, const void *b)
183 {
184 const struct active_atomic_counter_uniform *const first =
185 (struct active_atomic_counter_uniform *) a;
186 const struct active_atomic_counter_uniform *const second =
187 (struct active_atomic_counter_uniform *) b;
188
189 return first->var->data.offset - second->var->data.offset;
190 }
191
192 void
gl_nir_link_assign_atomic_counter_resources(struct gl_context * ctx,struct gl_shader_program * prog)193 gl_nir_link_assign_atomic_counter_resources(struct gl_context *ctx,
194 struct gl_shader_program *prog)
195 {
196 unsigned num_buffers;
197 unsigned num_atomic_buffers[MESA_SHADER_STAGES] = {0};
198 struct active_atomic_buffer *abs =
199 find_active_atomic_counters(ctx, prog, &num_buffers);
200
201 prog->data->AtomicBuffers =
202 rzalloc_array(prog->data, struct gl_active_atomic_buffer, num_buffers);
203 prog->data->NumAtomicBuffers = num_buffers;
204
205 unsigned buffer_idx = 0;
206 for (unsigned binding = 0;
207 binding < ctx->Const.MaxAtomicBufferBindings;
208 binding++) {
209
210 /* If the binding was not used, skip.
211 */
212 if (abs[binding].size == 0)
213 continue;
214
215 struct active_atomic_buffer *ab = abs + binding;
216 struct gl_active_atomic_buffer *mab =
217 prog->data->AtomicBuffers + buffer_idx;
218
219 /* Assign buffer-specific fields. */
220 mab->Binding = binding;
221 mab->MinimumSize = ab->size;
222 mab->Uniforms = rzalloc_array(prog->data->AtomicBuffers, GLuint,
223 ab->num_uniforms);
224 mab->NumUniforms = ab->num_uniforms;
225
226 /* Assign counter-specific fields. */
227 for (unsigned j = 0; j < ab->num_uniforms; j++) {
228 nir_variable *var = ab->uniforms[j].var;
229 struct gl_uniform_storage *storage =
230 &prog->data->UniformStorage[ab->uniforms[j].loc];
231
232 mab->Uniforms[j] = ab->uniforms[j].loc;
233
234 storage->atomic_buffer_index = buffer_idx;
235 storage->offset = var->data.offset;
236 if (glsl_type_is_array(var->type)) {
237 const struct glsl_type *without_array =
238 glsl_without_array(var->type);
239 storage->array_stride = glsl_atomic_size(without_array);
240 } else {
241 storage->array_stride = 0;
242 }
243 if (!glsl_type_is_matrix(var->type))
244 storage->matrix_stride = 0;
245 }
246
247 /* Assign stage-specific fields. */
248 for (unsigned stage = 0; stage < MESA_SHADER_STAGES; ++stage) {
249 if (ab->stage_counter_references[stage]) {
250 mab->StageReferences[stage] = GL_TRUE;
251 num_atomic_buffers[stage]++;
252 } else {
253 mab->StageReferences[stage] = GL_FALSE;
254 }
255 }
256
257 buffer_idx++;
258 }
259
260 /* Store a list pointers to atomic buffers per stage and store the index
261 * to the intra-stage buffer list in uniform storage.
262 */
263 for (unsigned stage = 0; stage < MESA_SHADER_STAGES; ++stage) {
264 if (prog->_LinkedShaders[stage] == NULL ||
265 num_atomic_buffers[stage] <= 0)
266 continue;
267
268 struct gl_program *gl_prog = prog->_LinkedShaders[stage]->Program;
269 gl_prog->info.num_abos = num_atomic_buffers[stage];
270 gl_prog->sh.AtomicBuffers =
271 rzalloc_array(gl_prog,
272 struct gl_active_atomic_buffer *,
273 num_atomic_buffers[stage]);
274
275 gl_prog->nir->info.num_abos = num_atomic_buffers[stage];
276
277 unsigned intra_stage_idx = 0;
278 for (unsigned i = 0; i < num_buffers; i++) {
279 struct gl_active_atomic_buffer *atomic_buffer =
280 &prog->data->AtomicBuffers[i];
281 if (!atomic_buffer->StageReferences[stage])
282 continue;
283
284 gl_prog->sh.AtomicBuffers[intra_stage_idx] = atomic_buffer;
285
286 for (unsigned u = 0; u < atomic_buffer->NumUniforms; u++) {
287 GLuint uniform_loc = atomic_buffer->Uniforms[u];
288 struct gl_opaque_uniform_index *opaque =
289 prog->data->UniformStorage[uniform_loc].opaque + stage;
290 opaque->index = intra_stage_idx;
291 opaque->active = true;
292 }
293
294 intra_stage_idx++;
295 }
296 }
297
298 assert(buffer_idx == num_buffers);
299
300 ralloc_free(abs);
301 }
302
303 void
gl_nir_link_check_atomic_counter_resources(struct gl_context * ctx,struct gl_shader_program * prog)304 gl_nir_link_check_atomic_counter_resources(struct gl_context *ctx,
305 struct gl_shader_program *prog)
306 {
307 unsigned num_buffers;
308 struct active_atomic_buffer *abs =
309 find_active_atomic_counters(ctx, prog, &num_buffers);
310 unsigned atomic_counters[MESA_SHADER_STAGES] = {0};
311 unsigned atomic_buffers[MESA_SHADER_STAGES] = {0};
312 unsigned total_atomic_counters = 0;
313 unsigned total_atomic_buffers = 0;
314
315 /* Sum the required resources. Note that this counts buffers and
316 * counters referenced by several shader stages multiple times
317 * against the combined limit -- That's the behavior the spec
318 * requires.
319 */
320 for (unsigned i = 0; i < ctx->Const.MaxAtomicBufferBindings; i++) {
321 if (abs[i].size == 0)
322 continue;
323
324 qsort(abs[i].uniforms, abs[i].num_uniforms,
325 sizeof(struct active_atomic_counter_uniform),
326 cmp_active_counter_offsets);
327
328 for (unsigned j = 1; j < abs[i].num_uniforms; j++) {
329 /* If an overlapping counter found, it must be a reference to the
330 * same counter from a different shader stage.
331 */
332 if (check_atomic_counters_overlap(abs[i].uniforms[j-1].var,
333 abs[i].uniforms[j].var)
334 && strcmp(abs[i].uniforms[j-1].var->name,
335 abs[i].uniforms[j].var->name) != 0) {
336 linker_error(prog, "Atomic counter %s declared at offset %d "
337 "which is already in use.",
338 abs[i].uniforms[j].var->name,
339 abs[i].uniforms[j].var->data.offset);
340 }
341 }
342
343 for (unsigned j = 0; j < MESA_SHADER_STAGES; ++j) {
344 const unsigned n = abs[i].stage_counter_references[j];
345
346 if (n) {
347 atomic_counters[j] += n;
348 total_atomic_counters += n;
349 atomic_buffers[j]++;
350 total_atomic_buffers++;
351 }
352 }
353 }
354
355 /* Check that they are within the supported limits. */
356 for (unsigned i = 0; i < MESA_SHADER_STAGES; i++) {
357 if (atomic_counters[i] > ctx->Const.Program[i].MaxAtomicCounters)
358 linker_error(prog, "Too many %s shader atomic counters",
359 _mesa_shader_stage_to_string(i));
360
361 if (atomic_buffers[i] > ctx->Const.Program[i].MaxAtomicBuffers)
362 linker_error(prog, "Too many %s shader atomic counter buffers",
363 _mesa_shader_stage_to_string(i));
364 }
365
366 if (total_atomic_counters > ctx->Const.MaxCombinedAtomicCounters)
367 linker_error(prog, "Too many combined atomic counters");
368
369 if (total_atomic_buffers > ctx->Const.MaxCombinedAtomicBuffers)
370 linker_error(prog, "Too many combined atomic buffers");
371
372 ralloc_free(abs);
373 }
374