1 /**************************************************************************
2 *
3 * Copyright 2016 Samuel Pitoiset
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include "main/state.h"
29 #include "st_atom.h"
30 #include "st_context.h"
31 #include "st_cb_bitmap.h"
32 #include "st_cb_bufferobjects.h"
33 #include "st_cb_compute.h"
34 #include "st_util.h"
35
36 #include "pipe/p_context.h"
37
st_dispatch_compute_common(struct gl_context * ctx,const GLuint * num_groups,const GLuint * group_size,struct pipe_resource * indirect,GLintptr indirect_offset)38 static void st_dispatch_compute_common(struct gl_context *ctx,
39 const GLuint *num_groups,
40 const GLuint *group_size,
41 struct pipe_resource *indirect,
42 GLintptr indirect_offset)
43 {
44 struct gl_program *prog =
45 ctx->_Shader->CurrentProgram[MESA_SHADER_COMPUTE];
46 struct st_context *st = st_context(ctx);
47 struct pipe_context *pipe = st->pipe;
48 struct pipe_grid_info info = { 0 };
49
50 st_flush_bitmap_cache(st);
51 st_invalidate_readpix_cache(st);
52
53 if (ctx->NewState)
54 _mesa_update_state(ctx);
55
56 if ((st->dirty | ctx->NewDriverState) & st->active_states &
57 ST_PIPELINE_COMPUTE_STATE_MASK ||
58 st->compute_shader_may_be_dirty)
59 st_validate_state(st, ST_PIPELINE_COMPUTE);
60
61 for (unsigned i = 0; i < 3; i++) {
62 info.block[i] = group_size ? group_size[i] : prog->info.workgroup_size[i];
63 info.grid[i] = num_groups ? num_groups[i] : 0;
64 }
65
66 if (indirect) {
67 info.indirect = indirect;
68 info.indirect_offset = indirect_offset;
69 }
70
71 pipe->launch_grid(pipe, &info);
72 }
73
st_dispatch_compute(struct gl_context * ctx,const GLuint * num_groups)74 static void st_dispatch_compute(struct gl_context *ctx,
75 const GLuint *num_groups)
76 {
77 st_dispatch_compute_common(ctx, num_groups, NULL, NULL, 0);
78 }
79
st_dispatch_compute_indirect(struct gl_context * ctx,GLintptr indirect_offset)80 static void st_dispatch_compute_indirect(struct gl_context *ctx,
81 GLintptr indirect_offset)
82 {
83 struct gl_buffer_object *indirect_buffer = ctx->DispatchIndirectBuffer;
84 struct pipe_resource *indirect = st_buffer_object(indirect_buffer)->buffer;
85
86 st_dispatch_compute_common(ctx, NULL, NULL, indirect, indirect_offset);
87 }
88
st_dispatch_compute_group_size(struct gl_context * ctx,const GLuint * num_groups,const GLuint * group_size)89 static void st_dispatch_compute_group_size(struct gl_context *ctx,
90 const GLuint *num_groups,
91 const GLuint *group_size)
92 {
93 st_dispatch_compute_common(ctx, num_groups, group_size, NULL, 0);
94 }
95
st_init_compute_functions(struct dd_function_table * functions)96 void st_init_compute_functions(struct dd_function_table *functions)
97 {
98 functions->DispatchCompute = st_dispatch_compute;
99 functions->DispatchComputeIndirect = st_dispatch_compute_indirect;
100 functions->DispatchComputeGroupSize = st_dispatch_compute_group_size;
101 }
102