1 /*
2 * Copyright (C) 2016 Rob Clark <robclark@freedesktop.org>
3 * Copyright © 2018 Google, Inc.
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 * Authors:
25 * Rob Clark <robclark@freedesktop.org>
26 */
27
28 #define FD_BO_NO_HARDPIN 1
29
30 #include "freedreno_query_acc.h"
31 #include "freedreno_state.h"
32
33 #include "fd6_barrier.h"
34 #include "fd6_blend.h"
35 #include "fd6_blitter.h"
36 #include "fd6_compute.h"
37 #include "fd6_context.h"
38 #include "fd6_draw.h"
39 #include "fd6_emit.h"
40 #include "fd6_gmem.h"
41 #include "fd6_image.h"
42 #include "fd6_pack.h"
43 #include "fd6_program.h"
44 #include "fd6_query.h"
45 #include "fd6_rasterizer.h"
46 #include "fd6_resource.h"
47 #include "fd6_texture.h"
48 #include "fd6_zsa.h"
49
50 static void
fd6_context_destroy(struct pipe_context * pctx)51 fd6_context_destroy(struct pipe_context *pctx) in_dt
52 {
53 struct fd6_context *fd6_ctx = fd6_context(fd_context(pctx));
54
55 fd6_descriptor_set_invalidate(&fd6_ctx->cs_descriptor_set);
56 for (unsigned i = 0; i < ARRAY_SIZE(fd6_ctx->descriptor_sets); i++)
57 fd6_descriptor_set_invalidate(&fd6_ctx->descriptor_sets[i]);
58
59 if (fd6_ctx->streamout_disable_stateobj)
60 fd_ringbuffer_del(fd6_ctx->streamout_disable_stateobj);
61
62 if (fd6_ctx->sample_locations_disable_stateobj)
63 fd_ringbuffer_del(fd6_ctx->sample_locations_disable_stateobj);
64
65 fd_context_destroy(pctx);
66
67 if (fd6_ctx->vsc_draw_strm)
68 fd_bo_del(fd6_ctx->vsc_draw_strm);
69 if (fd6_ctx->vsc_prim_strm)
70 fd_bo_del(fd6_ctx->vsc_prim_strm);
71 fd_bo_del(fd6_ctx->control_mem);
72
73 fd_context_cleanup_common_vbos(&fd6_ctx->base);
74
75 fd6_texture_fini(pctx);
76
77 free(fd6_ctx);
78 }
79
80 static void *
fd6_vertex_state_create(struct pipe_context * pctx,unsigned num_elements,const struct pipe_vertex_element * elements)81 fd6_vertex_state_create(struct pipe_context *pctx, unsigned num_elements,
82 const struct pipe_vertex_element *elements)
83 {
84 struct fd_context *ctx = fd_context(pctx);
85
86 struct fd6_vertex_stateobj *state = CALLOC_STRUCT(fd6_vertex_stateobj);
87 memcpy(state->base.pipe, elements, sizeof(*elements) * num_elements);
88 state->base.num_elements = num_elements;
89 state->stateobj =
90 fd_ringbuffer_new_object(ctx->pipe, 4 * (num_elements * 4 + 1));
91 struct fd_ringbuffer *ring = state->stateobj;
92
93 OUT_PKT4(ring, REG_A6XX_VFD_DECODE(0), 2 * num_elements);
94 for (int32_t i = 0; i < num_elements; i++) {
95 const struct pipe_vertex_element *elem = &elements[i];
96 enum pipe_format pfmt = (enum pipe_format)elem->src_format;
97 enum a6xx_format fmt = fd6_vertex_format(pfmt);
98 bool isint = util_format_is_pure_integer(pfmt);
99 assert(fmt != FMT6_NONE);
100
101 OUT_RING(ring, A6XX_VFD_DECODE_INSTR_IDX(elem->vertex_buffer_index) |
102 A6XX_VFD_DECODE_INSTR_OFFSET(elem->src_offset) |
103 A6XX_VFD_DECODE_INSTR_FORMAT(fmt) |
104 COND(elem->instance_divisor,
105 A6XX_VFD_DECODE_INSTR_INSTANCED) |
106 A6XX_VFD_DECODE_INSTR_SWAP(fd6_vertex_swap(pfmt)) |
107 A6XX_VFD_DECODE_INSTR_UNK30 |
108 COND(!isint, A6XX_VFD_DECODE_INSTR_FLOAT));
109 OUT_RING(ring,
110 MAX2(1, elem->instance_divisor)); /* VFD_DECODE[j].STEP_RATE */
111 }
112
113 for (int32_t i = 0; i < num_elements; i++) {
114 const struct pipe_vertex_element *elem = &elements[i];
115
116 OUT_PKT4(ring, REG_A6XX_VFD_FETCH_STRIDE(elem->vertex_buffer_index), 1);
117 OUT_RING(ring, elem->src_stride);
118 }
119
120 return state;
121 }
122
123 static void
fd6_vertex_state_delete(struct pipe_context * pctx,void * hwcso)124 fd6_vertex_state_delete(struct pipe_context *pctx, void *hwcso)
125 {
126 struct fd6_vertex_stateobj *so = (struct fd6_vertex_stateobj *)hwcso;
127
128 fd_ringbuffer_del(so->stateobj);
129 FREE(hwcso);
130 }
131
132 static void
validate_surface(struct pipe_context * pctx,struct pipe_surface * psurf)133 validate_surface(struct pipe_context *pctx, struct pipe_surface *psurf)
134 assert_dt
135 {
136 fd6_validate_format(fd_context(pctx), fd_resource(psurf->texture),
137 psurf->format);
138 }
139
140 static void
fd6_set_framebuffer_state(struct pipe_context * pctx,const struct pipe_framebuffer_state * pfb)141 fd6_set_framebuffer_state(struct pipe_context *pctx,
142 const struct pipe_framebuffer_state *pfb)
143 in_dt
144 {
145 if (pfb->zsbuf)
146 validate_surface(pctx, pfb->zsbuf);
147
148 for (unsigned i = 0; i < pfb->nr_cbufs; i++) {
149 if (!pfb->cbufs[i])
150 continue;
151 validate_surface(pctx, pfb->cbufs[i]);
152 }
153
154 fd_set_framebuffer_state(pctx, pfb);
155 }
156
157
158 static void
setup_state_map(struct fd_context * ctx)159 setup_state_map(struct fd_context *ctx)
160 {
161 STATIC_ASSERT(FD6_GROUP_NON_GROUP < 32);
162
163 fd_context_add_map(ctx, FD_DIRTY_VTXSTATE, BIT(FD6_GROUP_VTXSTATE));
164 fd_context_add_map(ctx, FD_DIRTY_VTXBUF, BIT(FD6_GROUP_VBO));
165 fd_context_add_map(ctx, FD_DIRTY_ZSA | FD_DIRTY_RASTERIZER,
166 BIT(FD6_GROUP_ZSA));
167 fd_context_add_map(ctx, FD_DIRTY_ZSA | FD_DIRTY_BLEND | FD_DIRTY_PROG,
168 BIT(FD6_GROUP_LRZ));
169 fd_context_add_map(ctx, FD_DIRTY_PROG | FD_DIRTY_RASTERIZER_CLIP_PLANE_ENABLE,
170 BIT(FD6_GROUP_PROG) | BIT(FD6_GROUP_PROG_KEY));
171 fd_context_add_map(ctx, FD_DIRTY_RASTERIZER | FD_DIRTY_MIN_SAMPLES | FD_DIRTY_FRAMEBUFFER,
172 BIT(FD6_GROUP_PROG_KEY));
173 fd_context_add_map(ctx, FD_DIRTY_RASTERIZER, BIT(FD6_GROUP_RASTERIZER));
174 fd_context_add_map(ctx,
175 FD_DIRTY_FRAMEBUFFER | FD_DIRTY_RASTERIZER_DISCARD |
176 FD_DIRTY_PROG | FD_DIRTY_BLEND_DUAL,
177 BIT(FD6_GROUP_PROG_FB_RAST));
178 fd_context_add_map(ctx, FD_DIRTY_BLEND | FD_DIRTY_SAMPLE_MASK,
179 BIT(FD6_GROUP_BLEND));
180 fd_context_add_map(ctx, FD_DIRTY_SAMPLE_LOCATIONS, BIT(FD6_GROUP_SAMPLE_LOCATIONS));
181 fd_context_add_map(ctx, FD_DIRTY_BLEND_COLOR, BIT(FD6_GROUP_BLEND_COLOR));
182 fd_context_add_map(ctx, FD_DIRTY_PROG | FD_DIRTY_CONST,
183 BIT(FD6_GROUP_CONST));
184 fd_context_add_map(ctx, FD_DIRTY_STREAMOUT, BIT(FD6_GROUP_SO));
185 fd_context_add_map(ctx, FD_DIRTY_BLEND_COHERENT,
186 BIT(FD6_GROUP_PRIM_MODE_SYSMEM) | BIT(FD6_GROUP_PRIM_MODE_GMEM));
187
188 fd_context_add_shader_map(ctx, PIPE_SHADER_VERTEX, FD_DIRTY_SHADER_TEX,
189 BIT(FD6_GROUP_VS_TEX));
190 fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_CTRL, FD_DIRTY_SHADER_TEX,
191 BIT(FD6_GROUP_HS_TEX));
192 fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_EVAL, FD_DIRTY_SHADER_TEX,
193 BIT(FD6_GROUP_DS_TEX));
194 fd_context_add_shader_map(ctx, PIPE_SHADER_GEOMETRY, FD_DIRTY_SHADER_TEX,
195 BIT(FD6_GROUP_GS_TEX));
196 fd_context_add_shader_map(ctx, PIPE_SHADER_FRAGMENT, FD_DIRTY_SHADER_TEX,
197 BIT(FD6_GROUP_FS_TEX));
198 fd_context_add_shader_map(ctx, PIPE_SHADER_COMPUTE, FD_DIRTY_SHADER_TEX,
199 BIT(FD6_GROUP_CS_TEX));
200
201 fd_context_add_shader_map(ctx, PIPE_SHADER_VERTEX,
202 FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
203 BIT(FD6_GROUP_VS_BINDLESS));
204 fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_CTRL,
205 FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
206 BIT(FD6_GROUP_HS_BINDLESS));
207 fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_EVAL,
208 FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
209 BIT(FD6_GROUP_DS_BINDLESS));
210 fd_context_add_shader_map(ctx, PIPE_SHADER_GEOMETRY,
211 FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
212 BIT(FD6_GROUP_GS_BINDLESS));
213 /* NOTE: FD6_GROUP_FS_BINDLESS has a weak dependency on the program
214 * state (ie. it needs to be re-generated with fb-read descriptor
215 * patched in) but this special case is handled in fd6_emit_3d_state()
216 */
217 fd_context_add_shader_map(ctx, PIPE_SHADER_FRAGMENT,
218 FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
219 BIT(FD6_GROUP_FS_BINDLESS));
220 fd_context_add_shader_map(ctx, PIPE_SHADER_COMPUTE,
221 FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
222 BIT(FD6_GROUP_CS_BINDLESS));
223 fd_context_add_shader_map(ctx, PIPE_SHADER_FRAGMENT,
224 FD_DIRTY_SHADER_PROG,
225 BIT(FD6_GROUP_PRIM_MODE_SYSMEM) | BIT(FD6_GROUP_PRIM_MODE_GMEM));
226
227 /* NOTE: scissor enabled bit is part of rasterizer state, but
228 * fd_rasterizer_state_bind() will mark scissor dirty if needed:
229 */
230 fd_context_add_map(ctx, FD_DIRTY_SCISSOR | FD_DIRTY_PROG,
231 BIT(FD6_GROUP_SCISSOR));
232
233 /* Stuff still emit in IB2
234 *
235 * NOTE: viewport state doesn't seem to change frequently, so possibly
236 * move it into FD6_GROUP_RASTERIZER?
237 */
238 fd_context_add_map(
239 ctx, FD_DIRTY_STENCIL_REF | FD_DIRTY_VIEWPORT | FD_DIRTY_RASTERIZER | FD_DIRTY_PROG,
240 BIT(FD6_GROUP_NON_GROUP));
241 }
242
243 template <chip CHIP>
244 struct pipe_context *
fd6_context_create(struct pipe_screen * pscreen,void * priv,unsigned flags)245 fd6_context_create(struct pipe_screen *pscreen, void *priv,
246 unsigned flags) disable_thread_safety_analysis
247 {
248 struct fd_screen *screen = fd_screen(pscreen);
249 struct fd6_context *fd6_ctx = CALLOC_STRUCT(fd6_context);
250 struct pipe_context *pctx;
251
252 if (!fd6_ctx)
253 return NULL;
254
255 pctx = &fd6_ctx->base.base;
256 pctx->screen = pscreen;
257
258 fd6_ctx->base.flags = flags;
259 fd6_ctx->base.dev = fd_device_ref(screen->dev);
260 fd6_ctx->base.screen = fd_screen(pscreen);
261 fd6_ctx->base.last.key = &fd6_ctx->last_key;
262
263 pctx->destroy = fd6_context_destroy;
264 pctx->create_blend_state = fd6_blend_state_create;
265 pctx->create_rasterizer_state = fd6_rasterizer_state_create;
266 pctx->create_depth_stencil_alpha_state = fd6_zsa_state_create;
267 pctx->create_vertex_elements_state = fd6_vertex_state_create;
268
269 fd6_draw_init<CHIP>(pctx);
270 fd6_compute_init<CHIP>(pctx);
271 fd6_gmem_init<CHIP>(pctx);
272 fd6_texture_init(pctx);
273 fd6_prog_init<CHIP>(pctx);
274 fd6_query_context_init(pctx);
275
276 setup_state_map(&fd6_ctx->base);
277
278 pctx = fd_context_init(&fd6_ctx->base, pscreen, priv, flags);
279 if (!pctx) {
280 free(fd6_ctx);
281 return NULL;
282 }
283
284 pctx->set_framebuffer_state = fd6_set_framebuffer_state;
285
286 /* after fd_context_init() to override set_shader_images() */
287 fd6_image_init(pctx);
288
289 /* after fd_context_init() to override memory_barrier/texture_barrier(): */
290 fd6_barrier_init(pctx);
291
292 util_blitter_set_texture_multisample(fd6_ctx->base.blitter, true);
293
294 pctx->delete_vertex_elements_state = fd6_vertex_state_delete;
295
296 /* fd_context_init overwrites delete_rasterizer_state, so set this
297 * here. */
298 pctx->delete_rasterizer_state = fd6_rasterizer_state_delete;
299 pctx->delete_blend_state = fd6_blend_state_delete;
300 pctx->delete_depth_stencil_alpha_state = fd6_zsa_state_delete;
301
302 /* initial sizes for VSC buffers (or rather the per-pipe sizes
303 * which is used to derive entire buffer size:
304 */
305 fd6_ctx->vsc_draw_strm_pitch = 0x440;
306 fd6_ctx->vsc_prim_strm_pitch = 0x1040;
307
308 fd6_ctx->control_mem =
309 fd_bo_new(screen->dev, 0x1000, 0, "control");
310
311 fd_context_add_private_bo(&fd6_ctx->base, fd6_ctx->control_mem);
312
313 memset(fd_bo_map(fd6_ctx->control_mem), 0, sizeof(struct fd6_control));
314
315 fd_context_setup_common_vbos(&fd6_ctx->base);
316
317 fd6_blitter_init<CHIP>(pctx);
318
319 struct fd_ringbuffer *ring =
320 fd_ringbuffer_new_object(fd6_ctx->base.pipe, 6 * 4);
321
322 OUT_REG(ring, A6XX_GRAS_SAMPLE_CONFIG());
323 OUT_REG(ring, A6XX_RB_SAMPLE_CONFIG());
324 OUT_REG(ring, A6XX_SP_TP_SAMPLE_CONFIG());
325
326 fd6_ctx->sample_locations_disable_stateobj = ring;
327
328 return fd_context_init_tc(pctx, flags);
329 }
330
331 /* Teach the compiler about needed variants: */
332 template struct pipe_context *fd6_context_create<A6XX>(struct pipe_screen *pscreen, void *priv, unsigned flags);
333 template struct pipe_context *fd6_context_create<A7XX>(struct pipe_screen *pscreen, void *priv, unsigned flags);
334