• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2016 Rob Clark <robclark@freedesktop.org>
3  * Copyright © 2018 Google, Inc.
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the "Software"),
7  * to deal in the Software without restriction, including without limitation
8  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9  * and/or sell copies of the Software, and to permit persons to whom the
10  * Software is furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice (including the next
13  * paragraph) shall be included in all copies or substantial portions of the
14  * Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22  * SOFTWARE.
23  *
24  * Authors:
25  *    Rob Clark <robclark@freedesktop.org>
26  */
27 
28 #define FD_BO_NO_HARDPIN 1
29 
30 #include "freedreno_query_acc.h"
31 #include "freedreno_state.h"
32 
33 #include "fd6_barrier.h"
34 #include "fd6_blend.h"
35 #include "fd6_blitter.h"
36 #include "fd6_compute.h"
37 #include "fd6_context.h"
38 #include "fd6_draw.h"
39 #include "fd6_emit.h"
40 #include "fd6_gmem.h"
41 #include "fd6_image.h"
42 #include "fd6_pack.h"
43 #include "fd6_program.h"
44 #include "fd6_query.h"
45 #include "fd6_rasterizer.h"
46 #include "fd6_resource.h"
47 #include "fd6_texture.h"
48 #include "fd6_zsa.h"
49 
50 static void
fd6_context_destroy(struct pipe_context * pctx)51 fd6_context_destroy(struct pipe_context *pctx) in_dt
52 {
53    struct fd6_context *fd6_ctx = fd6_context(fd_context(pctx));
54 
55    fd6_descriptor_set_invalidate(&fd6_ctx->cs_descriptor_set);
56    for (unsigned i = 0; i < ARRAY_SIZE(fd6_ctx->descriptor_sets); i++)
57       fd6_descriptor_set_invalidate(&fd6_ctx->descriptor_sets[i]);
58 
59    if (fd6_ctx->streamout_disable_stateobj)
60       fd_ringbuffer_del(fd6_ctx->streamout_disable_stateobj);
61 
62    if (fd6_ctx->sample_locations_disable_stateobj)
63       fd_ringbuffer_del(fd6_ctx->sample_locations_disable_stateobj);
64 
65    fd_context_destroy(pctx);
66 
67    if (fd6_ctx->vsc_draw_strm)
68       fd_bo_del(fd6_ctx->vsc_draw_strm);
69    if (fd6_ctx->vsc_prim_strm)
70       fd_bo_del(fd6_ctx->vsc_prim_strm);
71    fd_bo_del(fd6_ctx->control_mem);
72 
73    fd_context_cleanup_common_vbos(&fd6_ctx->base);
74 
75    fd6_texture_fini(pctx);
76 
77    free(fd6_ctx);
78 }
79 
80 static void *
fd6_vertex_state_create(struct pipe_context * pctx,unsigned num_elements,const struct pipe_vertex_element * elements)81 fd6_vertex_state_create(struct pipe_context *pctx, unsigned num_elements,
82                         const struct pipe_vertex_element *elements)
83 {
84    struct fd_context *ctx = fd_context(pctx);
85 
86    struct fd6_vertex_stateobj *state = CALLOC_STRUCT(fd6_vertex_stateobj);
87    memcpy(state->base.pipe, elements, sizeof(*elements) * num_elements);
88    state->base.num_elements = num_elements;
89    state->stateobj =
90       fd_ringbuffer_new_object(ctx->pipe, 4 * (num_elements * 4 + 1));
91    struct fd_ringbuffer *ring = state->stateobj;
92 
93    OUT_PKT4(ring, REG_A6XX_VFD_DECODE(0), 2 * num_elements);
94    for (int32_t i = 0; i < num_elements; i++) {
95       const struct pipe_vertex_element *elem = &elements[i];
96       enum pipe_format pfmt = (enum pipe_format)elem->src_format;
97       enum a6xx_format fmt = fd6_vertex_format(pfmt);
98       bool isint = util_format_is_pure_integer(pfmt);
99       assert(fmt != FMT6_NONE);
100 
101       OUT_RING(ring, A6XX_VFD_DECODE_INSTR_IDX(elem->vertex_buffer_index) |
102                         A6XX_VFD_DECODE_INSTR_OFFSET(elem->src_offset) |
103                         A6XX_VFD_DECODE_INSTR_FORMAT(fmt) |
104                         COND(elem->instance_divisor,
105                              A6XX_VFD_DECODE_INSTR_INSTANCED) |
106                         A6XX_VFD_DECODE_INSTR_SWAP(fd6_vertex_swap(pfmt)) |
107                         A6XX_VFD_DECODE_INSTR_UNK30 |
108                         COND(!isint, A6XX_VFD_DECODE_INSTR_FLOAT));
109       OUT_RING(ring,
110                MAX2(1, elem->instance_divisor)); /* VFD_DECODE[j].STEP_RATE */
111    }
112 
113    for (int32_t i = 0; i < num_elements; i++) {
114       const struct pipe_vertex_element *elem = &elements[i];
115 
116       OUT_PKT4(ring, REG_A6XX_VFD_FETCH_STRIDE(elem->vertex_buffer_index), 1);
117       OUT_RING(ring, elem->src_stride);
118    }
119 
120    return state;
121 }
122 
123 static void
fd6_vertex_state_delete(struct pipe_context * pctx,void * hwcso)124 fd6_vertex_state_delete(struct pipe_context *pctx, void *hwcso)
125 {
126    struct fd6_vertex_stateobj *so = (struct fd6_vertex_stateobj *)hwcso;
127 
128    fd_ringbuffer_del(so->stateobj);
129    FREE(hwcso);
130 }
131 
132 static void
validate_surface(struct pipe_context * pctx,struct pipe_surface * psurf)133 validate_surface(struct pipe_context *pctx, struct pipe_surface *psurf)
134    assert_dt
135 {
136    fd6_validate_format(fd_context(pctx), fd_resource(psurf->texture),
137                        psurf->format);
138 }
139 
140 static void
fd6_set_framebuffer_state(struct pipe_context * pctx,const struct pipe_framebuffer_state * pfb)141 fd6_set_framebuffer_state(struct pipe_context *pctx,
142                           const struct pipe_framebuffer_state *pfb)
143    in_dt
144 {
145    if (pfb->zsbuf)
146       validate_surface(pctx, pfb->zsbuf);
147 
148    for (unsigned i = 0; i < pfb->nr_cbufs; i++) {
149       if (!pfb->cbufs[i])
150          continue;
151       validate_surface(pctx, pfb->cbufs[i]);
152    }
153 
154    fd_set_framebuffer_state(pctx, pfb);
155 }
156 
157 
158 static void
setup_state_map(struct fd_context * ctx)159 setup_state_map(struct fd_context *ctx)
160 {
161    STATIC_ASSERT(FD6_GROUP_NON_GROUP < 32);
162 
163    fd_context_add_map(ctx, FD_DIRTY_VTXSTATE, BIT(FD6_GROUP_VTXSTATE));
164    fd_context_add_map(ctx, FD_DIRTY_VTXBUF, BIT(FD6_GROUP_VBO));
165    fd_context_add_map(ctx, FD_DIRTY_ZSA | FD_DIRTY_RASTERIZER,
166                       BIT(FD6_GROUP_ZSA));
167    fd_context_add_map(ctx, FD_DIRTY_ZSA | FD_DIRTY_BLEND | FD_DIRTY_PROG,
168                       BIT(FD6_GROUP_LRZ));
169    fd_context_add_map(ctx, FD_DIRTY_PROG | FD_DIRTY_RASTERIZER_CLIP_PLANE_ENABLE,
170                       BIT(FD6_GROUP_PROG) | BIT(FD6_GROUP_PROG_KEY));
171    fd_context_add_map(ctx, FD_DIRTY_RASTERIZER | FD_DIRTY_MIN_SAMPLES | FD_DIRTY_FRAMEBUFFER,
172                       BIT(FD6_GROUP_PROG_KEY));
173    fd_context_add_map(ctx, FD_DIRTY_RASTERIZER, BIT(FD6_GROUP_RASTERIZER));
174    fd_context_add_map(ctx,
175                       FD_DIRTY_FRAMEBUFFER | FD_DIRTY_RASTERIZER_DISCARD |
176                          FD_DIRTY_PROG | FD_DIRTY_BLEND_DUAL,
177                       BIT(FD6_GROUP_PROG_FB_RAST));
178    fd_context_add_map(ctx, FD_DIRTY_BLEND | FD_DIRTY_SAMPLE_MASK,
179                       BIT(FD6_GROUP_BLEND));
180    fd_context_add_map(ctx, FD_DIRTY_SAMPLE_LOCATIONS, BIT(FD6_GROUP_SAMPLE_LOCATIONS));
181    fd_context_add_map(ctx, FD_DIRTY_BLEND_COLOR, BIT(FD6_GROUP_BLEND_COLOR));
182    fd_context_add_map(ctx, FD_DIRTY_PROG | FD_DIRTY_CONST,
183                       BIT(FD6_GROUP_CONST));
184    fd_context_add_map(ctx, FD_DIRTY_STREAMOUT, BIT(FD6_GROUP_SO));
185    fd_context_add_map(ctx, FD_DIRTY_BLEND_COHERENT,
186       BIT(FD6_GROUP_PRIM_MODE_SYSMEM) | BIT(FD6_GROUP_PRIM_MODE_GMEM));
187 
188    fd_context_add_shader_map(ctx, PIPE_SHADER_VERTEX, FD_DIRTY_SHADER_TEX,
189                              BIT(FD6_GROUP_VS_TEX));
190    fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_CTRL, FD_DIRTY_SHADER_TEX,
191                              BIT(FD6_GROUP_HS_TEX));
192    fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_EVAL, FD_DIRTY_SHADER_TEX,
193                              BIT(FD6_GROUP_DS_TEX));
194    fd_context_add_shader_map(ctx, PIPE_SHADER_GEOMETRY, FD_DIRTY_SHADER_TEX,
195                              BIT(FD6_GROUP_GS_TEX));
196    fd_context_add_shader_map(ctx, PIPE_SHADER_FRAGMENT, FD_DIRTY_SHADER_TEX,
197                              BIT(FD6_GROUP_FS_TEX));
198    fd_context_add_shader_map(ctx, PIPE_SHADER_COMPUTE, FD_DIRTY_SHADER_TEX,
199                              BIT(FD6_GROUP_CS_TEX));
200 
201    fd_context_add_shader_map(ctx, PIPE_SHADER_VERTEX,
202                              FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
203                              BIT(FD6_GROUP_VS_BINDLESS));
204    fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_CTRL,
205                              FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
206                              BIT(FD6_GROUP_HS_BINDLESS));
207    fd_context_add_shader_map(ctx, PIPE_SHADER_TESS_EVAL,
208                              FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
209                              BIT(FD6_GROUP_DS_BINDLESS));
210    fd_context_add_shader_map(ctx, PIPE_SHADER_GEOMETRY,
211                              FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
212                              BIT(FD6_GROUP_GS_BINDLESS));
213    /* NOTE: FD6_GROUP_FS_BINDLESS has a weak dependency on the program
214     * state (ie. it needs to be re-generated with fb-read descriptor
215     * patched in) but this special case is handled in fd6_emit_3d_state()
216     */
217    fd_context_add_shader_map(ctx, PIPE_SHADER_FRAGMENT,
218                              FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
219                              BIT(FD6_GROUP_FS_BINDLESS));
220    fd_context_add_shader_map(ctx, PIPE_SHADER_COMPUTE,
221                              FD_DIRTY_SHADER_SSBO | FD_DIRTY_SHADER_IMAGE,
222                              BIT(FD6_GROUP_CS_BINDLESS));
223    fd_context_add_shader_map(ctx, PIPE_SHADER_FRAGMENT,
224                              FD_DIRTY_SHADER_PROG,
225                              BIT(FD6_GROUP_PRIM_MODE_SYSMEM) | BIT(FD6_GROUP_PRIM_MODE_GMEM));
226 
227    /* NOTE: scissor enabled bit is part of rasterizer state, but
228     * fd_rasterizer_state_bind() will mark scissor dirty if needed:
229     */
230    fd_context_add_map(ctx, FD_DIRTY_SCISSOR | FD_DIRTY_PROG,
231                       BIT(FD6_GROUP_SCISSOR));
232 
233    /* Stuff still emit in IB2
234     *
235     * NOTE: viewport state doesn't seem to change frequently, so possibly
236     * move it into FD6_GROUP_RASTERIZER?
237     */
238    fd_context_add_map(
239       ctx, FD_DIRTY_STENCIL_REF | FD_DIRTY_VIEWPORT | FD_DIRTY_RASTERIZER | FD_DIRTY_PROG,
240       BIT(FD6_GROUP_NON_GROUP));
241 }
242 
243 template <chip CHIP>
244 struct pipe_context *
fd6_context_create(struct pipe_screen * pscreen,void * priv,unsigned flags)245 fd6_context_create(struct pipe_screen *pscreen, void *priv,
246                    unsigned flags) disable_thread_safety_analysis
247 {
248    struct fd_screen *screen = fd_screen(pscreen);
249    struct fd6_context *fd6_ctx = CALLOC_STRUCT(fd6_context);
250    struct pipe_context *pctx;
251 
252    if (!fd6_ctx)
253       return NULL;
254 
255    pctx = &fd6_ctx->base.base;
256    pctx->screen = pscreen;
257 
258    fd6_ctx->base.flags = flags;
259    fd6_ctx->base.dev = fd_device_ref(screen->dev);
260    fd6_ctx->base.screen = fd_screen(pscreen);
261    fd6_ctx->base.last.key = &fd6_ctx->last_key;
262 
263    pctx->destroy = fd6_context_destroy;
264    pctx->create_blend_state = fd6_blend_state_create;
265    pctx->create_rasterizer_state = fd6_rasterizer_state_create;
266    pctx->create_depth_stencil_alpha_state = fd6_zsa_state_create;
267    pctx->create_vertex_elements_state = fd6_vertex_state_create;
268 
269    fd6_draw_init<CHIP>(pctx);
270    fd6_compute_init<CHIP>(pctx);
271    fd6_gmem_init<CHIP>(pctx);
272    fd6_texture_init(pctx);
273    fd6_prog_init<CHIP>(pctx);
274    fd6_query_context_init(pctx);
275 
276    setup_state_map(&fd6_ctx->base);
277 
278    pctx = fd_context_init(&fd6_ctx->base, pscreen, priv, flags);
279    if (!pctx) {
280       free(fd6_ctx);
281       return NULL;
282    }
283 
284    pctx->set_framebuffer_state = fd6_set_framebuffer_state;
285 
286    /* after fd_context_init() to override set_shader_images() */
287    fd6_image_init(pctx);
288 
289    /* after fd_context_init() to override memory_barrier/texture_barrier(): */
290    fd6_barrier_init(pctx);
291 
292    util_blitter_set_texture_multisample(fd6_ctx->base.blitter, true);
293 
294    pctx->delete_vertex_elements_state = fd6_vertex_state_delete;
295 
296    /* fd_context_init overwrites delete_rasterizer_state, so set this
297     * here. */
298    pctx->delete_rasterizer_state = fd6_rasterizer_state_delete;
299    pctx->delete_blend_state = fd6_blend_state_delete;
300    pctx->delete_depth_stencil_alpha_state = fd6_zsa_state_delete;
301 
302    /* initial sizes for VSC buffers (or rather the per-pipe sizes
303     * which is used to derive entire buffer size:
304     */
305    fd6_ctx->vsc_draw_strm_pitch = 0x440;
306    fd6_ctx->vsc_prim_strm_pitch = 0x1040;
307 
308    fd6_ctx->control_mem =
309       fd_bo_new(screen->dev, 0x1000, 0, "control");
310 
311    fd_context_add_private_bo(&fd6_ctx->base, fd6_ctx->control_mem);
312 
313    memset(fd_bo_map(fd6_ctx->control_mem), 0, sizeof(struct fd6_control));
314 
315    fd_context_setup_common_vbos(&fd6_ctx->base);
316 
317    fd6_blitter_init<CHIP>(pctx);
318 
319    struct fd_ringbuffer *ring =
320       fd_ringbuffer_new_object(fd6_ctx->base.pipe, 6 * 4);
321 
322    OUT_REG(ring, A6XX_GRAS_SAMPLE_CONFIG());
323    OUT_REG(ring, A6XX_RB_SAMPLE_CONFIG());
324    OUT_REG(ring, A6XX_SP_TP_SAMPLE_CONFIG());
325 
326    fd6_ctx->sample_locations_disable_stateobj = ring;
327 
328    return fd_context_init_tc(pctx, flags);
329 }
330 
331 /* Teach the compiler about needed variants: */
332 template struct pipe_context *fd6_context_create<A6XX>(struct pipe_screen *pscreen, void *priv, unsigned flags);
333 template struct pipe_context *fd6_context_create<A7XX>(struct pipe_screen *pscreen, void *priv, unsigned flags);
334