1 /* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */
2
3 /*
4 * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the "Software"),
8 * to deal in the Software without restriction, including without limitation
9 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
10 * and/or sell copies of the Software, and to permit persons to whom the
11 * Software is furnished to do so, subject to the following conditions:
12 *
13 * The above copyright notice and this permission notice (including the next
14 * paragraph) shall be included in all copies or substantial portions of the
15 * Software.
16 *
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
18 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
19 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
20 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
21 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
22 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23 * SOFTWARE.
24 *
25 * Authors:
26 * Rob Clark <robclark@freedesktop.org>
27 */
28
29 #include "freedreno_context.h"
30 #include "freedreno_blitter.h"
31 #include "freedreno_draw.h"
32 #include "freedreno_fence.h"
33 #include "freedreno_program.h"
34 #include "freedreno_resource.h"
35 #include "freedreno_texture.h"
36 #include "freedreno_state.h"
37 #include "freedreno_gmem.h"
38 #include "freedreno_query.h"
39 #include "freedreno_query_hw.h"
40 #include "freedreno_util.h"
41 #include "util/u_upload_mgr.h"
42
43 static void
fd_context_flush(struct pipe_context * pctx,struct pipe_fence_handle ** fencep,unsigned flags)44 fd_context_flush(struct pipe_context *pctx, struct pipe_fence_handle **fencep,
45 unsigned flags)
46 {
47 struct fd_context *ctx = fd_context(pctx);
48 struct pipe_fence_handle *fence = NULL;
49
50 /* Take a ref to the batch's fence (batch can be unref'd when flushed: */
51 fd_fence_ref(pctx->screen, &fence, ctx->batch->fence);
52
53 if (flags & PIPE_FLUSH_FENCE_FD)
54 ctx->batch->needs_out_fence_fd = true;
55
56 if (!ctx->screen->reorder) {
57 fd_batch_flush(ctx->batch, true, false);
58 } else if (flags & PIPE_FLUSH_DEFERRED) {
59 fd_bc_flush_deferred(&ctx->screen->batch_cache, ctx);
60 } else {
61 fd_bc_flush(&ctx->screen->batch_cache, ctx);
62 }
63
64 if (fencep)
65 fd_fence_ref(pctx->screen, fencep, fence);
66
67 fd_fence_ref(pctx->screen, &fence, NULL);
68 }
69
70 static void
fd_texture_barrier(struct pipe_context * pctx,unsigned flags)71 fd_texture_barrier(struct pipe_context *pctx, unsigned flags)
72 {
73 /* On devices that could sample from GMEM we could possibly do better.
74 * Or if we knew that we were doing GMEM bypass we could just emit a
75 * cache flush, perhaps? But we don't know if future draws would cause
76 * us to use GMEM, and a flush in bypass isn't the end of the world.
77 */
78 fd_context_flush(pctx, NULL, 0);
79 }
80
81 /**
82 * emit marker string as payload of a no-op packet, which can be
83 * decoded by cffdump.
84 */
85 static void
fd_emit_string_marker(struct pipe_context * pctx,const char * string,int len)86 fd_emit_string_marker(struct pipe_context *pctx, const char *string, int len)
87 {
88 struct fd_context *ctx = fd_context(pctx);
89 struct fd_ringbuffer *ring;
90 const uint32_t *buf = (const void *)string;
91
92 if (!ctx->batch)
93 return;
94
95 ring = ctx->batch->draw;
96
97 /* max packet size is 0x3fff dwords: */
98 len = MIN2(len, 0x3fff * 4);
99
100 if (ctx->screen->gpu_id >= 500)
101 OUT_PKT7(ring, CP_NOP, align(len, 4) / 4);
102 else
103 OUT_PKT3(ring, CP_NOP, align(len, 4) / 4);
104 while (len >= 4) {
105 OUT_RING(ring, *buf);
106 buf++;
107 len -= 4;
108 }
109
110 /* copy remainder bytes without reading past end of input string: */
111 if (len > 0) {
112 uint32_t w = 0;
113 memcpy(&w, buf, len);
114 OUT_RING(ring, w);
115 }
116 }
117
118 void
fd_context_destroy(struct pipe_context * pctx)119 fd_context_destroy(struct pipe_context *pctx)
120 {
121 struct fd_context *ctx = fd_context(pctx);
122 unsigned i;
123
124 DBG("");
125
126 if (ctx->screen->reorder && util_queue_is_initialized(&ctx->flush_queue))
127 util_queue_destroy(&ctx->flush_queue);
128
129 fd_batch_reference(&ctx->batch, NULL); /* unref current batch */
130 fd_bc_invalidate_context(ctx);
131
132 fd_prog_fini(pctx);
133
134 if (ctx->blitter)
135 util_blitter_destroy(ctx->blitter);
136
137 if (pctx->stream_uploader)
138 u_upload_destroy(pctx->stream_uploader);
139
140 if (ctx->clear_rs_state)
141 pctx->delete_rasterizer_state(pctx, ctx->clear_rs_state);
142
143 if (ctx->primconvert)
144 util_primconvert_destroy(ctx->primconvert);
145
146 slab_destroy_child(&ctx->transfer_pool);
147
148 for (i = 0; i < ARRAY_SIZE(ctx->vsc_pipe); i++) {
149 struct fd_vsc_pipe *pipe = &ctx->vsc_pipe[i];
150 if (!pipe->bo)
151 break;
152 fd_bo_del(pipe->bo);
153 }
154
155 fd_device_del(ctx->dev);
156 fd_pipe_del(ctx->pipe);
157
158 if (fd_mesa_debug & (FD_DBG_BSTAT | FD_DBG_MSGS)) {
159 printf("batch_total=%u, batch_sysmem=%u, batch_gmem=%u, batch_nondraw=%u, batch_restore=%u\n",
160 (uint32_t)ctx->stats.batch_total, (uint32_t)ctx->stats.batch_sysmem,
161 (uint32_t)ctx->stats.batch_gmem, (uint32_t)ctx->stats.batch_nondraw,
162 (uint32_t)ctx->stats.batch_restore);
163 }
164
165 FREE(ctx);
166 }
167
168 static void
fd_set_debug_callback(struct pipe_context * pctx,const struct pipe_debug_callback * cb)169 fd_set_debug_callback(struct pipe_context *pctx,
170 const struct pipe_debug_callback *cb)
171 {
172 struct fd_context *ctx = fd_context(pctx);
173
174 if (cb)
175 ctx->debug = *cb;
176 else
177 memset(&ctx->debug, 0, sizeof(ctx->debug));
178 }
179
180 /* TODO we could combine a few of these small buffers (solid_vbuf,
181 * blit_texcoord_vbuf, and vsc_size_mem, into a single buffer and
182 * save a tiny bit of memory
183 */
184
185 static struct pipe_resource *
create_solid_vertexbuf(struct pipe_context * pctx)186 create_solid_vertexbuf(struct pipe_context *pctx)
187 {
188 static const float init_shader_const[] = {
189 -1.000000, +1.000000, +1.000000,
190 +1.000000, -1.000000, +1.000000,
191 };
192 struct pipe_resource *prsc = pipe_buffer_create(pctx->screen,
193 PIPE_BIND_CUSTOM, PIPE_USAGE_IMMUTABLE, sizeof(init_shader_const));
194 pipe_buffer_write(pctx, prsc, 0,
195 sizeof(init_shader_const), init_shader_const);
196 return prsc;
197 }
198
199 static struct pipe_resource *
create_blit_texcoord_vertexbuf(struct pipe_context * pctx)200 create_blit_texcoord_vertexbuf(struct pipe_context *pctx)
201 {
202 struct pipe_resource *prsc = pipe_buffer_create(pctx->screen,
203 PIPE_BIND_CUSTOM, PIPE_USAGE_DYNAMIC, 16);
204 return prsc;
205 }
206
207 void
fd_context_setup_common_vbos(struct fd_context * ctx)208 fd_context_setup_common_vbos(struct fd_context *ctx)
209 {
210 struct pipe_context *pctx = &ctx->base;
211
212 ctx->solid_vbuf = create_solid_vertexbuf(pctx);
213 ctx->blit_texcoord_vbuf = create_blit_texcoord_vertexbuf(pctx);
214
215 /* setup solid_vbuf_state: */
216 ctx->solid_vbuf_state.vtx = pctx->create_vertex_elements_state(
217 pctx, 1, (struct pipe_vertex_element[]){{
218 .vertex_buffer_index = 0,
219 .src_offset = 0,
220 .src_format = PIPE_FORMAT_R32G32B32_FLOAT,
221 }});
222 ctx->solid_vbuf_state.vertexbuf.count = 1;
223 ctx->solid_vbuf_state.vertexbuf.vb[0].stride = 12;
224 ctx->solid_vbuf_state.vertexbuf.vb[0].buffer.resource = ctx->solid_vbuf;
225
226 /* setup blit_vbuf_state: */
227 ctx->blit_vbuf_state.vtx = pctx->create_vertex_elements_state(
228 pctx, 2, (struct pipe_vertex_element[]){{
229 .vertex_buffer_index = 0,
230 .src_offset = 0,
231 .src_format = PIPE_FORMAT_R32G32_FLOAT,
232 }, {
233 .vertex_buffer_index = 1,
234 .src_offset = 0,
235 .src_format = PIPE_FORMAT_R32G32B32_FLOAT,
236 }});
237 ctx->blit_vbuf_state.vertexbuf.count = 2;
238 ctx->blit_vbuf_state.vertexbuf.vb[0].stride = 8;
239 ctx->blit_vbuf_state.vertexbuf.vb[0].buffer.resource = ctx->blit_texcoord_vbuf;
240 ctx->blit_vbuf_state.vertexbuf.vb[1].stride = 12;
241 ctx->blit_vbuf_state.vertexbuf.vb[1].buffer.resource = ctx->solid_vbuf;
242 }
243
244 void
fd_context_cleanup_common_vbos(struct fd_context * ctx)245 fd_context_cleanup_common_vbos(struct fd_context *ctx)
246 {
247 struct pipe_context *pctx = &ctx->base;
248
249 pctx->delete_vertex_elements_state(pctx, ctx->solid_vbuf_state.vtx);
250 pctx->delete_vertex_elements_state(pctx, ctx->blit_vbuf_state.vtx);
251
252 pipe_resource_reference(&ctx->solid_vbuf, NULL);
253 pipe_resource_reference(&ctx->blit_texcoord_vbuf, NULL);
254 }
255
256 struct pipe_context *
fd_context_init(struct fd_context * ctx,struct pipe_screen * pscreen,const uint8_t * primtypes,void * priv,unsigned flags)257 fd_context_init(struct fd_context *ctx, struct pipe_screen *pscreen,
258 const uint8_t *primtypes, void *priv, unsigned flags)
259 {
260 struct fd_screen *screen = fd_screen(pscreen);
261 struct pipe_context *pctx;
262 unsigned prio = 1;
263 int i;
264
265 /* lower numerical value == higher priority: */
266 if (fd_mesa_debug & FD_DBG_HIPRIO)
267 prio = 0;
268 else if (flags & PIPE_CONTEXT_HIGH_PRIORITY)
269 prio = 0;
270 else if (flags & PIPE_CONTEXT_LOW_PRIORITY)
271 prio = 2;
272
273 ctx->screen = screen;
274 ctx->pipe = fd_pipe_new2(screen->dev, FD_PIPE_3D, prio);
275
276 ctx->primtypes = primtypes;
277 ctx->primtype_mask = 0;
278 for (i = 0; i < PIPE_PRIM_MAX; i++)
279 if (primtypes[i])
280 ctx->primtype_mask |= (1 << i);
281
282 /* need some sane default in case state tracker doesn't
283 * set some state:
284 */
285 ctx->sample_mask = 0xffff;
286
287 pctx = &ctx->base;
288 pctx->screen = pscreen;
289 pctx->priv = priv;
290 pctx->flush = fd_context_flush;
291 pctx->emit_string_marker = fd_emit_string_marker;
292 pctx->set_debug_callback = fd_set_debug_callback;
293 pctx->create_fence_fd = fd_create_fence_fd;
294 pctx->fence_server_sync = fd_fence_server_sync;
295 pctx->texture_barrier = fd_texture_barrier;
296
297 pctx->stream_uploader = u_upload_create_default(pctx);
298 if (!pctx->stream_uploader)
299 goto fail;
300 pctx->const_uploader = pctx->stream_uploader;
301
302 ctx->batch = fd_bc_alloc_batch(&screen->batch_cache, ctx);
303
304 slab_create_child(&ctx->transfer_pool, &screen->transfer_pool);
305
306 if (!ctx->blit)
307 ctx->blit = fd_blitter_blit;
308
309 fd_draw_init(pctx);
310 fd_resource_context_init(pctx);
311 fd_query_context_init(pctx);
312 fd_texture_init(pctx);
313 fd_state_init(pctx);
314
315 ctx->blitter = util_blitter_create(pctx);
316 if (!ctx->blitter)
317 goto fail;
318
319 ctx->primconvert = util_primconvert_create(pctx, ctx->primtype_mask);
320 if (!ctx->primconvert)
321 goto fail;
322
323 list_inithead(&ctx->hw_active_queries);
324 list_inithead(&ctx->acc_active_queries);
325
326 return pctx;
327
328 fail:
329 pctx->destroy(pctx);
330 return NULL;
331 }
332