1 /**************************************************************************
2 *
3 * Copyright 2007 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * Tiling engine.
30 *
31 * Builds per-tile display lists and executes them on calls to
32 * lp_setup_flush().
33 */
34
35 #include <limits.h>
36
37 #include "pipe/p_defines.h"
38 #include "util/u_framebuffer.h"
39 #include "util/u_inlines.h"
40 #include "util/u_memory.h"
41 #include "util/u_pack_color.h"
42 #include "util/u_viewport.h"
43 #include "draw/draw_pipe.h"
44 #include "util/os_time.h"
45 #include "lp_context.h"
46 #include "lp_memory.h"
47 #include "lp_scene.h"
48 #include "lp_texture.h"
49 #include "lp_debug.h"
50 #include "lp_fence.h"
51 #include "lp_query.h"
52 #include "lp_rast.h"
53 #include "lp_setup_context.h"
54 #include "lp_screen.h"
55 #include "lp_state.h"
56 #include "frontend/sw_winsys.h"
57
58 #include "draw/draw_context.h"
59 #include "draw/draw_vbuf.h"
60
61
62 static boolean set_scene_state( struct lp_setup_context *, enum setup_state,
63 const char *reason);
64 static boolean try_update_scene_state( struct lp_setup_context *setup );
65
66
67 static void
lp_setup_get_empty_scene(struct lp_setup_context * setup)68 lp_setup_get_empty_scene(struct lp_setup_context *setup)
69 {
70 assert(setup->scene == NULL);
71
72 setup->scene_idx++;
73 setup->scene_idx %= ARRAY_SIZE(setup->scenes);
74
75 setup->scene = setup->scenes[setup->scene_idx];
76
77 if (setup->scene->fence) {
78 if (LP_DEBUG & DEBUG_SETUP)
79 debug_printf("%s: wait for scene %d\n",
80 __FUNCTION__, setup->scene->fence->id);
81
82 lp_fence_wait(setup->scene->fence);
83 }
84
85 lp_scene_begin_binning(setup->scene, &setup->fb);
86
87 }
88
89
90 static void
first_triangle(struct lp_setup_context * setup,const float (* v0)[4],const float (* v1)[4],const float (* v2)[4])91 first_triangle( struct lp_setup_context *setup,
92 const float (*v0)[4],
93 const float (*v1)[4],
94 const float (*v2)[4])
95 {
96 assert(setup->state == SETUP_ACTIVE);
97 lp_setup_choose_triangle( setup );
98 setup->triangle( setup, v0, v1, v2 );
99 }
100
101 static void
first_line(struct lp_setup_context * setup,const float (* v0)[4],const float (* v1)[4])102 first_line( struct lp_setup_context *setup,
103 const float (*v0)[4],
104 const float (*v1)[4])
105 {
106 assert(setup->state == SETUP_ACTIVE);
107 lp_setup_choose_line( setup );
108 setup->line( setup, v0, v1 );
109 }
110
111 static void
first_point(struct lp_setup_context * setup,const float (* v0)[4])112 first_point( struct lp_setup_context *setup,
113 const float (*v0)[4])
114 {
115 assert(setup->state == SETUP_ACTIVE);
116 lp_setup_choose_point( setup );
117 setup->point( setup, v0 );
118 }
119
lp_setup_reset(struct lp_setup_context * setup)120 void lp_setup_reset( struct lp_setup_context *setup )
121 {
122 unsigned i;
123
124 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
125
126 /* Reset derived state */
127 for (i = 0; i < ARRAY_SIZE(setup->constants); ++i) {
128 setup->constants[i].stored_size = 0;
129 setup->constants[i].stored_data = NULL;
130 }
131
132 setup->fs.stored = NULL;
133 setup->dirty = ~0;
134
135 /* no current bin */
136 setup->scene = NULL;
137
138 /* Reset some state:
139 */
140 memset(&setup->clear, 0, sizeof setup->clear);
141
142 /* Have an explicit "start-binning" call and get rid of this
143 * pointer twiddling?
144 */
145 setup->line = first_line;
146 setup->point = first_point;
147 setup->triangle = first_triangle;
148 }
149
150
151 /** Rasterize all scene's bins */
152 static void
lp_setup_rasterize_scene(struct lp_setup_context * setup)153 lp_setup_rasterize_scene( struct lp_setup_context *setup )
154 {
155 struct lp_scene *scene = setup->scene;
156 struct llvmpipe_screen *screen = llvmpipe_screen(scene->pipe->screen);
157
158 scene->num_active_queries = setup->active_binned_queries;
159 memcpy(scene->active_queries, setup->active_queries,
160 scene->num_active_queries * sizeof(scene->active_queries[0]));
161
162 lp_scene_end_binning(scene);
163
164 lp_fence_reference(&setup->last_fence, scene->fence);
165
166 if (setup->last_fence)
167 setup->last_fence->issued = TRUE;
168
169 mtx_lock(&screen->rast_mutex);
170
171 /* FIXME: We enqueue the scene then wait on the rasterizer to finish.
172 * This means we never actually run any vertex stuff in parallel to
173 * rasterization (not in the same context at least) which is what the
174 * multiple scenes per setup is about - when we get a new empty scene
175 * any old one is already empty again because we waited here for
176 * raster tasks to be finished. Ideally, we shouldn't need to wait here
177 * and rely on fences elsewhere when waiting is necessary.
178 * Certainly, lp_scene_end_rasterization() would need to be deferred too
179 * and there's probably other bits why this doesn't actually work.
180 */
181 lp_rast_queue_scene(screen->rast, scene);
182 lp_rast_finish(screen->rast);
183 mtx_unlock(&screen->rast_mutex);
184
185 lp_scene_end_rasterization(setup->scene);
186 lp_setup_reset( setup );
187
188 LP_DBG(DEBUG_SETUP, "%s done \n", __FUNCTION__);
189 }
190
191
192
193 static boolean
begin_binning(struct lp_setup_context * setup)194 begin_binning( struct lp_setup_context *setup )
195 {
196 struct lp_scene *scene = setup->scene;
197 boolean need_zsload = FALSE;
198 boolean ok;
199
200 assert(scene);
201 assert(scene->fence == NULL);
202
203 /* Always create a fence:
204 */
205 scene->fence = lp_fence_create(MAX2(1, setup->num_threads));
206 if (!scene->fence)
207 return FALSE;
208
209 ok = try_update_scene_state(setup);
210 if (!ok)
211 return FALSE;
212
213 if (setup->fb.zsbuf &&
214 ((setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) != PIPE_CLEAR_DEPTHSTENCIL) &&
215 util_format_is_depth_and_stencil(setup->fb.zsbuf->format))
216 need_zsload = TRUE;
217
218 LP_DBG(DEBUG_SETUP, "%s color clear bufs: %x depth: %s\n", __FUNCTION__,
219 setup->clear.flags >> 2,
220 need_zsload ? "clear": "load");
221
222 if (setup->clear.flags & PIPE_CLEAR_COLOR) {
223 unsigned cbuf;
224 for (cbuf = 0; cbuf < setup->fb.nr_cbufs; cbuf++) {
225 assert(PIPE_CLEAR_COLOR0 == 1 << 2);
226 if (setup->clear.flags & (1 << (2 + cbuf))) {
227 union lp_rast_cmd_arg clearrb_arg;
228 struct lp_rast_clear_rb *cc_scene =
229 (struct lp_rast_clear_rb *)
230 lp_scene_alloc(scene, sizeof(struct lp_rast_clear_rb));
231
232 if (!cc_scene) {
233 return FALSE;
234 }
235
236 cc_scene->cbuf = cbuf;
237 cc_scene->color_val = setup->clear.color_val[cbuf];
238 clearrb_arg.clear_rb = cc_scene;
239
240 if (!lp_scene_bin_everywhere(scene,
241 LP_RAST_OP_CLEAR_COLOR,
242 clearrb_arg))
243 return FALSE;
244 }
245 }
246 }
247
248 if (setup->fb.zsbuf) {
249 if (setup->clear.flags & PIPE_CLEAR_DEPTHSTENCIL) {
250 ok = lp_scene_bin_everywhere( scene,
251 LP_RAST_OP_CLEAR_ZSTENCIL,
252 lp_rast_arg_clearzs(
253 setup->clear.zsvalue,
254 setup->clear.zsmask));
255 if (!ok)
256 return FALSE;
257 }
258 }
259
260 setup->clear.flags = 0;
261 setup->clear.zsmask = 0;
262 setup->clear.zsvalue = 0;
263
264 scene->had_queries = !!setup->active_binned_queries;
265
266 LP_DBG(DEBUG_SETUP, "%s done\n", __FUNCTION__);
267 return TRUE;
268 }
269
270
271 /* This basically bins and then flushes any outstanding full-screen
272 * clears.
273 *
274 * TODO: fast path for fullscreen clears and no triangles.
275 */
276 static boolean
execute_clears(struct lp_setup_context * setup)277 execute_clears( struct lp_setup_context *setup )
278 {
279 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
280
281 return begin_binning( setup );
282 }
283
/* Names used in debug output; indexed by the setup state value. */
const char *states[] = { "FLUSHED", "CLEARED", "ACTIVE " };
289
290
291 static boolean
set_scene_state(struct lp_setup_context * setup,enum setup_state new_state,const char * reason)292 set_scene_state( struct lp_setup_context *setup,
293 enum setup_state new_state,
294 const char *reason)
295 {
296 unsigned old_state = setup->state;
297
298 if (old_state == new_state)
299 return TRUE;
300
301 if (LP_DEBUG & DEBUG_SCENE) {
302 debug_printf("%s old %s new %s%s%s\n",
303 __FUNCTION__,
304 states[old_state],
305 states[new_state],
306 (new_state == SETUP_FLUSHED) ? ": " : "",
307 (new_state == SETUP_FLUSHED) ? reason : "");
308
309 if (new_state == SETUP_FLUSHED && setup->scene)
310 lp_debug_draw_bins_by_cmd_length(setup->scene);
311 }
312
313 /* wait for a free/empty scene
314 */
315 if (old_state == SETUP_FLUSHED)
316 lp_setup_get_empty_scene(setup);
317
318 switch (new_state) {
319 case SETUP_CLEARED:
320 break;
321
322 case SETUP_ACTIVE:
323 if (!begin_binning( setup ))
324 goto fail;
325 break;
326
327 case SETUP_FLUSHED:
328 if (old_state == SETUP_CLEARED)
329 if (!execute_clears( setup ))
330 goto fail;
331
332 lp_setup_rasterize_scene( setup );
333 assert(setup->scene == NULL);
334 break;
335
336 default:
337 assert(0 && "invalid setup state mode");
338 goto fail;
339 }
340
341 setup->state = new_state;
342 return TRUE;
343
344 fail:
345 if (setup->scene) {
346 lp_scene_end_rasterization(setup->scene);
347 setup->scene = NULL;
348 }
349
350 setup->state = SETUP_FLUSHED;
351 lp_setup_reset( setup );
352 return FALSE;
353 }
354
355
356 void
lp_setup_flush(struct lp_setup_context * setup,struct pipe_fence_handle ** fence,const char * reason)357 lp_setup_flush( struct lp_setup_context *setup,
358 struct pipe_fence_handle **fence,
359 const char *reason)
360 {
361 set_scene_state( setup, SETUP_FLUSHED, reason );
362
363 if (fence) {
364 lp_fence_reference((struct lp_fence **)fence, setup->last_fence);
365 if (!*fence)
366 *fence = (struct pipe_fence_handle *)lp_fence_create(0);
367 }
368 }
369
370
371 void
lp_setup_bind_framebuffer(struct lp_setup_context * setup,const struct pipe_framebuffer_state * fb)372 lp_setup_bind_framebuffer( struct lp_setup_context *setup,
373 const struct pipe_framebuffer_state *fb )
374 {
375 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
376
377 /* Flush any old scene.
378 */
379 set_scene_state( setup, SETUP_FLUSHED, __FUNCTION__ );
380
381 /*
382 * Ensure the old scene is not reused.
383 */
384 assert(!setup->scene);
385
386 /* Set new state. This will be picked up later when we next need a
387 * scene.
388 */
389 util_copy_framebuffer_state(&setup->fb, fb);
390 setup->framebuffer.x0 = 0;
391 setup->framebuffer.y0 = 0;
392 setup->framebuffer.x1 = fb->width-1;
393 setup->framebuffer.y1 = fb->height-1;
394 setup->dirty |= LP_SETUP_NEW_SCISSOR;
395 }
396
397
398 /*
399 * Try to clear one color buffer of the attached fb, either by binning a clear
400 * command or queuing up the clear for later (when binning is started).
401 */
402 static boolean
lp_setup_try_clear_color_buffer(struct lp_setup_context * setup,const union pipe_color_union * color,unsigned cbuf)403 lp_setup_try_clear_color_buffer(struct lp_setup_context *setup,
404 const union pipe_color_union *color,
405 unsigned cbuf)
406 {
407 union lp_rast_cmd_arg clearrb_arg;
408 union util_color uc;
409 enum pipe_format format = setup->fb.cbufs[cbuf]->format;
410
411 LP_DBG(DEBUG_SETUP, "%s state %d\n", __FUNCTION__, setup->state);
412
413 util_pack_color_union(format, &uc, color);
414
415 if (setup->state == SETUP_ACTIVE) {
416 struct lp_scene *scene = setup->scene;
417
418 /* Add the clear to existing scene. In the unusual case where
419 * both color and depth-stencil are being cleared when there's
420 * already been some rendering, we could discard the currently
421 * binned scene and start again, but I don't see that as being
422 * a common usage.
423 */
424 struct lp_rast_clear_rb *cc_scene =
425 (struct lp_rast_clear_rb *)
426 lp_scene_alloc_aligned(scene, sizeof(struct lp_rast_clear_rb), 8);
427
428 if (!cc_scene) {
429 return FALSE;
430 }
431
432 cc_scene->cbuf = cbuf;
433 cc_scene->color_val = uc;
434 clearrb_arg.clear_rb = cc_scene;
435
436 if (!lp_scene_bin_everywhere(scene,
437 LP_RAST_OP_CLEAR_COLOR,
438 clearrb_arg))
439 return FALSE;
440 }
441 else {
442 /* Put ourselves into the 'pre-clear' state, specifically to try
443 * and accumulate multiple clears to color and depth_stencil
444 * buffers which the app or gallium frontend might issue
445 * separately.
446 */
447 set_scene_state( setup, SETUP_CLEARED, __FUNCTION__ );
448
449 assert(PIPE_CLEAR_COLOR0 == (1 << 2));
450 setup->clear.flags |= 1 << (cbuf + 2);
451 setup->clear.color_val[cbuf] = uc;
452 }
453
454 return TRUE;
455 }
456
457 static boolean
lp_setup_try_clear_zs(struct lp_setup_context * setup,double depth,unsigned stencil,unsigned flags)458 lp_setup_try_clear_zs(struct lp_setup_context *setup,
459 double depth,
460 unsigned stencil,
461 unsigned flags)
462 {
463 uint64_t zsmask = 0;
464 uint64_t zsvalue = 0;
465 uint32_t zmask32;
466 uint8_t smask8;
467 enum pipe_format format = setup->fb.zsbuf->format;
468
469 LP_DBG(DEBUG_SETUP, "%s state %d\n", __FUNCTION__, setup->state);
470
471 zmask32 = (flags & PIPE_CLEAR_DEPTH) ? ~0 : 0;
472 smask8 = (flags & PIPE_CLEAR_STENCIL) ? ~0 : 0;
473
474 zsvalue = util_pack64_z_stencil(format, depth, stencil);
475
476 zsmask = util_pack64_mask_z_stencil(format, zmask32, smask8);
477
478 zsvalue &= zsmask;
479
480 if (format == PIPE_FORMAT_Z24X8_UNORM ||
481 format == PIPE_FORMAT_X8Z24_UNORM) {
482 /*
483 * Make full mask if there's "X" bits so we can do full
484 * clear (without rmw).
485 */
486 uint32_t zsmask_full = 0;
487 zsmask_full = util_pack_mask_z_stencil(format, ~0, ~0);
488 zsmask |= ~zsmask_full;
489 }
490
491 if (setup->state == SETUP_ACTIVE) {
492 struct lp_scene *scene = setup->scene;
493
494 /* Add the clear to existing scene. In the unusual case where
495 * both color and depth-stencil are being cleared when there's
496 * already been some rendering, we could discard the currently
497 * binned scene and start again, but I don't see that as being
498 * a common usage.
499 */
500 if (!lp_scene_bin_everywhere(scene,
501 LP_RAST_OP_CLEAR_ZSTENCIL,
502 lp_rast_arg_clearzs(zsvalue, zsmask)))
503 return FALSE;
504 }
505 else {
506 /* Put ourselves into the 'pre-clear' state, specifically to try
507 * and accumulate multiple clears to color and depth_stencil
508 * buffers which the app or gallium frontend might issue
509 * separately.
510 */
511 set_scene_state( setup, SETUP_CLEARED, __FUNCTION__ );
512
513 setup->clear.flags |= flags;
514
515 setup->clear.zsmask |= zsmask;
516 setup->clear.zsvalue =
517 (setup->clear.zsvalue & ~zsmask) | (zsvalue & zsmask);
518 }
519
520 return TRUE;
521 }
522
523 void
lp_setup_clear(struct lp_setup_context * setup,const union pipe_color_union * color,double depth,unsigned stencil,unsigned flags)524 lp_setup_clear( struct lp_setup_context *setup,
525 const union pipe_color_union *color,
526 double depth,
527 unsigned stencil,
528 unsigned flags )
529 {
530 unsigned i;
531
532 /*
533 * Note any of these (max 9) clears could fail (but at most there should
534 * be just one failure!). This avoids doing the previous succeeded
535 * clears again (we still clear tiles twice if a clear command succeeded
536 * partially for one buffer).
537 */
538 if (flags & PIPE_CLEAR_DEPTHSTENCIL) {
539 unsigned flagszs = flags & PIPE_CLEAR_DEPTHSTENCIL;
540 if (!lp_setup_try_clear_zs(setup, depth, stencil, flagszs)) {
541 lp_setup_flush(setup, NULL, __FUNCTION__);
542
543 if (!lp_setup_try_clear_zs(setup, depth, stencil, flagszs))
544 assert(0);
545 }
546 }
547
548 if (flags & PIPE_CLEAR_COLOR) {
549 assert(PIPE_CLEAR_COLOR0 == (1 << 2));
550 for (i = 0; i < setup->fb.nr_cbufs; i++) {
551 if ((flags & (1 << (2 + i))) && setup->fb.cbufs[i]) {
552 if (!lp_setup_try_clear_color_buffer(setup, color, i)) {
553 lp_setup_flush(setup, NULL, __FUNCTION__);
554
555 if (!lp_setup_try_clear_color_buffer(setup, color, i))
556 assert(0);
557 }
558 }
559 }
560 }
561 }
562
563
564
565 void
lp_setup_set_triangle_state(struct lp_setup_context * setup,unsigned cull_mode,boolean ccw_is_frontface,boolean scissor,boolean half_pixel_center,boolean bottom_edge_rule,boolean multisample)566 lp_setup_set_triangle_state( struct lp_setup_context *setup,
567 unsigned cull_mode,
568 boolean ccw_is_frontface,
569 boolean scissor,
570 boolean half_pixel_center,
571 boolean bottom_edge_rule,
572 boolean multisample)
573 {
574 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
575
576 setup->ccw_is_frontface = ccw_is_frontface;
577 setup->cullmode = cull_mode;
578 setup->triangle = first_triangle;
579 setup->multisample = multisample;
580 setup->pixel_offset = half_pixel_center ? 0.5f : 0.0f;
581 setup->bottom_edge_rule = bottom_edge_rule;
582
583 if (setup->scissor_test != scissor) {
584 setup->dirty |= LP_SETUP_NEW_SCISSOR;
585 setup->scissor_test = scissor;
586 }
587 }
588
589 void
lp_setup_set_line_state(struct lp_setup_context * setup,float line_width)590 lp_setup_set_line_state( struct lp_setup_context *setup,
591 float line_width)
592 {
593 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
594
595 setup->line_width = line_width;
596 }
597
598 void
lp_setup_set_point_state(struct lp_setup_context * setup,float point_size,boolean point_size_per_vertex,uint sprite_coord_enable,uint sprite_coord_origin)599 lp_setup_set_point_state( struct lp_setup_context *setup,
600 float point_size,
601 boolean point_size_per_vertex,
602 uint sprite_coord_enable,
603 uint sprite_coord_origin)
604 {
605 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
606
607 setup->point_size = point_size;
608 setup->sprite_coord_enable = sprite_coord_enable;
609 setup->sprite_coord_origin = sprite_coord_origin;
610 setup->point_size_per_vertex = point_size_per_vertex;
611 }
612
613 void
lp_setup_set_setup_variant(struct lp_setup_context * setup,const struct lp_setup_variant * variant)614 lp_setup_set_setup_variant( struct lp_setup_context *setup,
615 const struct lp_setup_variant *variant)
616 {
617 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
618
619 setup->setup.variant = variant;
620 }
621
622 void
lp_setup_set_fs_variant(struct lp_setup_context * setup,struct lp_fragment_shader_variant * variant)623 lp_setup_set_fs_variant( struct lp_setup_context *setup,
624 struct lp_fragment_shader_variant *variant)
625 {
626 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__,
627 variant);
628
629 setup->fs.current.variant = variant;
630 setup->dirty |= LP_SETUP_NEW_FS;
631 }
632
633 void
lp_setup_set_fs_constants(struct lp_setup_context * setup,unsigned num,struct pipe_constant_buffer * buffers)634 lp_setup_set_fs_constants(struct lp_setup_context *setup,
635 unsigned num,
636 struct pipe_constant_buffer *buffers)
637 {
638 unsigned i;
639
640 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) buffers);
641
642 assert(num <= ARRAY_SIZE(setup->constants));
643
644 for (i = 0; i < num; ++i) {
645 util_copy_constant_buffer(&setup->constants[i].current, &buffers[i]);
646 }
647 for (; i < ARRAY_SIZE(setup->constants); i++) {
648 util_copy_constant_buffer(&setup->constants[i].current, NULL);
649 }
650 setup->dirty |= LP_SETUP_NEW_CONSTANTS;
651 }
652
653 void
lp_setup_set_fs_ssbos(struct lp_setup_context * setup,unsigned num,struct pipe_shader_buffer * buffers)654 lp_setup_set_fs_ssbos(struct lp_setup_context *setup,
655 unsigned num,
656 struct pipe_shader_buffer *buffers)
657 {
658 unsigned i;
659
660 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) buffers);
661
662 assert(num <= ARRAY_SIZE(setup->ssbos));
663
664 for (i = 0; i < num; ++i) {
665 util_copy_shader_buffer(&setup->ssbos[i].current, &buffers[i]);
666 }
667 for (; i < ARRAY_SIZE(setup->ssbos); i++) {
668 util_copy_shader_buffer(&setup->ssbos[i].current, NULL);
669 }
670 setup->dirty |= LP_SETUP_NEW_SSBOS;
671 }
672
673 void
lp_setup_set_fs_images(struct lp_setup_context * setup,unsigned num,struct pipe_image_view * images)674 lp_setup_set_fs_images(struct lp_setup_context *setup,
675 unsigned num,
676 struct pipe_image_view *images)
677 {
678 unsigned i;
679
680 LP_DBG(DEBUG_SETUP, "%s %p\n", __FUNCTION__, (void *) images);
681
682 assert(num <= ARRAY_SIZE(setup->images));
683
684 for (i = 0; i < num; ++i) {
685 struct pipe_image_view *image = &images[i];
686 util_copy_image_view(&setup->images[i].current, &images[i]);
687
688 struct pipe_resource *res = image->resource;
689 struct llvmpipe_resource *lp_res = llvmpipe_resource(res);
690 struct lp_jit_image *jit_image;
691
692 jit_image = &setup->fs.current.jit_context.images[i];
693 if (!lp_res)
694 continue;
695 if (!lp_res->dt) {
696 /* regular texture - setup array of mipmap level offsets */
697 if (llvmpipe_resource_is_texture(res)) {
698 jit_image->base = lp_res->tex_data;
699 } else
700 jit_image->base = lp_res->data;
701
702 jit_image->width = res->width0;
703 jit_image->height = res->height0;
704 jit_image->depth = res->depth0;
705 jit_image->num_samples = res->nr_samples;
706
707 if (llvmpipe_resource_is_texture(res)) {
708 uint32_t mip_offset = lp_res->mip_offsets[image->u.tex.level];
709
710 jit_image->width = u_minify(jit_image->width, image->u.tex.level);
711 jit_image->height = u_minify(jit_image->height, image->u.tex.level);
712
713 if (res->target == PIPE_TEXTURE_1D_ARRAY ||
714 res->target == PIPE_TEXTURE_2D_ARRAY ||
715 res->target == PIPE_TEXTURE_3D ||
716 res->target == PIPE_TEXTURE_CUBE ||
717 res->target == PIPE_TEXTURE_CUBE_ARRAY) {
718 /*
719 * For array textures, we don't have first_layer, instead
720 * adjust last_layer (stored as depth) plus the mip level offsets
721 * (as we have mip-first layout can't just adjust base ptr).
722 * XXX For mip levels, could do something similar.
723 */
724 jit_image->depth = image->u.tex.last_layer - image->u.tex.first_layer + 1;
725 mip_offset += image->u.tex.first_layer * lp_res->img_stride[image->u.tex.level];
726 } else
727 jit_image->depth = u_minify(jit_image->depth, image->u.tex.level);
728
729 jit_image->row_stride = lp_res->row_stride[image->u.tex.level];
730 jit_image->img_stride = lp_res->img_stride[image->u.tex.level];
731 jit_image->sample_stride = lp_res->sample_stride;
732 jit_image->base = (uint8_t *)jit_image->base + mip_offset;
733 }
734 else {
735 unsigned view_blocksize = util_format_get_blocksize(image->format);
736 jit_image->width = image->u.buf.size / view_blocksize;
737 jit_image->base = (uint8_t *)jit_image->base + image->u.buf.offset;
738 }
739 }
740 }
741 for (; i < ARRAY_SIZE(setup->images); i++) {
742 util_copy_image_view(&setup->images[i].current, NULL);
743 }
744 setup->dirty |= LP_SETUP_NEW_FS;
745 }
746
747 void
lp_setup_set_alpha_ref_value(struct lp_setup_context * setup,float alpha_ref_value)748 lp_setup_set_alpha_ref_value( struct lp_setup_context *setup,
749 float alpha_ref_value )
750 {
751 LP_DBG(DEBUG_SETUP, "%s %f\n", __FUNCTION__, alpha_ref_value);
752
753 if(setup->fs.current.jit_context.alpha_ref_value != alpha_ref_value) {
754 setup->fs.current.jit_context.alpha_ref_value = alpha_ref_value;
755 setup->dirty |= LP_SETUP_NEW_FS;
756 }
757 }
758
759 void
lp_setup_set_stencil_ref_values(struct lp_setup_context * setup,const ubyte refs[2])760 lp_setup_set_stencil_ref_values( struct lp_setup_context *setup,
761 const ubyte refs[2] )
762 {
763 LP_DBG(DEBUG_SETUP, "%s %d %d\n", __FUNCTION__, refs[0], refs[1]);
764
765 if (setup->fs.current.jit_context.stencil_ref_front != refs[0] ||
766 setup->fs.current.jit_context.stencil_ref_back != refs[1]) {
767 setup->fs.current.jit_context.stencil_ref_front = refs[0];
768 setup->fs.current.jit_context.stencil_ref_back = refs[1];
769 setup->dirty |= LP_SETUP_NEW_FS;
770 }
771 }
772
773 void
lp_setup_set_blend_color(struct lp_setup_context * setup,const struct pipe_blend_color * blend_color)774 lp_setup_set_blend_color( struct lp_setup_context *setup,
775 const struct pipe_blend_color *blend_color )
776 {
777 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
778
779 assert(blend_color);
780
781 if(memcmp(&setup->blend_color.current, blend_color, sizeof *blend_color) != 0) {
782 memcpy(&setup->blend_color.current, blend_color, sizeof *blend_color);
783 setup->dirty |= LP_SETUP_NEW_BLEND_COLOR;
784 }
785 }
786
787
788 void
lp_setup_set_scissors(struct lp_setup_context * setup,const struct pipe_scissor_state * scissors)789 lp_setup_set_scissors( struct lp_setup_context *setup,
790 const struct pipe_scissor_state *scissors )
791 {
792 unsigned i;
793 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
794
795 assert(scissors);
796
797 for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
798 setup->scissors[i].x0 = scissors[i].minx;
799 setup->scissors[i].x1 = scissors[i].maxx-1;
800 setup->scissors[i].y0 = scissors[i].miny;
801 setup->scissors[i].y1 = scissors[i].maxy-1;
802 }
803 setup->dirty |= LP_SETUP_NEW_SCISSOR;
804 }
805
806 void
lp_setup_set_sample_mask(struct lp_setup_context * setup,uint32_t sample_mask)807 lp_setup_set_sample_mask(struct lp_setup_context *setup,
808 uint32_t sample_mask)
809 {
810 if (setup->fs.current.jit_context.sample_mask != sample_mask) {
811 setup->fs.current.jit_context.sample_mask = sample_mask;
812 setup->dirty |= LP_SETUP_NEW_FS;
813 }
814 }
815
816 void
lp_setup_set_flatshade_first(struct lp_setup_context * setup,boolean flatshade_first)817 lp_setup_set_flatshade_first(struct lp_setup_context *setup,
818 boolean flatshade_first)
819 {
820 setup->flatshade_first = flatshade_first;
821 }
822
823 void
lp_setup_set_rasterizer_discard(struct lp_setup_context * setup,boolean rasterizer_discard)824 lp_setup_set_rasterizer_discard(struct lp_setup_context *setup,
825 boolean rasterizer_discard)
826 {
827 if (setup->rasterizer_discard != rasterizer_discard) {
828 setup->rasterizer_discard = rasterizer_discard;
829 setup->line = first_line;
830 setup->point = first_point;
831 setup->triangle = first_triangle;
832 }
833 }
834
835 void
lp_setup_set_vertex_info(struct lp_setup_context * setup,struct vertex_info * vertex_info)836 lp_setup_set_vertex_info(struct lp_setup_context *setup,
837 struct vertex_info *vertex_info)
838 {
839 /* XXX: just silently holding onto the pointer:
840 */
841 setup->vertex_info = vertex_info;
842 }
843
844
845 /**
846 * Called during state validation when LP_NEW_VIEWPORT is set.
847 */
848 void
lp_setup_set_viewports(struct lp_setup_context * setup,unsigned num_viewports,const struct pipe_viewport_state * viewports)849 lp_setup_set_viewports(struct lp_setup_context *setup,
850 unsigned num_viewports,
851 const struct pipe_viewport_state *viewports)
852 {
853 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
854 unsigned i;
855
856 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
857
858 assert(num_viewports <= PIPE_MAX_VIEWPORTS);
859 assert(viewports);
860
861 /*
862 * For use in lp_state_fs.c, propagate the viewport values for all viewports.
863 */
864 for (i = 0; i < num_viewports; i++) {
865 float min_depth;
866 float max_depth;
867 util_viewport_zmin_zmax(&viewports[i], lp->rasterizer->clip_halfz,
868 &min_depth, &max_depth);
869
870 if (setup->viewports[i].min_depth != min_depth ||
871 setup->viewports[i].max_depth != max_depth) {
872 setup->viewports[i].min_depth = min_depth;
873 setup->viewports[i].max_depth = max_depth;
874 setup->dirty |= LP_SETUP_NEW_VIEWPORTS;
875 }
876 }
877 }
878
879
880 /**
881 * Called during state validation when LP_NEW_SAMPLER_VIEW is set.
882 */
883 void
lp_setup_set_fragment_sampler_views(struct lp_setup_context * setup,unsigned num,struct pipe_sampler_view ** views)884 lp_setup_set_fragment_sampler_views(struct lp_setup_context *setup,
885 unsigned num,
886 struct pipe_sampler_view **views)
887 {
888 unsigned i, max_tex_num;
889
890 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
891
892 assert(num <= PIPE_MAX_SHADER_SAMPLER_VIEWS);
893
894 max_tex_num = MAX2(num, setup->fs.current_tex_num);
895
896 for (i = 0; i < max_tex_num; i++) {
897 struct pipe_sampler_view *view = i < num ? views[i] : NULL;
898
899 if (view) {
900 struct pipe_resource *res = view->texture;
901 struct llvmpipe_resource *lp_tex = llvmpipe_resource(res);
902 struct lp_jit_texture *jit_tex;
903 jit_tex = &setup->fs.current.jit_context.textures[i];
904
905 /* We're referencing the texture's internal data, so save a
906 * reference to it.
907 */
908 pipe_resource_reference(&setup->fs.current_tex[i], res);
909
910 if (!lp_tex->dt) {
911 /* regular texture - setup array of mipmap level offsets */
912 int j;
913 unsigned first_level = 0;
914 unsigned last_level = 0;
915
916 if (llvmpipe_resource_is_texture(res)) {
917 first_level = view->u.tex.first_level;
918 last_level = view->u.tex.last_level;
919 assert(first_level <= last_level);
920 assert(last_level <= res->last_level);
921 jit_tex->base = lp_tex->tex_data;
922 }
923 else {
924 jit_tex->base = lp_tex->data;
925 }
926
927 if (LP_PERF & PERF_TEX_MEM) {
928 /* use dummy tile memory */
929 jit_tex->base = lp_dummy_tile;
930 jit_tex->width = TILE_SIZE/8;
931 jit_tex->height = TILE_SIZE/8;
932 jit_tex->depth = 1;
933 jit_tex->first_level = 0;
934 jit_tex->last_level = 0;
935 jit_tex->mip_offsets[0] = 0;
936 jit_tex->row_stride[0] = 0;
937 jit_tex->img_stride[0] = 0;
938 jit_tex->num_samples = 0;
939 jit_tex->sample_stride = 0;
940 }
941 else {
942 jit_tex->width = res->width0;
943 jit_tex->height = res->height0;
944 jit_tex->depth = res->depth0;
945 jit_tex->first_level = first_level;
946 jit_tex->last_level = last_level;
947 jit_tex->num_samples = res->nr_samples;
948 jit_tex->sample_stride = 0;
949
950 if (llvmpipe_resource_is_texture(res)) {
951 for (j = first_level; j <= last_level; j++) {
952 jit_tex->mip_offsets[j] = lp_tex->mip_offsets[j];
953 jit_tex->row_stride[j] = lp_tex->row_stride[j];
954 jit_tex->img_stride[j] = lp_tex->img_stride[j];
955 }
956
957 jit_tex->sample_stride = lp_tex->sample_stride;
958
959 if (res->target == PIPE_TEXTURE_1D_ARRAY ||
960 res->target == PIPE_TEXTURE_2D_ARRAY ||
961 res->target == PIPE_TEXTURE_CUBE ||
962 res->target == PIPE_TEXTURE_CUBE_ARRAY) {
963 /*
964 * For array textures, we don't have first_layer, instead
965 * adjust last_layer (stored as depth) plus the mip level offsets
966 * (as we have mip-first layout can't just adjust base ptr).
967 * XXX For mip levels, could do something similar.
968 */
969 jit_tex->depth = view->u.tex.last_layer - view->u.tex.first_layer + 1;
970 for (j = first_level; j <= last_level; j++) {
971 jit_tex->mip_offsets[j] += view->u.tex.first_layer *
972 lp_tex->img_stride[j];
973 }
974 if (view->target == PIPE_TEXTURE_CUBE ||
975 view->target == PIPE_TEXTURE_CUBE_ARRAY) {
976 assert(jit_tex->depth % 6 == 0);
977 }
978 assert(view->u.tex.first_layer <= view->u.tex.last_layer);
979 assert(view->u.tex.last_layer < res->array_size);
980 }
981 }
982 else {
983 /*
984 * For buffers, we don't have "offset", instead adjust
985 * the size (stored as width) plus the base pointer.
986 */
987 unsigned view_blocksize = util_format_get_blocksize(view->format);
988 /* probably don't really need to fill that out */
989 jit_tex->mip_offsets[0] = 0;
990 jit_tex->row_stride[0] = 0;
991 jit_tex->img_stride[0] = 0;
992
993 /* everything specified in number of elements here. */
994 jit_tex->width = view->u.buf.size / view_blocksize;
995 jit_tex->base = (uint8_t *)jit_tex->base + view->u.buf.offset;
996 /* XXX Unsure if we need to sanitize parameters? */
997 assert(view->u.buf.offset + view->u.buf.size <= res->width0);
998 }
999 }
1000 }
1001 else {
1002 /* display target texture/surface */
1003 /*
1004 * XXX: Where should this be unmapped?
1005 */
1006 struct llvmpipe_screen *screen = llvmpipe_screen(res->screen);
1007 struct sw_winsys *winsys = screen->winsys;
1008 jit_tex->base = winsys->displaytarget_map(winsys, lp_tex->dt,
1009 PIPE_MAP_READ);
1010 jit_tex->row_stride[0] = lp_tex->row_stride[0];
1011 jit_tex->img_stride[0] = lp_tex->img_stride[0];
1012 jit_tex->mip_offsets[0] = 0;
1013 jit_tex->width = res->width0;
1014 jit_tex->height = res->height0;
1015 jit_tex->depth = res->depth0;
1016 jit_tex->first_level = jit_tex->last_level = 0;
1017 jit_tex->num_samples = res->nr_samples;
1018 jit_tex->sample_stride = 0;
1019 assert(jit_tex->base);
1020 }
1021 }
1022 else {
1023 pipe_resource_reference(&setup->fs.current_tex[i], NULL);
1024 }
1025 }
1026 setup->fs.current_tex_num = num;
1027
1028 setup->dirty |= LP_SETUP_NEW_FS;
1029 }
1030
1031
1032 /**
1033 * Called during state validation when LP_NEW_SAMPLER is set.
1034 */
1035 void
lp_setup_set_fragment_sampler_state(struct lp_setup_context * setup,unsigned num,struct pipe_sampler_state ** samplers)1036 lp_setup_set_fragment_sampler_state(struct lp_setup_context *setup,
1037 unsigned num,
1038 struct pipe_sampler_state **samplers)
1039 {
1040 unsigned i;
1041
1042 LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
1043
1044 assert(num <= PIPE_MAX_SAMPLERS);
1045
1046 for (i = 0; i < PIPE_MAX_SAMPLERS; i++) {
1047 const struct pipe_sampler_state *sampler = i < num ? samplers[i] : NULL;
1048
1049 if (sampler) {
1050 struct lp_jit_sampler *jit_sam;
1051 jit_sam = &setup->fs.current.jit_context.samplers[i];
1052
1053 jit_sam->min_lod = sampler->min_lod;
1054 jit_sam->max_lod = sampler->max_lod;
1055 jit_sam->lod_bias = sampler->lod_bias;
1056 COPY_4V(jit_sam->border_color, sampler->border_color.f);
1057 }
1058 }
1059
1060 setup->dirty |= LP_SETUP_NEW_FS;
1061 }
1062
1063
1064 /**
1065 * Is the given texture referenced by any scene?
1066 * Note: we have to check all scenes including any scenes currently
1067 * being rendered and the current scene being built.
1068 */
1069 unsigned
lp_setup_is_resource_referenced(const struct lp_setup_context * setup,const struct pipe_resource * texture)1070 lp_setup_is_resource_referenced( const struct lp_setup_context *setup,
1071 const struct pipe_resource *texture )
1072 {
1073 unsigned i;
1074
1075 /* check the render targets */
1076 for (i = 0; i < setup->fb.nr_cbufs; i++) {
1077 if (setup->fb.cbufs[i] && setup->fb.cbufs[i]->texture == texture)
1078 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1079 }
1080 if (setup->fb.zsbuf && setup->fb.zsbuf->texture == texture) {
1081 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1082 }
1083
1084 /* check textures referenced by the scene */
1085 for (i = 0; i < ARRAY_SIZE(setup->scenes); i++) {
1086 if (lp_scene_is_resource_referenced(setup->scenes[i], texture)) {
1087 return LP_REFERENCED_FOR_READ;
1088 }
1089 }
1090
1091 for (i = 0; i < ARRAY_SIZE(setup->ssbos); i++) {
1092 if (setup->ssbos[i].current.buffer == texture)
1093 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1094 }
1095
1096 for (i = 0; i < ARRAY_SIZE(setup->images); i++) {
1097 if (setup->images[i].current.resource == texture)
1098 return LP_REFERENCED_FOR_READ | LP_REFERENCED_FOR_WRITE;
1099 }
1100
1101 return LP_UNREFERENCED;
1102 }
1103
1104
1105 /**
1106 * Called by vbuf code when we're about to draw something.
1107 *
1108 * This function stores all dirty state in the current scene's display list
1109 * memory, via lp_scene_alloc(). We can not pass pointers of mutable state to
1110 * the JIT functions, as the JIT functions will be called later on, most likely
1111 * on a different thread.
1112 *
1113 * When processing dirty state it is imperative that we don't refer to any
1114 * pointers previously allocated with lp_scene_alloc() in this function (or any
1115 * function) as they may belong to a scene freed since then.
1116 */
1117 static boolean
try_update_scene_state(struct lp_setup_context * setup)1118 try_update_scene_state( struct lp_setup_context *setup )
1119 {
1120 static const float fake_const_buf[4];
1121 boolean new_scene = (setup->fs.stored == NULL);
1122 struct lp_scene *scene = setup->scene;
1123 unsigned i;
1124
1125 assert(scene);
1126
1127 if (setup->dirty & LP_SETUP_NEW_VIEWPORTS) {
1128 /*
1129 * Record new depth range state for changes due to viewport updates.
1130 *
1131 * TODO: Collapse the existing viewport and depth range information
1132 * into one structure, for access by JIT.
1133 */
1134 struct lp_jit_viewport *stored;
1135
1136 stored = (struct lp_jit_viewport *)
1137 lp_scene_alloc(scene, sizeof setup->viewports);
1138
1139 if (!stored) {
1140 assert(!new_scene);
1141 return FALSE;
1142 }
1143
1144 memcpy(stored, setup->viewports, sizeof setup->viewports);
1145
1146 setup->fs.current.jit_context.viewports = stored;
1147 setup->dirty |= LP_SETUP_NEW_FS;
1148 }
1149
1150 if(setup->dirty & LP_SETUP_NEW_BLEND_COLOR) {
1151 uint8_t *stored;
1152 float* fstored;
1153 unsigned i, j;
1154 unsigned size;
1155
1156 /* Alloc u8_blend_color (16 x i8) and f_blend_color (4 or 8 x f32) */
1157 size = 4 * 16 * sizeof(uint8_t);
1158 size += (LP_MAX_VECTOR_LENGTH / 4) * sizeof(float);
1159 stored = lp_scene_alloc_aligned(scene, size, LP_MIN_VECTOR_ALIGN);
1160
1161 if (!stored) {
1162 assert(!new_scene);
1163 return FALSE;
1164 }
1165
1166 /* Store floating point colour */
1167 fstored = (float*)(stored + 4*16);
1168 for (i = 0; i < (LP_MAX_VECTOR_LENGTH / 4); ++i) {
1169 fstored[i] = setup->blend_color.current.color[i % 4];
1170 }
1171
1172 /* smear each blend color component across 16 ubyte elements */
1173 for (i = 0; i < 4; ++i) {
1174 uint8_t c = float_to_ubyte(setup->blend_color.current.color[i]);
1175 for (j = 0; j < 16; ++j)
1176 stored[i*16 + j] = c;
1177 }
1178
1179 setup->blend_color.stored = stored;
1180 setup->fs.current.jit_context.u8_blend_color = stored;
1181 setup->fs.current.jit_context.f_blend_color = fstored;
1182 setup->dirty |= LP_SETUP_NEW_FS;
1183 }
1184
1185 if (setup->dirty & LP_SETUP_NEW_CONSTANTS) {
1186 for (i = 0; i < ARRAY_SIZE(setup->constants); ++i) {
1187 struct pipe_resource *buffer = setup->constants[i].current.buffer;
1188 const unsigned current_size = MIN2(setup->constants[i].current.buffer_size,
1189 LP_MAX_TGSI_CONST_BUFFER_SIZE);
1190 const ubyte *current_data = NULL;
1191 int num_constants;
1192
1193 STATIC_ASSERT(DATA_BLOCK_SIZE >= LP_MAX_TGSI_CONST_BUFFER_SIZE);
1194
1195 if (buffer) {
1196 /* resource buffer */
1197 current_data = (ubyte *) llvmpipe_resource_data(buffer);
1198 }
1199 else if (setup->constants[i].current.user_buffer) {
1200 /* user-space buffer */
1201 current_data = (ubyte *) setup->constants[i].current.user_buffer;
1202 }
1203
1204 if (current_data && current_size >= sizeof(float)) {
1205 current_data += setup->constants[i].current.buffer_offset;
1206
1207 /* TODO: copy only the actually used constants? */
1208
1209 if (setup->constants[i].stored_size != current_size ||
1210 !setup->constants[i].stored_data ||
1211 memcmp(setup->constants[i].stored_data,
1212 current_data,
1213 current_size) != 0) {
1214 void *stored;
1215
1216 stored = lp_scene_alloc(scene, current_size);
1217 if (!stored) {
1218 assert(!new_scene);
1219 return FALSE;
1220 }
1221
1222 memcpy(stored,
1223 current_data,
1224 current_size);
1225 setup->constants[i].stored_size = current_size;
1226 setup->constants[i].stored_data = stored;
1227 }
1228 setup->fs.current.jit_context.constants[i] =
1229 setup->constants[i].stored_data;
1230 }
1231 else {
1232 setup->constants[i].stored_size = 0;
1233 setup->constants[i].stored_data = NULL;
1234 setup->fs.current.jit_context.constants[i] = fake_const_buf;
1235 }
1236
1237 num_constants =
1238 DIV_ROUND_UP(setup->constants[i].stored_size, lp_get_constant_buffer_stride(scene->pipe->screen));
1239 setup->fs.current.jit_context.num_constants[i] = num_constants;
1240 setup->dirty |= LP_SETUP_NEW_FS;
1241 }
1242 }
1243
1244 if (setup->dirty & LP_SETUP_NEW_SSBOS) {
1245 for (i = 0; i < ARRAY_SIZE(setup->ssbos); ++i) {
1246 struct pipe_resource *buffer = setup->ssbos[i].current.buffer;
1247 const ubyte *current_data = NULL;
1248
1249 if (!buffer)
1250 continue;
1251 /* resource buffer */
1252 current_data = (ubyte *) llvmpipe_resource_data(buffer);
1253 if (current_data) {
1254 current_data += setup->ssbos[i].current.buffer_offset;
1255
1256 setup->fs.current.jit_context.ssbos[i] = (const uint32_t *)current_data;
1257 setup->fs.current.jit_context.num_ssbos[i] = setup->ssbos[i].current.buffer_size;
1258 } else {
1259 setup->fs.current.jit_context.ssbos[i] = NULL;
1260 setup->fs.current.jit_context.num_ssbos[i] = 0;
1261 }
1262 setup->dirty |= LP_SETUP_NEW_FS;
1263 }
1264 }
1265 if (setup->dirty & LP_SETUP_NEW_FS) {
1266 if (!setup->fs.stored ||
1267 memcmp(setup->fs.stored,
1268 &setup->fs.current,
1269 sizeof setup->fs.current) != 0)
1270 {
1271 struct lp_rast_state *stored;
1272
1273 /* The fs state that's been stored in the scene is different from
1274 * the new, current state. So allocate a new lp_rast_state object
1275 * and append it to the bin's setup data buffer.
1276 */
1277 stored = (struct lp_rast_state *) lp_scene_alloc(scene, sizeof *stored);
1278 if (!stored) {
1279 assert(!new_scene);
1280 return FALSE;
1281 }
1282
1283 memcpy(&stored->jit_context,
1284 &setup->fs.current.jit_context,
1285 sizeof setup->fs.current.jit_context);
1286 stored->variant = setup->fs.current.variant;
1287
1288 if (!lp_scene_add_frag_shader_reference(scene,
1289 setup->fs.current.variant))
1290 return FALSE;
1291 setup->fs.stored = stored;
1292
1293 /* The scene now references the textures in the rasterization
1294 * state record. Note that now.
1295 */
1296 for (i = 0; i < ARRAY_SIZE(setup->fs.current_tex); i++) {
1297 if (setup->fs.current_tex[i]) {
1298 if (!lp_scene_add_resource_reference(scene,
1299 setup->fs.current_tex[i],
1300 new_scene)) {
1301 assert(!new_scene);
1302 return FALSE;
1303 }
1304 }
1305 }
1306 }
1307 }
1308
1309 if (setup->dirty & LP_SETUP_NEW_SCISSOR) {
1310 unsigned i;
1311 for (i = 0; i < PIPE_MAX_VIEWPORTS; ++i) {
1312 setup->draw_regions[i] = setup->framebuffer;
1313 if (setup->scissor_test) {
1314 u_rect_possible_intersection(&setup->scissors[i],
1315 &setup->draw_regions[i]);
1316 }
1317 }
1318 }
1319
1320 setup->dirty = 0;
1321
1322 assert(setup->fs.stored);
1323 return TRUE;
1324 }
1325
1326 boolean
lp_setup_update_state(struct lp_setup_context * setup,boolean update_scene)1327 lp_setup_update_state( struct lp_setup_context *setup,
1328 boolean update_scene )
1329 {
1330 /* Some of the 'draw' pipeline stages may have changed some driver state.
1331 * Make sure we've processed those state changes before anything else.
1332 *
1333 * XXX this is the only place where llvmpipe_context is used in the
1334 * setup code. This may get refactored/changed...
1335 */
1336 {
1337 struct llvmpipe_context *lp = llvmpipe_context(setup->pipe);
1338 if (lp->dirty) {
1339 llvmpipe_update_derived(lp);
1340 }
1341
1342 if (lp->setup->dirty) {
1343 llvmpipe_update_setup(lp);
1344 }
1345
1346 assert(setup->setup.variant);
1347
1348 /* Will probably need to move this somewhere else, just need
1349 * to know about vertex shader point size attribute.
1350 */
1351 setup->psize_slot = lp->psize_slot;
1352 setup->viewport_index_slot = lp->viewport_index_slot;
1353 setup->layer_slot = lp->layer_slot;
1354 setup->face_slot = lp->face_slot;
1355
1356 assert(lp->dirty == 0);
1357
1358 assert(lp->setup_variant.key.size ==
1359 setup->setup.variant->key.size);
1360
1361 assert(memcmp(&lp->setup_variant.key,
1362 &setup->setup.variant->key,
1363 setup->setup.variant->key.size) == 0);
1364 }
1365
1366 if (update_scene && setup->state != SETUP_ACTIVE) {
1367 if (!set_scene_state( setup, SETUP_ACTIVE, __FUNCTION__ ))
1368 return FALSE;
1369 }
1370
1371 /* Only call into update_scene_state() if we already have a
1372 * scene:
1373 */
1374 if (update_scene && setup->scene) {
1375 assert(setup->state == SETUP_ACTIVE);
1376
1377 if (try_update_scene_state(setup))
1378 return TRUE;
1379
1380 /* Update failed, try to restart the scene.
1381 *
1382 * Cannot call lp_setup_flush_and_restart() directly here
1383 * because of potential recursion.
1384 */
1385 if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1386 return FALSE;
1387
1388 if (!set_scene_state(setup, SETUP_ACTIVE, __FUNCTION__))
1389 return FALSE;
1390
1391 if (!setup->scene)
1392 return FALSE;
1393
1394 return try_update_scene_state(setup);
1395 }
1396
1397 return TRUE;
1398 }
1399
1400
1401
1402 /* Only caller is lp_setup_vbuf_destroy()
1403 */
1404 void
lp_setup_destroy(struct lp_setup_context * setup)1405 lp_setup_destroy( struct lp_setup_context *setup )
1406 {
1407 uint i;
1408
1409 lp_setup_reset( setup );
1410
1411 util_unreference_framebuffer_state(&setup->fb);
1412
1413 for (i = 0; i < ARRAY_SIZE(setup->fs.current_tex); i++) {
1414 pipe_resource_reference(&setup->fs.current_tex[i], NULL);
1415 }
1416
1417 for (i = 0; i < ARRAY_SIZE(setup->constants); i++) {
1418 pipe_resource_reference(&setup->constants[i].current.buffer, NULL);
1419 }
1420
1421 for (i = 0; i < ARRAY_SIZE(setup->ssbos); i++) {
1422 pipe_resource_reference(&setup->ssbos[i].current.buffer, NULL);
1423 }
1424
1425 /* free the scenes in the 'empty' queue */
1426 for (i = 0; i < ARRAY_SIZE(setup->scenes); i++) {
1427 struct lp_scene *scene = setup->scenes[i];
1428
1429 if (scene->fence)
1430 lp_fence_wait(scene->fence);
1431
1432 lp_scene_destroy(scene);
1433 }
1434
1435 lp_fence_reference(&setup->last_fence, NULL);
1436
1437 FREE( setup );
1438 }
1439
1440
1441 /**
1442 * Create a new primitive tiling engine. Plug it into the backend of
1443 * the draw module. Currently also creates a rasterizer to use with
1444 * it.
1445 */
1446 struct lp_setup_context *
lp_setup_create(struct pipe_context * pipe,struct draw_context * draw)1447 lp_setup_create( struct pipe_context *pipe,
1448 struct draw_context *draw )
1449 {
1450 struct llvmpipe_screen *screen = llvmpipe_screen(pipe->screen);
1451 struct lp_setup_context *setup;
1452 unsigned i;
1453
1454 setup = CALLOC_STRUCT(lp_setup_context);
1455 if (!setup) {
1456 goto no_setup;
1457 }
1458
1459 lp_setup_init_vbuf(setup);
1460
1461 /* Used only in update_state():
1462 */
1463 setup->pipe = pipe;
1464
1465
1466 setup->num_threads = screen->num_threads;
1467 setup->vbuf = draw_vbuf_stage(draw, &setup->base);
1468 if (!setup->vbuf) {
1469 goto no_vbuf;
1470 }
1471
1472 draw_set_rasterize_stage(draw, setup->vbuf);
1473 draw_set_render(draw, &setup->base);
1474
1475 /* create some empty scenes */
1476 for (i = 0; i < MAX_SCENES; i++) {
1477 setup->scenes[i] = lp_scene_create( pipe );
1478 if (!setup->scenes[i]) {
1479 goto no_scenes;
1480 }
1481 }
1482
1483 setup->triangle = first_triangle;
1484 setup->line = first_line;
1485 setup->point = first_point;
1486
1487 setup->dirty = ~0;
1488
1489 /* Initialize empty default fb correctly, so the rect is empty */
1490 setup->framebuffer.x1 = -1;
1491 setup->framebuffer.y1 = -1;
1492
1493 return setup;
1494
1495 no_scenes:
1496 for (i = 0; i < MAX_SCENES; i++) {
1497 if (setup->scenes[i]) {
1498 lp_scene_destroy(setup->scenes[i]);
1499 }
1500 }
1501
1502 setup->vbuf->destroy(setup->vbuf);
1503 no_vbuf:
1504 FREE(setup);
1505 no_setup:
1506 return NULL;
1507 }
1508
1509
1510 /**
1511 * Put a BeginQuery command into all bins.
1512 */
1513 void
lp_setup_begin_query(struct lp_setup_context * setup,struct llvmpipe_query * pq)1514 lp_setup_begin_query(struct lp_setup_context *setup,
1515 struct llvmpipe_query *pq)
1516 {
1517
1518 set_scene_state(setup, SETUP_ACTIVE, "begin_query");
1519
1520 if (!(pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1521 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1522 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE ||
1523 pq->type == PIPE_QUERY_PIPELINE_STATISTICS))
1524 return;
1525
1526 /* init the query to its beginning state */
1527 assert(setup->active_binned_queries < LP_MAX_ACTIVE_BINNED_QUERIES);
1528 /* exceeding list size so just ignore the query */
1529 if (setup->active_binned_queries >= LP_MAX_ACTIVE_BINNED_QUERIES) {
1530 return;
1531 }
1532 assert(setup->active_queries[setup->active_binned_queries] == NULL);
1533 setup->active_queries[setup->active_binned_queries] = pq;
1534 setup->active_binned_queries++;
1535
1536 assert(setup->scene);
1537 if (setup->scene) {
1538 if (!lp_scene_bin_everywhere(setup->scene,
1539 LP_RAST_OP_BEGIN_QUERY,
1540 lp_rast_arg_query(pq))) {
1541
1542 if (!lp_setup_flush_and_restart(setup))
1543 return;
1544
1545 if (!lp_scene_bin_everywhere(setup->scene,
1546 LP_RAST_OP_BEGIN_QUERY,
1547 lp_rast_arg_query(pq))) {
1548 return;
1549 }
1550 }
1551 setup->scene->had_queries |= TRUE;
1552 }
1553 }
1554
1555
1556 /**
1557 * Put an EndQuery command into all bins.
1558 */
1559 void
lp_setup_end_query(struct lp_setup_context * setup,struct llvmpipe_query * pq)1560 lp_setup_end_query(struct lp_setup_context *setup, struct llvmpipe_query *pq)
1561 {
1562 set_scene_state(setup, SETUP_ACTIVE, "end_query");
1563
1564 assert(setup->scene);
1565 if (setup->scene) {
1566 /* pq->fence should be the fence of the *last* scene which
1567 * contributed to the query result.
1568 */
1569 lp_fence_reference(&pq->fence, setup->scene->fence);
1570
1571 if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1572 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1573 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE ||
1574 pq->type == PIPE_QUERY_PIPELINE_STATISTICS ||
1575 pq->type == PIPE_QUERY_TIMESTAMP) {
1576 if (pq->type == PIPE_QUERY_TIMESTAMP &&
1577 !(setup->scene->tiles_x | setup->scene->tiles_y)) {
1578 /*
1579 * If there's a zero width/height framebuffer, there's no bins and
1580 * hence no rast task is ever run. So fill in something here instead.
1581 */
1582 pq->end[0] = os_time_get_nano();
1583 }
1584
1585 if (!lp_scene_bin_everywhere(setup->scene,
1586 LP_RAST_OP_END_QUERY,
1587 lp_rast_arg_query(pq))) {
1588 if (!lp_setup_flush_and_restart(setup))
1589 goto fail;
1590
1591 if (!lp_scene_bin_everywhere(setup->scene,
1592 LP_RAST_OP_END_QUERY,
1593 lp_rast_arg_query(pq))) {
1594 goto fail;
1595 }
1596 }
1597 setup->scene->had_queries |= TRUE;
1598 }
1599 }
1600 else {
1601 lp_fence_reference(&pq->fence, setup->last_fence);
1602 }
1603
1604 fail:
1605 /* Need to do this now not earlier since it still needs to be marked as
1606 * active when binning it would cause a flush.
1607 */
1608 if (pq->type == PIPE_QUERY_OCCLUSION_COUNTER ||
1609 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE ||
1610 pq->type == PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE ||
1611 pq->type == PIPE_QUERY_PIPELINE_STATISTICS) {
1612 unsigned i;
1613
1614 /* remove from active binned query list */
1615 for (i = 0; i < setup->active_binned_queries; i++) {
1616 if (setup->active_queries[i] == pq)
1617 break;
1618 }
1619 assert(i < setup->active_binned_queries);
1620 if (i == setup->active_binned_queries)
1621 return;
1622 setup->active_binned_queries--;
1623 setup->active_queries[i] = setup->active_queries[setup->active_binned_queries];
1624 setup->active_queries[setup->active_binned_queries] = NULL;
1625 }
1626 }
1627
1628
1629 boolean
lp_setup_flush_and_restart(struct lp_setup_context * setup)1630 lp_setup_flush_and_restart(struct lp_setup_context *setup)
1631 {
1632 if (0) debug_printf("%s\n", __FUNCTION__);
1633
1634 assert(setup->state == SETUP_ACTIVE);
1635
1636 if (!set_scene_state(setup, SETUP_FLUSHED, __FUNCTION__))
1637 return FALSE;
1638
1639 if (!lp_setup_update_state(setup, TRUE))
1640 return FALSE;
1641
1642 return TRUE;
1643 }
1644
1645
1646