1 /**************************************************************************
2 *
3 * Copyright 2007-2018 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
 * AA line stage: AA lines are converted to triangles (with an extra generic attribute)
30 *
31 * Authors: Brian Paul
32 */
33
34
35 #include "pipe/p_context.h"
36 #include "pipe/p_defines.h"
37 #include "pipe/p_shader_tokens.h"
38 #include "util/u_inlines.h"
39
40 #include "util/format/u_format.h"
41 #include "util/u_math.h"
42 #include "util/u_memory.h"
43
44 #include "tgsi/tgsi_transform.h"
45 #include "tgsi/tgsi_dump.h"
46
47 #include "draw_context.h"
48 #include "draw_private.h"
49 #include "draw_pipe.h"
50
51 #include "nir.h"
52 #include "nir/nir_draw_helpers.h"
53
/**
 * Approx number of new tokens for the declarations and instructions added
 * by aa_transform_prolog() and aa_transform_epilog().
 */
55 #define NUM_NEW_TOKENS 53
56
57
/**
 * Subclass of pipe_shader_state to carry extra fragment shader info.
 *
 * One of these is allocated by aaline_create_fs_state() for every fragment
 * shader and handed back to the caller as the opaque shader handle.
 */
struct aaline_fragment_shader
{
   /* Base "class"; aaline_create_fs_state() fills in a private copy of the
    * shader's tokens / NIR here. */
   struct pipe_shader_state state;
   /* Handle returned by the driver's create_fs_state for the unmodified
    * shader. */
   void *driver_fs;
   /* Driver handle for the AA-line variant; NULL until
    * bind_aaline_fragment_shader() generates it. */
   void *aaline_fs;
   int generic_attrib;  /**< generic used for distance */
};
68
69
/**
 * Subclass of draw_stage
 *
 * Holds the per-context state of the AA line stage together with the
 * driver's original fragment shader hooks.
 */
struct aaline_stage
{
   /* Base "class"; a draw_stage pointer is cast to aaline_stage by
    * aaline_stage(). */
   struct draw_stage stage;

   /* Computed by aaline_first_line() from the rasterizer's line width. */
   float half_line_width;

   /** For AA lines, this is the vertex attrib slot for new generic */
   uint coord_slot;
   /** position, not necessarily output zero */
   uint pos_slot;


   /*
    * Currently bound state
    * (set by aaline_bind_fs_state(); may be NULL)
    */
   struct aaline_fragment_shader *fs;

   /*
    * Driver interface/override functions
    * (the pipe_context entry points saved by draw_install_aaline_stage()
    * before it replaces them with the aaline_* wrappers)
    */
   void * (*driver_create_fs_state)(struct pipe_context *,
                                    const struct pipe_shader_state *);
   void (*driver_bind_fs_state)(struct pipe_context *, void *);
   void (*driver_delete_fs_state)(struct pipe_context *, void *);
};
98
99
100
101 /**
102 * Subclass of tgsi_transform_context, used for transforming the
103 * user's fragment shader to add the special AA instructions.
104 */
105 struct aa_transform_context {
106 struct tgsi_transform_context base;
107 uint64_t tempsUsed; /**< bitmask */
108 int colorOutput; /**< which output is the primary color */
109 int maxInput, maxGeneric; /**< max input index found */
110 int colorTemp, aaTemp; /**< temp registers */
111 };
112
113 /**
114 * TGSI declaration transform callback.
115 * Look for a free input attrib, and two free temp regs.
116 */
117 static void
aa_transform_decl(struct tgsi_transform_context * ctx,struct tgsi_full_declaration * decl)118 aa_transform_decl(struct tgsi_transform_context *ctx,
119 struct tgsi_full_declaration *decl)
120 {
121 struct aa_transform_context *aactx = (struct aa_transform_context *)ctx;
122
123 if (decl->Declaration.File == TGSI_FILE_OUTPUT &&
124 decl->Semantic.Name == TGSI_SEMANTIC_COLOR &&
125 decl->Semantic.Index == 0) {
126 aactx->colorOutput = decl->Range.First;
127 }
128 else if (decl->Declaration.File == TGSI_FILE_INPUT) {
129 if ((int) decl->Range.Last > aactx->maxInput)
130 aactx->maxInput = decl->Range.Last;
131 if (decl->Semantic.Name == TGSI_SEMANTIC_GENERIC &&
132 (int) decl->Semantic.Index > aactx->maxGeneric) {
133 aactx->maxGeneric = decl->Semantic.Index;
134 }
135 }
136 else if (decl->Declaration.File == TGSI_FILE_TEMPORARY) {
137 uint i;
138 for (i = decl->Range.First;
139 i <= decl->Range.Last; i++) {
140 /*
141 * XXX this bitfield doesn't really cut it...
142 */
143 aactx->tempsUsed |= UINT64_C(1) << i;
144 }
145 }
146
147 ctx->emit_declaration(ctx, decl);
148 }
149
150
/**
 * Return the index of the least significant clear bit of \p bitfield,
 * or -1 when every bit is set.
 */
static int
free_bit(uint64_t bitfield)
{
   /* ffsll() is 1-based and yields 0 when no bit is set */
   const uint64_t unused = ~bitfield;
   const int oneBased = ffsll(unused);

   return oneBased - 1;
}
159
160
161 /**
162 * TGSI transform prolog callback.
163 */
164 static void
aa_transform_prolog(struct tgsi_transform_context * ctx)165 aa_transform_prolog(struct tgsi_transform_context *ctx)
166 {
167 struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
168 uint64_t usedTemps = aactx->tempsUsed;
169
170 /* find two free temp regs */
171 aactx->colorTemp = free_bit(usedTemps);
172 usedTemps |= UINT64_C(1) << aactx->colorTemp;
173 aactx->aaTemp = free_bit(usedTemps);
174 assert(aactx->colorTemp >= 0);
175 assert(aactx->aaTemp >= 0);
176
177 /* declare new generic input/texcoord */
178 tgsi_transform_input_decl(ctx, aactx->maxInput + 1,
179 TGSI_SEMANTIC_GENERIC, aactx->maxGeneric + 1,
180 TGSI_INTERPOLATE_LINEAR);
181
182 /* declare new temp regs */
183 tgsi_transform_temp_decl(ctx, aactx->aaTemp);
184 tgsi_transform_temp_decl(ctx, aactx->colorTemp);
185 }
186
187
188 /**
189 * TGSI transform epilog callback.
190 */
191 static void
aa_transform_epilog(struct tgsi_transform_context * ctx)192 aa_transform_epilog(struct tgsi_transform_context *ctx)
193 {
194 struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
195
196 if (aactx->colorOutput != -1) {
197 struct tgsi_full_instruction inst;
198 /* insert distance-based coverage code for antialiasing. */
199
200 /* saturate(linewidth - fabs(interpx), linelength - fabs(interpz) */
201 inst = tgsi_default_full_instruction();
202 inst.Instruction.Saturate = true;
203 inst.Instruction.Opcode = TGSI_OPCODE_ADD;
204 inst.Instruction.NumDstRegs = 1;
205 tgsi_transform_dst_reg(&inst.Dst[0], TGSI_FILE_TEMPORARY,
206 aactx->aaTemp, TGSI_WRITEMASK_XZ);
207 inst.Instruction.NumSrcRegs = 2;
208 tgsi_transform_src_reg(&inst.Src[1], TGSI_FILE_INPUT, aactx->maxInput + 1,
209 TGSI_SWIZZLE_X, TGSI_SWIZZLE_X,
210 TGSI_SWIZZLE_Z, TGSI_SWIZZLE_Z);
211 tgsi_transform_src_reg(&inst.Src[0], TGSI_FILE_INPUT, aactx->maxInput + 1,
212 TGSI_SWIZZLE_Y, TGSI_SWIZZLE_Y,
213 TGSI_SWIZZLE_W, TGSI_SWIZZLE_W);
214 inst.Src[1].Register.Absolute = true;
215 inst.Src[1].Register.Negate = true;
216 ctx->emit_instruction(ctx, &inst);
217
218 /* MUL width / height alpha */
219 tgsi_transform_op2_swz_inst(ctx, TGSI_OPCODE_MUL,
220 TGSI_FILE_TEMPORARY, aactx->aaTemp,
221 TGSI_WRITEMASK_W,
222 TGSI_FILE_TEMPORARY, aactx->aaTemp,
223 TGSI_SWIZZLE_X,
224 TGSI_FILE_TEMPORARY, aactx->aaTemp,
225 TGSI_SWIZZLE_Z, false);
226
227 /* MOV rgb */
228 tgsi_transform_op1_inst(ctx, TGSI_OPCODE_MOV,
229 TGSI_FILE_OUTPUT, aactx->colorOutput,
230 TGSI_WRITEMASK_XYZ,
231 TGSI_FILE_TEMPORARY, aactx->colorTemp);
232
233 /* MUL alpha */
234 tgsi_transform_op2_inst(ctx, TGSI_OPCODE_MUL,
235 TGSI_FILE_OUTPUT, aactx->colorOutput,
236 TGSI_WRITEMASK_W,
237 TGSI_FILE_TEMPORARY, aactx->colorTemp,
238 TGSI_FILE_TEMPORARY, aactx->aaTemp, false);
239 }
240 }
241
242
243 /**
244 * TGSI instruction transform callback.
245 * Replace writes to result.color w/ a temp reg.
246 */
247 static void
aa_transform_inst(struct tgsi_transform_context * ctx,struct tgsi_full_instruction * inst)248 aa_transform_inst(struct tgsi_transform_context *ctx,
249 struct tgsi_full_instruction *inst)
250 {
251 struct aa_transform_context *aactx = (struct aa_transform_context *) ctx;
252 uint i;
253
254 /*
255 * Look for writes to result.color and replace with colorTemp reg.
256 */
257 for (i = 0; i < inst->Instruction.NumDstRegs; i++) {
258 struct tgsi_full_dst_register *dst = &inst->Dst[i];
259 if (dst->Register.File == TGSI_FILE_OUTPUT &&
260 dst->Register.Index == aactx->colorOutput) {
261 dst->Register.File = TGSI_FILE_TEMPORARY;
262 dst->Register.Index = aactx->colorTemp;
263 }
264 }
265
266 ctx->emit_instruction(ctx, inst);
267 }
268
269
270 /**
271 * Generate the frag shader we'll use for drawing AA lines.
272 * This will be the user's shader plus some arithmetic instructions.
273 */
274 static boolean
generate_aaline_fs(struct aaline_stage * aaline)275 generate_aaline_fs(struct aaline_stage *aaline)
276 {
277 struct pipe_context *pipe = aaline->stage.draw->pipe;
278 const struct pipe_shader_state *orig_fs = &aaline->fs->state;
279 struct pipe_shader_state aaline_fs;
280 struct aa_transform_context transform;
281 const uint newLen = tgsi_num_tokens(orig_fs->tokens) + NUM_NEW_TOKENS;
282
283 aaline_fs = *orig_fs; /* copy to init */
284 aaline_fs.tokens = tgsi_alloc_tokens(newLen);
285 if (aaline_fs.tokens == NULL)
286 return FALSE;
287
288 memset(&transform, 0, sizeof(transform));
289 transform.colorOutput = -1;
290 transform.maxInput = -1;
291 transform.maxGeneric = -1;
292 transform.colorTemp = -1;
293 transform.aaTemp = -1;
294 transform.base.prolog = aa_transform_prolog;
295 transform.base.epilog = aa_transform_epilog;
296 transform.base.transform_instruction = aa_transform_inst;
297 transform.base.transform_declaration = aa_transform_decl;
298
299 tgsi_transform_shader(orig_fs->tokens,
300 (struct tgsi_token *) aaline_fs.tokens,
301 newLen, &transform.base);
302
303 #if 0 /* DEBUG */
304 debug_printf("draw_aaline, orig shader:\n");
305 tgsi_dump(orig_fs->tokens, 0);
306 debug_printf("draw_aaline, new shader:\n");
307 tgsi_dump(aaline_fs.tokens, 0);
308 #endif
309
310 aaline->fs->aaline_fs = aaline->driver_create_fs_state(pipe, &aaline_fs);
311 if (aaline->fs->aaline_fs != NULL)
312 aaline->fs->generic_attrib = transform.maxGeneric + 1;
313
314 FREE((void *)aaline_fs.tokens);
315 return aaline->fs->aaline_fs != NULL;
316 }
317
318 static boolean
generate_aaline_fs_nir(struct aaline_stage * aaline)319 generate_aaline_fs_nir(struct aaline_stage *aaline)
320 {
321 struct pipe_context *pipe = aaline->stage.draw->pipe;
322 const struct pipe_shader_state *orig_fs = &aaline->fs->state;
323 struct pipe_shader_state aaline_fs;
324
325 aaline_fs = *orig_fs; /* copy to init */
326 aaline_fs.ir.nir = nir_shader_clone(NULL, orig_fs->ir.nir);
327 if (!aaline_fs.ir.nir)
328 return FALSE;
329
330 nir_lower_aaline_fs(aaline_fs.ir.nir, &aaline->fs->generic_attrib);
331 aaline->fs->aaline_fs = aaline->driver_create_fs_state(pipe, &aaline_fs);
332 if (aaline->fs->aaline_fs == NULL)
333 return FALSE;
334
335 return TRUE;
336 }
337
338 /**
339 * When we're about to draw our first AA line in a batch, this function is
340 * called to tell the driver to bind our modified fragment shader.
341 */
342 static boolean
bind_aaline_fragment_shader(struct aaline_stage * aaline)343 bind_aaline_fragment_shader(struct aaline_stage *aaline)
344 {
345 struct draw_context *draw = aaline->stage.draw;
346 struct pipe_context *pipe = draw->pipe;
347
348 if (!aaline->fs->aaline_fs) {
349 if (aaline->fs->state.type == PIPE_SHADER_IR_NIR) {
350 if (!generate_aaline_fs_nir(aaline))
351 return FALSE;
352 } else
353 if (!generate_aaline_fs(aaline))
354 return FALSE;
355 }
356
357 draw->suspend_flushing = TRUE;
358 aaline->driver_bind_fs_state(pipe, aaline->fs->aaline_fs);
359 draw->suspend_flushing = FALSE;
360
361 return TRUE;
362 }
363
364
365
/** Cast wrapper: draw_stage pointer to the enclosing aaline_stage. */
static inline struct aaline_stage *
aaline_stage(struct draw_stage *stage)
{
   struct aaline_stage *self = (struct aaline_stage *) stage;

   return self;
}
371
372
373 /**
374 * Draw a wide line by drawing a quad, using geometry which will
375 * fullfill GL's antialiased line requirements.
376 */
377 static void
aaline_line(struct draw_stage * stage,struct prim_header * header)378 aaline_line(struct draw_stage *stage, struct prim_header *header)
379 {
380 const struct aaline_stage *aaline = aaline_stage(stage);
381 const float half_width = aaline->half_line_width;
382 struct prim_header tri;
383 struct vertex_header *v[8];
384 uint coordPos = aaline->coord_slot;
385 uint posPos = aaline->pos_slot;
386 float *pos, *tex;
387 float dx = header->v[1]->data[posPos][0] - header->v[0]->data[posPos][0];
388 float dy = header->v[1]->data[posPos][1] - header->v[0]->data[posPos][1];
389 float a = atan2f(dy, dx);
390 float c_a = cosf(a), s_a = sinf(a);
391 float half_length;
392 float t_l, t_w;
393 uint i;
394
395 half_length = 0.5f * sqrtf(dx * dx + dy * dy);
396
397 if (half_length < 0.5f) {
398 /*
399 * The logic we use for "normal" sized segments is incorrect
400 * for very short segments (basically because we only have
401 * one value to interpolate, not a distance to each endpoint).
402 * Therefore, we calculate half_length differently, so that for
403 * original line length (near) 0, we get alpha 0 - otherwise
404 * max alpha would still be 0.5. This also prevents us from
405 * artifacts due to degenerated lines (the endpoints being
406 * identical, which would still receive anywhere from alpha
407 * 0-0.5 otherwise) (at least the pstipple stage may generate
408 * such lines due to float inaccuracies if line length is very
409 * close to a integer).
410 * Might not be fully accurate neither (because the "strength" of
411 * the line is going to be determined by how close to the pixel
412 * center those 1 or 2 fragments are) but it's probably the best
413 * we can do.
414 */
415 half_length = 2.0f * half_length;
416 } else {
417 half_length = half_length + 0.5f;
418 }
419
420 t_w = half_width;
421 t_l = 0.5f;
422
423 /* allocate/dup new verts */
424 for (i = 0; i < 4; i++) {
425 v[i] = dup_vert(stage, header->v[i/2], i);
426 }
427
428 /*
429 * Quad strip for line from v0 to v1 (*=endpoints):
430 *
431 * 1 3
432 * +-----------------------------+
433 * | |
434 * | *v0 v1* |
435 * | |
436 * +-----------------------------+
437 * 0 2
438 */
439
440 /*
441 * We increase line length by 0.5 pixels (at each endpoint),
442 * and calculate the tri endpoints by moving them half-width
443 * distance away perpendicular to the line.
444 * XXX: since we change line endpoints (by 0.5 pixel), should
445 * actually re-interpolate all other values?
446 */
447
448 /* new verts */
449 pos = v[0]->data[posPos];
450 pos[0] += (-t_l * c_a - t_w * s_a);
451 pos[1] += (-t_l * s_a + t_w * c_a);
452
453 pos = v[1]->data[posPos];
454 pos[0] += (-t_l * c_a - -t_w * s_a);
455 pos[1] += (-t_l * s_a + -t_w * c_a);
456
457 pos = v[2]->data[posPos];
458 pos[0] += (t_l * c_a - t_w * s_a);
459 pos[1] += (t_l * s_a + t_w * c_a);
460
461 pos = v[3]->data[posPos];
462 pos[0] += (t_l * c_a - -t_w * s_a);
463 pos[1] += (t_l * s_a + -t_w * c_a);
464
465 /* new texcoords */
466 tex = v[0]->data[coordPos];
467 ASSIGN_4V(tex, -half_width, half_width, -half_length, half_length);
468
469 tex = v[1]->data[coordPos];
470 ASSIGN_4V(tex, half_width, half_width, -half_length, half_length);
471
472 tex = v[2]->data[coordPos];
473 ASSIGN_4V(tex, -half_width, half_width, half_length, half_length);
474
475 tex = v[3]->data[coordPos];
476 ASSIGN_4V(tex, half_width, half_width, half_length, half_length);
477
478 tri.v[0] = v[2]; tri.v[1] = v[1]; tri.v[2] = v[0];
479 stage->next->tri(stage->next, &tri);
480
481 tri.v[0] = v[3]; tri.v[1] = v[1]; tri.v[2] = v[2];
482 stage->next->tri(stage->next, &tri);
483 }
484
485
486 static void
aaline_first_line(struct draw_stage * stage,struct prim_header * header)487 aaline_first_line(struct draw_stage *stage, struct prim_header *header)
488 {
489 auto struct aaline_stage *aaline = aaline_stage(stage);
490 struct draw_context *draw = stage->draw;
491 struct pipe_context *pipe = draw->pipe;
492 const struct pipe_rasterizer_state *rast = draw->rasterizer;
493 void *r;
494
495 assert(draw->rasterizer->line_smooth && !draw->rasterizer->multisample);
496
497 if (draw->rasterizer->line_width <= 1.0)
498 aaline->half_line_width = 1.0;
499 else
500 aaline->half_line_width = 0.5f * draw->rasterizer->line_width + 0.5f;
501
502 if (!draw->rasterizer->half_pixel_center)
503 /*
504 * The tex coords probably would need adjustments?
505 */
506 debug_printf("aa lines without half pixel center may be wrong\n");
507
508 /*
509 * Bind (generate) our fragprog
510 */
511 if (!bind_aaline_fragment_shader(aaline)) {
512 stage->line = draw_pipe_passthrough_line;
513 stage->line(stage, header);
514 return;
515 }
516
517 draw_aaline_prepare_outputs(draw, draw->pipeline.aaline);
518
519 draw->suspend_flushing = TRUE;
520
521 /* Disable triangle culling, stippling, unfilled mode etc. */
522 r = draw_get_rasterizer_no_cull(draw, rast);
523 pipe->bind_rasterizer_state(pipe, r);
524
525 draw->suspend_flushing = FALSE;
526
527 /* now really draw first line */
528 stage->line = aaline_line;
529 stage->line(stage, header);
530 }
531
532
533 static void
aaline_flush(struct draw_stage * stage,unsigned flags)534 aaline_flush(struct draw_stage *stage, unsigned flags)
535 {
536 struct draw_context *draw = stage->draw;
537 struct aaline_stage *aaline = aaline_stage(stage);
538 struct pipe_context *pipe = draw->pipe;
539
540 stage->line = aaline_first_line;
541 stage->next->flush(stage->next, flags);
542
543 /* restore original frag shader */
544 draw->suspend_flushing = TRUE;
545 aaline->driver_bind_fs_state(pipe, aaline->fs ? aaline->fs->driver_fs : NULL);
546
547 /* restore original rasterizer state */
548 if (draw->rast_handle) {
549 pipe->bind_rasterizer_state(pipe, draw->rast_handle);
550 }
551
552 draw->suspend_flushing = FALSE;
553
554 draw_remove_extra_vertex_attribs(draw);
555 }
556
557
558 static void
aaline_reset_stipple_counter(struct draw_stage * stage)559 aaline_reset_stipple_counter(struct draw_stage *stage)
560 {
561 stage->next->reset_stipple_counter(stage->next);
562 }
563
564
565 static void
aaline_destroy(struct draw_stage * stage)566 aaline_destroy(struct draw_stage *stage)
567 {
568 struct aaline_stage *aaline = aaline_stage(stage);
569 struct pipe_context *pipe = stage->draw->pipe;
570
571 draw_free_temp_verts(stage);
572
573 /* restore the old entry points */
574 pipe->create_fs_state = aaline->driver_create_fs_state;
575 pipe->bind_fs_state = aaline->driver_bind_fs_state;
576 pipe->delete_fs_state = aaline->driver_delete_fs_state;
577
578 FREE(stage);
579 }
580
581
582 static struct aaline_stage *
draw_aaline_stage(struct draw_context * draw)583 draw_aaline_stage(struct draw_context *draw)
584 {
585 struct aaline_stage *aaline = CALLOC_STRUCT(aaline_stage);
586 if (!aaline)
587 return NULL;
588
589 aaline->stage.draw = draw;
590 aaline->stage.name = "aaline";
591 aaline->stage.next = NULL;
592 aaline->stage.point = draw_pipe_passthrough_point;
593 aaline->stage.line = aaline_first_line;
594 aaline->stage.tri = draw_pipe_passthrough_tri;
595 aaline->stage.flush = aaline_flush;
596 aaline->stage.reset_stipple_counter = aaline_reset_stipple_counter;
597 aaline->stage.destroy = aaline_destroy;
598
599 if (!draw_alloc_temp_verts(&aaline->stage, 8)) {
600 aaline->stage.destroy(&aaline->stage);
601 return NULL;
602 }
603
604 return aaline;
605 }
606
607
608 static struct aaline_stage *
aaline_stage_from_pipe(struct pipe_context * pipe)609 aaline_stage_from_pipe(struct pipe_context *pipe)
610 {
611 struct draw_context *draw = (struct draw_context *) pipe->draw;
612
613 if (draw) {
614 return aaline_stage(draw->pipeline.aaline);
615 } else {
616 return NULL;
617 }
618 }
619
620
621 /**
622 * This function overrides the driver's create_fs_state() function and
623 * will typically be called by the gallium frontend.
624 */
625 static void *
aaline_create_fs_state(struct pipe_context * pipe,const struct pipe_shader_state * fs)626 aaline_create_fs_state(struct pipe_context *pipe,
627 const struct pipe_shader_state *fs)
628 {
629 struct aaline_stage *aaline = aaline_stage_from_pipe(pipe);
630 struct aaline_fragment_shader *aafs = NULL;
631
632 if (!aaline)
633 return NULL;
634
635 aafs = CALLOC_STRUCT(aaline_fragment_shader);
636
637 if (!aafs)
638 return NULL;
639
640 aafs->state.type = fs->type;
641 if (fs->type == PIPE_SHADER_IR_TGSI)
642 aafs->state.tokens = tgsi_dup_tokens(fs->tokens);
643 else
644 aafs->state.ir.nir = nir_shader_clone(NULL, fs->ir.nir);
645
646 /* pass-through */
647 aafs->driver_fs = aaline->driver_create_fs_state(pipe, fs);
648
649 return aafs;
650 }
651
652
653 static void
aaline_bind_fs_state(struct pipe_context * pipe,void * fs)654 aaline_bind_fs_state(struct pipe_context *pipe, void *fs)
655 {
656 struct aaline_stage *aaline = aaline_stage_from_pipe(pipe);
657 struct aaline_fragment_shader *aafs = (struct aaline_fragment_shader *) fs;
658
659 if (!aaline) {
660 return;
661 }
662
663 /* save current */
664 aaline->fs = aafs;
665 /* pass-through */
666 aaline->driver_bind_fs_state(pipe, (aafs ? aafs->driver_fs : NULL));
667 }
668
669
670 static void
aaline_delete_fs_state(struct pipe_context * pipe,void * fs)671 aaline_delete_fs_state(struct pipe_context *pipe, void *fs)
672 {
673 struct aaline_stage *aaline = aaline_stage_from_pipe(pipe);
674 struct aaline_fragment_shader *aafs = (struct aaline_fragment_shader *) fs;
675
676 if (!aafs) {
677 return;
678 }
679
680 if (aaline) {
681 /* pass-through */
682 aaline->driver_delete_fs_state(pipe, aafs->driver_fs);
683
684 if (aafs->aaline_fs)
685 aaline->driver_delete_fs_state(pipe, aafs->aaline_fs);
686 }
687
688 if (aafs->state.type == PIPE_SHADER_IR_TGSI)
689 FREE((void*)aafs->state.tokens);
690 else
691 ralloc_free(aafs->state.ir.nir);
692 FREE(aafs);
693 }
694
695
696 void
draw_aaline_prepare_outputs(struct draw_context * draw,struct draw_stage * stage)697 draw_aaline_prepare_outputs(struct draw_context *draw,
698 struct draw_stage *stage)
699 {
700 struct aaline_stage *aaline = aaline_stage(stage);
701 const struct pipe_rasterizer_state *rast = draw->rasterizer;
702
703 /* update vertex attrib info */
704 aaline->pos_slot = draw_current_shader_position_output(draw);
705
706 if (!rast->line_smooth || rast->multisample)
707 return;
708
709 /* allocate the extra post-transformed vertex attribute */
710 if (aaline->fs && aaline->fs->aaline_fs)
711 aaline->coord_slot = draw_alloc_extra_vertex_attrib(draw,
712 TGSI_SEMANTIC_GENERIC,
713 aaline->fs->generic_attrib);
714 else
715 aaline->coord_slot = -1;
716 }
717
718 /**
719 * Called by drivers that want to install this AA line prim stage
720 * into the draw module's pipeline. This will not be used if the
721 * hardware has native support for AA lines.
722 */
723 boolean
draw_install_aaline_stage(struct draw_context * draw,struct pipe_context * pipe)724 draw_install_aaline_stage(struct draw_context *draw, struct pipe_context *pipe)
725 {
726 struct aaline_stage *aaline;
727
728 pipe->draw = (void *) draw;
729
730 /*
731 * Create / install AA line drawing / prim stage
732 */
733 aaline = draw_aaline_stage(draw);
734 if (!aaline)
735 return FALSE;
736
737 /* save original driver functions */
738 aaline->driver_create_fs_state = pipe->create_fs_state;
739 aaline->driver_bind_fs_state = pipe->bind_fs_state;
740 aaline->driver_delete_fs_state = pipe->delete_fs_state;
741
742 /* override the driver's functions */
743 pipe->create_fs_state = aaline_create_fs_state;
744 pipe->bind_fs_state = aaline_bind_fs_state;
745 pipe->delete_fs_state = aaline_delete_fs_state;
746
747 /* Install once everything is known to be OK:
748 */
749 draw->pipeline.aaline = &aaline->stage;
750
751 return TRUE;
752 }
753