1 /**************************************************************************
2 *
3 * Copyright 2007 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /* Authors: Keith Whitwell <keithw@vmware.com>
29 */
30
31 #include "compiler/nir/nir_builder.h"
32 #include "draw/draw_context.h"
33 #include "nir/nir_to_tgsi.h"
34 #include "tgsi/tgsi_parse.h"
35 #include "util/u_helpers.h"
36 #include "util/u_inlines.h"
37 #include "util/u_math.h"
38 #include "util/u_memory.h"
39 #include "util/u_transfer.h"
40 #include "nir.h"
41
42 #include "i915_context.h"
43 #include "i915_fpc.h"
44 #include "i915_reg.h"
45 #include "i915_resource.h"
46 #include "i915_state.h"
47 #include "i915_state_inlines.h"
48
49 /* The i915 (and related graphics cores) do not support GL_CLAMP. The
50 * Intel drivers for "other operating systems" implement GL_CLAMP as
51 * GL_CLAMP_TO_EDGE, so the same is done here.
52 */
53 static unsigned
translate_wrap_mode(unsigned wrap)54 translate_wrap_mode(unsigned wrap)
55 {
56 switch (wrap) {
57 case PIPE_TEX_WRAP_REPEAT:
58 return TEXCOORDMODE_WRAP;
59 case PIPE_TEX_WRAP_CLAMP:
60 return TEXCOORDMODE_CLAMP_EDGE; /* not quite correct */
61 case PIPE_TEX_WRAP_CLAMP_TO_EDGE:
62 return TEXCOORDMODE_CLAMP_EDGE;
63 case PIPE_TEX_WRAP_CLAMP_TO_BORDER:
64 return TEXCOORDMODE_CLAMP_BORDER;
65 case PIPE_TEX_WRAP_MIRROR_REPEAT:
66 return TEXCOORDMODE_MIRROR;
67 default:
68 return TEXCOORDMODE_WRAP;
69 }
70 }
71
72 static unsigned
translate_img_filter(unsigned filter)73 translate_img_filter(unsigned filter)
74 {
75 switch (filter) {
76 case PIPE_TEX_FILTER_NEAREST:
77 return FILTER_NEAREST;
78 case PIPE_TEX_FILTER_LINEAR:
79 return FILTER_LINEAR;
80 default:
81 assert(0);
82 return FILTER_NEAREST;
83 }
84 }
85
86 static unsigned
translate_mip_filter(unsigned filter)87 translate_mip_filter(unsigned filter)
88 {
89 switch (filter) {
90 case PIPE_TEX_MIPFILTER_NONE:
91 return MIPFILTER_NONE;
92 case PIPE_TEX_MIPFILTER_NEAREST:
93 return MIPFILTER_NEAREST;
94 case PIPE_TEX_MIPFILTER_LINEAR:
95 return MIPFILTER_LINEAR;
96 default:
97 assert(0);
98 return MIPFILTER_NONE;
99 }
100 }
101
102 static uint32_t
i915_remap_lis6_blend_dst_alpha(uint32_t lis6,uint32_t normal,uint32_t inv)103 i915_remap_lis6_blend_dst_alpha(uint32_t lis6, uint32_t normal, uint32_t inv)
104 {
105 uint32_t src = (lis6 >> S6_CBUF_SRC_BLEND_FACT_SHIFT) & BLENDFACT_MASK;
106 lis6 &= ~SRC_BLND_FACT(BLENDFACT_MASK);
107 if (src == BLENDFACT_DST_ALPHA)
108 src = normal;
109 else if (src == BLENDFACT_INV_DST_ALPHA)
110 src = inv;
111 lis6 |= SRC_BLND_FACT(src);
112
113 uint32_t dst = (lis6 >> S6_CBUF_DST_BLEND_FACT_SHIFT) & BLENDFACT_MASK;
114 lis6 &= ~DST_BLND_FACT(BLENDFACT_MASK);
115 if (dst == BLENDFACT_DST_ALPHA)
116 dst = normal;
117 else if (dst == BLENDFACT_INV_DST_ALPHA)
118 dst = inv;
119 lis6 |= DST_BLND_FACT(dst);
120
121 return lis6;
122 }
123
124 static uint32_t
i915_remap_iab_blend_dst_alpha(uint32_t iab,uint32_t normal,uint32_t inv)125 i915_remap_iab_blend_dst_alpha(uint32_t iab, uint32_t normal, uint32_t inv)
126 {
127 uint32_t src = (iab >> IAB_SRC_FACTOR_SHIFT) & BLENDFACT_MASK;
128 iab &= ~SRC_BLND_FACT(BLENDFACT_MASK);
129 if (src == BLENDFACT_DST_ALPHA)
130 src = normal;
131 else if (src == BLENDFACT_INV_DST_ALPHA)
132 src = inv;
133 iab |= SRC_ABLND_FACT(src);
134
135 uint32_t dst = (iab >> IAB_DST_FACTOR_SHIFT) & BLENDFACT_MASK;
136 iab &= ~DST_BLND_FACT(BLENDFACT_MASK);
137 if (dst == BLENDFACT_DST_ALPHA)
138 dst = normal;
139 else if (dst == BLENDFACT_INV_DST_ALPHA)
140 dst = inv;
141 iab |= DST_ABLND_FACT(dst);
142
143 return iab;
144 }
145
146 /* None of this state is actually used for anything yet.
147 */
148 static void *
i915_create_blend_state(struct pipe_context * pipe,const struct pipe_blend_state * blend)149 i915_create_blend_state(struct pipe_context *pipe,
150 const struct pipe_blend_state *blend)
151 {
152 struct i915_blend_state *cso_data = CALLOC_STRUCT(i915_blend_state);
153
154 {
155 unsigned eqRGB = blend->rt[0].rgb_func;
156 unsigned srcRGB = blend->rt[0].rgb_src_factor;
157 unsigned dstRGB = blend->rt[0].rgb_dst_factor;
158
159 unsigned eqA = blend->rt[0].alpha_func;
160 unsigned srcA = blend->rt[0].alpha_src_factor;
161 unsigned dstA = blend->rt[0].alpha_dst_factor;
162
163 /* Special handling for MIN/MAX filter modes handled at
164 * frontend level.
165 */
166
167 if (srcA != srcRGB || dstA != dstRGB || eqA != eqRGB) {
168
169 cso_data->iab = (_3DSTATE_INDEPENDENT_ALPHA_BLEND_CMD |
170 IAB_MODIFY_ENABLE | IAB_ENABLE | IAB_MODIFY_FUNC |
171 IAB_MODIFY_SRC_FACTOR | IAB_MODIFY_DST_FACTOR |
172 SRC_ABLND_FACT(i915_translate_blend_factor(srcA)) |
173 DST_ABLND_FACT(i915_translate_blend_factor(dstA)) |
174 (i915_translate_blend_func(eqA) << IAB_FUNC_SHIFT));
175 } else {
176 cso_data->iab =
177 (_3DSTATE_INDEPENDENT_ALPHA_BLEND_CMD | IAB_MODIFY_ENABLE | 0);
178 }
179 }
180
181 cso_data->modes4 |=
182 (_3DSTATE_MODES_4_CMD | ENABLE_LOGIC_OP_FUNC |
183 LOGIC_OP_FUNC(i915_translate_logic_op(blend->logicop_func)));
184
185 if (blend->logicop_enable)
186 cso_data->LIS5 |= S5_LOGICOP_ENABLE;
187
188 if (blend->dither)
189 cso_data->LIS5 |= S5_COLOR_DITHER_ENABLE;
190
191 /* We potentially do some fixup at emission for non-BGRA targets */
192 if ((blend->rt[0].colormask & PIPE_MASK_R) == 0)
193 cso_data->LIS5 |= S5_WRITEDISABLE_RED;
194
195 if ((blend->rt[0].colormask & PIPE_MASK_G) == 0)
196 cso_data->LIS5 |= S5_WRITEDISABLE_GREEN;
197
198 if ((blend->rt[0].colormask & PIPE_MASK_B) == 0)
199 cso_data->LIS5 |= S5_WRITEDISABLE_BLUE;
200
201 if ((blend->rt[0].colormask & PIPE_MASK_A) == 0)
202 cso_data->LIS5 |= S5_WRITEDISABLE_ALPHA;
203
204 if (blend->rt[0].blend_enable) {
205 unsigned funcRGB = blend->rt[0].rgb_func;
206 unsigned srcRGB = blend->rt[0].rgb_src_factor;
207 unsigned dstRGB = blend->rt[0].rgb_dst_factor;
208
209 cso_data->LIS6 |=
210 (S6_CBUF_BLEND_ENABLE |
211 SRC_BLND_FACT(i915_translate_blend_factor(srcRGB)) |
212 DST_BLND_FACT(i915_translate_blend_factor(dstRGB)) |
213 (i915_translate_blend_func(funcRGB) << S6_CBUF_BLEND_FUNC_SHIFT));
214 }
215
216 cso_data->LIS6_alpha_in_g = i915_remap_lis6_blend_dst_alpha(
217 cso_data->LIS6, BLENDFACT_DST_COLR, BLENDFACT_INV_DST_COLR);
218 cso_data->LIS6_alpha_is_x = i915_remap_lis6_blend_dst_alpha(
219 cso_data->LIS6, BLENDFACT_ONE, BLENDFACT_ZERO);
220
221 cso_data->iab_alpha_in_g = i915_remap_iab_blend_dst_alpha(
222 cso_data->iab, BLENDFACT_DST_COLR, BLENDFACT_INV_DST_COLR);
223 cso_data->iab_alpha_is_x = i915_remap_iab_blend_dst_alpha(
224 cso_data->iab, BLENDFACT_ONE, BLENDFACT_ZERO);
225
226 return cso_data;
227 }
228
229 static void
i915_bind_blend_state(struct pipe_context * pipe,void * blend)230 i915_bind_blend_state(struct pipe_context *pipe, void *blend)
231 {
232 struct i915_context *i915 = i915_context(pipe);
233
234 if (i915->blend == blend)
235 return;
236
237 i915->blend = (struct i915_blend_state *)blend;
238
239 i915->dirty |= I915_NEW_BLEND;
240 }
241
/**
 * Release a blend CSO.  The context argument is not used.
 */
static void
i915_delete_blend_state(struct pipe_context *pipe, void *blend)
{
   (void)pipe;

   FREE(blend);
}
247
248 static void
i915_set_blend_color(struct pipe_context * pipe,const struct pipe_blend_color * blend_color)249 i915_set_blend_color(struct pipe_context *pipe,
250 const struct pipe_blend_color *blend_color)
251 {
252 struct i915_context *i915 = i915_context(pipe);
253
254 if (!blend_color)
255 return;
256
257 i915->blend_color = *blend_color;
258
259 i915->dirty |= I915_NEW_BLEND;
260 }
261
262 static void
i915_set_stencil_ref(struct pipe_context * pipe,const struct pipe_stencil_ref stencil_ref)263 i915_set_stencil_ref(struct pipe_context *pipe,
264 const struct pipe_stencil_ref stencil_ref)
265 {
266 struct i915_context *i915 = i915_context(pipe);
267
268 i915->stencil_ref = stencil_ref;
269
270 i915->dirty |= I915_NEW_DEPTH_STENCIL;
271 }
272
273 static void *
i915_create_sampler_state(struct pipe_context * pipe,const struct pipe_sampler_state * sampler)274 i915_create_sampler_state(struct pipe_context *pipe,
275 const struct pipe_sampler_state *sampler)
276 {
277 struct i915_sampler_state *cso = CALLOC_STRUCT(i915_sampler_state);
278 const unsigned ws = sampler->wrap_s;
279 const unsigned wt = sampler->wrap_t;
280 const unsigned wr = sampler->wrap_r;
281 unsigned minFilt, magFilt;
282 unsigned mipFilt;
283
284 cso->templ = *sampler;
285
286 mipFilt = translate_mip_filter(sampler->min_mip_filter);
287 minFilt = translate_img_filter(sampler->min_img_filter);
288 magFilt = translate_img_filter(sampler->mag_img_filter);
289
290 if (sampler->max_anisotropy > 1)
291 minFilt = magFilt = FILTER_ANISOTROPIC;
292
293 if (sampler->max_anisotropy > 2) {
294 cso->state[0] |= SS2_MAX_ANISO_4;
295 }
296
297 {
298 int b = (int)(sampler->lod_bias * 16.0);
299 b = CLAMP(b, -256, 255);
300 cso->state[0] |= ((b << SS2_LOD_BIAS_SHIFT) & SS2_LOD_BIAS_MASK);
301 }
302
303 /* Shadow:
304 */
305 if (sampler->compare_mode == PIPE_TEX_COMPARE_R_TO_TEXTURE) {
306 cso->state[0] |= (SS2_SHADOW_ENABLE | i915_translate_shadow_compare_func(
307 sampler->compare_func));
308
309 minFilt = FILTER_4X4_FLAT;
310 magFilt = FILTER_4X4_FLAT;
311 }
312
313 cso->state[0] |=
314 ((minFilt << SS2_MIN_FILTER_SHIFT) | (mipFilt << SS2_MIP_FILTER_SHIFT) |
315 (magFilt << SS2_MAG_FILTER_SHIFT));
316
317 cso->state[1] |= ((translate_wrap_mode(ws) << SS3_TCX_ADDR_MODE_SHIFT) |
318 (translate_wrap_mode(wt) << SS3_TCY_ADDR_MODE_SHIFT) |
319 (translate_wrap_mode(wr) << SS3_TCZ_ADDR_MODE_SHIFT));
320
321 if (!sampler->unnormalized_coords)
322 cso->state[1] |= SS3_NORMALIZED_COORDS;
323
324 {
325 int minlod = (int)(16.0 * sampler->min_lod);
326 int maxlod = (int)(16.0 * sampler->max_lod);
327 minlod = CLAMP(minlod, 0, 16 * 11);
328 maxlod = CLAMP(maxlod, 0, 16 * 11);
329
330 if (minlod > maxlod)
331 maxlod = minlod;
332
333 cso->minlod = minlod;
334 cso->maxlod = maxlod;
335 }
336
337 {
338 uint8_t r = float_to_ubyte(sampler->border_color.f[0]);
339 uint8_t g = float_to_ubyte(sampler->border_color.f[1]);
340 uint8_t b = float_to_ubyte(sampler->border_color.f[2]);
341 uint8_t a = float_to_ubyte(sampler->border_color.f[3]);
342 cso->state[2] = I915PACKCOLOR8888(r, g, b, a);
343 }
344 return cso;
345 }
346
347 static void
i915_bind_sampler_states(struct pipe_context * pipe,enum pipe_shader_type shader,unsigned start,unsigned num,void ** samplers)348 i915_bind_sampler_states(struct pipe_context *pipe,
349 enum pipe_shader_type shader, unsigned start,
350 unsigned num, void **samplers)
351 {
352 if (shader != PIPE_SHADER_FRAGMENT) {
353 assert(num == 0);
354 return;
355 }
356
357 struct i915_context *i915 = i915_context(pipe);
358 unsigned i;
359
360 /* Check for no-op */
361 if (num == i915->num_samplers &&
362 !memcmp(i915->fragment_sampler + start, samplers, num * sizeof(void *)))
363 return;
364
365 for (i = 0; i < num; ++i)
366 i915->fragment_sampler[i + start] = samplers[i];
367
368 /* find highest non-null samplers[] entry */
369 {
370 unsigned j = MAX2(i915->num_samplers, start + num);
371 while (j > 0 && i915->fragment_sampler[j - 1] == NULL)
372 j--;
373 i915->num_samplers = j;
374 }
375
376 i915->dirty |= I915_NEW_SAMPLER;
377 }
378
/**
 * Release a sampler CSO.  The context argument is not used.
 */
static void
i915_delete_sampler_state(struct pipe_context *pipe, void *sampler)
{
   (void)pipe;

   FREE(sampler);
}
384
385 /** XXX move someday? Or consolidate all these simple state setters
386 * into one file.
387 */
388
389 static uint32_t
i915_get_modes4_stencil(const struct pipe_stencil_state * stencil)390 i915_get_modes4_stencil(const struct pipe_stencil_state *stencil)
391 {
392 int testmask = stencil->valuemask & 0xff;
393 int writemask = stencil->writemask & 0xff;
394
395 return (_3DSTATE_MODES_4_CMD | ENABLE_STENCIL_TEST_MASK |
396 STENCIL_TEST_MASK(testmask) | ENABLE_STENCIL_WRITE_MASK |
397 STENCIL_WRITE_MASK(writemask));
398 }
399
400 static uint32_t
i915_get_lis5_stencil(const struct pipe_stencil_state * stencil)401 i915_get_lis5_stencil(const struct pipe_stencil_state *stencil)
402 {
403 int test = i915_translate_compare_func(stencil->func);
404 int fop = i915_translate_stencil_op(stencil->fail_op);
405 int dfop = i915_translate_stencil_op(stencil->zfail_op);
406 int dpop = i915_translate_stencil_op(stencil->zpass_op);
407
408 return (S5_STENCIL_TEST_ENABLE | S5_STENCIL_WRITE_ENABLE |
409 (test << S5_STENCIL_TEST_FUNC_SHIFT) |
410 (fop << S5_STENCIL_FAIL_SHIFT) |
411 (dfop << S5_STENCIL_PASS_Z_FAIL_SHIFT) |
412 (dpop << S5_STENCIL_PASS_Z_PASS_SHIFT));
413 }
414
415 static uint32_t
i915_get_bfo(const struct pipe_stencil_state * stencil)416 i915_get_bfo(const struct pipe_stencil_state *stencil)
417 {
418 int test = i915_translate_compare_func(stencil->func);
419 int fop = i915_translate_stencil_op(stencil->fail_op);
420 int dfop = i915_translate_stencil_op(stencil->zfail_op);
421 int dpop = i915_translate_stencil_op(stencil->zpass_op);
422
423 return (_3DSTATE_BACKFACE_STENCIL_OPS | BFO_ENABLE_STENCIL_FUNCS |
424 BFO_ENABLE_STENCIL_TWO_SIDE | BFO_ENABLE_STENCIL_REF |
425 BFO_STENCIL_TWO_SIDE | (test << BFO_STENCIL_TEST_SHIFT) |
426 (fop << BFO_STENCIL_FAIL_SHIFT) |
427 (dfop << BFO_STENCIL_PASS_Z_FAIL_SHIFT) |
428 (dpop << BFO_STENCIL_PASS_Z_PASS_SHIFT));
429 }
430
431 static uint32_t
i915_get_bfm(const struct pipe_stencil_state * stencil)432 i915_get_bfm(const struct pipe_stencil_state *stencil)
433 {
434 return (_3DSTATE_BACKFACE_STENCIL_MASKS | BFM_ENABLE_STENCIL_TEST_MASK |
435 BFM_ENABLE_STENCIL_WRITE_MASK |
436 ((stencil->valuemask & 0xff) << BFM_STENCIL_TEST_MASK_SHIFT) |
437 ((stencil->writemask & 0xff) << BFM_STENCIL_WRITE_MASK_SHIFT));
438 }
439
440 static void *
i915_create_depth_stencil_state(struct pipe_context * pipe,const struct pipe_depth_stencil_alpha_state * depth_stencil)441 i915_create_depth_stencil_state(
442 struct pipe_context *pipe,
443 const struct pipe_depth_stencil_alpha_state *depth_stencil)
444 {
445 struct i915_depth_stencil_state *cso =
446 CALLOC_STRUCT(i915_depth_stencil_state);
447
448 cso->stencil_modes4_cw = i915_get_modes4_stencil(&depth_stencil->stencil[0]);
449 cso->stencil_modes4_ccw =
450 i915_get_modes4_stencil(&depth_stencil->stencil[1]);
451
452 if (depth_stencil->stencil[0].enabled) {
453 cso->stencil_LIS5_cw = i915_get_lis5_stencil(&depth_stencil->stencil[0]);
454 }
455
456 if (depth_stencil->stencil[1].enabled) {
457 cso->bfo_cw[0] = i915_get_bfo(&depth_stencil->stencil[1]);
458 cso->bfo_cw[1] = i915_get_bfm(&depth_stencil->stencil[1]);
459
460 /* Precompute the backface stencil settings if front winding order is
461 * reversed -- HW doesn't have a bit to flip it for us.
462 */
463 cso->stencil_LIS5_ccw = i915_get_lis5_stencil(&depth_stencil->stencil[1]);
464 cso->bfo_ccw[0] = i915_get_bfo(&depth_stencil->stencil[0]);
465 cso->bfo_ccw[1] = i915_get_bfm(&depth_stencil->stencil[0]);
466 } else {
467 /* This actually disables two-side stencil: The bit set is a
468 * modify-enable bit to indicate we are changing the two-side
469 * setting. Then there is a symbolic zero to show that we are
470 * setting the flag to zero/off.
471 */
472 cso->bfo_cw[0] = cso->bfo_ccw[0] =
473 (_3DSTATE_BACKFACE_STENCIL_OPS | BFO_ENABLE_STENCIL_TWO_SIDE | 0);
474 cso->bfo_cw[1] = cso->bfo_ccw[1] = 0;
475
476 cso->stencil_LIS5_ccw = cso->stencil_LIS5_cw;
477 }
478
479 if (depth_stencil->depth_enabled) {
480 int func = i915_translate_compare_func(depth_stencil->depth_func);
481
482 cso->depth_LIS6 |=
483 (S6_DEPTH_TEST_ENABLE | (func << S6_DEPTH_TEST_FUNC_SHIFT));
484
485 if (depth_stencil->depth_writemask)
486 cso->depth_LIS6 |= S6_DEPTH_WRITE_ENABLE;
487 }
488
489 if (depth_stencil->alpha_enabled) {
490 int test = i915_translate_compare_func(depth_stencil->alpha_func);
491 uint8_t refByte = float_to_ubyte(depth_stencil->alpha_ref_value);
492
493 cso->depth_LIS6 |=
494 (S6_ALPHA_TEST_ENABLE | (test << S6_ALPHA_TEST_FUNC_SHIFT) |
495 (((unsigned)refByte) << S6_ALPHA_REF_SHIFT));
496 }
497
498 return cso;
499 }
500
501 static void
i915_bind_depth_stencil_state(struct pipe_context * pipe,void * depth_stencil)502 i915_bind_depth_stencil_state(struct pipe_context *pipe, void *depth_stencil)
503 {
504 struct i915_context *i915 = i915_context(pipe);
505
506 if (i915->depth_stencil == depth_stencil)
507 return;
508
509 i915->depth_stencil = (const struct i915_depth_stencil_state *)depth_stencil;
510
511 i915->dirty |= I915_NEW_DEPTH_STENCIL;
512 }
513
/**
 * Release a depth/stencil/alpha CSO.  The context argument is not used.
 */
static void
i915_delete_depth_stencil_state(struct pipe_context *pipe, void *depth_stencil)
{
   (void)pipe;

   FREE(depth_stencil);
}
519
520 static void
i915_set_scissor_states(struct pipe_context * pipe,unsigned start_slot,unsigned num_scissors,const struct pipe_scissor_state * scissor)521 i915_set_scissor_states(struct pipe_context *pipe, unsigned start_slot,
522 unsigned num_scissors,
523 const struct pipe_scissor_state *scissor)
524 {
525 struct i915_context *i915 = i915_context(pipe);
526
527 memcpy(&i915->scissor, scissor, sizeof(*scissor));
528 i915->dirty |= I915_NEW_SCISSOR;
529 }
530
/* Polygon stipple setter.  The body is empty: the pattern passed in is
 * neither stored nor forwarded by this function.
 */
static void
i915_set_polygon_stipple(struct pipe_context *pipe,
                         const struct pipe_poly_stipple *stipple)
{
}
536
/* Options passed to nir_to_tgsi_options() when fragment shaders are
 * converted from NIR to TGSI in this file; only lower_fabs is enabled.
 */
static const struct nir_to_tgsi_options ntt_options = {
   .lower_fabs = true,
};
540
541 static void *
i915_create_fs_state(struct pipe_context * pipe,const struct pipe_shader_state * templ)542 i915_create_fs_state(struct pipe_context *pipe,
543 const struct pipe_shader_state *templ)
544 {
545 struct i915_context *i915 = i915_context(pipe);
546 struct i915_fragment_shader *ifs = CALLOC_STRUCT(i915_fragment_shader);
547 if (!ifs)
548 return NULL;
549
550 ifs->draw_data = draw_create_fragment_shader(i915->draw, templ);
551
552 if (templ->type == PIPE_SHADER_IR_NIR) {
553 nir_shader *s = templ->ir.nir;
554 ifs->internal = s->info.internal;
555
556 ifs->state.tokens = nir_to_tgsi_options(s, pipe->screen, &ntt_options);
557 } else {
558 assert(templ->type == PIPE_SHADER_IR_TGSI);
559 /* we need to keep a local copy of the tokens */
560 ifs->state.tokens = tgsi_dup_tokens(templ->tokens);
561 ifs->internal = i915->no_log_program_errors;
562 }
563
564 ifs->state.type = PIPE_SHADER_IR_TGSI;
565
566 tgsi_scan_shader(ifs->state.tokens, &ifs->info);
567
568 /* The shader's compiled to i915 instructions here */
569 i915_translate_fragment_program(i915, ifs);
570
571 return ifs;
572 }
573
574 static void
i915_bind_fs_state(struct pipe_context * pipe,void * shader)575 i915_bind_fs_state(struct pipe_context *pipe, void *shader)
576 {
577 struct i915_context *i915 = i915_context(pipe);
578
579 if (i915->fs == shader)
580 return;
581
582 i915->fs = (struct i915_fragment_shader *)shader;
583
584 draw_bind_fragment_shader(i915->draw,
585 (i915->fs ? i915->fs->draw_data : NULL));
586
587 /* Tell draw if we need to do point sprites so we can get PNTC. */
588 if (i915->fs)
589 draw_wide_point_sprites(i915->draw, i915->fs->reads_pntc);
590
591 i915->dirty |= I915_NEW_FS;
592 }
593
594 static void
i915_delete_fs_state(struct pipe_context * pipe,void * shader)595 i915_delete_fs_state(struct pipe_context *pipe, void *shader)
596 {
597 struct i915_fragment_shader *ifs = (struct i915_fragment_shader *)shader;
598
599 ralloc_free(ifs->error);
600 FREE(ifs->program);
601 ifs->program = NULL;
602 FREE((struct tgsi_token *)ifs->state.tokens);
603 ifs->state.tokens = NULL;
604
605 ifs->program_len = 0;
606
607 FREE(ifs);
608 }
609
610 /* Does a test compile at link time to see if we'll be able to run this shader
611 * at runtime. Return a string to the GLSL compiler for anything we should
612 * report as link failure.
613 */
614 char *
i915_test_fragment_shader_compile(struct pipe_screen * screen,nir_shader * s)615 i915_test_fragment_shader_compile(struct pipe_screen *screen, nir_shader *s)
616 {
617 struct i915_fragment_shader *ifs = CALLOC_STRUCT(i915_fragment_shader);
618 if (!ifs)
619 return NULL;
620
621 /* NTT takes ownership of the shader, give it a clone. */
622 s = nir_shader_clone(NULL, s);
623
624 ifs->internal = s->info.internal;
625 ifs->state.tokens = nir_to_tgsi_options(s, screen, &ntt_options);
626 ifs->state.type = PIPE_SHADER_IR_TGSI;
627
628 tgsi_scan_shader(ifs->state.tokens, &ifs->info);
629
630 i915_translate_fragment_program(NULL, ifs);
631
632 char *msg = NULL;
633 if (ifs->error)
634 msg = strdup(ifs->error);
635
636 i915_delete_fs_state(NULL, ifs);
637
638 return msg;
639 }
640
641 static void *
i915_create_vs_state(struct pipe_context * pipe,const struct pipe_shader_state * templ)642 i915_create_vs_state(struct pipe_context *pipe,
643 const struct pipe_shader_state *templ)
644 {
645 struct i915_context *i915 = i915_context(pipe);
646
647 struct pipe_shader_state from_nir = {PIPE_SHADER_IR_TGSI};
648 if (templ->type == PIPE_SHADER_IR_NIR) {
649 nir_shader *s = templ->ir.nir;
650
651 NIR_PASS_V(s, nir_lower_point_size, 1.0, 255.0);
652
653 /* The gallivm draw path doesn't support non-native-integers NIR shaders,
654 * st/mesa does native-integers for the screen as a whole rather than
655 * per-stage, and i915 FS can't do native integers. So, convert to TGSI,
656 * where the draw path *does* support non-native-integers.
657 */
658 from_nir.tokens = nir_to_tgsi(s, pipe->screen);
659 templ = &from_nir;
660 }
661
662 return draw_create_vertex_shader(i915->draw, templ);
663 }
664
665 static void
i915_bind_vs_state(struct pipe_context * pipe,void * shader)666 i915_bind_vs_state(struct pipe_context *pipe, void *shader)
667 {
668 struct i915_context *i915 = i915_context(pipe);
669
670 if (i915->vs == shader)
671 return;
672
673 i915->vs = shader;
674
675 /* just pass-through to draw module */
676 draw_bind_vertex_shader(i915->draw, (struct draw_vertex_shader *)shader);
677
678 i915->dirty |= I915_NEW_VS;
679 }
680
681 static void
i915_delete_vs_state(struct pipe_context * pipe,void * shader)682 i915_delete_vs_state(struct pipe_context *pipe, void *shader)
683 {
684 struct i915_context *i915 = i915_context(pipe);
685
686 /* just pass-through to draw module */
687 draw_delete_vertex_shader(i915->draw, (struct draw_vertex_shader *)shader);
688 }
689
690 static void
i915_set_constant_buffer(struct pipe_context * pipe,enum pipe_shader_type shader,uint32_t index,bool take_ownership,const struct pipe_constant_buffer * cb)691 i915_set_constant_buffer(struct pipe_context *pipe,
692 enum pipe_shader_type shader, uint32_t index,
693 bool take_ownership,
694 const struct pipe_constant_buffer *cb)
695 {
696 struct i915_context *i915 = i915_context(pipe);
697 struct pipe_resource *buf = cb ? cb->buffer : NULL;
698 unsigned new_num = 0;
699 bool diff = true;
700
701 /* XXX don't support geom shaders now */
702 if (shader == PIPE_SHADER_GEOMETRY)
703 return;
704
705 if (cb && cb->user_buffer) {
706 buf = i915_user_buffer_create(pipe->screen, (void *)cb->user_buffer,
707 cb->buffer_size, PIPE_BIND_CONSTANT_BUFFER);
708 }
709
710 /* if we have a new buffer compare it with the old one */
711 if (buf) {
712 struct i915_buffer *ibuf = i915_buffer(buf);
713 struct pipe_resource *old_buf = i915->constants[shader];
714 struct i915_buffer *old = old_buf ? i915_buffer(old_buf) : NULL;
715 unsigned old_num = i915->current.num_user_constants[shader];
716
717 new_num = ibuf->b.width0 / 4 * sizeof(float);
718
719 if (old_num == new_num) {
720 if (old_num == 0)
721 diff = false;
722 #if 0
723 /* XXX no point in running this code since st/mesa only uses user buffers */
724 /* Can't compare the buffer data since they are userbuffers */
725 else if (old && old->free_on_destroy)
726 diff = memcmp(old->data, ibuf->data, ibuf->b.width0);
727 #else
728 (void)old;
729 #endif
730 }
731 } else {
732 diff = i915->current.num_user_constants[shader] != 0;
733 }
734
735 if (take_ownership) {
736 pipe_resource_reference(&i915->constants[shader], NULL);
737 i915->constants[shader] = buf;
738 } else {
739 pipe_resource_reference(&i915->constants[shader], buf);
740 }
741 i915->current.num_user_constants[shader] = new_num;
742
743 if (diff)
744 i915->dirty |= shader == PIPE_SHADER_VERTEX ? I915_NEW_VS_CONSTANTS
745 : I915_NEW_FS_CONSTANTS;
746
747 if (cb && cb->user_buffer) {
748 pipe_resource_reference(&buf, NULL);
749 }
750 }
751
752 static void
i915_set_sampler_views(struct pipe_context * pipe,enum pipe_shader_type shader,unsigned start,unsigned num,unsigned unbind_num_trailing_slots,bool take_ownership,struct pipe_sampler_view ** views)753 i915_set_sampler_views(struct pipe_context *pipe, enum pipe_shader_type shader,
754 unsigned start, unsigned num,
755 unsigned unbind_num_trailing_slots, bool take_ownership,
756 struct pipe_sampler_view **views)
757 {
758 if (shader != PIPE_SHADER_FRAGMENT) {
759 /* No support for VS samplers, because it would mean accessing the
760 * write-combined maps of the textures, which is very slow. VS samplers
761 * are not a required feature of GL2.1 or GLES2.
762 */
763 assert(num == 0);
764 return;
765 }
766 struct i915_context *i915 = i915_context(pipe);
767 uint32_t i;
768
769 assert(num <= PIPE_MAX_SAMPLERS);
770
771 /* Check for no-op */
772 if (views && num == i915->num_fragment_sampler_views &&
773 !memcmp(i915->fragment_sampler_views, views,
774 num * sizeof(struct pipe_sampler_view *))) {
775 if (take_ownership) {
776 for (unsigned i = 0; i < num; i++) {
777 struct pipe_sampler_view *view = views[i];
778 pipe_sampler_view_reference(&view, NULL);
779 }
780 }
781 return;
782 }
783
784 for (i = 0; i < num; i++) {
785 if (take_ownership) {
786 pipe_sampler_view_reference(&i915->fragment_sampler_views[i], NULL);
787 i915->fragment_sampler_views[i] = views[i];
788 } else {
789 pipe_sampler_view_reference(&i915->fragment_sampler_views[i],
790 views[i]);
791 }
792 }
793
794 for (i = num; i < i915->num_fragment_sampler_views; i++)
795 pipe_sampler_view_reference(&i915->fragment_sampler_views[i], NULL);
796
797 i915->num_fragment_sampler_views = num;
798
799 i915->dirty |= I915_NEW_SAMPLER_VIEW;
800 }
801
802 struct pipe_sampler_view *
i915_create_sampler_view_custom(struct pipe_context * pipe,struct pipe_resource * texture,const struct pipe_sampler_view * templ,unsigned width0,unsigned height0)803 i915_create_sampler_view_custom(struct pipe_context *pipe,
804 struct pipe_resource *texture,
805 const struct pipe_sampler_view *templ,
806 unsigned width0, unsigned height0)
807 {
808 struct pipe_sampler_view *view = CALLOC_STRUCT(pipe_sampler_view);
809
810 if (view) {
811 *view = *templ;
812 view->reference.count = 1;
813 view->texture = NULL;
814 pipe_resource_reference(&view->texture, texture);
815 view->context = pipe;
816 }
817
818 return view;
819 }
820
821 static struct pipe_sampler_view *
i915_create_sampler_view(struct pipe_context * pipe,struct pipe_resource * texture,const struct pipe_sampler_view * templ)822 i915_create_sampler_view(struct pipe_context *pipe,
823 struct pipe_resource *texture,
824 const struct pipe_sampler_view *templ)
825 {
826 struct pipe_sampler_view *view = CALLOC_STRUCT(pipe_sampler_view);
827
828 if (view) {
829 *view = *templ;
830 view->reference.count = 1;
831 view->texture = NULL;
832 pipe_resource_reference(&view->texture, texture);
833 view->context = pipe;
834 }
835
836 return view;
837 }
838
839 static void
i915_sampler_view_destroy(struct pipe_context * pipe,struct pipe_sampler_view * view)840 i915_sampler_view_destroy(struct pipe_context *pipe,
841 struct pipe_sampler_view *view)
842 {
843 pipe_resource_reference(&view->texture, NULL);
844 FREE(view);
845 }
846
847 static void
i915_set_framebuffer_state(struct pipe_context * pipe,const struct pipe_framebuffer_state * fb)848 i915_set_framebuffer_state(struct pipe_context *pipe,
849 const struct pipe_framebuffer_state *fb)
850 {
851 struct i915_context *i915 = i915_context(pipe);
852
853 util_copy_framebuffer_state(&i915->framebuffer, fb);
854 if (fb->nr_cbufs) {
855 struct i915_surface *surf = i915_surface(i915->framebuffer.cbufs[0]);
856 if (i915->current.fixup_swizzle != surf->oc_swizzle) {
857 i915->current.fixup_swizzle = surf->oc_swizzle;
858 memcpy(i915->current.color_swizzle, surf->color_swizzle,
859 sizeof(surf->color_swizzle));
860 i915->dirty |= I915_NEW_COLOR_SWIZZLE;
861 }
862 }
863 if (fb->zsbuf)
864 draw_set_zs_format(i915->draw, fb->zsbuf->format);
865
866 i915->dirty |= I915_NEW_FRAMEBUFFER;
867 }
868
869 static void
i915_set_clip_state(struct pipe_context * pipe,const struct pipe_clip_state * clip)870 i915_set_clip_state(struct pipe_context *pipe,
871 const struct pipe_clip_state *clip)
872 {
873 struct i915_context *i915 = i915_context(pipe);
874
875 i915->clip = *clip;
876
877 draw_set_clip_state(i915->draw, clip);
878
879 i915->dirty |= I915_NEW_CLIP;
880 }
881
882 /* Called when gallium frontends notice changes to the viewport
883 * matrix:
884 */
885 static void
i915_set_viewport_states(struct pipe_context * pipe,unsigned start_slot,unsigned num_viewports,const struct pipe_viewport_state * viewport)886 i915_set_viewport_states(struct pipe_context *pipe, unsigned start_slot,
887 unsigned num_viewports,
888 const struct pipe_viewport_state *viewport)
889 {
890 struct i915_context *i915 = i915_context(pipe);
891
892 i915->viewport = *viewport; /* struct copy */
893
894 /* pass the viewport info to the draw module */
895 draw_set_viewport_states(i915->draw, start_slot, num_viewports,
896 &i915->viewport);
897
898 i915->dirty |= I915_NEW_VIEWPORT;
899 }
900
901 static void *
i915_create_rasterizer_state(struct pipe_context * pipe,const struct pipe_rasterizer_state * rasterizer)902 i915_create_rasterizer_state(struct pipe_context *pipe,
903 const struct pipe_rasterizer_state *rasterizer)
904 {
905 struct i915_rasterizer_state *cso = CALLOC_STRUCT(i915_rasterizer_state);
906
907 cso->templ = *rasterizer;
908 cso->light_twoside = rasterizer->light_twoside;
909 cso->ds[0].u = _3DSTATE_DEPTH_OFFSET_SCALE;
910 cso->ds[1].f = rasterizer->offset_scale;
911 if (rasterizer->poly_stipple_enable) {
912 cso->st |= ST1_ENABLE;
913 }
914
915 if (rasterizer->scissor)
916 cso->sc[0] = _3DSTATE_SCISSOR_ENABLE_CMD | ENABLE_SCISSOR_RECT;
917 else
918 cso->sc[0] = _3DSTATE_SCISSOR_ENABLE_CMD | DISABLE_SCISSOR_RECT;
919
920 switch (rasterizer->cull_face) {
921 case PIPE_FACE_NONE:
922 cso->LIS4 |= S4_CULLMODE_NONE;
923 break;
924 case PIPE_FACE_FRONT:
925 if (rasterizer->front_ccw)
926 cso->LIS4 |= S4_CULLMODE_CCW;
927 else
928 cso->LIS4 |= S4_CULLMODE_CW;
929 break;
930 case PIPE_FACE_BACK:
931 if (rasterizer->front_ccw)
932 cso->LIS4 |= S4_CULLMODE_CW;
933 else
934 cso->LIS4 |= S4_CULLMODE_CCW;
935 break;
936 case PIPE_FACE_FRONT_AND_BACK:
937 cso->LIS4 |= S4_CULLMODE_BOTH;
938 break;
939 }
940
941 {
942 int line_width = CLAMP((int)(rasterizer->line_width * 2), 1, 0xf);
943
944 cso->LIS4 |= line_width << S4_LINE_WIDTH_SHIFT;
945
946 if (rasterizer->line_smooth)
947 cso->LIS4 |= S4_LINE_ANTIALIAS_ENABLE;
948 }
949
950 {
951 int point_size = CLAMP((int)rasterizer->point_size, 1, 0xff);
952
953 cso->LIS4 |= point_size << S4_POINT_WIDTH_SHIFT;
954 }
955
956 if (rasterizer->flatshade) {
957 cso->LIS4 |=
958 (S4_FLATSHADE_ALPHA | S4_FLATSHADE_COLOR | S4_FLATSHADE_SPECULAR);
959 }
960
961 if (!rasterizer->flatshade_first)
962 cso->LIS6 |= (2 << S6_TRISTRIP_PV_SHIFT);
963
964 cso->LIS7 = fui(rasterizer->offset_units);
965
966 return cso;
967 }
968
969 static void
i915_bind_rasterizer_state(struct pipe_context * pipe,void * raster)970 i915_bind_rasterizer_state(struct pipe_context *pipe, void *raster)
971 {
972 struct i915_context *i915 = i915_context(pipe);
973
974 if (i915->rasterizer == raster)
975 return;
976
977 i915->rasterizer = (struct i915_rasterizer_state *)raster;
978
979 /* pass-through to draw module */
980 draw_set_rasterizer_state(
981 i915->draw, (i915->rasterizer ? &(i915->rasterizer->templ) : NULL),
982 raster);
983
984 i915->dirty |= I915_NEW_RASTERIZER;
985 }
986
/* Destroy a rasterizer state object by handing its memory to FREE(). */
static void
i915_delete_rasterizer_state(struct pipe_context *pipe, void *raster)
{
   (void)pipe; /* the context is not needed to release the object */

   FREE(raster);
}
992
993 static void
i915_set_vertex_buffers(struct pipe_context * pipe,unsigned count,const struct pipe_vertex_buffer * buffers)994 i915_set_vertex_buffers(struct pipe_context *pipe, unsigned count,
995 const struct pipe_vertex_buffer *buffers)
996 {
997 struct i915_context *i915 = i915_context(pipe);
998 struct draw_context *draw = i915->draw;
999
1000 util_set_vertex_buffers_count(i915->vertex_buffers, &i915->nr_vertex_buffers,
1001 buffers, count, true);
1002
1003 /* pass-through to draw module */
1004 draw_set_vertex_buffers(draw, count, buffers);
1005 }
1006
1007 static void *
i915_create_vertex_elements_state(struct pipe_context * pipe,unsigned count,const struct pipe_vertex_element * attribs)1008 i915_create_vertex_elements_state(struct pipe_context *pipe, unsigned count,
1009 const struct pipe_vertex_element *attribs)
1010 {
1011 struct i915_velems_state *velems;
1012 assert(count <= PIPE_MAX_ATTRIBS);
1013 velems =
1014 (struct i915_velems_state *)MALLOC(sizeof(struct i915_velems_state));
1015 if (velems) {
1016 velems->count = count;
1017 memcpy(velems->velem, attribs, sizeof(*attribs) * count);
1018 }
1019 return velems;
1020 }
1021
1022 static void
i915_bind_vertex_elements_state(struct pipe_context * pipe,void * velems)1023 i915_bind_vertex_elements_state(struct pipe_context *pipe, void *velems)
1024 {
1025 struct i915_context *i915 = i915_context(pipe);
1026 struct i915_velems_state *i915_velems = (struct i915_velems_state *)velems;
1027
1028 if (i915->velems == velems)
1029 return;
1030
1031 i915->velems = velems;
1032
1033 /* pass-through to draw module */
1034 if (i915_velems) {
1035 draw_set_vertex_elements(i915->draw, i915_velems->count,
1036 i915_velems->velem);
1037 }
1038 }
1039
/* Destroy a vertex-elements state object by handing its memory to FREE(). */
static void
i915_delete_vertex_elements_state(struct pipe_context *pipe, void *velems)
{
   (void)pipe; /* the context is not needed to release the object */

   FREE(velems);
}
1045
/* Sample-mask hook.  This is a no-op: the mask is accepted and ignored. */
static void
i915_set_sample_mask(struct pipe_context *pipe, unsigned sample_mask)
{
   (void)pipe;
   (void)sample_mask;
}
1050
1051 void
i915_init_state_functions(struct i915_context * i915)1052 i915_init_state_functions(struct i915_context *i915)
1053 {
1054 i915->base.create_blend_state = i915_create_blend_state;
1055 i915->base.bind_blend_state = i915_bind_blend_state;
1056 i915->base.delete_blend_state = i915_delete_blend_state;
1057
1058 i915->base.create_sampler_state = i915_create_sampler_state;
1059 i915->base.bind_sampler_states = i915_bind_sampler_states;
1060 i915->base.delete_sampler_state = i915_delete_sampler_state;
1061
1062 i915->base.create_depth_stencil_alpha_state =
1063 i915_create_depth_stencil_state;
1064 i915->base.bind_depth_stencil_alpha_state = i915_bind_depth_stencil_state;
1065 i915->base.delete_depth_stencil_alpha_state =
1066 i915_delete_depth_stencil_state;
1067
1068 i915->base.create_rasterizer_state = i915_create_rasterizer_state;
1069 i915->base.bind_rasterizer_state = i915_bind_rasterizer_state;
1070 i915->base.delete_rasterizer_state = i915_delete_rasterizer_state;
1071 i915->base.create_fs_state = i915_create_fs_state;
1072 i915->base.bind_fs_state = i915_bind_fs_state;
1073 i915->base.delete_fs_state = i915_delete_fs_state;
1074 i915->base.create_vs_state = i915_create_vs_state;
1075 i915->base.bind_vs_state = i915_bind_vs_state;
1076 i915->base.delete_vs_state = i915_delete_vs_state;
1077 i915->base.create_vertex_elements_state = i915_create_vertex_elements_state;
1078 i915->base.bind_vertex_elements_state = i915_bind_vertex_elements_state;
1079 i915->base.delete_vertex_elements_state = i915_delete_vertex_elements_state;
1080
1081 i915->base.set_blend_color = i915_set_blend_color;
1082 i915->base.set_stencil_ref = i915_set_stencil_ref;
1083 i915->base.set_clip_state = i915_set_clip_state;
1084 i915->base.set_sample_mask = i915_set_sample_mask;
1085 i915->base.set_constant_buffer = i915_set_constant_buffer;
1086 i915->base.set_framebuffer_state = i915_set_framebuffer_state;
1087
1088 i915->base.set_polygon_stipple = i915_set_polygon_stipple;
1089 i915->base.set_scissor_states = i915_set_scissor_states;
1090 i915->base.set_sampler_views = i915_set_sampler_views;
1091 i915->base.create_sampler_view = i915_create_sampler_view;
1092 i915->base.sampler_view_destroy = i915_sampler_view_destroy;
1093 i915->base.set_viewport_states = i915_set_viewport_states;
1094 i915->base.set_vertex_buffers = i915_set_vertex_buffers;
1095 }
1096