• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21  * SOFTWARE.
22  *
23  * Authors:
24  *    Rob Clark <robclark@freedesktop.org>
25  *    Jonathan Marek <jonathan@marek.ca>
26  */
27 
28 #include "pipe/p_state.h"
29 #include "util/u_string.h"
30 #include "util/u_memory.h"
31 #include "util/u_inlines.h"
32 #include "util/format/u_format.h"
33 #include "tgsi/tgsi_dump.h"
34 #include "tgsi/tgsi_parse.h"
35 #include "nir/tgsi_to_nir.h"
36 
37 #include "freedreno_program.h"
38 
39 #include "ir2.h"
40 #include "fd2_program.h"
41 #include "fd2_texture.h"
42 #include "fd2_util.h"
43 #include "ir2/instr-a2xx.h"
44 
45 static struct fd2_shader_stateobj *
create_shader(struct pipe_context * pctx,gl_shader_stage type)46 create_shader(struct pipe_context *pctx, gl_shader_stage type)
47 {
48 	struct fd2_shader_stateobj *so = CALLOC_STRUCT(fd2_shader_stateobj);
49 	if (!so)
50 		return NULL;
51 	so->type = type;
52 	so->is_a20x = is_a20x(fd_context(pctx)->screen);
53 	return so;
54 }
55 
56 static void
delete_shader(struct fd2_shader_stateobj * so)57 delete_shader(struct fd2_shader_stateobj *so)
58 {
59 	if (!so)
60 		return;
61 	ralloc_free(so->nir);
62 	for (int i = 0; i < ARRAY_SIZE(so->variant); i++)
63 		free(so->variant[i].info.dwords);
64 	free(so);
65 }
66 
67 static void
emit(struct fd_ringbuffer * ring,gl_shader_stage type,struct ir2_shader_info * info,struct util_dynarray * patches)68 emit(struct fd_ringbuffer *ring, gl_shader_stage type,
69 	struct ir2_shader_info *info, struct util_dynarray *patches)
70 {
71 	unsigned i;
72 
73 	assert(info->sizedwords);
74 
75 	OUT_PKT3(ring, CP_IM_LOAD_IMMEDIATE, 2 + info->sizedwords);
76 	OUT_RING(ring, type == MESA_SHADER_FRAGMENT);
77 	OUT_RING(ring, info->sizedwords);
78 
79 	if (patches)
80 		util_dynarray_append(patches, uint32_t*, &ring->cur[info->mem_export_ptr]);
81 
82 	for (i = 0; i < info->sizedwords; i++)
83 		OUT_RING(ring, info->dwords[i]);
84 }
85 
/*
 * Type-size callback handed to nir_lower_io: reports the size of a GLSL
 * type as its attribute slot count.  'bindless' is part of the callback
 * signature but is not consulted.
 */
static int
ir2_glsl_type_size(const struct glsl_type *type, bool bindless)
{
	(void)bindless;

	const int slots = glsl_count_attribute_slots(type, false);
	return slots;
}
91 
92 static void *
fd2_fp_state_create(struct pipe_context * pctx,const struct pipe_shader_state * cso)93 fd2_fp_state_create(struct pipe_context *pctx,
94 		const struct pipe_shader_state *cso)
95 {
96 	struct fd2_shader_stateobj *so = create_shader(pctx, MESA_SHADER_FRAGMENT);
97 	if (!so)
98 		return NULL;
99 
100 	so->nir = (cso->type == PIPE_SHADER_IR_NIR) ? cso->ir.nir :
101 		tgsi_to_nir(cso->tokens, pctx->screen, false);
102 
103 	NIR_PASS_V(so->nir, nir_lower_io,
104 	           nir_var_shader_in | nir_var_shader_out,
105 	           ir2_glsl_type_size, (nir_lower_io_options)0);
106 
107 	if (ir2_optimize_nir(so->nir, true))
108 		goto fail;
109 
110 	so->first_immediate = so->nir->num_uniforms;
111 
112 	ir2_compile(so, 0, NULL);
113 
114 	ralloc_free(so->nir);
115 	so->nir = NULL;
116 	return so;
117 
118 fail:
119 	delete_shader(so);
120 	return NULL;
121 }
122 
/*
 * pipe_context::delete_fs_state hook: 'hwcso' is the object returned by
 * fd2_fp_state_create(); hand it to delete_shader().
 */
static void
fd2_fp_state_delete(struct pipe_context *pctx, void *hwcso)
{
	struct fd2_shader_stateobj *fs = hwcso;

	(void)pctx;
	delete_shader(fs);
}
129 
130 static void *
fd2_vp_state_create(struct pipe_context * pctx,const struct pipe_shader_state * cso)131 fd2_vp_state_create(struct pipe_context *pctx,
132 		const struct pipe_shader_state *cso)
133 {
134 	struct fd2_shader_stateobj *so = create_shader(pctx, MESA_SHADER_VERTEX);
135 	if (!so)
136 		return NULL;
137 
138 	so->nir = (cso->type == PIPE_SHADER_IR_NIR) ? cso->ir.nir :
139 		tgsi_to_nir(cso->tokens, pctx->screen, false);
140 
141 	NIR_PASS_V(so->nir, nir_lower_io,
142 	           nir_var_shader_in | nir_var_shader_out,
143 	           ir2_glsl_type_size, (nir_lower_io_options)0);
144 
145 	if (ir2_optimize_nir(so->nir, true))
146 		goto fail;
147 
148 	so->first_immediate = so->nir->num_uniforms;
149 
150 	/* compile binning variant now */
151 	ir2_compile(so, 0, NULL);
152 
153 	return so;
154 
155 fail:
156 	delete_shader(so);
157 	return NULL;
158 }
159 
/*
 * pipe_context::delete_vs_state hook: 'hwcso' is the object returned by
 * fd2_vp_state_create(); hand it to delete_shader().
 */
static void
fd2_vp_state_delete(struct pipe_context *pctx, void *hwcso)
{
	struct fd2_shader_stateobj *vs = hwcso;

	(void)pctx;
	delete_shader(vs);
}
166 
167 static void
patch_vtx_fetch(struct fd_context * ctx,struct pipe_vertex_element * elem,instr_fetch_vtx_t * instr,uint16_t dst_swiz)168 patch_vtx_fetch(struct fd_context *ctx, struct pipe_vertex_element *elem,
169 	instr_fetch_vtx_t *instr, uint16_t dst_swiz)
170 {
171 	struct surface_format fmt = fd2_pipe2surface(elem->src_format);
172 
173 	instr->dst_swiz = fd2_vtx_swiz(elem->src_format, dst_swiz);
174 	instr->format_comp_all = fmt.sign == SQ_TEX_SIGN_SIGNED;
175 	instr->num_format_all = fmt.num_format;
176 	instr->format = fmt.format;
177 	instr->exp_adjust_all = fmt.exp_adjust;
178 	instr->stride = ctx->vtx.vertexbuf.vb[elem->vertex_buffer_index].stride;
179 	instr->offset = elem->src_offset;
180 }
181 
182 static void
patch_fetches(struct fd_context * ctx,struct ir2_shader_info * info,struct fd_vertex_stateobj * vtx,struct fd_texture_stateobj * tex)183 patch_fetches(struct fd_context *ctx, struct ir2_shader_info *info,
184 	struct fd_vertex_stateobj *vtx, struct fd_texture_stateobj *tex)
185 {
186 	for (int i = 0; i < info->num_fetch_instrs; i++) {
187 		struct ir2_fetch_info *fi = &info->fetch_info[i];
188 
189 		instr_fetch_t *instr = (instr_fetch_t*) &info->dwords[fi->offset];
190 		if (instr->opc == VTX_FETCH) {
191 			unsigned idx = (instr->vtx.const_index - 20) * 3 +
192 				instr->vtx.const_index_sel;
193 			patch_vtx_fetch(ctx, &vtx->pipe[idx], &instr->vtx, fi->vtx.dst_swiz);
194 			continue;
195 		}
196 
197 		assert(instr->opc == TEX_FETCH);
198 		instr->tex.const_idx = fd2_get_const_idx(ctx, tex, fi->tex.samp_id);
199 		instr->tex.src_swiz = fi->tex.src_swiz;
200 	}
201 }
202 
203 void
fd2_program_emit(struct fd_context * ctx,struct fd_ringbuffer * ring,struct fd_program_stateobj * prog)204 fd2_program_emit(struct fd_context *ctx, struct fd_ringbuffer *ring,
205 		struct fd_program_stateobj *prog)
206 {
207 	struct fd2_shader_stateobj *fp = NULL, *vp;
208 	struct ir2_shader_info *fpi, *vpi;
209 	struct ir2_frag_linkage *f;
210 	uint8_t vs_gprs, fs_gprs = 0, vs_export = 0;
211 	enum a2xx_sq_ps_vtx_mode mode = POSITION_1_VECTOR;
212 	bool binning = (ctx->batch && ring == ctx->batch->binning);
213 	unsigned variant = 0;
214 
215 	vp = prog->vs;
216 
217 	/* find variant matching the linked fragment shader */
218 	if (!binning) {
219 		fp = prog->fs;
220 		for (variant = 1; variant < ARRAY_SIZE(vp->variant); variant++) {
221 			/* if checked all variants, compile a new variant */
222 			if (!vp->variant[variant].info.sizedwords) {
223 				ir2_compile(vp, variant, fp);
224 				break;
225 			}
226 
227 			/* check if fragment shader linkage matches */
228 			if (!memcmp(&vp->variant[variant].f, &fp->variant[0].f,
229 					sizeof(struct ir2_frag_linkage)))
230 				break;
231 		}
232 		assert(variant < ARRAY_SIZE(vp->variant));
233 	}
234 
235 	vpi = &vp->variant[variant].info;
236 	fpi = &fp->variant[0].info;
237 	f = &fp->variant[0].f;
238 
239 	/* clear/gmem2mem/mem2gmem need to be changed to remove this condition */
240 	if (prog != &ctx->solid_prog && prog != &ctx->blit_prog[0]) {
241 		patch_fetches(ctx, vpi, ctx->vtx.vtx, &ctx->tex[PIPE_SHADER_VERTEX]);
242 		if (fp)
243 			patch_fetches(ctx, fpi, NULL, &ctx->tex[PIPE_SHADER_FRAGMENT]);
244 	}
245 
246 	emit(ring, MESA_SHADER_VERTEX, vpi,
247 		binning ? &ctx->batch->shader_patches : NULL);
248 
249 	if (fp) {
250 		emit(ring, MESA_SHADER_FRAGMENT, fpi, NULL);
251 		fs_gprs = (fpi->max_reg < 0) ? 0x80 : fpi->max_reg;
252 		vs_export = MAX2(1, f->inputs_count) - 1;
253 	}
254 
255 	vs_gprs = (vpi->max_reg < 0) ? 0x80 : vpi->max_reg;
256 
257 	if (vp->writes_psize && !binning)
258 		mode = POSITION_2_VECTORS_SPRITE;
259 
260 	/* set register to use for param (fragcoord/pointcoord/frontfacing) */
261 	OUT_PKT3(ring, CP_SET_CONSTANT, 2);
262 	OUT_RING(ring, CP_REG(REG_A2XX_SQ_CONTEXT_MISC));
263 	OUT_RING(ring, A2XX_SQ_CONTEXT_MISC_SC_SAMPLE_CNTL(CENTERS_ONLY) |
264 		COND(fp, A2XX_SQ_CONTEXT_MISC_PARAM_GEN_POS(f->inputs_count)) |
265 		/* we need SCREEN_XY for both fragcoord and frontfacing */
266 		A2XX_SQ_CONTEXT_MISC_SC_OUTPUT_SCREEN_XY);
267 
268 	OUT_PKT3(ring, CP_SET_CONSTANT, 2);
269 	OUT_RING(ring, CP_REG(REG_A2XX_SQ_PROGRAM_CNTL));
270 	OUT_RING(ring, A2XX_SQ_PROGRAM_CNTL_PS_EXPORT_MODE(2) |
271 			A2XX_SQ_PROGRAM_CNTL_VS_EXPORT_MODE(mode) |
272 			A2XX_SQ_PROGRAM_CNTL_VS_RESOURCE |
273 			A2XX_SQ_PROGRAM_CNTL_PS_RESOURCE |
274 			A2XX_SQ_PROGRAM_CNTL_VS_EXPORT_COUNT(vs_export) |
275 			A2XX_SQ_PROGRAM_CNTL_PS_REGS(fs_gprs) |
276 			A2XX_SQ_PROGRAM_CNTL_VS_REGS(vs_gprs) |
277 			COND(fp && fp->need_param, A2XX_SQ_PROGRAM_CNTL_PARAM_GEN) |
278 			COND(!fp, A2XX_SQ_PROGRAM_CNTL_GEN_INDEX_VTX));
279 }
280 
281 void
fd2_prog_init(struct pipe_context * pctx)282 fd2_prog_init(struct pipe_context *pctx)
283 {
284 	struct fd_context *ctx = fd_context(pctx);
285 	struct fd_program_stateobj *prog;
286 	struct fd2_shader_stateobj *so;
287 	struct ir2_shader_info *info;
288 	instr_fetch_vtx_t *instr;
289 
290 	pctx->create_fs_state = fd2_fp_state_create;
291 	pctx->delete_fs_state = fd2_fp_state_delete;
292 
293 	pctx->create_vs_state = fd2_vp_state_create;
294 	pctx->delete_vs_state = fd2_vp_state_delete;
295 
296 	fd_prog_init(pctx);
297 
298 	/* XXX maybe its possible to reuse patch_vtx_fetch somehow? */
299 
300 	prog = &ctx->solid_prog;
301 	so = prog->vs;
302 	ir2_compile(prog->vs, 1, prog->fs);
303 
304 #define IR2_FETCH_SWIZ_XY01 0xb08
305 #define IR2_FETCH_SWIZ_XYZ1 0xa88
306 
307 	info = &so->variant[1].info;
308 
309 	instr = (instr_fetch_vtx_t*) &info->dwords[info->fetch_info[0].offset];
310 	instr->const_index = 26;
311 	instr->const_index_sel = 0;
312 	instr->format = FMT_32_32_32_FLOAT;
313 	instr->format_comp_all = false;
314 	instr->stride = 12;
315 	instr->num_format_all = true;
316 	instr->dst_swiz = IR2_FETCH_SWIZ_XYZ1;
317 
318 	prog = &ctx->blit_prog[0];
319 	so = prog->vs;
320 	ir2_compile(prog->vs, 1, prog->fs);
321 
322 	info = &so->variant[1].info;
323 
324 	instr = (instr_fetch_vtx_t*) &info->dwords[info->fetch_info[0].offset];
325 	instr->const_index = 26;
326 	instr->const_index_sel = 1;
327 	instr->format = FMT_32_32_FLOAT;
328 	instr->format_comp_all = false;
329 	instr->stride = 8;
330 	instr->num_format_all = false;
331 	instr->dst_swiz = IR2_FETCH_SWIZ_XY01;
332 
333 	instr = (instr_fetch_vtx_t*) &info->dwords[info->fetch_info[1].offset];
334 	instr->const_index = 26;
335 	instr->const_index_sel = 0;
336 	instr->format = FMT_32_32_32_FLOAT;
337 	instr->format_comp_all = false;
338 	instr->stride = 12;
339 	instr->num_format_all = false;
340 	instr->dst_swiz = IR2_FETCH_SWIZ_XYZ1;
341 }
342