1 /**************************************************************************
2 *
3 * Copyright 2003 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 #include "pipe/p_context.h"
29 #include "pipe/p_state.h"
30
31 #include "i915_context.h"
32 #include "i915_reg.h"
33 #include "i915_resource.h"
34 #include "i915_state.h"
35 #include "i915_state_inlines.h"
36
37 /*
38 * A note about min_lod & max_lod.
39 *
40 * There is a circular dependancy between the sampler state
41 * and the map state to be submitted to hw.
42 *
43 * Two condition must be meet:
44 * min_lod =< max_lod == true
45 * max_lod =< last_level == true
46 *
47 *
48 * This is all fine and dandy if it were for the fact that max_lod
49 * is set on the map state instead of the sampler state. That is
50 * the max_lod we submit on map is:
51 * max_lod = MIN2(last_level, max_lod);
52 *
53 * So we need to update the map state when we change samplers and
54 * we need to change the sampler state when map state is changed.
55 * The first part is done by calling update_texture in update_samplers
56 * and the second part is done else where in code tracking the state
57 * changes.
58 */
59
60 /***********************************************************************
61 * Samplers
62 */
63
64 /**
65 * Compute i915 texture sampling state.
66 *
67 * Recalculate all state from scratch. Perhaps not the most
68 * efficient, but this has gotten complex enough that we need
69 * something which is understandable and reliable.
70 * \param state returns the 3 words of compute state
71 */
72 static void
update_sampler(struct i915_context * i915,uint32_t unit,const struct i915_sampler_state * sampler,const struct i915_texture * tex,unsigned state[3])73 update_sampler(struct i915_context *i915, uint32_t unit,
74 const struct i915_sampler_state *sampler,
75 const struct i915_texture *tex, unsigned state[3])
76 {
77 const struct pipe_resource *pt = &tex->b;
78 unsigned minlod, lastlod;
79
80 state[0] = sampler->state[0];
81 state[1] = sampler->state[1];
82 state[2] = sampler->state[2];
83
84 if (pt->format == PIPE_FORMAT_UYVY || pt->format == PIPE_FORMAT_YUYV)
85 state[0] |= SS2_COLORSPACE_CONVERSION;
86
87 if (util_format_is_srgb(pt->format)) {
88 state[0] |= SS2_REVERSE_GAMMA_ENABLE;
89 }
90
91 /* There is no HW support for 1D textures, so we just make them 2D textures
92 * with h=1, but that means we need to make the Y coordinate not contribute
93 * to bringing any border color in. Clearing it sets it to WRAP.
94 */
95 if (pt->target == PIPE_TEXTURE_1D) {
96 state[1] &= ~SS3_TCY_ADDR_MODE_MASK;
97 }
98
99 /* The GLES2 spec says textures are incomplete (return 0,0,0,1) if:
100 *
101 * "A cube map sampler is called, any of the corresponding texture images are
102 * non-power-of-two images, and either the texture wrap mode is not
103 * CLAMP_TO_EDGE, or the minification filter is neither NEAREST nor LINEAR."
104 *
105 * while the i915 spec says:
106 *
107 * "When using cube map texture coordinates, only TEXCOORDMODE_CLAMP and *
108 * TEXCOORDMODE_CUBE settings are valid, and each TC component must have the
109 * same Address Control mode. TEXCOORDMODE_CUBE is not valid unless the
110 * width and height of the cube map are power-of-2."
111 *
112 * We don't expose support for the seamless cube map extension, so always use
113 * edge clamping.
114 */
115 if (pt->target == PIPE_TEXTURE_CUBE) {
116 state[1] &= ~(SS3_TCX_ADDR_MODE_MASK | SS3_TCY_ADDR_MODE_MASK |
117 SS3_TCZ_ADDR_MODE_MASK);
118 state[1] |= (TEXCOORDMODE_CLAMP_EDGE << SS3_TCX_ADDR_MODE_SHIFT);
119 state[1] |= (TEXCOORDMODE_CLAMP_EDGE << SS3_TCY_ADDR_MODE_SHIFT);
120 state[1] |= (TEXCOORDMODE_CLAMP_EDGE << SS3_TCZ_ADDR_MODE_SHIFT);
121 }
122
123 /* 3D textures don't seem to respect the border color.
124 * Fallback if there's ever a danger that they might refer to
125 * it.
126 *
127 * Effectively this means fallback on 3D clamp or
128 * clamp_to_border.
129 *
130 * XXX: Check if this is true on i945.
131 * XXX: Check if this bug got fixed in release silicon.
132 */
133 #if 0
134 {
135 const unsigned ws = sampler->templ->wrap_s;
136 const unsigned wt = sampler->templ->wrap_t;
137 const unsigned wr = sampler->templ->wrap_r;
138 if (pt->target == PIPE_TEXTURE_3D &&
139 (sampler->templ->min_img_filter != PIPE_TEX_FILTER_NEAREST ||
140 sampler->templ->mag_img_filter != PIPE_TEX_FILTER_NEAREST) &&
141 (ws == PIPE_TEX_WRAP_CLAMP ||
142 wt == PIPE_TEX_WRAP_CLAMP ||
143 wr == PIPE_TEX_WRAP_CLAMP ||
144 ws == PIPE_TEX_WRAP_CLAMP_TO_BORDER ||
145 wt == PIPE_TEX_WRAP_CLAMP_TO_BORDER ||
146 wr == PIPE_TEX_WRAP_CLAMP_TO_BORDER)) {
147 if (i915->conformance_mode > 0) {
148 assert(0);
149 /* sampler->fallback = true; */
150 /* TODO */
151 }
152 }
153 }
154 #endif
155
156 /* See note at the top of file */
157 minlod = sampler->minlod;
158 lastlod = pt->last_level << 4;
159
160 if (lastlod < minlod) {
161 minlod = lastlod;
162 }
163
164 state[1] |= (sampler->minlod << SS3_MIN_LOD_SHIFT);
165 state[1] |= (unit << SS3_TEXTUREMAP_INDEX_SHIFT);
166 }
167
168 /***********************************************************************
169 * Sampler views
170 */
171
172 static uint32_t
translate_texture_format(enum pipe_format pipeFormat,const struct pipe_sampler_view * view)173 translate_texture_format(enum pipe_format pipeFormat,
174 const struct pipe_sampler_view *view)
175 {
176 if ((view->swizzle_r != PIPE_SWIZZLE_X ||
177 view->swizzle_g != PIPE_SWIZZLE_Y ||
178 view->swizzle_b != PIPE_SWIZZLE_Z ||
179 view->swizzle_a != PIPE_SWIZZLE_W) &&
180 pipeFormat != PIPE_FORMAT_Z24_UNORM_S8_UINT &&
181 pipeFormat != PIPE_FORMAT_Z24X8_UNORM)
182 debug_printf("i915: unsupported texture swizzle for format %d\n",
183 pipeFormat);
184
185 switch (pipeFormat) {
186 case PIPE_FORMAT_L8_UNORM:
187 return MAPSURF_8BIT | MT_8BIT_L8;
188 case PIPE_FORMAT_I8_UNORM:
189 return MAPSURF_8BIT | MT_8BIT_I8;
190 case PIPE_FORMAT_A8_UNORM:
191 return MAPSURF_8BIT | MT_8BIT_A8;
192 case PIPE_FORMAT_L8A8_UNORM:
193 return MAPSURF_16BIT | MT_16BIT_AY88;
194 case PIPE_FORMAT_B5G6R5_UNORM:
195 return MAPSURF_16BIT | MT_16BIT_RGB565;
196 case PIPE_FORMAT_B5G5R5A1_UNORM:
197 return MAPSURF_16BIT | MT_16BIT_ARGB1555;
198 case PIPE_FORMAT_B4G4R4A4_UNORM:
199 return MAPSURF_16BIT | MT_16BIT_ARGB4444;
200 case PIPE_FORMAT_B10G10R10A2_UNORM:
201 return MAPSURF_32BIT | MT_32BIT_ARGB2101010;
202 case PIPE_FORMAT_B8G8R8A8_UNORM:
203 case PIPE_FORMAT_B8G8R8A8_SRGB:
204 return MAPSURF_32BIT | MT_32BIT_ARGB8888;
205 case PIPE_FORMAT_B8G8R8X8_UNORM:
206 return MAPSURF_32BIT | MT_32BIT_XRGB8888;
207 case PIPE_FORMAT_R8G8B8A8_UNORM:
208 return MAPSURF_32BIT | MT_32BIT_ABGR8888;
209 case PIPE_FORMAT_R8G8B8X8_UNORM:
210 return MAPSURF_32BIT | MT_32BIT_XBGR8888;
211 case PIPE_FORMAT_YUYV:
212 return (MAPSURF_422 | MT_422_YCRCB_NORMAL);
213 case PIPE_FORMAT_UYVY:
214 return (MAPSURF_422 | MT_422_YCRCB_SWAPY);
215 case PIPE_FORMAT_FXT1_RGB:
216 case PIPE_FORMAT_FXT1_RGBA:
217 return (MAPSURF_COMPRESSED | MT_COMPRESS_FXT1);
218 case PIPE_FORMAT_Z16_UNORM:
219 return (MAPSURF_16BIT | MT_16BIT_L16);
220 case PIPE_FORMAT_DXT1_RGB:
221 case PIPE_FORMAT_DXT1_SRGB:
222 return (MAPSURF_COMPRESSED | MT_COMPRESS_DXT1_RGB);
223 case PIPE_FORMAT_DXT1_RGBA:
224 case PIPE_FORMAT_DXT1_SRGBA:
225 return (MAPSURF_COMPRESSED | MT_COMPRESS_DXT1);
226 case PIPE_FORMAT_DXT3_RGBA:
227 case PIPE_FORMAT_DXT3_SRGBA:
228 return (MAPSURF_COMPRESSED | MT_COMPRESS_DXT2_3);
229 case PIPE_FORMAT_DXT5_RGBA:
230 case PIPE_FORMAT_DXT5_SRGBA:
231 return (MAPSURF_COMPRESSED | MT_COMPRESS_DXT4_5);
232 case PIPE_FORMAT_Z24_UNORM_S8_UINT:
233 case PIPE_FORMAT_Z24X8_UNORM: {
234 if (view->swizzle_r == PIPE_SWIZZLE_X &&
235 view->swizzle_g == PIPE_SWIZZLE_X &&
236 view->swizzle_b == PIPE_SWIZZLE_X &&
237 view->swizzle_a == PIPE_SWIZZLE_1)
238 return (MAPSURF_32BIT | MT_32BIT_xL824);
239 if (view->swizzle_r == PIPE_SWIZZLE_X &&
240 view->swizzle_g == PIPE_SWIZZLE_X &&
241 view->swizzle_b == PIPE_SWIZZLE_X &&
242 view->swizzle_a == PIPE_SWIZZLE_X)
243 return (MAPSURF_32BIT | MT_32BIT_xI824);
244 if (view->swizzle_r == PIPE_SWIZZLE_0 &&
245 view->swizzle_g == PIPE_SWIZZLE_0 &&
246 view->swizzle_b == PIPE_SWIZZLE_0 &&
247 view->swizzle_a == PIPE_SWIZZLE_X)
248 return (MAPSURF_32BIT | MT_32BIT_xA824);
249 debug_printf("i915: unsupported depth swizzle %d %d %d %d\n",
250 view->swizzle_r, view->swizzle_g, view->swizzle_b,
251 view->swizzle_a);
252 return (MAPSURF_32BIT | MT_32BIT_xL824);
253 }
254 default:
255 debug_printf("i915: translate_texture_format() bad image format %x\n",
256 pipeFormat);
257 assert(0);
258 return 0;
259 }
260 }
261
262 static inline uint32_t
ms3_tiling_bits(enum i915_winsys_buffer_tile tiling)263 ms3_tiling_bits(enum i915_winsys_buffer_tile tiling)
264 {
265 uint32_t tiling_bits = 0;
266
267 switch (tiling) {
268 case I915_TILE_Y:
269 tiling_bits |= MS3_TILE_WALK_Y;
270 FALLTHROUGH;
271 case I915_TILE_X:
272 tiling_bits |= MS3_TILED_SURFACE;
273 FALLTHROUGH;
274 case I915_TILE_NONE:
275 break;
276 }
277
278 return tiling_bits;
279 }
280
281 static void
update_map(struct i915_context * i915,uint32_t unit,const struct i915_texture * tex,const struct i915_sampler_state * sampler,const struct pipe_sampler_view * view,uint32_t state[3])282 update_map(struct i915_context *i915, uint32_t unit,
283 const struct i915_texture *tex,
284 const struct i915_sampler_state *sampler,
285 const struct pipe_sampler_view *view, uint32_t state[3])
286 {
287 const struct pipe_resource *pt = &tex->b;
288 uint32_t width = pt->width0, height = pt->height0, depth = pt->depth0;
289 int first_level = view->u.tex.first_level;
290 const uint32_t num_levels = pt->last_level - first_level;
291 unsigned max_lod = num_levels * 4;
292 bool is_npot = (!util_is_power_of_two_or_zero(pt->width0) ||
293 !util_is_power_of_two_or_zero(pt->height0));
294 uint32_t format, pitch;
295
296 /*
297 * This is a bit messy. i915 doesn't support NPOT with mipmaps, but we can
298 * still texture from a single level. This is useful to make u_blitter work.
299 */
300 if (is_npot) {
301 width = u_minify(width, first_level);
302 height = u_minify(height, first_level);
303 max_lod = 1;
304 }
305
306 assert(tex);
307 assert(width);
308 assert(height);
309 assert(depth);
310
311 format = translate_texture_format(pt->format, view);
312 pitch = tex->stride;
313
314 assert(format);
315 assert(pitch);
316
317 /* MS3 state */
318 state[0] =
319 (((height - 1) << MS3_HEIGHT_SHIFT) | ((width - 1) << MS3_WIDTH_SHIFT) |
320 format | ms3_tiling_bits(tex->tiling));
321
322 /*
323 * XXX When min_filter != mag_filter and there's just one mipmap level,
324 * set max_lod = 1 to make sure i915 chooses between min/mag filtering.
325 */
326
327 /* See note at the top of file */
328 if (max_lod > (sampler->maxlod >> 2))
329 max_lod = sampler->maxlod >> 2;
330
331 /* MS4 state */
332 state[1] = ((((pitch / 4) - 1) << MS4_PITCH_SHIFT) | MS4_CUBE_FACE_ENA_MASK |
333 ((max_lod) << MS4_MAX_LOD_SHIFT) |
334 ((depth - 1) << MS4_VOLUME_DEPTH_SHIFT));
335
336 if (is_npot)
337 state[2] = i915_texture_offset(tex, first_level, 0);
338 else
339 state[2] = 0;
340 }
341
342 static void
update_samplers(struct i915_context * i915)343 update_samplers(struct i915_context *i915)
344 {
345 uint32_t unit;
346
347 i915->current.sampler_enable_nr = 0;
348 i915->current.sampler_enable_flags = 0x0;
349
350 for (unit = 0;
351 unit < i915->num_fragment_sampler_views && unit < i915->num_samplers;
352 unit++) {
353 /* determine unit enable/disable by looking for a bound texture */
354 /* could also examine the fragment program? */
355 if (i915->fragment_sampler_views[unit]) {
356 struct i915_texture *texture =
357 i915_texture(i915->fragment_sampler_views[unit]->texture);
358
359 update_sampler(i915, unit,
360 i915->fragment_sampler[unit], /* sampler state */
361 texture, /* texture */
362 i915->current.sampler[unit]); /* the result */
363 update_map(i915, unit, texture, /* texture */
364 i915->fragment_sampler[unit], /* sampler state */
365 i915->fragment_sampler_views[unit], /* sampler view */
366 i915->current.texbuffer[unit]); /* the result */
367
368 i915->current.sampler_enable_nr++;
369 i915->current.sampler_enable_flags |= (1 << unit);
370 }
371 }
372
373 i915->hardware_dirty |= I915_HW_SAMPLER | I915_HW_MAP;
374 }
375
376 struct i915_tracked_state i915_hw_samplers = {
377 "samplers", update_samplers, I915_NEW_SAMPLER | I915_NEW_SAMPLER_VIEW};
378