1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "pipe/p_defines.h"
27 #include "util/u_bitmask.h"
28 #include "util/format/u_format.h"
29 #include "util/u_helpers.h"
30 #include "util/u_inlines.h"
31 #include "util/u_math.h"
32 #include "util/u_memory.h"
33 #include "util/u_transfer.h"
34
35 #include "svga_context.h"
36 #include "svga_cmd.h"
37 #include "svga_format.h"
38 #include "svga_resource_buffer.h"
39 #include "svga_screen.h"
40
41
42 static void
svga_set_vertex_buffers(struct pipe_context * pipe,unsigned count,const struct pipe_vertex_buffer * buffers)43 svga_set_vertex_buffers(struct pipe_context *pipe,
44 unsigned count,
45 const struct pipe_vertex_buffer *buffers)
46 {
47 struct svga_context *svga = svga_context(pipe);
48
49 util_set_vertex_buffers_count(svga->curr.vb,
50 &svga->curr.num_vertex_buffers,
51 buffers, count, true);
52
53 svga->dirty |= SVGA_NEW_VBUFFER;
54 }
55
56
57 /**
58 * Does the given vertex attrib format need range adjustment in the VS?
59 * Range adjustment scales and biases values from [0,1] to [-1,1].
60 * This lets us avoid the swtnl path.
61 */
62 static bool
attrib_needs_range_adjustment(enum pipe_format format)63 attrib_needs_range_adjustment(enum pipe_format format)
64 {
65 switch (format) {
66 case PIPE_FORMAT_R8G8B8_SNORM:
67 return true;
68 default:
69 return false;
70 }
71 }
72
73
74 /**
75 * Given a gallium vertex element format, return the corresponding
76 * SVGA3dDeclType.
77 */
78 static SVGA3dDeclType
translate_vertex_format_to_decltype(enum pipe_format format)79 translate_vertex_format_to_decltype(enum pipe_format format)
80 {
81 switch (format) {
82 case PIPE_FORMAT_R32_FLOAT: return SVGA3D_DECLTYPE_FLOAT1;
83 case PIPE_FORMAT_R32G32_FLOAT: return SVGA3D_DECLTYPE_FLOAT2;
84 case PIPE_FORMAT_R32G32B32_FLOAT: return SVGA3D_DECLTYPE_FLOAT3;
85 case PIPE_FORMAT_R32G32B32A32_FLOAT: return SVGA3D_DECLTYPE_FLOAT4;
86 case PIPE_FORMAT_B8G8R8A8_UNORM: return SVGA3D_DECLTYPE_D3DCOLOR;
87 case PIPE_FORMAT_R8G8B8A8_USCALED: return SVGA3D_DECLTYPE_UBYTE4;
88 case PIPE_FORMAT_R16G16_SSCALED: return SVGA3D_DECLTYPE_SHORT2;
89 case PIPE_FORMAT_R16G16B16A16_SSCALED: return SVGA3D_DECLTYPE_SHORT4;
90 case PIPE_FORMAT_R8G8B8A8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N;
91 case PIPE_FORMAT_R16G16_SNORM: return SVGA3D_DECLTYPE_SHORT2N;
92 case PIPE_FORMAT_R16G16B16A16_SNORM: return SVGA3D_DECLTYPE_SHORT4N;
93 case PIPE_FORMAT_R16G16_UNORM: return SVGA3D_DECLTYPE_USHORT2N;
94 case PIPE_FORMAT_R16G16B16A16_UNORM: return SVGA3D_DECLTYPE_USHORT4N;
95 case PIPE_FORMAT_R10G10B10X2_USCALED: return SVGA3D_DECLTYPE_UDEC3;
96 case PIPE_FORMAT_R10G10B10X2_SNORM: return SVGA3D_DECLTYPE_DEC3N;
97 case PIPE_FORMAT_R16G16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_2;
98 case PIPE_FORMAT_R16G16B16A16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_4;
99
100 /* See attrib_needs_adjustment() and attrib_needs_w_to_1() above */
101 case PIPE_FORMAT_R8G8B8_SNORM: return SVGA3D_DECLTYPE_UBYTE4N;
102
103 /* See attrib_needs_w_to_1() above */
104 case PIPE_FORMAT_R16G16B16_SNORM: return SVGA3D_DECLTYPE_SHORT4N;
105 case PIPE_FORMAT_R16G16B16_UNORM: return SVGA3D_DECLTYPE_USHORT4N;
106 case PIPE_FORMAT_R8G8B8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N;
107
108 default:
109 /* There are many formats without hardware support. This case
110 * will be hit regularly, meaning we'll need swvfetch.
111 */
112 return SVGA3D_DECLTYPE_MAX;
113 }
114 }
115
116
117 static void
define_input_element_object(struct svga_context * svga,struct svga_velems_state * velems)118 define_input_element_object(struct svga_context *svga,
119 struct svga_velems_state *velems)
120 {
121 SVGA3dInputElementDesc elements[PIPE_MAX_ATTRIBS];
122 unsigned i;
123
124 assert(velems->count <= PIPE_MAX_ATTRIBS);
125 assert(svga_have_vgpu10(svga));
126
127 for (i = 0; i < velems->count; i++) {
128 const struct pipe_vertex_element *elem = velems->velem + i;
129 SVGA3dSurfaceFormat svga_format;
130 unsigned vf_flags;
131
132 svga_translate_vertex_format_vgpu10(elem->src_format,
133 &svga_format, &vf_flags);
134
135 velems->decl_type[i] =
136 translate_vertex_format_to_decltype(elem->src_format);
137 elements[i].inputSlot = elem->vertex_buffer_index;
138 elements[i].alignedByteOffset = elem->src_offset;
139 elements[i].format = svga_format;
140
141 if (elem->instance_divisor) {
142 elements[i].inputSlotClass = SVGA3D_INPUT_PER_INSTANCE_DATA;
143 elements[i].instanceDataStepRate = elem->instance_divisor;
144 }
145 else {
146 elements[i].inputSlotClass = SVGA3D_INPUT_PER_VERTEX_DATA;
147 elements[i].instanceDataStepRate = 0;
148 }
149 elements[i].inputRegister = i;
150
151 if (elements[i].format == SVGA3D_FORMAT_INVALID) {
152 velems->need_swvfetch = true;
153 }
154
155 if (util_format_is_pure_integer(elem->src_format)) {
156 velems->attrib_is_pure_int |= (1 << i);
157 }
158
159 if (vf_flags & VF_W_TO_1) {
160 velems->adjust_attrib_w_1 |= (1 << i);
161 }
162
163 if (vf_flags & VF_U_TO_F_CAST) {
164 velems->adjust_attrib_utof |= (1 << i);
165 }
166 else if (vf_flags & VF_I_TO_F_CAST) {
167 velems->adjust_attrib_itof |= (1 << i);
168 }
169
170 if (vf_flags & VF_BGRA) {
171 velems->attrib_is_bgra |= (1 << i);
172 }
173
174 if (vf_flags & VF_PUINT_TO_SNORM) {
175 velems->attrib_puint_to_snorm |= (1 << i);
176 }
177 else if (vf_flags & VF_PUINT_TO_USCALED) {
178 velems->attrib_puint_to_uscaled |= (1 << i);
179 }
180 else if (vf_flags & VF_PUINT_TO_SSCALED) {
181 velems->attrib_puint_to_sscaled |= (1 << i);
182 }
183 }
184
185 velems->id = util_bitmask_add(svga->input_element_object_id_bm);
186
187 SVGA_RETRY(svga, SVGA3D_vgpu10_DefineElementLayout(svga->swc, velems->count,
188 velems->id, elements));
189 }
190
191
192 /**
193 * Translate the vertex element types to SVGA3dDeclType and check
194 * for VS-based vertex attribute adjustments.
195 */
196 static void
translate_vertex_decls(struct svga_context * svga,struct svga_velems_state * velems)197 translate_vertex_decls(struct svga_context *svga,
198 struct svga_velems_state *velems)
199 {
200 unsigned i;
201
202 assert(!svga_have_vgpu10(svga));
203
204 for (i = 0; i < velems->count; i++) {
205 const enum pipe_format f = velems->velem[i].src_format;
206 SVGA3dSurfaceFormat svga_format;
207 unsigned vf_flags;
208
209 svga_translate_vertex_format_vgpu10(f, &svga_format, &vf_flags);
210
211 velems->decl_type[i] = translate_vertex_format_to_decltype(f);
212 if (velems->decl_type[i] == SVGA3D_DECLTYPE_MAX) {
213 /* Unsupported format - use software fetch */
214 velems->need_swvfetch = true;
215 }
216
217 /* Check for VS-based adjustments */
218 if (attrib_needs_range_adjustment(f)) {
219 velems->adjust_attrib_range |= (1 << i);
220 }
221
222 if (vf_flags & VF_W_TO_1) {
223 velems->adjust_attrib_w_1 |= (1 << i);
224 }
225 }
226 }
227
228
229 static void *
svga_create_vertex_elements_state(struct pipe_context * pipe,unsigned count,const struct pipe_vertex_element * attribs)230 svga_create_vertex_elements_state(struct pipe_context *pipe,
231 unsigned count,
232 const struct pipe_vertex_element *attribs)
233 {
234 struct svga_context *svga = svga_context(pipe);
235 struct svga_velems_state *velems;
236
237 assert(count <= PIPE_MAX_ATTRIBS);
238 velems = (struct svga_velems_state *) MALLOC(sizeof(struct svga_velems_state));
239 if (velems) {
240 velems->count = count;
241 memcpy(velems->velem, attribs, sizeof(*attribs) * count);
242
243 velems->need_swvfetch = false;
244 velems->adjust_attrib_range = 0x0;
245 velems->attrib_is_pure_int = 0x0;
246 velems->adjust_attrib_w_1 = 0x0;
247 velems->adjust_attrib_itof = 0x0;
248 velems->adjust_attrib_utof = 0x0;
249 velems->attrib_is_bgra = 0x0;
250 velems->attrib_puint_to_snorm = 0x0;
251 velems->attrib_puint_to_uscaled = 0x0;
252 velems->attrib_puint_to_sscaled = 0x0;
253
254 if (svga_have_vgpu10(svga)) {
255 define_input_element_object(svga, velems);
256 }
257 else {
258 translate_vertex_decls(svga, velems);
259 }
260 for (unsigned i = 0; i < count; i++)
261 velems->strides[attribs[i].vertex_buffer_index] = attribs[i].src_stride;
262 }
263
264 svga->hud.num_vertexelement_objects++;
265 SVGA_STATS_COUNT_INC(svga_screen(svga->pipe.screen)->sws,
266 SVGA_STATS_COUNT_VERTEXELEMENT);
267
268 return velems;
269 }
270
271
272 static void
svga_bind_vertex_elements_state(struct pipe_context * pipe,void * state)273 svga_bind_vertex_elements_state(struct pipe_context *pipe, void *state)
274 {
275 struct svga_context *svga = svga_context(pipe);
276 struct svga_velems_state *velems = (struct svga_velems_state *) state;
277
278 svga->curr.velems = velems;
279 svga->dirty |= SVGA_NEW_VELEMENT;
280 }
281
282
283 static void
svga_delete_vertex_elements_state(struct pipe_context * pipe,void * state)284 svga_delete_vertex_elements_state(struct pipe_context *pipe, void *state)
285 {
286 struct svga_context *svga = svga_context(pipe);
287 struct svga_velems_state *velems = (struct svga_velems_state *) state;
288
289 if (svga_have_vgpu10(svga)) {
290 svga_hwtnl_flush_retry(svga);
291
292 SVGA_RETRY(svga, SVGA3D_vgpu10_DestroyElementLayout(svga->swc,
293 velems->id));
294
295 if (velems->id == svga->state.hw_draw.layout_id)
296 svga->state.hw_draw.layout_id = SVGA3D_INVALID_ID;
297
298 util_bitmask_clear(svga->input_element_object_id_bm, velems->id);
299 velems->id = SVGA3D_INVALID_ID;
300 }
301
302 FREE(velems);
303 svga->hud.num_vertexelement_objects--;
304 }
305
306
307 void
svga_cleanup_vertex_state(struct svga_context * svga)308 svga_cleanup_vertex_state(struct svga_context *svga)
309 {
310 unsigned i;
311
312 for (i = 0 ; i < svga->curr.num_vertex_buffers; i++)
313 pipe_vertex_buffer_unreference(&svga->curr.vb[i]);
314
315 pipe_resource_reference(&svga->state.hw_draw.ib, NULL);
316
317 for (i = 0; i < svga->state.hw_draw.num_vbuffers; i++)
318 pipe_resource_reference(&svga->state.hw_draw.vbuffers[i], NULL);
319 }
320
321
322 void
svga_init_vertex_functions(struct svga_context * svga)323 svga_init_vertex_functions(struct svga_context *svga)
324 {
325 svga->pipe.set_vertex_buffers = svga_set_vertex_buffers;
326 svga->pipe.create_vertex_elements_state = svga_create_vertex_elements_state;
327 svga->pipe.bind_vertex_elements_state = svga_bind_vertex_elements_state;
328 svga->pipe.delete_vertex_elements_state = svga_delete_vertex_elements_state;
329 }
330