1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "git_sha1.h" /* For MESA_GIT_SHA1 */
27 #include "util/format/u_format.h"
28 #include "util/u_memory.h"
29 #include "util/u_inlines.h"
30 #include "util/u_screen.h"
31 #include "util/u_string.h"
32 #include "util/u_math.h"
33
34 #include "os/os_process.h"
35
36 #include "svga_winsys.h"
37 #include "svga_public.h"
38 #include "svga_context.h"
39 #include "svga_format.h"
40 #include "svga_screen.h"
41 #include "svga_tgsi.h"
42 #include "svga_resource_texture.h"
43 #include "svga_resource.h"
44 #include "svga_debug.h"
45
46 #include "svga3d_shaderdefs.h"
47 #include "VGPU10ShaderTokens.h"
48
49 /* NOTE: this constant may get moved into a svga3d*.h header file */
50 #define SVGA3D_DX_MAX_RESOURCE_SIZE (128 * 1024 * 1024)
51
52 #ifndef MESA_GIT_SHA1
53 #define MESA_GIT_SHA1 "(unknown git revision)"
54 #endif
55
56 #ifdef DEBUG
57 int SVGA_DEBUG = 0;
58
59 static const struct debug_named_value svga_debug_flags[] = {
60 { "dma", DEBUG_DMA, NULL },
61 { "tgsi", DEBUG_TGSI, NULL },
62 { "pipe", DEBUG_PIPE, NULL },
63 { "state", DEBUG_STATE, NULL },
64 { "screen", DEBUG_SCREEN, NULL },
65 { "tex", DEBUG_TEX, NULL },
66 { "swtnl", DEBUG_SWTNL, NULL },
67 { "const", DEBUG_CONSTS, NULL },
68 { "viewport", DEBUG_VIEWPORT, NULL },
69 { "views", DEBUG_VIEWS, NULL },
70 { "perf", DEBUG_PERF, NULL },
71 { "flush", DEBUG_FLUSH, NULL },
72 { "sync", DEBUG_SYNC, NULL },
73 { "cache", DEBUG_CACHE, NULL },
74 { "streamout", DEBUG_STREAMOUT, NULL },
75 { "query", DEBUG_QUERY, NULL },
76 { "samplers", DEBUG_SAMPLERS, NULL },
77 DEBUG_NAMED_VALUE_END
78 };
79 #endif
80
81 static const char *
svga_get_vendor(struct pipe_screen * pscreen)82 svga_get_vendor( struct pipe_screen *pscreen )
83 {
84 return "VMware, Inc.";
85 }
86
87
88 static const char *
svga_get_name(struct pipe_screen * pscreen)89 svga_get_name( struct pipe_screen *pscreen )
90 {
91 const char *build = "", *llvm = "", *mutex = "";
92 static char name[100];
93 #ifdef DEBUG
94 /* Only return internal details in the DEBUG version:
95 */
96 build = "build: DEBUG;";
97 mutex = "mutex: " PIPE_ATOMIC ";";
98 #else
99 build = "build: RELEASE;";
100 #endif
101 #ifdef LLVM_AVAILABLE
102 llvm = "LLVM;";
103 #endif
104
105 snprintf(name, sizeof(name), "SVGA3D; %s %s %s", build, mutex, llvm);
106 return name;
107 }
108
109
110 /** Helper for querying float-valued device cap */
111 static float
get_float_cap(struct svga_winsys_screen * sws,SVGA3dDevCapIndex cap,float defaultVal)112 get_float_cap(struct svga_winsys_screen *sws, SVGA3dDevCapIndex cap,
113 float defaultVal)
114 {
115 SVGA3dDevCapResult result;
116 if (sws->get_cap(sws, cap, &result))
117 return result.f;
118 else
119 return defaultVal;
120 }
121
122
123 /** Helper for querying uint-valued device cap */
124 static unsigned
get_uint_cap(struct svga_winsys_screen * sws,SVGA3dDevCapIndex cap,unsigned defaultVal)125 get_uint_cap(struct svga_winsys_screen *sws, SVGA3dDevCapIndex cap,
126 unsigned defaultVal)
127 {
128 SVGA3dDevCapResult result;
129 if (sws->get_cap(sws, cap, &result))
130 return result.u;
131 else
132 return defaultVal;
133 }
134
135
136 /** Helper for querying boolean-valued device cap */
137 static boolean
get_bool_cap(struct svga_winsys_screen * sws,SVGA3dDevCapIndex cap,boolean defaultVal)138 get_bool_cap(struct svga_winsys_screen *sws, SVGA3dDevCapIndex cap,
139 boolean defaultVal)
140 {
141 SVGA3dDevCapResult result;
142 if (sws->get_cap(sws, cap, &result))
143 return result.b;
144 else
145 return defaultVal;
146 }
147
148
149 static float
svga_get_paramf(struct pipe_screen * screen,enum pipe_capf param)150 svga_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
151 {
152 struct svga_screen *svgascreen = svga_screen(screen);
153 struct svga_winsys_screen *sws = svgascreen->sws;
154
155 switch (param) {
156 case PIPE_CAPF_MAX_LINE_WIDTH:
157 return svgascreen->maxLineWidth;
158 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
159 return svgascreen->maxLineWidthAA;
160
161 case PIPE_CAPF_MAX_POINT_WIDTH:
162 /* fall-through */
163 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
164 return svgascreen->maxPointSize;
165
166 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
167 return (float) get_uint_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, 4);
168
169 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
170 return 15.0;
171
172 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
173 /* fall-through */
174 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
175 /* fall-through */
176 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
177 return 0.0f;
178
179 }
180
181 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param);
182 return 0;
183 }
184
185
186 static int
svga_get_param(struct pipe_screen * screen,enum pipe_cap param)187 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
188 {
189 struct svga_screen *svgascreen = svga_screen(screen);
190 struct svga_winsys_screen *sws = svgascreen->sws;
191 SVGA3dDevCapResult result;
192
193 switch (param) {
194 case PIPE_CAP_NPOT_TEXTURES:
195 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
196 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
197 return 1;
198 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
199 /*
200 * "In virtually every OpenGL implementation and hardware,
201 * GL_MAX_DUAL_SOURCE_DRAW_BUFFERS is 1"
202 * http://www.opengl.org/wiki/Blending
203 */
204 return sws->have_vgpu10 ? 1 : 0;
205 case PIPE_CAP_ANISOTROPIC_FILTER:
206 return 1;
207 case PIPE_CAP_POINT_SPRITE:
208 return 1;
209 case PIPE_CAP_MAX_RENDER_TARGETS:
210 return svgascreen->max_color_buffers;
211 case PIPE_CAP_OCCLUSION_QUERY:
212 return 1;
213 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
214 return sws->have_vgpu10;
215 case PIPE_CAP_TEXTURE_SWIZZLE:
216 return 1;
217 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
218 return 256;
219
220 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
221 {
222 unsigned size = 1 << (SVGA_MAX_TEXTURE_LEVELS - 1);
223 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
224 size = MIN2(result.u, size);
225 else
226 size = 2048;
227 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
228 size = MIN2(result.u, size);
229 else
230 size = 2048;
231 return size;
232 }
233
234 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
235 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
236 return 8; /* max 128x128x128 */
237 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
238
239 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
240 /*
241 * No mechanism to query the host, and at least limited to 2048x2048 on
242 * certain hardware.
243 */
244 return MIN2(util_last_bit(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_SIZE)),
245 12 /* 2048x2048 */);
246
247 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
248 return sws->have_sm5 ? SVGA3D_SM5_MAX_SURFACE_ARRAYSIZE :
249 (sws->have_vgpu10 ? SVGA3D_SM4_MAX_SURFACE_ARRAYSIZE : 0);
250
251 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
252 return 1;
253
254 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
255 return 1;
256 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
257 return sws->have_vgpu10;
258 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
259 return !sws->have_vgpu10;
260
261 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
262 return 1; /* The color outputs of vertex shaders are not clamped */
263 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
264 return sws->have_vgpu10;
265
266 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
267 return 1; /* expected for GL_ARB_framebuffer_object */
268
269 case PIPE_CAP_GLSL_FEATURE_LEVEL:
270 if (sws->have_sm5) {
271 return 410;
272 } else if (sws->have_vgpu10) {
273 return 330;
274 } else {
275 return 120;
276 }
277
278 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
279 return sws->have_sm5 ? 410 : (sws->have_vgpu10 ? 330 : 120);
280
281 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
282 return 0;
283
284 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
285 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
286 case PIPE_CAP_VERTEX_SHADER_SATURATE:
287 return 1;
288
289 case PIPE_CAP_DEPTH_CLIP_DISABLE:
290 case PIPE_CAP_INDEP_BLEND_ENABLE:
291 case PIPE_CAP_CONDITIONAL_RENDER:
292 case PIPE_CAP_QUERY_TIMESTAMP:
293 case PIPE_CAP_TGSI_INSTANCEID:
294 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
295 case PIPE_CAP_SEAMLESS_CUBE_MAP:
296 case PIPE_CAP_FAKE_SW_MSAA:
297 return sws->have_vgpu10;
298
299 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
300 return sws->have_vgpu10 ? SVGA3D_DX_MAX_SOTARGETS : 0;
301 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
302 return sws->have_vgpu10 ? 4 : 0;
303 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
304 return sws->have_sm5 ? SVGA3D_MAX_STREAMOUT_DECLS :
305 (sws->have_vgpu10 ? SVGA3D_MAX_DX10_STREAMOUT_DECLS : 0);
306 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
307 return sws->have_sm5;
308 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
309 return sws->have_sm5;
310 case PIPE_CAP_TEXTURE_MULTISAMPLE:
311 return svgascreen->ms_samples ? 1 : 0;
312
313 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
314 /* convert bytes to texels for the case of the largest texel
315 * size: float[4].
316 */
317 return SVGA3D_DX_MAX_RESOURCE_SIZE / (4 * sizeof(float));
318
319 case PIPE_CAP_MIN_TEXEL_OFFSET:
320 return sws->have_vgpu10 ? VGPU10_MIN_TEXEL_FETCH_OFFSET : 0;
321 case PIPE_CAP_MAX_TEXEL_OFFSET:
322 return sws->have_vgpu10 ? VGPU10_MAX_TEXEL_FETCH_OFFSET : 0;
323
324 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
325 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
326 return 0;
327
328 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
329 return sws->have_vgpu10 ? 256 : 0;
330 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
331 return sws->have_vgpu10 ? 1024 : 0;
332
333 case PIPE_CAP_PRIMITIVE_RESTART:
334 case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
335 return 1; /* may be a sw fallback, depending on restart index */
336
337 case PIPE_CAP_GENERATE_MIPMAP:
338 return sws->have_generate_mipmap_cmd;
339
340 case PIPE_CAP_NATIVE_FENCE_FD:
341 return sws->have_fence_fd;
342
343 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
344 return 1;
345
346 case PIPE_CAP_CUBE_MAP_ARRAY:
347 case PIPE_CAP_INDEP_BLEND_FUNC:
348 case PIPE_CAP_SAMPLE_SHADING:
349 case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
350 case PIPE_CAP_TEXTURE_QUERY_LOD:
351 return sws->have_sm4_1;
352
353 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
354 /* SM4_1 supports only single-channel textures where as SM5 supports
355 * all four channel textures */
356 return sws->have_sm5 ? 4 :
357 (sws->have_sm4_1 ? 1 : 0);
358 case PIPE_CAP_DRAW_INDIRECT:
359 return sws->have_sm5;
360 case PIPE_CAP_MAX_VERTEX_STREAMS:
361 return sws->have_sm5 ? 4 : 0;
362 case PIPE_CAP_COMPUTE:
363 return 0;
364 case PIPE_CAP_MAX_VARYINGS:
365 return sws->have_vgpu10 ? VGPU10_MAX_FS_INPUTS : 10;
366 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
367 return sws->have_coherent;
368
369 case PIPE_CAP_PCI_GROUP:
370 case PIPE_CAP_PCI_BUS:
371 case PIPE_CAP_PCI_DEVICE:
372 case PIPE_CAP_PCI_FUNCTION:
373 return 0;
374 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
375 return 64;
376 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
377 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
378 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
379 return 1; /* need 4-byte alignment for all offsets and strides */
380 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
381 return 2048;
382 case PIPE_CAP_MAX_VIEWPORTS:
383 assert((!sws->have_vgpu10 && svgascreen->max_viewports == 1) ||
384 (sws->have_vgpu10 &&
385 svgascreen->max_viewports == SVGA3D_DX_MAX_VIEWPORTS));
386 return svgascreen->max_viewports;
387 case PIPE_CAP_ENDIANNESS:
388 return PIPE_ENDIAN_LITTLE;
389
390 case PIPE_CAP_VENDOR_ID:
391 return 0x15ad; /* VMware Inc. */
392 case PIPE_CAP_DEVICE_ID:
393 return 0x0405; /* assume SVGA II */
394 case PIPE_CAP_ACCELERATED:
395 return 0; /* XXX: */
396 case PIPE_CAP_VIDEO_MEMORY:
397 /* XXX: Query the host ? */
398 return 1;
399 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
400 return sws->have_vgpu10;
401 case PIPE_CAP_CLEAR_TEXTURE:
402 return sws->have_vgpu10;
403 case PIPE_CAP_DOUBLES:
404 return sws->have_sm5;
405 case PIPE_CAP_UMA:
406 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
407 case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
408 return 0;
409 case PIPE_CAP_TGSI_DIV:
410 return 1;
411 case PIPE_CAP_MAX_GS_INVOCATIONS:
412 return 32;
413 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
414 return 1 << 27;
415 /* Verify this once protocol is finalized. Setting it to minimum value. */
416 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
417 return sws->have_sm5 ? 30 : 0;
418 default:
419 return u_pipe_screen_get_param_defaults(screen, param);
420 }
421 }
422
423
424 static int
vgpu9_get_shader_param(struct pipe_screen * screen,enum pipe_shader_type shader,enum pipe_shader_cap param)425 vgpu9_get_shader_param(struct pipe_screen *screen,
426 enum pipe_shader_type shader,
427 enum pipe_shader_cap param)
428 {
429 struct svga_screen *svgascreen = svga_screen(screen);
430 struct svga_winsys_screen *sws = svgascreen->sws;
431 unsigned val;
432
433 assert(!sws->have_vgpu10);
434
435 switch (shader)
436 {
437 case PIPE_SHADER_FRAGMENT:
438 switch (param)
439 {
440 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
441 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
442 return get_uint_cap(sws,
443 SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_INSTRUCTIONS,
444 512);
445 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
446 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
447 return 512;
448 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
449 return SVGA3D_MAX_NESTING_LEVEL;
450 case PIPE_SHADER_CAP_MAX_INPUTS:
451 return 10;
452 case PIPE_SHADER_CAP_MAX_OUTPUTS:
453 return svgascreen->max_color_buffers;
454 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
455 return 224 * sizeof(float[4]);
456 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
457 return 1;
458 case PIPE_SHADER_CAP_MAX_TEMPS:
459 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, 32);
460 return MIN2(val, SVGA3D_TEMPREG_MAX);
461 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
462 /*
463 * Although PS 3.0 has some addressing abilities it can only represent
464 * loops that can be statically determined and unrolled. Given we can
465 * only handle a subset of the cases that the gallium frontend already
466 * does it is better to defer loop unrolling to the gallium frontend.
467 */
468 return 0;
469 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
470 return 0;
471 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
472 return 0;
473 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
474 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
475 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
476 return 0;
477 case PIPE_SHADER_CAP_SUBROUTINES:
478 return 0;
479 case PIPE_SHADER_CAP_INT64_ATOMICS:
480 case PIPE_SHADER_CAP_INTEGERS:
481 return 0;
482 case PIPE_SHADER_CAP_FP16:
483 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
484 case PIPE_SHADER_CAP_INT16:
485 case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
486 return 0;
487 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
488 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
489 return 16;
490 case PIPE_SHADER_CAP_PREFERRED_IR:
491 return PIPE_SHADER_IR_TGSI;
492 case PIPE_SHADER_CAP_SUPPORTED_IRS:
493 return 0;
494 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
495 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
496 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
497 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
498 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
499 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
500 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
501 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
502 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
503 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
504 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
505 return 0;
506 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
507 return 32;
508 }
509 /* If we get here, we failed to handle a cap above */
510 debug_printf("Unexpected fragment shader query %u\n", param);
511 return 0;
512 case PIPE_SHADER_VERTEX:
513 switch (param)
514 {
515 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
516 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
517 return get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS,
518 512);
519 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
520 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
521 /* XXX: until we have vertex texture support */
522 return 0;
523 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
524 return SVGA3D_MAX_NESTING_LEVEL;
525 case PIPE_SHADER_CAP_MAX_INPUTS:
526 return 16;
527 case PIPE_SHADER_CAP_MAX_OUTPUTS:
528 return 10;
529 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
530 return 256 * sizeof(float[4]);
531 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
532 return 1;
533 case PIPE_SHADER_CAP_MAX_TEMPS:
534 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, 32);
535 return MIN2(val, SVGA3D_TEMPREG_MAX);
536 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
537 return 0;
538 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
539 return 0;
540 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
541 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
542 return 1;
543 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
544 return 0;
545 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
546 return 1;
547 case PIPE_SHADER_CAP_SUBROUTINES:
548 return 0;
549 case PIPE_SHADER_CAP_INT64_ATOMICS:
550 case PIPE_SHADER_CAP_INTEGERS:
551 return 0;
552 case PIPE_SHADER_CAP_FP16:
553 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
554 case PIPE_SHADER_CAP_INT16:
555 case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
556 return 0;
557 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
558 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
559 return 0;
560 case PIPE_SHADER_CAP_PREFERRED_IR:
561 return PIPE_SHADER_IR_TGSI;
562 case PIPE_SHADER_CAP_SUPPORTED_IRS:
563 return 0;
564 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
565 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
566 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
567 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
568 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
569 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
570 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
571 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
572 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
573 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
574 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
575 return 0;
576 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
577 return 32;
578 }
579 /* If we get here, we failed to handle a cap above */
580 debug_printf("Unexpected vertex shader query %u\n", param);
581 return 0;
582 case PIPE_SHADER_GEOMETRY:
583 case PIPE_SHADER_COMPUTE:
584 case PIPE_SHADER_TESS_CTRL:
585 case PIPE_SHADER_TESS_EVAL:
586 /* no support for geometry, tess or compute shaders at this time */
587 return 0;
588 default:
589 debug_printf("Unexpected shader type (%u) query\n", shader);
590 return 0;
591 }
592 return 0;
593 }
594
595
596 static int
vgpu10_get_shader_param(struct pipe_screen * screen,enum pipe_shader_type shader,enum pipe_shader_cap param)597 vgpu10_get_shader_param(struct pipe_screen *screen,
598 enum pipe_shader_type shader,
599 enum pipe_shader_cap param)
600 {
601 struct svga_screen *svgascreen = svga_screen(screen);
602 struct svga_winsys_screen *sws = svgascreen->sws;
603
604 assert(sws->have_vgpu10);
605 (void) sws; /* silence unused var warnings in non-debug builds */
606
607 if ((!sws->have_sm5) &&
608 (shader == PIPE_SHADER_TESS_CTRL || shader == PIPE_SHADER_TESS_EVAL))
609 return 0;
610
611 if (shader == PIPE_SHADER_COMPUTE)
612 return 0;
613
614 /* NOTE: we do not query the device for any caps/limits at this time */
615
616 /* Generally the same limits for vertex, geometry and fragment shaders */
617 switch (param) {
618 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
619 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
620 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
621 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
622 return 64 * 1024;
623 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
624 return 64;
625 case PIPE_SHADER_CAP_MAX_INPUTS:
626 if (shader == PIPE_SHADER_FRAGMENT)
627 return VGPU10_MAX_FS_INPUTS;
628 else if (shader == PIPE_SHADER_GEOMETRY)
629 return VGPU10_MAX_GS_INPUTS;
630 else if (shader == PIPE_SHADER_TESS_CTRL)
631 return VGPU11_MAX_HS_INPUT_CONTROL_POINTS;
632 else if (shader == PIPE_SHADER_TESS_EVAL)
633 return VGPU11_MAX_DS_INPUT_CONTROL_POINTS;
634 else
635 return VGPU10_MAX_VS_INPUTS;
636 case PIPE_SHADER_CAP_MAX_OUTPUTS:
637 if (shader == PIPE_SHADER_FRAGMENT)
638 return VGPU10_MAX_FS_OUTPUTS;
639 else if (shader == PIPE_SHADER_GEOMETRY)
640 return VGPU10_MAX_GS_OUTPUTS;
641 else if (shader == PIPE_SHADER_TESS_CTRL)
642 return VGPU11_MAX_HS_OUTPUTS;
643 else if (shader == PIPE_SHADER_TESS_EVAL)
644 return VGPU11_MAX_DS_OUTPUTS;
645 else
646 return VGPU10_MAX_VS_OUTPUTS;
647 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
648 return VGPU10_MAX_CONSTANT_BUFFER_ELEMENT_COUNT * sizeof(float[4]);
649 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
650 return svgascreen->max_const_buffers;
651 case PIPE_SHADER_CAP_MAX_TEMPS:
652 return VGPU10_MAX_TEMPS;
653 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
654 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
655 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
656 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
657 return TRUE; /* XXX verify */
658 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
659 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
660 case PIPE_SHADER_CAP_SUBROUTINES:
661 case PIPE_SHADER_CAP_INTEGERS:
662 return TRUE;
663 case PIPE_SHADER_CAP_FP16:
664 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
665 case PIPE_SHADER_CAP_INT16:
666 case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
667 return FALSE;
668 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
669 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
670 return SVGA3D_DX_MAX_SAMPLERS;
671 case PIPE_SHADER_CAP_PREFERRED_IR:
672 return PIPE_SHADER_IR_TGSI;
673 case PIPE_SHADER_CAP_SUPPORTED_IRS:
674 return 0;
675 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
676 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
677 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
678 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
679 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
680 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
681 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
682 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
683 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
684 case PIPE_SHADER_CAP_INT64_ATOMICS:
685 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
686 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
687 return 0;
688 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
689 return 32;
690 default:
691 debug_printf("Unexpected vgpu10 shader query %u\n", param);
692 return 0;
693 }
694 return 0;
695 }
696
697
698 static int
svga_get_shader_param(struct pipe_screen * screen,enum pipe_shader_type shader,enum pipe_shader_cap param)699 svga_get_shader_param(struct pipe_screen *screen, enum pipe_shader_type shader,
700 enum pipe_shader_cap param)
701 {
702 struct svga_screen *svgascreen = svga_screen(screen);
703 struct svga_winsys_screen *sws = svgascreen->sws;
704 if (sws->have_vgpu10) {
705 return vgpu10_get_shader_param(screen, shader, param);
706 }
707 else {
708 return vgpu9_get_shader_param(screen, shader, param);
709 }
710 }
711
712
713 static void
svga_fence_reference(struct pipe_screen * screen,struct pipe_fence_handle ** ptr,struct pipe_fence_handle * fence)714 svga_fence_reference(struct pipe_screen *screen,
715 struct pipe_fence_handle **ptr,
716 struct pipe_fence_handle *fence)
717 {
718 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
719 sws->fence_reference(sws, ptr, fence);
720 }
721
722
723 static bool
svga_fence_finish(struct pipe_screen * screen,struct pipe_context * ctx,struct pipe_fence_handle * fence,uint64_t timeout)724 svga_fence_finish(struct pipe_screen *screen,
725 struct pipe_context *ctx,
726 struct pipe_fence_handle *fence,
727 uint64_t timeout)
728 {
729 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
730 bool retVal;
731
732 SVGA_STATS_TIME_PUSH(sws, SVGA_STATS_TIME_FENCEFINISH);
733
734 if (!timeout) {
735 retVal = sws->fence_signalled(sws, fence, 0) == 0;
736 }
737 else {
738 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
739 __FUNCTION__, fence);
740
741 retVal = sws->fence_finish(sws, fence, timeout, 0) == 0;
742 }
743
744 SVGA_STATS_TIME_POP(sws);
745
746 return retVal;
747 }
748
749
750 static int
svga_fence_get_fd(struct pipe_screen * screen,struct pipe_fence_handle * fence)751 svga_fence_get_fd(struct pipe_screen *screen,
752 struct pipe_fence_handle *fence)
753 {
754 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
755
756 return sws->fence_get_fd(sws, fence, TRUE);
757 }
758
759
760 static int
svga_get_driver_query_info(struct pipe_screen * screen,unsigned index,struct pipe_driver_query_info * info)761 svga_get_driver_query_info(struct pipe_screen *screen,
762 unsigned index,
763 struct pipe_driver_query_info *info)
764 {
765 #define QUERY(NAME, ENUM, UNITS) \
766 {NAME, ENUM, {0}, UNITS, PIPE_DRIVER_QUERY_RESULT_TYPE_AVERAGE, 0, 0x0}
767
768 static const struct pipe_driver_query_info queries[] = {
769 /* per-frame counters */
770 QUERY("num-draw-calls", SVGA_QUERY_NUM_DRAW_CALLS,
771 PIPE_DRIVER_QUERY_TYPE_UINT64),
772 QUERY("num-fallbacks", SVGA_QUERY_NUM_FALLBACKS,
773 PIPE_DRIVER_QUERY_TYPE_UINT64),
774 QUERY("num-flushes", SVGA_QUERY_NUM_FLUSHES,
775 PIPE_DRIVER_QUERY_TYPE_UINT64),
776 QUERY("num-validations", SVGA_QUERY_NUM_VALIDATIONS,
777 PIPE_DRIVER_QUERY_TYPE_UINT64),
778 QUERY("map-buffer-time", SVGA_QUERY_MAP_BUFFER_TIME,
779 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
780 QUERY("num-buffers-mapped", SVGA_QUERY_NUM_BUFFERS_MAPPED,
781 PIPE_DRIVER_QUERY_TYPE_UINT64),
782 QUERY("num-textures-mapped", SVGA_QUERY_NUM_TEXTURES_MAPPED,
783 PIPE_DRIVER_QUERY_TYPE_UINT64),
784 QUERY("num-bytes-uploaded", SVGA_QUERY_NUM_BYTES_UPLOADED,
785 PIPE_DRIVER_QUERY_TYPE_BYTES),
786 QUERY("num-command-buffers", SVGA_QUERY_NUM_COMMAND_BUFFERS,
787 PIPE_DRIVER_QUERY_TYPE_UINT64),
788 QUERY("command-buffer-size", SVGA_QUERY_COMMAND_BUFFER_SIZE,
789 PIPE_DRIVER_QUERY_TYPE_BYTES),
790 QUERY("flush-time", SVGA_QUERY_FLUSH_TIME,
791 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
792 QUERY("surface-write-flushes", SVGA_QUERY_SURFACE_WRITE_FLUSHES,
793 PIPE_DRIVER_QUERY_TYPE_UINT64),
794 QUERY("num-readbacks", SVGA_QUERY_NUM_READBACKS,
795 PIPE_DRIVER_QUERY_TYPE_UINT64),
796 QUERY("num-resource-updates", SVGA_QUERY_NUM_RESOURCE_UPDATES,
797 PIPE_DRIVER_QUERY_TYPE_UINT64),
798 QUERY("num-buffer-uploads", SVGA_QUERY_NUM_BUFFER_UPLOADS,
799 PIPE_DRIVER_QUERY_TYPE_UINT64),
800 QUERY("num-const-buf-updates", SVGA_QUERY_NUM_CONST_BUF_UPDATES,
801 PIPE_DRIVER_QUERY_TYPE_UINT64),
802 QUERY("num-const-updates", SVGA_QUERY_NUM_CONST_UPDATES,
803 PIPE_DRIVER_QUERY_TYPE_UINT64),
804 QUERY("num-shader-relocations", SVGA_QUERY_NUM_SHADER_RELOCATIONS,
805 PIPE_DRIVER_QUERY_TYPE_UINT64),
806 QUERY("num-surface-relocations", SVGA_QUERY_NUM_SURFACE_RELOCATIONS,
807 PIPE_DRIVER_QUERY_TYPE_UINT64),
808
809 /* running total counters */
810 QUERY("memory-used", SVGA_QUERY_MEMORY_USED,
811 PIPE_DRIVER_QUERY_TYPE_BYTES),
812 QUERY("num-shaders", SVGA_QUERY_NUM_SHADERS,
813 PIPE_DRIVER_QUERY_TYPE_UINT64),
814 QUERY("num-resources", SVGA_QUERY_NUM_RESOURCES,
815 PIPE_DRIVER_QUERY_TYPE_UINT64),
816 QUERY("num-state-objects", SVGA_QUERY_NUM_STATE_OBJECTS,
817 PIPE_DRIVER_QUERY_TYPE_UINT64),
818 QUERY("num-surface-views", SVGA_QUERY_NUM_SURFACE_VIEWS,
819 PIPE_DRIVER_QUERY_TYPE_UINT64),
820 QUERY("num-generate-mipmap", SVGA_QUERY_NUM_GENERATE_MIPMAP,
821 PIPE_DRIVER_QUERY_TYPE_UINT64),
822 QUERY("num-failed-allocations", SVGA_QUERY_NUM_FAILED_ALLOCATIONS,
823 PIPE_DRIVER_QUERY_TYPE_UINT64),
824 QUERY("num-commands-per-draw", SVGA_QUERY_NUM_COMMANDS_PER_DRAW,
825 PIPE_DRIVER_QUERY_TYPE_FLOAT),
826 QUERY("shader-mem-used", SVGA_QUERY_SHADER_MEM_USED,
827 PIPE_DRIVER_QUERY_TYPE_UINT64),
828 };
829 #undef QUERY
830
831 if (!info)
832 return ARRAY_SIZE(queries);
833
834 if (index >= ARRAY_SIZE(queries))
835 return 0;
836
837 *info = queries[index];
838 return 1;
839 }
840
841
842 static void
init_logging(struct pipe_screen * screen)843 init_logging(struct pipe_screen *screen)
844 {
845 struct svga_screen *svgascreen = svga_screen(screen);
846 static const char *log_prefix = "Mesa: ";
847 char host_log[1000];
848
849 /* Log Version to Host */
850 snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
851 "%s%s\n", log_prefix, svga_get_name(screen));
852 svgascreen->sws->host_log(svgascreen->sws, host_log);
853
854 snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
855 "%s" PACKAGE_VERSION MESA_GIT_SHA1, log_prefix);
856 svgascreen->sws->host_log(svgascreen->sws, host_log);
857
858 /* If the SVGA_EXTRA_LOGGING env var is set, log the process's command
859 * line (program name and arguments).
860 */
861 if (debug_get_bool_option("SVGA_EXTRA_LOGGING", FALSE)) {
862 char cmdline[1000];
863 if (os_get_command_line(cmdline, sizeof(cmdline))) {
864 snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
865 "%s%s\n", log_prefix, cmdline);
866 svgascreen->sws->host_log(svgascreen->sws, host_log);
867 }
868 }
869 }
870
871
872 /**
873 * no-op logging function to use when SVGA_NO_LOGGING is set.
874 */
875 static void
nop_host_log(struct svga_winsys_screen * sws,const char * message)876 nop_host_log(struct svga_winsys_screen *sws, const char *message)
877 {
878 /* nothing */
879 }
880
881
882 static void
svga_destroy_screen(struct pipe_screen * screen)883 svga_destroy_screen( struct pipe_screen *screen )
884 {
885 struct svga_screen *svgascreen = svga_screen(screen);
886
887 svga_screen_cache_cleanup(svgascreen);
888
889 mtx_destroy(&svgascreen->swc_mutex);
890 mtx_destroy(&svgascreen->tex_mutex);
891
892 svgascreen->sws->destroy(svgascreen->sws);
893
894 FREE(svgascreen);
895 }
896
897
898 /**
899 * Create a new svga_screen object
900 */
901 struct pipe_screen *
svga_screen_create(struct svga_winsys_screen * sws)902 svga_screen_create(struct svga_winsys_screen *sws)
903 {
904 struct svga_screen *svgascreen;
905 struct pipe_screen *screen;
906
907 #ifdef DEBUG
908 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
909 #endif
910
911 svgascreen = CALLOC_STRUCT(svga_screen);
912 if (!svgascreen)
913 goto error1;
914
915 svgascreen->debug.force_level_surface_view =
916 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
917 svgascreen->debug.force_surface_view =
918 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
919 svgascreen->debug.force_sampler_view =
920 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
921 svgascreen->debug.no_surface_view =
922 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
923 svgascreen->debug.no_sampler_view =
924 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
925 svgascreen->debug.no_cache_index_buffers =
926 debug_get_bool_option("SVGA_NO_CACHE_INDEX_BUFFERS", FALSE);
927
928 screen = &svgascreen->screen;
929
930 screen->destroy = svga_destroy_screen;
931 screen->get_name = svga_get_name;
932 screen->get_vendor = svga_get_vendor;
933 screen->get_device_vendor = svga_get_vendor; // TODO actual device vendor
934 screen->get_param = svga_get_param;
935 screen->get_shader_param = svga_get_shader_param;
936 screen->get_paramf = svga_get_paramf;
937 screen->get_timestamp = NULL;
938 screen->is_format_supported = svga_is_format_supported;
939 screen->context_create = svga_context_create;
940 screen->fence_reference = svga_fence_reference;
941 screen->fence_finish = svga_fence_finish;
942 screen->fence_get_fd = svga_fence_get_fd;
943
944 screen->get_driver_query_info = svga_get_driver_query_info;
945 svgascreen->sws = sws;
946
947 svga_init_screen_resource_functions(svgascreen);
948
949 if (sws->get_hw_version) {
950 svgascreen->hw_version = sws->get_hw_version(sws);
951 } else {
952 svgascreen->hw_version = SVGA3D_HWVERSION_WS65_B1;
953 }
954
955 if (svgascreen->hw_version < SVGA3D_HWVERSION_WS8_B1) {
956 /* too old for 3D acceleration */
957 debug_printf("Hardware version 0x%x is too old for accerated 3D\n",
958 svgascreen->hw_version);
959 goto error2;
960 }
961
962 debug_printf("%s enabled\n",
963 sws->have_sm5 ? "SM5" :
964 sws->have_sm4_1 ? "SM4_1" :
965 sws->have_vgpu10 ? "VGPU10" : "VGPU9");
966
967 debug_printf("Mesa: %s %s (%s)\n", svga_get_name(screen),
968 PACKAGE_VERSION, MESA_GIT_SHA1);
969
970 /*
971 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
972 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
973 * we prefer the later when available.
974 *
975 * This mimics hardware vendors extensions for D3D depth sampling. See also
976 * http://aras-p.info/texts/D3D9GPUHacks.html
977 */
978
979 {
980 boolean has_df16, has_df24, has_d24s8_int;
981 SVGA3dSurfaceFormatCaps caps;
982 SVGA3dSurfaceFormatCaps mask;
983 mask.value = 0;
984 mask.zStencil = 1;
985 mask.texture = 1;
986
987 svgascreen->depth.z16 = SVGA3D_Z_D16;
988 svgascreen->depth.x8z24 = SVGA3D_Z_D24X8;
989 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8;
990
991 svga_get_format_cap(svgascreen, SVGA3D_Z_DF16, &caps);
992 has_df16 = (caps.value & mask.value) == mask.value;
993
994 svga_get_format_cap(svgascreen, SVGA3D_Z_DF24, &caps);
995 has_df24 = (caps.value & mask.value) == mask.value;
996
997 svga_get_format_cap(svgascreen, SVGA3D_Z_D24S8_INT, &caps);
998 has_d24s8_int = (caps.value & mask.value) == mask.value;
999
1000 /* XXX: We might want some other logic here.
1001 * Like if we only have d24s8_int we should
1002 * emulate the other formats with that.
1003 */
1004 if (has_df16) {
1005 svgascreen->depth.z16 = SVGA3D_Z_DF16;
1006 }
1007 if (has_df24) {
1008 svgascreen->depth.x8z24 = SVGA3D_Z_DF24;
1009 }
1010 if (has_d24s8_int) {
1011 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8_INT;
1012 }
1013 }
1014
1015 /* Query device caps
1016 */
1017 if (sws->have_vgpu10) {
1018 svgascreen->haveProvokingVertex
1019 = get_bool_cap(sws, SVGA3D_DEVCAP_DX_PROVOKING_VERTEX, FALSE);
1020 svgascreen->haveLineSmooth = TRUE;
1021 svgascreen->maxPointSize = 80.0F;
1022 svgascreen->max_color_buffers = SVGA3D_DX_MAX_RENDER_TARGETS;
1023
1024 /* Multisample samples per pixel */
1025 if (sws->have_sm4_1 && debug_get_bool_option("SVGA_MSAA", TRUE)) {
1026 if (get_bool_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_2X, FALSE))
1027 svgascreen->ms_samples |= 1 << 1;
1028 if (get_bool_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_4X, FALSE))
1029 svgascreen->ms_samples |= 1 << 3;
1030 }
1031
1032 if (sws->have_sm5 && debug_get_bool_option("SVGA_MSAA", TRUE)) {
1033 if (get_bool_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_8X, FALSE))
1034 svgascreen->ms_samples |= 1 << 7;
1035 }
1036
1037 /* Maximum number of constant buffers */
1038 svgascreen->max_const_buffers =
1039 get_uint_cap(sws, SVGA3D_DEVCAP_DX_MAX_CONSTANT_BUFFERS, 1);
1040 svgascreen->max_const_buffers = MIN2(svgascreen->max_const_buffers,
1041 SVGA_MAX_CONST_BUFS);
1042
1043 svgascreen->haveBlendLogicops =
1044 get_bool_cap(sws, SVGA3D_DEVCAP_LOGIC_BLENDOPS, FALSE);
1045
1046 screen->is_format_supported = svga_is_dx_format_supported;
1047
1048 svgascreen->max_viewports = SVGA3D_DX_MAX_VIEWPORTS;
1049 }
1050 else {
1051 /* VGPU9 */
1052 unsigned vs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION,
1053 SVGA3DVSVERSION_NONE);
1054 unsigned fs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION,
1055 SVGA3DPSVERSION_NONE);
1056
1057 /* we require Shader model 3.0 or later */
1058 if (fs_ver < SVGA3DPSVERSION_30 || vs_ver < SVGA3DVSVERSION_30) {
1059 goto error2;
1060 }
1061
1062 svgascreen->haveProvokingVertex = FALSE;
1063
1064 svgascreen->haveLineSmooth =
1065 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_AA, FALSE);
1066
1067 svgascreen->maxPointSize =
1068 get_float_cap(sws, SVGA3D_DEVCAP_MAX_POINT_SIZE, 1.0f);
1069 /* Keep this to a reasonable size to avoid failures in conform/pntaa.c */
1070 svgascreen->maxPointSize = MIN2(svgascreen->maxPointSize, 80.0f);
1071
1072 /* The SVGA3D device always supports 4 targets at this time, regardless
1073 * of what querying SVGA3D_DEVCAP_MAX_RENDER_TARGETS might return.
1074 */
1075 svgascreen->max_color_buffers = 4;
1076
1077 /* Only support one constant buffer
1078 */
1079 svgascreen->max_const_buffers = 1;
1080
1081 /* No multisampling */
1082 svgascreen->ms_samples = 0;
1083
1084 /* Only one viewport */
1085 svgascreen->max_viewports = 1;
1086 }
1087
1088 /* common VGPU9 / VGPU10 caps */
1089 svgascreen->haveLineStipple =
1090 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_STIPPLE, FALSE);
1091
1092 svgascreen->maxLineWidth =
1093 MAX2(1.0, get_float_cap(sws, SVGA3D_DEVCAP_MAX_LINE_WIDTH, 1.0f));
1094
1095 svgascreen->maxLineWidthAA =
1096 MAX2(1.0, get_float_cap(sws, SVGA3D_DEVCAP_MAX_AA_LINE_WIDTH, 1.0f));
1097
1098 if (0) {
1099 debug_printf("svga: haveProvokingVertex %u\n",
1100 svgascreen->haveProvokingVertex);
1101 debug_printf("svga: haveLineStip %u "
1102 "haveLineSmooth %u maxLineWidth %.2f maxLineWidthAA %.2f\n",
1103 svgascreen->haveLineStipple, svgascreen->haveLineSmooth,
1104 svgascreen->maxLineWidth, svgascreen->maxLineWidthAA);
1105 debug_printf("svga: maxPointSize %g\n", svgascreen->maxPointSize);
1106 debug_printf("svga: msaa samples mask: 0x%x\n", svgascreen->ms_samples);
1107 }
1108
1109 (void) mtx_init(&svgascreen->tex_mutex, mtx_plain);
1110 (void) mtx_init(&svgascreen->swc_mutex, mtx_recursive);
1111
1112 svga_screen_cache_init(svgascreen);
1113
1114 if (debug_get_bool_option("SVGA_NO_LOGGING", FALSE) == TRUE) {
1115 svgascreen->sws->host_log = nop_host_log;
1116 } else {
1117 init_logging(screen);
1118 }
1119
1120 return screen;
1121 error2:
1122 FREE(svgascreen);
1123 error1:
1124 return NULL;
1125 }
1126
1127
1128 struct svga_winsys_screen *
svga_winsys_screen(struct pipe_screen * screen)1129 svga_winsys_screen(struct pipe_screen *screen)
1130 {
1131 return svga_screen(screen)->sws;
1132 }
1133
1134
1135 #ifdef DEBUG
1136 struct svga_screen *
svga_screen(struct pipe_screen * screen)1137 svga_screen(struct pipe_screen *screen)
1138 {
1139 assert(screen);
1140 assert(screen->destroy == svga_destroy_screen);
1141 return (struct svga_screen *)screen;
1142 }
1143 #endif
1144