• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright © 2014-2017 Broadcom
3  * Copyright (C) 2012 Rob Clark <robclark@freedesktop.org>
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the "Software"),
7  * to deal in the Software without restriction, including without limitation
8  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9  * and/or sell copies of the Software, and to permit persons to whom the
10  * Software is furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice (including the next
13  * paragraph) shall be included in all copies or substantial portions of the
14  * Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22  * IN THE SOFTWARE.
23  */
24 
25 #include <sys/sysinfo.h>
26 
27 #include "common/v3d_device_info.h"
28 #include "common/v3d_limits.h"
29 #include "util/os_misc.h"
30 #include "pipe/p_defines.h"
31 #include "pipe/p_screen.h"
32 #include "pipe/p_state.h"
33 
34 #include "util/u_debug.h"
35 #include "util/u_memory.h"
36 #include "util/format/u_format.h"
37 #include "util/u_hash_table.h"
38 #include "util/u_screen.h"
39 #include "util/u_transfer_helper.h"
40 #include "util/ralloc.h"
41 #include "util/xmlconfig.h"
42 
43 #include <xf86drm.h>
44 #include "v3d_screen.h"
45 #include "v3d_context.h"
46 #include "v3d_resource.h"
47 #include "compiler/v3d_compiler.h"
48 #include "drm-uapi/drm_fourcc.h"
49 
50 static const char *
v3d_screen_get_name(struct pipe_screen * pscreen)51 v3d_screen_get_name(struct pipe_screen *pscreen)
52 {
53         struct v3d_screen *screen = v3d_screen(pscreen);
54 
55         if (!screen->name) {
56                 screen->name = ralloc_asprintf(screen,
57                                                "V3D %d.%d",
58                                                screen->devinfo.ver / 10,
59                                                screen->devinfo.ver % 10);
60         }
61 
62         return screen->name;
63 }
64 
65 static const char *
v3d_screen_get_vendor(struct pipe_screen * pscreen)66 v3d_screen_get_vendor(struct pipe_screen *pscreen)
67 {
68         return "Broadcom";
69 }
70 
71 static void
v3d_screen_destroy(struct pipe_screen * pscreen)72 v3d_screen_destroy(struct pipe_screen *pscreen)
73 {
74         struct v3d_screen *screen = v3d_screen(pscreen);
75 
76         _mesa_hash_table_destroy(screen->bo_handles, NULL);
77         v3d_bufmgr_destroy(pscreen);
78         slab_destroy_parent(&screen->transfer_pool);
79         if (screen->ro)
80                 screen->ro->destroy(screen->ro);
81 
82         if (using_v3d_simulator)
83                 v3d_simulator_destroy(screen->sim_file);
84 
85         v3d_compiler_free(screen->compiler);
86 
87 #ifdef ENABLE_SHADER_CACHE
88         if (screen->disk_cache)
89                 disk_cache_destroy(screen->disk_cache);
90 #endif
91 
92         u_transfer_helper_destroy(pscreen->transfer_helper);
93 
94         close(screen->fd);
95         ralloc_free(pscreen);
96 }
97 
98 static bool
v3d_has_feature(struct v3d_screen * screen,enum drm_v3d_param feature)99 v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature)
100 {
101         struct drm_v3d_get_param p = {
102                 .param = feature,
103         };
104         int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p);
105 
106         if (ret != 0)
107                 return false;
108 
109         return p.value;
110 }
111 
112 static int
v3d_screen_get_param(struct pipe_screen * pscreen,enum pipe_cap param)113 v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
114 {
115         struct v3d_screen *screen = v3d_screen(pscreen);
116 
117         switch (param) {
118                 /* Supported features (boolean caps). */
119         case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
120         case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
121         case PIPE_CAP_NPOT_TEXTURES:
122         case PIPE_CAP_BLEND_EQUATION_SEPARATE:
123         case PIPE_CAP_TEXTURE_MULTISAMPLE:
124         case PIPE_CAP_TEXTURE_SWIZZLE:
125         case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
126         case PIPE_CAP_START_INSTANCE:
127         case PIPE_CAP_VS_INSTANCEID:
128         case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
129         case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
130         case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
131         case PIPE_CAP_EMULATE_NONFIXED_PRIMITIVE_RESTART:
132         case PIPE_CAP_PRIMITIVE_RESTART:
133         case PIPE_CAP_OCCLUSION_QUERY:
134         case PIPE_CAP_POINT_SPRITE:
135         case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
136         case PIPE_CAP_DRAW_INDIRECT:
137         case PIPE_CAP_MULTI_DRAW_INDIRECT:
138         case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
139         case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
140         case PIPE_CAP_SHADER_CAN_READ_OUTPUTS:
141         case PIPE_CAP_SHADER_PACK_HALF_FLOAT:
142         case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
143         case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
144         case PIPE_CAP_FS_FACE_IS_INTEGER_SYSVAL:
145         case PIPE_CAP_TGSI_TEXCOORD:
146         case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
147         case PIPE_CAP_SAMPLER_VIEW_TARGET:
148         case PIPE_CAP_ANISOTROPIC_FILTER:
149         case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
150         case PIPE_CAP_INDEP_BLEND_FUNC:
151                 return 1;
152 
153         case PIPE_CAP_POLYGON_OFFSET_CLAMP:
154                 return screen->devinfo.ver >= 41;
155 
156         case PIPE_CAP_TEXTURE_QUERY_LOD:
157                 return screen->devinfo.ver >= 42;
158                 break;
159 
160         case PIPE_CAP_PACKED_UNIFORMS:
161                 /* We can't enable this flag, because it results in load_ubo
162                  * intrinsics across a 16b boundary, but v3d's TMU general
163                  * memory accesses wrap on 16b boundaries.
164                  */
165                 return 0;
166 
167         case PIPE_CAP_NIR_IMAGES_AS_DEREF:
168                 return 0;
169 
170         case PIPE_CAP_TEXTURE_TRANSFER_MODES:
171                 /* XXX perf: we don't want to emit these extra blits for
172                  * glReadPixels(), since we still have to do an uncached read
173                  * from the GPU of the result after waiting for the TFU blit
174                  * to happen.  However, disabling this introduces instability
175                  * in
176                  * dEQP-GLES31.functional.image_load_store.early_fragment_tests.*
177                  * and corruption in chromium's rendering.
178                  */
179                 return PIPE_TEXTURE_TRANSFER_BLIT;
180 
181         case PIPE_CAP_COMPUTE:
182                 return screen->has_csd && screen->devinfo.ver >= 41;
183 
184         case PIPE_CAP_GENERATE_MIPMAP:
185                 return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU);
186 
187         case PIPE_CAP_INDEP_BLEND_ENABLE:
188                 return screen->devinfo.ver >= 40;
189 
190         case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
191                 return V3D_NON_COHERENT_ATOM_SIZE;
192 
193         case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
194                 if (screen->devinfo.ver < 40)
195                         return 0;
196                 return 4;
197 
198         case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
199                 if (screen->has_cache_flush)
200                         return 4;
201                 else
202                         return 0; /* Disables shader storage */
203 
204         case PIPE_CAP_GLSL_FEATURE_LEVEL:
205                 return 330;
206 
207         case PIPE_CAP_ESSL_FEATURE_LEVEL:
208                 return 310;
209 
210 	case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
211 		return 140;
212 
213         case PIPE_CAP_FS_COORD_ORIGIN_UPPER_LEFT:
214                 return 1;
215         case PIPE_CAP_FS_COORD_ORIGIN_LOWER_LEFT:
216                 return 0;
217         case PIPE_CAP_FS_COORD_PIXEL_CENTER_INTEGER:
218                 if (screen->devinfo.ver >= 40)
219                         return 0;
220                 else
221                         return 1;
222         case PIPE_CAP_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
223                 if (screen->devinfo.ver >= 40)
224                         return 1;
225                 else
226                         return 0;
227 
228         case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
229         case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
230         case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
231                 return 1;
232 
233         case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
234                 return 4;
235 
236         case PIPE_CAP_MAX_VARYINGS:
237                 return V3D_MAX_FS_INPUTS / 4;
238 
239                 /* Texturing. */
240         case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
241                 if (screen->devinfo.ver < 40)
242                         return 2048;
243                 else if (screen->nonmsaa_texture_size_limit)
244                         return 7680;
245                 else
246                         return V3D_MAX_IMAGE_DIMENSION;
247         case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
248         case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
249                 if (screen->devinfo.ver < 40)
250                         return 12;
251                 else
252                         return V3D_MAX_MIP_LEVELS;
253         case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
254                 return V3D_MAX_ARRAY_LAYERS;
255 
256                 /* Render targets. */
257         case PIPE_CAP_MAX_RENDER_TARGETS:
258                 return 4;
259 
260         case PIPE_CAP_VENDOR_ID:
261                 return 0x14E4;
262         case PIPE_CAP_ACCELERATED:
263                 return 1;
264         case PIPE_CAP_VIDEO_MEMORY: {
265                 uint64_t system_memory;
266 
267                 if (!os_get_total_physical_memory(&system_memory))
268                         return 0;
269 
270                 return (int)(system_memory >> 20);
271         }
272         case PIPE_CAP_UMA:
273                 return 1;
274 
275         case PIPE_CAP_ALPHA_TEST:
276         case PIPE_CAP_FLATSHADE:
277         case PIPE_CAP_TWO_SIDED_COLOR:
278         case PIPE_CAP_VERTEX_COLOR_CLAMPED:
279         case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
280         case PIPE_CAP_GL_CLAMP:
281                 return 0;
282 
283         /* Geometry shaders */
284         case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
285                 /* Minimum required by GLES 3.2 */
286                 return 1024;
287         case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
288                 /* MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS / 4 */
289                 return 256;
290         case PIPE_CAP_MAX_GS_INVOCATIONS:
291                 return 32;
292 
293         case PIPE_CAP_SUPPORTED_PRIM_MODES:
294         case PIPE_CAP_SUPPORTED_PRIM_MODES_WITH_RESTART:
295                 return screen->prim_types;
296 
297         case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
298                 return true;
299 
300         case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
301                 return 256;
302 
303         case PIPE_CAP_IMAGE_STORE_FORMATTED:
304                 return false;
305 
306         default:
307                 return u_pipe_screen_get_param_defaults(pscreen, param);
308         }
309 }
310 
311 static float
v3d_screen_get_paramf(struct pipe_screen * pscreen,enum pipe_capf param)312 v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
313 {
314         switch (param) {
315         case PIPE_CAPF_MIN_LINE_WIDTH:
316         case PIPE_CAPF_MIN_LINE_WIDTH_AA:
317         case PIPE_CAPF_MIN_POINT_SIZE:
318         case PIPE_CAPF_MIN_POINT_SIZE_AA:
319            return 1;
320 
321         case PIPE_CAPF_POINT_SIZE_GRANULARITY:
322         case PIPE_CAPF_LINE_WIDTH_GRANULARITY:
323            return 0.1;
324 
325         case PIPE_CAPF_MAX_LINE_WIDTH:
326         case PIPE_CAPF_MAX_LINE_WIDTH_AA:
327                 return V3D_MAX_LINE_WIDTH;
328 
329         case PIPE_CAPF_MAX_POINT_SIZE:
330         case PIPE_CAPF_MAX_POINT_SIZE_AA:
331                 return V3D_MAX_POINT_SIZE;
332 
333         case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
334                 return 16.0f;
335         case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
336                 return 16.0f;
337 
338         case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
339         case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
340         case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
341                 return 0.0f;
342         default:
343                 fprintf(stderr, "unknown paramf %d\n", param);
344                 return 0;
345         }
346 }
347 
348 static int
v3d_screen_get_shader_param(struct pipe_screen * pscreen,unsigned shader,enum pipe_shader_cap param)349 v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
350                            enum pipe_shader_cap param)
351 {
352         struct v3d_screen *screen = v3d_screen(pscreen);
353 
354         switch (shader) {
355         case PIPE_SHADER_VERTEX:
356         case PIPE_SHADER_FRAGMENT:
357                 break;
358         case PIPE_SHADER_COMPUTE:
359                 if (!screen->has_csd)
360                         return 0;
361                 break;
362         case PIPE_SHADER_GEOMETRY:
363                 if (screen->devinfo.ver < 41)
364                         return 0;
365                 break;
366         default:
367                 return 0;
368         }
369 
370         /* this is probably not totally correct.. but it's a start: */
371         switch (param) {
372         case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
373         case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
374         case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
375         case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
376                 return 16384;
377 
378         case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
379                 return UINT_MAX;
380 
381         case PIPE_SHADER_CAP_MAX_INPUTS:
382                 switch (shader) {
383                 case PIPE_SHADER_VERTEX:
384                         return V3D_MAX_VS_INPUTS / 4;
385                 case PIPE_SHADER_GEOMETRY:
386                         return V3D_MAX_GS_INPUTS / 4;
387                 case PIPE_SHADER_FRAGMENT:
388                         return V3D_MAX_FS_INPUTS / 4;
389                 default:
390                         return 0;
391                 };
392         case PIPE_SHADER_CAP_MAX_OUTPUTS:
393                 if (shader == PIPE_SHADER_FRAGMENT)
394                         return 4;
395                 else
396                         return V3D_MAX_FS_INPUTS / 4;
397         case PIPE_SHADER_CAP_MAX_TEMPS:
398                 return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
399         case PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE:
400                 /* Note: Limited by the offset size in
401                  * v3d_unit_data_create().
402                  */
403                 return 16 * 1024 * sizeof(float);
404         case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
405                 return 16;
406         case PIPE_SHADER_CAP_CONT_SUPPORTED:
407                 return 0;
408         case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
409                 /* We don't currently support this in the backend, but that is
410                  * okay because our NIR compiler sets the option
411                  * lower_all_io_to_temps, which will eliminate indirect
412                  * indexing on all input/output variables by translating it to
413                  * indirect indexing on temporary variables instead, which we
414                  * will then lower to scratch. We prefer this over setting this
415                  * to 0, which would cause if-ladder injection to eliminate
416                  * indirect indexing on inputs.
417                  */
418                 return 1;
419         case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
420                 return 1;
421         case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
422                 return 1;
423         case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
424                 return 1;
425         case PIPE_SHADER_CAP_SUBROUTINES:
426                 return 0;
427         case PIPE_SHADER_CAP_INTEGERS:
428                 return 1;
429         case PIPE_SHADER_CAP_FP16:
430         case PIPE_SHADER_CAP_FP16_DERIVATIVES:
431         case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
432         case PIPE_SHADER_CAP_INT16:
433         case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
434         case PIPE_SHADER_CAP_DROUND_SUPPORTED:
435         case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
436         case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
437         case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
438         case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
439         case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
440         case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
441                 return 0;
442         case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
443         case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
444                 return V3D_MAX_TEXTURE_SAMPLERS;
445 
446         case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
447                 if (screen->has_cache_flush) {
448                         if (shader == PIPE_SHADER_VERTEX ||
449                             shader == PIPE_SHADER_GEOMETRY) {
450                                 return 0;
451                         }
452                         return PIPE_MAX_SHADER_BUFFERS;
453                  } else {
454                         return 0;
455                  }
456 
457         case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
458                 if (screen->has_cache_flush) {
459                         if (screen->devinfo.ver < 41)
460                                 return 0;
461                         else
462                                 return PIPE_MAX_SHADER_IMAGES;
463                 } else {
464                         return 0;
465                 }
466 
467         case PIPE_SHADER_CAP_PREFERRED_IR:
468                 return PIPE_SHADER_IR_NIR;
469         case PIPE_SHADER_CAP_SUPPORTED_IRS:
470                 return 1 << PIPE_SHADER_IR_NIR;
471         default:
472                 fprintf(stderr, "unknown shader param %d\n", param);
473                 return 0;
474         }
475         return 0;
476 }
477 
478 static int
v3d_get_compute_param(struct pipe_screen * pscreen,enum pipe_shader_ir ir_type,enum pipe_compute_cap param,void * ret)479 v3d_get_compute_param(struct pipe_screen *pscreen, enum pipe_shader_ir ir_type,
480                       enum pipe_compute_cap param, void *ret)
481 {
482         struct v3d_screen *screen = v3d_screen(pscreen);
483 
484         if (!screen->has_csd)
485                 return 0;
486 
487 #define RET(x) do {                                     \
488                 if (ret)                                \
489                         memcpy(ret, x, sizeof(x));      \
490                 return sizeof(x);                       \
491         } while (0)
492 
493         switch (param) {
494         case PIPE_COMPUTE_CAP_ADDRESS_BITS:
495                 RET((uint32_t []) { 32 });
496                 break;
497 
498         case PIPE_COMPUTE_CAP_IR_TARGET:
499                 sprintf(ret, "v3d");
500                 return strlen(ret);
501 
502         case PIPE_COMPUTE_CAP_GRID_DIMENSION:
503                 RET((uint64_t []) { 3 });
504 
505         case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
506                 /* GL_MAX_COMPUTE_SHADER_WORK_GROUP_COUNT: The CSD has a
507                  * 16-bit field for the number of workgroups in each
508                  * dimension.
509                  */
510                 RET(((uint64_t []) { 65535, 65535, 65535 }));
511 
512         case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
513                 /* GL_MAX_COMPUTE_WORK_GROUP_SIZE */
514                 RET(((uint64_t []) { 256, 256, 256 }));
515 
516         case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
517         case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
518                 /* GL_MAX_COMPUTE_WORK_GROUP_INVOCATIONS: This is
519                  * limited by WG_SIZE in the CSD.
520                  */
521                 RET((uint64_t []) { 256 });
522 
523         case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
524                 RET((uint64_t []) { 1024 * 1024 * 1024 });
525 
526         case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
527                 /* GL_MAX_COMPUTE_SHARED_MEMORY_SIZE */
528                 RET((uint64_t []) { 32768 });
529 
530         case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
531         case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
532                 RET((uint64_t []) { 4096 });
533 
534         case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE: {
535                 struct sysinfo si;
536                 sysinfo(&si);
537                 RET((uint64_t []) { si.totalram });
538         }
539 
540         case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
541                 /* OpenCL only */
542                 RET((uint32_t []) { 0 });
543 
544         case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
545                 RET((uint32_t []) { 1 });
546 
547         case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
548                 RET((uint32_t []) { 1 });
549 
550         case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
551                 RET((uint32_t []) { 16 });
552 
553         }
554 
555         return 0;
556 }
557 
558 static bool
v3d_screen_is_format_supported(struct pipe_screen * pscreen,enum pipe_format format,enum pipe_texture_target target,unsigned sample_count,unsigned storage_sample_count,unsigned usage)559 v3d_screen_is_format_supported(struct pipe_screen *pscreen,
560                                enum pipe_format format,
561                                enum pipe_texture_target target,
562                                unsigned sample_count,
563                                unsigned storage_sample_count,
564                                unsigned usage)
565 {
566         struct v3d_screen *screen = v3d_screen(pscreen);
567 
568         if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
569                 return false;
570 
571         if (sample_count > 1 && sample_count != V3D_MAX_SAMPLES)
572                 return false;
573 
574         if (target >= PIPE_MAX_TEXTURE_TYPES) {
575                 return false;
576         }
577 
578         if (usage & PIPE_BIND_VERTEX_BUFFER) {
579                 switch (format) {
580                 case PIPE_FORMAT_R32G32B32A32_FLOAT:
581                 case PIPE_FORMAT_R32G32B32_FLOAT:
582                 case PIPE_FORMAT_R32G32_FLOAT:
583                 case PIPE_FORMAT_R32_FLOAT:
584                 case PIPE_FORMAT_R32G32B32A32_SNORM:
585                 case PIPE_FORMAT_R32G32B32_SNORM:
586                 case PIPE_FORMAT_R32G32_SNORM:
587                 case PIPE_FORMAT_R32_SNORM:
588                 case PIPE_FORMAT_R32G32B32A32_SSCALED:
589                 case PIPE_FORMAT_R32G32B32_SSCALED:
590                 case PIPE_FORMAT_R32G32_SSCALED:
591                 case PIPE_FORMAT_R32_SSCALED:
592                 case PIPE_FORMAT_R16G16B16A16_UNORM:
593                 case PIPE_FORMAT_R16G16B16_UNORM:
594                 case PIPE_FORMAT_R16G16_UNORM:
595                 case PIPE_FORMAT_R16_UNORM:
596                 case PIPE_FORMAT_R16G16B16A16_SNORM:
597                 case PIPE_FORMAT_R16G16B16_SNORM:
598                 case PIPE_FORMAT_R16G16_SNORM:
599                 case PIPE_FORMAT_R16_SNORM:
600                 case PIPE_FORMAT_R16G16B16A16_USCALED:
601                 case PIPE_FORMAT_R16G16B16_USCALED:
602                 case PIPE_FORMAT_R16G16_USCALED:
603                 case PIPE_FORMAT_R16_USCALED:
604                 case PIPE_FORMAT_R16G16B16A16_SSCALED:
605                 case PIPE_FORMAT_R16G16B16_SSCALED:
606                 case PIPE_FORMAT_R16G16_SSCALED:
607                 case PIPE_FORMAT_R16_SSCALED:
608                 case PIPE_FORMAT_B8G8R8A8_UNORM:
609                 case PIPE_FORMAT_R8G8B8A8_UNORM:
610                 case PIPE_FORMAT_R8G8B8_UNORM:
611                 case PIPE_FORMAT_R8G8_UNORM:
612                 case PIPE_FORMAT_R8_UNORM:
613                 case PIPE_FORMAT_R8G8B8A8_SNORM:
614                 case PIPE_FORMAT_R8G8B8_SNORM:
615                 case PIPE_FORMAT_R8G8_SNORM:
616                 case PIPE_FORMAT_R8_SNORM:
617                 case PIPE_FORMAT_R8G8B8A8_USCALED:
618                 case PIPE_FORMAT_R8G8B8_USCALED:
619                 case PIPE_FORMAT_R8G8_USCALED:
620                 case PIPE_FORMAT_R8_USCALED:
621                 case PIPE_FORMAT_R8G8B8A8_SSCALED:
622                 case PIPE_FORMAT_R8G8B8_SSCALED:
623                 case PIPE_FORMAT_R8G8_SSCALED:
624                 case PIPE_FORMAT_R8_SSCALED:
625                 case PIPE_FORMAT_R10G10B10A2_UNORM:
626                 case PIPE_FORMAT_B10G10R10A2_UNORM:
627                 case PIPE_FORMAT_R10G10B10A2_SNORM:
628                 case PIPE_FORMAT_B10G10R10A2_SNORM:
629                 case PIPE_FORMAT_R10G10B10A2_USCALED:
630                 case PIPE_FORMAT_B10G10R10A2_USCALED:
631                 case PIPE_FORMAT_R10G10B10A2_SSCALED:
632                 case PIPE_FORMAT_B10G10R10A2_SSCALED:
633                         break;
634                 default:
635                         return false;
636                 }
637         }
638 
639         /* FORMAT_NONE gets allowed for ARB_framebuffer_no_attachments's probe
640          * of FRAMEBUFFER_MAX_SAMPLES
641          */
642         if ((usage & PIPE_BIND_RENDER_TARGET) &&
643             format != PIPE_FORMAT_NONE &&
644             !v3d_rt_format_supported(&screen->devinfo, format)) {
645                 return false;
646         }
647 
648         if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
649             !v3d_tex_format_supported(&screen->devinfo, format)) {
650                 return false;
651         }
652 
653         if ((usage & PIPE_BIND_DEPTH_STENCIL) &&
654             !(format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
655               format == PIPE_FORMAT_X8Z24_UNORM ||
656               format == PIPE_FORMAT_Z16_UNORM ||
657               format == PIPE_FORMAT_Z32_FLOAT ||
658               format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) {
659                 return false;
660         }
661 
662         if ((usage & PIPE_BIND_INDEX_BUFFER) &&
663             !(format == PIPE_FORMAT_R8_UINT ||
664               format == PIPE_FORMAT_R16_UINT ||
665               format == PIPE_FORMAT_R32_UINT)) {
666                 return false;
667         }
668 
669         if (usage & PIPE_BIND_SHADER_IMAGE) {
670                 switch (format) {
671                 /* FIXME: maybe we can implement a swizzle-on-writes to add
672                  * support for BGRA-alike formats.
673                  */
674                 case PIPE_FORMAT_A4B4G4R4_UNORM:
675                 case PIPE_FORMAT_A1B5G5R5_UNORM:
676                 case PIPE_FORMAT_B5G6R5_UNORM:
677                 case PIPE_FORMAT_B8G8R8A8_UNORM:
678                 case PIPE_FORMAT_X8Z24_UNORM:
679                 case PIPE_FORMAT_Z16_UNORM:
680                         return false;
681                 default:
682                         return true;
683                 }
684         }
685 
686         return true;
687 }
688 
689 static const nir_shader_compiler_options v3d_nir_options = {
690         .lower_uadd_sat = true,
691         .lower_usub_sat = true,
692         .lower_iadd_sat = true,
693         .lower_all_io_to_temps = true,
694         .lower_extract_byte = true,
695         .lower_extract_word = true,
696         .lower_insert_byte = true,
697         .lower_insert_word = true,
698         .lower_bitfield_insert_to_shifts = true,
699         .lower_bitfield_extract_to_shifts = true,
700         .lower_bitfield_reverse = true,
701         .lower_bit_count = true,
702         .lower_cs_local_id_to_index = true,
703         .lower_ffract = true,
704         .lower_fmod = true,
705         .lower_pack_unorm_2x16 = true,
706         .lower_pack_snorm_2x16 = true,
707         .lower_pack_unorm_4x8 = true,
708         .lower_pack_snorm_4x8 = true,
709         .lower_unpack_unorm_4x8 = true,
710         .lower_unpack_snorm_4x8 = true,
711         .lower_pack_half_2x16 = true,
712         .lower_unpack_half_2x16 = true,
713         .lower_pack_32_2x16 = true,
714         .lower_pack_32_2x16_split = true,
715         .lower_unpack_32_2x16_split = true,
716         .lower_fdiv = true,
717         .lower_find_lsb = true,
718         .lower_ffma16 = true,
719         .lower_ffma32 = true,
720         .lower_ffma64 = true,
721         .lower_flrp32 = true,
722         .lower_fpow = true,
723         .lower_fsat = true,
724         .lower_fsqrt = true,
725         .lower_ifind_msb = true,
726         .lower_isign = true,
727         .lower_ldexp = true,
728         .lower_mul_high = true,
729         .lower_wpos_pntc = true,
730         .lower_rotate = true,
731         .lower_to_scalar = true,
732         .lower_int64_options = nir_lower_imul_2x32_64,
733         .has_fsub = true,
734         .has_isub = true,
735         .divergence_analysis_options =
736                 nir_divergence_multiple_workgroup_per_compute_subgroup,
737         /* This will enable loop unrolling in the state tracker so we won't
738          * be able to selectively disable it in backend if it leads to
739          * lower thread counts or TMU spills. Choose a conservative maximum to
740          * limit register pressure impact.
741          */
742         .max_unroll_iterations = 16,
743         .force_indirect_unrolling_sampler = true,
744 };
745 
746 static const void *
v3d_screen_get_compiler_options(struct pipe_screen * pscreen,enum pipe_shader_ir ir,unsigned shader)747 v3d_screen_get_compiler_options(struct pipe_screen *pscreen,
748                                 enum pipe_shader_ir ir, unsigned shader)
749 {
750         return &v3d_nir_options;
751 }
752 
753 static const uint64_t v3d_available_modifiers[] = {
754    DRM_FORMAT_MOD_BROADCOM_UIF,
755    DRM_FORMAT_MOD_LINEAR,
756    DRM_FORMAT_MOD_BROADCOM_SAND128,
757 };
758 
759 static void
v3d_screen_query_dmabuf_modifiers(struct pipe_screen * pscreen,enum pipe_format format,int max,uint64_t * modifiers,unsigned int * external_only,int * count)760 v3d_screen_query_dmabuf_modifiers(struct pipe_screen *pscreen,
761                                   enum pipe_format format, int max,
762                                   uint64_t *modifiers,
763                                   unsigned int *external_only,
764                                   int *count)
765 {
766         int i;
767         int num_modifiers = ARRAY_SIZE(v3d_available_modifiers);
768 
769         /* Expose DRM_FORMAT_MOD_BROADCOM_SAND128 only for PIPE_FORMAT_NV12 */
770         if (format != PIPE_FORMAT_NV12)
771                 num_modifiers--;
772 
773         if (!modifiers) {
774                 *count = num_modifiers;
775                 return;
776         }
777 
778         *count = MIN2(max, num_modifiers);
779         for (i = 0; i < *count; i++) {
780                 modifiers[i] = v3d_available_modifiers[i];
781                 if (external_only)
782                         external_only[i] = util_format_is_yuv(format);
783         }
784 }
785 
786 static bool
v3d_screen_is_dmabuf_modifier_supported(struct pipe_screen * pscreen,uint64_t modifier,enum pipe_format format,bool * external_only)787 v3d_screen_is_dmabuf_modifier_supported(struct pipe_screen *pscreen,
788                                         uint64_t modifier,
789                                         enum pipe_format format,
790                                         bool *external_only)
791 {
792         int i;
793         bool is_sand_col128 = (format == PIPE_FORMAT_NV12) &&
794                 (fourcc_mod_broadcom_mod(modifier) == DRM_FORMAT_MOD_BROADCOM_SAND128);
795 
796         if (is_sand_col128) {
797                 if (external_only)
798                         *external_only = true;
799                 return true;
800         }
801 
802         /* We don't want to generally allow DRM_FORMAT_MOD_BROADCOM_SAND128
803          * modifier, that is the last v3d_available_modifiers. We only accept
804          * it in the case of having a PIPE_FORMAT_NV12.
805          */
806         assert(v3d_available_modifiers[ARRAY_SIZE(v3d_available_modifiers) - 1] ==
807                DRM_FORMAT_MOD_BROADCOM_SAND128);
808         for (i = 0; i < ARRAY_SIZE(v3d_available_modifiers) - 1; i++) {
809                 if (v3d_available_modifiers[i] == modifier) {
810                         if (external_only)
811                                 *external_only = util_format_is_yuv(format);
812 
813                         return true;
814                 }
815         }
816 
817         return false;
818 }
819 
820 static enum pipe_format
v3d_screen_get_compatible_tlb_format(struct pipe_screen * screen,enum pipe_format format)821 v3d_screen_get_compatible_tlb_format(struct pipe_screen *screen,
822                                      enum pipe_format format)
823 {
824         switch (format) {
825         case PIPE_FORMAT_R16G16_UNORM:
826                 return PIPE_FORMAT_R16G16_UINT;
827         default:
828                 return format;
829         }
830 }
831 
832 static struct disk_cache *
v3d_screen_get_disk_shader_cache(struct pipe_screen * pscreen)833 v3d_screen_get_disk_shader_cache(struct pipe_screen *pscreen)
834 {
835         struct v3d_screen *screen = v3d_screen(pscreen);
836 
837         return screen->disk_cache;
838 }
839 
840 struct pipe_screen *
v3d_screen_create(int fd,const struct pipe_screen_config * config,struct renderonly * ro)841 v3d_screen_create(int fd, const struct pipe_screen_config *config,
842                   struct renderonly *ro)
843 {
844         struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen);
845         struct pipe_screen *pscreen;
846 
847         pscreen = &screen->base;
848 
849         pscreen->destroy = v3d_screen_destroy;
850         pscreen->get_param = v3d_screen_get_param;
851         pscreen->get_paramf = v3d_screen_get_paramf;
852         pscreen->get_shader_param = v3d_screen_get_shader_param;
853         pscreen->get_compute_param = v3d_get_compute_param;
854         pscreen->context_create = v3d_context_create;
855         pscreen->is_format_supported = v3d_screen_is_format_supported;
856         pscreen->get_canonical_format = v3d_screen_get_compatible_tlb_format;
857 
858         screen->fd = fd;
859         screen->ro = ro;
860 
861         list_inithead(&screen->bo_cache.time_list);
862         (void)mtx_init(&screen->bo_handles_mutex, mtx_plain);
863         screen->bo_handles = util_hash_table_create_ptr_keys();
864 
865 #if defined(USE_V3D_SIMULATOR)
866         screen->sim_file = v3d_simulator_init(screen->fd);
867 #endif
868 
869         if (!v3d_get_device_info(screen->fd, &screen->devinfo, &v3d_ioctl))
870                 goto fail;
871 
872         driParseConfigFiles(config->options, config->options_info, 0, "v3d",
873                             NULL, NULL, NULL, 0, NULL, 0);
874 
875         /* We have to driCheckOption for the simulator mode to not assertion
876          * fail on not having our XML config.
877          */
878         const char *nonmsaa_name = "v3d_nonmsaa_texture_size_limit";
879         screen->nonmsaa_texture_size_limit =
880                 driCheckOption(config->options, nonmsaa_name, DRI_BOOL) &&
881                 driQueryOptionb(config->options, nonmsaa_name);
882 
883         slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16);
884 
885         screen->has_csd = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CSD);
886         screen->has_cache_flush =
887                 v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CACHE_FLUSH);
888         screen->has_perfmon = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_PERFMON);
889 
890         v3d_fence_init(screen);
891 
892         v3d_process_debug_variable();
893 
894         v3d_resource_screen_init(pscreen);
895 
896         screen->compiler = v3d_compiler_init(&screen->devinfo, 0);
897 
898 #ifdef ENABLE_SHADER_CACHE
899         v3d_disk_cache_init(screen);
900 #endif
901 
902         pscreen->get_name = v3d_screen_get_name;
903         pscreen->get_vendor = v3d_screen_get_vendor;
904         pscreen->get_device_vendor = v3d_screen_get_vendor;
905         pscreen->get_compiler_options = v3d_screen_get_compiler_options;
906         pscreen->get_disk_shader_cache = v3d_screen_get_disk_shader_cache;
907         pscreen->query_dmabuf_modifiers = v3d_screen_query_dmabuf_modifiers;
908         pscreen->is_dmabuf_modifier_supported =
909                 v3d_screen_is_dmabuf_modifier_supported;
910 
911         if (screen->has_perfmon) {
912                 pscreen->get_driver_query_group_info = v3d_get_driver_query_group_info;
913                 pscreen->get_driver_query_info = v3d_get_driver_query_info;
914         }
915 
916         /* Generate the bitmask of supported draw primitives. */
917         screen->prim_types = BITFIELD_BIT(PIPE_PRIM_POINTS) |
918                              BITFIELD_BIT(PIPE_PRIM_LINES) |
919                              BITFIELD_BIT(PIPE_PRIM_LINE_LOOP) |
920                              BITFIELD_BIT(PIPE_PRIM_LINE_STRIP) |
921                              BITFIELD_BIT(PIPE_PRIM_TRIANGLES) |
922                              BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP) |
923                              BITFIELD_BIT(PIPE_PRIM_TRIANGLE_FAN) |
924                              BITFIELD_BIT(PIPE_PRIM_LINES_ADJACENCY) |
925                              BITFIELD_BIT(PIPE_PRIM_LINE_STRIP_ADJACENCY) |
926                              BITFIELD_BIT(PIPE_PRIM_TRIANGLES_ADJACENCY) |
927                              BITFIELD_BIT(PIPE_PRIM_TRIANGLE_STRIP_ADJACENCY);
928 
929         return pscreen;
930 
931 fail:
932         close(fd);
933         ralloc_free(pscreen);
934         return NULL;
935 }
936