• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /**************************************************************************
2  *
3  * Copyright 2010-2012 VMware, Inc.
4  * All Rights Reserved.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
18  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
19  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
20  * USE OR OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * The above copyright notice and this permission notice (including the
23  * next paragraph) shall be included in all copies or substantial portions
24  * of the Software.
25  *
26  **************************************************************************/
27 
28 
29 #ifndef LP_BLD_LIMITS_H_
30 #define LP_BLD_LIMITS_H_
31 
32 
33 #include <limits.h>
34 
35 #include "pipe/p_state.h"
36 #include "pipe/p_defines.h"
37 #include "util/u_cpu_detect.h"
38 
39 /*
40  * TGSI translation limits.
41  *
42  * Some are slightly above SM 3.0 requirements to give some wiggle room to
43  * the gallium frontends.
44  */
45 
46 #define LP_MAX_TGSI_TEMPS 4096
47 
48 #define LP_MAX_TGSI_ADDRS 16
49 
50 #define LP_MAX_TGSI_IMMEDIATES 4096
51 
52 #define LP_MAX_TGSI_CONSTS 4096
53 
54 #define LP_MAX_TGSI_CONST_BUFFERS 16
55 
56 #define LP_MAX_TGSI_CONST_BUFFER_SIZE (LP_MAX_TGSI_CONSTS * sizeof(float[4]))
57 
58 #define LP_MAX_TGSI_SHADER_BUFFERS 16
59 
60 #define LP_MAX_TGSI_SHADER_BUFFER_SIZE (1 << 27)
61 
62 #define LP_MAX_TGSI_SHADER_IMAGES 16
63 
64 /*
65  * For quick access we cache registers in statically
66  * allocated arrays. Here we define the maximum size
67  * for those arrays.
68  */
69 #define LP_MAX_INLINED_TEMPS 256
70 
71 #define LP_MAX_INLINED_IMMEDIATES 256
72 
73 /**
74  * Maximum control flow nesting
75  *
76  * Vulkan CTS tests seem to have up to 76 levels. Add a few for safety.
77  * SM4.0 requires 64 (per subroutine actually, subroutine nesting itself is 32)
78  * SM3.0 requires 24 (most likely per subroutine too)
79  * add 2 more (some translation could add one more)
80  */
81 #define LP_MAX_TGSI_NESTING 80
82 
83 /**
84  * Maximum iterations before loop termination
85  * Shared between every loop in a TGSI shader
86  */
87 #define LP_MAX_TGSI_LOOP_ITERATIONS 65535
88 
89 static inline bool
lp_has_fp16(void)90 lp_has_fp16(void)
91 {
92    return util_get_cpu_caps()->has_f16c;
93 }
94 
95 /**
96  * Some of these limits are actually infinite (i.e., only limited by available
97  * memory), however advertising INT_MAX would cause some test problems to
98  * actually try to allocate the maximum and run out of memory and crash.  So
99  * stick with something reasonable here.
100  */
101 static inline int
gallivm_get_shader_param(enum pipe_shader_cap param)102 gallivm_get_shader_param(enum pipe_shader_cap param)
103 {
104    switch(param) {
105    case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
106    case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
107    case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
108    case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
109       return 1 * 1024 * 1024;
110    case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
111       return LP_MAX_TGSI_NESTING;
112    case PIPE_SHADER_CAP_MAX_INPUTS:
113       return 32;
114    case PIPE_SHADER_CAP_MAX_OUTPUTS:
115       return 32;
116    case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
117       return LP_MAX_TGSI_CONST_BUFFER_SIZE;
118    case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
119       return LP_MAX_TGSI_CONST_BUFFERS;
120    case PIPE_SHADER_CAP_MAX_TEMPS:
121       return LP_MAX_TGSI_TEMPS;
122    case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
123       return 1;
124    case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
125    case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
126    case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
127    case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
128       return 1;
129    case PIPE_SHADER_CAP_SUBROUTINES:
130       return 1;
131    case PIPE_SHADER_CAP_INTEGERS:
132       return 1;
133    case PIPE_SHADER_CAP_FP16:
134    case PIPE_SHADER_CAP_FP16_DERIVATIVES:
135    case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
136       return lp_has_fp16();
137    case PIPE_SHADER_CAP_INT64_ATOMICS:
138       return 0;
139    case PIPE_SHADER_CAP_INT16:
140    case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
141       return 1;
142    case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
143       return PIPE_MAX_SAMPLERS;
144    case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
145       return PIPE_MAX_SHADER_SAMPLER_VIEWS;
146    case PIPE_SHADER_CAP_PREFERRED_IR:
147       return PIPE_SHADER_IR_TGSI;
148    case PIPE_SHADER_CAP_SUPPORTED_IRS:
149       return (1 << PIPE_SHADER_IR_TGSI) | (1 << PIPE_SHADER_IR_NIR);
150    case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
151    case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
152       return 1;
153    case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
154    case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
155    case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
156    case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
157    case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
158    case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
159    case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
160    case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
161       return 0;
162    case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
163       return 32;
164    case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
165       return LP_MAX_TGSI_SHADER_BUFFERS;
166    case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
167       return LP_MAX_TGSI_SHADER_IMAGES;
168    }
169    /* if we get here, we missed a shader cap above (and should have seen
170     * a compiler warning.)
171     */
172    return 0;
173 }
174 
175 
176 #endif /* LP_BLD_LIMITS_H_ */
177