1 /**************************************************************************
2 *
3 * Copyright 2010-2012 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
18 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
19 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
20 * USE OR OTHER DEALINGS IN THE SOFTWARE.
21 *
22 * The above copyright notice and this permission notice (including the
23 * next paragraph) shall be included in all copies or substantial portions
24 * of the Software.
25 *
26 **************************************************************************/
27
28
29 #ifndef LP_BLD_LIMITS_H_
30 #define LP_BLD_LIMITS_H_
31
32
33 #include <limits.h>
34
35 #include "pipe/p_state.h"
36 #include "pipe/p_defines.h"
37 #include "util/u_cpu_detect.h"
38
/*
 * llvmpipe shader limits
 *
 * Several of these values are what gallivm_get_shader_param() reports for
 * the corresponding PIPE_SHADER_CAP_* queries.
 */

/* Reported for PIPE_SHADER_CAP_MAX_TEMPS. */
#define LP_MAX_TGSI_TEMPS 4096

#define LP_MAX_TGSI_ADDRS 16

#define LP_MAX_TGSI_IMMEDIATES 4096

/* Number of float[4] entries used to size LP_MAX_TGSI_CONST_BUFFER_SIZE. */
#define LP_MAX_TGSI_CONSTS 4096

/* Reported for PIPE_SHADER_CAP_MAX_CONST_BUFFERS. */
#define LP_MAX_TGSI_CONST_BUFFERS 16

/*
 * Size in bytes of LP_MAX_TGSI_CONSTS float[4] entries
 * (4096 * sizeof(float[4])); reported for
 * PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE.
 *
 * Note the expression has type size_t because of the sizeof operand.
 */
#define LP_MAX_TGSI_CONST_BUFFER_SIZE (LP_MAX_TGSI_CONSTS * sizeof(float[4]))

/* Reported for PIPE_SHADER_CAP_MAX_SHADER_BUFFERS. */
#define LP_MAX_TGSI_SHADER_BUFFERS 32

/* 1 << 27 == 134217728; presumably a byte count (128 MiB) - TODO confirm. */
#define LP_MAX_TGSI_SHADER_BUFFER_SIZE (1 << 27)

/* Reported for PIPE_SHADER_CAP_MAX_SHADER_IMAGES. */
#define LP_MAX_TGSI_SHADER_IMAGES 64

/*
 * For quick access we cache registers in statically
 * allocated arrays. Here we define the maximum size
 * for those arrays.
 */
#define LP_MAX_INLINED_TEMPS 256

#define LP_MAX_INLINED_IMMEDIATES 256

/**
 * Maximum control flow nesting
 *
 * Vulkan CTS tests seem to have up to 76 levels. Add a few for safety.
 * SM4.0 requires 64 (per subroutine actually, subroutine nesting itself is 32)
 * SM3.0 requires 24 (most likely per subroutine too)
 * add 2 more (some translation could add one more)
 *
 * Reported for PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH.
 */
#define LP_MAX_TGSI_NESTING 80

/**
 * Maximum iterations before loop termination
 * Shared between every loop in a TGSI shader
 */
#define LP_MAX_TGSI_LOOP_ITERATIONS 65535
85
86 static inline bool
lp_has_fp16(void)87 lp_has_fp16(void)
88 {
89 return util_get_cpu_caps()->has_f16c || DETECT_ARCH_AARCH64;
90 }
91
92 /**
93 * Some of these limits are actually infinite (i.e., only limited by available
94 * memory), however advertising INT_MAX would cause some test problems to
95 * actually try to allocate the maximum and run out of memory and crash. So
96 * stick with something reasonable here.
97 */
98 static inline int
gallivm_get_shader_param(enum pipe_shader_cap param)99 gallivm_get_shader_param(enum pipe_shader_cap param)
100 {
101 switch(param) {
102 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
103 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
104 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
105 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
106 return 1 * 1024 * 1024;
107 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
108 return LP_MAX_TGSI_NESTING;
109 case PIPE_SHADER_CAP_MAX_INPUTS:
110 return 32;
111 case PIPE_SHADER_CAP_MAX_OUTPUTS:
112 return 32;
113 case PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE:
114 return LP_MAX_TGSI_CONST_BUFFER_SIZE;
115 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
116 return LP_MAX_TGSI_CONST_BUFFERS;
117 case PIPE_SHADER_CAP_MAX_TEMPS:
118 return LP_MAX_TGSI_TEMPS;
119 case PIPE_SHADER_CAP_CONT_SUPPORTED:
120 return 1;
121 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
122 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
123 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
124 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
125 return 1;
126 case PIPE_SHADER_CAP_SUBROUTINES:
127 return 1;
128 case PIPE_SHADER_CAP_INTEGERS:
129 return 1;
130 case PIPE_SHADER_CAP_FP16:
131 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
132 return lp_has_fp16();
133 //enabling this breaks GTF-GL46.gtf21.GL2Tests.glGetUniform.glGetUniform
134 case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
135 return 0;
136 case PIPE_SHADER_CAP_INT64_ATOMICS:
137 return 0;
138 case PIPE_SHADER_CAP_INT16:
139 case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
140 return 1;
141 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
142 return PIPE_MAX_SAMPLERS;
143 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
144 return PIPE_MAX_SHADER_SAMPLER_VIEWS;
145 case PIPE_SHADER_CAP_SUPPORTED_IRS:
146 return (1 << PIPE_SHADER_IR_TGSI) | (1 << PIPE_SHADER_IR_NIR);
147 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
148 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
149 return 1;
150 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
151 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
152 return 0;
153 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
154 return LP_MAX_TGSI_SHADER_BUFFERS;
155 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
156 return LP_MAX_TGSI_SHADER_IMAGES;
157 }
158 /* if we get here, we missed a shader cap above (and should have seen
159 * a compiler warning.)
160 */
161 return 0;
162 }
163
164
165 #endif /* LP_BLD_LIMITS_H_ */
166