xref: /aosp_15_r20/external/mesa3d/src/gallium/drivers/vc4/vc4_state.c (revision 6104692788411f58d303aa86923a9ff6ecaded22)
1 /*
2  * Copyright © 2014 Broadcom
3  * Copyright (C) 2012 Rob Clark <[email protected]>
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the "Software"),
7  * to deal in the Software without restriction, including without limitation
8  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9  * and/or sell copies of the Software, and to permit persons to whom the
10  * Software is furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice (including the next
13  * paragraph) shall be included in all copies or substantial portions of the
14  * Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22  * IN THE SOFTWARE.
23  */
24 
25 #include "pipe/p_state.h"
26 #include "util/u_framebuffer.h"
27 #include "util/u_inlines.h"
28 #include "util/u_math.h"
29 #include "util/u_memory.h"
30 #include "util/u_helpers.h"
31 
32 #include "vc4_context.h"
33 
34 static void *
vc4_generic_cso_state_create(const void * src,uint32_t size)35 vc4_generic_cso_state_create(const void *src, uint32_t size)
36 {
37         void *dst = calloc(1, size);
38         if (!dst)
39                 return NULL;
40         memcpy(dst, src, size);
41         return dst;
42 }
43 
44 static void
vc4_generic_cso_state_delete(struct pipe_context * pctx,void * hwcso)45 vc4_generic_cso_state_delete(struct pipe_context *pctx, void *hwcso)
46 {
47         free(hwcso);
48 }
49 
50 static void
vc4_set_blend_color(struct pipe_context * pctx,const struct pipe_blend_color * blend_color)51 vc4_set_blend_color(struct pipe_context *pctx,
52                     const struct pipe_blend_color *blend_color)
53 {
54         struct vc4_context *vc4 = vc4_context(pctx);
55         vc4->blend_color.f = *blend_color;
56         for (int i = 0; i < 4; i++)
57                 vc4->blend_color.ub[i] = float_to_ubyte(blend_color->color[i]);
58         vc4->dirty |= VC4_DIRTY_BLEND_COLOR;
59 }
60 
61 static void
vc4_set_stencil_ref(struct pipe_context * pctx,const struct pipe_stencil_ref stencil_ref)62 vc4_set_stencil_ref(struct pipe_context *pctx,
63                     const struct pipe_stencil_ref stencil_ref)
64 {
65         struct vc4_context *vc4 = vc4_context(pctx);
66         vc4->stencil_ref = stencil_ref;
67         vc4->dirty |= VC4_DIRTY_STENCIL_REF;
68 }
69 
70 static void
vc4_set_clip_state(struct pipe_context * pctx,const struct pipe_clip_state * clip)71 vc4_set_clip_state(struct pipe_context *pctx,
72                    const struct pipe_clip_state *clip)
73 {
74         struct vc4_context *vc4 = vc4_context(pctx);
75         vc4->clip = *clip;
76         vc4->dirty |= VC4_DIRTY_CLIP;
77 }
78 
79 static void
vc4_set_sample_mask(struct pipe_context * pctx,unsigned sample_mask)80 vc4_set_sample_mask(struct pipe_context *pctx, unsigned sample_mask)
81 {
82         struct vc4_context *vc4 = vc4_context(pctx);
83         vc4->sample_mask = sample_mask & ((1 << VC4_MAX_SAMPLES) - 1);
84         vc4->dirty |= VC4_DIRTY_SAMPLE_MASK;
85 }
86 
87 static uint16_t
float_to_187_half(float f)88 float_to_187_half(float f)
89 {
90         return fui(f) >> 16;
91 }
92 
93 static void *
vc4_create_rasterizer_state(struct pipe_context * pctx,const struct pipe_rasterizer_state * cso)94 vc4_create_rasterizer_state(struct pipe_context *pctx,
95                             const struct pipe_rasterizer_state *cso)
96 {
97         struct vc4_rasterizer_state *so;
98         struct V3D21_DEPTH_OFFSET depth_offset = { V3D21_DEPTH_OFFSET_header };
99         struct V3D21_POINT_SIZE point_size = { V3D21_POINT_SIZE_header };
100         struct V3D21_LINE_WIDTH line_width = { V3D21_LINE_WIDTH_header };
101 
102         so = CALLOC_STRUCT(vc4_rasterizer_state);
103         if (!so)
104                 return NULL;
105 
106         so->base = *cso;
107 
108         if (!(cso->cull_face & PIPE_FACE_FRONT))
109                 so->config_bits[0] |= VC4_CONFIG_BITS_ENABLE_PRIM_FRONT;
110         if (!(cso->cull_face & PIPE_FACE_BACK))
111                 so->config_bits[0] |= VC4_CONFIG_BITS_ENABLE_PRIM_BACK;
112 
113         /* Workaround: HW-2726 PTB does not handle zero-size points (BCM2835,
114          * BCM21553).
115          */
116         point_size.point_size = MAX2(cso->point_size, .125f);
117 
118         line_width.line_width = cso->line_width;
119 
120         if (cso->front_ccw)
121                 so->config_bits[0] |= VC4_CONFIG_BITS_CW_PRIMITIVES;
122 
123         if (cso->offset_tri) {
124                 so->config_bits[0] |= VC4_CONFIG_BITS_ENABLE_DEPTH_OFFSET;
125 
126                 depth_offset.depth_offset_units =
127                         float_to_187_half(cso->offset_units);
128                 depth_offset.depth_offset_factor =
129                         float_to_187_half(cso->offset_scale);
130         }
131 
132         if (cso->multisample)
133                 so->config_bits[0] |= VC4_CONFIG_BITS_RASTERIZER_OVERSAMPLE_4X;
134 
135         V3D21_DEPTH_OFFSET_pack(NULL, so->packed.depth_offset, &depth_offset);
136         V3D21_POINT_SIZE_pack(NULL, so->packed.point_size, &point_size);
137         V3D21_LINE_WIDTH_pack(NULL, so->packed.line_width, &line_width);
138 
139         if (cso->tile_raster_order_fixed) {
140                 so->tile_raster_order_flags |= VC4_SUBMIT_CL_FIXED_RCL_ORDER;
141                 if (cso->tile_raster_order_increasing_x) {
142                         so->tile_raster_order_flags |=
143                                 VC4_SUBMIT_CL_RCL_ORDER_INCREASING_X;
144                 }
145                 if (cso->tile_raster_order_increasing_y) {
146                         so->tile_raster_order_flags |=
147                                 VC4_SUBMIT_CL_RCL_ORDER_INCREASING_Y;
148                 }
149         }
150 
151         return so;
152 }
153 
154 /* Blend state is baked into shaders. */
155 static void *
vc4_create_blend_state(struct pipe_context * pctx,const struct pipe_blend_state * cso)156 vc4_create_blend_state(struct pipe_context *pctx,
157                        const struct pipe_blend_state *cso)
158 {
159         return vc4_generic_cso_state_create(cso, sizeof(*cso));
160 }
161 
162 /**
163  * The TLB_STENCIL_SETUP data has a little bitfield for common writemask
164  * values, so you don't have to do a separate writemask setup.
165  */
166 static uint8_t
tlb_stencil_setup_writemask(uint8_t mask)167 tlb_stencil_setup_writemask(uint8_t mask)
168 {
169         switch (mask) {
170         case 0x1: return 0;
171         case 0x3: return 1;
172         case 0xf: return 2;
173         case 0xff: return 3;
174         default: return 0xff;
175         }
176 }
177 
178 static uint32_t
tlb_stencil_setup_bits(const struct pipe_stencil_state * state,uint8_t writemask_bits)179 tlb_stencil_setup_bits(const struct pipe_stencil_state *state,
180                        uint8_t writemask_bits)
181 {
182         static const uint8_t op_map[] = {
183                 [PIPE_STENCIL_OP_ZERO] = 0,
184                 [PIPE_STENCIL_OP_KEEP] = 1,
185                 [PIPE_STENCIL_OP_REPLACE] = 2,
186                 [PIPE_STENCIL_OP_INCR] = 3,
187                 [PIPE_STENCIL_OP_DECR] = 4,
188                 [PIPE_STENCIL_OP_INVERT] = 5,
189                 [PIPE_STENCIL_OP_INCR_WRAP] = 6,
190                 [PIPE_STENCIL_OP_DECR_WRAP] = 7,
191         };
192         uint32_t bits = 0;
193 
194         if (writemask_bits != 0xff)
195                 bits |= writemask_bits << 28;
196         bits |= op_map[state->zfail_op] << 25;
197         bits |= op_map[state->zpass_op] << 22;
198         bits |= op_map[state->fail_op] << 19;
199         bits |= state->func << 16;
200         /* Ref is filled in at uniform upload time */
201         bits |= state->valuemask << 0;
202 
203         return bits;
204 }
205 
206 static void *
vc4_create_depth_stencil_alpha_state(struct pipe_context * pctx,const struct pipe_depth_stencil_alpha_state * cso)207 vc4_create_depth_stencil_alpha_state(struct pipe_context *pctx,
208                                      const struct pipe_depth_stencil_alpha_state *cso)
209 {
210         struct vc4_depth_stencil_alpha_state *so;
211 
212         so = CALLOC_STRUCT(vc4_depth_stencil_alpha_state);
213         if (!so)
214                 return NULL;
215 
216         so->base = *cso;
217 
218         /* We always keep the early Z state correct, since a later state using
219          * early Z may want it.
220          */
221         so->config_bits[2] |= VC4_CONFIG_BITS_EARLY_Z_UPDATE;
222 
223         if (cso->depth_enabled) {
224                 if (cso->depth_writemask) {
225                         so->config_bits[1] |= VC4_CONFIG_BITS_Z_UPDATE;
226                 }
227                 so->config_bits[1] |= (cso->depth_func <<
228                                        VC4_CONFIG_BITS_DEPTH_FUNC_SHIFT);
229 
230                 /* We only handle early Z in the < direction because otherwise
231                  * we'd have to runtime guess which direction to set in the
232                  * render config.
233                  */
234                 if ((cso->depth_func == PIPE_FUNC_LESS ||
235                      cso->depth_func == PIPE_FUNC_LEQUAL) &&
236                     (!cso->stencil[0].enabled ||
237                      (cso->stencil[0].zfail_op == PIPE_STENCIL_OP_KEEP &&
238                       (!cso->stencil[1].enabled ||
239                        cso->stencil[1].zfail_op == PIPE_STENCIL_OP_KEEP)))) {
240                         so->config_bits[2] |= VC4_CONFIG_BITS_EARLY_Z;
241                 }
242         } else {
243                 so->config_bits[1] |= (PIPE_FUNC_ALWAYS <<
244                                        VC4_CONFIG_BITS_DEPTH_FUNC_SHIFT);
245         }
246 
247         if (cso->stencil[0].enabled) {
248                 const struct pipe_stencil_state *front = &cso->stencil[0];
249                 const struct pipe_stencil_state *back = &cso->stencil[1];
250 
251                 uint8_t front_writemask_bits =
252                         tlb_stencil_setup_writemask(front->writemask);
253                 uint8_t back_writemask = front->writemask;
254                 uint8_t back_writemask_bits = front_writemask_bits;
255 
256                 so->stencil_uniforms[0] =
257                         tlb_stencil_setup_bits(front, front_writemask_bits);
258                 if (back->enabled) {
259                         back_writemask = back->writemask;
260                         back_writemask_bits =
261                                 tlb_stencil_setup_writemask(back->writemask);
262 
263                         so->stencil_uniforms[0] |= (UINT32_C(1) << 30);
264                         so->stencil_uniforms[1] =
265                                 tlb_stencil_setup_bits(back, back_writemask_bits);
266                         so->stencil_uniforms[1] |= (UINT32_C(2) << 30);
267                 } else {
268                         so->stencil_uniforms[0] |= (UINT32_C(3) << 30);
269                 }
270 
271                 if (front_writemask_bits == 0xff ||
272                     back_writemask_bits == 0xff) {
273                         so->stencil_uniforms[2] = (front->writemask |
274                                                    (back_writemask << 8));
275                 }
276         }
277 
278         return so;
279 }
280 
281 static void
vc4_set_polygon_stipple(struct pipe_context * pctx,const struct pipe_poly_stipple * stipple)282 vc4_set_polygon_stipple(struct pipe_context *pctx,
283                         const struct pipe_poly_stipple *stipple)
284 {
285         struct vc4_context *vc4 = vc4_context(pctx);
286         vc4->stipple = *stipple;
287         vc4->dirty |= VC4_DIRTY_STIPPLE;
288 }
289 
290 static void
vc4_set_scissor_states(struct pipe_context * pctx,unsigned start_slot,unsigned num_scissors,const struct pipe_scissor_state * scissor)291 vc4_set_scissor_states(struct pipe_context *pctx,
292                        unsigned start_slot,
293                        unsigned num_scissors,
294                        const struct pipe_scissor_state *scissor)
295 {
296         struct vc4_context *vc4 = vc4_context(pctx);
297 
298         vc4->scissor = *scissor;
299         vc4->dirty |= VC4_DIRTY_SCISSOR;
300 }
301 
302 static void
vc4_set_viewport_states(struct pipe_context * pctx,unsigned start_slot,unsigned num_viewports,const struct pipe_viewport_state * viewport)303 vc4_set_viewport_states(struct pipe_context *pctx,
304                         unsigned start_slot,
305                         unsigned num_viewports,
306                         const struct pipe_viewport_state *viewport)
307 {
308         struct vc4_context *vc4 = vc4_context(pctx);
309         vc4->viewport = *viewport;
310         vc4->dirty |= VC4_DIRTY_VIEWPORT;
311 }
312 
313 static void
vc4_set_vertex_buffers(struct pipe_context * pctx,unsigned count,const struct pipe_vertex_buffer * vb)314 vc4_set_vertex_buffers(struct pipe_context *pctx,
315                        unsigned count,
316                        const struct pipe_vertex_buffer *vb)
317 {
318         struct vc4_context *vc4 = vc4_context(pctx);
319         struct vc4_vertexbuf_stateobj *so = &vc4->vertexbuf;
320 
321         util_set_vertex_buffers_mask(so->vb, &so->enabled_mask, vb,
322                                      count, true);
323         so->count = util_last_bit(so->enabled_mask);
324 
325         vc4->dirty |= VC4_DIRTY_VTXBUF;
326 }
327 
328 static void
vc4_blend_state_bind(struct pipe_context * pctx,void * hwcso)329 vc4_blend_state_bind(struct pipe_context *pctx, void *hwcso)
330 {
331         struct vc4_context *vc4 = vc4_context(pctx);
332         vc4->blend = hwcso;
333         vc4->dirty |= VC4_DIRTY_BLEND;
334 }
335 
336 static void
vc4_rasterizer_state_bind(struct pipe_context * pctx,void * hwcso)337 vc4_rasterizer_state_bind(struct pipe_context *pctx, void *hwcso)
338 {
339         struct vc4_context *vc4 = vc4_context(pctx);
340         struct vc4_rasterizer_state *rast = hwcso;
341 
342         if (vc4->rasterizer && rast &&
343             vc4->rasterizer->base.flatshade != rast->base.flatshade) {
344                 vc4->dirty |= VC4_DIRTY_FLAT_SHADE_FLAGS;
345         }
346 
347         vc4->rasterizer = hwcso;
348         vc4->dirty |= VC4_DIRTY_RASTERIZER;
349 }
350 
351 static void
vc4_zsa_state_bind(struct pipe_context * pctx,void * hwcso)352 vc4_zsa_state_bind(struct pipe_context *pctx, void *hwcso)
353 {
354         struct vc4_context *vc4 = vc4_context(pctx);
355         vc4->zsa = hwcso;
356         vc4->dirty |= VC4_DIRTY_ZSA;
357 }
358 
359 static void *
vc4_vertex_state_create(struct pipe_context * pctx,unsigned num_elements,const struct pipe_vertex_element * elements)360 vc4_vertex_state_create(struct pipe_context *pctx, unsigned num_elements,
361                         const struct pipe_vertex_element *elements)
362 {
363         struct vc4_vertex_stateobj *so = CALLOC_STRUCT(vc4_vertex_stateobj);
364 
365         if (!so)
366                 return NULL;
367 
368         memcpy(so->pipe, elements, sizeof(*elements) * num_elements);
369         so->num_elements = num_elements;
370 
371         return so;
372 }
373 
374 static void
vc4_vertex_state_bind(struct pipe_context * pctx,void * hwcso)375 vc4_vertex_state_bind(struct pipe_context *pctx, void *hwcso)
376 {
377         struct vc4_context *vc4 = vc4_context(pctx);
378         vc4->vtx = hwcso;
379         vc4->dirty |= VC4_DIRTY_VTXSTATE;
380 }
381 
382 static void
vc4_set_constant_buffer(struct pipe_context * pctx,enum pipe_shader_type shader,uint index,bool take_ownership,const struct pipe_constant_buffer * cb)383 vc4_set_constant_buffer(struct pipe_context *pctx,
384                         enum pipe_shader_type shader, uint index,
385                         bool take_ownership,
386                         const struct pipe_constant_buffer *cb)
387 {
388         struct vc4_context *vc4 = vc4_context(pctx);
389         struct vc4_constbuf_stateobj *so = &vc4->constbuf[shader];
390 
391         /* Note that the gallium frontend can unbind constant buffers by
392          * passing NULL here.
393          */
394         if (unlikely(!cb)) {
395                 so->enabled_mask &= ~(1 << index);
396                 so->dirty_mask &= ~(1 << index);
397                 return;
398         }
399 
400         if (index == 1 && so->cb[index].buffer_size != cb->buffer_size)
401                 vc4->dirty |= VC4_DIRTY_UBO_1_SIZE;
402 
403         util_copy_constant_buffer(&so->cb[index], cb, take_ownership);
404 
405         so->enabled_mask |= 1 << index;
406         so->dirty_mask |= 1 << index;
407         vc4->dirty |= VC4_DIRTY_CONSTBUF;
408 }
409 
410 static void
vc4_set_framebuffer_state(struct pipe_context * pctx,const struct pipe_framebuffer_state * framebuffer)411 vc4_set_framebuffer_state(struct pipe_context *pctx,
412                           const struct pipe_framebuffer_state *framebuffer)
413 {
414         struct vc4_context *vc4 = vc4_context(pctx);
415         struct pipe_framebuffer_state *cso = &vc4->framebuffer;
416 
417         vc4->job = NULL;
418 
419         util_copy_framebuffer_state(cso, framebuffer);
420 
421         /* Nonzero texture mipmap levels are laid out as if they were in
422          * power-of-two-sized spaces.  The renderbuffer config infers its
423          * stride from the width parameter, so we need to configure our
424          * framebuffer.  Note that if the z/color buffers were mismatched
425          * sizes, we wouldn't be able to do this.
426          */
427         if (cso->cbufs[0] && cso->cbufs[0]->u.tex.level) {
428                 struct vc4_resource *rsc =
429                         vc4_resource(cso->cbufs[0]->texture);
430                 cso->width =
431                         (rsc->slices[cso->cbufs[0]->u.tex.level].stride /
432                          rsc->cpp);
433         } else if (cso->zsbuf && cso->zsbuf->u.tex.level){
434                 struct vc4_resource *rsc =
435                         vc4_resource(cso->zsbuf->texture);
436                 cso->width =
437                         (rsc->slices[cso->zsbuf->u.tex.level].stride /
438                          rsc->cpp);
439         }
440 
441         vc4->dirty |= VC4_DIRTY_FRAMEBUFFER;
442 }
443 
444 static struct vc4_texture_stateobj *
vc4_get_stage_tex(struct vc4_context * vc4,enum pipe_shader_type shader)445 vc4_get_stage_tex(struct vc4_context *vc4, enum pipe_shader_type shader)
446 {
447         switch (shader) {
448         case PIPE_SHADER_FRAGMENT:
449                 vc4->dirty |= VC4_DIRTY_FRAGTEX;
450                 return &vc4->fragtex;
451                 break;
452         case PIPE_SHADER_VERTEX:
453                 vc4->dirty |= VC4_DIRTY_VERTTEX;
454                 return &vc4->verttex;
455                 break;
456         default:
457                 fprintf(stderr, "Unknown shader target %d\n", shader);
458                 abort();
459         }
460 }
461 
translate_wrap(uint32_t p_wrap,bool using_nearest)462 static uint32_t translate_wrap(uint32_t p_wrap, bool using_nearest)
463 {
464         switch (p_wrap) {
465         case PIPE_TEX_WRAP_REPEAT:
466                 return 0;
467         case PIPE_TEX_WRAP_CLAMP_TO_EDGE:
468                 return 1;
469         case PIPE_TEX_WRAP_MIRROR_REPEAT:
470                 return 2;
471         case PIPE_TEX_WRAP_CLAMP_TO_BORDER:
472                 return 3;
473         case PIPE_TEX_WRAP_CLAMP:
474                 return (using_nearest ? 1 : 3);
475         default:
476                 fprintf(stderr, "Unknown wrap mode %d\n", p_wrap);
477                 assert(!"not reached");
478                 return 0;
479         }
480 }
481 
482 static void *
vc4_create_sampler_state(struct pipe_context * pctx,const struct pipe_sampler_state * cso)483 vc4_create_sampler_state(struct pipe_context *pctx,
484                          const struct pipe_sampler_state *cso)
485 {
486         static const uint8_t minfilter_map[6] = {
487                 VC4_TEX_P1_MINFILT_NEAR_MIP_NEAR,
488                 VC4_TEX_P1_MINFILT_LIN_MIP_NEAR,
489                 VC4_TEX_P1_MINFILT_NEAR_MIP_LIN,
490                 VC4_TEX_P1_MINFILT_LIN_MIP_LIN,
491                 VC4_TEX_P1_MINFILT_NEAREST,
492                 VC4_TEX_P1_MINFILT_LINEAR,
493         };
494         static const uint32_t magfilter_map[] = {
495                 [PIPE_TEX_FILTER_NEAREST] = VC4_TEX_P1_MAGFILT_NEAREST,
496                 [PIPE_TEX_FILTER_LINEAR] = VC4_TEX_P1_MAGFILT_LINEAR,
497         };
498         bool either_nearest =
499                 (cso->mag_img_filter == PIPE_TEX_MIPFILTER_NEAREST ||
500                  cso->min_img_filter == PIPE_TEX_MIPFILTER_NEAREST);
501         struct vc4_sampler_state *so = CALLOC_STRUCT(vc4_sampler_state);
502 
503         if (!so)
504                 return NULL;
505 
506         memcpy(so, cso, sizeof(*cso));
507 
508         so->texture_p1 =
509                 (VC4_SET_FIELD(magfilter_map[cso->mag_img_filter],
510                                VC4_TEX_P1_MAGFILT) |
511                  VC4_SET_FIELD(minfilter_map[cso->min_mip_filter * 2 +
512                                              cso->min_img_filter],
513                                VC4_TEX_P1_MINFILT) |
514                  VC4_SET_FIELD(translate_wrap(cso->wrap_s, either_nearest),
515                                VC4_TEX_P1_WRAP_S) |
516                  VC4_SET_FIELD(translate_wrap(cso->wrap_t, either_nearest),
517                                VC4_TEX_P1_WRAP_T));
518 
519         return so;
520 }
521 
522 static void
vc4_sampler_states_bind(struct pipe_context * pctx,enum pipe_shader_type shader,unsigned start,unsigned nr,void ** hwcso)523 vc4_sampler_states_bind(struct pipe_context *pctx,
524                         enum pipe_shader_type shader, unsigned start,
525                         unsigned nr, void **hwcso)
526 {
527         struct vc4_context *vc4 = vc4_context(pctx);
528         struct vc4_texture_stateobj *stage_tex = vc4_get_stage_tex(vc4, shader);
529 
530         assert(start == 0);
531         unsigned i;
532         unsigned new_nr = 0;
533 
534         for (i = 0; i < nr; i++) {
535                 if (hwcso[i])
536                         new_nr = i + 1;
537                 stage_tex->samplers[i] = hwcso[i];
538         }
539 
540         for (; i < stage_tex->num_samplers; i++) {
541                 stage_tex->samplers[i] = NULL;
542         }
543 
544         stage_tex->num_samplers = new_nr;
545 }
546 
547 static struct pipe_sampler_view *
vc4_create_sampler_view(struct pipe_context * pctx,struct pipe_resource * prsc,const struct pipe_sampler_view * cso)548 vc4_create_sampler_view(struct pipe_context *pctx, struct pipe_resource *prsc,
549                         const struct pipe_sampler_view *cso)
550 {
551         struct vc4_sampler_view *so = CALLOC_STRUCT(vc4_sampler_view);
552         struct vc4_resource *rsc = vc4_resource(prsc);
553 
554         if (!so)
555                 return NULL;
556 
557         so->base = *cso;
558 
559         so->base.texture = NULL;
560         pipe_resource_reference(&so->base.texture, prsc);
561         so->base.reference.count = 1;
562         so->base.context = pctx;
563 
564         /* There is no hardware level clamping, and the start address of a
565          * texture may be misaligned, so in that case we have to copy to a
566          * temporary.
567          *
568          * Also, Raspberry Pi doesn't support sampling from raster textures,
569          * so we also have to copy to a temporary then.
570          */
571         if ((cso->u.tex.first_level &&
572              (cso->u.tex.first_level != cso->u.tex.last_level)) ||
573             rsc->vc4_format == VC4_TEXTURE_TYPE_RGBA32R ||
574             rsc->vc4_format == ~0) {
575                 struct vc4_resource *shadow_parent = rsc;
576                 struct pipe_resource tmpl = {
577                         .target = prsc->target,
578                         .format = prsc->format,
579                         .width0 = u_minify(prsc->width0,
580                                            cso->u.tex.first_level),
581                         .height0 = u_minify(prsc->height0,
582                                             cso->u.tex.first_level),
583                         .bind = PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_RENDER_TARGET,
584                         .last_level = cso->u.tex.last_level - cso->u.tex.first_level,
585                         .nr_samples = prsc->nr_samples,
586                 };
587 
588                 /* Create the shadow texture.  The rest of the texture
589                  * parameter setup will use the shadow.
590                  */
591                 prsc = vc4_resource_create(pctx->screen, &tmpl);
592                 if (!prsc) {
593                         free(so);
594                         return NULL;
595                 }
596                 rsc = vc4_resource(prsc);
597                 vc4_bo_label(vc4_screen(pctx->screen), rsc->bo,
598                             "tiling shadow %dx%d",
599                              tmpl.width0, tmpl.height0);
600 
601                 /* Flag it as needing update of the contents from the parent. */
602                 rsc->writes = shadow_parent->writes - 1;
603                 assert(rsc->vc4_format != VC4_TEXTURE_TYPE_RGBA32R);
604 
605                 so->texture = prsc;
606         } else {
607                 pipe_resource_reference(&so->texture, prsc);
608 
609                 if (cso->u.tex.first_level) {
610                         so->force_first_level = true;
611                 }
612         }
613 
614         so->texture_p0 =
615                 (VC4_SET_FIELD((rsc->slices[0].offset +
616                                 cso->u.tex.first_layer *
617                                 rsc->cube_map_stride) >> 12, VC4_TEX_P0_OFFSET) |
618                  VC4_SET_FIELD(rsc->vc4_format & 15, VC4_TEX_P0_TYPE) |
619                  VC4_SET_FIELD(so->force_first_level ?
620                                cso->u.tex.last_level :
621                                cso->u.tex.last_level -
622                                cso->u.tex.first_level, VC4_TEX_P0_MIPLVLS) |
623                  VC4_SET_FIELD(cso->target == PIPE_TEXTURE_CUBE,
624                                VC4_TEX_P0_CMMODE));
625         so->texture_p1 =
626                 (VC4_SET_FIELD(rsc->vc4_format >> 4, VC4_TEX_P1_TYPE4) |
627                  VC4_SET_FIELD(prsc->height0 & 2047, VC4_TEX_P1_HEIGHT) |
628                  VC4_SET_FIELD(prsc->width0 & 2047, VC4_TEX_P1_WIDTH));
629 
630         if (prsc->format == PIPE_FORMAT_ETC1_RGB8)
631                 so->texture_p1 |= VC4_TEX_P1_ETCFLIP_MASK;
632 
633         return &so->base;
634 }
635 
636 static void
vc4_sampler_view_destroy(struct pipe_context * pctx,struct pipe_sampler_view * pview)637 vc4_sampler_view_destroy(struct pipe_context *pctx,
638                          struct pipe_sampler_view *pview)
639 {
640         struct vc4_sampler_view *view = vc4_sampler_view(pview);
641         pipe_resource_reference(&pview->texture, NULL);
642         pipe_resource_reference(&view->texture, NULL);
643         free(view);
644 }
645 
646 static void
vc4_set_sampler_views(struct pipe_context * pctx,enum pipe_shader_type shader,unsigned start,unsigned nr,unsigned unbind_num_trailing_slots,bool take_ownership,struct pipe_sampler_view ** views)647 vc4_set_sampler_views(struct pipe_context *pctx,
648                       enum pipe_shader_type shader,
649                       unsigned start, unsigned nr,
650                       unsigned unbind_num_trailing_slots,
651                       bool take_ownership,
652                       struct pipe_sampler_view **views)
653 {
654         struct vc4_context *vc4 = vc4_context(pctx);
655         struct vc4_texture_stateobj *stage_tex = vc4_get_stage_tex(vc4, shader);
656         unsigned i;
657         unsigned new_nr = 0;
658 
659         assert(start == 0);
660 
661         for (i = 0; i < nr; i++) {
662                 if (views[i])
663                         new_nr = i + 1;
664                 if (take_ownership) {
665                         pipe_sampler_view_reference(&stage_tex->textures[i], NULL);
666                         stage_tex->textures[i] = views[i];
667                 } else {
668                         pipe_sampler_view_reference(&stage_tex->textures[i], views[i]);
669                 }
670         }
671 
672         for (; i < stage_tex->num_textures; i++) {
673                 pipe_sampler_view_reference(&stage_tex->textures[i], NULL);
674         }
675 
676         stage_tex->num_textures = new_nr;
677 }
678 
679 void
vc4_state_init(struct pipe_context * pctx)680 vc4_state_init(struct pipe_context *pctx)
681 {
682         pctx->set_blend_color = vc4_set_blend_color;
683         pctx->set_stencil_ref = vc4_set_stencil_ref;
684         pctx->set_clip_state = vc4_set_clip_state;
685         pctx->set_sample_mask = vc4_set_sample_mask;
686         pctx->set_constant_buffer = vc4_set_constant_buffer;
687         pctx->set_framebuffer_state = vc4_set_framebuffer_state;
688         pctx->set_polygon_stipple = vc4_set_polygon_stipple;
689         pctx->set_scissor_states = vc4_set_scissor_states;
690         pctx->set_viewport_states = vc4_set_viewport_states;
691 
692         pctx->set_vertex_buffers = vc4_set_vertex_buffers;
693 
694         pctx->create_blend_state = vc4_create_blend_state;
695         pctx->bind_blend_state = vc4_blend_state_bind;
696         pctx->delete_blend_state = vc4_generic_cso_state_delete;
697 
698         pctx->create_rasterizer_state = vc4_create_rasterizer_state;
699         pctx->bind_rasterizer_state = vc4_rasterizer_state_bind;
700         pctx->delete_rasterizer_state = vc4_generic_cso_state_delete;
701 
702         pctx->create_depth_stencil_alpha_state = vc4_create_depth_stencil_alpha_state;
703         pctx->bind_depth_stencil_alpha_state = vc4_zsa_state_bind;
704         pctx->delete_depth_stencil_alpha_state = vc4_generic_cso_state_delete;
705 
706         pctx->create_vertex_elements_state = vc4_vertex_state_create;
707         pctx->delete_vertex_elements_state = vc4_generic_cso_state_delete;
708         pctx->bind_vertex_elements_state = vc4_vertex_state_bind;
709 
710         pctx->create_sampler_state = vc4_create_sampler_state;
711         pctx->delete_sampler_state = vc4_generic_cso_state_delete;
712         pctx->bind_sampler_states = vc4_sampler_states_bind;
713 
714         pctx->create_sampler_view = vc4_create_sampler_view;
715         pctx->sampler_view_destroy = vc4_sampler_view_destroy;
716         pctx->set_sampler_views = vc4_set_sampler_views;
717 }
718