• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 
2 /**********************************************************
3  * Copyright 2008-2009 VMware, Inc.  All rights reserved.
4  *
5  * Permission is hereby granted, free of charge, to any person
6  * obtaining a copy of this software and associated documentation
7  * files (the "Software"), to deal in the Software without
8  * restriction, including without limitation the rights to use, copy,
9  * modify, merge, publish, distribute, sublicense, and/or sell copies
10  * of the Software, and to permit persons to whom the Software is
11  * furnished to do so, subject to the following conditions:
12  *
13  * The above copyright notice and this permission notice shall be
14  * included in all copies or substantial portions of the Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17  * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19  * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
20  * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
21  * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
22  * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
23  * SOFTWARE.
24  *
25  **********************************************************/
26 
27 #include "util/u_format.h"
28 #include "util/u_inlines.h"
29 #include "util/u_memory.h"
30 #include "pipe/p_defines.h"
31 #include "util/u_upload_mgr.h"
32 
33 #include "svga_screen.h"
34 #include "svga_context.h"
35 #include "svga_state.h"
36 #include "svga_cmd.h"
37 #include "svga_tgsi.h"
38 #include "svga_debug.h"
39 #include "svga_resource_buffer.h"
40 #include "svga_shader.h"
41 
42 #include "svga_hw_reg.h"
43 
44 
/*
 * Upper bound on how many successive constants are batched into a single
 * command: 256 float[4] registers, i.e. no more than 4KB per command.
 */
#define MAX_CONST_REG_COUNT 256  /**< number of float[4] constants */

/**
 * Number of float[4] slots reserved for svga-specific VS/PS constants
 * (e.g. texcoord scale factors, vertex transformation scale/translation).
 */
#define MAX_EXTRA_CONSTS 32

/** Size that guest-backed surface constant buffers must have */
#define GB_CONSTBUF_SIZE (SVGA3D_CONSTREG_MAX)
58 
59 
60 /**
61  * Emit any extra shader-type-independent shader constants into the buffer
62  * pointed to by 'dest'.
63  * \return number of float[4] constants put into the 'dest' buffer
64  */
65 static unsigned
svga_get_extra_constants_common(struct svga_context * svga,const struct svga_shader_variant * variant,enum pipe_shader_type shader,float * dest)66 svga_get_extra_constants_common(struct svga_context *svga,
67                                 const struct svga_shader_variant *variant,
68                                 enum pipe_shader_type shader, float *dest)
69 {
70    uint32_t *dest_u = (uint32_t *) dest;  // uint version of dest
71    unsigned i;
72    unsigned count = 0;
73 
74    for (i = 0; i < variant->key.num_textures; i++) {
75       struct pipe_sampler_view *sv = svga->curr.sampler_views[shader][i];
76       if (sv) {
77          struct pipe_resource *tex = sv->texture;
78          /* Scaling factors needed for handling unnormalized texture coordinates
79           * for texture rectangles.
80           */
81          if (variant->key.tex[i].unnormalized) {
82             /* debug/sanity check */
83             assert(variant->key.tex[i].width_height_idx == count);
84 
85             *dest++ = 1.0 / (float)tex->width0;
86             *dest++ = 1.0 / (float)tex->height0;
87             *dest++ = 1.0;
88             *dest++ = 1.0;
89 
90             count++;
91          }
92 
93          /* Store the sizes for texture buffers.
94          */
95          if (tex->target == PIPE_BUFFER) {
96             unsigned bytes_per_element = util_format_get_blocksize(sv->format);
97             *dest_u++ = tex->width0 / bytes_per_element;
98             *dest_u++ = 1;
99             *dest_u++ = 1;
100             *dest_u++ = 1;
101 
102             count++;
103          }
104       }
105    }
106 
107    return count;
108 }
109 
110 
111 /**
112  * Emit any extra fragment shader constants into the buffer pointed
113  * to by 'dest'.
114  * \return number of float[4] constants put into the dest buffer
115  */
116 static unsigned
svga_get_extra_fs_constants(struct svga_context * svga,float * dest)117 svga_get_extra_fs_constants(struct svga_context *svga, float *dest)
118 {
119    const struct svga_shader_variant *variant = svga->state.hw_draw.fs;
120    unsigned count = 0;
121 
122    count += svga_get_extra_constants_common(svga, variant,
123                                             PIPE_SHADER_FRAGMENT, dest);
124 
125    assert(count <= MAX_EXTRA_CONSTS);
126 
127    return count;
128 }
129 
130 /**
131  * Emit extra constants needed for prescale computation into the
132  * the buffer pointed to by '*dest'. The updated buffer pointer
133  * will be returned in 'dest'.
134  */
135 static unsigned
svga_get_prescale_constants(struct svga_context * svga,float ** dest)136 svga_get_prescale_constants(struct svga_context *svga, float **dest)
137 {
138    memcpy(*dest, svga->state.hw_clear.prescale.scale, 4 * sizeof(float));
139    *dest += 4;
140 
141    memcpy(*dest, svga->state.hw_clear.prescale.translate, 4 * sizeof(float));
142    *dest += 4;
143 
144    return 2;
145 }
146 
147 /**
148  * Emit extra constants needed for point sprite emulation.
149  */
150 static unsigned
svga_get_pt_sprite_constants(struct svga_context * svga,float ** dest)151 svga_get_pt_sprite_constants(struct svga_context *svga, float **dest)
152 {
153    struct svga_screen *screen = svga_screen(svga->pipe.screen);
154    float *dst = *dest;
155 
156    dst[0] = 1.0 / (svga->curr.viewport.scale[0] * 2);
157    dst[1] = 1.0 / (svga->curr.viewport.scale[1] * 2);
158    dst[2] = svga->curr.rast->pointsize;
159    dst[3] = screen->maxPointSize;
160    *dest = *dest + 4;
161    return 1;
162 }
163 
164 /**
165  * Emit user-defined clip plane coefficients into the buffer pointed to
166  * by '*dest'. The updated buffer pointer will be returned in 'dest'.
167  */
168 static unsigned
svga_get_clip_plane_constants(struct svga_context * svga,const struct svga_shader_variant * variant,float ** dest)169 svga_get_clip_plane_constants(struct svga_context *svga,
170                               const struct svga_shader_variant *variant,
171                               float **dest)
172 {
173    unsigned count = 0;
174 
175    /* SVGA_NEW_CLIP */
176    if (svga_have_vgpu10(svga)) {
177       /* append user-defined clip plane coefficients onto constant buffer */
178       unsigned clip_planes = variant->key.clip_plane_enable;
179       while (clip_planes) {
180          int i = u_bit_scan(&clip_planes);
181          COPY_4V(*dest, svga->curr.clip.ucp[i]);
182          *dest += 4;
183          count += 1;
184       }
185    }
186    return count;
187 }
188 
189 /**
190  * Emit any extra vertex shader constants into the buffer pointed
191  * to by 'dest'.
192  * In particular, these would be the scale and bias factors computed
193  * from the framebuffer size which are used to copy with differences in
194  * GL vs D3D coordinate spaces.  See svga_tgsi_insn.c for more info.
195  * \return number of float[4] constants put into the dest buffer
196  */
197 static unsigned
svga_get_extra_vs_constants(struct svga_context * svga,float * dest)198 svga_get_extra_vs_constants(struct svga_context *svga, float *dest)
199 {
200    const struct svga_shader_variant *variant = svga->state.hw_draw.vs;
201    unsigned count = 0;
202 
203    /* SVGA_NEW_VS_VARIANT
204     */
205    if (variant->key.vs.need_prescale) {
206       count += svga_get_prescale_constants(svga, &dest);
207    }
208 
209    if (variant->key.vs.undo_viewport) {
210       /* Used to convert window coords back to NDC coords */
211       dest[0] = 1.0f / svga->curr.viewport.scale[0];
212       dest[1] = 1.0f / svga->curr.viewport.scale[1];
213       dest[2] = -svga->curr.viewport.translate[0];
214       dest[3] = -svga->curr.viewport.translate[1];
215       dest += 4;
216       count += 1;
217    }
218 
219    /* SVGA_NEW_CLIP */
220    count += svga_get_clip_plane_constants(svga, variant, &dest);
221 
222    /* common constants */
223    count += svga_get_extra_constants_common(svga, variant,
224                                             PIPE_SHADER_VERTEX, dest);
225 
226    assert(count <= MAX_EXTRA_CONSTS);
227 
228    return count;
229 }
230 
231 /**
232  * Emit any extra geometry shader constants into the buffer pointed
233  * to by 'dest'.
234  */
235 static unsigned
svga_get_extra_gs_constants(struct svga_context * svga,float * dest)236 svga_get_extra_gs_constants(struct svga_context *svga, float *dest)
237 {
238    const struct svga_shader_variant *variant = svga->state.hw_draw.gs;
239    unsigned count = 0;
240 
241    /* SVGA_NEW_GS_VARIANT
242     */
243 
244    /* Constants for point sprite
245     * These are used in the transformed gs that supports point sprite.
246     * They need to be added before the prescale constants.
247     */
248    if (variant->key.gs.wide_point) {
249       count += svga_get_pt_sprite_constants(svga, &dest);
250    }
251 
252    if (variant->key.gs.need_prescale) {
253       count += svga_get_prescale_constants(svga, &dest);
254    }
255 
256    /* SVGA_NEW_CLIP */
257    count += svga_get_clip_plane_constants(svga, variant, &dest);
258 
259    /* common constants */
260    count += svga_get_extra_constants_common(svga, variant,
261                                             PIPE_SHADER_GEOMETRY, dest);
262 
263    assert(count <= MAX_EXTRA_CONSTS);
264    return count;
265 }
266 
267 /**
268  * Check and emit one shader constant register.
269  * \param shader  PIPE_SHADER_FRAGMENT or PIPE_SHADER_VERTEX
270  * \param i  which float[4] constant to change
271  * \param value  the new float[4] value
272  */
273 static enum pipe_error
emit_const(struct svga_context * svga,enum pipe_shader_type shader,unsigned i,const float * value)274 emit_const(struct svga_context *svga, enum pipe_shader_type shader, unsigned i,
275            const float *value)
276 {
277    enum pipe_error ret = PIPE_OK;
278 
279    assert(shader < PIPE_SHADER_TYPES);
280    assert(i < SVGA3D_CONSTREG_MAX);
281    assert(!svga_have_vgpu10(svga));
282 
283    if (memcmp(svga->state.hw_draw.cb[shader][i], value,
284               4 * sizeof(float)) != 0) {
285       if (SVGA_DEBUG & DEBUG_CONSTS)
286          debug_printf("%s %s %u: %f %f %f %f\n",
287                       __FUNCTION__,
288                       shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
289                       i,
290                       value[0],
291                       value[1],
292                       value[2],
293                       value[3]);
294 
295       ret = SVGA3D_SetShaderConst( svga->swc,
296                                    i,
297                                    svga_shader_type(shader),
298                                    SVGA3D_CONST_TYPE_FLOAT,
299                                    value );
300       if (ret != PIPE_OK)
301          return ret;
302 
303       memcpy(svga->state.hw_draw.cb[shader][i], value, 4 * sizeof(float));
304 
305       svga->hud.num_const_updates++;
306    }
307 
308    return ret;
309 }
310 
311 
312 /*
313  * Check and emit a range of shader constant registers, trying to coalesce
314  * successive shader constant updates in a single command in order to save
315  * space on the command buffer.  This is a HWv8 feature.
316  */
317 static enum pipe_error
emit_const_range(struct svga_context * svga,enum pipe_shader_type shader,unsigned offset,unsigned count,const float (* values)[4])318 emit_const_range(struct svga_context *svga,
319                  enum pipe_shader_type shader,
320                  unsigned offset,
321                  unsigned count,
322                  const float (*values)[4])
323 {
324    unsigned i, j;
325    enum pipe_error ret;
326 
327    assert(shader == PIPE_SHADER_VERTEX ||
328           shader == PIPE_SHADER_FRAGMENT);
329    assert(!svga_have_vgpu10(svga));
330 
331 #ifdef DEBUG
332    if (offset + count > SVGA3D_CONSTREG_MAX) {
333       debug_printf("svga: too many constants (offset %u + count %u = %u (max = %u))\n",
334                    offset, count, offset + count, SVGA3D_CONSTREG_MAX);
335    }
336 #endif
337 
338    if (offset > SVGA3D_CONSTREG_MAX) {
339       /* This isn't OK, but if we propagate an error all the way up we'll
340        * just get into more trouble.
341        * XXX note that offset is always zero at this time so this is moot.
342        */
343       return PIPE_OK;
344    }
345 
346    if (offset + count > SVGA3D_CONSTREG_MAX) {
347       /* Just drop the extra constants for now.
348        * Ideally we should not have allowed the app to create a shader
349        * that exceeds our constant buffer size but there's no way to
350        * express that in gallium at this time.
351        */
352       count = SVGA3D_CONSTREG_MAX - offset;
353    }
354 
355    i = 0;
356    while (i < count) {
357       if (memcmp(svga->state.hw_draw.cb[shader][offset + i],
358                  values[i],
359                  4 * sizeof(float)) != 0) {
360          /* Found one dirty constant
361           */
362          if (SVGA_DEBUG & DEBUG_CONSTS)
363             debug_printf("%s %s %d: %f %f %f %f\n",
364                          __FUNCTION__,
365                          shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
366                          offset + i,
367                          values[i][0],
368                          values[i][1],
369                          values[i][2],
370                          values[i][3]);
371 
372          /* Look for more consecutive dirty constants.
373           */
374          j = i + 1;
375          while (j < count &&
376                 j < i + MAX_CONST_REG_COUNT &&
377                 memcmp(svga->state.hw_draw.cb[shader][offset + j],
378                        values[j],
379                        4 * sizeof(float)) != 0) {
380 
381             if (SVGA_DEBUG & DEBUG_CONSTS)
382                debug_printf("%s %s %d: %f %f %f %f\n",
383                             __FUNCTION__,
384                             shader == PIPE_SHADER_VERTEX ? "VERT" : "FRAG",
385                             offset + j,
386                             values[j][0],
387                             values[j][1],
388                             values[j][2],
389                             values[j][3]);
390 
391             ++j;
392          }
393 
394          assert(j >= i + 1);
395 
396          /* Send them all together.
397           */
398          if (svga_have_gb_objects(svga)) {
399             ret = SVGA3D_SetGBShaderConstsInline(svga->swc,
400                                                  offset + i, /* start */
401                                                  j - i,  /* count */
402                                                  svga_shader_type(shader),
403                                                  SVGA3D_CONST_TYPE_FLOAT,
404                                                  values + i);
405          }
406          else {
407             ret = SVGA3D_SetShaderConsts(svga->swc,
408                                          offset + i, j - i,
409                                          svga_shader_type(shader),
410                                          SVGA3D_CONST_TYPE_FLOAT,
411                                          values + i);
412          }
413          if (ret != PIPE_OK) {
414             return ret;
415          }
416 
417          /*
418           * Local copy of the hardware state.
419           */
420          memcpy(svga->state.hw_draw.cb[shader][offset + i],
421                 values[i],
422                 (j - i) * 4 * sizeof(float));
423 
424          i = j + 1;
425 
426          svga->hud.num_const_updates++;
427 
428       } else {
429          ++i;
430       }
431    }
432 
433    return PIPE_OK;
434 }
435 
436 
437 /**
438  * Emit all the constants in a constant buffer for a shader stage.
439  * On VGPU10, emit_consts_vgpu10 is used instead.
440  */
441 static enum pipe_error
emit_consts_vgpu9(struct svga_context * svga,enum pipe_shader_type shader)442 emit_consts_vgpu9(struct svga_context *svga, enum pipe_shader_type shader)
443 {
444    const struct pipe_constant_buffer *cbuf;
445    struct svga_screen *ss = svga_screen(svga->pipe.screen);
446    struct pipe_transfer *transfer = NULL;
447    unsigned count;
448    const float (*data)[4] = NULL;
449    unsigned i;
450    enum pipe_error ret = PIPE_OK;
451    const unsigned offset = 0;
452 
453    assert(shader < PIPE_SHADER_TYPES);
454    assert(!svga_have_vgpu10(svga));
455    /* Only one constant buffer per shader is supported before VGPU10.
456     * This is only an approximate check against that.
457     */
458    assert(svga->curr.constbufs[shader][1].buffer == NULL);
459 
460    cbuf = &svga->curr.constbufs[shader][0];
461 
462    if (svga->curr.constbufs[shader][0].buffer) {
463       /* emit user-provided constants */
464       data = (const float (*)[4])
465          pipe_buffer_map(&svga->pipe, svga->curr.constbufs[shader][0].buffer,
466                          PIPE_TRANSFER_READ, &transfer);
467       if (!data) {
468          return PIPE_ERROR_OUT_OF_MEMORY;
469       }
470 
471       /* sanity check */
472       assert(cbuf->buffer->width0 >=
473              cbuf->buffer_size);
474 
475       /* Use/apply the constant buffer size and offsets here */
476       count = cbuf->buffer_size / (4 * sizeof(float));
477       data += cbuf->buffer_offset / (4 * sizeof(float));
478 
479       if (ss->hw_version >= SVGA3D_HWVERSION_WS8_B1) {
480          ret = emit_const_range( svga, shader, offset, count, data );
481       }
482       else {
483          for (i = 0; i < count; i++) {
484             ret = emit_const( svga, shader, offset + i, data[i] );
485             if (ret != PIPE_OK) {
486                break;
487             }
488          }
489       }
490 
491       pipe_buffer_unmap(&svga->pipe, transfer);
492 
493       if (ret != PIPE_OK) {
494          return ret;
495       }
496    }
497 
498    /* emit extra shader constants */
499    {
500       const struct svga_shader_variant *variant = NULL;
501       unsigned offset;
502       float extras[MAX_EXTRA_CONSTS][4];
503       unsigned count, i;
504 
505       switch (shader) {
506       case PIPE_SHADER_VERTEX:
507          variant = svga->state.hw_draw.vs;
508          count = svga_get_extra_vs_constants(svga, (float *) extras);
509          break;
510       case PIPE_SHADER_FRAGMENT:
511          variant = svga->state.hw_draw.fs;
512          count = svga_get_extra_fs_constants(svga, (float *) extras);
513          break;
514       default:
515          assert(!"Unexpected shader type");
516          count = 0;
517       }
518 
519       assert(variant);
520       offset = variant->shader->info.file_max[TGSI_FILE_CONSTANT] + 1;
521       assert(count <= ARRAY_SIZE(extras));
522 
523       if (count > 0) {
524          if (ss->hw_version >= SVGA3D_HWVERSION_WS8_B1) {
525             ret = emit_const_range(svga, shader, offset, count,
526                                    (const float (*) [4])extras);
527          }
528          else {
529             for (i = 0; i < count; i++) {
530                ret = emit_const(svga, shader, offset + i, extras[i]);
531                if (ret != PIPE_OK)
532                   return ret;
533             }
534          }
535       }
536    }
537 
538    return ret;
539 }
540 
541 
542 
543 static enum pipe_error
emit_constbuf_vgpu10(struct svga_context * svga,enum pipe_shader_type shader)544 emit_constbuf_vgpu10(struct svga_context *svga, enum pipe_shader_type shader)
545 {
546    const struct pipe_constant_buffer *cbuf;
547    struct pipe_resource *dst_buffer = NULL;
548    enum pipe_error ret = PIPE_OK;
549    struct pipe_transfer *src_transfer;
550    struct svga_winsys_surface *dst_handle;
551    float extras[MAX_EXTRA_CONSTS][4];
552    unsigned extra_count, extra_size, extra_offset;
553    unsigned new_buf_size;
554    void *src_map = NULL, *dst_map;
555    unsigned offset;
556    const struct svga_shader_variant *variant;
557    unsigned alloc_buf_size;
558 
559    assert(shader == PIPE_SHADER_VERTEX ||
560           shader == PIPE_SHADER_GEOMETRY ||
561           shader == PIPE_SHADER_FRAGMENT);
562 
563    cbuf = &svga->curr.constbufs[shader][0];
564 
565    switch (shader) {
566    case PIPE_SHADER_VERTEX:
567       variant = svga->state.hw_draw.vs;
568       extra_count = svga_get_extra_vs_constants(svga, (float *) extras);
569       break;
570    case PIPE_SHADER_FRAGMENT:
571       variant = svga->state.hw_draw.fs;
572       extra_count = svga_get_extra_fs_constants(svga, (float *) extras);
573       break;
574    case PIPE_SHADER_GEOMETRY:
575       variant = svga->state.hw_draw.gs;
576       extra_count = svga_get_extra_gs_constants(svga, (float *) extras);
577       break;
578    default:
579       assert(!"Unexpected shader type");
580       /* Don't return an error code since we don't want to keep re-trying
581        * this function and getting stuck in an infinite loop.
582        */
583       return PIPE_OK;
584    }
585 
586    assert(variant);
587 
588    /* Compute extra constants size and offset in bytes */
589    extra_size = extra_count * 4 * sizeof(float);
590    extra_offset = 4 * sizeof(float) * variant->extra_const_start;
591 
592    if (cbuf->buffer_size + extra_size == 0)
593       return PIPE_OK;  /* nothing to do */
594 
595    /* Typically, the cbuf->buffer here is a user-space buffer so mapping
596     * it is really cheap.  If we ever get real HW buffers for constants
597     * we should void mapping and instead use a ResourceCopy command.
598     */
599    if (cbuf->buffer_size > 0) {
600       src_map = pipe_buffer_map_range(&svga->pipe, cbuf->buffer,
601                                       cbuf->buffer_offset, cbuf->buffer_size,
602                                       PIPE_TRANSFER_READ, &src_transfer);
603       assert(src_map);
604       if (!src_map) {
605          return PIPE_ERROR_OUT_OF_MEMORY;
606       }
607    }
608 
609    /* The new/dest buffer's size must be large enough to hold the original,
610     * user-specified constants, plus the extra constants.
611     * The size of the original constant buffer _should_ agree with what the
612     * shader is expecting, but it might not (it's not enforced anywhere by
613     * gallium).
614     */
615    new_buf_size = MAX2(cbuf->buffer_size, extra_offset) + extra_size;
616 
617    /* According to the DX10 spec, the constant buffer size must be
618     * in multiples of 16.
619     */
620    new_buf_size = align(new_buf_size, 16);
621 
622    /* Constant buffer size in the upload buffer must be in multiples of 256.
623     * In order to maximize the chance of merging the upload buffer chunks
624     * when svga_buffer_add_range() is called,
625     * the allocate buffer size needs to be in multiples of 256 as well.
626     * Otherwise, since there is gap between each dirty range of the upload buffer,
627     * each dirty range will end up in its own UPDATE_GB_IMAGE command.
628     */
629    alloc_buf_size = align(new_buf_size, CONST0_UPLOAD_ALIGNMENT);
630 
631    u_upload_alloc(svga->const0_upload, 0, alloc_buf_size,
632                   CONST0_UPLOAD_ALIGNMENT, &offset,
633                   &dst_buffer, &dst_map);
634    if (!dst_map) {
635       if (src_map)
636          pipe_buffer_unmap(&svga->pipe, src_transfer);
637       return PIPE_ERROR_OUT_OF_MEMORY;
638    }
639 
640    if (src_map) {
641       memcpy(dst_map, src_map, cbuf->buffer_size);
642       pipe_buffer_unmap(&svga->pipe, src_transfer);
643    }
644 
645    if (extra_size) {
646       assert(extra_offset + extra_size <= new_buf_size);
647       memcpy((char *) dst_map + extra_offset, extras, extra_size);
648    }
649 
650    /* Get winsys handle for the constant buffer */
651    if (svga->state.hw_draw.const0_buffer == dst_buffer &&
652        svga->state.hw_draw.const0_handle) {
653       /* re-reference already mapped buffer */
654       dst_handle = svga->state.hw_draw.const0_handle;
655    }
656    else {
657       /* we must unmap the buffer before getting the winsys handle */
658       u_upload_unmap(svga->const0_upload);
659 
660       dst_handle = svga_buffer_handle(svga, dst_buffer);
661       if (!dst_handle) {
662          pipe_resource_reference(&dst_buffer, NULL);
663          return PIPE_ERROR_OUT_OF_MEMORY;
664       }
665 
666       /* save the buffer / handle for next time */
667       pipe_resource_reference(&svga->state.hw_draw.const0_buffer, dst_buffer);
668       svga->state.hw_draw.const0_handle = dst_handle;
669    }
670 
671    /* Issue the SetSingleConstantBuffer command */
672    assert(new_buf_size % 16 == 0);
673    ret = SVGA3D_vgpu10_SetSingleConstantBuffer(svga->swc,
674                                                0, /* index */
675                                                svga_shader_type(shader),
676                                                dst_handle,
677                                                offset,
678                                                new_buf_size);
679 
680    if (ret != PIPE_OK) {
681       pipe_resource_reference(&dst_buffer, NULL);
682       return ret;
683    }
684 
685    /* Save this const buffer until it's replaced in the future.
686     * Otherwise, all references to the buffer will go away after the
687     * command buffer is submitted, it'll get recycled and we will have
688     * incorrect constant buffer bindings.
689     */
690    pipe_resource_reference(&svga->state.hw_draw.constbuf[shader], dst_buffer);
691 
692    svga->state.hw_draw.default_constbuf_size[shader] = new_buf_size;
693 
694    pipe_resource_reference(&dst_buffer, NULL);
695 
696    svga->hud.num_const_buf_updates++;
697 
698    return ret;
699 }
700 
701 
702 static enum pipe_error
emit_consts_vgpu10(struct svga_context * svga,enum pipe_shader_type shader)703 emit_consts_vgpu10(struct svga_context *svga, enum pipe_shader_type shader)
704 {
705    enum pipe_error ret;
706    unsigned dirty_constbufs;
707    unsigned enabled_constbufs;
708 
709    /* Emit 0th constant buffer (with extra constants) */
710    ret = emit_constbuf_vgpu10(svga, shader);
711    if (ret != PIPE_OK) {
712       return ret;
713    }
714 
715    enabled_constbufs = svga->state.hw_draw.enabled_constbufs[shader] | 1u;
716 
717    /* Emit other constant buffers (UBOs) */
718    dirty_constbufs = svga->state.dirty_constbufs[shader] & ~1u;
719 
720    while (dirty_constbufs) {
721       unsigned index = u_bit_scan(&dirty_constbufs);
722       unsigned offset = svga->curr.constbufs[shader][index].buffer_offset;
723       unsigned size = svga->curr.constbufs[shader][index].buffer_size;
724       struct svga_buffer *buffer =
725          svga_buffer(svga->curr.constbufs[shader][index].buffer);
726       struct svga_winsys_surface *handle;
727 
728       if (buffer) {
729          handle = svga_buffer_handle(svga, &buffer->b.b);
730          enabled_constbufs |= 1 << index;
731       }
732       else {
733          handle = NULL;
734          enabled_constbufs &= ~(1 << index);
735          assert(offset == 0);
736          assert(size == 0);
737       }
738 
739       if (size % 16 != 0) {
740          /* GL's buffer range sizes can be any number of bytes but the
741           * SVGA3D device requires a multiple of 16 bytes.
742           */
743          const unsigned total_size = buffer->b.b.width0;
744 
745          if (offset + align(size, 16) <= total_size) {
746             /* round up size to multiple of 16 */
747             size = align(size, 16);
748          }
749          else {
750             /* round down to mulitple of 16 (this may cause rendering problems
751              * but should avoid a device error).
752              */
753             size &= ~15;
754          }
755       }
756 
757       assert(size % 16 == 0);
758       ret = SVGA3D_vgpu10_SetSingleConstantBuffer(svga->swc,
759                                                   index,
760                                                   svga_shader_type(shader),
761                                                   handle,
762                                                   offset,
763                                                   size);
764       if (ret != PIPE_OK)
765          return ret;
766 
767       svga->hud.num_const_buf_updates++;
768    }
769 
770    svga->state.hw_draw.enabled_constbufs[shader] = enabled_constbufs;
771    svga->state.dirty_constbufs[shader] = 0;
772 
773    return ret;
774 }
775 
776 static enum pipe_error
emit_fs_consts(struct svga_context * svga,unsigned dirty)777 emit_fs_consts(struct svga_context *svga, unsigned dirty)
778 {
779    const struct svga_shader_variant *variant = svga->state.hw_draw.fs;
780    enum pipe_error ret = PIPE_OK;
781 
782    /* SVGA_NEW_FS_VARIANT
783     */
784    if (!variant)
785       return PIPE_OK;
786 
787    /* SVGA_NEW_FS_CONST_BUFFER
788     */
789    if (svga_have_vgpu10(svga)) {
790       ret = emit_consts_vgpu10(svga, PIPE_SHADER_FRAGMENT);
791    }
792    else {
793       ret = emit_consts_vgpu9(svga, PIPE_SHADER_FRAGMENT);
794    }
795 
796    return ret;
797 }
798 
799 
800 struct svga_tracked_state svga_hw_fs_constants =
801 {
802    "hw fs params",
803    (SVGA_NEW_FS_CONST_BUFFER |
804     SVGA_NEW_FS_VARIANT |
805     SVGA_NEW_TEXTURE_CONSTS),
806    emit_fs_consts
807 };
808 
809 
810 
811 static enum pipe_error
emit_vs_consts(struct svga_context * svga,unsigned dirty)812 emit_vs_consts(struct svga_context *svga, unsigned dirty)
813 {
814    const struct svga_shader_variant *variant = svga->state.hw_draw.vs;
815    enum pipe_error ret = PIPE_OK;
816 
817    /* SVGA_NEW_VS_VARIANT
818     */
819    if (!variant)
820       return PIPE_OK;
821 
822    /* SVGA_NEW_VS_CONST_BUFFER
823     */
824    if (svga_have_vgpu10(svga)) {
825       ret = emit_consts_vgpu10(svga, PIPE_SHADER_VERTEX);
826    }
827    else {
828       ret = emit_consts_vgpu9(svga, PIPE_SHADER_VERTEX);
829    }
830 
831    return ret;
832 }
833 
834 
835 struct svga_tracked_state svga_hw_vs_constants =
836 {
837    "hw vs params",
838    (SVGA_NEW_PRESCALE |
839     SVGA_NEW_VS_CONST_BUFFER |
840     SVGA_NEW_VS_VARIANT),
841    emit_vs_consts
842 };
843 
844 
845 static enum pipe_error
emit_gs_consts(struct svga_context * svga,unsigned dirty)846 emit_gs_consts(struct svga_context *svga, unsigned dirty)
847 {
848    const struct svga_shader_variant *variant = svga->state.hw_draw.gs;
849    enum pipe_error ret = PIPE_OK;
850 
851    /* SVGA_NEW_GS_VARIANT
852     */
853    if (!variant)
854       return PIPE_OK;
855 
856    /* SVGA_NEW_GS_CONST_BUFFER
857     */
858    if (svga_have_vgpu10(svga)) {
859       /**
860        * If only the rasterizer state has changed and the current geometry
861        * shader does not emit wide points, then there is no reason to
862        * re-emit the GS constants, so skip it.
863        */
864       if (dirty == SVGA_NEW_RAST && !variant->key.gs.wide_point)
865          return PIPE_OK;
866 
867       ret = emit_consts_vgpu10(svga, PIPE_SHADER_GEOMETRY);
868    }
869 
870    return ret;
871 }
872 
873 
874 struct svga_tracked_state svga_hw_gs_constants =
875 {
876    "hw gs params",
877    (SVGA_NEW_GS_CONST_BUFFER |
878     SVGA_NEW_RAST |
879     SVGA_NEW_GS_VARIANT),
880    emit_gs_consts
881 };
882