• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright 2016 Red Hat.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * on the rights to use, copy, modify, merge, publish, distribute, sub
8  * license, and/or sell copies of the Software, and to permit persons to whom
9  * the Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18  * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21  * USE OR OTHER DEALINGS IN THE SOFTWARE.
22  */
23 
24 #include "sp_context.h"
25 #include "sp_image.h"
26 #include "sp_texture.h"
27 
28 #include "util/format/u_format.h"
29 
30 /*
31  * Get the offset into the base image
32  * first element for a buffer or layer/level for texture.
33  */
34 static uint32_t
get_image_offset(const struct softpipe_resource * spr,const struct pipe_image_view * iview,enum pipe_format format,unsigned r_coord)35 get_image_offset(const struct softpipe_resource *spr,
36                  const struct pipe_image_view *iview,
37                  enum pipe_format format, unsigned r_coord)
38 {
39    int base_layer = 0;
40 
41    if (spr->base.target == PIPE_BUFFER)
42       return iview->u.buf.offset;
43 
44    if (spr->base.target == PIPE_TEXTURE_1D_ARRAY ||
45        spr->base.target == PIPE_TEXTURE_2D_ARRAY ||
46        spr->base.target == PIPE_TEXTURE_CUBE_ARRAY ||
47        spr->base.target == PIPE_TEXTURE_CUBE ||
48        spr->base.target == PIPE_TEXTURE_3D)
49       base_layer = r_coord + iview->u.tex.first_layer;
50    return softpipe_get_tex_image_offset(spr, iview->u.tex.level, base_layer);
51 }
52 
53 /*
54  * Does this texture instruction have a layer or depth parameter.
55  */
56 static inline bool
has_layer_or_depth(unsigned tgsi_tex_instr)57 has_layer_or_depth(unsigned tgsi_tex_instr)
58 {
59    return (tgsi_tex_instr == TGSI_TEXTURE_3D ||
60            tgsi_tex_instr == TGSI_TEXTURE_CUBE ||
61            tgsi_tex_instr == TGSI_TEXTURE_1D_ARRAY ||
62            tgsi_tex_instr == TGSI_TEXTURE_2D_ARRAY ||
63            tgsi_tex_instr == TGSI_TEXTURE_CUBE_ARRAY ||
64            tgsi_tex_instr == TGSI_TEXTURE_2D_ARRAY_MSAA);
65 }
66 
67 /*
68  * Is this texture instruction a single non-array coordinate.
69  */
70 static inline bool
has_1coord(unsigned tgsi_tex_instr)71 has_1coord(unsigned tgsi_tex_instr)
72 {
73    return (tgsi_tex_instr == TGSI_TEXTURE_BUFFER ||
74            tgsi_tex_instr == TGSI_TEXTURE_1D ||
75            tgsi_tex_instr == TGSI_TEXTURE_1D_ARRAY);
76 }
77 
78 /*
79  * check the bounds vs w/h/d
80  */
81 static inline bool
bounds_check(int width,int height,int depth,int s,int t,int r)82 bounds_check(int width, int height, int depth,
83              int s, int t, int r)
84 {
85    if (s < 0 || s >= width)
86       return false;
87    if (t < 0 || t >= height)
88       return false;
89    if (r < 0 || r >= depth)
90       return false;
91    return true;
92 }
93 
94 /*
95  * Checks if the texture target compatible with the image resource
96  * pipe target.
97  */
98 static inline bool
has_compat_target(unsigned pipe_target,unsigned tgsi_target)99 has_compat_target(unsigned pipe_target, unsigned tgsi_target)
100 {
101    switch (pipe_target) {
102    case PIPE_TEXTURE_1D:
103       if (tgsi_target == TGSI_TEXTURE_1D)
104          return true;
105       break;
106    case PIPE_TEXTURE_2D:
107       if (tgsi_target == TGSI_TEXTURE_2D)
108          return true;
109       break;
110    case PIPE_TEXTURE_RECT:
111       if (tgsi_target == TGSI_TEXTURE_RECT)
112          return true;
113       break;
114    case PIPE_TEXTURE_3D:
115       if (tgsi_target == TGSI_TEXTURE_3D ||
116           tgsi_target == TGSI_TEXTURE_2D)
117          return true;
118       break;
119    case PIPE_TEXTURE_CUBE:
120       if (tgsi_target == TGSI_TEXTURE_CUBE ||
121           tgsi_target == TGSI_TEXTURE_2D)
122          return true;
123       break;
124    case PIPE_TEXTURE_1D_ARRAY:
125       if (tgsi_target == TGSI_TEXTURE_1D ||
126           tgsi_target == TGSI_TEXTURE_1D_ARRAY)
127          return true;
128       break;
129    case PIPE_TEXTURE_2D_ARRAY:
130       if (tgsi_target == TGSI_TEXTURE_2D ||
131           tgsi_target == TGSI_TEXTURE_2D_ARRAY)
132          return true;
133       break;
134    case PIPE_TEXTURE_CUBE_ARRAY:
135       if (tgsi_target == TGSI_TEXTURE_CUBE ||
136           tgsi_target == TGSI_TEXTURE_CUBE_ARRAY ||
137           tgsi_target == TGSI_TEXTURE_2D)
138          return true;
139       break;
140    case PIPE_BUFFER:
141       return (tgsi_target == TGSI_TEXTURE_BUFFER);
142    }
143    return false;
144 }
145 
146 static bool
get_dimensions(const struct pipe_image_view * iview,const struct softpipe_resource * spr,unsigned tgsi_tex_instr,enum pipe_format pformat,unsigned * width,unsigned * height,unsigned * depth)147 get_dimensions(const struct pipe_image_view *iview,
148                const struct softpipe_resource *spr,
149                unsigned tgsi_tex_instr,
150                enum pipe_format pformat,
151                unsigned *width,
152                unsigned *height,
153                unsigned *depth)
154 {
155    if (tgsi_tex_instr == TGSI_TEXTURE_BUFFER) {
156       *width = iview->u.buf.size / util_format_get_blocksize(pformat);
157       *height = 1;
158       *depth = 1;
159       /*
160        * Bounds check the buffer size from the view
161        * and the buffer size from the underlying buffer.
162        */
163       if (util_format_get_stride(pformat, *width) >
164           util_format_get_stride(spr->base.format, spr->base.width0))
165          return false;
166    } else {
167       unsigned level;
168 
169       level = spr->base.target == PIPE_BUFFER ? 0 : iview->u.tex.level;
170       *width = u_minify(spr->base.width0, level);
171       *height = u_minify(spr->base.height0, level);
172 
173       if (spr->base.target == PIPE_TEXTURE_3D)
174          *depth = u_minify(spr->base.depth0, level);
175       else
176          *depth = spr->base.array_size;
177 
178       /* Make sure the resource and view have compatible formats */
179       if (util_format_get_blocksize(pformat) >
180           util_format_get_blocksize(spr->base.format))
181          return false;
182    }
183    return true;
184 }
185 
186 static void
fill_coords(const struct tgsi_image_params * params,unsigned index,const int s[TGSI_QUAD_SIZE],const int t[TGSI_QUAD_SIZE],const int r[TGSI_QUAD_SIZE],int * s_coord,int * t_coord,int * r_coord)187 fill_coords(const struct tgsi_image_params *params,
188             unsigned index,
189             const int s[TGSI_QUAD_SIZE],
190             const int t[TGSI_QUAD_SIZE],
191             const int r[TGSI_QUAD_SIZE],
192             int *s_coord, int *t_coord, int *r_coord)
193 {
194    *s_coord = s[index];
195    *t_coord = has_1coord(params->tgsi_tex_instr) ? 0 : t[index];
196    *r_coord = has_layer_or_depth(params->tgsi_tex_instr) ?
197       (params->tgsi_tex_instr == TGSI_TEXTURE_1D_ARRAY ? t[index] : r[index]) : 0;
198 }
199 /*
200  * Implement the image LOAD operation.
201  */
202 static void
sp_tgsi_load(const struct tgsi_image * image,const struct tgsi_image_params * params,const int s[TGSI_QUAD_SIZE],const int t[TGSI_QUAD_SIZE],const int r[TGSI_QUAD_SIZE],const int sample[TGSI_QUAD_SIZE],float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])203 sp_tgsi_load(const struct tgsi_image *image,
204              const struct tgsi_image_params *params,
205              const int s[TGSI_QUAD_SIZE],
206              const int t[TGSI_QUAD_SIZE],
207              const int r[TGSI_QUAD_SIZE],
208              const int sample[TGSI_QUAD_SIZE],
209              float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])
210 {
211    struct sp_tgsi_image *sp_img = (struct sp_tgsi_image *)image;
212    struct pipe_image_view *iview;
213    struct softpipe_resource *spr;
214    unsigned width, height, depth;
215    unsigned stride;
216    int c, j;
217    char *data_ptr;
218    unsigned offset = 0;
219 
220    if (params->unit >= PIPE_MAX_SHADER_IMAGES)
221       goto fail_write_all_zero;
222    iview = &sp_img->sp_iview[params->unit];
223    spr = (struct softpipe_resource *)iview->resource;
224    if (!spr)
225       goto fail_write_all_zero;
226 
227    if (!has_compat_target(spr->base.target, params->tgsi_tex_instr))
228       goto fail_write_all_zero;
229 
230    if (!get_dimensions(iview, spr, params->tgsi_tex_instr,
231                        params->format, &width, &height, &depth))
232       return;
233 
234    stride = util_format_get_stride(params->format, width);
235 
236    for (j = 0; j < TGSI_QUAD_SIZE; j++) {
237       int s_coord, t_coord, r_coord;
238       bool fill_zero = false;
239 
240       if (!(params->execmask & (1 << j)))
241          fill_zero = true;
242 
243       fill_coords(params, j, s, t, r, &s_coord, &t_coord, &r_coord);
244       if (!bounds_check(width, height, depth,
245                         s_coord, t_coord, r_coord))
246          fill_zero = true;
247 
248       if (fill_zero) {
249          int nc = util_format_get_nr_components(params->format);
250          int ival = util_format_is_pure_integer(params->format);
251          for (c = 0; c < 4; c++) {
252             rgba[c][j] = 0;
253             if (c == 3 && nc < 4) {
254                if (ival)
255                   ((int32_t *)rgba[c])[j] = 1;
256                else
257                   rgba[c][j] = 1.0;
258             }
259          }
260          continue;
261       }
262       offset = get_image_offset(spr, iview, params->format, r_coord);
263       data_ptr = (char *)spr->data + offset;
264 
265       uint32_t sdata[4];
266       util_format_read_4(params->format,
267                          sdata, 0,
268                          data_ptr, stride,
269                          s_coord, t_coord, 1, 1);
270       for (c = 0; c < 4; c++)
271          ((uint32_t *)rgba[c])[j] = sdata[c];
272    }
273    return;
274 fail_write_all_zero:
275    for (j = 0; j < TGSI_QUAD_SIZE; j++) {
276       for (c = 0; c < 4; c++)
277          rgba[c][j] = 0;
278    }
279    return;
280 }
281 
282 /*
283  * Implement the image STORE operation.
284  */
285 static void
sp_tgsi_store(const struct tgsi_image * image,const struct tgsi_image_params * params,const int s[TGSI_QUAD_SIZE],const int t[TGSI_QUAD_SIZE],const int r[TGSI_QUAD_SIZE],const int sample[TGSI_QUAD_SIZE],float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])286 sp_tgsi_store(const struct tgsi_image *image,
287               const struct tgsi_image_params *params,
288               const int s[TGSI_QUAD_SIZE],
289               const int t[TGSI_QUAD_SIZE],
290               const int r[TGSI_QUAD_SIZE],
291               const int sample[TGSI_QUAD_SIZE],
292               float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])
293 {
294    struct sp_tgsi_image *sp_img = (struct sp_tgsi_image *)image;
295    struct pipe_image_view *iview;
296    struct softpipe_resource *spr;
297    unsigned width, height, depth;
298    unsigned stride;
299    char *data_ptr;
300    int j, c;
301    unsigned offset = 0;
302    unsigned pformat = params->format;
303 
304    if (params->unit >= PIPE_MAX_SHADER_IMAGES)
305       return;
306    iview = &sp_img->sp_iview[params->unit];
307    spr = (struct softpipe_resource *)iview->resource;
308    if (!spr)
309       return;
310    if (!has_compat_target(spr->base.target, params->tgsi_tex_instr))
311       return;
312 
313    if (params->format == PIPE_FORMAT_NONE)
314       pformat = spr->base.format;
315 
316    if (!get_dimensions(iview, spr, params->tgsi_tex_instr,
317                        pformat, &width, &height, &depth))
318       return;
319 
320    stride = util_format_get_stride(pformat, width);
321 
322    for (j = 0; j < TGSI_QUAD_SIZE; j++) {
323       int s_coord, t_coord, r_coord;
324 
325       if (!(params->execmask & (1 << j)))
326          continue;
327 
328       fill_coords(params, j, s, t, r, &s_coord, &t_coord, &r_coord);
329       if (!bounds_check(width, height, depth,
330                         s_coord, t_coord, r_coord))
331          continue;
332 
333       offset = get_image_offset(spr, iview, pformat, r_coord);
334       data_ptr = (char *)spr->data + offset;
335 
336       uint32_t sdata[4];
337       for (c = 0; c < 4; c++)
338          sdata[c] = ((uint32_t *)rgba[c])[j];
339       util_format_write_4(pformat, sdata, 0, data_ptr, stride,
340                           s_coord, t_coord, 1, 1);
341    }
342 }
343 
344 /*
345  * Implement atomic operations on unsigned integers.
346  */
347 static void
handle_op_uint(const struct pipe_image_view * iview,const struct tgsi_image_params * params,bool just_read,char * data_ptr,uint qi,unsigned stride,enum tgsi_opcode opcode,int s,int t,float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE],float rgba2[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])348 handle_op_uint(const struct pipe_image_view *iview,
349                const struct tgsi_image_params *params,
350                bool just_read,
351                char *data_ptr,
352                uint qi,
353                unsigned stride,
354                enum tgsi_opcode opcode,
355                int s,
356                int t,
357                float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE],
358                float rgba2[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])
359 {
360    uint c;
361    int nc = util_format_get_nr_components(params->format);
362    unsigned sdata[4];
363 
364    util_format_read_4(params->format,
365                       sdata, 0,
366                       data_ptr, stride,
367                       s, t, 1, 1);
368 
369    if (just_read) {
370       for (c = 0; c < nc; c++) {
371          ((uint32_t *)rgba[c])[qi] = sdata[c];
372       }
373       return;
374    }
375    switch (opcode) {
376    case TGSI_OPCODE_ATOMUADD:
377       for (c = 0; c < nc; c++) {
378          unsigned temp = sdata[c];
379          sdata[c] += ((uint32_t *)rgba[c])[qi];
380          ((uint32_t *)rgba[c])[qi] = temp;
381       }
382       break;
383    case TGSI_OPCODE_ATOMXCHG:
384       for (c = 0; c < nc; c++) {
385          unsigned temp = sdata[c];
386          sdata[c] = ((uint32_t *)rgba[c])[qi];
387          ((uint32_t *)rgba[c])[qi] = temp;
388       }
389       break;
390    case TGSI_OPCODE_ATOMCAS:
391       for (c = 0; c < nc; c++) {
392          unsigned dst_x = sdata[c];
393          unsigned cmp_x = ((uint32_t *)rgba[c])[qi];
394          unsigned src_x = ((uint32_t *)rgba2[c])[qi];
395          unsigned temp = sdata[c];
396          sdata[c] = (dst_x == cmp_x) ? src_x : dst_x;
397          ((uint32_t *)rgba[c])[qi] = temp;
398       }
399       break;
400    case TGSI_OPCODE_ATOMAND:
401       for (c = 0; c < nc; c++) {
402          unsigned temp = sdata[c];
403          sdata[c] &= ((uint32_t *)rgba[c])[qi];
404          ((uint32_t *)rgba[c])[qi] = temp;
405       }
406       break;
407    case TGSI_OPCODE_ATOMOR:
408       for (c = 0; c < nc; c++) {
409          unsigned temp = sdata[c];
410          sdata[c] |= ((uint32_t *)rgba[c])[qi];
411          ((uint32_t *)rgba[c])[qi] = temp;
412       }
413       break;
414    case TGSI_OPCODE_ATOMXOR:
415       for (c = 0; c < nc; c++) {
416          unsigned temp = sdata[c];
417          sdata[c] ^= ((uint32_t *)rgba[c])[qi];
418          ((uint32_t *)rgba[c])[qi] = temp;
419       }
420       break;
421    case TGSI_OPCODE_ATOMUMIN:
422       for (c = 0; c < nc; c++) {
423          unsigned dst_x = sdata[c];
424          unsigned src_x = ((uint32_t *)rgba[c])[qi];
425          sdata[c] = MIN2(dst_x, src_x);
426          ((uint32_t *)rgba[c])[qi] = dst_x;
427       }
428       break;
429    case TGSI_OPCODE_ATOMUMAX:
430       for (c = 0; c < nc; c++) {
431          unsigned dst_x = sdata[c];
432          unsigned src_x = ((uint32_t *)rgba[c])[qi];
433          sdata[c] = MAX2(dst_x, src_x);
434          ((uint32_t *)rgba[c])[qi] = dst_x;
435       }
436       break;
437    case TGSI_OPCODE_ATOMIMIN:
438       for (c = 0; c < nc; c++) {
439          int dst_x = sdata[c];
440          int src_x = ((uint32_t *)rgba[c])[qi];
441          sdata[c] = MIN2(dst_x, src_x);
442          ((uint32_t *)rgba[c])[qi] = dst_x;
443       }
444       break;
445    case TGSI_OPCODE_ATOMIMAX:
446       for (c = 0; c < nc; c++) {
447          int dst_x = sdata[c];
448          int src_x = ((uint32_t *)rgba[c])[qi];
449          sdata[c] = MAX2(dst_x, src_x);
450          ((uint32_t *)rgba[c])[qi] = dst_x;
451       }
452       break;
453    default:
454       assert(!"Unexpected TGSI opcode in sp_tgsi_op");
455       break;
456    }
457    util_format_write_4(params->format, sdata, 0, data_ptr, stride,
458                        s, t, 1, 1);
459 }
460 
461 /*
462  * Implement atomic operations on signed integers.
463  */
464 static void
handle_op_int(const struct pipe_image_view * iview,const struct tgsi_image_params * params,bool just_read,char * data_ptr,uint qi,unsigned stride,enum tgsi_opcode opcode,int s,int t,float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE],float rgba2[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])465 handle_op_int(const struct pipe_image_view *iview,
466               const struct tgsi_image_params *params,
467               bool just_read,
468               char *data_ptr,
469               uint qi,
470               unsigned stride,
471               enum tgsi_opcode opcode,
472               int s,
473               int t,
474               float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE],
475               float rgba2[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])
476 {
477    uint c;
478    int nc = util_format_get_nr_components(params->format);
479    int sdata[4];
480    util_format_read_4(params->format,
481                       sdata, 0,
482                       data_ptr, stride,
483                       s, t, 1, 1);
484 
485    if (just_read) {
486       for (c = 0; c < nc; c++) {
487          ((int32_t *)rgba[c])[qi] = sdata[c];
488       }
489       return;
490    }
491    switch (opcode) {
492    case TGSI_OPCODE_ATOMUADD:
493       for (c = 0; c < nc; c++) {
494          int temp = sdata[c];
495          sdata[c] += ((int32_t *)rgba[c])[qi];
496          ((int32_t *)rgba[c])[qi] = temp;
497       }
498       break;
499    case TGSI_OPCODE_ATOMXCHG:
500       for (c = 0; c < nc; c++) {
501          int temp = sdata[c];
502          sdata[c] = ((int32_t *)rgba[c])[qi];
503          ((int32_t *)rgba[c])[qi] = temp;
504       }
505       break;
506    case TGSI_OPCODE_ATOMCAS:
507       for (c = 0; c < nc; c++) {
508          int dst_x = sdata[c];
509          int cmp_x = ((int32_t *)rgba[c])[qi];
510          int src_x = ((int32_t *)rgba2[c])[qi];
511          int temp = sdata[c];
512          sdata[c] = (dst_x == cmp_x) ? src_x : dst_x;
513          ((int32_t *)rgba[c])[qi] = temp;
514       }
515       break;
516    case TGSI_OPCODE_ATOMAND:
517       for (c = 0; c < nc; c++) {
518          int temp = sdata[c];
519          sdata[c] &= ((int32_t *)rgba[c])[qi];
520          ((int32_t *)rgba[c])[qi] = temp;
521       }
522       break;
523    case TGSI_OPCODE_ATOMOR:
524       for (c = 0; c < nc; c++) {
525          int temp = sdata[c];
526          sdata[c] |= ((int32_t *)rgba[c])[qi];
527          ((int32_t *)rgba[c])[qi] = temp;
528       }
529       break;
530    case TGSI_OPCODE_ATOMXOR:
531       for (c = 0; c < nc; c++) {
532          int temp = sdata[c];
533          sdata[c] ^= ((int32_t *)rgba[c])[qi];
534          ((int32_t *)rgba[c])[qi] = temp;
535       }
536       break;
537    case TGSI_OPCODE_ATOMUMIN:
538       for (c = 0; c < nc; c++) {
539          int dst_x = sdata[c];
540          int src_x = ((int32_t *)rgba[c])[qi];
541          sdata[c] = MIN2(dst_x, src_x);
542          ((int32_t *)rgba[c])[qi] = dst_x;
543       }
544       break;
545    case TGSI_OPCODE_ATOMUMAX:
546       for (c = 0; c < nc; c++) {
547          int dst_x = sdata[c];
548          int src_x = ((int32_t *)rgba[c])[qi];
549          sdata[c] = MAX2(dst_x, src_x);
550          ((int32_t *)rgba[c])[qi] = dst_x;
551       }
552       break;
553    case TGSI_OPCODE_ATOMIMIN:
554       for (c = 0; c < nc; c++) {
555          int dst_x = sdata[c];
556          int src_x = ((int32_t *)rgba[c])[qi];
557          sdata[c] = MIN2(dst_x, src_x);
558          ((int32_t *)rgba[c])[qi] = dst_x;
559       }
560       break;
561    case TGSI_OPCODE_ATOMIMAX:
562       for (c = 0; c < nc; c++) {
563          int dst_x = sdata[c];
564          int src_x = ((int32_t *)rgba[c])[qi];
565          sdata[c] = MAX2(dst_x, src_x);
566          ((int32_t *)rgba[c])[qi] = dst_x;
567       }
568       break;
569    default:
570       assert(!"Unexpected TGSI opcode in sp_tgsi_op");
571       break;
572    }
573    util_format_write_4(params->format, sdata, 0, data_ptr, stride,
574                        s, t, 1, 1);
575 }
576 
577 /* GLES OES_shader_image_atomic.txt allows XCHG on R32F */
578 static void
handle_op_r32f_xchg(const struct pipe_image_view * iview,const struct tgsi_image_params * params,bool just_read,char * data_ptr,uint qi,unsigned stride,enum tgsi_opcode opcode,int s,int t,float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])579 handle_op_r32f_xchg(const struct pipe_image_view *iview,
580                     const struct tgsi_image_params *params,
581                     bool just_read,
582                     char *data_ptr,
583                     uint qi,
584                     unsigned stride,
585                     enum tgsi_opcode opcode,
586                     int s,
587                     int t,
588                     float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])
589 {
590    float sdata[4];
591    uint c;
592    int nc = 1;
593    util_format_read_4(params->format,
594                       sdata, 0,
595                       data_ptr, stride,
596                       s, t, 1, 1);
597    if (just_read) {
598       for (c = 0; c < nc; c++) {
599          ((int32_t *)rgba[c])[qi] = sdata[c];
600       }
601       return;
602    }
603 
604    for (c = 0; c < nc; c++) {
605       int temp = sdata[c];
606       sdata[c] = ((float *)rgba[c])[qi];
607       ((float *)rgba[c])[qi] = temp;
608    }
609    util_format_write_4(params->format, sdata, 0, data_ptr, stride,
610                        s, t, 1, 1);
611 }
612 
613 /*
614  * Implement atomic image operations.
615  */
616 static void
sp_tgsi_op(const struct tgsi_image * image,const struct tgsi_image_params * params,enum tgsi_opcode opcode,const int s[TGSI_QUAD_SIZE],const int t[TGSI_QUAD_SIZE],const int r[TGSI_QUAD_SIZE],const int sample[TGSI_QUAD_SIZE],float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE],float rgba2[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])617 sp_tgsi_op(const struct tgsi_image *image,
618            const struct tgsi_image_params *params,
619            enum tgsi_opcode opcode,
620            const int s[TGSI_QUAD_SIZE],
621            const int t[TGSI_QUAD_SIZE],
622            const int r[TGSI_QUAD_SIZE],
623            const int sample[TGSI_QUAD_SIZE],
624            float rgba[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE],
625            float rgba2[TGSI_NUM_CHANNELS][TGSI_QUAD_SIZE])
626 {
627    struct sp_tgsi_image *sp_img = (struct sp_tgsi_image *)image;
628    struct pipe_image_view *iview;
629    struct softpipe_resource *spr;
630    unsigned width, height, depth;
631    unsigned stride;
632    int j, c;
633    unsigned offset;
634    char *data_ptr;
635 
636    if (params->unit >= PIPE_MAX_SHADER_IMAGES)
637       return;
638    iview = &sp_img->sp_iview[params->unit];
639    spr = (struct softpipe_resource *)iview->resource;
640    if (!spr)
641       goto fail_write_all_zero;
642    if (!has_compat_target(spr->base.target, params->tgsi_tex_instr))
643       goto fail_write_all_zero;
644 
645    if (!get_dimensions(iview, spr, params->tgsi_tex_instr,
646                        params->format, &width, &height, &depth))
647       goto fail_write_all_zero;
648 
649    stride = util_format_get_stride(spr->base.format, width);
650 
651    for (j = 0; j < TGSI_QUAD_SIZE; j++) {
652       int s_coord, t_coord, r_coord;
653       bool just_read = false;
654 
655       fill_coords(params, j, s, t, r, &s_coord, &t_coord, &r_coord);
656       if (!bounds_check(width, height, depth,
657                         s_coord, t_coord, r_coord)) {
658          int nc = util_format_get_nr_components(params->format);
659          int ival = util_format_is_pure_integer(params->format);
660          int c;
661          for (c = 0; c < 4; c++) {
662             rgba[c][j] = 0;
663             if (c == 3 && nc < 4) {
664                if (ival)
665                   ((int32_t *)rgba[c])[j] = 1;
666                else
667                   rgba[c][j] = 1.0;
668             }
669          }
670          continue;
671       }
672 
673       /* just readback the value for atomic if execmask isn't set */
674       if (!(params->execmask & (1 << j))) {
675          just_read = true;
676       }
677 
678       offset = get_image_offset(spr, iview, params->format, r_coord);
679       data_ptr = (char *)spr->data + offset;
680 
681       /* we should see atomic operations on r32 formats */
682       if (util_format_is_pure_uint(params->format))
683          handle_op_uint(iview, params, just_read, data_ptr, j, stride,
684                         opcode, s_coord, t_coord, rgba, rgba2);
685       else if (util_format_is_pure_sint(params->format))
686          handle_op_int(iview, params, just_read, data_ptr, j, stride,
687                        opcode, s_coord, t_coord, rgba, rgba2);
688       else if (params->format == PIPE_FORMAT_R32_FLOAT &&
689                opcode == TGSI_OPCODE_ATOMXCHG)
690          handle_op_r32f_xchg(iview, params, just_read, data_ptr, j, stride,
691                              opcode, s_coord, t_coord, rgba);
692       else
693          assert(0);
694    }
695    return;
696 fail_write_all_zero:
697    for (j = 0; j < TGSI_QUAD_SIZE; j++) {
698       for (c = 0; c < 4; c++)
699          rgba[c][j] = 0;
700    }
701    return;
702 }
703 
704 static void
sp_tgsi_get_dims(const struct tgsi_image * image,const struct tgsi_image_params * params,int dims[4])705 sp_tgsi_get_dims(const struct tgsi_image *image,
706                  const struct tgsi_image_params *params,
707                  int dims[4])
708 {
709    struct sp_tgsi_image *sp_img = (struct sp_tgsi_image *)image;
710    struct pipe_image_view *iview;
711    struct softpipe_resource *spr;
712    int level;
713 
714    if (params->unit >= PIPE_MAX_SHADER_IMAGES)
715       return;
716    iview = &sp_img->sp_iview[params->unit];
717    spr = (struct softpipe_resource *)iview->resource;
718    if (!spr)
719       return;
720 
721    if (params->tgsi_tex_instr == TGSI_TEXTURE_BUFFER) {
722       dims[0] = iview->u.buf.size / util_format_get_blocksize(iview->format);
723       dims[1] = dims[2] = dims[3] = 0;
724       return;
725    }
726 
727    level = iview->u.tex.level;
728    dims[0] = u_minify(spr->base.width0, level);
729    switch (params->tgsi_tex_instr) {
730    case TGSI_TEXTURE_1D_ARRAY:
731       dims[1] = iview->u.tex.last_layer - iview->u.tex.first_layer + 1;
732       FALLTHROUGH;
733    case TGSI_TEXTURE_1D:
734       return;
735    case TGSI_TEXTURE_2D_ARRAY:
736       dims[2] = iview->u.tex.last_layer - iview->u.tex.first_layer + 1;
737       FALLTHROUGH;
738    case TGSI_TEXTURE_2D:
739    case TGSI_TEXTURE_CUBE:
740    case TGSI_TEXTURE_RECT:
741       dims[1] = u_minify(spr->base.height0, level);
742       return;
743    case TGSI_TEXTURE_3D:
744       dims[1] = u_minify(spr->base.height0, level);
745       dims[2] = u_minify(spr->base.depth0, level);
746       return;
747    case TGSI_TEXTURE_CUBE_ARRAY:
748       dims[1] = u_minify(spr->base.height0, level);
749       dims[2] = (iview->u.tex.last_layer - iview->u.tex.first_layer + 1) / 6;
750       break;
751    default:
752       assert(!"unexpected texture target in sp_get_dims()");
753       return;
754    }
755 }
756 
757 struct sp_tgsi_image *
sp_create_tgsi_image(void)758 sp_create_tgsi_image(void)
759 {
760    struct sp_tgsi_image *img = CALLOC_STRUCT(sp_tgsi_image);
761    if (!img)
762       return NULL;
763 
764    img->base.load = sp_tgsi_load;
765    img->base.store = sp_tgsi_store;
766    img->base.op = sp_tgsi_op;
767    img->base.get_dims = sp_tgsi_get_dims;
768    return img;
769 };
770