1 /*
2 * Copyright © Microsoft Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "d3d12_context.h"
25 #include "d3d12_compiler.h"
26 #include "d3d12_debug.h"
27 #include "d3d12_format.h"
28 #include "d3d12_resource.h"
29 #include "d3d12_screen.h"
30
31 #include "util/u_blitter.h"
32 #include "util/format/u_format.h"
33
34 #include "nir_to_dxil.h"
35 #include "nir_builder.h"
36
37 static void
copy_buffer_region_no_barriers(struct d3d12_context * ctx,struct d3d12_resource * dst,uint64_t dst_offset,struct d3d12_resource * src,uint64_t src_offset,uint64_t size)38 copy_buffer_region_no_barriers(struct d3d12_context *ctx,
39 struct d3d12_resource *dst,
40 uint64_t dst_offset,
41 struct d3d12_resource *src,
42 uint64_t src_offset,
43 uint64_t size)
44 {
45 uint64_t dst_off, src_off;
46 ID3D12Resource *dst_buf = d3d12_resource_underlying(dst, &dst_off);
47 ID3D12Resource *src_buf = d3d12_resource_underlying(src, &src_off);
48
49 ctx->cmdlist->CopyBufferRegion(dst_buf, dst_offset + dst_off,
50 src_buf, src_offset + src_off,
51 size);
52 }
53
54 static bool
is_resolve(const struct pipe_blit_info * info)55 is_resolve(const struct pipe_blit_info *info)
56 {
57 return info->src.resource->nr_samples > 1 &&
58 info->dst.resource->nr_samples <= 1;
59 }
60
61 static bool
resolve_supported(const struct pipe_blit_info * info)62 resolve_supported(const struct pipe_blit_info *info)
63 {
64 assert(is_resolve(info));
65
66 // check for unsupported operations
67 if (util_format_is_depth_or_stencil(info->src.format) &&
68 info->mask != PIPE_MASK_Z) {
69 return false;
70 } else {
71 if (util_format_get_mask(info->dst.format) != info->mask ||
72 util_format_get_mask(info->src.format) != info->mask)
73 return false;
74 }
75
76 if (info->filter != PIPE_TEX_FILTER_NEAREST ||
77 info->scissor_enable ||
78 info->num_window_rectangles > 0 ||
79 info->alpha_blend)
80 return false;
81
82 // formats need to match
83 struct d3d12_resource *src = d3d12_resource(info->src.resource);
84 struct d3d12_resource *dst = d3d12_resource(info->dst.resource);
85 if (src->dxgi_format != dst->dxgi_format)
86 return false;
87
88 if (util_format_is_pure_integer(src->base.format))
89 return false;
90
91 // sizes needs to match
92 if (info->src.box.width != info->dst.box.width ||
93 info->src.box.height != info->dst.box.height)
94 return false;
95
96 // can only resolve full subresource
97 if (info->src.box.width != (int)u_minify(info->src.resource->width0,
98 info->src.level) ||
99 info->src.box.height != (int)u_minify(info->src.resource->height0,
100 info->src.level) ||
101 info->dst.box.width != (int)u_minify(info->dst.resource->width0,
102 info->dst.level) ||
103 info->dst.box.height != (int)u_minify(info->dst.resource->height0,
104 info->dst.level))
105 return false;
106
107 return true;
108 }
109
110 static void
blit_resolve(struct d3d12_context * ctx,const struct pipe_blit_info * info)111 blit_resolve(struct d3d12_context *ctx, const struct pipe_blit_info *info)
112 {
113 struct d3d12_batch *batch = d3d12_current_batch(ctx);
114 struct d3d12_resource *src = d3d12_resource(info->src.resource);
115 struct d3d12_resource *dst = d3d12_resource(info->dst.resource);
116
117 d3d12_transition_resource_state(ctx, src,
118 D3D12_RESOURCE_STATE_RESOLVE_SOURCE,
119 D3D12_BIND_INVALIDATE_FULL);
120 d3d12_transition_resource_state(ctx, dst,
121 D3D12_RESOURCE_STATE_RESOLVE_DEST,
122 D3D12_BIND_INVALIDATE_FULL);
123
124 d3d12_apply_resource_states(ctx);
125
126 d3d12_batch_reference_resource(batch, src);
127 d3d12_batch_reference_resource(batch, dst);
128
129 DXGI_FORMAT dxgi_format = d3d12_get_resource_srv_format(src->base.format, src->base.target);
130
131 assert(src->dxgi_format == dst->dxgi_format);
132 ctx->cmdlist->ResolveSubresource(
133 d3d12_resource_resource(dst), info->dst.level,
134 d3d12_resource_resource(src), info->src.level,
135 dxgi_format);
136 }
137
138 static bool
formats_are_copy_compatible(enum pipe_format src,enum pipe_format dst)139 formats_are_copy_compatible(enum pipe_format src, enum pipe_format dst)
140 {
141 if (src == dst)
142 return true;
143
144 /* We can skip the stencil copy */
145 if (util_format_get_depth_only(src) == dst ||
146 util_format_get_depth_only(dst) == src)
147 return true;
148
149 return false;
150 }
151
152 static bool
box_fits(const struct pipe_box * box,const struct pipe_resource * res,int level)153 box_fits(const struct pipe_box *box, const struct pipe_resource *res, int level)
154 {
155 unsigned lwidth = u_minify(res->width0, level);
156 unsigned lheight= u_minify(res->height0, level);
157 unsigned ldepth = res->target == PIPE_TEXTURE_3D ? u_minify(res->depth0, level) :
158 res->array_size;
159
160 unsigned wb = box->x;
161 unsigned we = box->x + box->width;
162
163 unsigned hb = box->y;
164 unsigned he = box->y + box->height;
165
166 unsigned db = box->z;
167 unsigned de = box->z + box->depth;
168
169 return (wb <= lwidth && we <= lwidth &&
170 hb <= lheight && he <= lheight &&
171 db <= ldepth && de <= ldepth);
172 }
173
174 static bool
direct_copy_supported(struct d3d12_screen * screen,const struct pipe_blit_info * info,bool have_predication)175 direct_copy_supported(struct d3d12_screen *screen,
176 const struct pipe_blit_info *info,
177 bool have_predication)
178 {
179 if (info->scissor_enable || info->alpha_blend ||
180 (have_predication && info->render_condition_enable) ||
181 MAX2(info->src.resource->nr_samples, 1) != MAX2(info->dst.resource->nr_samples, 1)) {
182 return false;
183 }
184
185 if (!formats_are_copy_compatible(info->src.format, info->dst.format))
186 return false;
187
188 if (util_format_is_depth_or_stencil(info->src.format) && !(info->mask & PIPE_MASK_ZS)) {
189 return false;
190 }
191
192 if (!util_format_is_depth_or_stencil(info->src.format)) {
193 if (util_format_get_mask(info->dst.format) != info->mask ||
194 util_format_get_mask(info->src.format) != info->mask)
195 return false;
196 }
197
198 if (abs(info->src.box.height) != info->dst.box.height) {
199 return false;
200 }
201
202 if (info->src.box.height != info->dst.box.height &&
203 (!util_format_is_depth_or_stencil(info->src.format) ||
204 screen->opts2.ProgrammableSamplePositionsTier ==
205 D3D12_PROGRAMMABLE_SAMPLE_POSITIONS_TIER_NOT_SUPPORTED)) {
206 return false;
207 }
208
209 if (!box_fits(&info->dst.box, info->dst.resource, info->dst.level)) {
210 return false;
211 }
212 if (!box_fits(&info->src.box, info->src.resource, info->src.level)) {
213 return false;
214 }
215
216 if (info->src.box.width != info->dst.box.width) {
217 return false;
218 }
219
220 if (info->src.box.depth != info->dst.box.depth) {
221 return false;
222 }
223
224 if ((screen->opts2.ProgrammableSamplePositionsTier ==
225 D3D12_PROGRAMMABLE_SAMPLE_POSITIONS_TIER_NOT_SUPPORTED &&
226 (info->src.resource->bind & PIPE_BIND_DEPTH_STENCIL ||
227 info->dst.resource->bind & PIPE_BIND_DEPTH_STENCIL)) ||
228 info->src.resource->nr_samples > 1) {
229
230 if (info->dst.box.x != 0 ||
231 info->dst.box.y != 0 ||
232 info->dst.box.z != 0)
233 return false;
234
235 if (info->src.box.x != 0 ||
236 info->src.box.y != 0 ||
237 info->src.box.z != 0 ||
238 info->src.box.width != (int)u_minify(info->src.resource->width0,
239 info->src.level) ||
240 info->src.box.height != (int)u_minify(info->src.resource->height0,
241 info->src.level) ||
242 info->src.box.depth != (int)u_minify(info->src.resource->depth0,
243 info->src.level))
244 return false;
245 }
246
247 return true;
248 }
249
250 inline static unsigned
get_subresource_id(enum pipe_texture_target target,unsigned subres,unsigned stride,unsigned z,unsigned * updated_z)251 get_subresource_id(enum pipe_texture_target target, unsigned subres, unsigned stride,
252 unsigned z, unsigned *updated_z)
253 {
254 if (d3d12_subresource_id_uses_layer(target)) {
255 subres += stride * z;
256 if (updated_z)
257 *updated_z = 0;
258 }
259 return subres;
260 }
261
262 static void
copy_subregion_no_barriers(struct d3d12_context * ctx,struct d3d12_resource * dst,unsigned dst_level,unsigned dstx,unsigned dsty,unsigned dstz,struct d3d12_resource * src,unsigned src_level,const struct pipe_box * psrc_box,unsigned mask)263 copy_subregion_no_barriers(struct d3d12_context *ctx,
264 struct d3d12_resource *dst,
265 unsigned dst_level,
266 unsigned dstx, unsigned dsty, unsigned dstz,
267 struct d3d12_resource *src,
268 unsigned src_level,
269 const struct pipe_box *psrc_box,
270 unsigned mask)
271 {
272 UNUSED struct d3d12_screen *screen = d3d12_screen(ctx->base.screen);
273 D3D12_TEXTURE_COPY_LOCATION src_loc, dst_loc;
274 unsigned src_z = psrc_box->z;
275
276 int src_subres_stride = src->base.last_level + 1;
277 int dst_subres_stride = dst->base.last_level + 1;
278
279 int src_array_size = src->base.array_size;
280 int dst_array_size = dst->base.array_size;
281
282 if (dst->base.target == PIPE_TEXTURE_CUBE)
283 dst_array_size *= 6;
284
285 if (src->base.target == PIPE_TEXTURE_CUBE)
286 src_array_size *= 6;
287
288 int stencil_src_res_offset = 1;
289 int stencil_dst_res_offset = 1;
290
291 int src_nres = 1;
292 int dst_nres = 1;
293
294 if (dst->base.format == PIPE_FORMAT_Z24_UNORM_S8_UINT ||
295 dst->base.format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
296 dst->base.format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT) {
297 stencil_dst_res_offset = dst_subres_stride * dst_array_size;
298 src_nres = 2;
299 }
300
301 if (src->base.format == PIPE_FORMAT_Z24_UNORM_S8_UINT ||
302 src->base.format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
303 dst->base.format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT) {
304 stencil_src_res_offset = src_subres_stride * src_array_size;
305 dst_nres = 2;
306 }
307
308 static_assert(PIPE_MASK_S == 0x20 && PIPE_MASK_Z == 0x10, "unexpected ZS format mask");
309 int nsubres = MIN2(src_nres, dst_nres);
310 unsigned subresource_copy_mask = nsubres > 1 ? mask >> 4 : 1;
311
312 for (int subres = 0; subres < nsubres; ++subres) {
313
314 if (!(subresource_copy_mask & (1 << subres)))
315 continue;
316
317 src_loc.Type = D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX;
318 src_loc.SubresourceIndex = get_subresource_id(src->base.target, src_level, src_subres_stride, src_z, &src_z) +
319 subres * stencil_src_res_offset;
320 src_loc.pResource = d3d12_resource_resource(src);
321
322 dst_loc.Type = D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX;
323 dst_loc.SubresourceIndex = get_subresource_id(dst->base.target, dst_level, dst_subres_stride, dstz, &dstz) +
324 subres * stencil_dst_res_offset;
325 dst_loc.pResource = d3d12_resource_resource(dst);
326
327 if (psrc_box->x == 0 && psrc_box->y == 0 && psrc_box->z == 0 &&
328 psrc_box->width == (int)u_minify(src->base.width0, src_level) &&
329 psrc_box->height == (int)u_minify(src->base.height0, src_level) &&
330 psrc_box->depth == (int)u_minify(src->base.depth0, src_level)) {
331
332 assert((dstx == 0 && dsty == 0 && dstz == 0) ||
333 screen->opts2.ProgrammableSamplePositionsTier !=
334 D3D12_PROGRAMMABLE_SAMPLE_POSITIONS_TIER_NOT_SUPPORTED ||
335 (!util_format_is_depth_or_stencil(dst->base.format) &&
336 !util_format_is_depth_or_stencil(src->base.format) &&
337 dst->base.nr_samples <= 1 &&
338 src->base.nr_samples <= 1));
339
340 ctx->cmdlist->CopyTextureRegion(&dst_loc, dstx, dsty, dstz,
341 &src_loc, NULL);
342
343 } else {
344 D3D12_BOX src_box;
345 src_box.left = psrc_box->x;
346 src_box.right = MIN2(psrc_box->x + psrc_box->width, (int)u_minify(src->base.width0, src_level));
347 src_box.top = psrc_box->y;
348 src_box.bottom = MIN2(psrc_box->y + psrc_box->height, (int)u_minify(src->base.height0, src_level));
349 src_box.front = src_z;
350 src_box.back = src_z + psrc_box->depth;
351
352 assert((screen->opts2.ProgrammableSamplePositionsTier !=
353 D3D12_PROGRAMMABLE_SAMPLE_POSITIONS_TIER_NOT_SUPPORTED ||
354 (!util_format_is_depth_or_stencil(dst->base.format) &&
355 !util_format_is_depth_or_stencil(src->base.format))) &&
356 dst->base.nr_samples <= 1 &&
357 src->base.nr_samples <= 1);
358
359 ctx->cmdlist->CopyTextureRegion(&dst_loc, dstx, dsty, dstz,
360 &src_loc, &src_box);
361 }
362 }
363 }
364
365 static void
copy_resource_y_flipped_no_barriers(struct d3d12_context * ctx,struct d3d12_resource * dst,unsigned dst_level,const struct pipe_box * pdst_box,struct d3d12_resource * src,unsigned src_level,const struct pipe_box * psrc_box,unsigned mask)366 copy_resource_y_flipped_no_barriers(struct d3d12_context *ctx,
367 struct d3d12_resource *dst,
368 unsigned dst_level,
369 const struct pipe_box *pdst_box,
370 struct d3d12_resource *src,
371 unsigned src_level,
372 const struct pipe_box *psrc_box,
373 unsigned mask)
374 {
375 if (D3D12_DEBUG_BLIT & d3d12_debug) {
376 debug_printf("D3D12 BLIT as COPY: from %s@%d %dx%dx%d + %dx%dx%d\n",
377 util_format_name(src->base.format), src_level,
378 psrc_box->x, psrc_box->y, psrc_box->z,
379 psrc_box->width, psrc_box->height, psrc_box->depth);
380 debug_printf(" to %s@%d %dx%dx%d\n",
381 util_format_name(dst->base.format), dst_level,
382 pdst_box->x, pdst_box->y, pdst_box->z);
383 }
384
385 struct pipe_box src_box = *psrc_box;
386 int src_inc = psrc_box->height > 0 ? 1 : -1;
387 int dst_inc = pdst_box->height > 0 ? 1 : -1;
388 src_box.height = 1;
389 int rows_to_copy = abs(psrc_box->height);
390
391 if (psrc_box->height < 0)
392 --src_box.y;
393
394 for (int y = 0, dest_y = pdst_box->y; y < rows_to_copy;
395 ++y, src_box.y += src_inc, dest_y += dst_inc) {
396 copy_subregion_no_barriers(ctx, dst, dst_level,
397 pdst_box->x, dest_y, pdst_box->z,
398 src, src_level, &src_box, mask);
399 }
400 }
401
402 void
d3d12_direct_copy(struct d3d12_context * ctx,struct d3d12_resource * dst,unsigned dst_level,const struct pipe_box * pdst_box,struct d3d12_resource * src,unsigned src_level,const struct pipe_box * psrc_box,unsigned mask)403 d3d12_direct_copy(struct d3d12_context *ctx,
404 struct d3d12_resource *dst,
405 unsigned dst_level,
406 const struct pipe_box *pdst_box,
407 struct d3d12_resource *src,
408 unsigned src_level,
409 const struct pipe_box *psrc_box,
410 unsigned mask)
411 {
412 struct d3d12_batch *batch = d3d12_current_batch(ctx);
413
414 unsigned src_subres = get_subresource_id(src->base.target, src_level, src->base.last_level + 1,
415 psrc_box->z, nullptr);
416 unsigned dst_subres = get_subresource_id(dst->base.target, dst_level, dst->base.last_level + 1,
417 pdst_box->z, nullptr);
418
419 if (D3D12_DEBUG_BLIT & d3d12_debug)
420 debug_printf("BLIT: Direct copy from subres %d to subres %d\n",
421 src_subres, dst_subres);
422
423 d3d12_transition_subresources_state(ctx, src, src_subres, 1, 0, 1,
424 d3d12_get_format_start_plane(src->base.format),
425 d3d12_get_format_num_planes(src->base.format),
426 D3D12_RESOURCE_STATE_COPY_SOURCE,
427 D3D12_BIND_INVALIDATE_FULL);
428
429 d3d12_transition_subresources_state(ctx, dst, dst_subres, 1, 0, 1,
430 d3d12_get_format_start_plane(dst->base.format),
431 d3d12_get_format_num_planes(dst->base.format),
432 D3D12_RESOURCE_STATE_COPY_DEST,
433 D3D12_BIND_INVALIDATE_FULL);
434
435 d3d12_apply_resource_states(ctx);
436
437 d3d12_batch_reference_resource(batch, src);
438 d3d12_batch_reference_resource(batch, dst);
439
440 if (src->base.target == PIPE_BUFFER) {
441 copy_buffer_region_no_barriers(ctx, dst, pdst_box->x,
442 src, psrc_box->x, psrc_box->width);
443 } else if (psrc_box->height == pdst_box->height) {
444 /* No flipping, we can forward this directly to resource_copy_region */
445 copy_subregion_no_barriers(ctx, dst, dst_level,
446 pdst_box->x, pdst_box->y, pdst_box->z,
447 src, src_level, psrc_box, mask);
448 } else {
449 assert(psrc_box->height == -pdst_box->height);
450 copy_resource_y_flipped_no_barriers(ctx, dst, dst_level, pdst_box,
451 src, src_level, psrc_box, mask);
452 }
453 }
454
455 static bool
is_same_resource(const struct pipe_blit_info * info)456 is_same_resource(const struct pipe_blit_info *info)
457 {
458 return d3d12_resource_resource(d3d12_resource(info->src.resource)) ==
459 d3d12_resource_resource(d3d12_resource(info->dst.resource)) &&
460 info->src.level == info->dst.level;
461 }
462
463 static struct pipe_resource *
create_staging_resource(struct d3d12_context * ctx,struct d3d12_resource * src,unsigned src_level,const struct pipe_box * src_box,struct pipe_box * dst_box,unsigned mask)464 create_staging_resource(struct d3d12_context *ctx,
465 struct d3d12_resource *src,
466 unsigned src_level,
467 const struct pipe_box *src_box,
468 struct pipe_box *dst_box,
469 unsigned mask)
470
471 {
472 struct pipe_resource templ = {};
473 struct pipe_resource *staging_res;
474 struct pipe_box copy_src;
475
476 u_box_3d(MIN2(src_box->x, src_box->x + src_box->width),
477 MIN2(src_box->y, src_box->y + src_box->height),
478 MIN2(src_box->z, src_box->z + src_box->depth),
479 abs(src_box->width), abs(src_box->height), abs(src_box->depth),
480 ©_src);
481
482 templ.format = src->base.format;
483 templ.width0 = copy_src.width;
484 templ.height0 = copy_src.height;
485 templ.depth0 = copy_src.depth;
486 templ.array_size = 1;
487 templ.nr_samples = 1;
488 templ.nr_storage_samples = 1;
489 templ.usage = PIPE_USAGE_STAGING;
490 templ.bind = util_format_is_depth_or_stencil(templ.format) ? PIPE_BIND_DEPTH_STENCIL : PIPE_BIND_RENDER_TARGET;
491 templ.target = src->base.target;
492
493 staging_res = ctx->base.screen->resource_create(ctx->base.screen, &templ);
494
495 dst_box->x = 0;
496 dst_box->y = 0;
497 dst_box->z = 0;
498 dst_box->width = copy_src.width;
499 dst_box->height = copy_src.height;
500 dst_box->depth = copy_src.depth;
501
502 d3d12_direct_copy(ctx, d3d12_resource(staging_res), 0, dst_box,
503 src, src_level, ©_src, mask);
504
505 if (src_box->width < 0) {
506 dst_box->x = dst_box->width;
507 dst_box->width = src_box->width;
508 }
509
510 if (src_box->height < 0) {
511 dst_box->y = dst_box->height;
512 dst_box->height = src_box->height;
513 }
514
515 if (src_box->depth < 0) {
516 dst_box->z = dst_box->depth;
517 dst_box->depth = src_box->depth;
518 }
519 return staging_res;
520 }
521
522 static void
blit_same_resource(struct d3d12_context * ctx,const struct pipe_blit_info * info)523 blit_same_resource(struct d3d12_context *ctx,
524 const struct pipe_blit_info *info)
525 {
526 struct pipe_blit_info dst_info = *info;
527
528 dst_info.src.level = 0;
529 dst_info.src.resource = create_staging_resource(ctx, d3d12_resource(info->src.resource),
530 info->src.level,
531 &info->src.box,
532 &dst_info.src.box, PIPE_MASK_RGBAZS);
533 ctx->base.blit(&ctx->base, &dst_info);
534 pipe_resource_reference(&dst_info.src.resource, NULL);
535 }
536
537 static void
util_blit_save_state(struct d3d12_context * ctx)538 util_blit_save_state(struct d3d12_context *ctx)
539 {
540 util_blitter_save_blend(ctx->blitter, ctx->gfx_pipeline_state.blend);
541 util_blitter_save_depth_stencil_alpha(ctx->blitter, ctx->gfx_pipeline_state.zsa);
542 util_blitter_save_vertex_elements(ctx->blitter, ctx->gfx_pipeline_state.ves);
543 util_blitter_save_stencil_ref(ctx->blitter, &ctx->stencil_ref);
544 util_blitter_save_rasterizer(ctx->blitter, ctx->gfx_pipeline_state.rast);
545 util_blitter_save_fragment_shader(ctx->blitter, ctx->gfx_stages[PIPE_SHADER_FRAGMENT]);
546 util_blitter_save_vertex_shader(ctx->blitter, ctx->gfx_stages[PIPE_SHADER_VERTEX]);
547 util_blitter_save_geometry_shader(ctx->blitter, ctx->gfx_stages[PIPE_SHADER_GEOMETRY]);
548
549 util_blitter_save_framebuffer(ctx->blitter, &ctx->fb);
550 util_blitter_save_viewport(ctx->blitter, ctx->viewport_states);
551 util_blitter_save_scissor(ctx->blitter, ctx->scissor_states);
552 util_blitter_save_fragment_sampler_states(ctx->blitter,
553 ctx->num_samplers[PIPE_SHADER_FRAGMENT],
554 (void **)ctx->samplers[PIPE_SHADER_FRAGMENT]);
555 util_blitter_save_fragment_sampler_views(ctx->blitter,
556 ctx->num_sampler_views[PIPE_SHADER_FRAGMENT],
557 ctx->sampler_views[PIPE_SHADER_FRAGMENT]);
558 util_blitter_save_fragment_constant_buffer_slot(ctx->blitter, ctx->cbufs[PIPE_SHADER_FRAGMENT]);
559 util_blitter_save_vertex_buffer_slot(ctx->blitter, ctx->vbs);
560 util_blitter_save_sample_mask(ctx->blitter, ctx->gfx_pipeline_state.sample_mask);
561 util_blitter_save_so_targets(ctx->blitter, ctx->gfx_pipeline_state.num_so_targets, ctx->so_targets);
562 }
563
564 static void
util_blit(struct d3d12_context * ctx,const struct pipe_blit_info * info)565 util_blit(struct d3d12_context *ctx,
566 const struct pipe_blit_info *info)
567 {
568 util_blit_save_state(ctx);
569
570 util_blitter_blit(ctx->blitter, info);
571 }
572
573 static bool
resolve_stencil_supported(struct d3d12_context * ctx,const struct pipe_blit_info * info)574 resolve_stencil_supported(struct d3d12_context *ctx,
575 const struct pipe_blit_info *info)
576 {
577 assert(is_resolve(info));
578
579 if (!util_format_is_depth_or_stencil(info->src.format) ||
580 !(info->mask & PIPE_MASK_S))
581 return false;
582
583 if (info->mask & PIPE_MASK_Z) {
584 struct pipe_blit_info new_info = *info;
585 new_info.mask = PIPE_MASK_Z;
586 if (!resolve_supported(&new_info) &&
587 !util_blitter_is_blit_supported(ctx->blitter, &new_info))
588 return false;
589 }
590
591 struct pipe_blit_info new_info = *info;
592 new_info.dst.format = PIPE_FORMAT_R8_UINT;
593 return util_blitter_is_blit_supported(ctx->blitter, &new_info);
594 }
595
596 static struct pipe_resource *
create_tmp_resource(struct pipe_screen * screen,const struct pipe_blit_info * info)597 create_tmp_resource(struct pipe_screen *screen,
598 const struct pipe_blit_info *info)
599 {
600 struct pipe_resource tpl = {};
601 tpl.width0 = info->dst.box.width;
602 tpl.height0 = info->dst.box.height;
603 tpl.depth0 = info->dst.box.depth;
604 tpl.array_size = 1;
605 tpl.format = PIPE_FORMAT_R8_UINT;
606 tpl.target = info->dst.resource->target;
607 tpl.nr_samples = info->dst.resource->nr_samples;
608 tpl.nr_storage_samples = info->dst.resource->nr_storage_samples;
609 tpl.usage = PIPE_USAGE_STREAM;
610 tpl.bind = PIPE_BIND_RENDER_TARGET | PIPE_BIND_SAMPLER_VIEW;
611 return screen->resource_create(screen, &tpl);
612 }
613
614 static void *
get_stencil_resolve_vs(struct d3d12_context * ctx)615 get_stencil_resolve_vs(struct d3d12_context *ctx)
616 {
617 if (ctx->stencil_resolve_vs)
618 return ctx->stencil_resolve_vs;
619
620 nir_builder b = nir_builder_init_simple_shader(MESA_SHADER_VERTEX,
621 dxil_get_nir_compiler_options(),
622 "linear_blit_vs");
623
624 const struct glsl_type *vec4 = glsl_vec4_type();
625 nir_variable *pos_in = nir_variable_create(b.shader, nir_var_shader_in,
626 vec4, "pos");
627
628 nir_variable *pos_out = nir_variable_create(b.shader, nir_var_shader_out,
629 vec4, "gl_Position");
630 pos_out->data.location = VARYING_SLOT_POS;
631
632 nir_store_var(&b, pos_out, nir_load_var(&b, pos_in), 0xf);
633
634 struct pipe_shader_state state = {};
635 state.type = PIPE_SHADER_IR_NIR;
636 state.ir.nir = b.shader;
637 ctx->stencil_resolve_vs = ctx->base.create_vs_state(&ctx->base, &state);
638
639 return ctx->stencil_resolve_vs;
640 }
641
642 static void *
get_stencil_resolve_fs(struct d3d12_context * ctx,bool no_flip)643 get_stencil_resolve_fs(struct d3d12_context *ctx, bool no_flip)
644 {
645 if (!no_flip && ctx->stencil_resolve_fs)
646 return ctx->stencil_resolve_fs;
647
648 if (no_flip && ctx->stencil_resolve_fs_no_flip)
649 return ctx->stencil_resolve_fs_no_flip;
650
651 nir_builder b = nir_builder_init_simple_shader(MESA_SHADER_FRAGMENT,
652 dxil_get_nir_compiler_options(),
653 no_flip ? "stencil_resolve_fs_no_flip" : "stencil_resolve_fs");
654
655 nir_variable *stencil_out = nir_variable_create(b.shader,
656 nir_var_shader_out,
657 glsl_uint_type(),
658 "stencil_out");
659 stencil_out->data.location = FRAG_RESULT_COLOR;
660
661 const struct glsl_type *sampler_type =
662 glsl_sampler_type(GLSL_SAMPLER_DIM_MS, false, false, GLSL_TYPE_UINT);
663 nir_variable *sampler = nir_variable_create(b.shader, nir_var_uniform,
664 sampler_type, "stencil_tex");
665 sampler->data.binding = 0;
666 sampler->data.explicit_binding = true;
667
668 nir_ssa_def *tex_deref = &nir_build_deref_var(&b, sampler)->dest.ssa;
669
670 nir_variable *pos_in = nir_variable_create(b.shader, nir_var_shader_in,
671 glsl_vec4_type(), "pos");
672 pos_in->data.location = VARYING_SLOT_POS; // VARYING_SLOT_VAR0?
673 nir_ssa_def *pos = nir_load_var(&b, pos_in);
674
675 nir_ssa_def *pos_src;
676
677 if (no_flip)
678 pos_src = pos;
679 else {
680 nir_tex_instr *txs = nir_tex_instr_create(b.shader, 1);
681 txs->op = nir_texop_txs;
682 txs->sampler_dim = GLSL_SAMPLER_DIM_MS;
683 txs->src[0].src_type = nir_tex_src_texture_deref;
684 txs->src[0].src = nir_src_for_ssa(tex_deref);
685 txs->is_array = false;
686 txs->dest_type = nir_type_int;
687
688 nir_ssa_dest_init(&txs->instr, &txs->dest, 2, 32, "tex");
689 nir_builder_instr_insert(&b, &txs->instr);
690
691 pos_src = nir_vec4(&b,
692 nir_channel(&b, pos, 0),
693 /*Height - pos_dest.y - 1*/
694 nir_fsub(&b,
695 nir_fsub(&b,
696 nir_channel(&b, nir_i2f32(&b, &txs->dest.ssa), 1),
697 nir_channel(&b, pos, 1)),
698 nir_imm_float(&b, 1.0)),
699 nir_channel(&b, pos, 2),
700 nir_channel(&b, pos, 3));
701 }
702
703 nir_tex_instr *tex = nir_tex_instr_create(b.shader, 3);
704 tex->sampler_dim = GLSL_SAMPLER_DIM_MS;
705 tex->op = nir_texop_txf_ms;
706 tex->src[0].src_type = nir_tex_src_coord;
707 tex->src[0].src = nir_src_for_ssa(nir_channels(&b, nir_f2i32(&b, pos_src), 0x3));
708 tex->src[1].src_type = nir_tex_src_ms_index;
709 tex->src[1].src = nir_src_for_ssa(nir_imm_int(&b, 0)); /* just use first sample */
710 tex->src[2].src_type = nir_tex_src_texture_deref;
711 tex->src[2].src = nir_src_for_ssa(tex_deref);
712 tex->dest_type = nir_type_uint32;
713 tex->is_array = false;
714 tex->coord_components = 2;
715
716 nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, "tex");
717 nir_builder_instr_insert(&b, &tex->instr);
718
719 nir_store_var(&b, stencil_out, nir_channel(&b, &tex->dest.ssa, 1), 0x1);
720
721 struct pipe_shader_state state = {};
722 state.type = PIPE_SHADER_IR_NIR;
723 state.ir.nir = b.shader;
724 void *result;
725 if (no_flip) {
726 result = ctx->base.create_fs_state(&ctx->base, &state);
727 ctx->stencil_resolve_fs_no_flip = result;
728 } else {
729 result = ctx->base.create_fs_state(&ctx->base, &state);
730 ctx->stencil_resolve_fs = result;
731 }
732
733 return result;
734 }
735
736 static void *
get_sampler_state(struct d3d12_context * ctx)737 get_sampler_state(struct d3d12_context *ctx)
738 {
739 if (ctx->sampler_state)
740 return ctx->sampler_state;
741
742 struct pipe_sampler_state state;
743 memset(&state, 0, sizeof(state));
744 state.wrap_s = PIPE_TEX_WRAP_CLAMP_TO_EDGE;
745 state.wrap_t = PIPE_TEX_WRAP_CLAMP_TO_EDGE;
746 state.wrap_r = PIPE_TEX_WRAP_CLAMP_TO_EDGE;
747 state.normalized_coords = 1;
748
749 return ctx->sampler_state = ctx->base.create_sampler_state(&ctx->base, &state);
750 }
751
752 static struct pipe_resource *
resolve_stencil_to_temp(struct d3d12_context * ctx,const struct pipe_blit_info * info)753 resolve_stencil_to_temp(struct d3d12_context *ctx,
754 const struct pipe_blit_info *info)
755 {
756 struct pipe_context *pctx = &ctx->base;
757 struct pipe_resource *tmp = create_tmp_resource(pctx->screen, info);
758 if (!tmp) {
759 debug_printf("D3D12: failed to create stencil-resolve temp-resource\n");
760 return NULL;
761 }
762 assert(tmp->nr_samples < 2);
763
764 /* resolve stencil into tmp */
765 struct pipe_surface dst_tmpl;
766 util_blitter_default_dst_texture(&dst_tmpl, tmp, 0, 0);
767 dst_tmpl.format = tmp->format;
768 struct pipe_surface *dst_surf = pctx->create_surface(pctx, tmp, &dst_tmpl);
769 if (!dst_surf) {
770 debug_printf("D3D12: failed to create stencil-resolve dst-surface\n");
771 return NULL;
772 }
773
774 struct pipe_sampler_view src_templ, *src_view;
775 util_blitter_default_src_texture(ctx->blitter, &src_templ,
776 info->src.resource, info->src.level);
777 src_templ.format = util_format_stencil_only(info->src.format);
778 src_view = pctx->create_sampler_view(pctx, info->src.resource, &src_templ);
779
780 void *sampler_state = get_sampler_state(ctx);
781
782 util_blit_save_state(ctx);
783 pctx->set_sampler_views(pctx, PIPE_SHADER_FRAGMENT, 0, 1, 0, false, &src_view);
784 pctx->bind_sampler_states(pctx, PIPE_SHADER_FRAGMENT, 0, 1, &sampler_state);
785 util_blitter_custom_shader(ctx->blitter, dst_surf,
786 get_stencil_resolve_vs(ctx),
787 get_stencil_resolve_fs(ctx, info->src.box.height == info->dst.box.height));
788 util_blitter_restore_textures(ctx->blitter);
789 pipe_surface_reference(&dst_surf, NULL);
790 pipe_sampler_view_reference(&src_view, NULL);
791 return tmp;
792 }
793
794 static void
blit_resolve_stencil(struct d3d12_context * ctx,const struct pipe_blit_info * info)795 blit_resolve_stencil(struct d3d12_context *ctx,
796 const struct pipe_blit_info *info)
797 {
798 assert(info->mask & PIPE_MASK_S);
799
800 if (D3D12_DEBUG_BLIT & d3d12_debug)
801 debug_printf("D3D12 BLIT: blit_resolve_stencil\n");
802
803 if (info->mask & PIPE_MASK_Z) {
804 /* resolve depth into dst */
805 struct pipe_blit_info new_info = *info;
806 new_info.mask = PIPE_MASK_Z;
807
808 if (resolve_supported(&new_info))
809 blit_resolve(ctx, &new_info);
810 else
811 util_blit(ctx, &new_info);
812 }
813
814 struct pipe_resource *tmp = resolve_stencil_to_temp(ctx, info);
815
816
817 /* copy resolved stencil into dst */
818 struct d3d12_resource *dst = d3d12_resource(info->dst.resource);
819 d3d12_transition_subresources_state(ctx, d3d12_resource(tmp),
820 0, 1, 0, 1, 0, 1,
821 D3D12_RESOURCE_STATE_COPY_SOURCE,
822 D3D12_BIND_INVALIDATE_NONE);
823 d3d12_transition_subresources_state(ctx, dst,
824 0, 1, 0, 1, 1, 1,
825 D3D12_RESOURCE_STATE_COPY_DEST,
826 D3D12_BIND_INVALIDATE_FULL);
827 d3d12_apply_resource_states(ctx);
828
829 struct d3d12_batch *batch = d3d12_current_batch(ctx);
830 d3d12_batch_reference_resource(batch, d3d12_resource(tmp));
831 d3d12_batch_reference_resource(batch, dst);
832
833 D3D12_BOX src_box;
834 src_box.left = src_box.top = src_box.front = 0;
835 src_box.right = tmp->width0;
836 src_box.bottom = tmp->height0;
837 src_box.back = tmp->depth0;
838
839 D3D12_TEXTURE_COPY_LOCATION src_loc;
840 src_loc.Type = D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX;
841 src_loc.SubresourceIndex = 0;
842 src_loc.pResource = d3d12_resource_resource(d3d12_resource(tmp));
843
844 D3D12_TEXTURE_COPY_LOCATION dst_loc;
845 dst_loc.Type = D3D12_TEXTURE_COPY_TYPE_SUBRESOURCE_INDEX;
846 dst_loc.SubresourceIndex = 1;
847 dst_loc.pResource = d3d12_resource_resource(dst);
848
849 ctx->cmdlist->CopyTextureRegion(&dst_loc, info->dst.box.x,
850 info->dst.box.y, info->dst.box.z,
851 &src_loc, &src_box);
852
853 pipe_resource_reference(&tmp, NULL);
854 }
855
856 static bool
replicate_stencil_supported(struct d3d12_context * ctx,const struct pipe_blit_info * info)857 replicate_stencil_supported(struct d3d12_context *ctx,
858 const struct pipe_blit_info *info)
859 {
860 if (!util_format_is_depth_or_stencil(info->src.format) ||
861 !(info->mask & PIPE_MASK_S))
862 return false;
863
864 if (info->mask & PIPE_MASK_Z) {
865 struct pipe_blit_info new_info = *info;
866 new_info.mask = PIPE_MASK_Z;
867 if (!util_blitter_is_blit_supported(ctx->blitter, &new_info))
868 return false;
869 }
870
871 return true;
872 }
873
874 static void
blit_replicate_stencil(struct d3d12_context * ctx,const struct pipe_blit_info * info)875 blit_replicate_stencil(struct d3d12_context *ctx,
876 const struct pipe_blit_info *info)
877 {
878 assert(info->mask & PIPE_MASK_S);
879
880 if (D3D12_DEBUG_BLIT & d3d12_debug)
881 debug_printf("D3D12 BLIT: blit_replicate_stencil\n");
882
883 if (info->mask & PIPE_MASK_Z) {
884 /* resolve depth into dst */
885 struct pipe_blit_info new_info = *info;
886 new_info.mask = PIPE_MASK_Z;
887 util_blit(ctx, &new_info);
888 }
889
890 util_blit_save_state(ctx);
891 util_blitter_stencil_fallback(ctx->blitter, info->dst.resource,
892 info->dst.level,
893 &info->dst.box,
894 info->src.resource,
895 info->src.level,
896 &info->src.box,
897 info->scissor_enable ? &info->scissor : NULL);
898 }
899
900 void
d3d12_blit(struct pipe_context * pctx,const struct pipe_blit_info * info)901 d3d12_blit(struct pipe_context *pctx,
902 const struct pipe_blit_info *info)
903 {
904 struct d3d12_context *ctx = d3d12_context(pctx);
905
906 if (!info->render_condition_enable && ctx->current_predication) {
907 if (D3D12_DEBUG_BLIT & d3d12_debug)
908 debug_printf("D3D12 BLIT: Disable predication\n");
909 ctx->cmdlist->SetPredication(nullptr, 0, D3D12_PREDICATION_OP_EQUAL_ZERO);
910 }
911
912 if (D3D12_DEBUG_BLIT & d3d12_debug) {
913 debug_printf("D3D12 BLIT: from %s@%d msaa:%d %dx%dx%d + %dx%dx%d\n",
914 util_format_name(info->src.format), info->src.level,
915 info->src.resource->nr_samples,
916 info->src.box.x, info->src.box.y, info->src.box.z,
917 info->src.box.width, info->src.box.height, info->src.box.depth);
918 debug_printf(" to %s@%d msaa:%d %dx%dx%d + %dx%dx%d ",
919 util_format_name(info->dst.format), info->dst.level,
920 info->dst.resource->nr_samples,
921 info->dst.box.x, info->dst.box.y, info->dst.box.z,
922 info->dst.box.width, info->dst.box.height, info->dst.box.depth);
923 debug_printf("| flags %s%s%s\n",
924 info->render_condition_enable ? "cond " : "",
925 info->scissor_enable ? "scissor " : "",
926 info->alpha_blend ? "blend" : "");
927 }
928
929 if (is_same_resource(info))
930 blit_same_resource(ctx, info);
931 else if (is_resolve(info)) {
932 if (resolve_supported(info))
933 blit_resolve(ctx, info);
934 else if (util_blitter_is_blit_supported(ctx->blitter, info))
935 util_blit(ctx, info);
936 else if (resolve_stencil_supported(ctx, info))
937 blit_resolve_stencil(ctx, info);
938 else
939 debug_printf("D3D12: resolve unsupported %s -> %s\n",
940 util_format_short_name(info->src.resource->format),
941 util_format_short_name(info->dst.resource->format));
942 } else if (direct_copy_supported(d3d12_screen(pctx->screen), info,
943 ctx->current_predication != nullptr))
944 d3d12_direct_copy(ctx, d3d12_resource(info->dst.resource),
945 info->dst.level, &info->dst.box,
946 d3d12_resource(info->src.resource),
947 info->src.level, &info->src.box, info->mask);
948 else if (util_blitter_is_blit_supported(ctx->blitter, info))
949 util_blit(ctx, info);
950 else if (replicate_stencil_supported(ctx, info))
951 blit_replicate_stencil(ctx, info);
952 else
953 debug_printf("D3D12: blit unsupported %s -> %s\n",
954 util_format_short_name(info->src.resource->format),
955 util_format_short_name(info->dst.resource->format));
956
957 if (!info->render_condition_enable && ctx->current_predication) {
958 ctx->cmdlist->SetPredication(
959 d3d12_resource_resource(ctx->current_predication), 0, D3D12_PREDICATION_OP_EQUAL_ZERO);
960 if (D3D12_DEBUG_BLIT & d3d12_debug)
961 debug_printf("D3D12 BLIT: Re-enable predication\n");
962 }
963
964 }
965
966 static void
d3d12_resource_copy_region(struct pipe_context * pctx,struct pipe_resource * pdst,unsigned dst_level,unsigned dstx,unsigned dsty,unsigned dstz,struct pipe_resource * psrc,unsigned src_level,const struct pipe_box * psrc_box)967 d3d12_resource_copy_region(struct pipe_context *pctx,
968 struct pipe_resource *pdst,
969 unsigned dst_level,
970 unsigned dstx, unsigned dsty, unsigned dstz,
971 struct pipe_resource *psrc,
972 unsigned src_level,
973 const struct pipe_box *psrc_box)
974 {
975 struct d3d12_context *ctx = d3d12_context(pctx);
976 struct d3d12_resource *dst = d3d12_resource(pdst);
977 struct d3d12_resource *src = d3d12_resource(psrc);
978 struct pipe_resource *staging_res = NULL;
979 const struct pipe_box *src_box = psrc_box;
980 struct pipe_box staging_box, dst_box;
981
982 if (D3D12_DEBUG_BLIT & d3d12_debug) {
983 debug_printf("D3D12 COPY: from %s@%d msaa:%d mips:%d %dx%dx%d + %dx%dx%d\n",
984 util_format_name(psrc->format), src_level, psrc->nr_samples,
985 psrc->last_level,
986 psrc_box->x, psrc_box->y, psrc_box->z,
987 psrc_box->width, psrc_box->height, psrc_box->depth);
988 debug_printf(" to %s@%d msaa:%d mips:%d %dx%dx%d\n",
989 util_format_name(pdst->format), dst_level, psrc->nr_samples,
990 psrc->last_level, dstx, dsty, dstz);
991 }
992
993 /* Use an intermediate resource if copying from/to the same subresource */
994 if (d3d12_resource_resource(dst) == d3d12_resource_resource(src) && dst_level == src_level) {
995 staging_res = create_staging_resource(ctx, src, src_level, psrc_box, &staging_box, PIPE_MASK_RGBAZS);
996 src = d3d12_resource(staging_res);
997 src_level = 0;
998 src_box = &staging_box;
999 }
1000
1001 dst_box.x = dstx;
1002 dst_box.y = dsty;
1003 dst_box.z = dstz;
1004 dst_box.width = psrc_box->width;
1005 dst_box.height = psrc_box->height;
1006
1007 d3d12_direct_copy(ctx, dst, dst_level, &dst_box,
1008 src, src_level, src_box, PIPE_MASK_RGBAZS);
1009
1010 if (staging_res)
1011 pipe_resource_reference(&staging_res, NULL);
1012 }
1013
1014 void
d3d12_context_blit_init(struct pipe_context * ctx)1015 d3d12_context_blit_init(struct pipe_context *ctx)
1016 {
1017 ctx->resource_copy_region = d3d12_resource_copy_region;
1018 ctx->blit = d3d12_blit;
1019 }
1020