/*
 * Copyright © Microsoft Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

#include "d3d12_screen.h"

#include "d3d12_bufmgr.h"
#include "d3d12_compiler.h"
#include "d3d12_context.h"
#include "d3d12_debug.h"
#include "d3d12_fence.h"
#ifdef HAVE_GALLIUM_D3D12_VIDEO
#include "d3d12_video_screen.h"
#endif
#include "d3d12_format.h"
#include "d3d12_residency.h"
#include "d3d12_resource.h"
#include "d3d12_nir_passes.h"

#include "pipebuffer/pb_bufmgr.h"
#include "util/debug.h"
#include "util/u_math.h"
#include "util/u_memory.h"
#include "util/u_screen.h"
#include "util/u_dl.h"
#include "util/mesa-sha1.h"

#include "nir.h"
#include "frontend/sw_winsys.h"

#include "nir_to_dxil.h"
#include "git_sha1.h"

/* NOTE(review): the header names of the next two directives are missing in
 * this copy of the file; restore them from the upstream source. */
#include
#include

static GUID OpenGLOn12CreatorID = { 0x6bb3cd34, 0x0d19, 0x45ab, 0x97, 0xed, 0xd7, 0x20, 0xba, 0x3d, 0xfc, 0x80 };

/* Flag names accepted in the D3D12_DEBUG environment option. */
static const struct debug_named_value
d3d12_debug_options[] = {
   { "verbose",      D3D12_DEBUG_VERBOSE,       NULL },
   { "blit",         D3D12_DEBUG_BLIT,          "Trace blit and copy resource calls" },
   { "experimental", D3D12_DEBUG_EXPERIMENTAL,  "Enable experimental shader models feature" },
   { "dxil",         D3D12_DEBUG_DXIL,          "Dump DXIL during program compile" },
   { "disass",       D3D12_DEBUG_DISASS,        "Dump disassambly of created DXIL shader" },
   { "res",          D3D12_DEBUG_RESOURCE,      "Debug resources" },
   { "debuglayer",   D3D12_DEBUG_DEBUG_LAYER,   "Enable debug layer" },
   { "gpuvalidator", D3D12_DEBUG_GPU_VALIDATOR, "Enable GPU validator" },
   DEBUG_NAMED_VALUE_END
};

DEBUG_GET_ONCE_FLAGS_OPTION(d3d12_debug, "D3D12_DEBUG", d3d12_debug_options, 0)

uint32_t
d3d12_debug;

/* PCI vendor ids compared against d3d12_screen::vendor_id. */
enum {
   HW_VENDOR_AMD                   = 0x1002,
   HW_VENDOR_INTEL                 = 0x8086,
   HW_VENDOR_MICROSOFT             = 0x1414,
   HW_VENDOR_NVIDIA                = 0x10de,
};

/* pipe_screen::get_vendor: always reports the driver vendor string. */
static const char *
d3d12_get_vendor(struct pipe_screen *pscreen)
{
   return "Microsoft Corporation";
}

/* pipe_screen::get_device_vendor: maps the screen's vendor id to a name,
 * or "Unknown" for ids not listed in the enum above. */
static const char *
d3d12_get_device_vendor(struct pipe_screen *pscreen)
{
   struct d3d12_screen* screen = d3d12_screen(pscreen);

   switch (screen->vendor_id) {
   case HW_VENDOR_MICROSOFT:
      return "Microsoft";
   case HW_VENDOR_AMD:
      return "AMD";
   case HW_VENDOR_NVIDIA:
      return "NVIDIA";
   case HW_VENDOR_INTEL:
      return "Intel";
   default:
      return "Unknown";
   }
}

/* Returns the screen's memory_size_megabytes field. */
static int
d3d12_get_video_mem(struct pipe_screen *pscreen)
{
   struct d3d12_screen* screen = d3d12_screen(pscreen);

   return screen->memory_size_megabytes;
}

/* pipe_screen::get_param: answers integer capability queries. Caps that are
 * not listed here fall through to u_pipe_screen_get_param_defaults(). */
static int
d3d12_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
{
   struct d3d12_screen *screen = d3d12_screen(pscreen);

   switch (param) {
   case PIPE_CAP_NPOT_TEXTURES:
      return 1;

   case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
      /* D3D12 only supports dual-source blending for a single
       * render-target. From the D3D11 functional spec (which also defines
       * this for D3D12):
       *
       * "When Dual Source Color Blending is enabled, the Pixel Shader must
       *  have only a single RenderTarget bound, at slot 0, and must output
       *  both o0 and o1. Writing to other outputs (o2, o3 etc.) produces
       *  undefined results for the corresponding RenderTargets, if bound
       *  illegally."
       *
       * Source: https://microsoft.github.io/DirectX-Specs/d3d/archive/D3D11_3_FunctionalSpec.htm#17.6%20Dual%20Source%20Color%20Blending
       */
      return 1;

   case PIPE_CAP_ANISOTROPIC_FILTER:
      return 1;

   case PIPE_CAP_MAX_RENDER_TARGETS:
      return D3D12_SIMULTANEOUS_RENDER_TARGET_COUNT;

   case PIPE_CAP_TEXTURE_SWIZZLE:
      return 1;

   case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
      return D3D12_REQ_TEXTURE2D_U_OR_V_DIMENSION;

   case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
      return 11; // D3D12_REQ_TEXTURE3D_U_V_OR_W_DIMENSION == 2^10

   case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
      return D3D12_REQ_MIP_LEVELS;

   case PIPE_CAP_PRIMITIVE_RESTART:
   case PIPE_CAP_INDEP_BLEND_ENABLE:
   case PIPE_CAP_INDEP_BLEND_FUNC:
   case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
   case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
   case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
   case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
   case PIPE_CAP_RGB_OVERRIDE_DST_ALPHA_BLEND:
   case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
      return 1;

   /* We need to do some lowering that requires a link to the sampler */
   case PIPE_CAP_NIR_SAMPLERS_AS_DEREF:
      return 1;

   case PIPE_CAP_NIR_IMAGES_AS_DEREF:
      return 1;

   case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
      /* Divide by 6 because this also applies to cubemaps */
      return D3D12_REQ_TEXTURE2D_ARRAY_AXIS_DIMENSION / 6;

   case PIPE_CAP_DEPTH_CLIP_DISABLE:
      return 1;

   case PIPE_CAP_TGSI_TEXCOORD:
      return 1;

   case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
      return 1;

   case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
      return 1;

   case PIPE_CAP_GLSL_FEATURE_LEVEL:
      return 420;
   case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
      return 420;
   case PIPE_CAP_ESSL_FEATURE_LEVEL:
      return 310;

   case PIPE_CAP_COMPUTE:
      return 1;

   case PIPE_CAP_TEXTURE_MULTISAMPLE:
      return 1;

   case PIPE_CAP_CUBE_MAP_ARRAY:
      return 1;

   case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
      return 1;

   case PIPE_CAP_TEXTURE_TRANSFER_MODES:
      return 0; /* unsure */

   case PIPE_CAP_ENDIANNESS:
      return PIPE_ENDIAN_NATIVE; /* unsure */

   case PIPE_CAP_MAX_VIEWPORTS:
      return D3D12_VIEWPORT_AND_SCISSORRECT_OBJECT_COUNT_PER_PIPELINE;

   case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
      return 1;

   case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
      return 4;

   case PIPE_CAP_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
   case PIPE_CAP_FS_COORD_ORIGIN_UPPER_LEFT:
      return 1;

   case PIPE_CAP_FS_FACE_IS_INTEGER_SYSVAL:
      return 1;

   case PIPE_CAP_ACCELERATED:
      return screen->vendor_id != HW_VENDOR_MICROSOFT;

   case PIPE_CAP_VIDEO_MEMORY:
      return d3d12_get_video_mem(pscreen);

   case PIPE_CAP_UMA:
      return screen->architecture.UMA;

   case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
      return 2048; /* FIXME: no clue how to query this */

   case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
   case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
      return 1;

   case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
      return D3D12_RAW_UAV_SRV_BYTE_ALIGNMENT;

   case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
      return D3D12_CONSTANT_BUFFER_DATA_PLACEMENT_ALIGNMENT;

   case PIPE_CAP_PCI_GROUP:
   case PIPE_CAP_PCI_BUS:
   case PIPE_CAP_PCI_DEVICE:
   case PIPE_CAP_PCI_FUNCTION:
      return 0; /* TODO: figure these out */

   case PIPE_CAP_FLATSHADE:
   case PIPE_CAP_ALPHA_TEST:
   case PIPE_CAP_TWO_SIDED_COLOR:
   case PIPE_CAP_CLIP_PLANES:
      return 0;

   case PIPE_CAP_SHADER_STENCIL_EXPORT:
      return screen->opts.PSSpecifiedStencilRefSupported;

   case PIPE_CAP_SEAMLESS_CUBE_MAP:
   case PIPE_CAP_TEXTURE_QUERY_LOD:
   case PIPE_CAP_VS_INSTANCEID:
   case PIPE_CAP_TGSI_TEX_TXF_LZ:
   case PIPE_CAP_OCCLUSION_QUERY:
   case PIPE_CAP_POINT_SPRITE:
   case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:
   case PIPE_CAP_PSIZ_CLAMPED:
   case PIPE_CAP_BLEND_EQUATION_SEPARATE:
   case PIPE_CAP_CONDITIONAL_RENDER:
   case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
   case PIPE_CAP_QUERY_TIMESTAMP:
   case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
   case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
   case PIPE_CAP_IMAGE_STORE_FORMATTED:
   case PIPE_CAP_GLSL_TESS_LEVELS_AS_INPUTS:
      return 1;

   case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
      return D3D12_SO_BUFFER_SLOT_COUNT;

   case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
   case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
      return D3D12_SO_OUTPUT_COMPONENT_COUNT;

   /* Geometry shader output. */
   case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
      return D3D12_GS_MAX_OUTPUT_VERTEX_COUNT_ACROSS_INSTANCES;
   case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
      return D3D12_REQ_GS_INVOCATION_32BIT_OUTPUT_COMPONENT_LIMIT;

   case PIPE_CAP_MAX_VARYINGS:
      /* Subtract one so that implicit position can be added */
      return D3D12_PS_INPUT_REGISTER_COUNT - 1;

   case PIPE_CAP_NIR_COMPACT_ARRAYS:
      return 1;

   case PIPE_CAP_MAX_COMBINED_SHADER_OUTPUT_RESOURCES:
      if (screen->max_feature_level <= D3D_FEATURE_LEVEL_11_0)
         return D3D12_PS_CS_UAV_REGISTER_COUNT;
      if (screen->opts.ResourceBindingTier <= D3D12_RESOURCE_BINDING_TIER_2)
         return D3D12_UAV_SLOT_COUNT;
      return 0;

   case PIPE_CAP_START_INSTANCE:
   case PIPE_CAP_DRAW_PARAMETERS:
   case PIPE_CAP_DRAW_INDIRECT:
   case PIPE_CAP_MULTI_DRAW_INDIRECT:
   case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
   case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
   case PIPE_CAP_SAMPLE_SHADING:
   case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
   case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
   case PIPE_CAP_INT64:
   case PIPE_CAP_INT64_DIVMOD:
   case PIPE_CAP_DOUBLES:
   case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
   case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
   case PIPE_CAP_MEMOBJ:
   case PIPE_CAP_FENCE_SIGNAL:
   case PIPE_CAP_TIMELINE_SEMAPHORE_IMPORT:
   case PIPE_CAP_CLIP_HALFZ:
      return 1;

   case PIPE_CAP_MAX_VERTEX_STREAMS:
      return D3D12_SO_BUFFER_SLOT_COUNT;

   case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
      /* This is asking about varyings, not total registers, so remove the 2 tess factor registers. */
      return D3D12_HS_OUTPUT_PATCH_CONSTANT_REGISTER_COUNT - 2;

   default:
      return u_pipe_screen_get_param_defaults(pscreen, param);
   }
}

/* pipe_screen::get_paramf: answers floating-point capability queries.
 * An unlisted cap hits unreachable(). */
static float
d3d12_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
{
   switch (param) {
   case PIPE_CAPF_MIN_LINE_WIDTH:
   case PIPE_CAPF_MIN_LINE_WIDTH_AA:
   case PIPE_CAPF_MIN_POINT_SIZE:
   case PIPE_CAPF_MIN_POINT_SIZE_AA:
      return 1;

   case PIPE_CAPF_POINT_SIZE_GRANULARITY:
   case PIPE_CAPF_LINE_WIDTH_GRANULARITY:
      return 0.1;

   case PIPE_CAPF_MAX_LINE_WIDTH:
   case PIPE_CAPF_MAX_LINE_WIDTH_AA:
      return 1.0f; /* no clue */

   case PIPE_CAPF_MAX_POINT_SIZE:
   case PIPE_CAPF_MAX_POINT_SIZE_AA:
      return D3D12_MAX_POINT_SIZE;

   case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
      return D3D12_MAX_MAXANISOTROPY;

   case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
      return 15.99f;

   case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
   case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
   case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
      return 0.0f; /* not implemented */

   default:
      unreachable("unknown pipe_capf");
   }

   return 0.0;
}

/* pipe_screen::get_shader_param: answers per-shader-stage capability
 * queries. Unlisted caps return 0. */
static int
d3d12_get_shader_param(struct pipe_screen *pscreen,
                       enum pipe_shader_type shader,
                       enum pipe_shader_cap param)
{
   struct d3d12_screen *screen = d3d12_screen(pscreen);

   switch (param) {
   case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
   case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
   case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
   case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
   case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
      /* The unreachable "return 0;" that used to follow was removed. */
      return INT_MAX;

   case PIPE_SHADER_CAP_MAX_INPUTS:
      switch (shader) {
      case PIPE_SHADER_VERTEX: return D3D12_VS_INPUT_REGISTER_COUNT;
      case PIPE_SHADER_FRAGMENT: return D3D12_PS_INPUT_REGISTER_COUNT;
      case PIPE_SHADER_GEOMETRY: return D3D12_GS_INPUT_REGISTER_COUNT;
      case PIPE_SHADER_TESS_CTRL: return D3D12_HS_CONTROL_POINT_PHASE_INPUT_REGISTER_COUNT;
      case PIPE_SHADER_TESS_EVAL: return D3D12_DS_INPUT_CONTROL_POINT_REGISTER_COUNT;
      case PIPE_SHADER_COMPUTE: return 0;
      default: unreachable("Unexpected shader");
      }
      break;

   case PIPE_SHADER_CAP_MAX_OUTPUTS:
      switch (shader) {
      case PIPE_SHADER_VERTEX: return D3D12_VS_OUTPUT_REGISTER_COUNT;
      case PIPE_SHADER_FRAGMENT: return D3D12_PS_OUTPUT_REGISTER_COUNT;
      case PIPE_SHADER_GEOMETRY: return D3D12_GS_OUTPUT_REGISTER_COUNT;
      case PIPE_SHADER_TESS_CTRL: return D3D12_HS_CONTROL_POINT_PHASE_OUTPUT_REGISTER_COUNT;
      case PIPE_SHADER_TESS_EVAL: return D3D12_DS_OUTPUT_REGISTER_COUNT;
      case PIPE_SHADER_COMPUTE: return 0;
      default: unreachable("Unexpected shader");
      }
      break;

   case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
      if (screen->opts.ResourceBindingTier == D3D12_RESOURCE_BINDING_TIER_1)
         return 16;
      return PIPE_MAX_SAMPLERS;

   case PIPE_SHADER_CAP_MAX_CONST_BUFFER0_SIZE:
      return 65536;

   case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
      return 13; /* 15 - 2 for lowered uniforms and state vars*/

   case PIPE_SHADER_CAP_MAX_TEMPS:
      return INT_MAX;

   case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
   case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
   case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
   case PIPE_SHADER_CAP_SUBROUTINES:
      return 0; /* not implemented */

   case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
   case PIPE_SHADER_CAP_INTEGERS:
      return 1;

   case PIPE_SHADER_CAP_INT64_ATOMICS:
   case PIPE_SHADER_CAP_FP16:
      return 0; /* not implemented */

   case PIPE_SHADER_CAP_PREFERRED_IR:
      return PIPE_SHADER_IR_NIR;

   case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
      return 0; /* not implemented */

   case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
      /* Note: This is wrong, but this is the max value that
       * TC can support to avoid overflowing an array.
       */
      return PIPE_MAX_SAMPLERS;

   case PIPE_SHADER_CAP_DROUND_SUPPORTED:
   case PIPE_SHADER_CAP_DFRACEXP_DLDEXP_SUPPORTED:
      return 0; /* not implemented */

   case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
      return 0; /* no idea */

   case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
      return
         (screen->max_feature_level >= D3D_FEATURE_LEVEL_11_1 ||
          screen->opts.ResourceBindingTier >= D3D12_RESOURCE_BINDING_TIER_3) ?
         PIPE_MAX_SHADER_BUFFERS : D3D12_PS_CS_UAV_REGISTER_COUNT;

   case PIPE_SHADER_CAP_SUPPORTED_IRS:
      return 1 << PIPE_SHADER_IR_NIR;

   case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
      if (!screen->support_shader_images)
         return 0;
      return
         (screen->max_feature_level >= D3D_FEATURE_LEVEL_11_1 ||
          screen->opts.ResourceBindingTier >= D3D12_RESOURCE_BINDING_TIER_3) ?
         PIPE_MAX_SHADER_IMAGES : D3D12_PS_CS_UAV_REGISTER_COUNT;

   case PIPE_SHADER_CAP_LDEXP_SUPPORTED:
   case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
   case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
   case PIPE_SHADER_CAP_CONT_SUPPORTED:
      return 0; /* not implemented */
   }

   /* should only get here on unhandled cases */
   return 0;
}

/* pipe_screen::get_compute_param: writes the requested compute limit into
 * *ret as one or three uint64_t values and returns the number of bytes
 * written, or 0 for caps that are not handled. ret is written
 * unconditionally for the handled caps. */
static int
d3d12_get_compute_param(struct pipe_screen *pscreen,
                        enum pipe_shader_ir ir,
                        enum pipe_compute_cap cap,
                        void *ret)
{
   switch (cap) {
   case PIPE_COMPUTE_CAP_MAX_GRID_SIZE: {
      uint64_t *grid = (uint64_t *)ret;
      grid[0] = grid[1] = grid[2] = D3D12_CS_DISPATCH_MAX_THREAD_GROUPS_PER_DIMENSION;
      return sizeof(uint64_t) * 3;
   }
   case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE: {
      uint64_t *block = (uint64_t *)ret;
      block[0] = D3D12_CS_THREAD_GROUP_MAX_X;
      block[1] = D3D12_CS_THREAD_GROUP_MAX_Y;
      block[2] = D3D12_CS_THREAD_GROUP_MAX_Z;
      return sizeof(uint64_t) * 3;
   }
   case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
   case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
      *(uint64_t *)ret = D3D12_CS_THREAD_GROUP_MAX_THREADS_PER_GROUP;
      return sizeof(uint64_t);
   case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
      *(uint64_t *)ret = D3D12_CS_TGSM_REGISTER_COUNT /*DWORDs*/ * 4;
      return sizeof(uint64_t);
   default:
      return 0;
   }
}

static bool
d3d12_is_format_supported(struct pipe_screen *pscreen, enum pipe_format format, enum pipe_texture_target target, unsigned sample_count, unsigned storage_sample_count, unsigned bind) { struct d3d12_screen *screen = d3d12_screen(pscreen); if (MAX2(1, sample_count) != MAX2(1, storage_sample_count)) return false; if (target == PIPE_BUFFER) { /* Replace emulated vertex element formats for the tests */ format = d3d12_emulated_vtx_format(format); } else { /* Allow 3-comp 32 bit formats only for BOs (needed for ARB_tbo_rgb32) */ if ((format == PIPE_FORMAT_R32G32B32_FLOAT || format == PIPE_FORMAT_R32G32B32_SINT || format == PIPE_FORMAT_R32G32B32_UINT)) return false; } /* Don't advertise alpha/luminance_alpha formats because they can't be used * for render targets (except A8_UNORM) and can't be emulated by R/RG formats. * Let the state tracker choose an RGBA format instead. For YUV formats, we * want the state tracker to lower these to individual planes. */ if (format != PIPE_FORMAT_A8_UNORM && (util_format_is_alpha(format) || util_format_is_luminance_alpha(format) || util_format_is_yuv(format))) return false; if (format == PIPE_FORMAT_NONE) { /* For UAV-only rendering, aka ARB_framebuffer_no_attachments */ switch (sample_count) { case 0: case 1: case 4: case 8: case 16: return true; default: return false; } } DXGI_FORMAT dxgi_format = d3d12_get_format(format); if (dxgi_format == DXGI_FORMAT_UNKNOWN) return false; enum D3D12_FORMAT_SUPPORT1 dim_support = D3D12_FORMAT_SUPPORT1_NONE; switch (target) { case PIPE_TEXTURE_1D: case PIPE_TEXTURE_1D_ARRAY: dim_support = D3D12_FORMAT_SUPPORT1_TEXTURE1D; break; case PIPE_TEXTURE_2D: case PIPE_TEXTURE_RECT: case PIPE_TEXTURE_2D_ARRAY: dim_support = D3D12_FORMAT_SUPPORT1_TEXTURE2D; break; case PIPE_TEXTURE_3D: dim_support = D3D12_FORMAT_SUPPORT1_TEXTURE3D; break; case PIPE_TEXTURE_CUBE: case PIPE_TEXTURE_CUBE_ARRAY: dim_support = D3D12_FORMAT_SUPPORT1_TEXTURECUBE; break; case PIPE_BUFFER: dim_support = D3D12_FORMAT_SUPPORT1_BUFFER; 
break; default: unreachable("Unknown target"); } D3D12_FEATURE_DATA_FORMAT_SUPPORT fmt_info; fmt_info.Format = d3d12_get_resource_rt_format(format); if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_FORMAT_SUPPORT, &fmt_info, sizeof(fmt_info)))) return false; if (!(fmt_info.Support1 & dim_support)) return false; if (target == PIPE_BUFFER) { if (bind & PIPE_BIND_VERTEX_BUFFER && !(fmt_info.Support1 & D3D12_FORMAT_SUPPORT1_IA_VERTEX_BUFFER)) return false; if (bind & PIPE_BIND_INDEX_BUFFER) { if (format != PIPE_FORMAT_R16_UINT && format != PIPE_FORMAT_R32_UINT) return false; } if (sample_count > 0) return false; } else { /* all other targets are texture-targets */ if (bind & PIPE_BIND_RENDER_TARGET && !(fmt_info.Support1 & D3D12_FORMAT_SUPPORT1_RENDER_TARGET)) return false; if (bind & PIPE_BIND_BLENDABLE && !(fmt_info.Support1 & D3D12_FORMAT_SUPPORT1_BLENDABLE)) return false; if (bind & PIPE_BIND_SHADER_IMAGE && (fmt_info.Support2 & (D3D12_FORMAT_SUPPORT2_UAV_TYPED_LOAD | D3D12_FORMAT_SUPPORT2_UAV_TYPED_STORE)) != (D3D12_FORMAT_SUPPORT2_UAV_TYPED_LOAD | D3D12_FORMAT_SUPPORT2_UAV_TYPED_STORE)) return false; D3D12_FEATURE_DATA_FORMAT_SUPPORT fmt_info_sv; if (util_format_is_depth_or_stencil(format)) { fmt_info_sv.Format = d3d12_get_resource_srv_format(format, target); if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_FORMAT_SUPPORT, &fmt_info_sv, sizeof(fmt_info_sv)))) return false; } else fmt_info_sv = fmt_info; #ifdef _WIN32 if (bind & PIPE_BIND_DISPLAY_TARGET && (!(fmt_info.Support1 & D3D12_FORMAT_SUPPORT1_DISPLAY) || // Disable formats that don't support flip model dxgi_format == DXGI_FORMAT_B8G8R8X8_UNORM || dxgi_format == DXGI_FORMAT_B5G5R5A1_UNORM || dxgi_format == DXGI_FORMAT_B5G6R5_UNORM || dxgi_format == DXGI_FORMAT_B4G4R4A4_UNORM)) return false; #endif if (bind & PIPE_BIND_DEPTH_STENCIL && !(fmt_info.Support1 & D3D12_FORMAT_SUPPORT1_DEPTH_STENCIL)) return false; if (sample_count > 0) { if (!(fmt_info_sv.Support1 & 
D3D12_FORMAT_SUPPORT1_MULTISAMPLE_LOAD)) return false; if (!util_is_power_of_two_nonzero(sample_count)) return false; if (bind & PIPE_BIND_SHADER_IMAGE) return false; D3D12_FEATURE_DATA_MULTISAMPLE_QUALITY_LEVELS ms_info = {}; ms_info.Format = dxgi_format; ms_info.SampleCount = sample_count; if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_MULTISAMPLE_QUALITY_LEVELS, &ms_info, sizeof(ms_info))) || !ms_info.NumQualityLevels) return false; } } return true; } void d3d12_deinit_screen(struct d3d12_screen *screen) { if (screen->rtv_pool) { d3d12_descriptor_pool_free(screen->rtv_pool); screen->rtv_pool = nullptr; } if (screen->dsv_pool) { d3d12_descriptor_pool_free(screen->dsv_pool); screen->dsv_pool = nullptr; } if (screen->view_pool) { d3d12_descriptor_pool_free(screen->view_pool); screen->view_pool = nullptr; } if (screen->readback_slab_bufmgr) { screen->readback_slab_bufmgr->destroy(screen->readback_slab_bufmgr); screen->readback_slab_bufmgr = nullptr; } if (screen->slab_bufmgr) { screen->slab_bufmgr->destroy(screen->slab_bufmgr); screen->slab_bufmgr = nullptr; } if (screen->cache_bufmgr) { screen->cache_bufmgr->destroy(screen->cache_bufmgr); screen->cache_bufmgr = nullptr; } if (screen->bufmgr) { screen->bufmgr->destroy(screen->bufmgr); screen->bufmgr = nullptr; } d3d12_deinit_residency(screen); if (screen->fence) { screen->fence->Release(); screen->fence = nullptr; } if (screen->cmdqueue) { screen->cmdqueue->Release(); screen->cmdqueue = nullptr; } if (screen->dev) { screen->dev->Release(); screen->dev = nullptr; } } void d3d12_destroy_screen(struct d3d12_screen *screen) { slab_destroy_parent(&screen->transfer_pool); mtx_destroy(&screen->submit_mutex); mtx_destroy(&screen->descriptor_pool_mutex); glsl_type_singleton_decref(); FREE(screen); } static void d3d12_flush_frontbuffer(struct pipe_screen * pscreen, struct pipe_context *pctx, struct pipe_resource *pres, unsigned level, unsigned layer, void *winsys_drawable_handle, struct pipe_box *sub_box) { struct 
d3d12_screen *screen = d3d12_screen(pscreen); struct sw_winsys *winsys = screen->winsys; struct d3d12_resource *res = d3d12_resource(pres); if (!winsys || !pctx) return; assert(res->dt); void *map = winsys->displaytarget_map(winsys, res->dt, 0); if (map) { pctx = threaded_context_unwrap_sync(pctx); pipe_transfer *transfer = nullptr; void *res_map = pipe_texture_map(pctx, pres, level, layer, PIPE_MAP_READ, 0, 0, u_minify(pres->width0, level), u_minify(pres->height0, level), &transfer); if (res_map) { util_copy_rect((ubyte*)map, pres->format, res->dt_stride, 0, 0, transfer->box.width, transfer->box.height, (const ubyte*)res_map, transfer->stride, 0, 0); pipe_texture_unmap(pctx, transfer); } winsys->displaytarget_unmap(winsys, res->dt); } #ifdef _WIN32 // WindowFromDC is Windows-only, and this method requires an HWND, so only use it on Windows ID3D12SharingContract *sharing_contract; if (SUCCEEDED(screen->cmdqueue->QueryInterface(IID_PPV_ARGS(&sharing_contract)))) { ID3D12Resource *d3d12_res = d3d12_resource_resource(res); sharing_contract->Present(d3d12_res, 0, WindowFromDC((HDC)winsys_drawable_handle)); } #endif winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box); } static ID3D12Debug * get_debug_interface() { typedef HRESULT(WINAPI *PFN_D3D12_GET_DEBUG_INTERFACE)(REFIID riid, void **ppFactory); PFN_D3D12_GET_DEBUG_INTERFACE D3D12GetDebugInterface; util_dl_library *d3d12_mod = util_dl_open(UTIL_DL_PREFIX "d3d12" UTIL_DL_EXT); if (!d3d12_mod) { debug_printf("D3D12: failed to load D3D12.DLL\n"); return NULL; } D3D12GetDebugInterface = (PFN_D3D12_GET_DEBUG_INTERFACE)util_dl_get_proc_address(d3d12_mod, "D3D12GetDebugInterface"); if (!D3D12GetDebugInterface) { debug_printf("D3D12: failed to load D3D12GetDebugInterface from D3D12.DLL\n"); return NULL; } ID3D12Debug *debug; if (FAILED(D3D12GetDebugInterface(IID_PPV_ARGS(&debug)))) { debug_printf("D3D12: D3D12GetDebugInterface failed\n"); return NULL; } return debug; } static void 
enable_d3d12_debug_layer() { ID3D12Debug *debug = get_debug_interface(); if (debug) { debug->EnableDebugLayer(); debug->Release(); } } static void enable_gpu_validation() { ID3D12Debug *debug = get_debug_interface(); ID3D12Debug3 *debug3; if (debug) { if (SUCCEEDED(debug->QueryInterface(IID_PPV_ARGS(&debug3)))) { debug3->SetEnableGPUBasedValidation(true); debug3->Release(); } debug->Release(); } } static ID3D12Device3 * create_device(IUnknown *adapter) { typedef HRESULT(WINAPI *PFN_D3D12CREATEDEVICE)(IUnknown*, D3D_FEATURE_LEVEL, REFIID, void**); typedef HRESULT(WINAPI *PFN_D3D12ENABLEEXPERIMENTALFEATURES)(UINT, const IID*, void*, UINT*); PFN_D3D12CREATEDEVICE D3D12CreateDevice; PFN_D3D12ENABLEEXPERIMENTALFEATURES D3D12EnableExperimentalFeatures; util_dl_library *d3d12_mod = util_dl_open(UTIL_DL_PREFIX "d3d12" UTIL_DL_EXT); if (!d3d12_mod) { debug_printf("D3D12: failed to load D3D12.DLL\n"); return NULL; } #ifdef _WIN32 if (d3d12_debug & D3D12_DEBUG_EXPERIMENTAL) #endif { D3D12EnableExperimentalFeatures = (PFN_D3D12ENABLEEXPERIMENTALFEATURES)util_dl_get_proc_address(d3d12_mod, "D3D12EnableExperimentalFeatures"); if (FAILED(D3D12EnableExperimentalFeatures(1, &D3D12ExperimentalShaderModels, NULL, NULL))) { debug_printf("D3D12: failed to enable experimental shader models\n"); return nullptr; } } D3D12CreateDevice = (PFN_D3D12CREATEDEVICE)util_dl_get_proc_address(d3d12_mod, "D3D12CreateDevice"); if (!D3D12CreateDevice) { debug_printf("D3D12: failed to load D3D12CreateDevice from D3D12.DLL\n"); return NULL; } ID3D12Device3 *dev; if (SUCCEEDED(D3D12CreateDevice(adapter, D3D_FEATURE_LEVEL_11_0, IID_PPV_ARGS(&dev)))) return dev; debug_printf("D3D12: D3D12CreateDevice failed\n"); return NULL; } static bool can_attribute_at_vertex(struct d3d12_screen *screen) { switch (screen->vendor_id) { case HW_VENDOR_MICROSOFT: return true; default: return screen->opts3.BarycentricsSupported; } } static bool can_shader_image_load_all_formats(struct d3d12_screen *screen) { if 
(!screen->opts.TypedUAVLoadAdditionalFormats) return false; /* All of these are required by ARB_shader_image_load_store */ static const DXGI_FORMAT additional_formats[] = { DXGI_FORMAT_R16G16B16A16_UNORM, DXGI_FORMAT_R16G16B16A16_SNORM, DXGI_FORMAT_R32G32_FLOAT, DXGI_FORMAT_R32G32_UINT, DXGI_FORMAT_R32G32_SINT, DXGI_FORMAT_R10G10B10A2_UNORM, DXGI_FORMAT_R10G10B10A2_UINT, DXGI_FORMAT_R11G11B10_FLOAT, DXGI_FORMAT_R8G8B8A8_SNORM, DXGI_FORMAT_R16G16_FLOAT, DXGI_FORMAT_R16G16_UNORM, DXGI_FORMAT_R16G16_UINT, DXGI_FORMAT_R16G16_SNORM, DXGI_FORMAT_R16G16_SINT, DXGI_FORMAT_R8G8_UNORM, DXGI_FORMAT_R8G8_UINT, DXGI_FORMAT_R8G8_SNORM, DXGI_FORMAT_R8G8_SINT, DXGI_FORMAT_R16_UNORM, DXGI_FORMAT_R16_SNORM, DXGI_FORMAT_R8_SNORM, }; for (unsigned i = 0; i < ARRAY_SIZE(additional_formats); ++i) { D3D12_FEATURE_DATA_FORMAT_SUPPORT support = { additional_formats[i] }; if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_FORMAT_SUPPORT, &support, sizeof(support))) || (support.Support1 & D3D12_FORMAT_SUPPORT1_TYPED_UNORDERED_ACCESS_VIEW) == D3D12_FORMAT_SUPPORT1_NONE || (support.Support2 & (D3D12_FORMAT_SUPPORT2_UAV_TYPED_LOAD | D3D12_FORMAT_SUPPORT2_UAV_TYPED_STORE)) != (D3D12_FORMAT_SUPPORT2_UAV_TYPED_LOAD | D3D12_FORMAT_SUPPORT2_UAV_TYPED_STORE)) return false; } return true; } static void d3d12_init_null_srvs(struct d3d12_screen *screen) { for (unsigned i = 0; i < RESOURCE_DIMENSION_COUNT; ++i) { D3D12_SHADER_RESOURCE_VIEW_DESC srv = {}; srv.Format = DXGI_FORMAT_R32G32B32A32_FLOAT; srv.Shader4ComponentMapping = D3D12_DEFAULT_SHADER_4_COMPONENT_MAPPING; switch (i) { case RESOURCE_DIMENSION_BUFFER: case RESOURCE_DIMENSION_UNKNOWN: srv.ViewDimension = D3D12_SRV_DIMENSION_BUFFER; srv.Buffer.FirstElement = 0; srv.Buffer.NumElements = 0; srv.Buffer.Flags = D3D12_BUFFER_SRV_FLAG_NONE; srv.Buffer.StructureByteStride = 0; break; case RESOURCE_DIMENSION_TEXTURE1D: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE1D; srv.Texture1D.MipLevels = 1; srv.Texture1D.MostDetailedMip = 0; 
srv.Texture1D.ResourceMinLODClamp = 0.0f; break; case RESOURCE_DIMENSION_TEXTURE1DARRAY: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE1DARRAY; srv.Texture1DArray.MipLevels = 1; srv.Texture1DArray.ArraySize = 1; srv.Texture1DArray.MostDetailedMip = 0; srv.Texture1DArray.FirstArraySlice = 0; srv.Texture1DArray.ResourceMinLODClamp = 0.0f; break; case RESOURCE_DIMENSION_TEXTURE2D: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE2D; srv.Texture2D.MipLevels = 1; srv.Texture2D.MostDetailedMip = 0; srv.Texture2D.PlaneSlice = 0; srv.Texture2D.ResourceMinLODClamp = 0.0f; break; case RESOURCE_DIMENSION_TEXTURE2DARRAY: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE2DARRAY; srv.Texture2DArray.MipLevels = 1; srv.Texture2DArray.ArraySize = 1; srv.Texture2DArray.MostDetailedMip = 0; srv.Texture2DArray.FirstArraySlice = 0; srv.Texture2DArray.PlaneSlice = 0; srv.Texture2DArray.ResourceMinLODClamp = 0.0f; break; case RESOURCE_DIMENSION_TEXTURE2DMS: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE2DMS; break; case RESOURCE_DIMENSION_TEXTURE2DMSARRAY: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE2DMSARRAY; srv.Texture2DMSArray.ArraySize = 1; srv.Texture2DMSArray.FirstArraySlice = 0; break; case RESOURCE_DIMENSION_TEXTURE3D: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURE3D; srv.Texture3D.MipLevels = 1; srv.Texture3D.MostDetailedMip = 0; srv.Texture3D.ResourceMinLODClamp = 0.0f; break; case RESOURCE_DIMENSION_TEXTURECUBE: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURECUBE; srv.TextureCube.MipLevels = 1; srv.TextureCube.MostDetailedMip = 0; srv.TextureCube.ResourceMinLODClamp = 0.0f; break; case RESOURCE_DIMENSION_TEXTURECUBEARRAY: srv.ViewDimension = D3D12_SRV_DIMENSION_TEXTURECUBEARRAY; srv.TextureCubeArray.MipLevels = 1; srv.TextureCubeArray.NumCubes = 1; srv.TextureCubeArray.MostDetailedMip = 0; srv.TextureCubeArray.First2DArrayFace = 0; srv.TextureCubeArray.ResourceMinLODClamp = 0.0f; break; } if (srv.ViewDimension != D3D12_SRV_DIMENSION_UNKNOWN) { 
d3d12_descriptor_pool_alloc_handle(screen->view_pool, &screen->null_srvs[i]); screen->dev->CreateShaderResourceView(NULL, &srv, screen->null_srvs[i].cpu_handle); } } } static void d3d12_init_null_uavs(struct d3d12_screen *screen) { for (unsigned i = 0; i < RESOURCE_DIMENSION_COUNT; ++i) { D3D12_UNORDERED_ACCESS_VIEW_DESC uav = {}; uav.Format = DXGI_FORMAT_R32G32B32A32_FLOAT; switch (i) { case RESOURCE_DIMENSION_BUFFER: case RESOURCE_DIMENSION_UNKNOWN: uav.ViewDimension = D3D12_UAV_DIMENSION_BUFFER; uav.Buffer.FirstElement = 0; uav.Buffer.NumElements = 0; uav.Buffer.Flags = D3D12_BUFFER_UAV_FLAG_NONE; uav.Buffer.StructureByteStride = 0; uav.Buffer.CounterOffsetInBytes = 0; break; case RESOURCE_DIMENSION_TEXTURE1D: uav.ViewDimension = D3D12_UAV_DIMENSION_TEXTURE1D; uav.Texture1D.MipSlice = 0; break; case RESOURCE_DIMENSION_TEXTURE1DARRAY: uav.ViewDimension = D3D12_UAV_DIMENSION_TEXTURE1DARRAY; uav.Texture1DArray.MipSlice = 0; uav.Texture1DArray.ArraySize = 1; uav.Texture1DArray.FirstArraySlice = 0; break; case RESOURCE_DIMENSION_TEXTURE2D: uav.ViewDimension = D3D12_UAV_DIMENSION_TEXTURE2D; uav.Texture2D.MipSlice = 0; uav.Texture2D.PlaneSlice = 0; break; case RESOURCE_DIMENSION_TEXTURE2DARRAY: case RESOURCE_DIMENSION_TEXTURECUBE: case RESOURCE_DIMENSION_TEXTURECUBEARRAY: uav.ViewDimension = D3D12_UAV_DIMENSION_TEXTURE2DARRAY; uav.Texture2DArray.MipSlice = 0; uav.Texture2DArray.ArraySize = 1; uav.Texture2DArray.FirstArraySlice = 0; uav.Texture2DArray.PlaneSlice = 0; break; case RESOURCE_DIMENSION_TEXTURE2DMS: case RESOURCE_DIMENSION_TEXTURE2DMSARRAY: break; case RESOURCE_DIMENSION_TEXTURE3D: uav.ViewDimension = D3D12_UAV_DIMENSION_TEXTURE3D; uav.Texture3D.MipSlice = 0; uav.Texture3D.FirstWSlice = 0; uav.Texture3D.WSize = 1; break; } if (uav.ViewDimension != D3D12_UAV_DIMENSION_UNKNOWN) { d3d12_descriptor_pool_alloc_handle(screen->view_pool, &screen->null_uavs[i]); screen->dev->CreateUnorderedAccessView(NULL, NULL, &uav, screen->null_uavs[i].cpu_handle); } } } static 
void d3d12_init_null_rtv(struct d3d12_screen *screen) { D3D12_RENDER_TARGET_VIEW_DESC rtv = {}; rtv.Format = DXGI_FORMAT_R8G8B8A8_UNORM; rtv.ViewDimension = D3D12_RTV_DIMENSION_TEXTURE2D; rtv.Texture2D.MipSlice = 0; rtv.Texture2D.PlaneSlice = 0; d3d12_descriptor_pool_alloc_handle(screen->rtv_pool, &screen->null_rtv); screen->dev->CreateRenderTargetView(NULL, &rtv, screen->null_rtv.cpu_handle); } static void d3d12_get_adapter_luid(struct pipe_screen *pscreen, char *luid) { struct d3d12_screen *screen = d3d12_screen(pscreen); memcpy(luid, &screen->adapter_luid, PIPE_LUID_SIZE); } static void d3d12_get_device_uuid(struct pipe_screen *pscreen, char *uuid) { struct d3d12_screen *screen = d3d12_screen(pscreen); memcpy(uuid, &screen->device_uuid, PIPE_UUID_SIZE); } static void d3d12_get_driver_uuid(struct pipe_screen *pscreen, char *uuid) { struct d3d12_screen *screen = d3d12_screen(pscreen); memcpy(uuid, &screen->driver_uuid, PIPE_UUID_SIZE); } static uint32_t d3d12_get_node_mask(struct pipe_screen *pscreen) { /* This implementation doesn't support linked adapters */ return 1; } static void d3d12_create_fence_win32(struct pipe_screen *pscreen, struct pipe_fence_handle **pfence, void *handle, const void *name, enum pipe_fd_type type) { d3d12_fence_reference((struct d3d12_fence **)pfence, type == PIPE_FD_TYPE_TIMELINE_SEMAPHORE ? 
d3d12_open_fence(d3d12_screen(pscreen), handle, name) : nullptr); } static void d3d12_set_fence_timeline_value(struct pipe_screen *pscreen, struct pipe_fence_handle *pfence, uint64_t value) { d3d12_fence(pfence)->value = value; } void d3d12_init_screen_base(struct d3d12_screen *screen, struct sw_winsys *winsys, LUID *adapter_luid) { d3d12_debug = debug_get_option_d3d12_debug(); screen->winsys = winsys; if (adapter_luid) screen->adapter_luid = *adapter_luid; mtx_init(&screen->descriptor_pool_mutex, mtx_plain); mtx_init(&screen->submit_mutex, mtx_plain); list_inithead(&screen->context_list); screen->base.get_vendor = d3d12_get_vendor; screen->base.get_device_vendor = d3d12_get_device_vendor; screen->base.get_param = d3d12_get_param; screen->base.get_paramf = d3d12_get_paramf; screen->base.get_shader_param = d3d12_get_shader_param; screen->base.get_compute_param = d3d12_get_compute_param; screen->base.is_format_supported = d3d12_is_format_supported; screen->base.get_compiler_options = d3d12_get_compiler_options; screen->base.context_create = d3d12_context_create; screen->base.flush_frontbuffer = d3d12_flush_frontbuffer; screen->base.get_device_luid = d3d12_get_adapter_luid; screen->base.get_device_uuid = d3d12_get_device_uuid; screen->base.get_driver_uuid = d3d12_get_driver_uuid; screen->base.get_device_node_mask = d3d12_get_node_mask; screen->base.create_fence_win32 = d3d12_create_fence_win32; screen->base.set_fence_timeline_value = d3d12_set_fence_timeline_value; } bool d3d12_init_screen(struct d3d12_screen *screen, IUnknown *adapter) { assert(screen->base.destroy != nullptr); #ifndef DEBUG if (d3d12_debug & D3D12_DEBUG_DEBUG_LAYER) #endif enable_d3d12_debug_layer(); if (d3d12_debug & D3D12_DEBUG_GPU_VALIDATOR) enable_gpu_validation(); screen->dev = create_device(adapter); if (!screen->dev) { debug_printf("D3D12: failed to create device\n"); return false; } screen->adapter_luid = GetAdapterLuid(screen->dev); ID3D12InfoQueue *info_queue; if 
(SUCCEEDED(screen->dev->QueryInterface(IID_PPV_ARGS(&info_queue)))) { D3D12_MESSAGE_SEVERITY severities[] = { D3D12_MESSAGE_SEVERITY_INFO, D3D12_MESSAGE_SEVERITY_WARNING, }; D3D12_MESSAGE_ID msg_ids[] = { D3D12_MESSAGE_ID_CLEARRENDERTARGETVIEW_MISMATCHINGCLEARVALUE, }; D3D12_INFO_QUEUE_FILTER NewFilter = {}; NewFilter.DenyList.NumSeverities = ARRAY_SIZE(severities); NewFilter.DenyList.pSeverityList = severities; NewFilter.DenyList.NumIDs = ARRAY_SIZE(msg_ids); NewFilter.DenyList.pIDList = msg_ids; info_queue->PushStorageFilter(&NewFilter); info_queue->Release(); } if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS, &screen->opts, sizeof(screen->opts)))) { debug_printf("D3D12: failed to get device options\n"); return false; } if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS1, &screen->opts1, sizeof(screen->opts1)))) { debug_printf("D3D12: failed to get device options\n"); return false; } if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS2, &screen->opts2, sizeof(screen->opts2)))) { debug_printf("D3D12: failed to get device options\n"); return false; } if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS3, &screen->opts3, sizeof(screen->opts3)))) { debug_printf("D3D12: failed to get device options\n"); return false; } if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS4, &screen->opts4, sizeof(screen->opts4)))) { debug_printf("D3D12: failed to get device options\n"); return false; } screen->architecture.NodeIndex = 0; if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_ARCHITECTURE, &screen->architecture, sizeof(screen->architecture)))) { debug_printf("D3D12: failed to get device architecture\n"); return false; } D3D12_FEATURE_DATA_FEATURE_LEVELS feature_levels; static const D3D_FEATURE_LEVEL levels[] = { D3D_FEATURE_LEVEL_11_0, D3D_FEATURE_LEVEL_11_1, D3D_FEATURE_LEVEL_12_0, D3D_FEATURE_LEVEL_12_1, }; feature_levels.NumFeatureLevels = ARRAY_SIZE(levels); 
feature_levels.pFeatureLevelsRequested = levels; if (FAILED(screen->dev->CheckFeatureSupport(D3D12_FEATURE_FEATURE_LEVELS, &feature_levels, sizeof(feature_levels)))) { debug_printf("D3D12: failed to get device feature levels\n"); return false; } screen->max_feature_level = feature_levels.MaxSupportedFeatureLevel; D3D12_COMMAND_QUEUE_DESC queue_desc; queue_desc.Type = D3D12_COMMAND_LIST_TYPE_DIRECT; queue_desc.Priority = D3D12_COMMAND_QUEUE_PRIORITY_NORMAL; queue_desc.Flags = D3D12_COMMAND_QUEUE_FLAG_NONE; queue_desc.NodeMask = 0; ID3D12Device9 *device9; if (SUCCEEDED(screen->dev->QueryInterface(&device9))) { if (FAILED(device9->CreateCommandQueue1(&queue_desc, OpenGLOn12CreatorID, IID_PPV_ARGS(&screen->cmdqueue)))) return false; device9->Release(); } else { if (FAILED(screen->dev->CreateCommandQueue(&queue_desc, IID_PPV_ARGS(&screen->cmdqueue)))) return false; } if (FAILED(screen->dev->CreateFence(0, D3D12_FENCE_FLAG_NONE, IID_PPV_ARGS(&screen->fence)))) return false; if (!d3d12_init_residency(screen)) return false; UINT64 timestamp_freq; if (FAILED(screen->cmdqueue->GetTimestampFrequency(×tamp_freq))) timestamp_freq = 10000000; screen->timestamp_multiplier = 1000000000.0 / timestamp_freq; d3d12_screen_fence_init(&screen->base); d3d12_screen_resource_init(&screen->base); #ifdef HAVE_GALLIUM_D3D12_VIDEO d3d12_screen_video_init(&screen->base); #endif slab_create_parent(&screen->transfer_pool, sizeof(struct d3d12_transfer), 16); struct pb_desc desc; desc.alignment = D3D12_TEXTURE_DATA_PLACEMENT_ALIGNMENT; desc.usage = (pb_usage_flags)(PB_USAGE_CPU_WRITE | PB_USAGE_GPU_READ); screen->bufmgr = d3d12_bufmgr_create(screen); if (!screen->bufmgr) return false; screen->cache_bufmgr = pb_cache_manager_create(screen->bufmgr, 0xfffff, 2, 0, 512 * 1024 * 1024); if (!screen->cache_bufmgr) return false; screen->slab_bufmgr = pb_slab_range_manager_create(screen->cache_bufmgr, 16, D3D12_DEFAULT_RESOURCE_PLACEMENT_ALIGNMENT, D3D12_DEFAULT_RESOURCE_PLACEMENT_ALIGNMENT, &desc); if 
(!screen->slab_bufmgr) return false; desc.usage = (pb_usage_flags)(PB_USAGE_CPU_READ_WRITE | PB_USAGE_GPU_WRITE); screen->readback_slab_bufmgr = pb_slab_range_manager_create(screen->cache_bufmgr, 16, D3D12_DEFAULT_RESOURCE_PLACEMENT_ALIGNMENT, D3D12_DEFAULT_RESOURCE_PLACEMENT_ALIGNMENT, &desc); if (!screen->readback_slab_bufmgr) return false; screen->rtv_pool = d3d12_descriptor_pool_new(screen, D3D12_DESCRIPTOR_HEAP_TYPE_RTV, 64); screen->dsv_pool = d3d12_descriptor_pool_new(screen, D3D12_DESCRIPTOR_HEAP_TYPE_DSV, 64); screen->view_pool = d3d12_descriptor_pool_new(screen, D3D12_DESCRIPTOR_HEAP_TYPE_CBV_SRV_UAV, 1024); if (!screen->rtv_pool || !screen->dsv_pool || !screen->view_pool) return false; d3d12_init_null_srvs(screen); d3d12_init_null_uavs(screen); d3d12_init_null_rtv(screen); screen->have_load_at_vertex = can_attribute_at_vertex(screen); screen->support_shader_images = can_shader_image_load_all_formats(screen); ID3D12Device8 *dev8; if (SUCCEEDED(screen->dev->QueryInterface(&dev8))) { dev8->Release(); screen->support_create_not_resident = true; } screen->nir_options = *dxil_get_nir_compiler_options(); static constexpr uint64_t known_good_warp_version = 10ull << 48 | 22000ull << 16; if ((screen->vendor_id == HW_VENDOR_MICROSOFT && screen->driver_version < known_good_warp_version) || !screen->opts1.Int64ShaderOps) { /* Work around old versions of WARP that are completely broken for 64bit shifts */ screen->nir_options.lower_pack_64_2x32_split = false; screen->nir_options.lower_unpack_64_2x32_split = false; screen->nir_options.lower_int64_options = (nir_lower_int64_options)~0; } if (!screen->opts.DoublePrecisionFloatShaderOps) screen->nir_options.lower_doubles_options = (nir_lower_doubles_options)~0; const char *mesa_version = "Mesa " PACKAGE_VERSION MESA_GIT_SHA1; struct mesa_sha1 sha1_ctx; uint8_t sha1[SHA1_DIGEST_LENGTH]; STATIC_ASSERT(PIPE_UUID_SIZE <= sizeof(sha1)); /* The driver UUID is used for determining sharability of images and memory * between two 
instances in separate processes. People who want to * share memory need to also check the device UUID or LUID so all this * needs to be is the build-id. */ _mesa_sha1_compute(mesa_version, strlen(mesa_version), sha1); memcpy(screen->driver_uuid, sha1, PIPE_UUID_SIZE); /* The device UUID uniquely identifies the given device within the machine. */ _mesa_sha1_init(&sha1_ctx); _mesa_sha1_update(&sha1_ctx, &screen->vendor_id, sizeof(screen->vendor_id)); _mesa_sha1_update(&sha1_ctx, &screen->device_id, sizeof(screen->device_id)); _mesa_sha1_update(&sha1_ctx, &screen->subsys_id, sizeof(screen->subsys_id)); _mesa_sha1_update(&sha1_ctx, &screen->revision, sizeof(screen->revision)); _mesa_sha1_final(&sha1_ctx, sha1); memcpy(screen->device_uuid, sha1, PIPE_UUID_SIZE); glsl_type_singleton_init_or_ref(); return true; }