| // Copyright 2019 The Dawn Authors |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #include "dawn/native/d3d12/PhysicalDeviceD3D12.h" |
| |
| #include <string> |
| #include <utility> |
| |
| #include "dawn/common/Constants.h" |
| #include "dawn/common/Platform.h" |
| #include "dawn/common/WindowsUtils.h" |
| #include "dawn/native/Instance.h" |
| #include "dawn/native/d3d/D3DError.h" |
| #include "dawn/native/d3d12/BackendD3D12.h" |
| #include "dawn/native/d3d12/DeviceD3D12.h" |
| #include "dawn/native/d3d12/PlatformFunctionsD3D12.h" |
| #include "dawn/native/d3d12/UtilsD3D12.h" |
| |
| namespace dawn::native::d3d12 { |
| |
| PhysicalDevice::PhysicalDevice(Backend* backend, ComPtr<IDXGIAdapter3> hardwareAdapter) |
| : Base(backend, std::move(hardwareAdapter), wgpu::BackendType::D3D12) {} |
| |
| PhysicalDevice::~PhysicalDevice() { |
| CleanUpDebugLayerFilters(); |
| } |
| |
| bool PhysicalDevice::SupportsExternalImages() const { |
| // Via dawn::native::d3d::ExternalImageDXGI::Create |
| return true; |
| } |
| |
| bool PhysicalDevice::SupportsFeatureLevel(FeatureLevel) const { |
| return true; |
| } |
| |
| const D3D12DeviceInfo& PhysicalDevice::GetDeviceInfo() const { |
| return mDeviceInfo; |
| } |
| |
| Backend* PhysicalDevice::GetBackend() const { |
| return static_cast<Backend*>(Base::GetBackend()); |
| } |
| |
| ComPtr<ID3D12Device> PhysicalDevice::GetDevice() const { |
| return mD3d12Device; |
| } |
| |
| MaybeError PhysicalDevice::InitializeImpl() { |
| DAWN_TRY(Base::InitializeImpl()); |
| // D3D12 cannot check for feature support without a device. |
| // Create the device to populate the adapter properties then reuse it when needed for actual |
| // rendering. |
| const PlatformFunctions* functions = GetBackend()->GetFunctions(); |
| if (FAILED(functions->d3d12CreateDevice(GetHardwareAdapter(), D3D_FEATURE_LEVEL_11_0, |
| __uuidof(ID3D12Device), &mD3d12Device))) { |
| return DAWN_INTERNAL_ERROR("D3D12CreateDevice failed"); |
| } |
| |
| DAWN_TRY(InitializeDebugLayerFilters()); |
| |
| DAWN_TRY_ASSIGN(mDeviceInfo, GatherDeviceInfo(*this)); |
| |
| // Base::InitializeImpl() cannot distinguish between discrete and integrated GPUs, so we need to |
| // overwrite it here. |
| if (mAdapterType == wgpu::AdapterType::DiscreteGPU && mDeviceInfo.isUMA) { |
| mAdapterType = wgpu::AdapterType::IntegratedGPU; |
| } |
| |
| if (GetInstance()->IsAdapterBlocklistEnabled()) { |
| #if DAWN_PLATFORM_IS(I386) |
| DAWN_INVALID_IF( |
| mDeviceInfo.shaderModel >= 60, |
| "D3D12 x86 SM6.0+ adapter is blocklisted. See https://crbug.com/tint/1753."); |
| |
| DAWN_INVALID_IF( |
| gpu_info::IsNvidia(mVendorId), |
| "D3D12 NVIDIA x86 adapter is blocklisted. See https://crbug.com/dawn/1196."); |
| #elif DAWN_PLATFORM_IS(ARM) |
| return DAWN_VALIDATION_ERROR( |
| "D3D12 on ARM CPU is blocklisted. See https://crbug.com/dawn/884."); |
| #endif |
| } |
| return {}; |
| } |
| |
| bool PhysicalDevice::AreTimestampQueriesSupported() const { |
| D3D12_COMMAND_QUEUE_DESC queueDesc = {}; |
| queueDesc.Flags = D3D12_COMMAND_QUEUE_FLAG_NONE; |
| queueDesc.Type = D3D12_COMMAND_LIST_TYPE_DIRECT; |
| ComPtr<ID3D12CommandQueue> d3d12CommandQueue; |
| HRESULT hr = mD3d12Device->CreateCommandQueue(&queueDesc, IID_PPV_ARGS(&d3d12CommandQueue)); |
| if (FAILED(hr)) { |
| return false; |
| } |
| |
| // GetTimestampFrequency returns an error HRESULT when there are bugs in Windows container |
| // and vGPU implementations. |
| uint64_t timeStampFrequency; |
| hr = d3d12CommandQueue->GetTimestampFrequency(&timeStampFrequency); |
| if (FAILED(hr)) { |
| return false; |
| } |
| |
| return true; |
| } |
| |
| void PhysicalDevice::InitializeSupportedFeaturesImpl() { |
| EnableFeature(Feature::TextureCompressionBC); |
| EnableFeature(Feature::MultiPlanarFormats); |
| EnableFeature(Feature::Depth32FloatStencil8); |
| EnableFeature(Feature::IndirectFirstInstance); |
| EnableFeature(Feature::RG11B10UfloatRenderable); |
| EnableFeature(Feature::DepthClipControl); |
| EnableFeature(Feature::SurfaceCapabilities); |
| EnableFeature(Feature::Float32Filterable); |
| |
| if (AreTimestampQueriesSupported()) { |
| EnableFeature(Feature::TimestampQuery); |
| EnableFeature(Feature::TimestampQueryInsidePasses); |
| } |
| EnableFeature(Feature::PipelineStatisticsQuery); |
| |
| // Both Dp4a and ShaderF16 features require DXC version being 1.4 or higher |
| if (GetBackend()->IsDXCAvailableAndVersionAtLeast(1, 4, 1, 4)) { |
| if (mDeviceInfo.supportsDP4a) { |
| EnableFeature(Feature::ChromiumExperimentalDp4a); |
| } |
| if (mDeviceInfo.supportsShaderF16) { |
| EnableFeature(Feature::ShaderF16); |
| } |
| } |
| |
| D3D12_FEATURE_DATA_FORMAT_SUPPORT bgra8unormFormatInfo = {}; |
| bgra8unormFormatInfo.Format = DXGI_FORMAT_B8G8R8A8_UNORM; |
| HRESULT hr = mD3d12Device->CheckFeatureSupport( |
| D3D12_FEATURE_FORMAT_SUPPORT, &bgra8unormFormatInfo, sizeof(bgra8unormFormatInfo)); |
| if (SUCCEEDED(hr) && |
| (bgra8unormFormatInfo.Support1 & D3D12_FORMAT_SUPPORT1_TYPED_UNORDERED_ACCESS_VIEW)) { |
| EnableFeature(Feature::BGRA8UnormStorage); |
| } |
| } |
| |
| MaybeError PhysicalDevice::InitializeSupportedLimitsImpl(CombinedLimits* limits) { |
| D3D12_FEATURE_DATA_D3D12_OPTIONS featureData = {}; |
| |
| DAWN_TRY(CheckHRESULT(mD3d12Device->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS, |
| &featureData, sizeof(featureData)), |
| "CheckFeatureSupport D3D12_FEATURE_D3D12_OPTIONS")); |
| |
| // Check if the device is at least D3D_FEATURE_LEVEL_11_1 or D3D_FEATURE_LEVEL_11_0 |
| const D3D_FEATURE_LEVEL levelsToQuery[]{D3D_FEATURE_LEVEL_11_1, D3D_FEATURE_LEVEL_11_0}; |
| |
| D3D12_FEATURE_DATA_FEATURE_LEVELS featureLevels; |
| featureLevels.NumFeatureLevels = sizeof(levelsToQuery) / sizeof(D3D_FEATURE_LEVEL); |
| featureLevels.pFeatureLevelsRequested = levelsToQuery; |
| DAWN_TRY(CheckHRESULT(mD3d12Device->CheckFeatureSupport(D3D12_FEATURE_FEATURE_LEVELS, |
| &featureLevels, sizeof(featureLevels)), |
| "CheckFeatureSupport D3D12_FEATURE_FEATURE_LEVELS")); |
| |
| if (featureLevels.MaxSupportedFeatureLevel == D3D_FEATURE_LEVEL_11_0 && |
| featureData.ResourceBindingTier < D3D12_RESOURCE_BINDING_TIER_2) { |
| return DAWN_VALIDATION_ERROR( |
| "At least Resource Binding Tier 2 is required for D3D12 Feature Level 11.0 " |
| "devices."); |
| } |
| |
| GetDefaultLimits(&limits->v1); |
| |
| // https://docs.microsoft.com/en-us/windows/win32/direct3d12/hardware-feature-levels |
| |
| // Limits that are the same across D3D feature levels |
| limits->v1.maxTextureDimension1D = D3D12_REQ_TEXTURE1D_U_DIMENSION; |
| limits->v1.maxTextureDimension2D = D3D12_REQ_TEXTURE2D_U_OR_V_DIMENSION; |
| limits->v1.maxTextureDimension3D = D3D12_REQ_TEXTURE3D_U_V_OR_W_DIMENSION; |
| limits->v1.maxTextureArrayLayers = D3D12_REQ_TEXTURE2D_ARRAY_AXIS_DIMENSION; |
| // Slot values can be 0-15, inclusive: |
| // https://docs.microsoft.com/en-ca/windows/win32/api/d3d12/ns-d3d12-d3d12_input_element_desc |
| limits->v1.maxVertexBuffers = 16; |
| limits->v1.maxVertexAttributes = D3D12_IA_VERTEX_INPUT_RESOURCE_SLOT_COUNT; |
| |
| // Note: WebGPU requires FL11.1+ |
| // https://docs.microsoft.com/en-us/windows/win32/direct3d12/hardware-support |
| // Resource Binding Tier: 1 2 3 |
| |
| // Max(CBV+UAV+SRV) 1M 1M 1M+ |
| // Max CBV per stage 14 14 full |
| // Max SRV per stage 128 full full |
| // Max UAV in all stages 64 64 full |
| // Max Samplers per stage 16 2048 2048 |
| |
| // https://docs.microsoft.com/en-us/windows-hardware/test/hlk/testref/efad06e8-51d1-40ce-ad5c-573a134b4bb6 |
| // "full" means the full heap can be used. This is tested |
| // to work for 1 million descriptors, and 1.1M for tier 3. |
| uint32_t maxCBVsPerStage; |
| uint32_t maxSRVsPerStage; |
| uint32_t maxUAVsAllStages; |
| uint32_t maxSamplersPerStage; |
| switch (featureData.ResourceBindingTier) { |
| case D3D12_RESOURCE_BINDING_TIER_1: |
| maxCBVsPerStage = 14; |
| maxSRVsPerStage = 128; |
| maxUAVsAllStages = 64; |
| maxSamplersPerStage = 16; |
| break; |
| case D3D12_RESOURCE_BINDING_TIER_2: |
| maxCBVsPerStage = 14; |
| maxSRVsPerStage = 1'000'000; |
| maxUAVsAllStages = 64; |
| maxSamplersPerStage = 2048; |
| break; |
| case D3D12_RESOURCE_BINDING_TIER_3: |
| default: |
| maxCBVsPerStage = 1'100'000; |
| maxSRVsPerStage = 1'100'000; |
| maxUAVsAllStages = 1'100'000; |
| maxSamplersPerStage = 2048; |
| break; |
| } |
| |
| ASSERT(maxUAVsAllStages / 4 > limits->v1.maxStorageTexturesPerShaderStage); |
| ASSERT(maxUAVsAllStages / 4 > limits->v1.maxStorageBuffersPerShaderStage); |
| uint32_t maxUAVsPerStage = maxUAVsAllStages / 2; |
| |
| limits->v1.maxUniformBuffersPerShaderStage = maxCBVsPerStage; |
| // Allocate half of the UAVs to storage buffers, and half to storage textures. |
| limits->v1.maxStorageTexturesPerShaderStage = maxUAVsPerStage / 2; |
| limits->v1.maxStorageBuffersPerShaderStage = maxUAVsPerStage - maxUAVsPerStage / 2; |
| limits->v1.maxSampledTexturesPerShaderStage = maxSRVsPerStage; |
| limits->v1.maxSamplersPerShaderStage = maxSamplersPerStage; |
| |
| limits->v1.maxColorAttachments = D3D12_SIMULTANEOUS_RENDER_TARGET_COUNT; |
| |
| // https://docs.microsoft.com/en-us/windows/win32/direct3d12/root-signature-limits |
| // In DWORDS. Descriptor tables cost 1, Root constants cost 1, Root descriptors cost 2. |
| static constexpr uint32_t kMaxRootSignatureSize = 64u; |
| // Dawn maps WebGPU's binding model by: |
| // - (maxBindGroups) |
| // CBVs/UAVs/SRVs for bind group are a root descriptor table |
| // - (maxBindGroups) |
| // Samplers for each bind group are a root descriptor table |
| // - dynamic uniform buffers - root descriptor |
| // - dynamic storage buffers - root descriptor plus a root constant for the size |
| // RESERVED: |
| // - 3 = max of: |
| // - 2 root constants for the baseVertex/baseInstance constants. |
| // - 3 root constants for num workgroups X, Y, Z |
| static constexpr uint32_t kReservedSlots = 3; |
| |
| // Costs: |
| // - bind group: 2 = 1 cbv/uav/srv table + 1 sampler table |
| // - dynamic uniform buffer: 2 slots for a root descriptor |
| // - dynamic storage buffer: 3 slots for a root descriptor + root constant |
| |
| // Available slots after base limits considered. |
| uint32_t availableRootSignatureSlots = |
| kMaxRootSignatureSize - kReservedSlots - 2 * limits->v1.maxBindGroups - |
| 2 * limits->v1.maxDynamicUniformBuffersPerPipelineLayout - |
| 3 * limits->v1.maxDynamicStorageBuffersPerPipelineLayout; |
| |
| while (availableRootSignatureSlots >= 2) { |
| // Start by incrementing maxDynamicStorageBuffersPerPipelineLayout since the |
| // default is just 4 and developers likely want more. This scheme currently |
| // gets us to 8. |
| if (availableRootSignatureSlots >= 3) { |
| limits->v1.maxDynamicStorageBuffersPerPipelineLayout += 1; |
| availableRootSignatureSlots -= 3; |
| } |
| if (availableRootSignatureSlots >= 2) { |
| limits->v1.maxBindGroups += 1; |
| availableRootSignatureSlots -= 2; |
| } |
| if (availableRootSignatureSlots >= 2) { |
| limits->v1.maxDynamicUniformBuffersPerPipelineLayout += 1; |
| availableRootSignatureSlots -= 2; |
| } |
| } |
| |
| ASSERT(2 * limits->v1.maxBindGroups + 2 * limits->v1.maxDynamicUniformBuffersPerPipelineLayout + |
| 3 * limits->v1.maxDynamicStorageBuffersPerPipelineLayout <= |
| kMaxRootSignatureSize - kReservedSlots); |
| |
| // https://docs.microsoft.com/en-us/windows/win32/direct3dhlsl/sm5-attributes-numthreads |
| limits->v1.maxComputeWorkgroupSizeX = D3D12_CS_THREAD_GROUP_MAX_X; |
| limits->v1.maxComputeWorkgroupSizeY = D3D12_CS_THREAD_GROUP_MAX_Y; |
| limits->v1.maxComputeWorkgroupSizeZ = D3D12_CS_THREAD_GROUP_MAX_Z; |
| limits->v1.maxComputeInvocationsPerWorkgroup = D3D12_CS_THREAD_GROUP_MAX_THREADS_PER_GROUP; |
| |
| // https://docs.microsoft.com/en-us/windows/win32/api/d3d12/ns-d3d12-d3d12_dispatch_arguments |
| limits->v1.maxComputeWorkgroupsPerDimension = D3D12_CS_DISPATCH_MAX_THREAD_GROUPS_PER_DIMENSION; |
| |
| // https://docs.microsoft.com/en-us/windows/win32/direct3d11/overviews-direct3d-11-devices-downlevel-compute-shaders |
| // Thread Group Shared Memory is limited to 16Kb on downlevel hardware. This is less than |
| // the 32Kb that is available to Direct3D 11 hardware. D3D12 is also 32kb. |
| limits->v1.maxComputeWorkgroupStorageSize = 32768; |
| |
| // Max number of "constants" where each constant is a 16-byte float4 |
| limits->v1.maxUniformBufferBindingSize = D3D12_REQ_CONSTANT_BUFFER_ELEMENT_COUNT * 16; |
| |
| if (gpu_info::IsQualcomm(GetVendorId())) { |
| // limit of number of texels in a buffer == (1 << 27) |
| // D3D12_REQ_BUFFER_RESOURCE_TEXEL_COUNT_2_TO_EXP |
| // This limit doesn't apply to a raw buffer, but only applies to |
| // typed, or structured buffer. so this could be a QC driver bug. |
| limits->v1.maxStorageBufferBindingSize = uint64_t(1) |
| << D3D12_REQ_BUFFER_RESOURCE_TEXEL_COUNT_2_TO_EXP; |
| } else { |
| limits->v1.maxStorageBufferBindingSize = kAssumedMaxBufferSize; |
| } |
| |
| // D3D12 has no documented limit on the buffer size. |
| limits->v1.maxBufferSize = kAssumedMaxBufferSize; |
| |
| // Using base limits for: |
| // TODO(crbug.com/dawn/685): |
| // - maxInterStageShaderComponents |
| // - maxVertexBufferArrayStride |
| |
| // TODO(crbug.com/dawn/1448): |
| // - maxInterStageShaderVariables |
| |
| return {}; |
| } |
| |
| MaybeError PhysicalDevice::ValidateFeatureSupportedWithTogglesImpl( |
| wgpu::FeatureName feature, |
| const TogglesState& toggles) const { |
| // shader-f16 feature and chromium-experimental-dp4a feature require DXC 1.4 or higher for |
| // D3D12. Note that DXC version is checked in InitializeSupportedFeaturesImpl. |
| if (feature == wgpu::FeatureName::ShaderF16 || |
| feature == wgpu::FeatureName::ChromiumExperimentalDp4a) { |
| DAWN_INVALID_IF(!toggles.IsEnabled(Toggle::UseDXC), "Feature %s requires DXC for D3D12.", |
| GetInstance()->GetFeatureInfo(feature)->name); |
| } |
| return {}; |
| } |
| |
| MaybeError PhysicalDevice::InitializeDebugLayerFilters() { |
| if (!GetInstance()->IsBackendValidationEnabled()) { |
| return {}; |
| } |
| |
| D3D12_MESSAGE_ID denyIds[] = { |
| // |
| // Permanent IDs: list of warnings that are not applicable |
| // |
| |
| // Resource sub-allocation partially maps pre-allocated heaps. This means the |
| // entire physical addresses space may have no resources or have many resources |
| // assigned the same heap. |
| D3D12_MESSAGE_ID_HEAP_ADDRESS_RANGE_HAS_NO_RESOURCE, |
| D3D12_MESSAGE_ID_HEAP_ADDRESS_RANGE_INTERSECTS_MULTIPLE_BUFFERS, |
| |
| // The debug layer validates pipeline objects when they are created. Dawn validates |
| // them when them when they are set. Therefore, since the issue is caught at a later |
| // time, we can silence this warnings. |
| D3D12_MESSAGE_ID_CREATEGRAPHICSPIPELINESTATE_RENDERTARGETVIEW_NOT_SET, |
| |
| // Adding a clear color during resource creation would require heuristics or delayed |
| // creation. |
| // https://crbug.com/dawn/418 |
| D3D12_MESSAGE_ID_CLEARRENDERTARGETVIEW_MISMATCHINGCLEARVALUE, |
| D3D12_MESSAGE_ID_CLEARDEPTHSTENCILVIEW_MISMATCHINGCLEARVALUE, |
| |
| // Dawn enforces proper Unmaps at a later time. |
| // https://crbug.com/dawn/422 |
| D3D12_MESSAGE_ID_EXECUTECOMMANDLISTS_GPU_WRITTEN_READBACK_RESOURCE_MAPPED, |
| |
| // WebGPU allows empty scissors without empty viewports. |
| D3D12_MESSAGE_ID_DRAW_EMPTY_SCISSOR_RECTANGLE, |
| |
| // |
| // Temporary IDs: list of warnings that should be fixed or promoted |
| // |
| |
| // Remove after warning have been addressed |
| // https://crbug.com/dawn/421 |
| D3D12_MESSAGE_ID_GPU_BASED_VALIDATION_INCOMPATIBLE_RESOURCE_STATE, |
| |
| // For small placed resource alignment, we first request the small alignment, which may |
| // get rejected and generate a debug error. Then, we request 0 to get the allowed |
| // allowed alignment. |
| D3D12_MESSAGE_ID_CREATERESOURCE_INVALIDALIGNMENT, |
| |
| // WebGPU allows OOB vertex buffer access and relies on D3D12's robust buffer access |
| // behavior. |
| D3D12_MESSAGE_ID_COMMAND_LIST_DRAW_VERTEX_BUFFER_TOO_SMALL, |
| |
| // WebGPU allows setVertexBuffer with offset that equals to the whole vertex buffer |
| // size. |
| // Even this means that no vertex buffer view has been set in D3D12 backend. |
| // https://crbug.com/dawn/1255 |
| D3D12_MESSAGE_ID_COMMAND_LIST_DRAW_VERTEX_BUFFER_NOT_SET, |
| |
| // When using f16 in vertex attributes the debug layer may report float16_t as type |
| // `unknown`, resulting in a CREATEINPUTLAYOUT_TYPE_MISMATCH warning. |
| // https://crbug.com/tint/1473 |
| D3D12_MESSAGE_ID_CREATEINPUTLAYOUT_TYPE_MISMATCH, |
| }; |
| |
| // Create a retrieval filter with a deny list to suppress messages. |
| // Any messages remaining will be converted to Dawn errors. |
| D3D12_INFO_QUEUE_FILTER filter{}; |
| // Filter out info/message and only create errors from warnings or worse. |
| D3D12_MESSAGE_SEVERITY severities[] = { |
| D3D12_MESSAGE_SEVERITY_INFO, |
| D3D12_MESSAGE_SEVERITY_MESSAGE, |
| }; |
| filter.DenyList.NumSeverities = ARRAYSIZE(severities); |
| filter.DenyList.pSeverityList = severities; |
| filter.DenyList.NumIDs = ARRAYSIZE(denyIds); |
| filter.DenyList.pIDList = denyIds; |
| |
| ComPtr<ID3D12InfoQueue> infoQueue; |
| DAWN_TRY(CheckHRESULT(mD3d12Device.As(&infoQueue), |
| "D3D12 QueryInterface ID3D12Device to ID3D12InfoQueue")); |
| |
| // To avoid flooding the console, a storage-filter is also used to |
| // prevent messages from getting logged. |
| DAWN_TRY( |
| CheckHRESULT(infoQueue->PushStorageFilter(&filter), "ID3D12InfoQueue::PushStorageFilter")); |
| |
| DAWN_TRY(CheckHRESULT(infoQueue->PushRetrievalFilter(&filter), |
| "ID3D12InfoQueue::PushRetrievalFilter")); |
| |
| return {}; |
| } |
| |
| void PhysicalDevice::CleanUpDebugLayerFilters() { |
| if (!GetInstance()->IsBackendValidationEnabled()) { |
| return; |
| } |
| |
| // The device may not exist if this adapter failed to initialize. |
| if (mD3d12Device == nullptr) { |
| return; |
| } |
| |
| // If the debug layer is not installed, return immediately to avoid crashing the process. |
| ComPtr<ID3D12InfoQueue> infoQueue; |
| if (FAILED(mD3d12Device.As(&infoQueue))) { |
| return; |
| } |
| |
| infoQueue->PopRetrievalFilter(); |
| infoQueue->PopStorageFilter(); |
| } |
| |
| void PhysicalDevice::SetupBackendDeviceToggles(TogglesState* deviceToggles) const { |
| const bool useResourceHeapTier2 = (GetDeviceInfo().resourceHeapTier >= 2); |
| deviceToggles->Default(Toggle::UseD3D12ResourceHeapTier2, useResourceHeapTier2); |
| deviceToggles->Default(Toggle::UseD3D12RenderPass, GetDeviceInfo().supportsRenderPass); |
| deviceToggles->Default(Toggle::UseD3D12ResidencyManagement, true); |
| deviceToggles->Default(Toggle::D3D12AlwaysUseTypelessFormatsForCastableTexture, |
| !GetDeviceInfo().supportsCastingFullyTypedFormat); |
| deviceToggles->Default(Toggle::ApplyClearBigIntegerColorValueWithDraw, true); |
| |
| // The restriction on the source box specifying a portion of the depth stencil texture in |
| // CopyTextureRegion() is only available on the D3D12 platforms which doesn't support |
| // programmable sample positions. |
| deviceToggles->Default( |
| Toggle::D3D12UseTempBufferInDepthStencilTextureAndBufferCopyWithNonZeroBufferOffset, |
| GetDeviceInfo().programmableSamplePositionsTier == 0); |
| |
| // Check DXC for use_dxc toggle, and default to use FXC |
| // TODO(dawn:1495): When implementing adapter toggles, promote UseDXC as adapter toggle, and do |
| // the validation when creating adapters. |
| if (!GetBackend()->IsDXCAvailable()) { |
| deviceToggles->ForceSet(Toggle::UseDXC, false); |
| } |
| deviceToggles->Default(Toggle::UseDXC, false); |
| |
| // Disable optimizations when using FXC |
| // See https://crbug.com/dawn/1203 |
| deviceToggles->Default(Toggle::FxcOptimizations, false); |
| |
| // By default use the maximum shader-visible heap size allowed. |
| deviceToggles->Default(Toggle::UseD3D12SmallShaderVisibleHeapForTesting, false); |
| |
| // By default use D3D12 Root Signature Version 1.1 when possible |
| deviceToggles->Default(Toggle::D3D12UseRootSignatureVersion1_1, |
| GetDeviceInfo().supportsRootSignatureVersion1_1); |
| |
| uint32_t deviceId = GetDeviceId(); |
| uint32_t vendorId = GetVendorId(); |
| |
| // Currently this workaround is only needed on Intel Gen9, Gen9.5 and Gen11 GPUs. |
| // See http://crbug.com/1161355 for more information. |
| if (gpu_info::IsIntelGen9(vendorId, deviceId) || gpu_info::IsIntelGen11(vendorId, deviceId)) { |
| const gpu_info::DriverVersion kFixedDriverVersion = {31, 0, 101, 2114}; |
| if (gpu_info::CompareWindowsDriverVersion(vendorId, GetDriverVersion(), |
| kFixedDriverVersion) < 0) { |
| deviceToggles->Default( |
| Toggle::UseTempBufferInSmallFormatTextureToTextureCopyFromGreaterToLessMipLevel, |
| true); |
| } |
| } |
| |
| // Currently this workaround is only needed on Intel Gen9, Gen9.5 and Gen12 GPUs. |
| // See http://crbug.com/dawn/1487 for more information. |
| if (gpu_info::IsIntelGen9(vendorId, deviceId) || gpu_info::IsIntelGen12LP(vendorId, deviceId) || |
| gpu_info::IsIntelGen12HP(vendorId, deviceId)) { |
| deviceToggles->Default(Toggle::D3D12ForceClearCopyableDepthStencilTextureOnCreation, true); |
| } |
| |
| // Currently this workaround is only needed on Intel Gen12 GPUs. |
| // See http://crbug.com/dawn/1487 for more information. |
| if (gpu_info::IsIntelGen12LP(vendorId, deviceId) || |
| gpu_info::IsIntelGen12HP(vendorId, deviceId)) { |
| deviceToggles->Default(Toggle::D3D12DontSetClearValueOnDepthTextureCreation, true); |
| } |
| |
| // Currently this workaround is needed on any D3D12 backend for some particular situations. |
| // But we may need to limit it if D3D12 runtime fixes the bug on its new release. See |
| // https://crbug.com/dawn/1289 for more information. |
| // TODO(dawn:1289): Unset this toggle when we skip the split on the buffer-texture copy |
| // on the platforms where UnrestrictedBufferTextureCopyPitchSupported is true. |
| deviceToggles->Default(Toggle::D3D12SplitBufferTextureCopyForRowsPerImagePaddings, true); |
| |
| // This workaround is only needed on Intel Gen12LP with driver prior to 30.0.101.1692. |
| // See http://crbug.com/dawn/949 for more information. |
| if (gpu_info::IsIntelGen12LP(vendorId, deviceId)) { |
| const gpu_info::DriverVersion kFixedDriverVersion = {30, 0, 101, 1692}; |
| if (gpu_info::CompareWindowsDriverVersion(vendorId, GetDriverVersion(), |
| kFixedDriverVersion) == -1) { |
| deviceToggles->Default(Toggle::D3D12AllocateExtraMemoryFor2DArrayColorTexture, true); |
| } |
| } |
| |
| // This workaround is needed on Intel Gen12LP GPUs with driver >= 30.0.101.4091. |
| // See http://crbug.com/dawn/1083 for more information. |
| if (gpu_info::IsIntelGen12LP(vendorId, deviceId)) { |
| const gpu_info::DriverVersion kDriverVersion = {30, 0, 101, 4091}; |
| if (gpu_info::CompareWindowsDriverVersion(vendorId, GetDriverVersion(), kDriverVersion) != |
| -1) { |
| deviceToggles->Default(Toggle::UseBlitForDepthTextureToTextureCopyToNonzeroSubresource, |
| true); |
| } |
| } |
| |
| // D3D driver has a bug resolving overlapping queries to a same buffer on Intel Gen12 GPUs. This |
| // workaround is needed on the driver version >= 30.0.101.3413. |
| // TODO(crbug.com/dawn/1546): Remove the workaround when the bug is fixed in D3D driver. |
| if (gpu_info::IsIntelGen12LP(vendorId, deviceId) || |
| gpu_info::IsIntelGen12HP(vendorId, deviceId)) { |
| const gpu_info::DriverVersion kDriverVersion = {30, 0, 101, 3413}; |
| if (gpu_info::CompareWindowsDriverVersion(vendorId, GetDriverVersion(), kDriverVersion) != |
| -1) { |
| deviceToggles->Default(Toggle::ClearBufferBeforeResolveQueries, true); |
| } |
| } |
| |
| // Currently these workarounds are only needed on Intel Gen9.5 and Gen11 GPUs. |
| // See http://crbug.com/1237175 and http://crbug.com/dawn/1628 for more information. |
| if ((gpu_info::IsIntelGen9(vendorId, deviceId) && !gpu_info::IsSkylake(deviceId)) || |
| gpu_info::IsIntelGen11(vendorId, deviceId)) { |
| deviceToggles->Default( |
| Toggle::DisableSubAllocationFor2DTextureWithCopyDstOrRenderAttachment, true); |
| // Now we don't need to force clearing depth stencil textures with CopyDst as all the depth |
| // stencil textures (can only be 2D textures) will be created with CreateCommittedResource() |
| // instead of CreatePlacedResource(). |
| deviceToggles->Default(Toggle::D3D12ForceClearCopyableDepthStencilTextureOnCreation, false); |
| } |
| |
| // Currently this toggle is only needed on Intel Gen9 and Gen9.5 GPUs. |
| // See http://crbug.com/dawn/1579 for more information. |
| if (gpu_info::IsIntelGen9(vendorId, deviceId)) { |
| const gpu_info::DriverVersion kFixedDriverVersion = {31, 0, 101, 2121}; |
| if (gpu_info::CompareWindowsDriverVersion(vendorId, GetDriverVersion(), |
| kFixedDriverVersion) < 0) { |
| // We can add workaround when the blending operation is "Add", DstFactor is "Zero" and |
| // SrcFactor is "DstAlpha". |
| deviceToggles->ForceSet( |
| Toggle::D3D12ReplaceAddWithMinusWhenDstFactorIsZeroAndSrcFactorIsDstAlpha, true); |
| |
| // Unfortunately we cannot add workaround for other cases. |
| deviceToggles->ForceSet( |
| Toggle::NoWorkaroundDstAlphaAsSrcBlendFactorForBothColorAndAlphaDoesNotWork, true); |
| } |
| } |
| |
| #if D3D12_SDK_VERSION >= 602 |
| D3D12_FEATURE_DATA_D3D12_OPTIONS13 featureData13; |
| if (FAILED(mD3d12Device->CheckFeatureSupport(D3D12_FEATURE_D3D12_OPTIONS13, &featureData13, |
| sizeof(featureData13)))) { |
| // If the platform doesn't support D3D12_FEATURE_D3D12_OPTIONS13, default initialize the |
| // struct to set all features to false. |
| featureData13 = {}; |
| } |
| if (!featureData13.TextureCopyBetweenDimensionsSupported) |
| #endif |
| { |
| deviceToggles->ForceSet( |
| Toggle::D3D12UseTempBufferInTextureToTextureCopyBetweenDifferentDimensions, true); |
| } |
| |
| // Polyfill reflect builtin for vec2<f32> on Intel device in usng FXC. |
| // See https://crbug.com/tint/1798 for more information. |
| if (gpu_info::IsIntel(vendorId) && !deviceToggles->IsEnabled(Toggle::UseDXC)) { |
| deviceToggles->Default(Toggle::D3D12PolyfillReflectVec2F32, true); |
| } |
| } |
| |
| ResultOrError<Ref<DeviceBase>> PhysicalDevice::CreateDeviceImpl(AdapterBase* adapter, |
| const DeviceDescriptor* descriptor, |
| const TogglesState& deviceToggles) { |
| return Device::Create(adapter, descriptor, deviceToggles); |
| } |
| |
| // Resets the backend device and creates a new one. If any D3D12 objects belonging to the |
| // current ID3D12Device have not been destroyed, a non-zero value will be returned upon Reset() |
| // and the subequent call to CreateDevice will return a handle the existing device instead of |
| // creating a new one. |
| MaybeError PhysicalDevice::ResetInternalDeviceForTestingImpl() { |
| [[maybe_unused]] auto refCount = mD3d12Device.Reset(); |
| ASSERT(refCount == 0); |
| DAWN_TRY(Initialize()); |
| |
| return {}; |
| } |
| |
| } // namespace dawn::native::d3d12 |