#include "d3d12_host_display.h" #include "common/assert.h" #include "common/d3d11/shader_compiler.h" #include "common/d3d12/context.h" #include "common/d3d12/shader_cache.h" #include "common/d3d12/util.h" #include "common/log.h" #include "common/string_util.h" #include "core/settings.h" #include "display_ps.hlsl.h" #include "display_vs.hlsl.h" #include "frontend-common/postprocessing_shadergen.h" #include "imgui.h" #include "imgui_impl_dx12.h" #include #include Log_SetChannel(D3D12HostDisplay); static constexpr const std::array s_clear_color = {0.0f, 0.0f, 0.0f, 1.0f}; D3D12HostDisplay::D3D12HostDisplay() = default; D3D12HostDisplay::~D3D12HostDisplay() { if (!g_d3d12_context) return; // DestroyRenderSurface() will exec the command list. DestroyRenderSurface(); DestroyResources(); g_d3d12_context->Destroy(); } RenderAPI D3D12HostDisplay::GetRenderAPI() const { return RenderAPI::D3D12; } void* D3D12HostDisplay::GetRenderDevice() const { return g_d3d12_context->GetDevice(); } void* D3D12HostDisplay::GetRenderContext() const { return g_d3d12_context.get(); } bool D3D12HostDisplay::HasRenderDevice() const { return static_cast(g_d3d12_context); } bool D3D12HostDisplay::HasRenderSurface() const { return static_cast(m_swap_chain); } std::unique_ptr D3D12HostDisplay::CreateTexture(u32 width, u32 height, u32 layers, u32 levels, u32 samples, GPUTexture::Format format, const void* data, u32 data_stride, bool dynamic /* = false */) { const DXGI_FORMAT dformat = D3D12::Texture::GetDXGIFormat(format); if (dformat == DXGI_FORMAT_UNKNOWN) return {}; std::unique_ptr tex(std::make_unique()); if (!tex->Create(width, height, layers, levels, samples, dformat, dformat, DXGI_FORMAT_UNKNOWN, DXGI_FORMAT_UNKNOWN, D3D12_RESOURCE_FLAG_NONE)) { return {}; } if (data && !tex->LoadData(0, 0, width, height, data, data_stride)) return {}; return tex; } bool D3D12HostDisplay::BeginTextureUpdate(GPUTexture* texture, u32 width, u32 height, void** out_buffer, u32* out_pitch) { return static_cast(texture)->BeginStreamUpdate(0, 0, width, height, out_buffer, out_pitch); } void D3D12HostDisplay::EndTextureUpdate(GPUTexture* texture, u32 x, u32 y, u32 width, u32 height) { static_cast(texture)->EndStreamUpdate(x, y, width, height); } bool D3D12HostDisplay::UpdateTexture(GPUTexture* texture, u32 x, u32 y, u32 width, u32 height, const void* data, u32 pitch) { return HostDisplay::UpdateTexture(texture, x, y, width, height, data, pitch); } bool D3D12HostDisplay::DownloadTexture(GPUTexture* texture, u32 x, u32 y, u32 width, u32 height, void* out_data, u32 out_data_stride) { const D3D12::Texture* tex = static_cast(texture); if (!m_readback_staging_texture.EnsureSize(width, height, tex->GetDXGIFormat(), false)) return false; const D3D12_RESOURCE_STATES old_state = tex->GetState(); tex->TransitionToState(D3D12_RESOURCE_STATE_COPY_SOURCE); m_readback_staging_texture.CopyFromTexture(tex->GetResource(), 0, x, y, 0, 0, width, height); tex->TransitionToState(old_state); return m_readback_staging_texture.ReadPixels(0, 0, width, height, out_data, out_data_stride); } bool D3D12HostDisplay::SupportsTextureFormat(GPUTexture::Format format) const { const DXGI_FORMAT dfmt = D3D12::Texture::GetDXGIFormat(format); if (dfmt == DXGI_FORMAT_UNKNOWN) return false; return g_d3d12_context->SupportsTextureFormat(dfmt); } bool D3D12HostDisplay::GetHostRefreshRate(float* refresh_rate) { if (m_swap_chain && IsFullscreen()) { DXGI_SWAP_CHAIN_DESC desc; if (SUCCEEDED(m_swap_chain->GetDesc(&desc)) && desc.BufferDesc.RefreshRate.Numerator > 0 && desc.BufferDesc.RefreshRate.Denominator > 0) { Log_InfoPrintf("using fs rr: %u %u", desc.BufferDesc.RefreshRate.Numerator, desc.BufferDesc.RefreshRate.Denominator); *refresh_rate = static_cast(desc.BufferDesc.RefreshRate.Numerator) / static_cast(desc.BufferDesc.RefreshRate.Denominator); return true; } } return HostDisplay::GetHostRefreshRate(refresh_rate); } void D3D12HostDisplay::SetVSync(bool enabled) { m_vsync = enabled; } bool D3D12HostDisplay::CreateRenderDevice(const WindowInfo& wi, std::string_view adapter_name, bool debug_device, bool threaded_presentation) { ComPtr temp_dxgi_factory; #if WINAPI_FAMILY_PARTITION(WINAPI_PARTITION_DESKTOP) HRESULT hr = CreateDXGIFactory(IID_PPV_ARGS(temp_dxgi_factory.GetAddressOf())); #else HRESULT hr = CreateDXGIFactory2(0, IID_PPV_ARGS(temp_dxgi_factory.GetAddressOf())); #endif if (FAILED(hr)) { Log_ErrorPrintf("Failed to create DXGI factory: 0x%08X", hr); return false; } u32 adapter_index; if (!adapter_name.empty()) { AdapterAndModeList adapter_info(GetAdapterAndModeList(temp_dxgi_factory.Get())); for (adapter_index = 0; adapter_index < static_cast(adapter_info.adapter_names.size()); adapter_index++) { if (adapter_name == adapter_info.adapter_names[adapter_index]) break; } if (adapter_index == static_cast(adapter_info.adapter_names.size())) { Log_WarningPrintf("Could not find adapter '%*s', using first (%s)", static_cast(adapter_name.size()), adapter_name.data(), adapter_info.adapter_names[0].c_str()); adapter_index = 0; } } else { Log_InfoPrintf("No adapter selected, using first."); adapter_index = 0; } if (!D3D12::Context::Create(temp_dxgi_factory.Get(), adapter_index, debug_device)) return false; if (FAILED(hr)) { Log_ErrorPrintf("Failed to create D3D device: 0x%08X", hr); return false; } m_dxgi_factory = std::move(temp_dxgi_factory); m_allow_tearing_supported = false; ComPtr dxgi_factory5; hr = m_dxgi_factory.As(&dxgi_factory5); if (SUCCEEDED(hr)) { BOOL allow_tearing_supported = false; hr = dxgi_factory5->CheckFeatureSupport(DXGI_FEATURE_PRESENT_ALLOW_TEARING, &allow_tearing_supported, sizeof(allow_tearing_supported)); if (SUCCEEDED(hr)) m_allow_tearing_supported = (allow_tearing_supported == TRUE); } m_window_info = wi; if (m_window_info.type != WindowInfo::Type::Surfaceless && !CreateSwapChain(nullptr)) { m_window_info = {}; return false; } return true; } bool D3D12HostDisplay::InitializeRenderDevice(std::string_view shader_cache_directory, bool debug_device, bool threaded_presentation) { if (!CreateResources()) return false; return true; } bool D3D12HostDisplay::MakeRenderContextCurrent() { return true; } bool D3D12HostDisplay::DoneRenderContextCurrent() { return true; } bool D3D12HostDisplay::CreateSwapChain(const DXGI_MODE_DESC* fullscreen_mode) { HRESULT hr; #if WINAPI_FAMILY_PARTITION(WINAPI_PARTITION_DESKTOP) if (m_window_info.type != WindowInfo::Type::Win32) return false; const HWND window_hwnd = reinterpret_cast(m_window_info.window_handle); RECT client_rc{}; GetClientRect(window_hwnd, &client_rc); const u32 width = static_cast(client_rc.right - client_rc.left); const u32 height = static_cast(client_rc.bottom - client_rc.top); DXGI_SWAP_CHAIN_DESC swap_chain_desc = {}; swap_chain_desc.BufferDesc.Width = width; swap_chain_desc.BufferDesc.Height = height; swap_chain_desc.BufferDesc.Format = DXGI_FORMAT_R8G8B8A8_UNORM; swap_chain_desc.SampleDesc.Count = 1; swap_chain_desc.BufferCount = 2; swap_chain_desc.BufferUsage = DXGI_USAGE_RENDER_TARGET_OUTPUT; swap_chain_desc.OutputWindow = window_hwnd; swap_chain_desc.Windowed = TRUE; swap_chain_desc.SwapEffect = DXGI_SWAP_EFFECT_FLIP_DISCARD; m_using_allow_tearing = (m_allow_tearing_supported && !fullscreen_mode); if (m_using_allow_tearing) swap_chain_desc.Flags |= DXGI_SWAP_CHAIN_FLAG_ALLOW_TEARING; if (fullscreen_mode) { swap_chain_desc.Flags = DXGI_SWAP_CHAIN_FLAG_ALLOW_MODE_SWITCH; swap_chain_desc.Windowed = FALSE; swap_chain_desc.BufferDesc = *fullscreen_mode; } Log_InfoPrintf("Creating a %dx%d %s swap chain", swap_chain_desc.BufferDesc.Width, swap_chain_desc.BufferDesc.Height, swap_chain_desc.Windowed ? "windowed" : "full-screen"); hr = m_dxgi_factory->CreateSwapChain(g_d3d12_context->GetCommandQueue(), &swap_chain_desc, m_swap_chain.GetAddressOf()); if (FAILED(hr)) { Log_ErrorPrintf("CreateSwapChain failed: 0x%08X", hr); return false; } hr = m_dxgi_factory->MakeWindowAssociation(swap_chain_desc.OutputWindow, DXGI_MWA_NO_WINDOW_CHANGES); if (FAILED(hr)) Log_WarningPrintf("MakeWindowAssociation() to disable ALT+ENTER failed"); #else if (m_window_info.type != WindowInfo::Type::WinRT) return false; ComPtr factory2; hr = m_dxgi_factory.As(&factory2); if (FAILED(hr)) { Log_ErrorPrintf("Failed to get DXGI factory: %08X", hr); return false; } DXGI_SWAP_CHAIN_DESC1 swap_chain_desc = {}; swap_chain_desc.Width = m_window_info.surface_width; swap_chain_desc.Height = m_window_info.surface_height; swap_chain_desc.Format = DXGI_FORMAT_R8G8B8A8_UNORM; swap_chain_desc.SampleDesc.Count = 1; swap_chain_desc.BufferCount = 3; swap_chain_desc.BufferUsage = DXGI_USAGE_RENDER_TARGET_OUTPUT; swap_chain_desc.SwapEffect = DXGI_SWAP_EFFECT_FLIP_DISCARD; m_using_allow_tearing = (m_allow_tearing_supported && !fullscreen_mode); if (m_using_allow_tearing) swap_chain_desc.Flags |= DXGI_SWAP_CHAIN_FLAG_ALLOW_TEARING; ComPtr swap_chain1; hr = factory2->CreateSwapChainForCoreWindow(g_d3d12_context->GetCommandQueue(), static_cast(m_window_info.window_handle), &swap_chain_desc, nullptr, swap_chain1.GetAddressOf()); if (FAILED(hr)) { Log_ErrorPrintf("CreateSwapChainForCoreWindow failed: 0x%08X", hr); return false; } m_swap_chain = swap_chain1; #endif return CreateSwapChainRTV(); } bool D3D12HostDisplay::CreateSwapChainRTV() { DXGI_SWAP_CHAIN_DESC swap_chain_desc; HRESULT hr = m_swap_chain->GetDesc(&swap_chain_desc); if (FAILED(hr)) return false; for (u32 i = 0; i < swap_chain_desc.BufferCount; i++) { ComPtr backbuffer; hr = m_swap_chain->GetBuffer(i, IID_PPV_ARGS(backbuffer.GetAddressOf())); if (FAILED(hr)) { Log_ErrorPrintf("GetBuffer for RTV failed: 0x%08X", hr); return false; } D3D12::Texture tex; if (!tex.Adopt(std::move(backbuffer), DXGI_FORMAT_UNKNOWN, swap_chain_desc.BufferDesc.Format, DXGI_FORMAT_UNKNOWN, D3D12_RESOURCE_STATE_PRESENT)) { return false; } m_swap_chain_buffers.push_back(std::move(tex)); } m_window_info.surface_width = swap_chain_desc.BufferDesc.Width; m_window_info.surface_height = swap_chain_desc.BufferDesc.Height; Log_InfoPrintf("Swap chain buffer size: %ux%u", m_window_info.surface_width, m_window_info.surface_height); if (m_window_info.type == WindowInfo::Type::Win32) { BOOL fullscreen = FALSE; DXGI_SWAP_CHAIN_DESC desc; if (SUCCEEDED(m_swap_chain->GetFullscreenState(&fullscreen, nullptr)) && fullscreen && SUCCEEDED(m_swap_chain->GetDesc(&desc))) { m_window_info.surface_refresh_rate = static_cast(desc.BufferDesc.RefreshRate.Numerator) / static_cast(desc.BufferDesc.RefreshRate.Denominator); } else { m_window_info.surface_refresh_rate = 0.0f; } } m_current_swap_chain_buffer = 0; return true; } void D3D12HostDisplay::DestroySwapChainRTVs() { for (D3D12::Texture& buffer : m_swap_chain_buffers) buffer.Destroy(false); m_swap_chain_buffers.clear(); m_current_swap_chain_buffer = 0; } bool D3D12HostDisplay::ChangeRenderWindow(const WindowInfo& new_wi) { DestroyRenderSurface(); m_window_info = new_wi; return CreateSwapChain(nullptr); } void D3D12HostDisplay::DestroyRenderSurface() { // For some reason if we don't execute the command list here, the swap chain is in use.. not sure where. g_d3d12_context->ExecuteCommandList(true); if (IsFullscreen()) SetFullscreen(false, 0, 0, 0.0f); DestroySwapChainRTVs(); m_swap_chain.Reset(); } void D3D12HostDisplay::ResizeRenderWindow(s32 new_window_width, s32 new_window_height) { if (!m_swap_chain) return; // For some reason if we don't execute the command list here, the swap chain is in use.. not sure where. g_d3d12_context->ExecuteCommandList(true); DestroySwapChainRTVs(); HRESULT hr = m_swap_chain->ResizeBuffers(0, 0, 0, DXGI_FORMAT_UNKNOWN, m_using_allow_tearing ? DXGI_SWAP_CHAIN_FLAG_ALLOW_TEARING : 0); if (FAILED(hr)) Log_ErrorPrintf("ResizeBuffers() failed: 0x%08X", hr); if (!CreateSwapChainRTV()) Panic("Failed to recreate swap chain RTV after resize"); } bool D3D12HostDisplay::SupportsFullscreen() const { return true; } bool D3D12HostDisplay::IsFullscreen() { BOOL is_fullscreen = FALSE; return (m_swap_chain && SUCCEEDED(m_swap_chain->GetFullscreenState(&is_fullscreen, nullptr)) && is_fullscreen); } bool D3D12HostDisplay::SetFullscreen(bool fullscreen, u32 width, u32 height, float refresh_rate) { if (!m_swap_chain) return false; BOOL is_fullscreen = FALSE; HRESULT hr = m_swap_chain->GetFullscreenState(&is_fullscreen, nullptr); if (!fullscreen) { // leaving fullscreen if (is_fullscreen) return SUCCEEDED(m_swap_chain->SetFullscreenState(FALSE, nullptr)); else return true; } IDXGIOutput* output; if (FAILED(hr = m_swap_chain->GetContainingOutput(&output))) return false; DXGI_SWAP_CHAIN_DESC current_desc; hr = m_swap_chain->GetDesc(¤t_desc); if (FAILED(hr)) return false; DXGI_MODE_DESC new_mode = current_desc.BufferDesc; new_mode.Width = width; new_mode.Height = height; new_mode.RefreshRate.Numerator = static_cast(std::floor(refresh_rate * 1000.0f)); new_mode.RefreshRate.Denominator = 1000u; DXGI_MODE_DESC closest_mode; if (FAILED(hr = output->FindClosestMatchingMode(&new_mode, &closest_mode, nullptr)) || new_mode.Format != current_desc.BufferDesc.Format) { Log_ErrorPrintf("Failed to find closest matching mode, hr=%08X", hr); return false; } if (new_mode.Width == current_desc.BufferDesc.Width && new_mode.Height == current_desc.BufferDesc.Width && new_mode.RefreshRate.Numerator == current_desc.BufferDesc.RefreshRate.Numerator && new_mode.RefreshRate.Denominator == current_desc.BufferDesc.RefreshRate.Denominator) { Log_InfoPrintf("Fullscreen mode already set"); return true; } g_d3d12_context->ExecuteCommandList(true); DestroySwapChainRTVs(); m_swap_chain.Reset(); if (!CreateSwapChain(&closest_mode)) { Log_ErrorPrintf("Failed to create a fullscreen swap chain"); if (!CreateSwapChain(nullptr)) Panic("Failed to recreate windowed swap chain"); return false; } return true; } HostDisplay::AdapterAndModeList D3D12HostDisplay::GetAdapterAndModeList() { return GetAdapterAndModeList(m_dxgi_factory.Get()); } bool D3D12HostDisplay::CreateResources() { D3D12::RootSignatureBuilder rsbuilder; rsbuilder.Add32BitConstants(0, 4, D3D12_SHADER_VISIBILITY_VERTEX); rsbuilder.AddDescriptorTable(D3D12_DESCRIPTOR_RANGE_TYPE_SRV, 0, 1, D3D12_SHADER_VISIBILITY_ALL); rsbuilder.AddDescriptorTable(D3D12_DESCRIPTOR_RANGE_TYPE_SAMPLER, 0, 1, D3D12_SHADER_VISIBILITY_ALL); m_display_root_signature = rsbuilder.Create(); if (!m_display_root_signature) return false; rsbuilder.SetInputAssemblerFlag(); rsbuilder.Add32BitConstants(0, FrontendCommon::PostProcessingShader::PUSH_CONSTANT_SIZE_THRESHOLD / sizeof(u32), D3D12_SHADER_VISIBILITY_ALL); rsbuilder.AddDescriptorTable(D3D12_DESCRIPTOR_RANGE_TYPE_SRV, 0, 1, D3D12_SHADER_VISIBILITY_PIXEL); rsbuilder.AddDescriptorTable(D3D12_DESCRIPTOR_RANGE_TYPE_SAMPLER, 0, 1, D3D12_SHADER_VISIBILITY_PIXEL); m_post_processing_root_signature = rsbuilder.Create(); if (!m_post_processing_root_signature) return false; rsbuilder.SetInputAssemblerFlag(); rsbuilder.AddCBVParameter(0, D3D12_SHADER_VISIBILITY_ALL); rsbuilder.AddDescriptorTable(D3D12_DESCRIPTOR_RANGE_TYPE_SRV, 0, 1, D3D12_SHADER_VISIBILITY_PIXEL); rsbuilder.AddDescriptorTable(D3D12_DESCRIPTOR_RANGE_TYPE_SAMPLER, 0, 1, D3D12_SHADER_VISIBILITY_PIXEL); m_post_processing_cb_root_signature = rsbuilder.Create(); if (!m_post_processing_cb_root_signature) return false; D3D12::GraphicsPipelineBuilder gpbuilder; gpbuilder.SetPrimitiveTopologyType(D3D12_PRIMITIVE_TOPOLOGY_TYPE_TRIANGLE); gpbuilder.SetRootSignature(m_display_root_signature.Get()); gpbuilder.SetVertexShader(s_display_vs_bytecode, sizeof(s_display_vs_bytecode)); gpbuilder.SetPixelShader(s_display_ps_bytecode, sizeof(s_display_ps_bytecode)); gpbuilder.SetNoCullRasterizationState(); gpbuilder.SetNoDepthTestState(); gpbuilder.SetNoBlendingState(); gpbuilder.SetRenderTarget(0, DXGI_FORMAT_R8G8B8A8_UNORM); m_display_pipeline = gpbuilder.Create(g_d3d12_context->GetDevice(), false); if (!m_display_pipeline) return false; gpbuilder.SetBlendState(0, true, D3D12_BLEND_SRC_ALPHA, D3D12_BLEND_INV_SRC_ALPHA, D3D12_BLEND_OP_ADD, D3D12_BLEND_ONE, D3D12_BLEND_ZERO, D3D12_BLEND_OP_ADD, D3D12_COLOR_WRITE_ENABLE_ALL); m_software_cursor_pipeline = gpbuilder.Create(g_d3d12_context->GetDevice(), false); if (!m_software_cursor_pipeline) return false; D3D12_SAMPLER_DESC desc = {}; D3D12::SetDefaultSampler(&desc); desc.AddressU = D3D12_TEXTURE_ADDRESS_MODE_WRAP; desc.AddressV = D3D12_TEXTURE_ADDRESS_MODE_WRAP; desc.Filter = D3D12_FILTER_MIN_MAG_MIP_POINT; if (!g_d3d12_context->GetSamplerHeapManager().Allocate(&m_point_sampler)) return false; g_d3d12_context->GetDevice()->CreateSampler(&desc, m_point_sampler.cpu_handle); desc.Filter = D3D12_FILTER_MIN_MAG_LINEAR_MIP_POINT; if (!g_d3d12_context->GetSamplerHeapManager().Allocate(&m_linear_sampler)) return false; g_d3d12_context->GetDevice()->CreateSampler(&desc, m_linear_sampler.cpu_handle); return true; } void D3D12HostDisplay::DestroyResources() { m_post_processing_cbuffer.Destroy(false); m_post_processing_chain.ClearStages(); m_post_processing_input_texture.Destroy(); m_post_processing_stages.clear(); m_post_processing_cb_root_signature.Reset(); m_post_processing_root_signature.Reset(); m_readback_staging_texture.Destroy(false); g_d3d12_context->GetSamplerHeapManager().Free(&m_linear_sampler); g_d3d12_context->GetSamplerHeapManager().Free(&m_point_sampler); m_software_cursor_pipeline.Reset(); m_display_pipeline.Reset(); m_display_root_signature.Reset(); } bool D3D12HostDisplay::CreateImGuiContext() { ImGui::GetIO().DisplaySize.x = static_cast(m_window_info.surface_width); ImGui::GetIO().DisplaySize.y = static_cast(m_window_info.surface_height); return ImGui_ImplDX12_Init(DXGI_FORMAT_R8G8B8A8_UNORM); } void D3D12HostDisplay::DestroyImGuiContext() { g_d3d12_context->WaitForGPUIdle(); ImGui_ImplDX12_Shutdown(); } bool D3D12HostDisplay::UpdateImGuiFontTexture() { return ImGui_ImplDX12_CreateFontsTexture(); } bool D3D12HostDisplay::Render(bool skip_present) { if (skip_present || !m_swap_chain) { if (ImGui::GetCurrentContext()) ImGui::Render(); return false; } D3D12::Texture& swap_chain_buf = m_swap_chain_buffers[m_current_swap_chain_buffer]; m_current_swap_chain_buffer = ((m_current_swap_chain_buffer + 1) % static_cast(m_swap_chain_buffers.size())); ID3D12GraphicsCommandList* cmdlist = g_d3d12_context->GetCommandList(); RenderDisplay(cmdlist, &swap_chain_buf); if (ImGui::GetCurrentContext()) RenderImGui(cmdlist); RenderSoftwareCursor(cmdlist); swap_chain_buf.TransitionToState(D3D12_RESOURCE_STATE_PRESENT); g_d3d12_context->ExecuteCommandList(false); if (!m_vsync && m_using_allow_tearing) m_swap_chain->Present(0, DXGI_PRESENT_ALLOW_TEARING); else m_swap_chain->Present(BoolToUInt32(m_vsync), 0); return true; } bool D3D12HostDisplay::RenderScreenshot(u32 width, u32 height, std::vector* out_pixels, u32* out_stride, GPUTexture::Format* out_format) { static constexpr DXGI_FORMAT format = DXGI_FORMAT_R8G8B8A8_UNORM; static constexpr GPUTexture::Format hdformat = GPUTexture::Format::RGBA8; D3D12::Texture render_texture; if (!render_texture.Create(width, height, 1, 1, 1, format, DXGI_FORMAT_UNKNOWN, format, DXGI_FORMAT_UNKNOWN, D3D12_RESOURCE_FLAG_ALLOW_RENDER_TARGET) || !m_readback_staging_texture.EnsureSize(width, height, format, false)) { return false; } ID3D12GraphicsCommandList* cmdlist = g_d3d12_context->GetCommandList(); const auto [left, top, draw_width, draw_height] = CalculateDrawRect(width, height); if (HasDisplayTexture() && !m_post_processing_chain.IsEmpty()) { ApplyPostProcessingChain(cmdlist, &render_texture, left, top, width, height, static_cast(m_display_texture), m_display_texture_view_x, m_display_texture_view_y, m_display_texture_view_width, m_display_texture_view_height, width, height); } else { render_texture.TransitionToState(D3D12_RESOURCE_STATE_RENDER_TARGET); cmdlist->ClearRenderTargetView(render_texture.GetRTVOrDSVDescriptor(), s_clear_color.data(), 0, nullptr); cmdlist->OMSetRenderTargets(1, &render_texture.GetRTVOrDSVDescriptor().cpu_handle, FALSE, nullptr); if (HasDisplayTexture()) { RenderDisplay(cmdlist, left, top, draw_width, draw_height, static_cast(m_display_texture), m_display_texture_view_x, m_display_texture_view_y, m_display_texture_view_width, m_display_texture_view_height, IsUsingLinearFiltering()); } } cmdlist->OMSetRenderTargets(0, nullptr, FALSE, nullptr); render_texture.TransitionToState(D3D12_RESOURCE_STATE_COPY_SOURCE); m_readback_staging_texture.CopyFromTexture(render_texture, 0, 0, 0, 0, 0, width, height); const u32 stride = sizeof(u32) * width; out_pixels->resize(width * height); *out_stride = stride; *out_format = hdformat; return m_readback_staging_texture.ReadPixels(0, 0, width, height, out_pixels->data(), stride); } bool D3D12HostDisplay::SetGPUTimingEnabled(bool enabled) { g_d3d12_context->SetEnableGPUTiming(enabled); m_gpu_timing_enabled = enabled; return true; } float D3D12HostDisplay::GetAndResetAccumulatedGPUTime() { return g_d3d12_context->GetAndResetAccumulatedGPUTime(); } void D3D12HostDisplay::RenderImGui(ID3D12GraphicsCommandList* cmdlist) { ImGui::Render(); ImGui_ImplDX12_RenderDrawData(ImGui::GetDrawData()); } void D3D12HostDisplay::RenderDisplay(ID3D12GraphicsCommandList* cmdlist, D3D12::Texture* swap_chain_buf) { const auto [left, top, width, height] = CalculateDrawRect(GetWindowWidth(), GetWindowHeight()); if (HasDisplayTexture() && !m_post_processing_chain.IsEmpty()) { ApplyPostProcessingChain(cmdlist, swap_chain_buf, left, top, width, height, static_cast(m_display_texture), m_display_texture_view_x, m_display_texture_view_y, m_display_texture_view_width, m_display_texture_view_height, GetWindowWidth(), GetWindowHeight()); return; } swap_chain_buf->TransitionToState(D3D12_RESOURCE_STATE_RENDER_TARGET); cmdlist->ClearRenderTargetView(swap_chain_buf->GetRTVOrDSVDescriptor(), s_clear_color.data(), 0, nullptr); cmdlist->OMSetRenderTargets(1, &swap_chain_buf->GetRTVOrDSVDescriptor().cpu_handle, FALSE, nullptr); if (!HasDisplayTexture()) return; RenderDisplay(cmdlist, left, top, width, height, static_cast(m_display_texture), m_display_texture_view_x, m_display_texture_view_y, m_display_texture_view_width, m_display_texture_view_height, IsUsingLinearFiltering()); } void D3D12HostDisplay::RenderDisplay(ID3D12GraphicsCommandList* cmdlist, s32 left, s32 top, s32 width, s32 height, D3D12::Texture* texture, s32 texture_view_x, s32 texture_view_y, s32 texture_view_width, s32 texture_view_height, bool linear_filter) { const float position_adjust = linear_filter ? 0.5f : 0.0f; const float size_adjust = linear_filter ? 1.0f : 0.0f; const float uniforms[4] = { (static_cast(texture_view_x) + position_adjust) / static_cast(texture->GetWidth()), (static_cast(texture_view_y) + position_adjust) / static_cast(texture->GetHeight()), (static_cast(texture_view_width) - size_adjust) / static_cast(texture->GetWidth()), (static_cast(texture_view_height) - size_adjust) / static_cast(texture->GetHeight())}; cmdlist->SetGraphicsRootSignature(m_display_root_signature.Get()); cmdlist->SetPipelineState(m_display_pipeline.Get()); cmdlist->SetGraphicsRoot32BitConstants(0, static_cast(std::size(uniforms)), uniforms, 0); cmdlist->SetGraphicsRootDescriptorTable(1, texture->GetSRVDescriptor()); cmdlist->SetGraphicsRootDescriptorTable(2, linear_filter ? m_linear_sampler : m_point_sampler); D3D12::SetViewportAndScissor(cmdlist, left, top, width, height); cmdlist->IASetPrimitiveTopology(D3D_PRIMITIVE_TOPOLOGY_TRIANGLELIST); cmdlist->DrawInstanced(3, 1, 0, 0); } void D3D12HostDisplay::RenderSoftwareCursor(ID3D12GraphicsCommandList* cmdlist) { if (!HasSoftwareCursor()) return; const auto [left, top, width, height] = CalculateSoftwareCursorDrawRect(); RenderSoftwareCursor(cmdlist, left, top, width, height, m_cursor_texture.get()); } void D3D12HostDisplay::RenderSoftwareCursor(ID3D12GraphicsCommandList* cmdlist, s32 left, s32 top, s32 width, s32 height, GPUTexture* texture_handle) { const float uniforms[4] = {0.0f, 0.0f, 1.0f, 1.0f}; cmdlist->SetPipelineState(m_display_pipeline.Get()); cmdlist->SetGraphicsRoot32BitConstants(0, static_cast(std::size(uniforms)), uniforms, 0); cmdlist->SetGraphicsRootDescriptorTable(1, static_cast(texture_handle)->GetRTVOrDSVDescriptor()); cmdlist->SetGraphicsRootDescriptorTable(2, m_linear_sampler); D3D12::SetViewportAndScissor(cmdlist, left, top, width, height); cmdlist->IASetPrimitiveTopology(D3D_PRIMITIVE_TOPOLOGY_TRIANGLELIST); cmdlist->DrawInstanced(3, 1, 0, 0); } HostDisplay::AdapterAndModeList D3D12HostDisplay::StaticGetAdapterAndModeList() { ComPtr dxgi_factory; #if WINAPI_FAMILY_PARTITION(WINAPI_PARTITION_DESKTOP) HRESULT hr = CreateDXGIFactory(IID_PPV_ARGS(dxgi_factory.GetAddressOf())); #else HRESULT hr = CreateDXGIFactory2(0, IID_PPV_ARGS(dxgi_factory.GetAddressOf())); #endif if (FAILED(hr)) return {}; return GetAdapterAndModeList(dxgi_factory.Get()); } HostDisplay::AdapterAndModeList D3D12HostDisplay::GetAdapterAndModeList(IDXGIFactory* dxgi_factory) { AdapterAndModeList adapter_info; ComPtr current_adapter; while (SUCCEEDED(dxgi_factory->EnumAdapters(static_cast(adapter_info.adapter_names.size()), current_adapter.ReleaseAndGetAddressOf()))) { DXGI_ADAPTER_DESC adapter_desc; std::string adapter_name; if (SUCCEEDED(current_adapter->GetDesc(&adapter_desc))) { char adapter_name_buffer[128]; const int name_length = WideCharToMultiByte(CP_UTF8, 0, adapter_desc.Description, static_cast(std::wcslen(adapter_desc.Description)), adapter_name_buffer, countof(adapter_name_buffer), 0, nullptr); if (name_length >= 0) adapter_name.assign(adapter_name_buffer, static_cast(name_length)); else adapter_name.assign("(Unknown)"); } else { adapter_name.assign("(Unknown)"); } if (adapter_info.fullscreen_modes.empty()) { ComPtr output; if (SUCCEEDED(current_adapter->EnumOutputs(0, &output))) { UINT num_modes = 0; if (SUCCEEDED(output->GetDisplayModeList(DXGI_FORMAT_R8G8B8A8_UNORM, 0, &num_modes, nullptr))) { std::vector modes(num_modes); if (SUCCEEDED(output->GetDisplayModeList(DXGI_FORMAT_R8G8B8A8_UNORM, 0, &num_modes, modes.data()))) { for (const DXGI_MODE_DESC& mode : modes) { adapter_info.fullscreen_modes.push_back(StringUtil::StdStringFromFormat( "%u x %u @ %f hz", mode.Width, mode.Height, static_cast(mode.RefreshRate.Numerator) / static_cast(mode.RefreshRate.Denominator))); } } } } } // handle duplicate adapter names if (std::any_of(adapter_info.adapter_names.begin(), adapter_info.adapter_names.end(), [&adapter_name](const std::string& other) { return (adapter_name == other); })) { std::string original_adapter_name = std::move(adapter_name); u32 current_extra = 2; do { adapter_name = StringUtil::StdStringFromFormat("%s (%u)", original_adapter_name.c_str(), current_extra); current_extra++; } while (std::any_of(adapter_info.adapter_names.begin(), adapter_info.adapter_names.end(), [&adapter_name](const std::string& other) { return (adapter_name == other); })); } adapter_info.adapter_names.push_back(std::move(adapter_name)); } return adapter_info; } D3D12HostDisplay::PostProcessingStage::PostProcessingStage(PostProcessingStage&& move) : pipeline(std::move(move.pipeline)), output_texture(std::move(move.output_texture)), uniforms_size(move.uniforms_size) { move.uniforms_size = 0; } D3D12HostDisplay::PostProcessingStage::~PostProcessingStage() { output_texture.Destroy(true); } bool D3D12HostDisplay::SetPostProcessingChain(const std::string_view& config) { g_d3d12_context->ExecuteCommandList(true); if (config.empty()) { m_post_processing_stages.clear(); m_post_processing_chain.ClearStages(); return true; } if (!m_post_processing_chain.CreateFromString(config)) return false; m_post_processing_stages.clear(); D3D12::ShaderCache shader_cache; shader_cache.Open(EmuFolders::Cache, g_d3d12_context->GetFeatureLevel(), g_settings.gpu_use_debug_device); FrontendCommon::PostProcessingShaderGen shadergen(RenderAPI::D3D12, false); bool only_use_push_constants = true; for (u32 i = 0; i < m_post_processing_chain.GetStageCount(); i++) { const FrontendCommon::PostProcessingShader& shader = m_post_processing_chain.GetShaderStage(i); const std::string vs = shadergen.GeneratePostProcessingVertexShader(shader); const std::string ps = shadergen.GeneratePostProcessingFragmentShader(shader); const bool use_push_constants = shader.UsePushConstants(); only_use_push_constants &= use_push_constants; PostProcessingStage stage; stage.uniforms_size = shader.GetUniformsSize(); ComPtr vs_blob(shader_cache.GetVertexShader(vs)); ComPtr ps_blob(shader_cache.GetPixelShader(ps)); if (!vs_blob || !ps_blob) { Log_ErrorPrintf("Failed to compile one or more post-processing shaders, disabling."); m_post_processing_stages.clear(); m_post_processing_chain.ClearStages(); return false; } D3D12::GraphicsPipelineBuilder gpbuilder; gpbuilder.SetVertexShader(vs_blob.Get()); gpbuilder.SetPixelShader(ps_blob.Get()); gpbuilder.SetPrimitiveTopologyType(D3D12_PRIMITIVE_TOPOLOGY_TYPE_TRIANGLE); gpbuilder.SetNoCullRasterizationState(); gpbuilder.SetNoDepthTestState(); gpbuilder.SetNoBlendingState(); gpbuilder.SetRootSignature(use_push_constants ? m_post_processing_root_signature.Get() : m_post_processing_cb_root_signature.Get()); gpbuilder.SetRenderTarget(0, DXGI_FORMAT_R8G8B8A8_UNORM); stage.pipeline = gpbuilder.Create(g_d3d12_context->GetDevice(), shader_cache); if (!stage.pipeline) { Log_ErrorPrintf("Failed to compile one or more post-processing pipelines, disabling."); m_post_processing_stages.clear(); m_post_processing_chain.ClearStages(); return false; } D3D12::SetObjectNameFormatted(stage.pipeline.Get(), "%s Pipeline", shader.GetName().c_str()); m_post_processing_stages.push_back(std::move(stage)); } constexpr u32 UBO_SIZE = 1 * 1024 * 1024; if (!only_use_push_constants && m_post_processing_cbuffer.GetSize() < UBO_SIZE) { if (!m_post_processing_cbuffer.Create(UBO_SIZE)) { Log_ErrorPrintf("Failed to allocate %u byte constant buffer for postprocessing", UBO_SIZE); m_post_processing_stages.clear(); m_post_processing_chain.ClearStages(); return false; } D3D12::SetObjectName(m_post_processing_cbuffer.GetBuffer(), "Post Processing Uniform Buffer"); } m_post_processing_timer.Reset(); return true; } bool D3D12HostDisplay::CheckPostProcessingRenderTargets(u32 target_width, u32 target_height) { DebugAssert(!m_post_processing_stages.empty()); const DXGI_FORMAT tex_format = DXGI_FORMAT_R8G8B8A8_UNORM; const DXGI_FORMAT srv_format = DXGI_FORMAT_R8G8B8A8_UNORM; const DXGI_FORMAT rtv_format = DXGI_FORMAT_R8G8B8A8_UNORM; if (m_post_processing_input_texture.GetWidth() != target_width || m_post_processing_input_texture.GetHeight() != target_height) { if (!m_post_processing_input_texture.Create(target_width, target_height, 1, 1, 1, tex_format, srv_format, rtv_format, DXGI_FORMAT_UNKNOWN, D3D12_RESOURCE_FLAG_ALLOW_RENDER_TARGET)) { return false; } D3D12::SetObjectName(m_post_processing_input_texture.GetResource(), "Post Processing Input Texture"); } const u32 target_count = (static_cast(m_post_processing_stages.size()) - 1); for (u32 i = 0; i < target_count; i++) { PostProcessingStage& pps = m_post_processing_stages[i]; if (pps.output_texture.GetWidth() != target_width || pps.output_texture.GetHeight() != target_height) { if (!pps.output_texture.Create(target_width, target_height, 1, 1, 1, tex_format, srv_format, rtv_format, DXGI_FORMAT_UNKNOWN, D3D12_RESOURCE_FLAG_ALLOW_RENDER_TARGET)) { return false; } D3D12::SetObjectNameFormatted(pps.output_texture.GetResource(), "Post Processing Output Texture %u", i); } } return true; } void D3D12HostDisplay::ApplyPostProcessingChain(ID3D12GraphicsCommandList* cmdlist, D3D12::Texture* final_target, s32 final_left, s32 final_top, s32 final_width, s32 final_height, D3D12::Texture* texture, s32 texture_view_x, s32 texture_view_y, s32 texture_view_width, s32 texture_view_height, u32 target_width, u32 target_height) { if (!CheckPostProcessingRenderTargets(target_width, target_height)) { final_target->TransitionToState(D3D12_RESOURCE_STATE_RENDER_TARGET); cmdlist->ClearRenderTargetView(final_target->GetRTVOrDSVDescriptor(), s_clear_color.data(), 0, nullptr); cmdlist->OMSetRenderTargets(1, &final_target->GetRTVOrDSVDescriptor().cpu_handle, FALSE, nullptr); RenderDisplay(cmdlist, final_left, final_top, final_width, final_height, texture, texture_view_x, texture_view_y, texture_view_width, texture_view_height, IsUsingLinearFiltering()); return; } // downsample/upsample - use same viewport for remainder m_post_processing_input_texture.TransitionToState(D3D12_RESOURCE_STATE_RENDER_TARGET); cmdlist->ClearRenderTargetView(m_post_processing_input_texture.GetRTVOrDSVDescriptor(), s_clear_color.data(), 0, nullptr); cmdlist->OMSetRenderTargets(1, &m_post_processing_input_texture.GetRTVOrDSVDescriptor().cpu_handle, FALSE, nullptr); RenderDisplay(cmdlist, final_left, final_top, final_width, final_height, texture, texture_view_x, texture_view_y, texture_view_width, texture_view_height, IsUsingLinearFiltering()); m_post_processing_input_texture.TransitionToState(D3D12_RESOURCE_STATE_PIXEL_SHADER_RESOURCE); const s32 orig_texture_width = texture_view_width; const s32 orig_texture_height = texture_view_height; texture = &m_post_processing_input_texture; texture_view_x = final_left; texture_view_y = final_top; texture_view_width = final_width; texture_view_height = final_height; const u32 final_stage = static_cast(m_post_processing_stages.size()) - 1u; for (u32 i = 0; i < static_cast(m_post_processing_stages.size()); i++) { PostProcessingStage& pps = m_post_processing_stages[i]; const bool use_push_constants = m_post_processing_chain.GetShaderStage(i).UsePushConstants(); if (use_push_constants) { u8 buffer[FrontendCommon::PostProcessingShader::PUSH_CONSTANT_SIZE_THRESHOLD]; Assert(pps.uniforms_size <= sizeof(buffer)); m_post_processing_chain.GetShaderStage(i).FillUniformBuffer( buffer, texture->GetWidth(), texture->GetHeight(), texture_view_x, texture_view_y, texture_view_width, texture_view_height, GetWindowWidth(), GetWindowHeight(), orig_texture_width, orig_texture_height, static_cast(m_post_processing_timer.GetTimeSeconds())); cmdlist->SetGraphicsRootSignature(m_post_processing_root_signature.Get()); cmdlist->SetGraphicsRoot32BitConstants(0, sizeof(buffer) / sizeof(u32), buffer, 0); } else { if (!m_post_processing_cbuffer.ReserveMemory(pps.uniforms_size, D3D12_CONSTANT_BUFFER_DATA_PLACEMENT_ALIGNMENT)) { Panic("Failed to reserve space in post-processing UBO"); } const u32 offset = m_post_processing_cbuffer.GetCurrentOffset(); m_post_processing_chain.GetShaderStage(i).FillUniformBuffer( m_post_processing_cbuffer.GetCurrentHostPointer(), texture->GetWidth(), texture->GetHeight(), texture_view_x, texture_view_y, texture_view_width, texture_view_height, GetWindowWidth(), GetWindowHeight(), orig_texture_width, orig_texture_height, static_cast(m_post_processing_timer.GetTimeSeconds())); m_post_processing_cbuffer.CommitMemory(pps.uniforms_size); cmdlist->SetGraphicsRootSignature(m_post_processing_cb_root_signature.Get()); cmdlist->SetGraphicsRootConstantBufferView(0, m_post_processing_cbuffer.GetGPUPointer() + offset); } D3D12::Texture* rt = (i != final_stage) ? &pps.output_texture : final_target; rt->TransitionToState(D3D12_RESOURCE_STATE_RENDER_TARGET); cmdlist->ClearRenderTargetView(rt->GetRTVOrDSVDescriptor(), s_clear_color.data(), 0, nullptr); cmdlist->OMSetRenderTargets(1, &rt->GetRTVOrDSVDescriptor().cpu_handle, FALSE, nullptr); cmdlist->SetPipelineState(pps.pipeline.Get()); cmdlist->SetGraphicsRootDescriptorTable(1, texture->GetSRVDescriptor()); cmdlist->SetGraphicsRootDescriptorTable(2, m_point_sampler); cmdlist->IASetPrimitiveTopology(D3D_PRIMITIVE_TOPOLOGY_TRIANGLELIST); cmdlist->DrawInstanced(3, 1, 0, 0); if (i != final_stage) { pps.output_texture.TransitionToState(D3D12_RESOURCE_STATE_PIXEL_SHADER_RESOURCE); texture = &pps.output_texture; } } }