6393399758
The performance save is not worth accidental usage support. Also remove unnecessary copies from the shmem paths.
345 lines
7.5 KiB
C++
345 lines
7.5 KiB
C++
#include <windows.h>
|
|
#include "graphics-hook.h"
|
|
|
|
#if COMPILE_D3D12_HOOK
|
|
|
|
#include <d3d11on12.h>
|
|
#include <d3d12.h>
|
|
#include <dxgi1_4.h>
|
|
|
|
#include "dxgi-helpers.hpp"
|
|
#include "../funchook.h"
|
|
|
|
#define MAX_BACKBUFFERS 8
|
|
|
|
struct d3d12_data {
|
|
ID3D12Device *device; /* do not release */
|
|
uint32_t cx;
|
|
uint32_t cy;
|
|
DXGI_FORMAT format;
|
|
bool using_shtex;
|
|
bool multisampled;
|
|
bool dxgi_1_4;
|
|
|
|
ID3D11Device *device11;
|
|
ID3D11DeviceContext *context11;
|
|
ID3D11On12Device *device11on12;
|
|
|
|
union {
|
|
struct {
|
|
struct shtex_data *shtex_info;
|
|
ID3D11Resource *backbuffer11[MAX_BACKBUFFERS];
|
|
UINT backbuffer_count;
|
|
UINT cur_backbuffer;
|
|
ID3D11Texture2D *copy_tex;
|
|
HANDLE handle;
|
|
};
|
|
};
|
|
};
|
|
|
|
static struct d3d12_data data = {};
|
|
|
|
void d3d12_free(void)
|
|
{
|
|
if (data.copy_tex)
|
|
data.copy_tex->Release();
|
|
for (size_t i = 0; i < data.backbuffer_count; i++) {
|
|
if (data.backbuffer11[i])
|
|
data.backbuffer11[i]->Release();
|
|
}
|
|
if (data.device11)
|
|
data.device11->Release();
|
|
if (data.context11)
|
|
data.context11->Release();
|
|
if (data.device11on12)
|
|
data.device11on12->Release();
|
|
|
|
capture_free();
|
|
|
|
memset(&data, 0, sizeof(data));
|
|
|
|
hlog("----------------- d3d12 capture freed ----------------");
|
|
}
|
|
|
|
struct bb_info {
|
|
ID3D12Resource *backbuffer[MAX_BACKBUFFERS];
|
|
UINT count;
|
|
};
|
|
|
|
static bool create_d3d12_tex(bb_info &bb)
|
|
{
|
|
D3D11_RESOURCE_FLAGS rf11 = {};
|
|
HRESULT hr;
|
|
|
|
if (!bb.count)
|
|
return false;
|
|
|
|
data.backbuffer_count = bb.count;
|
|
|
|
for (UINT i = 0; i < bb.count; i++) {
|
|
hr = data.device11on12->CreateWrappedResource(
|
|
bb.backbuffer[i], &rf11,
|
|
D3D12_RESOURCE_STATE_COPY_SOURCE,
|
|
D3D12_RESOURCE_STATE_PRESENT, __uuidof(ID3D11Resource),
|
|
(void **)&data.backbuffer11[i]);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("create_d3d12_tex: failed to create "
|
|
"backbuffer11",
|
|
hr);
|
|
return false;
|
|
}
|
|
}
|
|
|
|
D3D11_TEXTURE2D_DESC desc11 = {};
|
|
desc11.Width = data.cx;
|
|
desc11.Height = data.cy;
|
|
desc11.MipLevels = 1;
|
|
desc11.ArraySize = 1;
|
|
desc11.Format = data.format;
|
|
desc11.SampleDesc.Count = 1;
|
|
desc11.BindFlags = D3D11_BIND_SHADER_RESOURCE;
|
|
desc11.MiscFlags = D3D11_RESOURCE_MISC_SHARED;
|
|
|
|
hr = data.device11->CreateTexture2D(&desc11, nullptr, &data.copy_tex);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("create_d3d12_tex: creation of d3d11 copy tex failed",
|
|
hr);
|
|
return false;
|
|
}
|
|
|
|
for (UINT i = 0; i < bb.count; i++) {
|
|
data.device11on12->ReleaseWrappedResources(
|
|
&data.backbuffer11[i], 1);
|
|
}
|
|
|
|
IDXGIResource *dxgi_res;
|
|
hr = data.copy_tex->QueryInterface(__uuidof(IDXGIResource),
|
|
(void **)&dxgi_res);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("create_d3d12_tex: failed to query "
|
|
"IDXGIResource interface from texture",
|
|
hr);
|
|
return false;
|
|
}
|
|
|
|
hr = dxgi_res->GetSharedHandle(&data.handle);
|
|
dxgi_res->Release();
|
|
if (FAILED(hr)) {
|
|
hlog_hr("create_d3d12_tex: failed to get shared handle", hr);
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
typedef PFN_D3D11ON12_CREATE_DEVICE create_11_on_12_t;
|
|
|
|
static bool d3d12_init_11on12(void)
|
|
{
|
|
static HMODULE d3d11 = nullptr;
|
|
static create_11_on_12_t create_11_on_12 = nullptr;
|
|
static bool initialized_11 = false;
|
|
static bool initialized_func = false;
|
|
HRESULT hr;
|
|
|
|
if (!initialized_11 && !d3d11) {
|
|
d3d11 = load_system_library("d3d11.dll");
|
|
if (!d3d11) {
|
|
hlog("d3d12_init_11on12: failed to load d3d11");
|
|
}
|
|
initialized_11 = true;
|
|
}
|
|
|
|
if (!d3d11) {
|
|
return false;
|
|
}
|
|
|
|
if (!initialized_func && !create_11_on_12) {
|
|
create_11_on_12 = (create_11_on_12_t)GetProcAddress(
|
|
d3d11, "D3D11On12CreateDevice");
|
|
if (!create_11_on_12) {
|
|
hlog("d3d12_init_11on12: Failed to get "
|
|
"D3D11On12CreateDevice address");
|
|
}
|
|
|
|
initialized_func = true;
|
|
}
|
|
|
|
if (!create_11_on_12) {
|
|
return false;
|
|
}
|
|
|
|
hr = create_11_on_12(data.device, 0, nullptr, 0, nullptr, 0, 0,
|
|
&data.device11, &data.context11, nullptr);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("d3d12_init_11on12: failed to create 11 device", hr);
|
|
return false;
|
|
}
|
|
|
|
data.device11->QueryInterface(__uuidof(ID3D11On12Device),
|
|
(void **)&data.device11on12);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("d3d12_init_11on12: failed to query 11on12 device", hr);
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static bool d3d12_shtex_init(HWND window, bb_info &bb)
|
|
{
|
|
if (!d3d12_init_11on12()) {
|
|
return false;
|
|
}
|
|
if (!create_d3d12_tex(bb)) {
|
|
return false;
|
|
}
|
|
if (!capture_init_shtex(&data.shtex_info, window, data.cx, data.cy,
|
|
data.format, false, (uintptr_t)data.handle)) {
|
|
return false;
|
|
}
|
|
|
|
hlog("d3d12 shared texture capture successful");
|
|
return true;
|
|
}
|
|
|
|
static inline bool d3d12_init_format(IDXGISwapChain *swap, HWND &window,
|
|
bb_info &bb)
|
|
{
|
|
DXGI_SWAP_CHAIN_DESC desc;
|
|
IDXGISwapChain3 *swap3;
|
|
HRESULT hr;
|
|
|
|
hr = swap->GetDesc(&desc);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("d3d12_init_format: swap->GetDesc failed", hr);
|
|
return false;
|
|
}
|
|
|
|
data.format = fix_dxgi_format(desc.BufferDesc.Format);
|
|
data.multisampled = desc.SampleDesc.Count > 1;
|
|
window = desc.OutputWindow;
|
|
data.cx = desc.BufferDesc.Width;
|
|
data.cy = desc.BufferDesc.Height;
|
|
|
|
hr = swap->QueryInterface(__uuidof(IDXGISwapChain3), (void **)&swap3);
|
|
if (SUCCEEDED(hr)) {
|
|
data.dxgi_1_4 = true;
|
|
hlog("We're DXGI1.4 boys!");
|
|
swap3->Release();
|
|
}
|
|
|
|
hlog("Buffer count: %d, swap effect: %d", (int)desc.BufferCount,
|
|
(int)desc.SwapEffect);
|
|
|
|
bb.count = desc.SwapEffect == DXGI_SWAP_EFFECT_DISCARD
|
|
? 1
|
|
: desc.BufferCount;
|
|
|
|
if (bb.count == 1)
|
|
data.dxgi_1_4 = false;
|
|
|
|
if (bb.count > MAX_BACKBUFFERS) {
|
|
hlog("Somehow it's using more than the max backbuffers. "
|
|
"Not sure why anyone would do that.");
|
|
bb.count = 1;
|
|
data.dxgi_1_4 = false;
|
|
}
|
|
|
|
for (UINT i = 0; i < bb.count; i++) {
|
|
hr = swap->GetBuffer(i, __uuidof(ID3D12Resource),
|
|
(void **)&bb.backbuffer[i]);
|
|
if (SUCCEEDED(hr)) {
|
|
bb.backbuffer[i]->Release();
|
|
} else {
|
|
return false;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static void d3d12_init(IDXGISwapChain *swap)
|
|
{
|
|
bb_info bb = {};
|
|
HWND window;
|
|
HRESULT hr;
|
|
|
|
hr = swap->GetDevice(__uuidof(ID3D12Device), (void **)&data.device);
|
|
if (FAILED(hr)) {
|
|
hlog_hr("d3d12_init: failed to get device from swap", hr);
|
|
return;
|
|
}
|
|
|
|
data.device->Release();
|
|
|
|
if (!d3d12_init_format(swap, window, bb)) {
|
|
return;
|
|
}
|
|
|
|
if (global_hook_info->force_shmem) {
|
|
hlog("d3d12_init: shared memory capture currently "
|
|
"unsupported; ignoring");
|
|
}
|
|
|
|
if (!d3d12_shtex_init(window, bb))
|
|
d3d12_free();
|
|
}
|
|
|
|
static inline void d3d12_copy_texture(ID3D11Resource *dst, ID3D11Resource *src)
|
|
{
|
|
if (data.multisampled) {
|
|
data.context11->ResolveSubresource(dst, 0, src, 0, data.format);
|
|
} else {
|
|
data.context11->CopyResource(dst, src);
|
|
}
|
|
}
|
|
|
|
static inline void d3d12_shtex_capture(IDXGISwapChain *swap,
|
|
bool capture_overlay)
|
|
{
|
|
bool dxgi_1_4 = data.dxgi_1_4;
|
|
UINT cur_idx;
|
|
|
|
if (dxgi_1_4) {
|
|
IDXGISwapChain3 *swap3 =
|
|
reinterpret_cast<IDXGISwapChain3 *>(swap);
|
|
cur_idx = swap3->GetCurrentBackBufferIndex();
|
|
if (!capture_overlay) {
|
|
if (++cur_idx >= data.backbuffer_count)
|
|
cur_idx = 0;
|
|
}
|
|
} else {
|
|
cur_idx = data.cur_backbuffer;
|
|
}
|
|
|
|
ID3D11Resource *backbuffer = data.backbuffer11[cur_idx];
|
|
|
|
data.device11on12->AcquireWrappedResources(&backbuffer, 1);
|
|
d3d12_copy_texture(data.copy_tex, backbuffer);
|
|
data.device11on12->ReleaseWrappedResources(&backbuffer, 1);
|
|
data.context11->Flush();
|
|
|
|
if (!dxgi_1_4) {
|
|
if (++data.cur_backbuffer >= data.backbuffer_count)
|
|
data.cur_backbuffer = 0;
|
|
}
|
|
}
|
|
|
|
void d3d12_capture(void *swap_ptr, void *, bool capture_overlay)
|
|
{
|
|
IDXGISwapChain *swap = (IDXGISwapChain *)swap_ptr;
|
|
|
|
if (capture_should_stop()) {
|
|
d3d12_free();
|
|
}
|
|
if (capture_should_init()) {
|
|
d3d12_init(swap);
|
|
}
|
|
if (capture_ready()) {
|
|
d3d12_shtex_capture(swap, capture_overlay);
|
|
}
|
|
}
|
|
|
|
#endif
|