8614697c59
A mismatch will lead to failure.
441 lines
12 KiB
C++
441 lines
12 KiB
C++
/*
|
|
|
|
This file is provided under a dual BSD/GPLv2 license. When using or
|
|
redistributing this file, you may do so under either license.
|
|
|
|
GPL LICENSE SUMMARY
|
|
|
|
Copyright(c) Oct. 2015 Intel Corporation.
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of version 2 of the GNU General Public License as
|
|
published by the Free Software Foundation.
|
|
|
|
This program is distributed in the hope that it will be useful, but
|
|
WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
General Public License for more details.
|
|
|
|
Contact Information:
|
|
|
|
Seung-Woo Kim, seung-woo.kim@intel.com
|
|
705 5th Ave S #500, Seattle, WA 98104
|
|
|
|
BSD LICENSE
|
|
|
|
Copyright(c) <date> Intel Corporation.
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
modification, are permitted provided that the following conditions
|
|
are met:
|
|
|
|
* Redistributions of source code must retain the above copyright
|
|
notice, this list of conditions and the following disclaimer.
|
|
|
|
* Redistributions in binary form must reproduce the above copyright
|
|
notice, this list of conditions and the following disclaimer in
|
|
the documentation and/or other materials provided with the
|
|
distribution.
|
|
|
|
* Neither the name of Intel Corporation nor the names of its
|
|
contributors may be used to endorse or promote products derived
|
|
from this software without specific prior written permission.
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
// QSV_Encoder.cpp : Defines the exported functions for the DLL application.
|
|
//
|
|
|
|
#include "QSV_Encoder.h"
|
|
#include "QSV_Encoder_Internal.h"
|
|
#include <obs-module.h>
|
|
#include <string>
|
|
#include <atomic>
|
|
#include <intrin.h>
|
|
#include <d3d11.h>
|
|
#include <dxgi1_2.h>
|
|
#include <wrl/client.h>
|
|
|
|
// Logging helper: forwards to blog() after prepending the
// "[qsv encoder: '%s'] " prefix (filled with "msdk_impl") to the caller's
// format string.
#define do_log(level, format, ...) \
|
|
blog(level, "[qsv encoder: '%s'] " format, "msdk_impl", ##__VA_ARGS__)
|
|
|
|
// Media SDK implementation handed to QSV_Encoder_Internal. qsv_encoder_open()
// replaces it with an adapter-specific value when a preferred adapter is found.
mfxIMPL impl = MFX_IMPL_HARDWARE_ANY;
|
|
// API version passed to QSV_Encoder_Internal and reported by
// qsv_encoder_version().
mfxVersion ver = {{0, 1}}; // for backward compatibility
|
|
// Cleared when qsv_encoder_open() fails and when qsv_encoder_close() runs.
// NOTE(review): nothing visible in this file sets it to true - presumably that
// happens elsewhere; confirm.
std::atomic<bool> is_active{false};
|
|
|
|
bool prefer_current_or_igpu_enc(int *iGPUIndex)
|
|
{
|
|
IDXGIAdapter *pAdapter;
|
|
bool hasIGPU = false;
|
|
bool hasDGPU = false;
|
|
bool hasCurrent = false;
|
|
|
|
HMODULE hDXGI = LoadLibrary(L"dxgi.dll");
|
|
if (hDXGI == NULL) {
|
|
return false;
|
|
}
|
|
|
|
typedef HRESULT(WINAPI * LPCREATEDXGIFACTORY)(REFIID riid,
|
|
void **ppFactory);
|
|
|
|
LPCREATEDXGIFACTORY pCreateDXGIFactory =
|
|
(LPCREATEDXGIFACTORY)GetProcAddress(hDXGI,
|
|
"CreateDXGIFactory1");
|
|
if (pCreateDXGIFactory == NULL) {
|
|
pCreateDXGIFactory = (LPCREATEDXGIFACTORY)GetProcAddress(
|
|
hDXGI, "CreateDXGIFactory");
|
|
|
|
if (pCreateDXGIFactory == NULL) {
|
|
FreeLibrary(hDXGI);
|
|
return false;
|
|
}
|
|
}
|
|
|
|
IDXGIFactory *pFactory = NULL;
|
|
if (FAILED((*pCreateDXGIFactory)(__uuidof(IDXGIFactory),
|
|
(void **)(&pFactory)))) {
|
|
FreeLibrary(hDXGI);
|
|
return false;
|
|
}
|
|
|
|
LUID luid;
|
|
bool hasLuid = false;
|
|
obs_enter_graphics();
|
|
{
|
|
ID3D11Device *pDevice = (ID3D11Device *)gs_get_device_obj();
|
|
Microsoft::WRL::ComPtr<IDXGIDevice> dxgiDevice;
|
|
if (SUCCEEDED(pDevice->QueryInterface<IDXGIDevice>(
|
|
dxgiDevice.GetAddressOf()))) {
|
|
Microsoft::WRL::ComPtr<IDXGIAdapter> dxgiAdapter;
|
|
if (SUCCEEDED(dxgiDevice->GetAdapter(
|
|
dxgiAdapter.GetAddressOf()))) {
|
|
DXGI_ADAPTER_DESC desc;
|
|
hasLuid =
|
|
SUCCEEDED(dxgiAdapter->GetDesc(&desc));
|
|
if (hasLuid) {
|
|
luid = desc.AdapterLuid;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
obs_leave_graphics();
|
|
|
|
// Check for i+I cases (Intel discrete + Intel integrated graphics on the same system). Default will be integrated.
|
|
for (int adapterIndex = 0;
|
|
SUCCEEDED(pFactory->EnumAdapters(adapterIndex, &pAdapter));
|
|
++adapterIndex) {
|
|
DXGI_ADAPTER_DESC AdapterDesc = {};
|
|
const HRESULT hr = pAdapter->GetDesc(&AdapterDesc);
|
|
pAdapter->Release();
|
|
|
|
if (SUCCEEDED(hr) && (AdapterDesc.VendorId == 0x8086)) {
|
|
if (hasLuid &&
|
|
(AdapterDesc.AdapterLuid.LowPart == luid.LowPart) &&
|
|
(AdapterDesc.AdapterLuid.HighPart ==
|
|
luid.HighPart)) {
|
|
hasCurrent = true;
|
|
*iGPUIndex = adapterIndex;
|
|
break;
|
|
}
|
|
|
|
if (AdapterDesc.DedicatedVideoMemory <=
|
|
512 * 1024 * 1024) {
|
|
hasIGPU = true;
|
|
if (iGPUIndex != NULL) {
|
|
*iGPUIndex = adapterIndex;
|
|
}
|
|
} else {
|
|
hasDGPU = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
pFactory->Release();
|
|
FreeLibrary(hDXGI);
|
|
|
|
return hasCurrent || (hasIGPU && hasDGPU);
|
|
}
|
|
|
|
void qsv_encoder_version(unsigned short *major, unsigned short *minor)
|
|
{
|
|
*major = ver.Major;
|
|
*minor = ver.Minor;
|
|
}
|
|
|
|
/*
 * Creates a QSV_Encoder_Internal and opens it with the given parameters.
 *
 * When prefer_current_or_igpu_enc() selects an adapter whose index fits in
 * the implementation table, the file-level `impl` is switched to the matching
 * MFX_IMPL_HARDWARE* value before the encoder is constructed.
 *
 * @param pParams  Encoder parameters forwarded to QSV_Encoder_Internal::Open.
 * @return The encoder as an opaque qsv_t handle, or NULL when Open() reports
 *         anything other than MFX_ERR_NONE. On failure a warning describing
 *         the status is logged, the encoder is destroyed and `is_active` is
 *         cleared.
 */
qsv_t *qsv_encoder_open(qsv_param_t *pParams)
{
	const mfxIMPL impl_list[4] = {MFX_IMPL_HARDWARE, MFX_IMPL_HARDWARE2,
				      MFX_IMPL_HARDWARE3, MFX_IMPL_HARDWARE4};
	int igpu_index = -1;
	// Reject negative indices explicitly rather than relying on the
	// signed/unsigned conversion in the bounds comparison.
	if (prefer_current_or_igpu_enc(&igpu_index) && (igpu_index >= 0) &&
	    (igpu_index < static_cast<int>(_countof(impl_list)))) {
		impl = impl_list[igpu_index];
	}

	QSV_Encoder_Internal *pEncoder = new QSV_Encoder_Internal(impl, ver);
	mfxStatus sts = pEncoder->Open(pParams);
	if (sts != MFX_ERR_NONE) {

#define WARN_ERR_IMPL(err, str, err_name)                   \
	case err:                                           \
		do_log(LOG_WARNING, str " (" err_name ")"); \
		break;
#define WARN_ERR(err, str) WARN_ERR_IMPL(err, str, #err)

		switch (sts) {
			WARN_ERR(MFX_ERR_UNKNOWN, "Unknown QSV error");
			WARN_ERR(
				MFX_ERR_NOT_INITIALIZED,
				"Member functions called without initialization");
			WARN_ERR(MFX_ERR_INVALID_HANDLE,
				 "Invalid session or MemId handle");
			WARN_ERR(
				MFX_ERR_NULL_PTR,
				"NULL pointer in the input or output arguments");
			WARN_ERR(MFX_ERR_UNDEFINED_BEHAVIOR,
				 "Undefined behavior");
			WARN_ERR(MFX_ERR_NOT_ENOUGH_BUFFER,
				 "Insufficient buffer for input or output.");
			WARN_ERR(MFX_ERR_NOT_FOUND,
				 "Specified object/item/sync point not found.");
			WARN_ERR(MFX_ERR_MEMORY_ALLOC,
				 "Failed to allocate memory");
			WARN_ERR(MFX_ERR_LOCK_MEMORY,
				 "failed to lock the memory block "
				 "(external allocator).");
			WARN_ERR(
				MFX_ERR_UNSUPPORTED,
				"Unsupported configurations, parameters, or features");
			WARN_ERR(MFX_ERR_INVALID_VIDEO_PARAM,
				 "Incompatible video parameters detected");
			WARN_ERR(
				MFX_WRN_VIDEO_PARAM_CHANGED,
				"The decoder detected a new sequence header in the "
				"bitstream. Video parameters may have changed.");
			WARN_ERR(
				MFX_WRN_VALUE_NOT_CHANGED,
				"The parameter has been clipped to its value range");
			WARN_ERR(MFX_WRN_OUT_OF_RANGE,
				 "The parameter is out of valid value range");
			WARN_ERR(MFX_WRN_INCOMPATIBLE_VIDEO_PARAM,
				 "Incompatible video parameters detected");
			WARN_ERR(
				MFX_WRN_FILTER_SKIPPED,
				"The SDK VPP has skipped one or more optional filters "
				"requested by the application");
			WARN_ERR(MFX_ERR_ABORTED,
				 "The asynchronous operation aborted");
			WARN_ERR(
				MFX_ERR_MORE_DATA,
				"Need more bitstream at decoding input, encoding "
				"input, or video processing input frames");
			WARN_ERR(MFX_ERR_MORE_SURFACE,
				 "Need more frame surfaces at "
				 "decoding or video processing output");
			WARN_ERR(
				MFX_ERR_MORE_BITSTREAM,
				"Need more bitstream buffers at the encoding output");
			WARN_ERR(MFX_WRN_IN_EXECUTION,
				 "Synchronous operation still running");
			WARN_ERR(MFX_ERR_DEVICE_FAILED,
				 "Hardware device returned unexpected errors");
			WARN_ERR(MFX_ERR_DEVICE_LOST,
				 "Hardware device was lost");
			WARN_ERR(MFX_WRN_DEVICE_BUSY,
				 "Hardware device is currently busy");
			WARN_ERR(MFX_WRN_PARTIAL_ACCELERATION,
				 "The hardware does not support the specified "
				 "configuration. Encoding, decoding, or video "
				 "processing may be partially accelerated");
		default:
			// Statuses not listed above would otherwise fail
			// without any trace in the log.
			do_log(LOG_WARNING, "Unrecognized QSV status (%d)",
			       static_cast<int>(sts));
			break;
		}

#undef WARN_ERR
#undef WARN_ERR_IMPL

		// `new` never yields NULL here, so the flag is always cleared
		// once the failed encoder has been destroyed; the pointer is
		// not inspected after the delete.
		delete pEncoder;
		is_active.store(false);
		return NULL;
	}

	return (qsv_t *)pEncoder;
}
|
|
|
|
/*
 * Forwards the SPS/PPS output pointers and their size slots to the encoder's
 * GetSPSPPS(). pContext is used without a NULL check.
 *
 * @return Always 0; whatever GetSPSPPS() returns is not inspected.
 */
int qsv_encoder_headers(qsv_t *pContext, uint8_t **pSPS, uint8_t **pPPS,
			uint16_t *pnSPS, uint16_t *pnPPS)
{
	auto *const encoder = (QSV_Encoder_Internal *)pContext;

	encoder->GetSPSPPS(pSPS, pPPS, pnSPS, pnPPS);
	return 0;
}
|
|
|
|
/*
 * Passes one frame, given as Y and UV plane pointers with their strides, to
 * the encoder's Encode().
 *
 * If either plane pointer is NULL, Encode() is not called and the function
 * reports success.
 *
 * @return 0 for MFX_ERR_NONE, 1 for MFX_ERR_MORE_DATA, -1 for any other
 *         status.
 */
int qsv_encoder_encode(qsv_t *pContext, uint64_t ts, uint8_t *pDataY,
		       uint8_t *pDataUV, uint32_t strideY, uint32_t strideUV,
		       mfxBitstream **pBS)
{
	mfxStatus status = MFX_ERR_NONE;

	if (pDataY && pDataUV) {
		auto *encoder = (QSV_Encoder_Internal *)pContext;
		status = encoder->Encode(ts, pDataY, pDataUV, strideY,
					 strideUV, pBS);
	}

	switch (status) {
	case MFX_ERR_NONE:
		return 0;
	case MFX_ERR_MORE_DATA:
		return 1;
	default:
		return -1;
	}
}
|
|
|
|
/*
 * Passes a texture handle together with its lock key to the encoder's
 * Encode_tex(); next_key and pBS are forwarded unchanged.
 *
 * @return 0 for MFX_ERR_NONE, 1 for MFX_ERR_MORE_DATA, -1 for any other
 *         status.
 */
int qsv_encoder_encode_tex(qsv_t *pContext, uint64_t ts, uint32_t tex_handle,
			   uint64_t lock_key, uint64_t *next_key,
			   mfxBitstream **pBS)
{
	auto *encoder = (QSV_Encoder_Internal *)pContext;
	const mfxStatus status =
		encoder->Encode_tex(ts, tex_handle, lock_key, next_key, pBS);

	if (status == MFX_ERR_NONE)
		return 0;

	return (status == MFX_ERR_MORE_DATA) ? 1 : -1;
}
|
|
|
|
/*
 * Destroys the encoder behind pContext and, when there was one, clears
 * `is_active`.
 *
 * @param pContext  Handle returned by qsv_encoder_open(); NULL is accepted
 *                  and leaves `is_active` untouched.
 * @return Always 0.
 */
int qsv_encoder_close(qsv_t *pContext)
{
	QSV_Encoder_Internal *pEncoder = (QSV_Encoder_Internal *)pContext;

	// Record null-ness up front so the pointer value is not read again
	// once the object has been deleted.
	const bool hadEncoder = (pEncoder != NULL);
	delete pEncoder;

	if (hadEncoder)
		is_active.store(false);

	return 0;
}
|
|
|
|
/*
|
|
int qsv_param_default_preset(qsv_param_t *pParams, const char *preset,
|
|
const char *tune)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
int qsv_param_parse(qsv_param_t *, const char *name, const char *value)
|
|
{
|
|
return 0;
|
|
}
|
|
|
|
int qsv_param_apply_profile(qsv_param_t *, const char *profile)
|
|
{
|
|
return 0;
|
|
}
|
|
*/
|
|
|
|
/*
 * Applies new parameters to an open encoder through its Reset().
 *
 * @return 0 when Reset() reports MFX_ERR_NONE, -1 otherwise.
 */
int qsv_encoder_reconfig(qsv_t *pContext, qsv_param_t *pParams)
{
	auto *encoder = (QSV_Encoder_Internal *)pContext;
	const mfxStatus status = encoder->Reset(pParams);

	return (status == MFX_ERR_NONE) ? 0 : -1;
}
|
|
|
|
enum qsv_cpu_platform qsv_get_cpu_platform()
|
|
{
|
|
using std::string;
|
|
|
|
int cpuInfo[4];
|
|
__cpuid(cpuInfo, 0);
|
|
|
|
string vendor;
|
|
vendor += string((char *)&cpuInfo[1], 4);
|
|
vendor += string((char *)&cpuInfo[3], 4);
|
|
vendor += string((char *)&cpuInfo[2], 4);
|
|
|
|
if (vendor != "GenuineIntel")
|
|
return QSV_CPU_PLATFORM_UNKNOWN;
|
|
|
|
__cpuid(cpuInfo, 1);
|
|
BYTE model = ((cpuInfo[0] >> 4) & 0xF) + ((cpuInfo[0] >> 12) & 0xF0);
|
|
BYTE family = ((cpuInfo[0] >> 8) & 0xF) + ((cpuInfo[0] >> 20) & 0xFF);
|
|
|
|
// See Intel 64 and IA-32 Architectures Software Developer's Manual,
|
|
// Vol 3C Table 35-1
|
|
if (family != 6)
|
|
return QSV_CPU_PLATFORM_UNKNOWN;
|
|
|
|
switch (model) {
|
|
case 0x1C:
|
|
case 0x26:
|
|
case 0x27:
|
|
case 0x35:
|
|
case 0x36:
|
|
return QSV_CPU_PLATFORM_BNL;
|
|
|
|
case 0x2a:
|
|
case 0x2d:
|
|
return QSV_CPU_PLATFORM_SNB;
|
|
|
|
case 0x3a:
|
|
case 0x3e:
|
|
return QSV_CPU_PLATFORM_IVB;
|
|
|
|
case 0x37:
|
|
case 0x4A:
|
|
case 0x4D:
|
|
case 0x5A:
|
|
case 0x5D:
|
|
return QSV_CPU_PLATFORM_SLM;
|
|
|
|
case 0x4C:
|
|
return QSV_CPU_PLATFORM_CHT;
|
|
|
|
case 0x3c:
|
|
case 0x3f:
|
|
case 0x45:
|
|
case 0x46:
|
|
return QSV_CPU_PLATFORM_HSW;
|
|
case 0x3d:
|
|
case 0x47:
|
|
case 0x4f:
|
|
case 0x56:
|
|
return QSV_CPU_PLATFORM_BDW;
|
|
|
|
case 0x4e:
|
|
case 0x5e:
|
|
return QSV_CPU_PLATFORM_SKL;
|
|
case 0x5c:
|
|
return QSV_CPU_PLATFORM_APL;
|
|
case 0x8e:
|
|
case 0x9e:
|
|
return QSV_CPU_PLATFORM_KBL;
|
|
case 0x7a:
|
|
return QSV_CPU_PLATFORM_GLK;
|
|
case 0x66:
|
|
return QSV_CPU_PLATFORM_CNL;
|
|
case 0x7d:
|
|
case 0x7e:
|
|
return QSV_CPU_PLATFORM_ICL;
|
|
}
|
|
|
|
//assume newer revisions are at least as capable as Haswell
|
|
return QSV_CPU_PLATFORM_INTEL;
|
|
}
|