obs-studio/plugins/obs-qsv11/QSV_Encoder.cpp

414 lines
11 KiB
C++

/*
This file is provided under a dual BSD/GPLv2 license. When using or
redistributing this file, you may do so under either license.
GPL LICENSE SUMMARY
Copyright(c) Oct. 2015 Intel Corporation.
This program is free software; you can redistribute it and/or modify
it under the terms of version 2 of the GNU General Public License as
published by the Free Software Foundation.
This program is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
General Public License for more details.
Contact Information:
Seung-Woo Kim, seung-woo.kim@intel.com
705 5th Ave S #500, Seattle, WA 98104
BSD LICENSE
Copyright(c) <date> Intel Corporation.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:
* Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in
the documentation and/or other materials provided with the
distribution.
* Neither the name of Intel Corporation nor the names of its
contributors may be used to endorse or promote products derived
from this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
// QSV_Encoder.cpp : Defines the exported functions for the DLL application.
//
#include "QSV_Encoder.h"
#include "QSV_Encoder_Internal.h"
#include <obs-module.h>
#include <string>
#include <atomic>
#include <intrin.h>
#include <d3d11.h>
#include <dxgi1_2.h>
// Logging helper for this file: forwards to blog() with every message
// prefixed by "[qsv encoder: 'msdk_impl'] ". `format` must be a string
// literal because it is concatenated onto the prefix at compile time;
// `##__VA_ARGS__` drops the trailing comma when no extra arguments are given.
#define do_log(level, format, ...) \
blog(level, "[qsv encoder: '%s'] " format, "msdk_impl", ##__VA_ARGS__)
// Media SDK implementation handed to each new QSV_Encoder_Internal.
// qsv_encoder_open() overwrites it when prefer_igpu_enc() reports true,
// and the new value persists for later opens.
mfxIMPL impl = MFX_IMPL_HARDWARE_ANY;
// API version passed to the encoder and reported by qsv_encoder_version().
// NOTE(review): the field order behind {{0, 1}} is defined in the Media SDK
// headers, not here - presumably Minor = 0, Major = 1; confirm.
mfxVersion ver = {{0, 1}}; // for backward compatibility
// Cleared (set to false) in this file whenever an encoder is destroyed.
// Whatever sets it to true is not visible in this file.
std::atomic<bool> is_active{false};
bool prefer_igpu_enc(int *iGPUIndex)
{
IDXGIAdapter *pAdapter;
int adapterIndex = 0;
bool hasIGPU = false;
bool hasDGPU = false;
bool isDG1Primary = false;
HMODULE hDXGI = LoadLibrary(L"dxgi.dll");
if (hDXGI == NULL) {
return false;
}
typedef HRESULT(WINAPI * LPCREATEDXGIFACTORY)(REFIID riid,
void **ppFactory);
LPCREATEDXGIFACTORY pCreateDXGIFactory =
(LPCREATEDXGIFACTORY)GetProcAddress(hDXGI,
"CreateDXGIFactory1");
if (pCreateDXGIFactory == NULL) {
pCreateDXGIFactory = (LPCREATEDXGIFACTORY)GetProcAddress(
hDXGI, "CreateDXGIFactory");
if (pCreateDXGIFactory == NULL) {
FreeLibrary(hDXGI);
return false;
}
}
IDXGIFactory *pFactory = NULL;
if (FAILED((*pCreateDXGIFactory)(__uuidof(IDXGIFactory),
(void **)(&pFactory)))) {
FreeLibrary(hDXGI);
return false;
}
while (SUCCEEDED(pFactory->EnumAdapters(adapterIndex, &pAdapter))) {
DXGI_ADAPTER_DESC AdapterDesc = {};
if (SUCCEEDED(pAdapter->GetDesc(&AdapterDesc))) {
if (AdapterDesc.VendorId == 0x8086) {
if (AdapterDesc.DedicatedVideoMemory <=
512 * 1024 * 1024) {
hasIGPU = true;
if (iGPUIndex != NULL) {
*iGPUIndex = adapterIndex;
}
} else {
hasDGPU = true;
}
if ((AdapterDesc.DeviceId == 0x4905) ||
(AdapterDesc.DeviceId == 0x4906) ||
(AdapterDesc.DeviceId == 0x4907)) {
if (adapterIndex == 0) {
isDG1Primary = true;
}
}
}
}
adapterIndex++;
pAdapter->Release();
}
pFactory->Release();
FreeLibrary(hDXGI);
return hasIGPU && hasDGPU && isDG1Primary;
}
void qsv_encoder_version(unsigned short *major, unsigned short *minor)
{
*major = ver.Major;
*minor = ver.Minor;
}
/*
 * Creates a QSV_Encoder_Internal and opens it with the supplied parameters.
 *
 * When prefer_igpu_enc() reports true, the file-level `impl` global is
 * switched to the MFX_IMPL_HARDWARE* entry matching the reported adapter
 * index before the encoder is constructed (the change persists for later
 * calls). An index outside the table leaves `impl` unchanged.
 *
 * pParams: encoder configuration, forwarded to QSV_Encoder_Internal::Open().
 *
 * Returns the encoder as an opaque qsv_t handle, or NULL if Open() did not
 * return MFX_ERR_NONE. On failure the status is logged as a warning, the
 * encoder is destroyed and `is_active` is cleared.
 */
qsv_t *qsv_encoder_open(qsv_param_t *pParams)
{
	mfxIMPL impl_list[4] = {MFX_IMPL_HARDWARE, MFX_IMPL_HARDWARE2,
				MFX_IMPL_HARDWARE3, MFX_IMPL_HARDWARE4};
	const int impl_count =
		(int)(sizeof(impl_list) / sizeof(impl_list[0]));

	int igpu_index = -1;
	if (prefer_igpu_enc(&igpu_index)) {
		// The adapter index comes from DXGI enumeration and is not
		// bounded by the size of impl_list, so validate it first.
		if (igpu_index >= 0 && igpu_index < impl_count)
			impl = impl_list[igpu_index];
	}

	QSV_Encoder_Internal *pEncoder = new QSV_Encoder_Internal(impl, ver);
	mfxStatus sts = pEncoder->Open(pParams);

	if (sts != MFX_ERR_NONE) {
#define WARN_ERR_IMPL(err, str, err_name)                   \
	case err:                                           \
		do_log(LOG_WARNING, str " (" err_name ")"); \
		break;
#define WARN_ERR(err, str) WARN_ERR_IMPL(err, str, #err)

		switch (sts) {
			WARN_ERR(MFX_ERR_UNKNOWN, "Unknown QSV error");
			WARN_ERR(
				MFX_ERR_NOT_INITIALIZED,
				"Member functions called without initialization");
			WARN_ERR(MFX_ERR_INVALID_HANDLE,
				 "Invalid session or MemId handle");
			WARN_ERR(
				MFX_ERR_NULL_PTR,
				"NULL pointer in the input or output arguments");
			WARN_ERR(MFX_ERR_UNDEFINED_BEHAVIOR,
				 "Undefined behavior");
			WARN_ERR(MFX_ERR_NOT_ENOUGH_BUFFER,
				 "Insufficient buffer for input or output.");
			WARN_ERR(MFX_ERR_NOT_FOUND,
				 "Specified object/item/sync point not found.");
			WARN_ERR(MFX_ERR_MEMORY_ALLOC,
				 "Failed to allocate memory");
			WARN_ERR(MFX_ERR_LOCK_MEMORY,
				 "failed to lock the memory block "
				 "(external allocator).");
			WARN_ERR(
				MFX_ERR_UNSUPPORTED,
				"Unsupported configurations, parameters, or features");
			WARN_ERR(MFX_ERR_INVALID_VIDEO_PARAM,
				 "Incompatible video parameters detected");
			WARN_ERR(
				MFX_WRN_VIDEO_PARAM_CHANGED,
				"The decoder detected a new sequence header in the "
				"bitstream. Video parameters may have changed.");
			WARN_ERR(
				MFX_WRN_VALUE_NOT_CHANGED,
				"The parameter has been clipped to its value range");
			WARN_ERR(MFX_WRN_OUT_OF_RANGE,
				 "The parameter is out of valid value range");
			WARN_ERR(MFX_WRN_INCOMPATIBLE_VIDEO_PARAM,
				 "Incompatible video parameters detected");
			WARN_ERR(
				MFX_WRN_FILTER_SKIPPED,
				"The SDK VPP has skipped one or more optional filters "
				"requested by the application");
			WARN_ERR(MFX_ERR_ABORTED,
				 "The asynchronous operation aborted");
			WARN_ERR(
				MFX_ERR_MORE_DATA,
				"Need more bitstream at decoding input, encoding "
				"input, or video processing input frames");
			WARN_ERR(MFX_ERR_MORE_SURFACE,
				 "Need more frame surfaces at "
				 "decoding or video processing output");
			WARN_ERR(
				MFX_ERR_MORE_BITSTREAM,
				"Need more bitstream buffers at the encoding output");
			WARN_ERR(MFX_WRN_IN_EXECUTION,
				 "Synchronous operation still running");
			WARN_ERR(MFX_ERR_DEVICE_FAILED,
				 "Hardware device returned unexpected errors");
			WARN_ERR(MFX_ERR_DEVICE_LOST,
				 "Hardware device was lost");
			WARN_ERR(MFX_WRN_DEVICE_BUSY,
				 "Hardware device is currently busy");
			WARN_ERR(MFX_WRN_PARTIAL_ACCELERATION,
				 "The hardware does not support the specified "
				 "configuration. Encoding, decoding, or video "
				 "processing may be partially accelerated");
		default:
			// Statuses missing from the table above must not
			// fail silently.
			do_log(LOG_WARNING, "Unrecognized QSV status code %d",
			       (int)sts);
			break;
		}

#undef WARN_ERR
#undef WARN_ERR_IMPL

		// pEncoder came from a throwing `new`, so it is never NULL
		// here; clear the flag without reading the pointer after
		// it has been deleted.
		delete pEncoder;
		is_active.store(false);
		return NULL;
	}

	return (qsv_t *)pEncoder;
}
/*
 * Forwards the four SPS/PPS out-parameters to the encoder's GetSPSPPS().
 *
 * pContext must be a handle produced by qsv_encoder_open(); it is
 * dereferenced without a NULL check. Always returns 0.
 */
int qsv_encoder_headers(qsv_t *pContext, uint8_t **pSPS, uint8_t **pPPS,
			uint16_t *pnSPS, uint16_t *pnPPS)
{
	auto *encoder = (QSV_Encoder_Internal *)pContext;

	encoder->GetSPSPPS(pSPS, pPPS, pnSPS, pnPPS);

	return 0;
}
/*
 * Submits one frame, given as separate Y and UV plane pointers with their
 * strides, to the encoder's Encode().
 *
 * If either plane pointer is NULL, Encode() is not called and the function
 * reports success.
 *
 * Returns 0 on MFX_ERR_NONE, 1 on MFX_ERR_MORE_DATA, -1 on any other status.
 */
int qsv_encoder_encode(qsv_t *pContext, uint64_t ts, uint8_t *pDataY,
		       uint8_t *pDataUV, uint32_t strideY, uint32_t strideUV,
		       mfxBitstream **pBS)
{
	// Nothing to submit: the status stays at its MFX_ERR_NONE default.
	if (pDataY == NULL || pDataUV == NULL)
		return 0;

	auto *encoder = (QSV_Encoder_Internal *)pContext;

	switch (encoder->Encode(ts, pDataY, pDataUV, strideY, strideUV, pBS)) {
	case MFX_ERR_NONE:
		return 0;
	case MFX_ERR_MORE_DATA:
		return 1;
	default:
		return -1;
	}
}
/*
 * Texture-handle variant of qsv_encoder_encode(): forwards the handle and
 * the lock key / next key arguments to the encoder's Encode_tex().
 *
 * Returns 0 on MFX_ERR_NONE, 1 on MFX_ERR_MORE_DATA, -1 on any other status.
 */
int qsv_encoder_encode_tex(qsv_t *pContext, uint64_t ts, uint32_t tex_handle,
			   uint64_t lock_key, uint64_t *next_key,
			   mfxBitstream **pBS)
{
	auto *encoder = (QSV_Encoder_Internal *)pContext;

	switch (encoder->Encode_tex(ts, tex_handle, lock_key, next_key, pBS)) {
	case MFX_ERR_NONE:
		return 0;
	case MFX_ERR_MORE_DATA:
		return 1;
	default:
		return -1;
	}
}
/*
 * Destroys an encoder created by qsv_encoder_open() and clears `is_active`.
 *
 * A NULL handle is accepted: nothing is destroyed and `is_active` is left
 * unchanged. Always returns 0.
 */
int qsv_encoder_close(qsv_t *pContext)
{
	QSV_Encoder_Internal *pEncoder = (QSV_Encoder_Internal *)pContext;

	// Decide before deleting: once deleted, the pointer value is invalid
	// and must not be inspected.
	if (pEncoder == NULL)
		return 0;

	delete pEncoder;
	is_active.store(false);
	return 0;
}
/*
int qsv_param_default_preset(qsv_param_t *pParams, const char *preset,
const char *tune)
{
return 0;
}
int qsv_param_parse(qsv_param_t *, const char *name, const char *value)
{
return 0;
}
int qsv_param_apply_profile(qsv_param_t *, const char *profile)
{
return 0;
}
*/
/*
 * Applies new parameters to a running encoder through its Reset().
 *
 * Returns 0 when Reset() yields MFX_ERR_NONE, -1 for any other status.
 */
int qsv_encoder_reconfig(qsv_t *pContext, qsv_param_t *pParams)
{
	auto *encoder = (QSV_Encoder_Internal *)pContext;
	const bool resetOk = encoder->Reset(pParams) == MFX_ERR_NONE;

	return resetOk ? 0 : -1;
}
/*
 * Classifies the host CPU from CPUID.
 *
 * Returns QSV_CPU_PLATFORM_UNKNOWN when the vendor string is not
 * "GenuineIntel" or the family is not 6. Otherwise returns the platform
 * mapped to the model number, or QSV_CPU_PLATFORM_INTEL for family-6 models
 * that are not in the table.
 */
enum qsv_cpu_platform qsv_get_cpu_platform()
{
	using std::string;

	int cpuInfo[4];

	// Leaf 0: the 12-character vendor string is assembled from array
	// elements 1, 3 and 2, in that order.
	__cpuid(cpuInfo, 0);

	string vendor;
	vendor += string((char *)&cpuInfo[1], 4);
	vendor += string((char *)&cpuInfo[3], 4);
	vendor += string((char *)&cpuInfo[2], 4);

	if (vendor != "GenuineIntel")
		return QSV_CPU_PLATFORM_UNKNOWN;

	// Leaf 1: element 0 carries the family/model signature.
	__cpuid(cpuInfo, 1);
	const unsigned int signature = (unsigned int)cpuInfo[0];

	// Model: base model (bits 4-7) plus extended model (bits 16-19)
	// shifted into the high nibble.
	const unsigned int model = ((signature >> 4) & 0xF) +
				   ((signature >> 12) & 0xF0);

	// Family: base family (bits 8-11) plus extended family (bits 20-27).
	// The sum can exceed 255, so it is kept in a wide type; an 8-bit
	// value would wrap and could compare equal to 6 by accident.
	const unsigned int family = ((signature >> 8) & 0xF) +
				    ((signature >> 20) & 0xFF);

	// See Intel 64 and IA-32 Architectures Software Developer's Manual,
	// Vol 3C Table 35-1
	if (family != 6)
		return QSV_CPU_PLATFORM_UNKNOWN;

	switch (model) {
	case 0x1C:
	case 0x26:
	case 0x27:
	case 0x35:
	case 0x36:
		return QSV_CPU_PLATFORM_BNL;

	case 0x2a:
	case 0x2d:
		return QSV_CPU_PLATFORM_SNB;

	case 0x3a:
	case 0x3e:
		return QSV_CPU_PLATFORM_IVB;

	case 0x37:
	case 0x4A:
	case 0x4D:
	case 0x5A:
	case 0x5D:
		return QSV_CPU_PLATFORM_SLM;

	case 0x4C:
		return QSV_CPU_PLATFORM_CHT;

	case 0x3c:
	case 0x3f:
	case 0x45:
	case 0x46:
		return QSV_CPU_PLATFORM_HSW;

	case 0x3d:
	case 0x47:
	case 0x4f:
	case 0x56:
		return QSV_CPU_PLATFORM_BDW;

	case 0x4e:
	case 0x5e:
		return QSV_CPU_PLATFORM_SKL;

	case 0x5c:
		return QSV_CPU_PLATFORM_APL;

	case 0x8e:
	case 0x9e:
		return QSV_CPU_PLATFORM_KBL;

	case 0x7a:
		return QSV_CPU_PLATFORM_GLK;

	case 0x66:
		return QSV_CPU_PLATFORM_CNL;

	case 0x7d:
	case 0x7e:
		return QSV_CPU_PLATFORM_ICL;
	}

	//assume newer revisions are at least as capable as Haswell
	return QSV_CPU_PLATFORM_INTEL;
}