obs-studio/plugins/win-dshow/win-dshow-encoder.cpp
jp9000 4d002f588b (API Change) Remove encoder callback boilerplate
API Changed (in struct obs_encoder_info):
----------------------------------------
bool (*get_audio_info)(void *data, struct audio_convert_info *info);
bool (*get_video_info)(void *data, struct video_scale_info *info);

To:
----------------------------------------
void (*get_audio_info)(void *data, struct audio_convert_info *info);
void (*get_video_info)(void *data, struct video_scale_info *info);

The encoder video/audio information callbacks no longer need to manually
query the libobs video/audio information, that information is now passed
via the parameter, which the callbacks can modify.

The refactor that reduces boilerplate in the encoder video/audio
information callbacks also removes the need for their return values, so
change the return types to void.
2015-04-17 20:17:43 -07:00

368 lines
9.4 KiB
C++

#include <obs-module.h>
#include <obs-avc.h>
#include <util/darray.h>
#include <util/dstr.hpp>
#include "libdshowcapture/dshowcapture.hpp"
using namespace DShow;
using namespace std;
struct DShowEncoder {
obs_encoder_t *context;
VideoEncoder encoder;
VideoEncoderConfig config;
const wchar_t *device;
video_format format;
long long frameInterval;
bool first = true;
DARRAY(uint8_t) firstPacket;
DARRAY(uint8_t) header;
inline DShowEncoder(obs_encoder_t *context_, const wchar_t *device_)
: context(context_),
device(device_)
{
da_init(firstPacket);
da_init(header);
}
inline ~DShowEncoder()
{
da_free(firstPacket);
da_free(header);
}
inline void ParseFirstPacket(const uint8_t *data, size_t size);
inline bool Update(obs_data_t *settings);
inline bool Encode(struct encoder_frame *frame,
struct encoder_packet *packet, bool *received_packet);
};
static const char *GetC985EncoderName(void)
{
return obs_module_text("Encoder.C985");
}
static const char *GetC353EncoderName(void)
{
return obs_module_text("Encoder.C353");
}
static inline void FindDevice(DeviceId &id, const wchar_t *name)
{
vector<DeviceId> devices;
DShow::VideoEncoder::EnumEncoders(devices);
for (const DeviceId &device : devices) {
if (device.name.find(name) != string::npos) {
id = device;
break;
}
}
}
/*
* As far as I can tell the devices only seem to support 1024x768 and 1280x720
* resolutions, so I'm just going to cap it to those resolutions by aspect.
*
* XXX: This should really not be hard-coded. Problem is I don't know how to
* properly query the encoding capabilities of the devices.
*/
static const double standardAspect = 1024.0 / 768.0;
static const double wideAspect = 1280.0 / 720.0;
inline bool DShowEncoder::Update(obs_data_t *settings)
{
DStr deviceName;
DeviceId id;
FindDevice(id, device);
video_t *video = obs_encoder_video(context);
const struct video_output_info *voi = video_output_get_info(video);
int bitrate = (int)obs_data_get_int(settings, "bitrate");
int keyint_sec = (int)obs_data_get_int(settings, "keyint_sec");
int width = (int)obs_encoder_get_width(context);
int height = (int)obs_encoder_get_height(context);
double aspect = double(width) / double(height);
if (keyint_sec == 0)
keyint_sec = 2;
if (fabs(aspect - standardAspect) < fabs(aspect - wideAspect)) {
width = 1024;
height = 768;
} else {
width = 1280;
height = 720;
}
int keyint = keyint_sec * voi->fps_num / voi->fps_den;
frameInterval = voi->fps_den * 10000000 / voi->fps_num;
config.fpsNumerator = voi->fps_num;
config.fpsDenominator = voi->fps_den;
config.bitrate = bitrate;
config.keyframeInterval = keyint;
config.cx = width;
config.cy = height;
config.name = id.name;
config.path = id.path;
first = true;
da_resize(firstPacket, 0);
da_resize(header, 0);
dstr_from_wcs(deviceName, id.name.c_str());
DStr encoder_name;
dstr_from_wcs(encoder_name, config.name.c_str());
blog(LOG_DEBUG, "win-dshow-encoder:\n"
"\tencoder: %s\n"
"\twidth: %d\n"
"\theight: %d\n"
"\tfps_num: %d\n"
"\tfps_den: %d",
deviceName->array,
(int)width,
(int)height,
(int)voi->fps_num,
(int)voi->fps_den);
return encoder.SetConfig(config);
}
static bool UpdateDShowEncoder(void *data, obs_data_t *settings)
{
DShowEncoder *encoder = reinterpret_cast<DShowEncoder*>(data);
if (!obs_encoder_active(encoder->context))
return encoder->Update(settings);
return true;
}
static inline void *CreateDShowEncoder(obs_data_t *settings,
obs_encoder_t *context, const wchar_t *device)
{
DShowEncoder *encoder = nullptr;
try {
encoder = new DShowEncoder(context, device);
UpdateDShowEncoder(encoder, settings);
} catch (const char *error) {
blog(LOG_ERROR, "Could not create DirectShow encoder '%s': %s",
obs_encoder_get_name(context), error);
}
UNUSED_PARAMETER(settings);
return encoder;
}
static void *CreateC985Encoder(obs_data_t *settings, obs_encoder_t *context)
{
return CreateDShowEncoder(settings, context, L"C985");
}
static void *CreateC353Encoder(obs_data_t *settings, obs_encoder_t *context)
{
return CreateDShowEncoder(settings, context, L"C353");
}
static void DestroyDShowEncoder(void *data)
{
delete reinterpret_cast<DShowEncoder*>(data);
}
/* the first packet contains the SPS/PPS (header) NALs, so parse the first
* packet and separate the NALs */
inline void DShowEncoder::ParseFirstPacket(const uint8_t *data, size_t size)
{
const uint8_t *nal_start, *nal_end, *nal_codestart;
const uint8_t *end = data + size;
int type;
nal_start = obs_avc_find_startcode(data, end);
nal_end = nullptr;
while (nal_end != end) {
nal_codestart = nal_start;
while (nal_start < end && !*(nal_start++));
if (nal_start == end)
break;
type = nal_start[0] & 0x1F;
nal_end = obs_avc_find_startcode(nal_start, end);
if (!nal_end)
nal_end = end;
if (type == OBS_NAL_SPS || type == OBS_NAL_PPS) {
da_push_back_array(header, nal_codestart,
nal_end - nal_codestart);
} else {
da_push_back_array(firstPacket, nal_codestart,
nal_end - nal_codestart);
}
nal_start = nal_end;
}
}
inline bool DShowEncoder::Encode(struct encoder_frame *frame,
struct encoder_packet *packet, bool *received_packet)
{
unsigned char *frame_data[DSHOW_MAX_PLANES] = {};
size_t frame_sizes[DSHOW_MAX_PLANES] = {};
EncoderPacket dshowPacket;
bool new_packet = false;
/* The encoders expect YV12, so swap the chroma planes for encoding */
if (format == VIDEO_FORMAT_I420) {
frame_data[0] = frame->data[0];
frame_data[1] = frame->data[2];
frame_data[2] = frame->data[1];
frame_sizes[0] = frame->linesize[0] * config.cy;
frame_sizes[1] = frame->linesize[2] * config.cy / 2;
frame_sizes[2] = frame->linesize[1] * config.cy / 2;
}
long long actualPTS = frame->pts * frameInterval;
bool success = encoder.Encode(frame_data, frame_sizes,
actualPTS, actualPTS + frameInterval,
dshowPacket, new_packet);
if (!success)
return false;
if (new_packet && !!dshowPacket.data && !!dshowPacket.size) {
packet->data = dshowPacket.data;
packet->size = dshowPacket.size;
packet->type = OBS_ENCODER_VIDEO;
packet->pts = dshowPacket.pts / frameInterval;
packet->dts = dshowPacket.dts / frameInterval;
packet->keyframe = obs_avc_keyframe(packet->data, packet->size);
/* first packet must be parsed in order to retrieve header */
if (first) {
first = false;
ParseFirstPacket(packet->data, packet->size);
packet->data = firstPacket.array;
packet->size = firstPacket.num;
}
*received_packet = true;
}
return true;
}
static bool DShowEncode(void *data, struct encoder_frame *frame,
struct encoder_packet *packet, bool *received_packet)
{
return reinterpret_cast<DShowEncoder*>(data)->Encode(frame, packet,
received_packet);
}
static bool GetDShowExtraData(void *data, uint8_t **extra_data, size_t *size)
{
DShowEncoder *encoder = reinterpret_cast<DShowEncoder*>(data);
*extra_data = encoder->header.array;
*size = encoder->header.num;
return *size > 0;
}
static inline bool ValidResolution(uint32_t width, uint32_t height)
{
return (width == 1280 && height == 720) ||
(width == 1024 && height == 768);
}
static void GetDShowVideoInfo(void *data, struct video_scale_info *info)
{
DShowEncoder *encoder = reinterpret_cast<DShowEncoder*>(data);
encoder->format = VIDEO_FORMAT_I420;
if (info->format == VIDEO_FORMAT_I420 &&
ValidResolution(info->width, info->height))
return;
info->format = VIDEO_FORMAT_I420;
info->width = info->width;
info->height = info->height;
info->range = VIDEO_RANGE_DEFAULT;
info->colorspace = VIDEO_CS_DEFAULT;
double aspect = double(info->width) / double(info->height);
if (fabs(aspect - standardAspect) < fabs(aspect - wideAspect)) {
info->width = 1024;
info->height = 768;
} else {
info->width = 1280;
info->height = 720;
}
}
static void GetDShowEncoderDefauts(obs_data_t *settings)
{
obs_data_set_default_int(settings, "bitrate", 1000);
}
static obs_properties_t *GetDShowEncoderProperties(void *data)
{
obs_properties_t *ppts = obs_properties_create();
obs_properties_add_int(ppts, "bitrate", obs_module_text("Bitrate"),
1000, 60000, 1);
UNUSED_PARAMETER(data);
return ppts;
}
void RegisterDShowEncoders()
{
obs_encoder_info info = {};
info.type = OBS_ENCODER_VIDEO;
info.codec = "h264";
info.destroy = DestroyDShowEncoder;
info.encode = DShowEncode;
info.update = UpdateDShowEncoder;
info.get_defaults = GetDShowEncoderDefauts;
info.get_properties = GetDShowEncoderProperties;
info.get_extra_data = GetDShowExtraData;
info.get_video_info = GetDShowVideoInfo;
vector<DeviceId> devices;
DShow::VideoEncoder::EnumEncoders(devices);
bool foundC985 = false;
for (const DeviceId &device : devices) {
if (!foundC985 && device.name.find(L"C985") != string::npos) {
info.id = "dshow_c985_h264";
info.get_name = GetC985EncoderName;
info.create = CreateC985Encoder;
obs_register_encoder(&info);
foundC985 = true;
} else if (device.name.find(L"C353") != string::npos) {
info.id = "dshow_c353_h264";
info.get_name = GetC353EncoderName;
info.create = CreateC353Encoder;
obs_register_encoder(&info);
}
}
}