a89470d2ea
The cutoff hack was added many, many years ago as recommended by Konverter. Since then, there has been much work on the AAC encoder, so this hack should no longer be necessary.
402 lines
11 KiB
C
402 lines
11 KiB
C
/******************************************************************************
|
|
Copyright (C) 2014 by Hugh Bailey <obs.jim@gmail.com>
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
******************************************************************************/
|
|
|
|
#include <util/base.h>
|
|
#include <util/circlebuf.h>
|
|
#include <util/darray.h>
|
|
#include <obs-module.h>
|
|
|
|
#include <libavformat/avformat.h>
|
|
|
|
#include "obs-ffmpeg-formats.h"
|
|
#include "obs-ffmpeg-compat.h"
|
|
|
|
#define do_log(level, format, ...) \
|
|
blog(level, "[FFmpeg %s encoder: '%s'] " format, \
|
|
enc->type, \
|
|
obs_encoder_get_name(enc->encoder), \
|
|
##__VA_ARGS__)
|
|
|
|
#define warn(format, ...) do_log(LOG_WARNING, format, ##__VA_ARGS__)
|
|
#define info(format, ...) do_log(LOG_INFO, format, ##__VA_ARGS__)
|
|
#define debug(format, ...) do_log(LOG_DEBUG, format, ##__VA_ARGS__)
|
|
|
|
struct enc_encoder {
|
|
obs_encoder_t *encoder;
|
|
|
|
const char *type;
|
|
|
|
AVCodec *codec;
|
|
AVCodecContext *context;
|
|
|
|
uint8_t *samples[MAX_AV_PLANES];
|
|
AVFrame *aframe;
|
|
int64_t total_samples;
|
|
|
|
DARRAY(uint8_t) packet_buffer;
|
|
|
|
size_t audio_planes;
|
|
size_t audio_size;
|
|
|
|
int frame_size; /* pretty much always 1024 for AAC */
|
|
int frame_size_bytes;
|
|
};
|
|
|
|
static inline uint64_t convert_speaker_layout(enum speaker_layout layout)
|
|
{
|
|
switch (layout) {
|
|
case SPEAKERS_UNKNOWN: return 0;
|
|
case SPEAKERS_MONO: return AV_CH_LAYOUT_MONO;
|
|
case SPEAKERS_STEREO: return AV_CH_LAYOUT_STEREO;
|
|
case SPEAKERS_2POINT1: return AV_CH_LAYOUT_SURROUND;
|
|
case SPEAKERS_4POINT0: return AV_CH_LAYOUT_4POINT0;
|
|
case SPEAKERS_4POINT1: return AV_CH_LAYOUT_4POINT1;
|
|
case SPEAKERS_5POINT1: return AV_CH_LAYOUT_5POINT1_BACK;
|
|
case SPEAKERS_7POINT1: return AV_CH_LAYOUT_7POINT1;
|
|
}
|
|
|
|
/* shouldn't get here */
|
|
return 0;
|
|
}
|
|
|
|
static inline enum speaker_layout convert_ff_channel_layout(uint64_t channel_layout)
|
|
{
|
|
switch (channel_layout) {
|
|
case AV_CH_LAYOUT_MONO: return SPEAKERS_MONO;
|
|
case AV_CH_LAYOUT_STEREO: return SPEAKERS_STEREO;
|
|
case AV_CH_LAYOUT_SURROUND: return SPEAKERS_2POINT1;
|
|
case AV_CH_LAYOUT_4POINT0: return SPEAKERS_4POINT0;
|
|
case AV_CH_LAYOUT_4POINT1: return SPEAKERS_4POINT1;
|
|
case AV_CH_LAYOUT_5POINT1_BACK: return SPEAKERS_5POINT1;
|
|
case AV_CH_LAYOUT_7POINT1: return SPEAKERS_7POINT1;
|
|
}
|
|
|
|
/* shouldn't get here */
|
|
return SPEAKERS_UNKNOWN;
|
|
}
|
|
|
|
static const char *aac_getname(void *unused)
|
|
{
|
|
UNUSED_PARAMETER(unused);
|
|
return obs_module_text("FFmpegAAC");
|
|
}
|
|
|
|
static const char *opus_getname(void *unused)
|
|
{
|
|
UNUSED_PARAMETER(unused);
|
|
return obs_module_text("FFmpegOpus");
|
|
}
|
|
|
|
static void enc_destroy(void *data)
|
|
{
|
|
struct enc_encoder *enc = data;
|
|
|
|
if (enc->samples[0])
|
|
av_freep(&enc->samples[0]);
|
|
if (enc->context)
|
|
avcodec_close(enc->context);
|
|
if (enc->aframe)
|
|
av_frame_free(&enc->aframe);
|
|
|
|
da_free(enc->packet_buffer);
|
|
bfree(enc);
|
|
}
|
|
|
|
static bool initialize_codec(struct enc_encoder *enc)
|
|
{
|
|
int ret;
|
|
|
|
enc->aframe = av_frame_alloc();
|
|
if (!enc->aframe) {
|
|
warn("Failed to allocate audio frame");
|
|
return false;
|
|
}
|
|
|
|
ret = avcodec_open2(enc->context, enc->codec, NULL);
|
|
if (ret < 0) {
|
|
warn("Failed to open AAC codec: %s", av_err2str(ret));
|
|
return false;
|
|
}
|
|
|
|
enc->frame_size = enc->context->frame_size;
|
|
if (!enc->frame_size)
|
|
enc->frame_size = 1024;
|
|
|
|
enc->frame_size_bytes = enc->frame_size * (int)enc->audio_size;
|
|
|
|
ret = av_samples_alloc(enc->samples, NULL, enc->context->channels,
|
|
enc->frame_size, enc->context->sample_fmt, 0);
|
|
if (ret < 0) {
|
|
warn("Failed to create audio buffer: %s", av_err2str(ret));
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static void init_sizes(struct enc_encoder *enc, audio_t *audio)
|
|
{
|
|
const struct audio_output_info *aoi;
|
|
enum audio_format format;
|
|
|
|
aoi = audio_output_get_info(audio);
|
|
format = convert_ffmpeg_sample_format(enc->context->sample_fmt);
|
|
|
|
enc->audio_planes = get_audio_planes(format, aoi->speakers);
|
|
enc->audio_size = get_audio_size(format, aoi->speakers, 1);
|
|
}
|
|
|
|
#ifndef MIN
|
|
#define MIN(x, y) ((x) < (y) ? (x) : (y))
|
|
#endif
|
|
|
|
static void *enc_create(obs_data_t *settings, obs_encoder_t *encoder,
|
|
const char *type, const char *alt)
|
|
{
|
|
struct enc_encoder *enc;
|
|
int bitrate = (int)obs_data_get_int(settings, "bitrate");
|
|
audio_t *audio = obs_encoder_audio(encoder);
|
|
|
|
avcodec_register_all();
|
|
|
|
enc = bzalloc(sizeof(struct enc_encoder));
|
|
enc->encoder = encoder;
|
|
enc->codec = avcodec_find_encoder_by_name(type);
|
|
enc->type = type;
|
|
|
|
if (!enc->codec && alt) {
|
|
enc->codec = avcodec_find_encoder_by_name(alt);
|
|
enc->type = alt;
|
|
}
|
|
|
|
blog(LOG_INFO, "---------------------------------");
|
|
|
|
if (!enc->codec) {
|
|
warn("Couldn't find encoder");
|
|
goto fail;
|
|
}
|
|
|
|
if (!bitrate) {
|
|
warn("Invalid bitrate specified");
|
|
return NULL;
|
|
}
|
|
|
|
enc->context = avcodec_alloc_context3(enc->codec);
|
|
if (!enc->context) {
|
|
warn("Failed to create codec context");
|
|
goto fail;
|
|
}
|
|
|
|
enc->context->bit_rate = bitrate * 1000;
|
|
const struct audio_output_info *aoi;
|
|
aoi = audio_output_get_info(audio);
|
|
enc->context->channels = (int)audio_output_get_channels(audio);
|
|
enc->context->channel_layout = convert_speaker_layout(aoi->speakers);
|
|
enc->context->sample_rate = audio_output_get_sample_rate(audio);
|
|
enc->context->sample_fmt = enc->codec->sample_fmts ?
|
|
enc->codec->sample_fmts[0] : AV_SAMPLE_FMT_FLTP;
|
|
|
|
/* check to make sure sample rate is supported */
|
|
if (enc->codec->supported_samplerates) {
|
|
const int *rate = enc->codec->supported_samplerates;
|
|
int cur_rate = enc->context->sample_rate;
|
|
int closest = 0;
|
|
|
|
while (*rate) {
|
|
int dist = abs(cur_rate - *rate);
|
|
int closest_dist = abs(cur_rate - closest);
|
|
|
|
if (dist < closest_dist)
|
|
closest = *rate;
|
|
rate++;
|
|
}
|
|
|
|
if (closest)
|
|
enc->context->sample_rate = closest;
|
|
}
|
|
|
|
if (strcmp(enc->codec->name, "aac") == 0) {
|
|
}
|
|
|
|
info("bitrate: %" PRId64 ", channels: %d, channel_layout: %x\n",
|
|
(int64_t)enc->context->bit_rate / 1000,
|
|
(int)enc->context->channels,
|
|
(unsigned int)enc->context->channel_layout);
|
|
|
|
init_sizes(enc, audio);
|
|
|
|
/* enable experimental FFmpeg encoder if the only one available */
|
|
enc->context->strict_std_compliance = -2;
|
|
|
|
enc->context->flags = CODEC_FLAG_GLOBAL_H;
|
|
|
|
if (initialize_codec(enc))
|
|
return enc;
|
|
|
|
fail:
|
|
enc_destroy(enc);
|
|
return NULL;
|
|
}
|
|
|
|
static void *aac_create(obs_data_t *settings, obs_encoder_t *encoder)
|
|
{
|
|
return enc_create(settings, encoder, "aac", NULL);
|
|
}
|
|
|
|
static void *opus_create(obs_data_t *settings, obs_encoder_t *encoder)
|
|
{
|
|
return enc_create(settings, encoder, "libopus", "opus");
|
|
}
|
|
|
|
static bool do_encode(struct enc_encoder *enc,
|
|
struct encoder_packet *packet, bool *received_packet)
|
|
{
|
|
AVRational time_base = {1, enc->context->sample_rate};
|
|
AVPacket avpacket = {0};
|
|
int got_packet;
|
|
int ret;
|
|
|
|
enc->aframe->nb_samples = enc->frame_size;
|
|
enc->aframe->pts = av_rescale_q(enc->total_samples,
|
|
(AVRational){1, enc->context->sample_rate},
|
|
enc->context->time_base);
|
|
|
|
ret = avcodec_fill_audio_frame(enc->aframe, enc->context->channels,
|
|
enc->context->sample_fmt, enc->samples[0],
|
|
enc->frame_size_bytes * enc->context->channels, 1);
|
|
if (ret < 0) {
|
|
warn("avcodec_fill_audio_frame failed: %s", av_err2str(ret));
|
|
return false;
|
|
}
|
|
|
|
enc->total_samples += enc->frame_size;
|
|
|
|
#if LIBAVFORMAT_VERSION_INT >= AV_VERSION_INT(57, 40, 101)
|
|
ret = avcodec_send_frame(enc->context, enc->aframe);
|
|
if (ret == 0)
|
|
ret = avcodec_receive_packet(enc->context, &avpacket);
|
|
|
|
got_packet = (ret == 0);
|
|
|
|
if (ret == AVERROR_EOF || ret == AVERROR(EAGAIN))
|
|
ret = 0;
|
|
#else
|
|
ret = avcodec_encode_audio2(enc->context, &avpacket, enc->aframe,
|
|
&got_packet);
|
|
#endif
|
|
if (ret < 0) {
|
|
warn("avcodec_encode_audio2 failed: %s", av_err2str(ret));
|
|
return false;
|
|
}
|
|
|
|
*received_packet = !!got_packet;
|
|
if (!got_packet)
|
|
return true;
|
|
|
|
da_resize(enc->packet_buffer, 0);
|
|
da_push_back_array(enc->packet_buffer, avpacket.data, avpacket.size);
|
|
|
|
packet->pts = rescale_ts(avpacket.pts, enc->context, time_base);
|
|
packet->dts = rescale_ts(avpacket.dts, enc->context, time_base);
|
|
packet->data = enc->packet_buffer.array;
|
|
packet->size = avpacket.size;
|
|
packet->type = OBS_ENCODER_AUDIO;
|
|
packet->timebase_num = 1;
|
|
packet->timebase_den = (int32_t)enc->context->sample_rate;
|
|
av_free_packet(&avpacket);
|
|
return true;
|
|
}
|
|
|
|
static bool enc_encode(void *data, struct encoder_frame *frame,
|
|
struct encoder_packet *packet, bool *received_packet)
|
|
{
|
|
struct enc_encoder *enc = data;
|
|
|
|
for (size_t i = 0; i < enc->audio_planes; i++)
|
|
memcpy(enc->samples[i], frame->data[i], enc->frame_size_bytes);
|
|
|
|
return do_encode(enc, packet, received_packet);
|
|
}
|
|
|
|
static void enc_defaults(obs_data_t *settings)
|
|
{
|
|
obs_data_set_default_int(settings, "bitrate", 128);
|
|
}
|
|
|
|
static obs_properties_t *enc_properties(void *unused)
|
|
{
|
|
UNUSED_PARAMETER(unused);
|
|
|
|
obs_properties_t *props = obs_properties_create();
|
|
obs_properties_add_int(props, "bitrate",
|
|
obs_module_text("Bitrate"), 64, 1024, 32);
|
|
return props;
|
|
}
|
|
|
|
static bool enc_extra_data(void *data, uint8_t **extra_data, size_t *size)
|
|
{
|
|
struct enc_encoder *enc = data;
|
|
|
|
*extra_data = enc->context->extradata;
|
|
*size = enc->context->extradata_size;
|
|
return true;
|
|
}
|
|
|
|
static void enc_audio_info(void *data, struct audio_convert_info *info)
|
|
{
|
|
struct enc_encoder *enc = data;
|
|
info->format = convert_ffmpeg_sample_format(enc->context->sample_fmt);
|
|
info->samples_per_sec = (uint32_t)enc->context->sample_rate;
|
|
info->speakers = convert_ff_channel_layout(enc->context->channel_layout);
|
|
}
|
|
|
|
static size_t enc_frame_size(void *data)
|
|
{
|
|
struct enc_encoder *enc =data;
|
|
return enc->frame_size;
|
|
}
|
|
|
|
struct obs_encoder_info aac_encoder_info = {
|
|
.id = "ffmpeg_aac",
|
|
.type = OBS_ENCODER_AUDIO,
|
|
.codec = "AAC",
|
|
.get_name = aac_getname,
|
|
.create = aac_create,
|
|
.destroy = enc_destroy,
|
|
.encode = enc_encode,
|
|
.get_frame_size = enc_frame_size,
|
|
.get_defaults = enc_defaults,
|
|
.get_properties = enc_properties,
|
|
.get_extra_data = enc_extra_data,
|
|
.get_audio_info = enc_audio_info
|
|
};
|
|
|
|
struct obs_encoder_info opus_encoder_info = {
|
|
.id = "ffmpeg_opus",
|
|
.type = OBS_ENCODER_AUDIO,
|
|
.codec = "opus",
|
|
.get_name = opus_getname,
|
|
.create = opus_create,
|
|
.destroy = enc_destroy,
|
|
.encode = enc_encode,
|
|
.get_frame_size = enc_frame_size,
|
|
.get_defaults = enc_defaults,
|
|
.get_properties = enc_properties,
|
|
.get_extra_data = enc_extra_data,
|
|
.get_audio_info = enc_audio_info
|
|
};
|