This adds bicubic and lanczos scaling capability to libobs to improve scaling quality and sharpness when the output resolution has to be scaled relative to the base resolution. Bilinear is also available, although bilinear has rather poor quality and causes scaling to appear blurry. If the output resolution is close to the base resolution, then bilinear is used instead as an optimization, as there's no need to use these shaders if scaling is not in use. The Bicubic and Lanczos effects are also exposed via exported function to allow the ability to use those shaders in plugin modules if desired. The API change adds a variable 'scale_type' to the obs_video_info structure that allows the user interface to choose what type of scaling filter should be used.
497 lines
14 KiB
C
497 lines
14 KiB
C
/******************************************************************************
|
|
Copyright (C) 2013-2014 by Hugh Bailey <obs.jim@gmail.com>
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
******************************************************************************/
|
|
|
|
#include "obs.h"
|
|
#include "obs-internal.h"
|
|
#include "graphics/vec4.h"
|
|
#include "media-io/format-conversion.h"
|
|
|
|
static uint64_t tick_sources(uint64_t cur_time, uint64_t last_time)
|
|
{
|
|
struct obs_core_data *data = &obs->data;
|
|
struct obs_source *source;
|
|
uint64_t delta_time;
|
|
float seconds;
|
|
|
|
if (!last_time)
|
|
last_time = cur_time -
|
|
video_output_get_frame_time(obs->video.video);
|
|
|
|
delta_time = cur_time - last_time;
|
|
seconds = (float)((double)delta_time / 1000000000.0);
|
|
|
|
pthread_mutex_lock(&data->sources_mutex);
|
|
|
|
source = data->first_source;
|
|
while (source) {
|
|
if (source->refs)
|
|
obs_source_video_tick(source, seconds);
|
|
source = (struct obs_source*)source->context.next;
|
|
}
|
|
|
|
pthread_mutex_unlock(&data->sources_mutex);
|
|
|
|
return cur_time;
|
|
}
|
|
|
|
/* in obs-display.c */
|
|
extern void render_display(struct obs_display *display);
|
|
|
|
static inline void render_displays(void)
|
|
{
|
|
struct obs_display *display;
|
|
|
|
if (!obs->data.valid)
|
|
return;
|
|
|
|
gs_enter_context(obs->video.graphics);
|
|
|
|
/* render extra displays/swaps */
|
|
pthread_mutex_lock(&obs->data.displays_mutex);
|
|
|
|
display = obs->data.first_display;
|
|
while (display) {
|
|
render_display(display);
|
|
display = display->next;
|
|
}
|
|
|
|
pthread_mutex_unlock(&obs->data.displays_mutex);
|
|
|
|
/* render main display */
|
|
render_display(&obs->video.main_display);
|
|
|
|
gs_leave_context();
|
|
}
|
|
|
|
static inline void set_render_size(uint32_t width, uint32_t height)
|
|
{
|
|
gs_enable_depth_test(false);
|
|
gs_set_cull_mode(GS_NEITHER);
|
|
|
|
gs_ortho(0.0f, (float)width, 0.0f, (float)height, -100.0f, 100.0f);
|
|
gs_set_viewport(0, 0, width, height);
|
|
}
|
|
|
|
static inline void unmap_last_surface(struct obs_core_video *video)
|
|
{
|
|
if (video->mapped_surface) {
|
|
gs_stagesurface_unmap(video->mapped_surface);
|
|
video->mapped_surface = NULL;
|
|
}
|
|
}
|
|
|
|
static inline void render_main_texture(struct obs_core_video *video,
|
|
int cur_texture)
|
|
{
|
|
struct vec4 clear_color;
|
|
vec4_set(&clear_color, 0.0f, 0.0f, 0.0f, 1.0f);
|
|
|
|
gs_set_render_target(video->render_textures[cur_texture], NULL);
|
|
gs_clear(GS_CLEAR_COLOR, &clear_color, 1.0f, 0);
|
|
|
|
set_render_size(video->base_width, video->base_height);
|
|
obs_view_render(&obs->data.main_view);
|
|
|
|
video->textures_rendered[cur_texture] = true;
|
|
}
|
|
|
|
static inline gs_effect_t *get_scale_effect_internal(
|
|
struct obs_core_video *video)
|
|
{
|
|
switch (video->scale_type) {
|
|
case OBS_SCALE_BILINEAR: return video->default_effect;
|
|
case OBS_SCALE_LANCZOS: return video->lanczos_effect;
|
|
case OBS_SCALE_BICUBIC:;
|
|
}
|
|
|
|
return video->bicubic_effect;
|
|
}
|
|
|
|
static inline bool resolution_close(struct obs_core_video *video,
|
|
uint32_t width, uint32_t height)
|
|
{
|
|
long width_cmp = (long)video->base_width - (long)width;
|
|
long height_cmp = (long)video->base_height - (long)height;
|
|
|
|
return labs(width_cmp) <= 16 && labs(height_cmp) <= 16;
|
|
}
|
|
|
|
static inline gs_effect_t *get_scale_effect(struct obs_core_video *video,
|
|
uint32_t width, uint32_t height)
|
|
{
|
|
if (resolution_close(video, width, height)) {
|
|
return video->default_effect;
|
|
} else {
|
|
/* if the scale method couldn't be loaded, use either bicubic
|
|
* or bilinear by default */
|
|
gs_effect_t *effect = get_scale_effect_internal(video);
|
|
if (!effect)
|
|
effect = !!video->bicubic_effect ?
|
|
video->bicubic_effect :
|
|
video->default_effect;
|
|
return effect;
|
|
}
|
|
}
|
|
|
|
static inline void render_output_texture(struct obs_core_video *video,
|
|
int cur_texture, int prev_texture)
|
|
{
|
|
gs_texture_t *texture = video->render_textures[prev_texture];
|
|
gs_texture_t *target = video->output_textures[cur_texture];
|
|
uint32_t width = gs_texture_get_width(target);
|
|
uint32_t height = gs_texture_get_height(target);
|
|
struct vec2 base_i;
|
|
|
|
vec2_set(&base_i,
|
|
1.0f / (float)video->base_width,
|
|
1.0f / (float)video->base_height);
|
|
|
|
gs_effect_t *effect = get_scale_effect(video, width, height);
|
|
gs_technique_t *tech = gs_effect_get_technique(effect, "DrawMatrix");
|
|
gs_eparam_t *image = gs_effect_get_param_by_name(effect, "image");
|
|
gs_eparam_t *matrix = gs_effect_get_param_by_name(effect,
|
|
"color_matrix");
|
|
gs_eparam_t *bres_i = gs_effect_get_param_by_name(effect,
|
|
"base_dimension_i");
|
|
size_t passes, i;
|
|
|
|
if (!video->textures_rendered[prev_texture])
|
|
return;
|
|
|
|
gs_set_render_target(target, NULL);
|
|
set_render_size(width, height);
|
|
|
|
if (bres_i)
|
|
gs_effect_set_vec2(bres_i, &base_i);
|
|
|
|
gs_effect_set_val(matrix, video->color_matrix, sizeof(float) * 16);
|
|
gs_effect_set_texture(image, texture);
|
|
|
|
gs_enable_blending(false);
|
|
passes = gs_technique_begin(tech);
|
|
for (i = 0; i < passes; i++) {
|
|
gs_technique_begin_pass(tech, i);
|
|
gs_draw_sprite(texture, 0, width, height);
|
|
gs_technique_end_pass(tech);
|
|
}
|
|
gs_technique_end(tech);
|
|
gs_enable_blending(true);
|
|
|
|
video->textures_output[cur_texture] = true;
|
|
}
|
|
|
|
static inline void set_eparam(gs_effect_t *effect, const char *name, float val)
|
|
{
|
|
gs_eparam_t *param = gs_effect_get_param_by_name(effect, name);
|
|
gs_effect_set_float(param, val);
|
|
}
|
|
|
|
static void render_convert_texture(struct obs_core_video *video,
|
|
int cur_texture, int prev_texture)
|
|
{
|
|
gs_texture_t *texture = video->output_textures[prev_texture];
|
|
gs_texture_t *target = video->convert_textures[cur_texture];
|
|
float fwidth = (float)video->output_width;
|
|
float fheight = (float)video->output_height;
|
|
size_t passes, i;
|
|
|
|
gs_effect_t *effect = video->conversion_effect;
|
|
gs_eparam_t *image = gs_effect_get_param_by_name(effect, "image");
|
|
gs_technique_t *tech = gs_effect_get_technique(effect,
|
|
video->conversion_tech);
|
|
|
|
if (!video->textures_output[prev_texture])
|
|
return;
|
|
|
|
set_eparam(effect, "u_plane_offset", (float)video->plane_offsets[1]);
|
|
set_eparam(effect, "v_plane_offset", (float)video->plane_offsets[2]);
|
|
set_eparam(effect, "width", fwidth);
|
|
set_eparam(effect, "height", fheight);
|
|
set_eparam(effect, "width_i", 1.0f / fwidth);
|
|
set_eparam(effect, "height_i", 1.0f / fheight);
|
|
set_eparam(effect, "width_d2", fwidth * 0.5f);
|
|
set_eparam(effect, "height_d2", fheight * 0.5f);
|
|
set_eparam(effect, "width_d2_i", 1.0f / (fwidth * 0.5f));
|
|
set_eparam(effect, "height_d2_i", 1.0f / (fheight * 0.5f));
|
|
set_eparam(effect, "input_height", (float)video->conversion_height);
|
|
|
|
gs_effect_set_texture(image, texture);
|
|
|
|
gs_set_render_target(target, NULL);
|
|
set_render_size(video->output_width, video->conversion_height);
|
|
|
|
gs_enable_blending(false);
|
|
passes = gs_technique_begin(tech);
|
|
for (i = 0; i < passes; i++) {
|
|
gs_technique_begin_pass(tech, i);
|
|
gs_draw_sprite(texture, 0, video->output_width,
|
|
video->conversion_height);
|
|
gs_technique_end_pass(tech);
|
|
}
|
|
gs_technique_end(tech);
|
|
gs_enable_blending(true);
|
|
|
|
video->textures_converted[cur_texture] = true;
|
|
}
|
|
|
|
static inline void stage_output_texture(struct obs_core_video *video,
|
|
int cur_texture, int prev_texture)
|
|
{
|
|
gs_texture_t *texture;
|
|
bool texture_ready;
|
|
gs_stagesurf_t *copy = video->copy_surfaces[cur_texture];
|
|
|
|
if (video->gpu_conversion) {
|
|
texture = video->convert_textures[prev_texture];
|
|
texture_ready = video->textures_converted[prev_texture];
|
|
} else {
|
|
texture = video->output_textures[prev_texture];
|
|
texture_ready = video->output_textures[prev_texture];
|
|
}
|
|
|
|
unmap_last_surface(video);
|
|
|
|
if (!texture_ready)
|
|
return;
|
|
|
|
gs_stage_texture(copy, texture);
|
|
|
|
video->textures_copied[cur_texture] = true;
|
|
}
|
|
|
|
static inline void render_video(struct obs_core_video *video, int cur_texture,
|
|
int prev_texture, uint64_t timestamp)
|
|
{
|
|
gs_begin_scene();
|
|
|
|
gs_enable_depth_test(false);
|
|
gs_set_cull_mode(GS_NEITHER);
|
|
|
|
circlebuf_push_back(&video->timestamp_buffer, ×tamp,
|
|
sizeof(timestamp));
|
|
|
|
render_main_texture(video, cur_texture);
|
|
render_output_texture(video, cur_texture, prev_texture);
|
|
if (video->gpu_conversion)
|
|
render_convert_texture(video, cur_texture, prev_texture);
|
|
|
|
stage_output_texture(video, cur_texture, prev_texture);
|
|
|
|
gs_set_render_target(NULL, NULL);
|
|
gs_enable_blending(true);
|
|
|
|
gs_end_scene();
|
|
}
|
|
|
|
static inline bool download_frame(struct obs_core_video *video,
|
|
int prev_texture, struct video_data *frame)
|
|
{
|
|
gs_stagesurf_t *surface = video->copy_surfaces[prev_texture];
|
|
|
|
if (!video->textures_copied[prev_texture])
|
|
return false;
|
|
|
|
if (!gs_stagesurface_map(surface, &frame->data[0], &frame->linesize[0]))
|
|
return false;
|
|
|
|
video->mapped_surface = surface;
|
|
return true;
|
|
}
|
|
|
|
static inline uint32_t calc_linesize(uint32_t pos, uint32_t linesize)
|
|
{
|
|
uint32_t size = pos % linesize;
|
|
return size ? size : linesize;
|
|
}
|
|
|
|
static void copy_dealign(
|
|
uint8_t *dst, uint32_t dst_pos, uint32_t dst_linesize,
|
|
const uint8_t *src, uint32_t src_pos, uint32_t src_linesize,
|
|
uint32_t remaining)
|
|
{
|
|
while (remaining) {
|
|
uint32_t src_remainder = src_pos % src_linesize;
|
|
uint32_t dst_offset = dst_linesize - src_remainder;
|
|
uint32_t src_offset = src_linesize - src_remainder;
|
|
|
|
if (remaining < dst_offset) {
|
|
memcpy(dst + dst_pos, src + src_pos, remaining);
|
|
src_pos += remaining;
|
|
dst_pos += remaining;
|
|
remaining = 0;
|
|
} else {
|
|
memcpy(dst + dst_pos, src + src_pos, dst_offset);
|
|
src_pos += src_offset;
|
|
dst_pos += dst_offset;
|
|
remaining -= dst_offset;
|
|
}
|
|
}
|
|
}
|
|
|
|
static inline uint32_t make_aligned_linesize_offset(uint32_t offset,
|
|
uint32_t dst_linesize, uint32_t src_linesize)
|
|
{
|
|
uint32_t remainder = offset % dst_linesize;
|
|
return (offset / dst_linesize) * src_linesize + remainder;
|
|
}
|
|
|
|
static void fix_gpu_converted_alignment(struct obs_core_video *video,
|
|
struct video_data *frame, int cur_texture)
|
|
{
|
|
struct obs_source_frame *new_frame =
|
|
&video->convert_frames[cur_texture];
|
|
uint32_t src_linesize = frame->linesize[0];
|
|
uint32_t dst_linesize = video->output_width * 4;
|
|
uint32_t src_pos = 0;
|
|
|
|
for (size_t i = 0; i < 3; i++) {
|
|
if (video->plane_linewidth[i] == 0)
|
|
break;
|
|
|
|
src_pos = make_aligned_linesize_offset(video->plane_offsets[i],
|
|
dst_linesize, src_linesize);
|
|
|
|
copy_dealign(new_frame->data[i], 0, dst_linesize,
|
|
frame->data[0], src_pos, src_linesize,
|
|
video->plane_sizes[i]);
|
|
}
|
|
|
|
/* replace with cached frames */
|
|
for (size_t i = 0; i < MAX_AV_PLANES; i++) {
|
|
frame->data[i] = new_frame->data[i];
|
|
frame->linesize[i] = new_frame->linesize[i];
|
|
}
|
|
}
|
|
|
|
static bool set_gpu_converted_data(struct obs_core_video *video,
|
|
struct video_data *frame, int cur_texture)
|
|
{
|
|
if (frame->linesize[0] == video->output_width*4) {
|
|
for (size_t i = 0; i < 3; i++) {
|
|
if (video->plane_linewidth[i] == 0)
|
|
break;
|
|
|
|
frame->linesize[i] = video->plane_linewidth[i];
|
|
frame->data[i] =
|
|
frame->data[0] + video->plane_offsets[i];
|
|
}
|
|
|
|
} else {
|
|
fix_gpu_converted_alignment(video, frame, cur_texture);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static bool convert_frame(struct obs_core_video *video,
|
|
struct video_data *frame,
|
|
const struct video_output_info *info, int cur_texture)
|
|
{
|
|
struct obs_source_frame *new_frame =
|
|
&video->convert_frames[cur_texture];
|
|
|
|
if (info->format == VIDEO_FORMAT_I420) {
|
|
compress_uyvx_to_i420(
|
|
frame->data[0], frame->linesize[0],
|
|
0, info->height,
|
|
new_frame->data, new_frame->linesize);
|
|
|
|
} else if (info->format == VIDEO_FORMAT_NV12) {
|
|
compress_uyvx_to_nv12(
|
|
frame->data[0], frame->linesize[0],
|
|
0, info->height,
|
|
new_frame->data, new_frame->linesize);
|
|
|
|
} else {
|
|
blog(LOG_ERROR, "convert_frame: unsupported texture format");
|
|
return false;
|
|
}
|
|
|
|
for (size_t i = 0; i < MAX_AV_PLANES; i++) {
|
|
frame->data[i] = new_frame->data[i];
|
|
frame->linesize[i] = new_frame->linesize[i];
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
static inline void output_video_data(struct obs_core_video *video,
|
|
struct video_data *frame, int cur_texture)
|
|
{
|
|
const struct video_output_info *info;
|
|
info = video_output_get_info(video->video);
|
|
|
|
if (video->gpu_conversion) {
|
|
if (!set_gpu_converted_data(video, frame, cur_texture))
|
|
return;
|
|
|
|
} else if (format_is_yuv(info->format)) {
|
|
if (!convert_frame(video, frame, info, cur_texture))
|
|
return;
|
|
}
|
|
|
|
video_output_swap_frame(video->video, frame);
|
|
}
|
|
|
|
static inline void output_frame(uint64_t timestamp)
|
|
{
|
|
struct obs_core_video *video = &obs->video;
|
|
int cur_texture = video->cur_texture;
|
|
int prev_texture = cur_texture == 0 ? NUM_TEXTURES-1 : cur_texture-1;
|
|
struct video_data frame;
|
|
bool frame_ready;
|
|
|
|
memset(&frame, 0, sizeof(struct video_data));
|
|
|
|
gs_enter_context(video->graphics);
|
|
|
|
render_video(video, cur_texture, prev_texture, timestamp);
|
|
frame_ready = download_frame(video, prev_texture, &frame);
|
|
|
|
gs_flush();
|
|
|
|
gs_leave_context();
|
|
|
|
if (frame_ready) {
|
|
circlebuf_pop_front(&video->timestamp_buffer, &frame.timestamp,
|
|
sizeof(frame.timestamp));
|
|
|
|
output_video_data(video, &frame, cur_texture);
|
|
}
|
|
|
|
if (++video->cur_texture == NUM_TEXTURES)
|
|
video->cur_texture = 0;
|
|
}
|
|
|
|
void *obs_video_thread(void *param)
|
|
{
|
|
uint64_t last_time = 0;
|
|
|
|
while (video_output_wait(obs->video.video)) {
|
|
uint64_t cur_time = video_output_get_time(obs->video.video);
|
|
|
|
last_time = tick_sources(cur_time, last_time);
|
|
|
|
render_displays();
|
|
|
|
output_frame(cur_time);
|
|
}
|
|
|
|
UNUSED_PARAMETER(param);
|
|
return NULL;
|
|
}
|