66259560e0
GS_RGBA, GS_BGRX, and GS_BGRA now use TYPELESS DXGI formats, so we can alias them between UNORM and UNORM_SRGB as necessary. GS_RGBA_UNORM, GS_BGRX_UNORM, and GS_BGRA_UNORM have been added to support straight UNORM types, which Windows requires for sharing textures from D3D9 and OpenGL. The D3D path aliases via views, and GL aliases via GL_EXT_texture_sRGB_decode/GL_FRAMEBUFFER_SRGB. A significant amount of code has changed in the D3D/GL backends, but the concepts are simple. On the D3D side, we need separate SRVs and RTVs to support nonlinear/linear reads and writes. On the GL side, we need to set the proper GL parameters to emulate the same. Add gs_enable_framebuffer_srgb/gs_framebuffer_srgb_enabled to set/get the framebuffer as SRGB or not. Add gs_linear_srgb_active/gs_set_linear_srgb to instruct sources that they should render as SRGB. Legacy sources can ignore this setting without regression. Update obs_source_draw to use linear SRGB as needed. Update render_filter_tex to use linear SRGB as needed. Add gs_effect_set_texture_srgb next to gs_effect_set_texture to set texture with SRGB view instead. Add SRGB helpers for vec4 struct. Create GDI-compatible textures without SRGB support. Doesn't seem to work with SRGB formats.
330 lines
8.2 KiB
C
330 lines
8.2 KiB
C
/******************************************************************************
|
|
Copyright (C) 2013 by Hugh Bailey <obs.jim@gmail.com>
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
******************************************************************************/
|
|
|
|
#pragma once
|
|
|
|
#include "math-defs.h"
|
|
|
|
#include "../util/sse-intrin.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
struct vec3;
|
|
struct matrix4;
|
|
|
|
struct vec4 {
|
|
union {
|
|
struct {
|
|
float x, y, z, w;
|
|
};
|
|
float ptr[4];
|
|
__m128 m;
|
|
};
|
|
};
|
|
|
|
static inline void vec4_zero(struct vec4 *v)
|
|
{
|
|
v->m = _mm_setzero_ps();
|
|
}
|
|
|
|
static inline void vec4_set(struct vec4 *dst, float x, float y, float z,
|
|
float w)
|
|
{
|
|
dst->m = _mm_set_ps(w, z, y, x);
|
|
}
|
|
|
|
static inline void vec4_copy(struct vec4 *dst, const struct vec4 *v)
|
|
{
|
|
dst->m = v->m;
|
|
}
|
|
|
|
EXPORT void vec4_from_vec3(struct vec4 *dst, const struct vec3 *v);
|
|
|
|
static inline void vec4_add(struct vec4 *dst, const struct vec4 *v1,
|
|
const struct vec4 *v2)
|
|
{
|
|
dst->m = _mm_add_ps(v1->m, v2->m);
|
|
}
|
|
|
|
static inline void vec4_sub(struct vec4 *dst, const struct vec4 *v1,
|
|
const struct vec4 *v2)
|
|
{
|
|
dst->m = _mm_sub_ps(v1->m, v2->m);
|
|
}
|
|
|
|
static inline void vec4_mul(struct vec4 *dst, const struct vec4 *v1,
|
|
const struct vec4 *v2)
|
|
{
|
|
dst->m = _mm_mul_ps(v1->m, v2->m);
|
|
}
|
|
|
|
static inline void vec4_div(struct vec4 *dst, const struct vec4 *v1,
|
|
const struct vec4 *v2)
|
|
{
|
|
dst->m = _mm_div_ps(v1->m, v2->m);
|
|
}
|
|
|
|
static inline void vec4_addf(struct vec4 *dst, const struct vec4 *v, float f)
|
|
{
|
|
dst->m = _mm_add_ps(v->m, _mm_set1_ps(f));
|
|
}
|
|
|
|
static inline void vec4_subf(struct vec4 *dst, const struct vec4 *v, float f)
|
|
{
|
|
dst->m = _mm_sub_ps(v->m, _mm_set1_ps(f));
|
|
}
|
|
|
|
static inline void vec4_mulf(struct vec4 *dst, const struct vec4 *v, float f)
|
|
{
|
|
dst->m = _mm_mul_ps(v->m, _mm_set1_ps(f));
|
|
}
|
|
|
|
static inline void vec4_divf(struct vec4 *dst, const struct vec4 *v, float f)
|
|
{
|
|
dst->m = _mm_div_ps(v->m, _mm_set1_ps(f));
|
|
}
|
|
|
|
static inline float vec4_dot(const struct vec4 *v1, const struct vec4 *v2)
|
|
{
|
|
struct vec4 add;
|
|
__m128 mul = _mm_mul_ps(v1->m, v2->m);
|
|
add.m = _mm_add_ps(_mm_movehl_ps(mul, mul), mul);
|
|
add.m = _mm_add_ps(_mm_shuffle_ps(add.m, add.m, 0x55), add.m);
|
|
return add.x;
|
|
}
|
|
|
|
static inline void vec4_neg(struct vec4 *dst, const struct vec4 *v)
|
|
{
|
|
dst->x = -v->x;
|
|
dst->y = -v->y;
|
|
dst->z = -v->z;
|
|
dst->w = -v->w;
|
|
}
|
|
|
|
static inline float vec4_len(const struct vec4 *v)
|
|
{
|
|
float dot_val = vec4_dot(v, v);
|
|
return (dot_val > 0.0f) ? sqrtf(dot_val) : 0.0f;
|
|
}
|
|
|
|
static inline float vec4_dist(const struct vec4 *v1, const struct vec4 *v2)
|
|
{
|
|
struct vec4 temp;
|
|
float dot_val;
|
|
|
|
vec4_sub(&temp, v1, v2);
|
|
dot_val = vec4_dot(&temp, &temp);
|
|
return (dot_val > 0.0f) ? sqrtf(dot_val) : 0.0f;
|
|
}
|
|
|
|
static inline void vec4_norm(struct vec4 *dst, const struct vec4 *v)
|
|
{
|
|
float dot_val = vec4_dot(v, v);
|
|
dst->m = (dot_val > 0.0f)
|
|
? _mm_mul_ps(v->m, _mm_set1_ps(1.0f / sqrtf(dot_val)))
|
|
: _mm_setzero_ps();
|
|
}
|
|
|
|
static inline int vec4_close(const struct vec4 *v1, const struct vec4 *v2,
|
|
float epsilon)
|
|
{
|
|
struct vec4 test;
|
|
vec4_sub(&test, v1, v2);
|
|
return test.x < epsilon && test.y < epsilon && test.z < epsilon &&
|
|
test.w < epsilon;
|
|
}
|
|
|
|
static inline void vec4_min(struct vec4 *dst, const struct vec4 *v1,
|
|
const struct vec4 *v2)
|
|
{
|
|
dst->m = _mm_min_ps(v1->m, v2->m);
|
|
}
|
|
|
|
static inline void vec4_minf(struct vec4 *dst, const struct vec4 *v, float f)
|
|
{
|
|
dst->m = _mm_min_ps(v->m, _mm_set1_ps(f));
|
|
}
|
|
|
|
static inline void vec4_max(struct vec4 *dst, const struct vec4 *v1,
|
|
const struct vec4 *v2)
|
|
{
|
|
dst->m = _mm_max_ps(v1->m, v2->m);
|
|
}
|
|
|
|
static inline void vec4_maxf(struct vec4 *dst, const struct vec4 *v, float f)
|
|
{
|
|
dst->m = _mm_max_ps(v->m, _mm_set1_ps(f));
|
|
}
|
|
|
|
static inline void vec4_abs(struct vec4 *dst, const struct vec4 *v)
|
|
{
|
|
dst->x = fabsf(v->x);
|
|
dst->y = fabsf(v->y);
|
|
dst->z = fabsf(v->z);
|
|
dst->w = fabsf(v->w);
|
|
}
|
|
|
|
static inline void vec4_floor(struct vec4 *dst, const struct vec4 *v)
|
|
{
|
|
dst->x = floorf(v->x);
|
|
dst->y = floorf(v->y);
|
|
dst->z = floorf(v->z);
|
|
dst->w = floorf(v->w);
|
|
}
|
|
|
|
static inline void vec4_ceil(struct vec4 *dst, const struct vec4 *v)
|
|
{
|
|
dst->x = ceilf(v->x);
|
|
dst->y = ceilf(v->y);
|
|
dst->z = ceilf(v->z);
|
|
dst->w = ceilf(v->w);
|
|
}
|
|
|
|
static inline uint32_t vec4_to_rgba(const struct vec4 *src)
|
|
{
|
|
uint32_t val;
|
|
val = (uint32_t)((src->x * 255.0f) + 0.5f);
|
|
val |= (uint32_t)((src->y * 255.0f) + 0.5f) << 8;
|
|
val |= (uint32_t)((src->z * 255.0f) + 0.5f) << 16;
|
|
val |= (uint32_t)((src->w * 255.0f) + 0.5f) << 24;
|
|
return val;
|
|
}
|
|
|
|
static inline uint32_t vec4_to_bgra(const struct vec4 *src)
|
|
{
|
|
uint32_t val;
|
|
val = (uint32_t)((src->z * 255.0f) + 0.5f);
|
|
val |= (uint32_t)((src->y * 255.0f) + 0.5f) << 8;
|
|
val |= (uint32_t)((src->x * 255.0f) + 0.5f) << 16;
|
|
val |= (uint32_t)((src->w * 255.0f) + 0.5f) << 24;
|
|
return val;
|
|
}
|
|
|
|
static inline void vec4_from_rgba(struct vec4 *dst, uint32_t rgba)
|
|
{
|
|
dst->x = (float)(rgba & 0xFF) / 255.0f;
|
|
rgba >>= 8;
|
|
dst->y = (float)(rgba & 0xFF) / 255.0f;
|
|
rgba >>= 8;
|
|
dst->z = (float)(rgba & 0xFF) / 255.0f;
|
|
rgba >>= 8;
|
|
dst->w = (float)rgba / 255.0f;
|
|
}
|
|
|
|
static inline void vec4_from_bgra(struct vec4 *dst, uint32_t bgra)
|
|
{
|
|
dst->z = (float)(bgra & 0xFF) / 255.0f;
|
|
bgra >>= 8;
|
|
dst->y = (float)(bgra & 0xFF) / 255.0f;
|
|
bgra >>= 8;
|
|
dst->x = (float)(bgra & 0xFF) / 255.0f;
|
|
bgra >>= 8;
|
|
dst->w = (float)bgra / 255.0f;
|
|
}
|
|
|
|
static inline float srgb_nonlinear_to_linear(float u)
|
|
{
|
|
return (u <= 0.04045f) ? (u / 12.92f)
|
|
: powf((u + 0.055f) / 1.055f, 2.4f);
|
|
}
|
|
|
|
static inline void vec4_from_rgba_srgb(struct vec4 *dst, uint32_t rgba)
|
|
{
|
|
dst->x = srgb_nonlinear_to_linear((float)(rgba & 0xFF) / 255.0f);
|
|
rgba >>= 8;
|
|
dst->y = srgb_nonlinear_to_linear((float)(rgba & 0xFF) / 255.0f);
|
|
rgba >>= 8;
|
|
dst->z = srgb_nonlinear_to_linear((float)(rgba & 0xFF) / 255.0f);
|
|
rgba >>= 8;
|
|
dst->w = (float)rgba / 255.0f;
|
|
}
|
|
|
|
static inline void vec4_from_bgra_srgb(struct vec4 *dst, uint32_t bgra)
|
|
{
|
|
dst->z = srgb_nonlinear_to_linear((float)(bgra & 0xFF) / 255.0f);
|
|
bgra >>= 8;
|
|
dst->y = srgb_nonlinear_to_linear((float)(bgra & 0xFF) / 255.0f);
|
|
bgra >>= 8;
|
|
dst->x = srgb_nonlinear_to_linear((float)(bgra & 0xFF) / 255.0f);
|
|
bgra >>= 8;
|
|
dst->w = (float)bgra / 255.0f;
|
|
}
|
|
|
|
static inline void vec4_from_rgba_srgb_premultiply(struct vec4 *dst,
|
|
uint32_t rgba)
|
|
{
|
|
vec4_from_rgba_srgb(dst, rgba);
|
|
dst->x *= dst->w;
|
|
dst->y *= dst->w;
|
|
dst->z *= dst->w;
|
|
}
|
|
|
|
static inline void vec4_from_bgra_srgb_premultiply(struct vec4 *dst,
|
|
uint32_t bgra)
|
|
{
|
|
vec4_from_bgra_srgb(dst, bgra);
|
|
dst->x *= dst->w;
|
|
dst->y *= dst->w;
|
|
dst->z *= dst->w;
|
|
}
|
|
|
|
static inline float srgb_linear_to_nonlinear(float u)
|
|
{
|
|
return (u <= 0.0031308f) ? (12.92f * u)
|
|
: ((1.055f * powf(u, 1.0f / 2.4f)) - 0.055f);
|
|
}
|
|
|
|
static inline uint32_t vec4_to_rgba_srgb(const struct vec4 *src)
|
|
{
|
|
uint32_t val;
|
|
val = (uint32_t)((srgb_linear_to_nonlinear(src->x) * 255.0f) + 0.5f);
|
|
val |= (uint32_t)((srgb_linear_to_nonlinear(src->y) * 255.0f) + 0.5f)
|
|
<< 8;
|
|
val |= (uint32_t)((srgb_linear_to_nonlinear(src->z) * 255.0f) + 0.5f)
|
|
<< 16;
|
|
val |= (uint32_t)((src->w * 255.0f) + 0.5f) << 24;
|
|
return val;
|
|
}
|
|
|
|
static inline uint32_t vec4_to_bgra_srgb(const struct vec4 *src)
|
|
{
|
|
uint32_t val;
|
|
val = (uint32_t)((srgb_linear_to_nonlinear(src->z) * 255.0f) + 0.5f);
|
|
val |= (uint32_t)((srgb_linear_to_nonlinear(src->y) * 255.0f) + 0.5f)
|
|
<< 8;
|
|
val |= (uint32_t)((srgb_linear_to_nonlinear(src->x) * 255.0f) + 0.5f)
|
|
<< 16;
|
|
val |= (uint32_t)((src->w * 255.0f) + 0.5f) << 24;
|
|
return val;
|
|
}
|
|
|
|
static inline void vec4_srgb_linear_to_nonlinear(struct vec4 *dst)
|
|
{
|
|
dst->x = srgb_linear_to_nonlinear(dst->x);
|
|
dst->y = srgb_linear_to_nonlinear(dst->y);
|
|
dst->y = srgb_linear_to_nonlinear(dst->y);
|
|
}
|
|
|
|
EXPORT void vec4_transform(struct vec4 *dst, const struct vec4 *v,
|
|
const struct matrix4 *m);
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|