summary refs log tree commit diff
path: root/Libraries/LibGfx/Gamma.h
diff options
context:
space:
mode:
Diffstat (limited to 'Libraries/LibGfx/Gamma.h')
-rw-r--r-- Libraries/LibGfx/Gamma.h 62
1 files changed, 23 insertions, 39 deletions
diff --git a/Libraries/LibGfx/Gamma.h b/Libraries/LibGfx/Gamma.h
index 0ef95b5f48..f6be93b8fe 100644
--- a/Libraries/LibGfx/Gamma.h
+++ b/Libraries/LibGfx/Gamma.h
@@ -30,6 +30,8 @@
#include <math.h>
#include <xmmintrin.h>
+#include <AK/SIMD.h>
+
#define GAMMA 2.2
// Most computer graphics are stored in the sRGB color space, which stores something close to
@@ -50,27 +52,28 @@
namespace Gfx {
+using AK::SIMD::f32x4;
+
#ifndef NO_FPU
# ifdef __SSE__
-// A vector of 4 floats, aligned for SSE instructions
-typedef float v4sf __attribute__((vector_size(16)));
-
-// Transform v4sf from gamma2.2 space to linear space
+// Transform f32x4 from gamma2.2 space to linear space
// Assumes x is in range [0, 1]
// FIXME: Remove this hack once clang-11 is available as the default in Github Actions.
// This is apparently sometime mid-December. https://github.com/actions/virtual-environments/issues/2130
# if !defined(__clang__) || __clang_major__ >= 11
-constexpr v4sf gamma_to_linear4(v4sf x)
+constexpr f32x4 gamma_to_linear4(f32x4 x)
# else
-inline v4sf gamma_to_linear4(v4sf x)
+inline f32x4 gamma_to_linear4(f32x4 x)
# endif
{
return (0.8f + 0.2f * x) * x * x;
}
-inline v4sf linear_to_gamma4(v4sf x)
+// Transform f32x4 from linear space to gamma2.2 space
+// Assumes x is in range [0, 1]
+inline f32x4 linear_to_gamma4(f32x4 x)
{
// Source for approximation: https://mimosa-pudica.net/fast-gamma/
constexpr float a = 0.00279491f;
@@ -81,59 +84,29 @@ inline v4sf linear_to_gamma4(v4sf x)
// Linearize v1 and v2, lerp them by mix factor, then convert back.
// The output is entirely v1 when mix = 0 and entirely v2 when mix = 1
-inline v4sf gamma_accurate_lerp4(v4sf v1, v4sf v2, float mix)
+inline f32x4 gamma_accurate_lerp4(f32x4 v1, f32x4 v2, float mix)
{
return linear_to_gamma4(gamma_to_linear4(v1) * (1 - mix) + gamma_to_linear4(v2) * mix);
}
-// Convert a and b to linear space, blend them by mix factor, then convert back using sse1.
-// The output is entirely a when mix = 0 and entirely b when mix = 1
-inline Color gamma_accurate_blend4(Color a, Color b, float mix)
-{
- v4sf ac = {
- (float)a.red(),
- (float)a.green(),
- (float)a.blue(),
- 0.f,
- };
- v4sf bc = {
- (float)b.red(),
- (float)b.green(),
- (float)b.blue(),
- 0.f,
- };
- v4sf out = 255.f * gamma_accurate_lerp4(ac / 255.f, bc / 255.f, mix);
- return Color(out[0], out[1], out[2]);
-}
-
# endif
// Transform scalar from gamma2.2 space to linear space
// Assumes x is in range [0, 1]
constexpr float gamma_to_linear(float x)
{
-# ifdef ACCURATE_GAMMA_ADJUSTMENT
- // Slower, but more accurate
- return pow(x, GAMMA);
-# else
return (0.8 + 0.2 * x) * x * x;
-# endif
}
// Transform scalar from linear space to gamma2.2 space
// Assumes x is in range [0, 1]
inline float linear_to_gamma(float x)
{
-# ifdef ACCURATE_GAMMA_ADJUSTMENT
- // Slower, but more accurate
- return pow(x, 1. / GAMMA);
-# else
// Source for approximation: https://mimosa-pudica.net/fast-gamma/
constexpr float a = 0.00279491;
constexpr float b = 1.15907984;
float c = (b / sqrt(1 + a)) - 1;
return ((b / __builtin_sqrt(x + a)) - c) * x;
-# endif
}
// Linearize v1 and v2, lerp them by mix factor, then convert back.
@@ -148,7 +121,18 @@ inline float gamma_accurate_lerp(float v1, float v2, float mix)
inline Color gamma_accurate_blend(Color a, Color b, float mix)
{
# ifdef __SSE__
- return gamma_accurate_blend4(a, b, mix);
+ f32x4 ac = {
+ (float)a.red(),
+ (float)a.green(),
+ (float)a.blue(),
+ };
+ f32x4 bc = {
+ (float)b.red(),
+ (float)b.green(),
+ (float)b.blue(),
+ };
+ f32x4 out = 255.f * gamma_accurate_lerp4(ac * (1.f / 255.f), bc * (1.f / 255.f), mix);
+ return Color(out[0], out[1], out[2]);
# else
return {
static_cast<u8>(255. * gamma_accurate_lerp(a.red() / 255., b.red() / 255., mix)),