mirror of
https://github.com/CloverHackyColor/CloverBootloader.git
synced 2024-11-14 10:05:43 +01:00
284 lines
8.5 KiB
C
284 lines
8.5 KiB
C
|
/* pam.h - pam (portable alpha map) utility library
|
||
|
**
|
||
|
** Colormap routines.
|
||
|
**
|
||
|
** Copyright (C) 1989, 1991 by Jef Poskanzer.
|
||
|
** Copyright (C) 1997 by Greg Roelofs.
|
||
|
**
|
||
|
** Permission to use, copy, modify, and distribute this software and its
|
||
|
** documentation for any purpose and without fee is hereby granted, provided
|
||
|
** that the above copyright notice appear in all copies and that both that
|
||
|
** copyright notice and this permission notice appear in supporting
|
||
|
** documentation. This software is provided "as is" without express or
|
||
|
** implied warranty.
|
||
|
*/
|
||
|
|
||
|
#ifndef PAM_H
|
||
|
#define PAM_H
|
||
|
|
||
|
// accidental debug assertions make color search much slower,
|
||
|
// so force assertions off if there's no explicit setting
|
||
|
#if !defined(NDEBUG) && !defined(DEBUG)
|
||
|
#define NDEBUG
|
||
|
#endif
|
||
|
|
||
|
#include <math.h>
|
||
|
#include <assert.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <stdbool.h>
|
||
|
|
||
|
#ifndef MAX
|
||
|
# define MAX(a,b) ((a) > (b)? (a) : (b))
|
||
|
# define MIN(a,b) ((a) < (b)? (a) : (b))
|
||
|
#endif
|
||
|
|
||
|
#define MAX_DIFF 1e20
|
||
|
|
||
|
#ifndef USE_SSE
|
||
|
# if defined(__SSE__) && (defined(__amd64__) || defined(__X86_64__) || defined(_WIN64) || defined(WIN32) || defined(__WIN32__))
|
||
|
# define USE_SSE 1
|
||
|
# else
|
||
|
# define USE_SSE 0
|
||
|
# endif
|
||
|
#endif
|
||
|
|
||
|
#if USE_SSE
|
||
|
# include <xmmintrin.h>
|
||
|
# ifdef _MSC_VER
|
||
|
# include <intrin.h>
|
||
|
# define SSE_ALIGN
|
||
|
# else
|
||
|
# define SSE_ALIGN __attribute__ ((aligned (16)))
|
||
|
# if defined(__i386__) && defined(__PIC__)
|
||
|
# define cpuid(func,ax,bx,cx,dx)\
|
||
|
__asm__ __volatile__ ( \
|
||
|
"push %%ebx\n" \
|
||
|
"cpuid\n" \
|
||
|
"mov %%ebx, %1\n" \
|
||
|
"pop %%ebx\n" \
|
||
|
: "=a" (ax), "=r" (bx), "=c" (cx), "=d" (dx) \
|
||
|
: "a" (func));
|
||
|
# else
|
||
|
# define cpuid(func,ax,bx,cx,dx)\
|
||
|
__asm__ __volatile__ ("cpuid":\
|
||
|
"=a" (ax), "=b" (bx), "=c" (cx), "=d" (dx) : "a" (func));
|
||
|
# endif
|
||
|
#endif
|
||
|
#else
|
||
|
# define SSE_ALIGN
|
||
|
#endif
|
||
|
|
||
|
#ifndef _MSC_VER
|
||
|
#define LIQ_ARRAY(type, var, count) type var[count]
|
||
|
#else
|
||
|
#define LIQ_ARRAY(type, var, count) type* var = (type*)_alloca(sizeof(type)*(count))
|
||
|
#endif
|
||
|
|
||
|
#if defined(__GNUC__) || defined (__llvm__)
|
||
|
#define ALWAYS_INLINE __attribute__((always_inline)) inline
|
||
|
#define NEVER_INLINE __attribute__ ((noinline))
|
||
|
#elif defined(_MSC_VER)
|
||
|
#define inline __inline
|
||
|
#define restrict __restrict
|
||
|
#define ALWAYS_INLINE __forceinline
|
||
|
#define NEVER_INLINE __declspec(noinline)
|
||
|
#else
|
||
|
#define ALWAYS_INLINE inline
|
||
|
#define NEVER_INLINE
|
||
|
#endif
|
||
|
|
||
|
/* from pam.h */
|
||
|
|
||
|
typedef struct {
|
||
|
unsigned char r, g, b, a;
|
||
|
} rgba_pixel;
|
||
|
|
||
|
typedef struct {
|
||
|
float a, r, g, b;
|
||
|
} SSE_ALIGN f_pixel;
|
||
|
|
||
|
static const float internal_gamma = 0.5499f;
|
||
|
|
||
|
LIQ_PRIVATE void to_f_set_gamma(float gamma_lut[], const double gamma);
|
||
|
|
||
|
/**
|
||
|
Converts 8-bit color to internal gamma and premultiplied alpha.
|
||
|
(premultiplied color space is much better for blending of semitransparent colors)
|
||
|
*/
|
||
|
ALWAYS_INLINE static f_pixel rgba_to_f(const float gamma_lut[], const rgba_pixel px);
|
||
|
inline static f_pixel rgba_to_f(const float gamma_lut[], const rgba_pixel px)
|
||
|
{
|
||
|
float a = px.a/255.f;
|
||
|
|
||
|
return (f_pixel) {
|
||
|
.a = a,
|
||
|
.r = gamma_lut[px.r]*a,
|
||
|
.g = gamma_lut[px.g]*a,
|
||
|
.b = gamma_lut[px.b]*a,
|
||
|
};
|
||
|
}
|
||
|
|
||
|
inline static rgba_pixel f_to_rgb(const float gamma, const f_pixel px)
|
||
|
{
|
||
|
if (px.a < 1.f/256.f) {
|
||
|
return (rgba_pixel){0,0,0,0};
|
||
|
}
|
||
|
|
||
|
float r = px.r / px.a,
|
||
|
g = px.g / px.a,
|
||
|
b = px.b / px.a,
|
||
|
a = px.a;
|
||
|
|
||
|
r = powf(r, gamma/internal_gamma);
|
||
|
g = powf(g, gamma/internal_gamma);
|
||
|
b = powf(b, gamma/internal_gamma);
|
||
|
|
||
|
// 256, because numbers are in range 1..255.9999… rounded down
|
||
|
r *= 256.f;
|
||
|
g *= 256.f;
|
||
|
b *= 256.f;
|
||
|
a *= 256.f;
|
||
|
|
||
|
return (rgba_pixel){
|
||
|
.r = r>=255.f ? 255 : r,
|
||
|
.g = g>=255.f ? 255 : g,
|
||
|
.b = b>=255.f ? 255 : b,
|
||
|
.a = a>=255.f ? 255 : a,
|
||
|
};
|
||
|
}
|
||
|
|
||
|
ALWAYS_INLINE static double colordifference_ch(const double x, const double y, const double alphas);
|
||
|
inline static double colordifference_ch(const double x, const double y, const double alphas)
|
||
|
{
|
||
|
// maximum of channel blended on white, and blended on black
|
||
|
// premultiplied alpha and backgrounds 0/1 shorten the formula
|
||
|
const double black = x-y, white = black+alphas;
|
||
|
return MAX(black*black, white*white);
|
||
|
}
|
||
|
|
||
|
ALWAYS_INLINE static float colordifference_stdc(const f_pixel px, const f_pixel py);
|
||
|
inline static float colordifference_stdc(const f_pixel px, const f_pixel py)
|
||
|
{
|
||
|
// px_b.rgb = px.rgb + 0*(1-px.a) // blend px on black
|
||
|
// px_b.a = px.a + 1*(1-px.a)
|
||
|
// px_w.rgb = px.rgb + 1*(1-px.a) // blend px on white
|
||
|
// px_w.a = px.a + 1*(1-px.a)
|
||
|
|
||
|
// px_b.rgb = px.rgb // difference same as in opaque RGB
|
||
|
// px_b.a = 1
|
||
|
// px_w.rgb = px.rgb - px.a // difference simplifies to formula below
|
||
|
// px_w.a = 1
|
||
|
|
||
|
// (px.rgb - px.a) - (py.rgb - py.a)
|
||
|
// (px.rgb - py.rgb) + (py.a - px.a)
|
||
|
|
||
|
const double alphas = py.a-px.a;
|
||
|
return colordifference_ch(px.r, py.r, alphas) +
|
||
|
colordifference_ch(px.g, py.g, alphas) +
|
||
|
colordifference_ch(px.b, py.b, alphas);
|
||
|
}
|
||
|
|
||
|
ALWAYS_INLINE static float colordifference(f_pixel px, f_pixel py);
|
||
|
inline static float colordifference(f_pixel px, f_pixel py)
|
||
|
{
|
||
|
#if USE_SSE
|
||
|
const __m128 vpx = _mm_load_ps((const float*)&px);
|
||
|
const __m128 vpy = _mm_load_ps((const float*)&py);
|
||
|
|
||
|
// y.a - x.a
|
||
|
__m128 alphas = _mm_sub_ss(vpy, vpx);
|
||
|
alphas = _mm_shuffle_ps(alphas,alphas,0); // copy first to all four
|
||
|
|
||
|
__m128 onblack = _mm_sub_ps(vpx, vpy); // x - y
|
||
|
__m128 onwhite = _mm_add_ps(onblack, alphas); // x - y + (y.a - x.a)
|
||
|
|
||
|
onblack = _mm_mul_ps(onblack, onblack);
|
||
|
onwhite = _mm_mul_ps(onwhite, onwhite);
|
||
|
const __m128 max = _mm_max_ps(onwhite, onblack);
|
||
|
|
||
|
// add rgb, not a
|
||
|
const __m128 maxhl = _mm_movehl_ps(max, max);
|
||
|
const __m128 tmp = _mm_add_ps(max, maxhl);
|
||
|
const __m128 sum = _mm_add_ss(maxhl, _mm_shuffle_ps(tmp, tmp, 1));
|
||
|
|
||
|
const float res = _mm_cvtss_f32(sum);
|
||
|
assert(fabs(res - colordifference_stdc(px,py)) < 0.001);
|
||
|
return res;
|
||
|
#else
|
||
|
return colordifference_stdc(px,py);
|
||
|
#endif
|
||
|
}
|
||
|
|
||
|
/* from pamcmap.h */
|
||
|
union rgba_as_int {
|
||
|
rgba_pixel rgba;
|
||
|
unsigned int l;
|
||
|
};
|
||
|
|
||
|
typedef struct {
|
||
|
f_pixel acolor;
|
||
|
float adjusted_weight, // perceptual weight changed to tweak how mediancut selects colors
|
||
|
perceptual_weight; // number of pixels weighted by importance of different areas of the picture
|
||
|
|
||
|
float color_weight; // these two change every time histogram subset is sorted
|
||
|
union {
|
||
|
unsigned int sort_value;
|
||
|
unsigned char likely_colormap_index;
|
||
|
} tmp;
|
||
|
} hist_item;
|
||
|
|
||
|
typedef struct {
|
||
|
hist_item *achv;
|
||
|
void (*free)(void*);
|
||
|
double total_perceptual_weight;
|
||
|
unsigned int size;
|
||
|
unsigned int ignorebits;
|
||
|
} histogram;
|
||
|
|
||
|
typedef struct {
|
||
|
f_pixel acolor;
|
||
|
float popularity;
|
||
|
bool fixed; // if true it's user-supplied and must not be changed (e.g in K-Means iteration)
|
||
|
} colormap_item;
|
||
|
|
||
|
typedef struct colormap {
|
||
|
unsigned int colors;
|
||
|
void* (*malloc)(size_t);
|
||
|
void (*free)(void*);
|
||
|
colormap_item palette[];
|
||
|
} colormap;
|
||
|
|
||
|
struct acolorhist_arr_item {
|
||
|
union rgba_as_int color;
|
||
|
unsigned int perceptual_weight;
|
||
|
};
|
||
|
|
||
|
struct acolorhist_arr_head {
|
||
|
struct acolorhist_arr_item inline1, inline2;
|
||
|
unsigned int used, capacity;
|
||
|
struct acolorhist_arr_item *other_items;
|
||
|
};
|
||
|
|
||
|
struct acolorhash_table {
|
||
|
struct mempool *mempool;
|
||
|
unsigned int ignorebits, maxcolors, colors, cols, rows;
|
||
|
unsigned int hash_size;
|
||
|
unsigned int freestackp;
|
||
|
struct acolorhist_arr_item *freestack[512];
|
||
|
struct acolorhist_arr_head buckets[];
|
||
|
};
|
||
|
|
||
|
LIQ_PRIVATE void pam_freeacolorhash(struct acolorhash_table *acht);
|
||
|
LIQ_PRIVATE struct acolorhash_table *pam_allocacolorhash(unsigned int maxcolors, unsigned int surface, unsigned int ignorebits, void* (*malloc)(size_t), void (*free)(void*));
|
||
|
LIQ_PRIVATE histogram *pam_acolorhashtoacolorhist(const struct acolorhash_table *acht, const double gamma, void* (*malloc)(size_t), void (*free)(void*));
|
||
|
LIQ_PRIVATE bool pam_computeacolorhash(struct acolorhash_table *acht, const rgba_pixel *const pixels[], unsigned int cols, unsigned int rows, const unsigned char *importance_map);
|
||
|
LIQ_PRIVATE bool pam_add_to_hash(struct acolorhash_table *acht, unsigned int hash, unsigned int boost, union rgba_as_int px, unsigned int row, unsigned int rows);
|
||
|
|
||
|
LIQ_PRIVATE void pam_freeacolorhist(histogram *h);
|
||
|
|
||
|
LIQ_PRIVATE colormap *pam_colormap(unsigned int colors, void* (*malloc)(size_t), void (*free)(void*));
|
||
|
LIQ_PRIVATE colormap *pam_duplicate_colormap(colormap *map);
|
||
|
LIQ_PRIVATE void pam_freecolormap(colormap *c);
|
||
|
|
||
|
#endif
|