d5/d00/gamma__lut_8h_source.html

#pragma once


// Compile-time PROGMEM gamma LUT generator for C++11.

//

// Usage:

//   typedef fl::ProgmemLUT<fl::GammaEval<fl::gamma<fl::u8x24>(2.2f)>, 256> Gamma22;

//   uint8_t corrected = Gamma22::read(pixel);

//

// The gamma table is generated entirely at compile time and stored in

// PROGMEM (flash) on AVR/ESP platforms. No runtime floating-point math

// is involved in lookups.

//

// Why integer template parameters:

//   C++11 does not allow float or class-type non-type template parameters.

//   gamma<u8x24>(2.2f) converts the float to a constexpr uint32_t (the

//   raw fixed-point representation), which IS a valid NTTP in C++11.

//   This is why the helper returns an integer: it's the only way to

//   encode a floating-point gamma value in a template parameter in C++11.

//   This approach is portable across all embedded toolchains.


#include "fl/stl/int.h"

#include "fl/math/fixed_point/u8x24.h"

#include "fl/stl/type_traits.h"

#include "fastled_progmem.h"

#include "fl/stl/noexcept.h"


namespace fl {


// ---------- Public API ----------


// Convert a float gamma value to a fixed-point raw integer suitable for
// use as a template parameter. The Fixed type determines the precision.
//
// Template parameter:
//   Fixed - fixed-point type that can be constructed from a float and
//           exposes raw(); the value of raw() is returned as u32.
// Parameter:
//   g     - gamma exponent as a float (e.g. 2.2f).
// Returns:
//   Fixed(g).raw(), i.e. the raw fixed-point encoding of g.
//
// Example: gamma<u8x24>(2.2f) returns constexpr uint32_t
template <typename Fixed>
constexpr u32 gamma(float g) FL_NOEXCEPT {
    return Fixed(g).raw();
}


// Forward declarations

template <u32 GammaRaw> struct GammaEval;

template <typename Fn, fl::size N> struct ProgmemLUT;


// Convenience alias: 256-entry 8-bit gamma table for the raw gamma value G.
// Written purely in terms of the forward declarations above.
// NOTE(review): an identical GammaTable256 alias template is declared again
// in the "Convenience aliases" section further down this header; one of the
// two looks redundant - confirm before removing either.
template <u32 G>
using GammaTable256 = ProgmemLUT<GammaEval<G>, 256>;


// ---------- Constexpr pow implementation (C++11 compatible) ----------

//

// All functions use the single-return-statement form required by C++11

// constexpr. Branching is done via ternary operators, and multi-step

// computations are decomposed into chains of constexpr function calls.


namespace detail {


namespace gamma_constexpr {


// Number of fractional bits used by every fixed-point helper below.
constexpr int FRAC = 24;
// Fixed-point encoding of 1.0 with FRAC fractional bits (2^24 = 16777216).
constexpr u32 SCALE = static_cast<u32>(1) << FRAC;


// ---- Highest-bit finder (constexpr recursive) ----


// Binary-search helper for highest_bit().
// Returns r plus the index of the most significant set bit of v; for v == 0
// or v == 1 the result is simply r. Each test asks whether anything is set
// above the lower part of the remaining window; if so, the upper part is
// shifted down and r is advanced by the same amount.
constexpr int hb_step(u32 v, int r) FL_NOEXCEPT {
    return (v >> 16) ? hb_step(v >> 16, r + 16)
         : (v >> 8)  ? hb_step(v >> 8,  r + 8)
         : (v >> 4)  ? hb_step(v >> 4,  r + 4)
         : (v >> 2)  ? hb_step(v >> 2,  r + 2)
         // Only bits 0..1 can remain here: bit 1 contributes one more step.
         : r + static_cast<int>(v >> 1);
}


// Index (0-based) of the most significant set bit of v, or -1 when v == 0.
constexpr int highest_bit(u32 v) FL_NOEXCEPT {
    return v != 0 ? hb_step(v, 0) : -1;
}


// ---- Fixed-point log2 (signed result, negative for inputs < 1.0) ----

// Uses 4-term minimax polynomial for log2(1+t), t in [0,1).

// Minimax coefficients minimize max error over the full interval,

// unlike Taylor which diverges badly near t=1.


// Extracts the polynomial argument t for log2(1+t).
// val is shifted so that its leading set bit (at index msb) lands on bit
// FRAC, i.e. the value is normalized to [1.0, 2.0) in fixed point; the
// leading 1.0 (SCALE) is then subtracted, leaving t in [0, 1).
constexpr u32 log2_t(u32 val, int msb) FL_NOEXCEPT {
    return (msb < FRAC ? (val << (FRAC - msb))
                       : (val >> (msb - FRAC))) - SCALE;
}


// Horner steps for log2(1+t) polynomial, split into separate

// constexpr functions for C++11 single-return-statement compliance.


// Horner chain for log2(1+t), with t and all coefficients carrying FRAC
// fractional bits:
//   log2(1+t) ~= t*(c0 + t*(c1 + t*(c2 + t*c3)))
// Raw coefficients (value * 2^24):
//   c0 =  24189248  (~  1.44179)
//   c1 = -11728384  (~ -0.69907)
//   c2 =   6098176  (~  0.36348)
//   c3 =  -1788416  (~ -0.10660)
// Each step multiplies by t and shifts right by FRAC to stay in the same
// fixed-point scale. log2_h0 is the entry point; h1..h3 are inner steps.

// Innermost step: t * c3.
constexpr i64 log2_h3(i64 t) FL_NOEXCEPT {
    return (t * -1788416LL) >> FRAC;
}

// t * (c2 + h3).
constexpr i64 log2_h2(i64 t) FL_NOEXCEPT {
    return (t * (log2_h3(t) + 6098176LL)) >> FRAC;
}

// t * (c1 + h2).
constexpr i64 log2_h1(i64 t) FL_NOEXCEPT {
    return (t * (log2_h2(t) + -11728384LL)) >> FRAC;
}

// Outermost step: t * (c0 + h1), the full polynomial value.
constexpr i64 log2_h0(i64 t) FL_NOEXCEPT {
    return (t * (log2_h1(t) + 24189248LL)) >> FRAC;
}


// Fixed-point log2 of val, given the index msb of its highest set bit.
// The result is the sum of
//   - the integer part (msb - FRAC), scaled to fixed point, and
//   - the polynomial approximation of log2(1+t) for the normalized
//     remainder t produced by log2_t().
constexpr i32 log2_with_msb(u32 val, int msb) FL_NOEXCEPT {
    // (msb - FRAC) can be negative, so it is scaled by multiplying with
    // SCALE instead of shifting left: left-shifting a negative value is
    // undefined behavior in C++.
    return static_cast<i32>(
        log2_h0(static_cast<i64>(log2_t(val, msb))) +
        static_cast<i64>(msb - FRAC) * static_cast<i64>(SCALE)
    );
}


// Fixed-point log2 of val (FRAC fractional bits, signed result).
// val == 0 has no logarithm; in that case the bit pattern 0x80000000 is
// returned as a sentinel instead of calling the polynomial path.
constexpr i32 log2_fp(u32 val) FL_NOEXCEPT {
    return val != 0 ? log2_with_msb(val, highest_bit(val))
                    : static_cast<i32>(0x80000000);
}


// ---- Fixed-point exp2 (handles both positive and negative exponents) ----

// Uses 4-term minimax polynomial for 2^t - 1, t in [0,1).

// Minimax coefficients minimize max error over the full interval.


// Horner chain for 2^fr - 1, with fr and all coefficients carrying FRAC
// fractional bits:
//   2^fr - 1 ~= fr*(c0 + fr*(c1 + fr*(c2 + fr*c3)))
// Raw coefficients (value * 2^24):
//   c0 = 11629376  (~ 0.693165)
//   c1 =  4038400  (~ 0.240707)
//   c2 =   895232  (~ 0.053360)
//   c3 =   214016  (~ 0.012756)
// Every step multiplies by fr and shifts right by FRAC to keep the scale.

// Innermost step: fr * c3.
constexpr u64 exp2_h3(u64 fr) FL_NOEXCEPT {
    return (fr * 214016ULL) >> FRAC;
}

// fr * (c2 + h3).
constexpr u64 exp2_h2(u64 fr) FL_NOEXCEPT {
    return (fr * (exp2_h3(fr) + 895232ULL)) >> FRAC;
}

// fr * (c1 + h2).
constexpr u64 exp2_h1(u64 fr) FL_NOEXCEPT {
    return (fr * (exp2_h2(fr) + 4038400ULL)) >> FRAC;
}

// Outermost step: fr * (c0 + h1), i.e. the approximation of 2^fr - 1.
constexpr u64 exp2_h0(u64 fr) FL_NOEXCEPT {
    return (fr * (exp2_h1(fr) + 11629376ULL)) >> FRAC;
}

// 2^fr for a fractional exponent fr: adds the fixed-point 1.0 back onto
// the polynomial value of 2^fr - 1.
constexpr u64 exp2_frac(u64 fr) FL_NOEXCEPT {
    return static_cast<u64>(SCALE) + exp2_h0(fr);
}


// exp2 for non-negative 8.24 fixed-point input.
// Splits x into integer part n = x >> FRAC and fractional part
// f = x & (SCALE - 1) and returns 2^f scaled by 2^n. Once n reaches 8 the
// result no longer fits in a u32 with FRAC fractional bits, so the function
// saturates to 0xFFFFFFFF.
constexpr u32 exp2_pos(u32 x) FL_NOEXCEPT {
    // Multiplying by (SCALE << n) and shifting right by FRAC is exactly a
    // left shift by n. exp2_frac() of a FRAC-bit fraction stays below 2^25
    // and n < 8 here, so the shifted value still fits in 32 bits.
    return (x >> FRAC) < 8
        ? static_cast<u32>(exp2_frac(x & (SCALE - 1)) << (x >> FRAC))
        : 0xFFFFFFFFu;
}


// exp2 for negative input: 2^(-P) = 2^(1-f) >> (n+1)
// where P = n + f, n = integer part, f = fractional part.
// pos_val is the magnitude P in fixed point. When the shift amount n + 1
// would reach 32 (n >= 31) the result is 0.
constexpr u32 exp2_neg(u32 pos_val) FL_NOEXCEPT {
    return (pos_val >> FRAC) < 31
        ? exp2_pos(SCALE - (pos_val & (SCALE - 1)))
              >> ((pos_val >> FRAC) + 1)
        : static_cast<u32>(0);
}


// Fixed-point 2^x for a signed exponent x (FRAC fractional bits).
// Non-negative exponents go to exp2_pos(); negative exponents are passed
// to exp2_neg() as their magnitude.
constexpr u32 exp2_fp(i32 x) FL_NOEXCEPT {
    // The magnitude is computed in unsigned arithmetic. Writing -x would be
    // signed overflow (undefined behavior, and not a constant expression)
    // when x is the most negative i32; 0 - u32(x) is well defined and equals
    // |x| for every negative x. For the most negative x it yields
    // 0x80000000, which exp2_neg() maps to 0.
    return x >= 0 ? exp2_pos(static_cast<u32>(x))
                  : exp2_neg(static_cast<u32>(0) - static_cast<u32>(x));
}


// ---- Fixed-point pow: base^exp via exp2(exp * log2(base)) ----


constexpr u32 pow_fp(u32 base_raw, u32 exp_raw) FL_NOEXCEPT {

    return base_raw == 0     ? 0

         : exp_raw == 0      ? SCALE

         : base_raw == SCALE ? SCALE

         : exp2_fp(static_cast<i32>(

               (static_cast<i64>(exp_raw) *

                static_cast<i64>(log2_fp(base_raw))) >> FRAC

           ));

}


// ---- 8-bit gamma correction for a single pixel value ----
// Computes round(pow(x/255, gamma) * 255) in fixed point:
//   - x is converted to the fixed-point fraction x/255,
//   - raised to gamma_raw via pow_fp(),
//   - scaled by 255, with SCALE/2 added before the final shift so the
//     result is rounded to nearest.
// The endpoints 0 and 255 are returned unchanged without calling pow_fp().
// The final value is narrowed with static_cast<u8>; no explicit clamp is
// applied.
constexpr u8 eval(u8 x, u32 gamma_raw) FL_NOEXCEPT {
    return (x == 0 || x == 255)
        ? x
        : static_cast<u8>(
              (static_cast<u64>(pow_fp(
                   static_cast<u32>((static_cast<u64>(x) << FRAC) / 255),
                   gamma_raw
               )) * 255u + (SCALE / 2)) >> FRAC
          );
}


// ---- 16-bit gamma correction for a single pixel value ----
// Computes round(pow(x/255, gamma) * 65535) in fixed point, following the
// same steps as the 8-bit variant but scaling to the 16-bit range.
// Input 0 maps to 0 and input 255 maps to 65535 without calling pow_fp().
// The final value is narrowed with static_cast<u16>; no explicit clamp is
// applied.
// Used by five-bit brightness and HD108 pipelines.
constexpr u16 eval16(u8 x, u32 gamma_raw) FL_NOEXCEPT {
    return x == 255 ? static_cast<u16>(0xFFFF)
         : x == 0   ? static_cast<u16>(0)
         : static_cast<u16>(
               (static_cast<u64>(pow_fp(
                    static_cast<u32>((static_cast<u64>(x) << FRAC) / 255),
                    gamma_raw
                )) * 65535u + (SCALE / 2)) >> FRAC
           );
}


} // namespace gamma_constexpr


} // namespace detail


// ---------- GammaEval functors ----------

// Compile-time gamma evaluation functors. GammaRaw is a fixed-point

// raw value obtained from gamma<u8x24>(float_value).


// 8-bit output: input u8 [0,255] → output u8 [0,255]
// Stateless functor; GammaRaw is the raw fixed-point gamma exponent that is
// forwarded unchanged to detail::gamma_constexpr::eval().
template <u32 GammaRaw>
struct GammaEval {
    // Returns the gamma-corrected 8-bit value for input x.
    constexpr u8 operator()(u8 x) const FL_NOEXCEPT {
        return detail::gamma_constexpr::eval(x, GammaRaw);
    }
};


// 16-bit output: input u8 [0,255] → output u16 [0,65535]
// Use this for five-bit brightness and HD108 pipelines.
// Stateless functor; GammaRaw is the raw fixed-point gamma exponent that is
// forwarded unchanged to detail::gamma_constexpr::eval16().
template <u32 GammaRaw>
struct GammaEval16 {
    // Returns the gamma-corrected 16-bit value for input x.
    constexpr u16 operator()(u8 x) const FL_NOEXCEPT {
        return detail::gamma_constexpr::eval16(x, GammaRaw);
    }
};


// ---------- ProgmemLUT generators ----------


namespace detail {


// Plain aggregate wrapping a fixed-size array of N elements of type T.
// Used as the return type of the make_lut_* helpers and as the storage type
// of the lookup tables below.
template <typename T, fl::size N>
struct LutArray {
    T values[N];  // table entries, indexed by input value
};


// Builds a u8 lookup table with one entry per index in Is.
// Entry i holds Fn()(static_cast<u8>(i)): a default-constructed Fn is
// invoked on each index after narrowing it to u8.
template <typename Fn, fl::size... Is>
constexpr LutArray<u8, sizeof...(Is)>
make_lut_u8(fl::index_sequence<Is...>) FL_NOEXCEPT {
    return LutArray<u8, sizeof...(Is)>{ { Fn()(static_cast<u8>(Is))... } };
}


// Builds a u16 lookup table with one entry per index in Is.
// Entry i holds Fn()(static_cast<u8>(i)): a default-constructed Fn is
// invoked on each index after narrowing it to u8.
template <typename Fn, fl::size... Is>
constexpr LutArray<u16, sizeof...(Is)>
make_lut_u16(fl::index_sequence<Is...>) FL_NOEXCEPT {
    return LutArray<u16, sizeof...(Is)>{ { Fn()(static_cast<u8>(Is))... } };
}


} // namespace detail


// 8-bit PROGMEM lookup table (u8 input → u8 output).
// Fn must be a functor with constexpr operator()(u8) returning u8.
// N is the number of table entries.
template <typename Fn, fl::size N>
struct ProgmemLUT {

    // Returns table entry `index`, read through FL_PGM_READ_BYTE_NEAR.
    // NOTE: index is not range-checked against N; callers must pass
    // index < N.
    static u8 read(u8 index) FL_NOEXCEPT {
        return FL_PGM_READ_BYTE_NEAR(&kData.values[index]);
    }

    // Table storage; defined out of class below this struct.
    static const detail::LutArray<u8, N> kData;
};


// Out-of-class definition of ProgmemLUT's table, marked FL_PROGMEM.
// The contents come from make_lut_u8<Fn> applied to
// fl::make_index_sequence<N> (presumably the indices 0..N-1, as with
// std::make_index_sequence - confirm in fl/stl/type_traits.h).
template <typename Fn, fl::size N>
const detail::LutArray<u8, N>
ProgmemLUT<Fn, N>::kData FL_PROGMEM =
    detail::make_lut_u8<Fn>(fl::make_index_sequence<N>{});


// 16-bit PROGMEM lookup table (u8 input → u16 output).
// Fn must be a functor with constexpr operator()(u8) returning u16.
// Used by five-bit brightness and HD108 gamma pipelines.
// N is the number of table entries.
template <typename Fn, fl::size N>
struct ProgmemLUT16 {

    // Returns table entry `index`, read through FL_PGM_READ_WORD_NEAR.
    // NOTE: index is not range-checked against N; callers must pass
    // index < N.
    static u16 read(u8 index) FL_NOEXCEPT {
        return FL_PGM_READ_WORD_NEAR(&kData.values[index]);
    }

    // Direct access to the raw PROGMEM array for hot-loop usage
    // (avoids per-element function call overhead).
    // Returns a pointer to the first entry of kData.values.
    static const u16* data() FL_NOEXCEPT { return kData.values; }

    // Table storage; defined out of class below this struct.
    static const detail::LutArray<u16, N> kData;
};


// Out-of-class definition of ProgmemLUT16's table, marked FL_PROGMEM and
// declared with FL_ALIGN_PROGMEM(64).
// The contents come from make_lut_u16<Fn> applied to
// fl::make_index_sequence<N> (presumably the indices 0..N-1, as with
// std::make_index_sequence - confirm in fl/stl/type_traits.h).
template <typename Fn, fl::size N>
FL_ALIGN_PROGMEM(64) const detail::LutArray<u16, N>
ProgmemLUT16<Fn, N>::kData FL_PROGMEM =
    detail::make_lut_u16<Fn>(fl::make_index_sequence<N>{});


// ---------- Convenience aliases ----------


// 256-entry 8-bit gamma table for the raw gamma value G.
// NOTE(review): this repeats, token for token, the GammaTable256 alias
// template already declared right after the forward declarations near the
// top of this header; one of the two looks redundant - confirm before
// removing either.
template <u32 G>
using GammaTable256 = ProgmemLUT<GammaEval<G>, 256>;


// 256-entry 16-bit gamma table (for five-bit brightness, HD108).
// G is the raw fixed-point gamma value, e.g. gamma<u8x24>(2.2f).
template <u32 G>
using GammaTable16_256 = ProgmemLUT16<GammaEval16<G>, 256>;


// ---------- Pre-defined gamma tables ----------


// 8-bit gamma tables (u8 input → u8 output), 256 entries each,
// for gamma 2.2 and gamma 2.8.
// Usage: uint8_t corrected = fl::Gamma22LUT::read(pixel);
using Gamma22LUT = ProgmemLUT<GammaEval<gamma<u8x24>(2.2f)>, 256>;
using Gamma28LUT = ProgmemLUT<GammaEval<gamma<u8x24>(2.8f)>, 256>;

// 16-bit gamma tables (u8 input → u16 output), 256 entries each,
// for gamma 2.2 and gamma 2.8.
// Usage: uint16_t val = fl::Gamma22LUT16::read(pixel);
using Gamma22LUT16 = ProgmemLUT16<GammaEval16<gamma<u8x24>(2.2f)>, 256>;
using Gamma28LUT16 = ProgmemLUT16<GammaEval16<gamma<u8x24>(2.8f)>, 256>;


// Explicit instantiation declaration for the most commonly used LUT.

// Suppresses per-TU ~6KB _GLOBAL__sub_I_ init blocks across all modules.

// Definition lives in gamma_lut.cpp.hpp (compiled once in fl.gfx+).

// Other LUT variants are instantiated implicitly on demand.

extern template struct ProgmemLUT16<GammaEval16<gamma<u8x24>(2.8f)>, 256>;


} // namespace fl

FL_ALIGN_PROGMEM
#define FL_ALIGN_PROGMEM(N)
Force N-byte alignment for platforms with unaligned access or cache-line optimization.
Definition fastled_progmem.h:139

FL_PGM_READ_BYTE_NEAR
#define FL_PGM_READ_BYTE_NEAR(x)
Read a byte (8-bit) from PROGMEM memory.
Definition fastled_progmem.h:86

FL_PGM_READ_WORD_NEAR
#define FL_PGM_READ_WORD_NEAR(x)
Read a word (16-bit) from PROGMEM memory.
Definition fastled_progmem.h:88

FL_PROGMEM
#define FL_PROGMEM
PROGMEM keyword for storage.
Definition fastled_progmem.h:71

fastled_progmem.h
Wrapper definitions to allow seamless use of PROGMEM in environments that have it.

int.h

fl::detail::gamma_constexpr::eval16
constexpr u16 eval16(u8 x, u32 gamma_raw) FL_NOEXCEPT
Definition gamma_lut.h:189

fl::detail::gamma_constexpr::pow_fp
constexpr u32 pow_fp(u32 base_raw, u32 exp_raw) FL_NOEXCEPT
Definition gamma_lut.h:161

fl::detail::gamma_constexpr::SCALE
constexpr u32 SCALE
Definition gamma_lut.h:58

fl::detail::gamma_constexpr::log2_h1
constexpr i64 log2_h1(i64 t) FL_NOEXCEPT
Definition gamma_lut.h:94

fl::detail::gamma_constexpr::log2_fp
constexpr i32 log2_fp(u32 val) FL_NOEXCEPT
Definition gamma_lut.h:110

fl::detail::gamma_constexpr::exp2_h3
constexpr u64 exp2_h3(u64 fr) FL_NOEXCEPT
Definition gamma_lut.h:119

fl::detail::gamma_constexpr::exp2_pos
constexpr u32 exp2_pos(u32 x) FL_NOEXCEPT
Definition gamma_lut.h:136

fl::detail::gamma_constexpr::highest_bit
constexpr int highest_bit(u32 v) FL_NOEXCEPT
Definition gamma_lut.h:71

fl::detail::gamma_constexpr::exp2_h0
constexpr u64 exp2_h0(u64 fr) FL_NOEXCEPT
Definition gamma_lut.h:128

fl::detail::gamma_constexpr::exp2_fp
constexpr u32 exp2_fp(i32 x) FL_NOEXCEPT
Definition gamma_lut.h:154

fl::detail::gamma_constexpr::log2_t
constexpr u32 log2_t(u32 val, int msb) FL_NOEXCEPT
Definition gamma_lut.h:80

fl::detail::gamma_constexpr::exp2_frac
constexpr u64 exp2_frac(u64 fr) FL_NOEXCEPT
Definition gamma_lut.h:131

fl::detail::gamma_constexpr::log2_h3
constexpr i64 log2_h3(i64 t) FL_NOEXCEPT
Definition gamma_lut.h:88

fl::detail::gamma_constexpr::log2_h0
constexpr i64 log2_h0(i64 t) FL_NOEXCEPT
Definition gamma_lut.h:97

fl::detail::gamma_constexpr::FRAC
constexpr int FRAC
Definition gamma_lut.h:57

fl::detail::gamma_constexpr::exp2_h2
constexpr u64 exp2_h2(u64 fr) FL_NOEXCEPT
Definition gamma_lut.h:122

fl::detail::gamma_constexpr::exp2_h1
constexpr u64 exp2_h1(u64 fr) FL_NOEXCEPT
Definition gamma_lut.h:125

fl::detail::gamma_constexpr::log2_with_msb
constexpr i32 log2_with_msb(u32 val, int msb) FL_NOEXCEPT
Definition gamma_lut.h:101

fl::detail::gamma_constexpr::eval
constexpr u8 eval(u8 x, u32 gamma_raw) FL_NOEXCEPT
Definition gamma_lut.h:174

fl::detail::gamma_constexpr::exp2_neg
constexpr u32 exp2_neg(u32 pos_val) FL_NOEXCEPT
Definition gamma_lut.h:146

fl::detail::gamma_constexpr::hb_step
constexpr int hb_step(u32 v, int r) FL_NOEXCEPT
Definition gamma_lut.h:62

fl::detail::gamma_constexpr::log2_h2
constexpr i64 log2_h2(i64 t) FL_NOEXCEPT
Definition gamma_lut.h:91

fl::detail::gamma_constexpr
Definition gamma_lut.h:55

fl::detail::make_lut_u16
constexpr LutArray< u16, sizeof...(Is)> make_lut_u16(fl::index_sequence< Is... >) FL_NOEXCEPT
Definition gamma_lut.h:241

fl::detail::make_lut_u8
constexpr LutArray< u8, sizeof...(Is)> make_lut_u8(fl::index_sequence< Is... >) FL_NOEXCEPT
Definition gamma_lut.h:235

fl::detail
Compile-time linker keep-alive hook for a single fl::Bus.
Definition bus_traits.h:48

fl::detail::LutArray::values
T values[N]
Definition gamma_lut.h:230

fl::detail::LutArray
Definition gamma_lut.h:229

fl::fl::make_index_sequence
typename make_index_sequence_impl< N >::type make_index_sequence
Definition s16x16x4.h:1168

fl::x
x
Definition transposition.cpp.hpp:24

fl::u8
unsigned char u8
Definition stdint.h:131

fl::kData
const detail::LutArray< u8, N > ProgmemLUT< Fn, N >::kData
Definition gamma_lut.h:260

fl::Gamma28LUT
ProgmemLUT< GammaEval< gamma< u8x24 >(2.8f)>, 256 > Gamma28LUT
Definition gamma_lut.h:299

fl::Gamma22LUT16
ProgmemLUT16< GammaEval16< gamma< u8x24 >(2.2f)>, 256 > Gamma22LUT16
Definition gamma_lut.h:303

fl::GammaTable16_256
ProgmemLUT16< GammaEval16< G >, 256 > GammaTable16_256
Definition gamma_lut.h:292

fl::i64
fl::i64 i64
Definition s16x16x4.h:222

fl::gamma
constexpr u32 gamma(float g) FL_NOEXCEPT
Definition gamma_lut.h:36

fl::t
t
Definition transposition.cpp.hpp:27

fl::make_index_sequence
typename make_index_sequence_impl< N >::type make_index_sequence
Definition type_traits.h:1168

fl::GammaTable256
ProgmemLUT< GammaEval< G >, 256 > GammaTable256
Definition gamma_lut.h:46

fl::u64
fl::u64 u64
Definition s16x16x4.h:221

fl::Gamma28LUT16
ProgmemLUT16< GammaEval16< gamma< u8x24 >(2.8f)>, 256 > Gamma28LUT16
Definition gamma_lut.h:304

fl::Gamma22LUT
ProgmemLUT< GammaEval< gamma< u8x24 >(2.2f)>, 256 > Gamma22LUT
Definition gamma_lut.h:298

fl
Base definition for an LED controller.
Definition crgb.hpp:179

noexcept.h

FL_NOEXCEPT
#define FL_NOEXCEPT

fl::GammaEval16::operator()
constexpr u16 operator()(u8 x) const FL_NOEXCEPT
Definition gamma_lut.h:219

fl::GammaEval16
Definition gamma_lut.h:218

fl::GammaEval::operator()
constexpr u8 operator()(u8 x) const FL_NOEXCEPT
Definition gamma_lut.h:210

fl::GammaEval
Definition gamma_lut.h:209

fl::ProgmemLUT16< GammaEval16< G >, 256 >::kData
static const detail::LutArray< u16, N > kData
Definition gamma_lut.h:276

fl::ProgmemLUT16::read
static u16 read(u8 index) FL_NOEXCEPT
Definition gamma_lut.h:268

fl::ProgmemLUT16::data
static const u16 * data() FL_NOEXCEPT
Definition gamma_lut.h:274

fl::ProgmemLUT16
Definition gamma_lut.h:267

fl::ProgmemLUT::read
static u8 read(u8 index) FL_NOEXCEPT
Definition gamma_lut.h:251

fl::ProgmemLUT< GammaEval< G >, 256 >::kData
static const detail::LutArray< u8, N > kData
Definition gamma_lut.h:255

fl::ProgmemLUT
Definition gamma_lut.h:250

fl::fl::index_sequence
Definition s16x16x4.h:1154

type_traits.h

u8x24.h