FastLED 3.9.15
Loading...
Searching...
No Matches

◆ aligned_ptr() [2/2]

template<typename T, fl::size_t N>
fl::fl::aligned_ptr< T, N >::aligned_ptr ( T * p)
inline explicit

Definition at line 167 of file s16x16x4.h.

178{
179
180// Forward declaration for cross-type operations
181struct s0x32x4;
182
185struct s16x16x4 {
186 simd::simd_u32x4 raw; // 4× i32 values in Q16 format
187
188 // ---- Construction ------------------------------------------------------
189
192 result.raw = r;
193 return result;
194 }
195
196 // Load 4 s16x16 values from memory (unaligned access supported)
198 return from_raw(simd::platforms::load_u32_4(reinterpret_cast<const u32*>(ptr))); // ok reinterpret cast
199 }
200
201 // Store the 4 s16x16 lanes held in `raw` to memory starting at `ptr` (unaligned access supported)
202 FASTLED_FORCE_INLINE void store(s16x16* ptr) const {
203 simd::platforms::store_u32_4(reinterpret_cast<u32*>(ptr), raw); // ok reinterpret cast
204 }
205
206 // Broadcast single s16x16 value to all 4 lanes
208 return from_raw(simd::platforms::set1_u32_4(static_cast<u32>(value.raw())));
209 }
210
211 // ---- SIMD arithmetic (s16x16x4 OP s16x16x4 → s16x16x4) -----------------
212
214 return from_raw(simd::add_i32_4(raw, b.raw));
215 }
216
218 return from_raw(simd::sub_i32_4(raw, b.raw));
219 }
220
222 // Q16 × Q16 = Q32 → shift right 16 → Q16
223 return from_raw(simd::mulhi_i32_4(raw, b.raw));
224 }
225
227 // Unary negation: -x = 0 - x
228 auto zero = simd::set1_u32_4(0);
230 }
231
234 }
235
238 }
239
240 // Cross-type multiply: s16x16x4 × s0x32x4 → s16x16x4 (commutative)
241 // Implemented after s0x32x4 is defined
243
244 // ---- Math functions -------------------------------------------------------
245
248 // mask = -1 if negative (sign extended), 0 if positive
249 auto mask = simd::sra_i32_4(raw, 31);
250 // flip bits if negative, then add 1 (two's complement)
253 }
254
257 return from_raw(simd::min_i32_4(raw, b.raw));
258 }
259
262 return from_raw(simd::max_i32_4(raw, b.raw));
263 }
264
267 return max(lo).min(hi);
268 }
269
273 auto t_vec = s16x16x4::set1(t);
274 auto diff = b - (*this);
275 return (*this) + (diff * t_vec);
276 }
277
281 // Convert radians to 24-bit angle units (same as scalar s16x16)
282 // RAD_TO_24 = 2^24 / (2π) in Q16
283 static constexpr i32 RAD_TO_24 = 2670177; // from s16x16.h
284
285 // Convert 4 angles: mulhi_i32_4 does (i64*i64) >> 16
287
288 // Call vectorized sincos
290
291 // Shift results right by 15 to convert from raw sin32 output to Q16.16
292 out_sin = from_raw(simd::sra_i32_4(sc.sin_vals, 15));
293 out_cos = from_raw(simd::sra_i32_4(sc.cos_vals, 15));
294 }
295
300 return sin_out;
301 }
302
307 return cos_out;
308 }
309};
310
311// Include simd_ops.h to implement cross-type operations
312// Must come after all types are defined
313#include "fl/math/fixed_point/simd_ops.h" // allow-include-after-namespace
314
315} // namespace fl
constexpr common_type_t< T, U > min(T a, U b) FL_NOEXCEPT
Memory functions are available in the fl:: namespace via fl/stl/cstring.h. Using declarations cannot work ...
Definition math.h:71
constexpr common_type_t< T, U > max(T a, U b) FL_NOEXCEPT
Definition math.h:75
constexpr enable_if< is_fixed_point< T >::value, T >::type abs(T x) FL_NOEXCEPT
FASTLED_FORCE_INLINE CRGB * operator+(const CRGBSet &pixels, int offset)
Retrieve a pointer to a CRGB array, using a CRGBSet and an LED offset.
Definition pixelset.h:488
Cross-type SIMD fixed-point operations (implemented after all types are defined)