935 lines
28 KiB
935 lines
28 KiB
6 years ago
|
#ifndef __INC_LIB8TION_H
|
||
|
#define __INC_LIB8TION_H
|
||
|
|
||
|
/*
|
||
|
|
||
|
Fast, efficient 8-bit math functions specifically
|
||
|
designed for high-performance LED programming.
|
||
|
|
||
|
Because of the AVR(Arduino) and ARM assembly language
|
||
|
implementations provided, using these functions often
|
||
|
results in smaller and faster code than the equivalent
|
||
|
program using plain "C" arithmetic and logic.
|
||
|
|
||
|
|
||
|
Included are:
|
||
|
|
||
|
|
||
|
- Saturating unsigned 8-bit add and subtract.
|
||
|
Instead of wrapping around if an overflow occurs,
|
||
|
these routines just 'clamp' the output at a maxumum
|
||
|
of 255, or a minimum of 0. Useful for adding pixel
|
||
|
values. E.g., qadd8( 200, 100) = 255.
|
||
|
|
||
|
qadd8( i, j) == MIN( (i + j), 0xFF )
|
||
|
qsub8( i, j) == MAX( (i - j), 0 )
|
||
|
|
||
|
- Saturating signed 8-bit ("7-bit") add.
|
||
|
qadd7( i, j) == MIN( (i + j), 0x7F)
|
||
|
|
||
|
|
||
|
- Scaling (down) of unsigned 8- and 16- bit values.
|
||
|
Scaledown value is specified in 1/256ths.
|
||
|
scale8( i, sc) == (i * sc) / 256
|
||
|
scale16by8( i, sc) == (i * sc) / 256
|
||
|
|
||
|
Example: scaling a 0-255 value down into a
|
||
|
range from 0-99:
|
||
|
downscaled = scale8( originalnumber, 100);
|
||
|
|
||
|
A special version of scale8 is provided for scaling
|
||
|
LED brightness values, to make sure that they don't
|
||
|
accidentally scale down to total black at low
|
||
|
dimming levels, since that would look wrong:
|
||
|
scale8_video( i, sc) = ((i * sc) / 256) +? 1
|
||
|
|
||
|
Example: reducing an LED brightness by a
|
||
|
dimming factor:
|
||
|
new_bright = scale8_video( orig_bright, dimming);
|
||
|
|
||
|
|
||
|
- Fast 8- and 16- bit unsigned random numbers.
|
||
|
Significantly faster than Arduino random(), but
|
||
|
also somewhat less random. You can add entropy.
|
||
|
random8() == random from 0..255
|
||
|
random8( n) == random from 0..(N-1)
|
||
|
random8( n, m) == random from N..(M-1)
|
||
|
|
||
|
random16() == random from 0..65535
|
||
|
random16( n) == random from 0..(N-1)
|
||
|
random16( n, m) == random from N..(M-1)
|
||
|
|
||
|
random16_set_seed( k) == seed = k
|
||
|
random16_add_entropy( k) == seed += k
|
||
|
|
||
|
|
||
|
- Absolute value of a signed 8-bit value.
|
||
|
abs8( i) == abs( i)
|
||
|
|
||
|
|
||
|
- 8-bit math operations which return 8-bit values.
|
||
|
These are provided mostly for completeness,
|
||
|
not particularly for performance.
|
||
|
mul8( i, j) == (i * j) & 0xFF
|
||
|
add8( i, j) == (i + j) & 0xFF
|
||
|
sub8( i, j) == (i - j) & 0xFF
|
||
|
|
||
|
|
||
|
- Fast 16-bit approximations of sin and cos.
|
||
|
Input angle is a uint16_t from 0-65535.
|
||
|
Output is a signed int16_t from -32767 to 32767.
|
||
|
sin16( x) == sin( (x/32768.0) * pi) * 32767
|
||
|
cos16( x) == cos( (x/32768.0) * pi) * 32767
|
||
|
Accurate to more than 99% in all cases.
|
||
|
|
||
|
- Fast 8-bit approximations of sin and cos.
|
||
|
Input angle is a uint8_t from 0-255.
|
||
|
Output is an UNsigned uint8_t from 0 to 255.
|
||
|
sin8( x) == (sin( (x/128.0) * pi) * 128) + 128
|
||
|
cos8( x) == (cos( (x/128.0) * pi) * 128) + 128
|
||
|
Accurate to within about 2%.
|
||
|
|
||
|
|
||
|
- Fast 8-bit "easing in/out" function.
|
||
|
ease8InOutCubic(x) == 3(x^i) - 2(x^3)
|
||
|
ease8InOutApprox(x) ==
|
||
|
faster, rougher, approximation of cubic easing
|
||
|
ease8InOutQuad(x) == quadratic (vs cubic) easing
|
||
|
|
||
|
- Cubic, Quadratic, and Triangle wave functions.
|
||
|
Input is a uint8_t representing phase withing the wave,
|
||
|
similar to how sin8 takes an angle 'theta'.
|
||
|
Output is a uint8_t representing the amplitude of
|
||
|
the wave at that point.
|
||
|
cubicwave8( x)
|
||
|
quadwave8( x)
|
||
|
triwave8( x)
|
||
|
|
||
|
- Square root for 16-bit integers. About three times
|
||
|
faster and five times smaller than Arduino's built-in
|
||
|
generic 32-bit sqrt routine.
|
||
|
sqrt16( uint16_t x ) == sqrt( x)
|
||
|
|
||
|
- Dimming and brightening functions for 8-bit
|
||
|
light values.
|
||
|
dim8_video( x) == scale8_video( x, x)
|
||
|
dim8_raw( x) == scale8( x, x)
|
||
|
dim8_lin( x) == (x<128) ? ((x+1)/2) : scale8(x,x)
|
||
|
brighten8_video( x) == 255 - dim8_video( 255 - x)
|
||
|
brighten8_raw( x) == 255 - dim8_raw( 255 - x)
|
||
|
brighten8_lin( x) == 255 - dim8_lin( 255 - x)
|
||
|
The dimming functions in particular are suitable
|
||
|
for making LED light output appear more 'linear'.
|
||
|
|
||
|
|
||
|
- Linear interpolation between two values, with the
|
||
|
fraction between them expressed as an 8- or 16-bit
|
||
|
fixed point fraction (fract8 or fract16).
|
||
|
lerp8by8( fromU8, toU8, fract8 )
|
||
|
lerp16by8( fromU16, toU16, fract8 )
|
||
|
lerp15by8( fromS16, toS16, fract8 )
|
||
|
== from + (( to - from ) * fract8) / 256)
|
||
|
lerp16by16( fromU16, toU16, fract16 )
|
||
|
== from + (( to - from ) * fract16) / 65536)
|
||
|
map8( in, rangeStart, rangeEnd)
|
||
|
== map( in, 0, 255, rangeStart, rangeEnd);
|
||
|
|
||
|
- Optimized memmove, memcpy, and memset, that are
|
||
|
faster than standard avr-libc 1.8.
|
||
|
memmove8( dest, src, bytecount)
|
||
|
memcpy8( dest, src, bytecount)
|
||
|
memset8( buf, value, bytecount)
|
||
|
|
||
|
- Beat generators which return sine or sawtooth
|
||
|
waves in a specified number of Beats Per Minute.
|
||
|
Sine wave beat generators can specify a low and
|
||
|
high range for the output. Sawtooth wave beat
|
||
|
generators always range 0-255 or 0-65535.
|
||
|
beatsin8( BPM, low8, high8)
|
||
|
= (sine(beatphase) * (high8-low8)) + low8
|
||
|
beatsin16( BPM, low16, high16)
|
||
|
= (sine(beatphase) * (high16-low16)) + low16
|
||
|
beatsin88( BPM88, low16, high16)
|
||
|
= (sine(beatphase) * (high16-low16)) + low16
|
||
|
beat8( BPM) = 8-bit repeating sawtooth wave
|
||
|
beat16( BPM) = 16-bit repeating sawtooth wave
|
||
|
beat88( BPM88) = 16-bit repeating sawtooth wave
|
||
|
BPM is beats per minute in either simple form
|
||
|
e.g. 120, or Q8.8 fixed-point form.
|
||
|
BPM88 is beats per minute in ONLY Q8.8 fixed-point
|
||
|
form.
|
||
|
|
||
|
Lib8tion is pronounced like 'libation': lie-BAY-shun
|
||
|
|
||
|
*/
|
||
|
|
||
|
|
||
|
|
||
|
#include <stdint.h>
|
||
|
|
||
|
#define LIB8STATIC __attribute__ ((unused)) static inline
|
||
|
#define LIB8STATIC_ALWAYS_INLINE __attribute__ ((always_inline)) static inline
|
||
|
|
||
|
#if !defined(__AVR__)
|
||
|
#include <string.h>
|
||
|
// for memmove, memcpy, and memset if not defined here
|
||
|
#endif
|
||
|
|
||
|
#if defined(__arm__)
|
||
|
|
||
|
#if defined(FASTLED_TEENSY3)
|
||
|
// Can use Cortex M4 DSP instructions
|
||
|
#define QADD8_C 0
|
||
|
#define QADD7_C 0
|
||
|
#define QADD8_ARM_DSP_ASM 1
|
||
|
#define QADD7_ARM_DSP_ASM 1
|
||
|
#else
|
||
|
// Generic ARM
|
||
|
#define QADD8_C 1
|
||
|
#define QADD7_C 1
|
||
|
#endif
|
||
|
|
||
|
#define QSUB8_C 1
|
||
|
#define SCALE8_C 1
|
||
|
#define SCALE16BY8_C 1
|
||
|
#define SCALE16_C 1
|
||
|
#define ABS8_C 1
|
||
|
#define MUL8_C 1
|
||
|
#define QMUL8_C 1
|
||
|
#define ADD8_C 1
|
||
|
#define SUB8_C 1
|
||
|
#define EASE8_C 1
|
||
|
#define AVG8_C 1
|
||
|
#define AVG7_C 1
|
||
|
#define AVG16_C 1
|
||
|
#define AVG15_C 1
|
||
|
#define BLEND8_C 1
|
||
|
|
||
|
|
||
|
#elif defined(__AVR__)
|
||
|
|
||
|
// AVR ATmega and friends Arduino
|
||
|
|
||
|
#define QADD8_C 0
|
||
|
#define QADD7_C 0
|
||
|
#define QSUB8_C 0
|
||
|
#define ABS8_C 0
|
||
|
#define ADD8_C 0
|
||
|
#define SUB8_C 0
|
||
|
#define AVG8_C 0
|
||
|
#define AVG7_C 0
|
||
|
#define AVG16_C 0
|
||
|
#define AVG15_C 0
|
||
|
|
||
|
#define QADD8_AVRASM 1
|
||
|
#define QADD7_AVRASM 1
|
||
|
#define QSUB8_AVRASM 1
|
||
|
#define ABS8_AVRASM 1
|
||
|
#define ADD8_AVRASM 1
|
||
|
#define SUB8_AVRASM 1
|
||
|
#define AVG8_AVRASM 1
|
||
|
#define AVG7_AVRASM 1
|
||
|
#define AVG16_AVRASM 1
|
||
|
#define AVG15_AVRASM 1
|
||
|
|
||
|
// Note: these require hardware MUL instruction
|
||
|
// -- sorry, ATtiny!
|
||
|
#if !defined(LIB8_ATTINY)
|
||
|
#define SCALE8_C 0
|
||
|
#define SCALE16BY8_C 0
|
||
|
#define SCALE16_C 0
|
||
|
#define MUL8_C 0
|
||
|
#define QMUL8_C 0
|
||
|
#define EASE8_C 0
|
||
|
#define BLEND8_C 0
|
||
|
#define SCALE8_AVRASM 1
|
||
|
#define SCALE16BY8_AVRASM 1
|
||
|
#define SCALE16_AVRASM 1
|
||
|
#define MUL8_AVRASM 1
|
||
|
#define QMUL8_AVRASM 1
|
||
|
#define EASE8_AVRASM 1
|
||
|
#define CLEANUP_R1_AVRASM 1
|
||
|
#define BLEND8_AVRASM 1
|
||
|
#else
|
||
|
// On ATtiny, we just use C implementations
|
||
|
#define SCALE8_C 1
|
||
|
#define SCALE16BY8_C 1
|
||
|
#define SCALE16_C 1
|
||
|
#define MUL8_C 1
|
||
|
#define QMUL8_C 1
|
||
|
#define EASE8_C 1
|
||
|
#define BLEND8_C 1
|
||
|
#define SCALE8_AVRASM 0
|
||
|
#define SCALE16BY8_AVRASM 0
|
||
|
#define SCALE16_AVRASM 0
|
||
|
#define MUL8_AVRASM 0
|
||
|
#define QMUL8_AVRASM 0
|
||
|
#define EASE8_AVRASM 0
|
||
|
#define BLEND8_AVRASM 0
|
||
|
#endif
|
||
|
|
||
|
#else
|
||
|
|
||
|
// unspecified architecture, so
|
||
|
// no ASM, everything in C
|
||
|
#define QADD8_C 1
|
||
|
#define QADD7_C 1
|
||
|
#define QSUB8_C 1
|
||
|
#define SCALE8_C 1
|
||
|
#define SCALE16BY8_C 1
|
||
|
#define SCALE16_C 1
|
||
|
#define ABS8_C 1
|
||
|
#define MUL8_C 1
|
||
|
#define QMUL8_C 1
|
||
|
#define ADD8_C 1
|
||
|
#define SUB8_C 1
|
||
|
#define EASE8_C 1
|
||
|
#define AVG8_C 1
|
||
|
#define AVG7_C 1
|
||
|
#define AVG16_C 1
|
||
|
#define AVG15_C 1
|
||
|
#define BLEND8_C 1
|
||
|
|
||
|
#endif
|
||
|
|
||
|
///@defgroup lib8tion Fast math functions
|
||
|
///A variety of functions for working with numbers.
|
||
|
///@{
|
||
|
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
//
|
||
|
// typdefs for fixed-point fractional types.
|
||
|
//
|
||
|
// sfract7 should be interpreted as signed 128ths.
|
||
|
// fract8 should be interpreted as unsigned 256ths.
|
||
|
// sfract15 should be interpreted as signed 32768ths.
|
||
|
// fract16 should be interpreted as unsigned 65536ths.
|
||
|
//
|
||
|
// Example: if a fract8 has the value "64", that should be interpreted
|
||
|
// as 64/256ths, or one-quarter.
|
||
|
//
|
||
|
//
|
||
|
// fract8 range is 0 to 0.99609375
|
||
|
// in steps of 0.00390625
|
||
|
//
|
||
|
// sfract7 range is -0.9921875 to 0.9921875
|
||
|
// in steps of 0.0078125
|
||
|
//
|
||
|
// fract16 range is 0 to 0.99998474121
|
||
|
// in steps of 0.00001525878
|
||
|
//
|
||
|
// sfract15 range is -0.99996948242 to 0.99996948242
|
||
|
// in steps of 0.00003051757
|
||
|
//
|
||
|
|
||
|
/// ANSI unsigned short _Fract. range is 0 to 0.99609375
|
||
|
/// in steps of 0.00390625
|
||
|
typedef uint8_t fract8; ///< ANSI: unsigned short _Fract
|
||
|
|
||
|
/// ANSI: signed short _Fract. range is -0.9921875 to 0.9921875
|
||
|
/// in steps of 0.0078125
|
||
|
typedef int8_t sfract7; ///< ANSI: signed short _Fract
|
||
|
|
||
|
/// ANSI: unsigned _Fract. range is 0 to 0.99998474121
|
||
|
/// in steps of 0.00001525878
|
||
|
typedef uint16_t fract16; ///< ANSI: unsigned _Fract
|
||
|
|
||
|
/// ANSI: signed _Fract. range is -0.99996948242 to 0.99996948242
|
||
|
/// in steps of 0.00003051757
|
||
|
typedef int16_t sfract15; ///< ANSI: signed _Fract
|
||
|
|
||
|
|
||
|
// accumXY types should be interpreted as X bits of integer,
|
||
|
// and Y bits of fraction.
|
||
|
// E.g., accum88 has 8 bits of int, 8 bits of fraction
|
||
|
|
||
|
typedef uint16_t accum88; ///< ANSI: unsigned short _Accum. 8 bits int, 8 bits fraction
|
||
|
typedef int16_t saccum78; ///< ANSI: signed short _Accum. 7 bits int, 8 bits fraction
|
||
|
typedef uint32_t accum1616;///< ANSI: signed _Accum. 16 bits int, 16 bits fraction
|
||
|
typedef int32_t saccum1516;///< ANSI: signed _Accum. 15 bits int, 16 bits fraction
|
||
|
typedef uint16_t accum124; ///< no direct ANSI counterpart. 12 bits int, 4 bits fraction
|
||
|
typedef int32_t saccum114;///< no direct ANSI counterpart. 1 bit int, 14 bits fraction
|
||
|
|
||
|
|
||
|
|
||
|
#include "math8.h"
|
||
|
#include "scale8.h"
|
||
|
#include "random8.h"
|
||
|
#include "trig8.h"
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
//
|
||
|
// float-to-fixed and fixed-to-float conversions
|
||
|
//
|
||
|
// Note that anything involving a 'float' on AVR will be slower.
|
||
|
|
||
|
/// sfract15ToFloat: conversion from sfract15 fixed point to
|
||
|
/// IEEE754 32-bit float.
|
||
|
LIB8STATIC float sfract15ToFloat( sfract15 y)
|
||
|
{
|
||
|
return y / 32768.0;
|
||
|
}
|
||
|
|
||
|
/// conversion from IEEE754 float in the range (-1,1)
|
||
|
/// to 16-bit fixed point. Note that the extremes of
|
||
|
/// one and negative one are NOT representable. The
|
||
|
/// representable range is basically
|
||
|
LIB8STATIC sfract15 floatToSfract15( float f)
|
||
|
{
|
||
|
return f * 32768.0;
|
||
|
}
|
||
|
|
||
|
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
//
|
||
|
// memmove8, memcpy8, and memset8:
|
||
|
// alternatives to memmove, memcpy, and memset that are
|
||
|
// faster on AVR than standard avr-libc 1.8
|
||
|
|
||
|
#if defined(__AVR__)
|
||
|
void * memmove8( void * dst, const void * src, uint16_t num );
|
||
|
void * memcpy8 ( void * dst, const void * src, uint16_t num ) __attribute__ ((noinline));
|
||
|
void * memset8 ( void * ptr, uint8_t value, uint16_t num ) __attribute__ ((noinline)) ;
|
||
|
#else
|
||
|
// on non-AVR platforms, these names just call standard libc.
|
||
|
#define memmove8 memmove
|
||
|
#define memcpy8 memcpy
|
||
|
#define memset8 memset
|
||
|
#endif
|
||
|
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
//
|
||
|
// linear interpolation, such as could be used for Perlin noise, etc.
|
||
|
//
|
||
|
|
||
|
// A note on the structure of the lerp functions:
|
||
|
// The cases for b>a and b<=a are handled separately for
|
||
|
// speed: without knowing the relative order of a and b,
|
||
|
// the value (a-b) might be overflow the width of a or b,
|
||
|
// and have to be promoted to a wider, slower type.
|
||
|
// To avoid that, we separate the two cases, and are able
|
||
|
// to do all the math in the same width as the arguments,
|
||
|
// which is much faster and smaller on AVR.
|
||
|
|
||
|
/// linear interpolation between two unsigned 8-bit values,
|
||
|
/// with 8-bit fraction
|
||
|
LIB8STATIC uint8_t lerp8by8( uint8_t a, uint8_t b, fract8 frac)
|
||
|
{
|
||
|
uint8_t result;
|
||
|
if( b > a) {
|
||
|
uint8_t delta = b - a;
|
||
|
uint8_t scaled = scale8( delta, frac);
|
||
|
result = a + scaled;
|
||
|
} else {
|
||
|
uint8_t delta = a - b;
|
||
|
uint8_t scaled = scale8( delta, frac);
|
||
|
result = a - scaled;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// linear interpolation between two unsigned 16-bit values,
|
||
|
/// with 16-bit fraction
|
||
|
LIB8STATIC uint16_t lerp16by16( uint16_t a, uint16_t b, fract16 frac)
|
||
|
{
|
||
|
uint16_t result;
|
||
|
if( b > a ) {
|
||
|
uint16_t delta = b - a;
|
||
|
uint16_t scaled = scale16(delta, frac);
|
||
|
result = a + scaled;
|
||
|
} else {
|
||
|
uint16_t delta = a - b;
|
||
|
uint16_t scaled = scale16( delta, frac);
|
||
|
result = a - scaled;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// linear interpolation between two unsigned 16-bit values,
|
||
|
/// with 8-bit fraction
|
||
|
LIB8STATIC uint16_t lerp16by8( uint16_t a, uint16_t b, fract8 frac)
|
||
|
{
|
||
|
uint16_t result;
|
||
|
if( b > a) {
|
||
|
uint16_t delta = b - a;
|
||
|
uint16_t scaled = scale16by8( delta, frac);
|
||
|
result = a + scaled;
|
||
|
} else {
|
||
|
uint16_t delta = a - b;
|
||
|
uint16_t scaled = scale16by8( delta, frac);
|
||
|
result = a - scaled;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// linear interpolation between two signed 15-bit values,
|
||
|
/// with 8-bit fraction
|
||
|
LIB8STATIC int16_t lerp15by8( int16_t a, int16_t b, fract8 frac)
|
||
|
{
|
||
|
int16_t result;
|
||
|
if( b > a) {
|
||
|
uint16_t delta = b - a;
|
||
|
uint16_t scaled = scale16by8( delta, frac);
|
||
|
result = a + scaled;
|
||
|
} else {
|
||
|
uint16_t delta = a - b;
|
||
|
uint16_t scaled = scale16by8( delta, frac);
|
||
|
result = a - scaled;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// linear interpolation between two signed 15-bit values,
|
||
|
/// with 8-bit fraction
|
||
|
LIB8STATIC int16_t lerp15by16( int16_t a, int16_t b, fract16 frac)
|
||
|
{
|
||
|
int16_t result;
|
||
|
if( b > a) {
|
||
|
uint16_t delta = b - a;
|
||
|
uint16_t scaled = scale16( delta, frac);
|
||
|
result = a + scaled;
|
||
|
} else {
|
||
|
uint16_t delta = a - b;
|
||
|
uint16_t scaled = scale16( delta, frac);
|
||
|
result = a - scaled;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// map8: map from one full-range 8-bit value into a narrower
|
||
|
/// range of 8-bit values, possibly a range of hues.
|
||
|
///
|
||
|
/// E.g. map myValue into a hue in the range blue..purple..pink..red
|
||
|
/// hue = map8( myValue, HUE_BLUE, HUE_RED);
|
||
|
///
|
||
|
/// Combines nicely with the waveform functions (like sin8, etc)
|
||
|
/// to produce continuous hue gradients back and forth:
|
||
|
///
|
||
|
/// hue = map8( sin8( myValue), HUE_BLUE, HUE_RED);
|
||
|
///
|
||
|
/// Mathematically simiar to lerp8by8, but arguments are more
|
||
|
/// like Arduino's "map"; this function is similar to
|
||
|
///
|
||
|
/// map( in, 0, 255, rangeStart, rangeEnd)
|
||
|
///
|
||
|
/// but faster and specifically designed for 8-bit values.
|
||
|
LIB8STATIC uint8_t map8( uint8_t in, uint8_t rangeStart, uint8_t rangeEnd)
|
||
|
{
|
||
|
uint8_t rangeWidth = rangeEnd - rangeStart;
|
||
|
uint8_t out = scale8( in, rangeWidth);
|
||
|
out += rangeStart;
|
||
|
return out;
|
||
|
}
|
||
|
|
||
|
|
||
|
///////////////////////////////////////////////////////////////////////
|
||
|
//
|
||
|
// easing functions; see http://easings.net
|
||
|
//
|
||
|
|
||
|
/// ease8InOutQuad: 8-bit quadratic ease-in / ease-out function
|
||
|
/// Takes around 13 cycles on AVR
|
||
|
#if EASE8_C == 1
|
||
|
LIB8STATIC uint8_t ease8InOutQuad( uint8_t i)
|
||
|
{
|
||
|
uint8_t j = i;
|
||
|
if( j & 0x80 ) {
|
||
|
j = 255 - j;
|
||
|
}
|
||
|
uint8_t jj = scale8( j, j);
|
||
|
uint8_t jj2 = jj << 1;
|
||
|
if( i & 0x80 ) {
|
||
|
jj2 = 255 - jj2;
|
||
|
}
|
||
|
return jj2;
|
||
|
}
|
||
|
|
||
|
#elif EASE8_AVRASM == 1
|
||
|
// This AVR asm version of ease8InOutQuad preserves one more
|
||
|
// low-bit of precision than the C version, and is also slightly
|
||
|
// smaller and faster.
|
||
|
LIB8STATIC uint8_t ease8InOutQuad(uint8_t val) {
|
||
|
uint8_t j=val;
|
||
|
asm volatile (
|
||
|
"sbrc %[val], 7 \n"
|
||
|
"com %[j] \n"
|
||
|
"mul %[j], %[j] \n"
|
||
|
"add r0, %[j] \n"
|
||
|
"ldi %[j], 0 \n"
|
||
|
"adc %[j], r1 \n"
|
||
|
"lsl r0 \n" // carry = high bit of low byte of mul product
|
||
|
"rol %[j] \n" // j = (j * 2) + carry // preserve add'l bit of precision
|
||
|
"sbrc %[val], 7 \n"
|
||
|
"com %[j] \n"
|
||
|
"clr __zero_reg__ \n"
|
||
|
: [j] "+&a" (j)
|
||
|
: [val] "a" (val)
|
||
|
: "r0", "r1"
|
||
|
);
|
||
|
return j;
|
||
|
}
|
||
|
|
||
|
#else
|
||
|
#error "No implementation for ease8InOutQuad available."
|
||
|
#endif
|
||
|
|
||
|
/// ease16InOutQuad: 16-bit quadratic ease-in / ease-out function
|
||
|
// C implementation at this point
|
||
|
LIB8STATIC uint16_t ease16InOutQuad( uint16_t i)
|
||
|
{
|
||
|
uint16_t j = i;
|
||
|
if( j & 0x8000 ) {
|
||
|
j = 65535 - j;
|
||
|
}
|
||
|
uint16_t jj = scale16( j, j);
|
||
|
uint16_t jj2 = jj << 1;
|
||
|
if( i & 0x8000 ) {
|
||
|
jj2 = 65535 - jj2;
|
||
|
}
|
||
|
return jj2;
|
||
|
}
|
||
|
|
||
|
|
||
|
/// ease8InOutCubic: 8-bit cubic ease-in / ease-out function
|
||
|
/// Takes around 18 cycles on AVR
|
||
|
LIB8STATIC fract8 ease8InOutCubic( fract8 i)
|
||
|
{
|
||
|
uint8_t ii = scale8_LEAVING_R1_DIRTY( i, i);
|
||
|
uint8_t iii = scale8_LEAVING_R1_DIRTY( ii, i);
|
||
|
|
||
|
uint16_t r1 = (3 * (uint16_t)(ii)) - ( 2 * (uint16_t)(iii));
|
||
|
|
||
|
/* the code generated for the above *'s automatically
|
||
|
cleans up R1, so there's no need to explicitily call
|
||
|
cleanup_R1(); */
|
||
|
|
||
|
uint8_t result = r1;
|
||
|
|
||
|
// if we got "256", return 255:
|
||
|
if( r1 & 0x100 ) {
|
||
|
result = 255;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// ease8InOutApprox: fast, rough 8-bit ease-in/ease-out function
|
||
|
/// shaped approximately like 'ease8InOutCubic',
|
||
|
/// it's never off by more than a couple of percent
|
||
|
/// from the actual cubic S-curve, and it executes
|
||
|
/// more than twice as fast. Use when the cycles
|
||
|
/// are more important than visual smoothness.
|
||
|
/// Asm version takes around 7 cycles on AVR.
|
||
|
|
||
|
#if EASE8_C == 1
|
||
|
LIB8STATIC fract8 ease8InOutApprox( fract8 i)
|
||
|
{
|
||
|
if( i < 64) {
|
||
|
// start with slope 0.5
|
||
|
i /= 2;
|
||
|
} else if( i > (255 - 64)) {
|
||
|
// end with slope 0.5
|
||
|
i = 255 - i;
|
||
|
i /= 2;
|
||
|
i = 255 - i;
|
||
|
} else {
|
||
|
// in the middle, use slope 192/128 = 1.5
|
||
|
i -= 64;
|
||
|
i += (i / 2);
|
||
|
i += 32;
|
||
|
}
|
||
|
|
||
|
return i;
|
||
|
}
|
||
|
|
||
|
#elif EASE8_AVRASM == 1
|
||
|
LIB8STATIC uint8_t ease8InOutApprox( fract8 i)
|
||
|
{
|
||
|
// takes around 7 cycles on AVR
|
||
|
asm volatile (
|
||
|
" subi %[i], 64 \n\t"
|
||
|
" cpi %[i], 128 \n\t"
|
||
|
" brcc Lshift_%= \n\t"
|
||
|
|
||
|
// middle case
|
||
|
" mov __tmp_reg__, %[i] \n\t"
|
||
|
" lsr __tmp_reg__ \n\t"
|
||
|
" add %[i], __tmp_reg__ \n\t"
|
||
|
" subi %[i], 224 \n\t"
|
||
|
" rjmp Ldone_%= \n\t"
|
||
|
|
||
|
// start or end case
|
||
|
"Lshift_%=: \n\t"
|
||
|
" lsr %[i] \n\t"
|
||
|
" subi %[i], 96 \n\t"
|
||
|
|
||
|
"Ldone_%=: \n\t"
|
||
|
|
||
|
: [i] "+&a" (i)
|
||
|
:
|
||
|
: "r0", "r1"
|
||
|
);
|
||
|
return i;
|
||
|
}
|
||
|
#else
|
||
|
#error "No implementation for ease8 available."
|
||
|
#endif
|
||
|
|
||
|
|
||
|
|
||
|
/// triwave8: triangle (sawtooth) wave generator. Useful for
|
||
|
/// turning a one-byte ever-increasing value into a
|
||
|
/// one-byte value that oscillates up and down.
|
||
|
///
|
||
|
/// input output
|
||
|
/// 0..127 0..254 (positive slope)
|
||
|
/// 128..255 254..0 (negative slope)
|
||
|
///
|
||
|
/// On AVR this function takes just three cycles.
|
||
|
///
|
||
|
LIB8STATIC uint8_t triwave8(uint8_t in)
|
||
|
{
|
||
|
if( in & 0x80) {
|
||
|
in = 255 - in;
|
||
|
}
|
||
|
uint8_t out = in << 1;
|
||
|
return out;
|
||
|
}
|
||
|
|
||
|
|
||
|
// quadwave8 and cubicwave8: S-shaped wave generators (like 'sine').
|
||
|
// Useful for turning a one-byte 'counter' value into a
|
||
|
// one-byte oscillating value that moves smoothly up and down,
|
||
|
// with an 'acceleration' and 'deceleration' curve.
|
||
|
//
|
||
|
// These are even faster than 'sin8', and have
|
||
|
// slightly different curve shapes.
|
||
|
//
|
||
|
|
||
|
/// quadwave8: quadratic waveform generator. Spends just a little more
|
||
|
/// time at the limits than 'sine' does.
|
||
|
LIB8STATIC uint8_t quadwave8(uint8_t in)
|
||
|
{
|
||
|
return ease8InOutQuad( triwave8( in));
|
||
|
}
|
||
|
|
||
|
/// cubicwave8: cubic waveform generator. Spends visibly more time
|
||
|
/// at the limits than 'sine' does.
|
||
|
LIB8STATIC uint8_t cubicwave8(uint8_t in)
|
||
|
{
|
||
|
return ease8InOutCubic( triwave8( in));
|
||
|
}
|
||
|
|
||
|
/// squarewave8: square wave generator. Useful for
|
||
|
/// turning a one-byte ever-increasing value
|
||
|
/// into a one-byte value that is either 0 or 255.
|
||
|
/// The width of the output 'pulse' is
|
||
|
/// determined by the pulsewidth argument:
|
||
|
///
|
||
|
///~~~
|
||
|
/// If pulsewidth is 255, output is always 255.
|
||
|
/// If pulsewidth < 255, then
|
||
|
/// if input < pulsewidth then output is 255
|
||
|
/// if input >= pulsewidth then output is 0
|
||
|
///~~~
|
||
|
///
|
||
|
/// the output looking like:
|
||
|
///
|
||
|
///~~~
|
||
|
/// 255 +--pulsewidth--+
|
||
|
/// . | |
|
||
|
/// 0 0 +--------(256-pulsewidth)--------
|
||
|
///~~~
|
||
|
///
|
||
|
/// @param in
|
||
|
/// @param pulsewidth
|
||
|
/// @returns square wave output
|
||
|
LIB8STATIC uint8_t squarewave8( uint8_t in, uint8_t pulsewidth)
|
||
|
{
|
||
|
if( in < pulsewidth || (pulsewidth == 255)) {
|
||
|
return 255;
|
||
|
} else {
|
||
|
return 0;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
|
||
|
// Beat generators - These functions produce waves at a given
|
||
|
// number of 'beats per minute'. Internally, they use
|
||
|
// the Arduino function 'millis' to track elapsed time.
|
||
|
// Accuracy is a bit better than one part in a thousand.
|
||
|
//
|
||
|
// beat8( BPM ) returns an 8-bit value that cycles 'BPM' times
|
||
|
// per minute, rising from 0 to 255, resetting to zero,
|
||
|
// rising up again, etc.. The output of this function
|
||
|
// is suitable for feeding directly into sin8, and cos8,
|
||
|
// triwave8, quadwave8, and cubicwave8.
|
||
|
// beat16( BPM ) returns a 16-bit value that cycles 'BPM' times
|
||
|
// per minute, rising from 0 to 65535, resetting to zero,
|
||
|
// rising up again, etc. The output of this function is
|
||
|
// suitable for feeding directly into sin16 and cos16.
|
||
|
// beat88( BPM88) is the same as beat16, except that the BPM88 argument
|
||
|
// MUST be in Q8.8 fixed point format, e.g. 120BPM must
|
||
|
// be specified as 120*256 = 30720.
|
||
|
// beatsin8( BPM, uint8_t low, uint8_t high) returns an 8-bit value that
|
||
|
// rises and falls in a sine wave, 'BPM' times per minute,
|
||
|
// between the values of 'low' and 'high'.
|
||
|
// beatsin16( BPM, uint16_t low, uint16_t high) returns a 16-bit value
|
||
|
// that rises and falls in a sine wave, 'BPM' times per
|
||
|
// minute, between the values of 'low' and 'high'.
|
||
|
// beatsin88( BPM88, ...) is the same as beatsin16, except that the
|
||
|
// BPM88 argument MUST be in Q8.8 fixed point format,
|
||
|
// e.g. 120BPM must be specified as 120*256 = 30720.
|
||
|
//
|
||
|
// BPM can be supplied two ways. The simpler way of specifying BPM is as
|
||
|
// a simple 8-bit integer from 1-255, (e.g., "120").
|
||
|
// The more sophisticated way of specifying BPM allows for fractional
|
||
|
// "Q8.8" fixed point number (an 'accum88') with an 8-bit integer part and
|
||
|
// an 8-bit fractional part. The easiest way to construct this is to multiply
|
||
|
// a floating point BPM value (e.g. 120.3) by 256, (e.g. resulting in 30796
|
||
|
// in this case), and pass that as the 16-bit BPM argument.
|
||
|
// "BPM88" MUST always be specified in Q8.8 format.
|
||
|
//
|
||
|
// Originally designed to make an entire animation project pulse with brightness.
|
||
|
// For that effect, add this line just above your existing call to "FastLED.show()":
|
||
|
//
|
||
|
// uint8_t bright = beatsin8( 60 /*BPM*/, 192 /*dimmest*/, 255 /*brightest*/ ));
|
||
|
// FastLED.setBrightness( bright );
|
||
|
// FastLED.show();
|
||
|
//
|
||
|
// The entire animation will now pulse between brightness 192 and 255 once per second.
|
||
|
|
||
|
|
||
|
// The beat generators need access to a millisecond counter.
|
||
|
// On Arduino, this is "millis()". On other platforms, you'll
|
||
|
// need to provide a function with this signature:
|
||
|
// uint32_t get_millisecond_timer();
|
||
|
// that provides similar functionality.
|
||
|
// You can also force use of the get_millisecond_timer function
|
||
|
// by #defining USE_GET_MILLISECOND_TIMER.
|
||
|
#if (defined(ARDUINO) || defined(SPARK) || defined(FASTLED_HAS_MILLIS)) && !defined(USE_GET_MILLISECOND_TIMER)
|
||
|
// Forward declaration of Arduino function 'millis'.
|
||
|
//uint32_t millis();
|
||
|
#define GET_MILLIS millis
|
||
|
#else
|
||
|
uint32_t get_millisecond_timer(void);
|
||
|
#define GET_MILLIS get_millisecond_timer
|
||
|
#endif
|
||
|
|
||
|
// beat16 generates a 16-bit 'sawtooth' wave at a given BPM,
|
||
|
/// with BPM specified in Q8.8 fixed-point format; e.g.
|
||
|
/// for this function, 120 BPM MUST BE specified as
|
||
|
/// 120*256 = 30720.
|
||
|
/// If you just want to specify "120", use beat16 or beat8.
|
||
|
LIB8STATIC uint16_t beat88( accum88 beats_per_minute_88, uint32_t timebase)
|
||
|
{
|
||
|
// BPM is 'beats per minute', or 'beats per 60000ms'.
|
||
|
// To avoid using the (slower) division operator, we
|
||
|
// want to convert 'beats per 60000ms' to 'beats per 65536ms',
|
||
|
// and then use a simple, fast bit-shift to divide by 65536.
|
||
|
//
|
||
|
// The ratio 65536:60000 is 279.620266667:256; we'll call it 280:256.
|
||
|
// The conversion is accurate to about 0.05%, more or less,
|
||
|
// e.g. if you ask for "120 BPM", you'll get about "119.93".
|
||
|
return (((GET_MILLIS()) - timebase) * beats_per_minute_88 * 280) >> 16;
|
||
|
}
|
||
|
|
||
|
/// beat16 generates a 16-bit 'sawtooth' wave at a given BPM
|
||
|
LIB8STATIC uint16_t beat16( accum88 beats_per_minute, uint32_t timebase)
|
||
|
{
|
||
|
// Convert simple 8-bit BPM's to full Q8.8 accum88's if needed
|
||
|
if( beats_per_minute < 256) beats_per_minute <<= 8;
|
||
|
return beat88(beats_per_minute, timebase);
|
||
|
}
|
||
|
|
||
|
/// beat8 generates an 8-bit 'sawtooth' wave at a given BPM
|
||
|
LIB8STATIC uint8_t beat8( accum88 beats_per_minute, uint32_t timebase)
|
||
|
{
|
||
|
return beat16( beats_per_minute, timebase) >> 8;
|
||
|
}
|
||
|
|
||
|
/// beatsin88 generates a 16-bit sine wave at a given BPM,
|
||
|
/// that oscillates within a given range.
|
||
|
/// For this function, BPM MUST BE SPECIFIED as
|
||
|
/// a Q8.8 fixed-point value; e.g. 120BPM must be
|
||
|
/// specified as 120*256 = 30720.
|
||
|
/// If you just want to specify "120", use beatsin16 or beatsin8.
|
||
|
LIB8STATIC uint16_t beatsin88( accum88 beats_per_minute_88, uint16_t lowest, uint16_t highest, uint32_t timebase, uint16_t phase_offset)
|
||
|
{
|
||
|
uint16_t beat = beat88( beats_per_minute_88, timebase);
|
||
|
uint16_t beatsin = (sin16( beat + phase_offset) + 32768);
|
||
|
uint16_t rangewidth = highest - lowest;
|
||
|
uint16_t scaledbeat = scale16( beatsin, rangewidth);
|
||
|
uint16_t result = lowest + scaledbeat;
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// beatsin16 generates a 16-bit sine wave at a given BPM,
|
||
|
/// that oscillates within a given range.
|
||
|
LIB8STATIC uint16_t beatsin16(accum88 beats_per_minute, uint16_t lowest, uint16_t highest, uint32_t timebase, uint16_t phase_offset)
|
||
|
{
|
||
|
uint16_t beat = beat16( beats_per_minute, timebase);
|
||
|
uint16_t beatsin = (sin16( beat + phase_offset) + 32768);
|
||
|
uint16_t rangewidth = highest - lowest;
|
||
|
uint16_t scaledbeat = scale16( beatsin, rangewidth);
|
||
|
uint16_t result = lowest + scaledbeat;
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
/// beatsin8 generates an 8-bit sine wave at a given BPM,
|
||
|
/// that oscillates within a given range.
|
||
|
LIB8STATIC uint8_t beatsin8( accum88 beats_per_minute, uint8_t lowest, uint8_t highest, uint32_t timebase, uint8_t phase_offset)
|
||
|
{
|
||
|
uint8_t beat = beat8( beats_per_minute, timebase);
|
||
|
uint8_t beatsin = sin8( beat + phase_offset);
|
||
|
uint8_t rangewidth = highest - lowest;
|
||
|
uint8_t scaledbeat = scale8( beatsin, rangewidth);
|
||
|
uint8_t result = lowest + scaledbeat;
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
|
||
|
/// Return the current seconds since boot in a 16-bit value. Used as part of the
|
||
|
/// "every N time-periods" mechanism
|
||
|
LIB8STATIC uint16_t seconds16(void)
|
||
|
{
|
||
|
uint32_t ms = GET_MILLIS();
|
||
|
uint16_t s16;
|
||
|
s16 = ms / 1000;
|
||
|
return s16;
|
||
|
}
|
||
|
|
||
|
/// Return the current minutes since boot in a 16-bit value. Used as part of the
|
||
|
/// "every N time-periods" mechanism
|
||
|
LIB8STATIC uint16_t minutes16(void)
|
||
|
{
|
||
|
uint32_t ms = GET_MILLIS();
|
||
|
uint16_t m16;
|
||
|
m16 = (ms / (60000L)) & 0xFFFF;
|
||
|
return m16;
|
||
|
}
|
||
|
|
||
|
/// Return the current hours since boot in an 8-bit value. Used as part of the
|
||
|
/// "every N time-periods" mechanism
|
||
|
LIB8STATIC uint8_t hours8(void)
|
||
|
{
|
||
|
uint32_t ms = GET_MILLIS();
|
||
|
uint8_t h8;
|
||
|
h8 = (ms / (3600000L)) & 0xFF;
|
||
|
return h8;
|
||
|
}
|
||
|
|
||
|
///@}
|
||
|
|
||
|
#endif
|