GY-63_MS5611/libraries/statHelpers/statHelpers.cpp

553 lines
11 KiB
C++
Raw Normal View History

2022-04-15 15:33:42 -04:00
//
// FILE: statHelpers.cpp
// AUTHOR: Rob Tillaart
2022-11-25 13:13:30 -05:00
// VERSION: 0.1.6
2022-04-15 15:33:42 -04:00
// PURPOSE: Arduino library with a number of statistic helper functions.
// DATE: 2020-07-01
// URL: https://github.com/RobTillaart/statHelpers
#include "statHelpers.h"
///////////////////////////////////////////////////////////////////////////
//
2022-11-25 13:13:30 -05:00
// PERMUTATIONS
2022-04-15 15:33:42 -04:00
//
uint32_t permutations(uint8_t n, uint8_t k)
{
uint32_t rv = 1;
2022-11-25 13:13:30 -05:00
for (uint8_t i = n; i > (n - k); i--)
{
rv *= i;
}
2022-04-15 15:33:42 -04:00
return rv;
}
uint64_t permutations64(uint8_t n, uint8_t k)
{
uint64_t rv = 1;
2022-11-25 13:13:30 -05:00
for (uint8_t i = n; i > (n - k); i--)
{
rv *= i;
}
2022-04-15 15:33:42 -04:00
return rv;
}
2022-11-25 13:13:30 -05:00
// can be optimized similar to dfactorial
2022-04-15 15:33:42 -04:00
double dpermutations(uint8_t n, uint8_t k)
{
double rv = 1;
2022-11-25 13:13:30 -05:00
for (uint8_t i = n; i > (n - k); i--)
{
rv *= i;
}
2022-04-15 15:33:42 -04:00
return rv;
}
/*
http://wordaligned.org/articles/next-permutation snippet
As an example consider finding the next permutation of:
8342666411
The longest monotonically decreasing tail is 666411, and the corresponding head is 8342.
8342 666411
666411 is, by definition, reverse-ordered, and cannot be increased by permuting its elements.
To find the next permutation, we must increase the head; a matter of finding the smallest tail
element larger than the heads final 2.
8342 666411
Walking back from the end of tail, the first element greater than 2 is 4.
8342 666411
Swap the 2 and the 4
8344 666211
2022-11-25 13:13:30 -05:00
Since head has increased, we now have a greater permutation. To reduce to the next permutation,
2022-04-15 15:33:42 -04:00
we reverse tail, putting it into increasing order.
8344 112666
Join the head and tail back together. The permutation one greater than 8342666411 is 8344112666.
*/
// http://www.nayuki.io/page/next-lexicographical-permutation-algorithm
// b = nextPermutation<char>(array, 100);
/*
template <typename T>
bool nextPermutation(T * array, uint16_t size)
{
// Find longest non-increasing suffix
int i = size - 1;
while (i > 0 && array[i - 1] >= array[i]) i--;
// Now i is the head index of the suffix
// Are we at the last permutation already?
if (i <= 0) return false;
// Let array[i - 1] be the pivot
// Find rightmost element that exceeds the pivot
int j = size - 1;
while (array[j] <= array[i - 1])
j--;
// Now the value array[j] will become the new pivot
// Assertion: j >= i
// Swap the pivot with j
T temp = array[i - 1];
array[i - 1] = array[j];
array[j] = temp;
// Reverse the suffix
j = size - 1;
while (i < j)
{
temp = array[i];
array[i] = array[j];
array[j] = temp;
i++;
j--;
}
return true;
}
*/
///////////////////////////////////////////////////////////////////////////
//
2022-11-25 13:13:30 -05:00
// FACTORIAL
2022-04-15 15:33:42 -04:00
//
2022-11-25 13:13:30 -05:00
// exact ==> 12!
2022-04-15 15:33:42 -04:00
uint32_t factorial(uint8_t n)
{
uint32_t f = 1;
while(n > 1) f *= (n--);
return f;
}
2022-11-25 13:13:30 -05:00
// exact ==> 20!
2022-04-15 15:33:42 -04:00
uint64_t factorial64(uint8_t n)
{
2022-11-25 13:13:30 -05:00
// to be tested
// if ( n <= 12) return factorial(12);
// uint64_t f = factorial(12);
// for (uint8_t t = 13; t <= n; t++) f *= t;
2022-04-15 15:33:42 -04:00
uint64_t f = 1;
while(n > 1) f *= (n--);
return f;
}
2022-11-25 13:13:30 -05:00
// float (4 byte) => 34!
// double (8 byte) => 170!
2022-04-15 15:33:42 -04:00
double dfactorialReference(uint8_t n)
{
double f = 1;
while (n > 1) f *= (n--);
return f;
}
2022-11-25 13:13:30 -05:00
// FASTER VERSION
// does part of the math with integers.
// tested on UNO and ESP32, roughly 3x faster
// numbers differ slightly in the order of IEEE754 precision => acceptable.
// 10e-7 for 4 bit float
// 10e-16 for 8 bit double
2022-04-15 15:33:42 -04:00
double dfactorial(uint8_t n)
{
double f = 1;
while (n > 4)
{
uint32_t val = n * (n-1);
val *= (n-2) * (n-3);
f *= val;
n -= 4;
}
2022-11-25 13:13:30 -05:00
while (n > 1) f *= (n--); // can be squeezed too.
2022-04-15 15:33:42 -04:00
return f;
}
2022-11-25 13:13:30 -05:00
// stirling is an approximation function for factorial(n).
// it is slower but constant in time.
// float => 26!
// double => 143!
2022-04-15 15:33:42 -04:00
double stirling(uint8_t n)
{
double v = exp(-n) * pow(n, n) * sqrt(TWO_PI * n);
return v;
}
2022-11-25 13:13:30 -05:00
// SEMIFACTORIAL
2022-04-15 15:33:42 -04:00
2022-11-25 13:13:30 -05:00
// exact ==> 20!!
2022-04-15 15:33:42 -04:00
uint32_t semiFactorial(uint8_t n)
{
uint32_t f = 1;
while(n > 1)
{
f *= n;
n -= 2;
}
return f;
}
2022-11-25 13:13:30 -05:00
// exact ==> 33!!
2022-04-15 15:33:42 -04:00
uint64_t semiFactorial64(uint8_t n)
{
uint64_t f = 1;
while(n > 1)
{
f *= n;
n -= 2;
}
return f;
}
2022-11-25 13:13:30 -05:00
// float (4 byte) => 56!!
// double (8 byte) => 300!!
2022-04-15 15:33:42 -04:00
double dSemiFactorial(uint16_t n)
{
double f = 1;
while (n > 6) // TODO: test performance gain by integer math. (depends on platform ?)
{
uint32_t val = n * (n-2) * (n-4);
f *= val;
n -= 6;
}
while (n > 1)
{
f *= n;
n -= 2;
}
return f;
}
///////////////////////////////////////////////////////////////////////////
//
2022-11-25 13:13:30 -05:00
// COMBINATIONS
2022-04-15 15:33:42 -04:00
//
2022-11-25 13:13:30 -05:00
// works for n = 0..30 for all k
2022-04-15 15:33:42 -04:00
uint32_t combinations(uint16_t n, uint16_t k)
{
if ((k == 0) || (k == n)) return 1;
if (k < (n-k)) k = n - k; // symmetry
uint32_t rv = n;
uint8_t p = 2;
for (uint8_t i = n-1; i > k; i--)
{
2022-11-25 13:13:30 -05:00
// if ((0xFFFFFFFF / i) < rv) return 0; // overflow detect...
2022-04-15 15:33:42 -04:00
rv = (rv * i) / p;
p++;
}
return rv;
}
2022-11-25 13:13:30 -05:00
// works for n = 0..61 for all k
2022-04-15 15:33:42 -04:00
uint64_t combinations64(uint16_t n, uint16_t k)
{
if ((k == 0) || (k == n)) return 1;
2022-11-25 13:13:30 -05:00
if (k < (n-k)) k = n - k; // symmetry
2022-04-15 15:33:42 -04:00
uint64_t rv = n;
uint8_t p = 2;
for (uint8_t i = n-1; i > k; i--)
{
2022-11-25 13:13:30 -05:00
// overflow detect here ?
2022-04-15 15:33:42 -04:00
rv = (rv * i) / p;
p++;
}
return rv;
}
2022-11-25 13:13:30 -05:00
// experimental - not exact but allows large values
// float (4 bits) works till n = 125 for all k
// double (8 bits) works till n = 1020 for all k
2022-04-15 15:33:42 -04:00
double dcombinations(uint16_t n, uint16_t k)
{
if ((k == 0) || (k == n)) return 1;
2022-11-25 13:13:30 -05:00
if (k < (n-k)) k = n - k; // symmetry
2022-04-15 15:33:42 -04:00
double rv = n;
uint16_t p = 2;
for (uint16_t i = n-1; i > k; i--)
{
rv *= i;
rv /= p;
p++;
}
return rv;
}
2022-11-25 13:13:30 -05:00
// recursive (mind your stack and time)
// works for n = 0..30 for all k
// educational purpose
2022-04-15 15:33:42 -04:00
uint32_t rcombinations(uint16_t n, uint16_t k)
{
if (k > (n-k)) k = n - k; // symmetry
if (k == 0) return 1;
return (n * rcombinations(n - 1, k - 1)) / k;
}
2022-11-25 13:13:30 -05:00
// recursive
// works for n = 0..61 for all k
// educational purpose
2022-04-15 15:33:42 -04:00
uint64_t rcombinations64(uint16_t n, uint16_t k)
{
if (k > (n-k)) k = n - k; // symmetry
if (k == 0) return 1;
return (n * rcombinations64(n - 1, k - 1)) / k;
}
2022-11-25 13:13:30 -05:00
// very slow double recursive way by means of Pascals triangle.
// works for n = 0..30 for all k (but takes a lot of time)
// educational purpose
2022-04-15 15:33:42 -04:00
uint32_t combPascal(uint16_t n, uint16_t k)
{
if (k > (n-k)) k = n - k; // symmetry
if (k > n ) return 0;
if (k == 0) return 1;
if (n < 2) return 1;
uint32_t rv = combPascal(n-1, k-1);
rv += combPascal(n-1, k);
return rv;
}
/////////////////////////////////////////////////
//
2022-11-25 13:13:30 -05:00
// EXPERIMENTAL
2022-04-15 15:33:42 -04:00
//
2022-11-25 13:13:30 -05:00
// BIG SECTION
//
// keep track of exponent myself in 32 bit unsigned integer
// - can be extended to a 64 bit integer
// however it already takes hours to calculate with 32 bits
2022-04-15 15:33:42 -04:00
/*
UNO
n n! millis() from earlier version
-----------------------------------------
1 1.00000e0 0
10 3.62880e6 1
100 9.33262e157 7
1000 4.02386e2567 105
2000 3.31627e5735 231
4000 1.82880e12673 504
8000 5.18416e27752 1086
10000 2.84625e35659 1389
16000 5.11880e60319 2330
32000 1.06550e130270 4978
100000 2.82428e456573 17201
1000000 8.26379e5565708 206421 (3.5 minutes)
10000000 an hour? too long...
ESP32 240MHz
n n! millis() from earlier version
-----------------------------------------
1 1.00000e0 0
10 3.62880e6 0
100 9.33262e157 0
1000 4.02387e2567 8
10000 2.84626e35659 110
100000 2.82423e456573 1390
1000000 8.26393e5565708 16781
10000000 1.20242e65657059 196573 (3++ minutes)
100000000 1.61720e756570556 2253211
1000000000 9.90463e4270738226 25410726 (7++ hrs to detect overflow! :(
1 0
10 0.6
100 1.57
1000 2.567
10000 3.5659
100000 4.56573
1000000 5.565708
10000000 6.5657059
100000000 7.56570556
// largest found - exponent is approaching max_uint32_t - 4294967296
518678058! 4.1873547e4294967283 // break condition was hit...
next one should fit too
518678059! 2.1718890e4294967292
*/
void bigFactorial(uint32_t n, double &mantissa, uint32_t &exponent)
{
exponent = 0;
double f = 1;
while (n > 1)
{
f *= n--;
while (f > 1000000000)
{
f /= 1000000000;
exponent += 9;
}
}
2022-11-25 13:13:30 -05:00
while (f > 10) // fix exponent if needed.
2022-04-15 15:33:42 -04:00
{
f /= 10;
exponent++;
}
mantissa = f;
}
2022-11-25 13:13:30 -05:00
// Should work full range for n = 518678059, k = { 0..n }
// and n > 518678059 => max k is definitely smaller ==> expect n+1 ==> k-15 at start
// performance: low. depends on k.
2022-04-15 15:33:42 -04:00
//
//
2022-11-25 13:13:30 -05:00
// for relative small k and large n (multiple orders of magnitude) one can get an estimate
// P(n,k) ~ raw = log10(n - k/2) * k;
// exponent = int(raw);
// mantissa = pow(10, raw - int(raw));
2022-04-15 15:33:42 -04:00
void bigPermutations(uint32_t n, uint32_t k, double &mantissa, uint32_t &exponent)
{
exponent = 0;
double f = 1;
for (uint32_t i = n; i > (n - k); i--)
{
f *= i;
while (f > 1000000000)
{
f /= 1000000000;
exponent += 9;
}
}
2022-11-25 13:13:30 -05:00
while (f > 10) // fix exponent if needed.
2022-04-15 15:33:42 -04:00
{
f /= 10;
exponent++;
}
mantissa = f;
}
void bigCombinations(uint32_t n, uint32_t k, double &mantissa, uint32_t &exponent)
{
exponent = 0;
if ((k == 0) || (k == n)) return;
2022-11-25 13:13:30 -05:00
if (k < (n-k)) k = n - k; // symmetry
2022-04-15 15:33:42 -04:00
double f = n;
uint32_t p = 2;
for (uint32_t i = n-1; i > k; i--)
{
f = (f * i) / p;
p++;
while (f > 1000000000)
{
f /= 1000000000;
exponent += 9;
}
}
2022-11-25 13:13:30 -05:00
while (f > 10) // fix exponent if needed.
2022-04-15 15:33:42 -04:00
{
f /= 10;
exponent++;
}
mantissa = f;
}
////////////////////////////////////////////////////////////
//
2022-11-25 13:13:30 -05:00
// EXPERIMENTAL 64 BIT
//
2022-04-15 15:33:42 -04:00
void bigFactorial64(uint64_t n, double &mantissa, uint64_t &exponent)
{
exponent = 0;
double f = 1;
while (n > 1)
{
f *= n--;
2022-11-25 13:13:30 -05:00
while (f > 1000000000) // optimize - per 1e9 to save divisions.
2022-04-15 15:33:42 -04:00
{
f /= 1000000000;
exponent += 9;
}
}
2022-11-25 13:13:30 -05:00
while (f > 10) // fix exponent if needed.
2022-04-15 15:33:42 -04:00
{
f /= 10;
exponent++;
}
mantissa = f;
}
void bigPermutations64(uint64_t n, uint64_t k, double &mantissa, uint64_t &exponent)
{
exponent = 0;
double f = 1;
for (uint64_t i = n; i > (n - k); i--)
{
f *= i;
while (f > 1000000000)
{
f /= 1000000000;
exponent += 9;
}
}
2022-11-25 13:13:30 -05:00
while (f > 10) // fix exponent if needed.
2022-04-15 15:33:42 -04:00
{
f /= 10;
exponent++;
}
mantissa = f;
}
void bigCombinations64(uint64_t n, uint64_t k, double &mantissa, uint64_t &exponent)
{
exponent = 0;
if ((k == 0) || (k == n)) return;
if (k < (n-k)) k = n - k; // symmetry
double f = n;
uint64_t p = 2;
for (uint64_t i = n-1; i > k; i--)
{
f = (f * i) / p;
p++;
while (f > 1000000000)
{
f /= 1000000000;
exponent += 9;
}
}
2022-11-25 13:13:30 -05:00
while (f > 10) // fix exponent if needed.
2022-04-15 15:33:42 -04:00
{
f /= 10;
exponent++;
}
mantissa = f;
}
2022-11-25 13:13:30 -05:00
// -- END OF FILE --
2022-04-15 15:33:42 -04:00