{-# LANGUAGE BangPatterns, FlexibleContexts #-}
-- |
-- Module : Statistics.Math
--
-- Mathematical functions used by the statistics code: binomial
-- coefficients, factorials, Chebyshev series evaluation, and the
-- gamma and beta families of functions.
--
-- The extensions above are required by this file: @BangPatterns@ for
-- the strict local loops in 'incompleteGamma', and @FlexibleContexts@
-- for the @G.Vector v Double@ constraints on the Chebyshev evaluators.
module Statistics.Math
    (
    -- * Binomial coefficient
      choose
    -- * Beta function
    , logBeta
    -- * Chebyshev polynomials
    , chebyshev
    , chebyshevBroucke
    -- * Factorial
    , factorial
    , logFactorial
    -- * Gamma function
    , incompleteGamma
    , logGamma
    , logGammaL
    -- * Logarithm
    , log1p
    ) where
import Data.Int (Int64)
import Data.Word (Word64)
import Statistics.Constants (m_epsilon, m_sqrt_2_pi, m_ln_sqrt_2_pi, m_NaN,
m_neg_inf, m_pos_inf)
import Statistics.Distribution (cumulative)
import Statistics.Distribution.Normal (standard)
import qualified Data.Vector.Unboxed as U
import qualified Data.Vector.Generic as G
-- | Strict pair holding the two most recent terms of the recurrence
-- evaluated by 'chebyshev'.
data C = C !Double !Double

-- | Evaluate the Chebyshev series
-- @a0 * T0(x) + a1 * T1(x) + a2 * T2(x) + ...@ (polynomials of the
-- first kind) using Clenshaw's backward recurrence
-- @b_k = a_k + 2 * x * b_(k+1) - b_(k+2)@.
--
-- The first coefficient is used at full weight; compare
-- 'chebyshevBroucke', which halves it.  An empty coefficient vector
-- denotes the empty sum and yields 0.
chebyshev :: (G.Vector v Double) =>
             Double      -- ^ Point /x/ at which to evaluate the series.
          -> v Double    -- ^ Coefficients, in increasing order of degree.
          -> Double
chebyshev x a
    | G.null a  = 0
    | otherwise = fini . G.foldr' step (C 0 0) . G.tail $ a
  where
    -- One step of the recurrence, run from the highest degree down to 1.
    step k (C b0 b1) = C (k + x2 * b0 - b1) b0
    -- The degree-0 term uses x rather than 2*x.
    fini   (C b0 b1) = G.head a + x * b0 - b1
    x2               = x * 2
-- | Strict triple holding the three most recent terms of the
-- recurrence evaluated by 'chebyshevBroucke'.
data B = B !Double !Double !Double

-- | Evaluate a Chebyshev series of the first kind using the recurrence
-- @b_k = a_k + 2 * x * b_(k+1) - b_(k+2)@ over /all/ coefficients and
-- returning @(b_0 - b_2) / 2@.
--
-- Algebraically this equals @a0 / 2 + a1 * T1(x) + a2 * T2(x) + ...@,
-- i.e. the first coefficient carries half weight, so the result
-- differs from 'chebyshev' for the same inputs.  An empty coefficient
-- vector yields 0.
chebyshevBroucke :: (G.Vector v Double) =>
                    Double      -- ^ Point /x/ at which to evaluate the series.
                 -> v Double    -- ^ Coefficients, in increasing order of degree.
                 -> Double
chebyshevBroucke x = fini . G.foldr' step (B 0 0 0)
  where
    -- Shift the window: the new term becomes b0, the old b1 becomes b2.
    step k (B b0 b1 _) = B (k + x2 * b0 - b1) b0 b1
    fini   (B b0 _ b2) = (b0 - b2) * 0.5
    x2                 = x * 2
-- | Natural logarithm of the binomial coefficient /n/ choose /k/,
-- computed through the beta function with no argument checking.
--
-- Uses the identity @C(n,k) = 1 / ((n + 1) * B(n - k + 1, k + 1))@,
-- so the logarithm is @-log (n + 1) - logBeta (n - k + 1) (k + 1)@.
logChooseFast :: Double -> Double -> Double
logChooseFast n k = -log (n + 1) - logBeta (n - k + 1) (k + 1)
-- | Compute the binomial coefficient /n/ @\`choose\`@ /k/.
--
-- The symmetry @C(n,k) = C(n,n-k)@ is used to work with the smaller
-- index @k'@.  For @k' < 50@ the result is the running product of
-- @(n - k' + j) / j@ for @j = 1 .. k'@.  Larger cases go through
-- 'logChooseFast' and are approximate; the approximation is rounded
-- to the nearest integer whenever it fits in an 'Int64'.
--
-- Returns 0 when /k/ is negative or greater than /n/.
--
-- Example:
--
-- > 7 `choose` 3 == 35
choose :: Int -> Int -> Double
n `choose` k
    | k < 0 || k > n = 0
    | k' < 50        = U.foldl' go 1 . U.enumFromTo 1 $ k'
    | approx < max64 = fromIntegral . round64 $ approx
    | otherwise      = approx
  where
    k'        = min k (n - k)
    approx    = exp $ logChooseFast (fromIntegral n) (fromIntegral k')
    -- Multiply the accumulator by the j-th factor (n - k' + j) / j.
    go a i    = a * (nk + j) / j
      where j = fromIntegral i :: Double
    nk        = fromIntegral (n - k')
    max64     = fromIntegral (maxBound :: Int64)
    round64 x = round x :: Int64
-- | Accumulator for the integer branch of 'factorial': the running
-- product and the last factor that was multiplied in.
data F = F !Word64 !Word64

-- | Compute the factorial /n/! as a 'Double'.
--
-- Inputs up to 14 are multiplied out in 'Word64' arithmetic and
-- converted once at the end; larger inputs are multiplied directly in
-- floating point.  Calls 'error' on negative input.
factorial :: Int -> Double
factorial n
    | n < 0     = error "Statistics.Math.factorial: negative input"
    | n <= 1    = 1
    | n <= 14   = exactProduct
    | otherwise = floatingProduct
  where
    -- The factors 2 .. n; the integer branch only uses their count.
    factors         = U.enumFromTo 2 n
    floatingProduct = U.foldl' (\acc i -> acc * fromIntegral i) 1 factors
    exactProduct    = case U.foldl' bump (F 1 1) factors of
                        F total _ -> fromIntegral total
    -- Advance the counter and fold it into the running product.
    bump (F total counter) _ = F (total * next) next
      where next = counter + 1
-- | Compute the natural logarithm of the factorial function.
--
-- For @n <= 14@ this is simply @log (factorial n)@.  Larger inputs use
-- the Stirling series for @ln Gamma(x)@ with @x = n + 1@:
--
-- > (x - 0.5) * log x - x + ln (sqrt (2*pi))
-- >   + 1/(12 x) - 1/(360 x^3) + 1/(1260 x^5) - 1/(1680 x^7)
logFactorial :: Int -> Double
logFactorial n
    | n <= 14   = log (factorial n)
    | otherwise = (x - 0.5) * log x - x + 9.1893853320467e-1 + z / x
  where
    x = fromIntegral (n + 1)
    y = 1 / (x * x)
    -- Horner evaluation in y = 1/x^2 of the alternating correction
    -- series 1/12 - y/360 + y^2/1260 - y^3/1680.
    z = ((-(5.95238095238e-4 * y) + 7.936500793651e-4) * y -
         2.7777777777778e-3) * y + 8.3333333333333e-2
-- | Compute the normalized lower incomplete gamma function
-- @P(p, x)@, which tends to 1 as /x/ grows.  The branch structure and
-- constants follow Algorithm AS 239 (Shea).
--
-- * Invalid arguments (@x < 0@ or @p <= 0@) return 'm_pos_inf'.
--
-- * For @p >= 1000@ a cube-root normal approximation is used.
--
-- * For @x <= 1@ or @x < p@ a power series is summed.
--
-- * Otherwise a continued fraction for the complement is evaluated.
incompleteGamma :: Double       -- ^ Shape parameter /p/.
                -> Double       -- ^ Upper limit of integration /x/.
                -> Double
incompleteGamma p x
    | x < 0 || p <= 0 = m_pos_inf
    | x == 0          = 0
    | p >= 1000       = norm (3 * sqrt p * ((x/p) ** (1/3) + 1/(9*p) - 1))
    | x >= 1e8        = 1
    | x <= 1 || x < p = let a = p * log x - x - logGamma (p + 1)
                            g = a + log (pearson p 1 1)
                        in if g > limit then exp g else 0
    | otherwise       = let g = p * log x - x - logGamma p + log cf
                        in if g > limit then 1 - exp g else 1
  where
    norm = cumulative standard
    -- Sum the series 1 + x/(p+1) + x^2/((p+1)(p+2)) + ... until the
    -- latest term drops to the tolerance.
    pearson !a !c !g
        | c' <= tolerance = g'
        | otherwise       = pearson a' c' g'
      where a' = a + 1
            c' = c * x / a'
            g' = g + c'
    -- Starting values for the continued-fraction expansion.
    cf = let a  = 1 - p
             b  = a + x + 1
             p3 = x + 1
             p4 = x * b
         in contFrac a b 0 1 x p3 p4 (p3/p4)
    -- Iterate successive convergents p5/p6 until two consecutive
    -- values agree to within the tolerance.
    contFrac !a !b !c !p1 !p2 !p3 !p4 !g
        | abs (g - rn) <= min tolerance (tolerance * rn) = g
        | otherwise = contFrac a' b' c' (f p3) (f p4) (f p5) (f p6) rn
      where a' = a + 1
            b' = b + 2
            c' = c + 1
            an = a' * c'
            p5 = b' * p3 - an * p1
            p6 = b' * p4 - an * p2
            rn = p5 / p6
            -- Rescale all partial numerators and denominators together
            -- once they grow too large; the ratio is unaffected.
            f n | abs p5 > overflow = n / overflow
                | otherwise         = n
    -- Below this exponent, exp g is treated as zero.
    limit     = -88
    tolerance = 1e-14
    overflow  = 1e37
-- | Compute the logarithm of the gamma function.  The rational
-- approximations and their coefficients are those of Algorithm AS 245
-- (Macleod).
--
-- The argument range is split as follows:
--
-- * @x <= 0@ returns 'm_pos_inf'.
--
-- * @x < 1.5@, @x < 4@ and @x < 12@ each use a ratio of two quartic
--   polynomials.  Below 0.5 the identity
--   @ln Gamma(x) = ln Gamma(x + 1) - ln x@ shifts the argument first.
--
-- * @x >= 12@ uses Stirling's formula, with a rational correction in
--   @1 / x^2@ that is dropped once @x > 5.1e5@.
logGamma :: Double -> Double
logGamma x
    | x <= 0    = m_pos_inf
    | x < 1.5   = a + c *
                  ((((r1_4 * b + r1_3) * b + r1_2) * b + r1_1) * b + r1_0) /
                  ((((b + r1_8) * b + r1_7) * b + r1_6) * b + r1_5)
    | x < 4     = (x - 2) *
                  ((((r2_4 * x + r2_3) * x + r2_2) * x + r2_1) * x + r2_0) /
                  ((((x + r2_8) * x + r2_7) * x + r2_6) * x + r2_5)
    | x < 12    = ((((r3_4 * x + r3_3) * x + r3_2) * x + r3_1) * x + r3_0) /
                  ((((x + r3_8) * x + r3_7) * x + r3_6) * x + r3_5)
    | x > 5.1e5 = k
    | otherwise = k + x1 *
                  ((r4_2 * x2 + r4_1) * x2 + r4_0) /
                  ((x2 + r4_4) * x2 + r4_3)
  where
    -- (additive offset, polynomial argument, multiplier) for x < 1.5.
    (a , b , c)
        | x < 0.5   = (-y , x + 1 , x)
        | otherwise = (0  , x     , x - 1)

    y      = log x
    -- Leading Stirling terms; alr2pi is ln (sqrt (2*pi)).
    k      = x * (y - 1) - 0.5 * y + alr2pi
    alr2pi = 0.918938533204673

    x1 = 1 / x
    x2 = x1 * x1

    r1_0 =  -2.66685511495;   r1_1 =  -24.4387534237;    r1_2 = -21.9698958928
    r1_3 =  11.1667541262;    r1_4 =    3.13060547623;   r1_5 =   0.607771387771
    r1_6 =  11.9400905721;    r1_7 =   31.4690115749;    r1_8 =  15.2346874070

    r2_0 = -78.3359299449;    r2_1 = -142.046296688;     r2_2 = 137.519416416
    r2_3 =  78.6994924154;    r2_4 =    4.16438922228;   r2_5 =  47.0668766060
    r2_6 = 313.399215894;     r2_7 =  263.505074721;     r2_8 =  43.3400022514

    r3_0 =  -2.12159572323e5; r3_1 =    2.30661510616e5; r3_2 =   2.74647644705e4
    r3_3 =  -4.02621119975e4; r3_4 =   -2.29660729780e3; r3_5 =  -1.16328495004e5
    r3_6 =  -1.46025937511e5; r3_7 =   -2.42357409629e4; r3_8 =  -5.70691009324e2

    r4_0 = 0.279195317918525;  r4_1 = 0.4917317610505968
    r4_2 = 0.0692910599291889; r4_3 = 3.350343815022304
    r4_4 = 6.012459259764103
-- | Accumulator for 'logGammaL': the partial sum of the series and the
-- denominator to use for the next coefficient.
data L = L !Double !Double

-- | Compute the logarithm of the gamma function using a Lanczos
-- approximation:
--
-- > ln Gamma(x) = ln (a0 + sum_k a_k / (x + k - 1)) + ln (sqrt (2*pi))
-- >             - (x + 6.5) + (x - 0.5) * ln (x + 6.5)
--
-- Returns 'm_pos_inf' for @x <= 0@.
logGammaL :: Double -> Double
logGammaL x
    | x <= 0    = m_pos_inf
    | otherwise = fini . U.foldl' go (L 0 (x+7)) $ a
  where
    fini (L l _) = log (l+a0) + log m_sqrt_2_pi - x65 + (x-0.5) * log x65
    -- Coefficients are stored from the largest denominator (x + 7)
    -- down to the smallest (x), so the denominator counts down.
    go (L l t) k = L (l + k / t) (t-1)
    x65 = x + 6.5
    a0  = 0.9999999999995183
    a   = U.fromList [ 0.1659470187408462e-06
                     , 0.9934937113930748e-05
                     , -0.1385710331296526
                     , 12.50734324009056
                     , -176.6150291498386
                     , 771.3234287757674
                     , -1259.139216722289
                     , 676.5203681218835
                     ]
-- | Compute the log gamma correction factor for @x >= 10@, i.e. the
-- term that makes the following Stirling-style formula for the log
-- gamma function exact:
--
-- > lgg x = 0.5 * log (2*pi) + (x - 0.5) * log x - x + logGammaCorrection x
--
-- Returns 'm_NaN' for @x < 10@.  For very large /x/ only the leading
-- term @1 / (12 * x)@ is kept; otherwise a Chebyshev series in
-- @2 * (10/x)^2 - 1@ is evaluated with 'chebyshevBroucke'.
logGammaCorrection :: Double -> Double
logGammaCorrection x
    | x < 10    = m_NaN
    | x < big   = chebyshevBroucke (t * t * 2 - 1) coeffs / x
    | otherwise = 1 / (x * 12)
  where
    big    = 94906265.62425156
    t      = 10 / x
    coeffs = U.fromList [
               0.1666389480451863247205729650822e+0,
              -0.1384948176067563840732986059135e-4,
               0.9810825646924729426157171547487e-8,
              -0.1809129475572494194263306266719e-10,
               0.6221098041892605227126015543416e-13,
              -0.3399615005417721944303330599666e-15,
               0.2683181998482698748957538846666e-17
             ]
-- | Compute the natural logarithm of the beta function,
-- @ln B(a, b) = ln Gamma(a) + ln Gamma(b) - ln Gamma(a + b)@.
--
-- With @p = min a b@ and @q = max a b@:
--
-- * @p < 0@ returns 'm_NaN' and @p == 0@ returns 'm_pos_inf'.
--
-- * If both arguments are at least 10, or only the larger one is, the
--   gamma functions of large arguments are replaced by Stirling's
--   formula plus 'logGammaCorrection', and 'log1p' is used for
--   @log (q / (p + q))@ to avoid cancellation.
--
-- * Otherwise the defining identity is evaluated directly with
--   'logGamma'.
logBeta :: Double -> Double -> Double
logBeta a b
    | p < 0     = m_NaN
    | p == 0    = m_pos_inf
    | p >= 10   = log q * (-0.5) + m_ln_sqrt_2_pi + logGammaCorrection p + c +
                  (p - 0.5) * log ppq + q * log1p (-ppq)
    | q >= 10   = logGamma p + c + p - p * log pq + (q - 0.5) * log1p (-ppq)
    | otherwise = logGamma p + logGamma q - logGamma pq
  where
    p   = min a b
    q   = max a b
    ppq = p / pq
    pq  = p + q
    -- Only forced in the branches where q >= 10, so the correction
    -- terms are always evaluated inside their valid range.
    c   = logGammaCorrection q - logGammaCorrection pq
-- | Compute the natural logarithm of @1 + x@.  This stays accurate for
-- /x/ near zero, where evaluating @log (1 + x)@ directly would lose
-- precision.
--
-- * @x == -1@ returns 'm_neg_inf' and @x < -1@ returns 'm_NaN'.
--
-- * For tiny @|x|@ the result is /x/ itself, or the two-term series
--   @x - x^2 / 2@.
--
-- * For @|x| < 0.375@ a Chebyshev series is evaluated with
--   'chebyshevBroucke'.
--
-- * Otherwise @log (1 + x)@ is used directly.
log1p :: Double -> Double
log1p x
    | x == 0               = 0
    | x == -1              = m_neg_inf
    | x < -1               = m_NaN
    | x' < m_epsilon * 0.5 = x
    | (x >= 0 && x < 1e-8) || (x >= -1e-9 && x < 0)
                           = x * (1 - x * 0.5)
    | x' < 0.375           = x * (1 - x * chebyshevBroucke (x / 0.375) coeffs)
    | otherwise            = log (1 + x)
  where
    x' = abs x
    coeffs = U.fromList [
               0.10378693562743769800686267719098e+1,
              -0.13364301504908918098766041553133e+0,
               0.19408249135520563357926199374750e-1,
              -0.30107551127535777690376537776592e-2,
               0.48694614797154850090456366509137e-3,
              -0.81054881893175356066809943008622e-4,
               0.13778847799559524782938251496059e-4,
              -0.23802210894358970251369992914935e-5,
               0.41640416213865183476391859901989e-6,
              -0.73595828378075994984266837031998e-7,
               0.13117611876241674949152294345011e-7,
              -0.23546709317742425136696092330175e-8,
               0.42522773276034997775638052962567e-9,
              -0.77190894134840796826108107493300e-10,
               0.14075746481359069909215356472191e-10,
              -0.25769072058024680627537078627584e-11,
               0.47342406666294421849154395005938e-12,
              -0.87249012674742641745301263292675e-13,
               0.16124614902740551465739833119115e-13,
              -0.29875652015665773006710792416815e-14,
               0.55480701209082887983041321697279e-15,
              -0.10324619158271569595141333961932e-15
             ]