blob: 9179bc01ad1d30171c986729a9ee7be9c776af8e [file] [log] [blame]
* #%L
* %%
* Copyright 1999 CERN - European Organization for Nuclear Research.
* %%
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* See the License for the specific language governing permissions and
* limitations under the License.
* #L%
public class Statistics {
/** Some constants */
// Relative-precision threshold used to stop the series / continued-fraction
// loops in this class (numerically 2^-53).
protected static final double MACHEP = 1.11022302462515654042E-16;
// Exponent guard: quantities whose logarithm is below -MAXLOG are returned as 0
// instead of being passed to Math.exp (numerically close to ln(Double.MAX_VALUE)).
protected static final double MAXLOG = 7.09782712893383996732E2;
// Lower bound on an argument to Math.exp; below it the result is set to 0
// (see incompleteBeta and powerSeries).
protected static final double MINLOG = -7.451332191019412076235E2;
// Upper bound on a + b for which gamma(a + b) is evaluated directly; above it
// the callers switch to lnGamma.
protected static final double MAXGAM = 171.624376956302725;
// Numerically sqrt(2 * pi); multiplies the result in stirlingFormula.
protected static final double SQTPI = 2.50662827463100050242E0;
// Numerically sqrt(2) / 2; scales the argument in normalProbability.
protected static final double SQRTH = 7.07106781186547524401E-1;
// Numerically ln(pi); used by the x < -34 branch of lnGamma.
protected static final double LOGPI = 1.14472988584940017414;
// Rescaling pair (numerically 2^52 and 2^-52) used to keep the continued-fraction
// numerators/denominators within range.
protected static final double big = 4.503599627370496e15;
protected static final double biginv = 2.22044604925031308085e-16;
/* approximation for 0 <= |y - 0.5| <= 3/8 */
// P0 / Q0 are passed to polevl(y2, P0, 4) and p1evl(y2, Q0, 8) by normalInverse.
// NOTE(review): the initializer values and closing "};" of both arrays are not
// present in this view of the file - restore them from the upstream source.
protected static final double P0[] = {
protected static final double Q0[] = {
/* 1.00000000000000000000E0, */
/*
 * Approximation for interval z = sqrt(-2 log y) between 2 and 8, i.e., y
 * between exp(-2) = .135 and exp(-32) = 1.27e-14.
 */
// P1 / Q1 are passed to polevl(z, P1, 8) and p1evl(z, Q1, 8) by normalInverse
// when sqrt(-2 log y) < 8.
// NOTE(review): the initializer values and closing "};" of both arrays are not
// present in this view of the file - restore them from the upstream source.
protected static final double P1[] = {
protected static final double Q1[] = {
/* 1.00000000000000000000E0, */
/*
 * Approximation for interval z = sqrt(-2 log y) between 8 and 64, i.e., y
 * between exp(-32) = 1.27e-14 and exp(-2048) = 3.67e-890.
 */
// P2 / Q2 are passed to polevl(z, P2, 8) and p1evl(z, Q2, 8) by normalInverse.
// NOTE(review): the initializer values and closing "};" of both arrays are not
// present in this view of the file - restore them from the upstream source.
protected static final double P2[] = {
protected static final double Q2[] = {
/* 1.00000000000000000000E0, */
* Computes standard error for observed values of a binomial random variable.
* @param p
* the probability of success
* @param n
* the size of the sample
* @return the standard error
public static double binomialStandardError(double p, int n) {
if (n == 0) {
return 0;
return Math.sqrt((p * (1 - p)) / (double) n);
* Returns chi-squared probability for given value and degrees of freedom. (The probability that the chi-squared
* variate will be greater than x for the given degrees of freedom.)
* @param x
* the value
* @param v
* the number of degrees of freedom
* @return the chi-squared probability
public static double chiSquaredProbability(double x, double v) {
if (x < 0.0 || v < 1.0)
return 0.0;
return incompleteGammaComplement(v / 2.0, x / 2.0);
* Computes probability of F-ratio.
* @param F
* the F-ratio
* @param df1
* the first number of degrees of freedom
* @param df2
* the second number of degrees of freedom
* @return the probability of the F-ratio.
public static double FProbability(double F, int df1, int df2) {
return incompleteBeta(df2 / 2.0, df1 / 2.0, df2 / (df2 + df1 * F));
* Returns the area under the Normal (Gaussian) probability density function, integrated from minus infinity to
* <tt>x</tt> (assumes mean is zero, variance is one).
* <pre>
* x
* -
* 1 | | 2
* normal(x) = --------- | exp( - t /2 ) dt
* sqrt(2pi) | |
* -
* -inf.
* = ( 1 + erf(z) ) / 2
* = erfc(z) / 2
* </pre>
* where <tt>z = x/sqrt(2)</tt>. Computation is via the functions <tt>errorFunction</tt> and
* <tt>errorFunctionComplement</tt>.
* @param a
* the z-value
* @return the probability of the z value according to the normal pdf
public static double normalProbability(double a) {
double x, y, z;
x = a * SQRTH;
z = Math.abs(x);
if (z < SQRTH)
y = 0.5 + 0.5 * errorFunction(x);
else {
y = 0.5 * errorFunctionComplemented(z);
if (x > 0)
y = 1.0 - y;
return y;
* Returns the value, <tt>x</tt>, for which the area under the Normal (Gaussian) probability density function
* (integrated from minus infinity to <tt>x</tt>) is equal to the argument <tt>y</tt> (assumes mean is zero, variance
* is one).
* <p>
* For small arguments <tt>0 < y < exp(-2)</tt>, the program computes <tt>z = sqrt( -2.0 * log(y) )</tt>; then the
* approximation is <tt>x = z - log(z)/z - (1/z) P(1/z) / Q(1/z)</tt>. There are two rational functions P/Q, one for
* <tt>0 < y < exp(-32)</tt> and the other for <tt>y</tt> up to <tt>exp(-2)</tt>. For larger arguments,
* <tt>w = y - 0.5</tt>, and <tt>x/sqrt(2pi) = w + w**3 R(w**2)/S(w**2))</tt>.
* @param y0
* the area under the normal pdf
* @return the z-value
public static double normalInverse(double y0) {
double x, y, z, y2, x0, x1;
int code;
final double s2pi = Math.sqrt(2.0 * Math.PI);
if (y0 <= 0.0)
throw new IllegalArgumentException();
if (y0 >= 1.0)
throw new IllegalArgumentException();
code = 1;
y = y0;
if (y > (1.0 - 0.13533528323661269189)) { /* 0.135... = exp(-2) */
y = 1.0 - y;
code = 0;
if (y > 0.13533528323661269189) {
y = y - 0.5;
y2 = y * y;
x = y + y * (y2 * polevl(y2, P0, 4) / p1evl(y2, Q0, 8));
x = x * s2pi;
return (x);
x = Math.sqrt(-2.0 * Math.log(y));
x0 = x - Math.log(x) / x;
z = 1.0 / x;
if (x < 8.0) /* y > exp(-32) = 1.2664165549e-14 */
x1 = z * polevl(z, P1, 8) / p1evl(z, Q1, 8);
x1 = z * polevl(z, P2, 8) / p1evl(z, Q2, 8);
x = x0 - x1;
if (code != 0)
x = -x;
return (x);
/**
 * Returns natural logarithm of gamma function.
 *
 * @param x
 *            the value
 * @return natural logarithm of gamma function
 */
public static double lnGamma(double x) {
// Computes the natural logarithm of the gamma function using three regimes:
// x < -34, x < 13 and larger x.
// NOTE(review): in this view the closing braces, bare "else" lines and the
// contents of the coefficient arrays are not present; the comments below describe
// only the statements that are visible.
double p, q, w, z;
// A is evaluated with polevl(p, A, 4) in the large-x branch; B and C form the
// rational term polevl(x, B, 5) / p1evl(x, C, 6) in the x < 13 branch.
double A[] = {
double B[] = {
double C[] = {
/* 1.00000000000000000000E0, */
// --- x < -34: derive the result from lnGamma(-x) ---
if (x < -34.0) {
q = -x;
w = lnGamma(q);
p = Math.floor(q);
// q is an integer, i.e. x is a negative integer: rejected.
if (p == q)
throw new ArithmeticException("lnGamma: Overflow");
// z becomes the distance from q to the nearest integer.
z = q - p;
if (z > 0.5) {
p += 1.0;
z = p - q;
z = q * Math.sin(Math.PI * z);
if (z == 0.0)
throw new ArithmeticException("lnGamma: Overflow");
// ln(pi) - ln(q * sin(pi * z)) - lnGamma(q)
z = LOGPI - Math.log(z) - w;
return z;
// --- x < 13: shift the argument towards 2, accumulating the factor in z ---
if (x < 13.0) {
z = 1.0;
while (x >= 3.0) {
x -= 1.0;
z *= x;
while (x < 2.0) {
if (x == 0.0)
throw new ArithmeticException("lnGamma: Overflow");
z /= x;
x += 1.0;
// Only the magnitude of the accumulated factor is kept.
if (z < 0.0)
z = -z;
if (x == 2.0)
return Math.log(z);
// Rational approximation in (x - 2), added to the log of the shift factor.
x -= 2.0;
p = x * polevl(x, B, 5) / p1evl(x, C, 6);
return (Math.log(z) + p);
// --- remaining (large) x ---
if (x > 2.556348e305)
throw new ArithmeticException("lnGamma: Overflow");
// Leading term; the constant is numerically ln(sqrt(2 * pi)).
q = (x - 0.5) * Math.log(x) - x + 0.91893853320467274178;
// Beyond 1e8 no correction term is added.
if (x > 1.0e8)
return (q);
p = 1.0 / (x * x);
// Correction in powers of 1/x^2: a fixed three-term form for x >= 1000.
// NOTE(review): the polevl(p, A, 4) line below presumably belongs to an "else"
// that is missing from this view - confirm against upstream.
if (x >= 1000.0)
q += ((7.9365079365079365079365e-4 * p
- 2.7777777777777777777778e-3) * p
+ 0.0833333333333333333333) / x;
q += polevl(p, A, 4) / x;
return q;
/**
 * Returns the error function of the normal distribution. The integral is
 *
 * <pre>
 *                           x
 *                            -
 *                 2         | |          2
 *   erf(x)  =  --------     |    exp( - t  ) dt.
 *              sqrt(pi)   | |
 *                          -
 *                           0
 * </pre>
 *
 * <b>Implementation:</b> For <tt>0 &lt;= |x| &lt; 1, erf(x) = x * P4(x**2)/Q5(x**2)</tt>; otherwise
 * <tt>erf(x) = 1 - erfc(x)</tt>.
 * <p>
 * Code adapted from the Java 2D Graph Package 2.4, which in turn is a port from the Cephes 2.2 Math Library (C).
 *
 * @param x
 *            the argument to the function.
 * @return the value of the error function at <tt>x</tt>
 */
public static double errorFunction(double x) {
// Evaluates erf(x): delegates to the complement for |x| > 1, otherwise uses a
// rational function in x^2.
// NOTE(review): the contents of T and U and the closing braces are not present
// in this view of the file.
double y, z;
// T: numerator coefficients for polevl(z, T, 4); U: denominator coefficients for
// p1evl(z, U, 5), whose leading 1.0 is implicit (see the commented-out entry).
final double T[] = {
final double U[] = {
// 1.00000000000000000000E0,
if (Math.abs(x) > 1.0)
return (1.0 - errorFunctionComplemented(x));
z = x * x;
y = x * polevl(z, T, 4) / p1evl(z, U, 5);
return y;
/**
 * Returns the complementary Error function of the normal distribution.
 *
 * <pre>
 *  1 - erf(x) =
 *
 *                           inf.
 *                             -
 *                  2         | |          2
 *   erfc(x)  =  --------     |    exp( - t  ) dt
 *               sqrt(pi)   | |
 *                           -
 *                            x
 * </pre>
 *
 * <b>Implementation:</b> For small x, <tt>erfc(x) = 1 - erf(x)</tt>; otherwise rational approximations are computed.
 * <p>
 * Code adapted from the Java 2D Graph Package 2.4, which in turn is a port from the Cephes 2.2 Math Library (C).
 *
 * @param a
 *            the argument to the function.
 * @return the value of the complementary error function at <tt>a</tt>
 */
public static double errorFunctionComplemented(double a) {
// Evaluates erfc(a): 1 - erf(a) when the working magnitude x is below 1,
// otherwise exp(-a^2) times a rational function of x.
// NOTE(review): the contents of P, Q, R, S, the closing braces and bare "else"
// lines are not present in this view of the file.
double x, y, z, p, q;
// P/Q are used for x < 8 (polevl(x, P, 8) / p1evl(x, Q, 8)); R/S for x >= 8
// (polevl(x, R, 5) / p1evl(x, S, 6)). Q and S omit their leading 1.0.
double P[] = {
double Q[] = {
// 1.0
double R[] = {
double S[] = {
// 1.00000000000000000000E0,
// NOTE(review): presumably x = |a|; the "else" between the two assignments
// appears to be missing from this view - confirm against upstream.
if (a < 0.0)
x = -a;
x = a;
if (x < 1.0)
return 1.0 - errorFunction(a);
z = -a * a;
// exp(-a^2) is treated as zero here: the result is 2 for negative a, 0 otherwise.
if (z < -MAXLOG) {
if (a < 0)
return (2.0);
return (0.0);
z = Math.exp(z);
if (x < 8.0) {
p = polevl(x, P, 8);
q = p1evl(x, Q, 8);
} else {
p = polevl(x, R, 5);
q = p1evl(x, S, 6);
y = (z * p) / q;
// For negative a the value is reflected: 2 - y.
if (a < 0)
y = 2.0 - y;
// An exactly-zero result is mapped to the same limits as the guard above.
if (y == 0.0) {
if (a < 0)
return 2.0;
return (0.0);
return y;
* Evaluates the given polynomial of degree <tt>N</tt> at <tt>x</tt>. Evaluates polynomial when coefficient of N is
* 1.0. Otherwise same as <tt>polevl()</tt>.
* <pre>
* 2 N
* y = C + C x + C x +...+ C x
* 0 1 2 N
* Coefficients are stored in reverse order:
* coef[0] = C , ..., coef[N] = C .
* N 0
* </pre>
* The function <tt>p1evl()</tt> assumes that <tt>coef[N] = 1.0</tt> and is omitted from the array. Its calling
* arguments are otherwise the same as <tt>polevl()</tt>.
* <p>
* In the interest of speed, there are no checks for out of bounds arithmetic.
* @param x
* argument to the polynomial.
* @param coef
* the coefficients of the polynomial.
* @param N
* the degree of the polynomial.
public static double p1evl(double x, double coef[], int N) {
double ans;
ans = x + coef[0];
for (int i = 1; i < N; i++)
ans = ans * x + coef[i];
return ans;
* Evaluates the given polynomial of degree <tt>N</tt> at <tt>x</tt>.
* <pre>
* 2 N
* y = C + C x + C x +...+ C x
* 0 1 2 N
* Coefficients are stored in reverse order:
* coef[0] = C , ..., coef[N] = C .
* N 0
* </pre>
* In the interest of speed, there are no checks for out of bounds arithmetic.
* @param x
* argument to the polynomial.
* @param coef
* the coefficients of the polynomial.
* @param N
* the degree of the polynomial.
public static double polevl(double x, double coef[], int N) {
double ans;
ans = coef[0];
for (int i = 1; i <= N; i++)
ans = ans * x + coef[i];
return ans;
* Returns the Incomplete Gamma function.
* @param a
* the parameter of the gamma distribution.
* @param x
* the integration end point.
public static double incompleteGamma(double a, double x)
double ans, ax, c, r;
if (x <= 0 || a <= 0)
return 0.0;
if (x > 1.0 && x > a)
return 1.0 - incompleteGammaComplement(a, x);
/* Compute x**a * exp(-x) / gamma(a) */
ax = a * Math.log(x) - x - lnGamma(a);
if (ax < -MAXLOG)
return (0.0);
ax = Math.exp(ax);
/* power series */
r = a;
c = 1.0;
ans = 1.0;
do {
r += 1.0;
c *= x / r;
ans += c;
} while (c / ans > MACHEP);
return (ans * ax / a);
* Returns the Complemented Incomplete Gamma function.
* @param a
* the parameter of the gamma distribution.
* @param x
* the integration start point.
public static double incompleteGammaComplement(double a, double x) {
double ans, ax, c, yc, r, t, y, z;
double pk, pkm1, pkm2, qk, qkm1, qkm2;
if (x <= 0 || a <= 0)
return 1.0;
if (x < 1.0 || x < a)
return 1.0 - incompleteGamma(a, x);
ax = a * Math.log(x) - x - lnGamma(a);
if (ax < -MAXLOG)
return 0.0;
ax = Math.exp(ax);
/* continued fraction */
y = 1.0 - a;
z = x + y + 1.0;
c = 0.0;
pkm2 = 1.0;
qkm2 = x;
pkm1 = x + 1.0;
qkm1 = z * x;
ans = pkm1 / qkm1;
do {
c += 1.0;
y += 1.0;
z += 2.0;
yc = y * c;
pk = pkm1 * z - pkm2 * yc;
qk = qkm1 * z - qkm2 * yc;
if (qk != 0) {
r = pk / qk;
t = Math.abs((ans - r) / r);
ans = r;
} else
t = 1.0;
pkm2 = pkm1;
pkm1 = pk;
qkm2 = qkm1;
qkm1 = qk;
if (Math.abs(pk) > big) {
pkm2 *= biginv;
pkm1 *= biginv;
qkm2 *= biginv;
qkm1 *= biginv;
} while (t > MACHEP);
return ans * ax;
/**
 * Returns the Gamma function of the argument.
 */
public static double gamma(double x) {
// Evaluates the gamma function: |x| > 33 goes through stirlingFormula, smaller
// arguments are shifted into [2, 3) and finished with a rational function P/Q.
// NOTE(review): the contents of P and Q, the closing braces and bare "else"
// lines are not present in this view of the file.
double P[] = {
double Q[] = {
double p, z;
int i;
double q = Math.abs(x);
// --- large |x| ---
if (q > 33.0) {
if (x < 0.0) {
p = Math.floor(q);
// Negative integer argument: rejected.
if (p == q)
throw new ArithmeticException("gamma: overflow");
// NOTE(review): i is assigned here but not read in any visible line.
i = (int) p;
z = q - p;
if (z > 0.5) {
p += 1.0;
z = q - p;
z = q * Math.sin(Math.PI * z);
if (z == 0.0)
throw new ArithmeticException("gamma: overflow");
z = Math.abs(z);
z = Math.PI / (z * stirlingFormula(q));
// NOTE(review): after Math.abs the returned value is always negative, although
// the sign of gamma alternates between consecutive negative unit intervals;
// looks like a sign factor derived from i was intended - confirm against upstream.
return -z;
} else {
return stirlingFormula(x);
// --- |x| <= 33: accumulate the shift factor in z ---
z = 1.0;
while (x >= 3.0) {
x -= 1.0;
z *= x;
while (x < 0.0) {
// NOTE(review): with the loop condition x < 0.0, the x == 0.0 test just below
// cannot be true on entry to an iteration.
if (x == 0.0) {
throw new ArithmeticException("gamma: singular");
} else if (x > -1.E-9) {
// Very close to zero: closed-form small-argument expression.
return (z / ((1.0 + 0.5772156649015329 * x) * x));
z /= x;
x += 1.0;
while (x < 2.0) {
if (x == 0.0) {
throw new ArithmeticException("gamma: singular");
} else if (x < 1.e-9) {
return (z / ((1.0 + 0.5772156649015329 * x) * x));
z /= x;
x += 1.0;
if ((x == 2.0) || (x == 3.0))
return z;
// Rational approximation in (x - 2), scaled by the accumulated factor.
x -= 2.0;
p = polevl(x, P, 6);
q = polevl(x, Q, 7);
return z * p / q;
/**
 * Returns the Gamma function computed by Stirling's formula. The polynomial STIR is valid for 33 &lt;= x &lt;= 172.
 */
public static double stirlingFormula(double x) {
// Computes SQTPI * x^(x - 0.5) * exp(-x) * (1 + (1/x) * polevl(1/x, STIR, 4)).
// NOTE(review): the contents of STIR and the closing braces are not present in
// this view of the file.
double STIR[] = {
// Above this argument the power is split in two to avoid overflow (see below).
double MAXSTIR = 143.01608;
double w = 1.0 / x;
double y = Math.exp(x);
// Correction factor as a polynomial in 1/x.
w = 1.0 + w * polevl(w, STIR, 4);
if (x > MAXSTIR) {
/* Avoid overflow in Math.pow() */
// v * v equals x^(x - 0.5); dividing one factor by exp(x) first keeps the
// intermediate values smaller.
double v = Math.pow(x, 0.5 * x - 0.25);
y = v * (v / y);
} else {
y = Math.pow(x, x - 0.5) / y;
y = SQTPI * y * w;
return y;
* Returns the Incomplete Beta Function evaluated from zero to <tt>xx</tt>.
* @param aa
* the alpha parameter of the beta distribution.
* @param bb
* the beta parameter of the beta distribution.
* @param xx
* the integration end point.
public static double incompleteBeta(double aa, double bb, double xx) {
double a, b, t, x, xc, w, y;
boolean flag;
if (aa <= 0.0 || bb <= 0.0)
throw new ArithmeticException("ibeta: Domain error!");
if ((xx <= 0.0) || (xx >= 1.0)) {
if (xx == 0.0)
return 0.0;
if (xx == 1.0)
return 1.0;
throw new ArithmeticException("ibeta: Domain error!");
flag = false;
if ((bb * xx) <= 1.0 && xx <= 0.95) {
t = powerSeries(aa, bb, xx);
return t;
w = 1.0 - xx;
/* Reverse a and b if x is greater than the mean. */
if (xx > (aa / (aa + bb))) {
flag = true;
a = bb;
b = aa;
xc = xx;
x = w;
} else {
a = aa;
b = bb;
xc = w;
x = xx;
if (flag && (b * x) <= 1.0 && x <= 0.95) {
t = powerSeries(a, b, x);
if (t <= MACHEP)
t = 1.0 - MACHEP;
t = 1.0 - t;
return t;
/* Choose expansion for better convergence. */
y = x * (a + b - 2.0) - (a - 1.0);
if (y < 0.0)
w = incompleteBetaFraction1(a, b, x);
w = incompleteBetaFraction2(a, b, x) / xc;
* Multiply w by the factor a b _ _ _ x (1-x) | (a+b) / ( a | (a) | (b) ) .
y = a * Math.log(x);
t = b * Math.log(xc);
if ((a + b) < MAXGAM && Math.abs(y) < MAXLOG && Math.abs(t) < MAXLOG) {
t = Math.pow(xc, b);
t *= Math.pow(x, a);
t /= a;
t *= w;
t *= gamma(a + b) / (gamma(a) * gamma(b));
if (flag) {
if (t <= MACHEP)
t = 1.0 - MACHEP;
t = 1.0 - t;
return t;
/* Resort to logarithms. */
y += t + lnGamma(a + b) - lnGamma(a) - lnGamma(b);
y += Math.log(w / a);
if (y < MINLOG)
t = 0.0;
t = Math.exp(y);
if (flag) {
if (t <= MACHEP)
t = 1.0 - MACHEP;
t = 1.0 - t;
return t;
* Continued fraction expansion #1 for incomplete beta integral.
public static double incompleteBetaFraction1(double a, double b, double x) {
double xk, pk, pkm1, pkm2, qk, qkm1, qkm2;
double k1, k2, k3, k4, k5, k6, k7, k8;
double r, t, ans, thresh;
int n;
k1 = a;
k2 = a + b;
k3 = a;
k4 = a + 1.0;
k5 = 1.0;
k6 = b - 1.0;
k7 = k4;
k8 = a + 2.0;
pkm2 = 0.0;
qkm2 = 1.0;
pkm1 = 1.0;
qkm1 = 1.0;
ans = 1.0;
r = 1.0;
n = 0;
thresh = 3.0 * MACHEP;
do {
xk = -(x * k1 * k2) / (k3 * k4);
pk = pkm1 + pkm2 * xk;
qk = qkm1 + qkm2 * xk;
pkm2 = pkm1;
pkm1 = pk;
qkm2 = qkm1;
qkm1 = qk;
xk = (x * k5 * k6) / (k7 * k8);
pk = pkm1 + pkm2 * xk;
qk = qkm1 + qkm2 * xk;
pkm2 = pkm1;
pkm1 = pk;
qkm2 = qkm1;
qkm1 = qk;
if (qk != 0)
r = pk / qk;
if (r != 0) {
t = Math.abs((ans - r) / r);
ans = r;
} else
t = 1.0;
if (t < thresh)
return ans;
k1 += 1.0;
k2 += 1.0;
k3 += 2.0;
k4 += 2.0;
k5 += 1.0;
k6 -= 1.0;
k7 += 2.0;
k8 += 2.0;
if ((Math.abs(qk) + Math.abs(pk)) > big) {
pkm2 *= biginv;
pkm1 *= biginv;
qkm2 *= biginv;
qkm1 *= biginv;
if ((Math.abs(qk) < biginv) || (Math.abs(pk) < biginv)) {
pkm2 *= big;
pkm1 *= big;
qkm2 *= big;
qkm1 *= big;
} while (++n < 300);
return ans;
* Continued fraction expansion #2 for incomplete beta integral.
public static double incompleteBetaFraction2(double a, double b, double x) {
double xk, pk, pkm1, pkm2, qk, qkm1, qkm2;
double k1, k2, k3, k4, k5, k6, k7, k8;
double r, t, ans, z, thresh;
int n;
k1 = a;
k2 = b - 1.0;
k3 = a;
k4 = a + 1.0;
k5 = 1.0;
k6 = a + b;
k7 = a + 1.0;
k8 = a + 2.0;
pkm2 = 0.0;
qkm2 = 1.0;
pkm1 = 1.0;
qkm1 = 1.0;
z = x / (1.0 - x);
ans = 1.0;
r = 1.0;
n = 0;
thresh = 3.0 * MACHEP;
do {
xk = -(z * k1 * k2) / (k3 * k4);
pk = pkm1 + pkm2 * xk;
qk = qkm1 + qkm2 * xk;
pkm2 = pkm1;
pkm1 = pk;
qkm2 = qkm1;
qkm1 = qk;
xk = (z * k5 * k6) / (k7 * k8);
pk = pkm1 + pkm2 * xk;
qk = qkm1 + qkm2 * xk;
pkm2 = pkm1;
pkm1 = pk;
qkm2 = qkm1;
qkm1 = qk;
if (qk != 0)
r = pk / qk;
if (r != 0) {
t = Math.abs((ans - r) / r);
ans = r;
} else
t = 1.0;
if (t < thresh)
return ans;
k1 += 1.0;
k2 -= 1.0;
k3 += 2.0;
k4 += 2.0;
k5 += 1.0;
k6 += 1.0;
k7 += 2.0;
k8 += 2.0;
if ((Math.abs(qk) + Math.abs(pk)) > big) {
pkm2 *= biginv;
pkm1 *= biginv;
qkm2 *= biginv;
qkm1 *= biginv;
if ((Math.abs(qk) < biginv) || (Math.abs(pk) < biginv)) {
pkm2 *= big;
pkm1 *= big;
qkm2 *= big;
qkm1 *= big;
} while (++n < 300);
return ans;
* Power series for incomplete beta integral. Use when b*x is small and x not too close to 1.
public static double powerSeries(double a, double b, double x) {
double s, t, u, v, n, t1, z, ai;
ai = 1.0 / a;
u = (1.0 - b) * x;
v = u / (a + 1.0);
t1 = v;
t = u;
n = 2.0;
s = 0.0;
z = MACHEP * ai;
while (Math.abs(v) > z) {
u = (n - b) * x / n;
t *= u;
v = t / (a + n);
s += v;
n += 1.0;
s += t1;
s += ai;
u = a * Math.log(x);
if ((a + b) < MAXGAM && Math.abs(u) < MAXLOG) {
t = gamma(a + b) / (gamma(a) * gamma(b));
s = s * t * Math.pow(x, a);
} else {
t = lnGamma(a + b) - lnGamma(a) - lnGamma(b) + u + Math.log(s);
if (t < MINLOG)
s = 0.0;
s = Math.exp(t);
return s;