Statistical functions on arrays of numbers, namely, the mean, variance, standard deviation, covariance, min and max

       

/*
 * Copyright (c) 2009-2010, Sergey Karakovskiy and Julian Togelius
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *     * Redistributions of source code must retain the above copyright
 *       notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above copyright
 *       notice, this list of conditions and the following disclaimer in the
 *       documentation and/or other materials provided with the distribution.
 *     * Neither the name of the Mario AI nor the
 *       names of its contributors may be used to endorse or promote products
 *       derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
 * IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT,
 * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

//package ch.idsia.utils.statistics;

import java.io.IOException;
import java.io.PrintStream;
import java.util.Enumeration;
import java.util.Vector;

/**
 * Simple statistical functions on arrays of numbers: mean, variance,
 * standard deviation, standard error, covariance, correlation, min and max.
 *
 * <p>
 * Every variance-based quantity in this class uses the population form, i.e.
 * sums are divided by {@code n} (the array length), not by {@code n - 1}.
 * None of the methods checks its arguments for {@code null}.
 */

public class Stats {

  /**
   * Converts a vector of Numbers into an array of double. This function does
   * not necessarily belong here, but is commonly required in order to apply
   * the statistical functions conveniently, since they only deal with arrays
   * of double. (Note that Number is the common superclass of all the Object
   * versions of the numeric primitives, such as Integer, Double etc.).
   *
   * @param v
   *            vector whose elements are all instances of Number
   * @return a new array holding the {@code doubleValue()} of each element, in
   *         the vector's iteration order
   * @throws ClassCastException
   *             if an element is not a Number
   */
  public static double[] v2a(Vector<?> v) {
    double[] d = new double[v.size()];
    int i = 0;
    for (Object element : v) {
      d[i++] = ((Number) element).doubleValue();
    }
    return d;
  }

  /**
   * Calculates the square of a double.
   *
   * @param x
   *            the value to square
   * @return Returns x*x
   */
  public static double sqr(double x) {
    return x * x;
  }

  /**
   * Returns the average of an array of double.
   *
   * @param v
   *            the data
   * @return the arithmetic mean; NaN when the array is empty (0.0 / 0)
   */
  public static double mean(double[] v) {
    double tot = 0.0;
    for (double value : v) {
      tot += value;
    }
    return tot / v.length;
  }

  /**
   * Returns the average of an array of int.
   *
   * @param v
   *            the data
   * @return the arithmetic mean as a double; NaN when the array is empty
   */
  public static double mean(int[] v) {
    double tot = 0.0;
    for (int value : v) {
      tot += value;
    }
    return tot / v.length;
  }

  /**
   * Returns the population standard deviation of an array of double, i.e.
   * the square root of {@link #variance(double[])}, which divides by n.
   *
   * @param v
   *            the data
   * @return the square root of the population variance; NaN when the array
   *         is empty
   */
  public static double sdev(double[] v) {
    return Math.sqrt(variance(v));
  }

  /**
   * Returns the standard error of an array of double, where this is defined
   * as the standard deviation (as computed by {@link #sdev(double[])})
   * divided by the square root of the number of elements.
   *
   * @param v
   *            the data
   * @return sdev(v) / sqrt(v.length); NaN when the array is empty
   */
  public static double stderr(double[] v) {
    return sdev(v) / Math.sqrt(v.length);
  }

  /**
   * Returns the population variance of the array of double: the mean of the
   * squared deviations from the mean (the sum is divided by n, not n - 1).
   *
   * @param v
   *            the data
   * @return the population variance; NaN when the array is empty
   */
  public static double variance(double[] v) {
    double mu = mean(v);
    double sumsq = 0.0;
    for (double value : v) {
      sumsq += sqr(mu - value);
    }
    return sumsq / v.length;
  }

  /**
   * Alternative formulation of the population variance, (sum of squares -
   * n * mean^2) / n, that was used to check the correctness of
   * {@link #variance(double[])}.
   */
  private static double variance2(double[] v) {
    double mu = mean(v);
    double sumsq = 0.0;
    for (double value : v) {
      sumsq += sqr(value);
    }
    double diff = sumsq - v.length * sqr(mu);
    return diff / v.length;
  }

  /**
   * Returns the population covariance of the paired arrays of double: the
   * mean of the products of the paired deviations from the respective means.
   *
   * @param v1
   *            first series
   * @param v2
   *            second series, paired element by element with v1
   * @return the population covariance; NaN when both arrays are empty
   * @throws IllegalArgumentException
   *             if the arrays differ in length, since the values could then
   *             not be paired
   */
  public static double covar(double[] v1, double[] v2) {
    if (v1.length != v2.length) {
      throw new IllegalArgumentException(
          "Paired arrays must have the same length: " + v1.length
              + " != " + v2.length);
    }
    double m1 = mean(v1);
    double m2 = mean(v2);
    double sumsq = 0.0;
    for (int i = 0; i < v1.length; i++) {
      sumsq += (m1 - v1[i]) * (m2 - v2[i]);
    }
    return sumsq / v1.length;
  }

  /**
   * Returns the correlation coefficient of the paired arrays: the covariance
   * divided by the product of the two standard deviations. The means are
   * recomputed by each helper, so this is not an efficient implementation.
   * No guard is applied against a zero standard deviation; the result of the
   * floating-point division is returned as is.
   *
   * @param v1
   *            first series
   * @param v2
   *            second series, paired element by element with v1
   * @return covar(v1, v2) / (sdev(v1) * sdev(v2))
   * @throws IllegalArgumentException
   *             if the arrays differ in length
   */
  public static double correlation(double[] v1, double[] v2) {
    return covar(v1, v2) / (sdev(v1) * sdev(v2));
  }

  /**
   * Returns the square of the covariance divided by the product of the two
   * variances (each computed as the covariance of a series with itself).
   * Algebraically this is the square of {@link #correlation(double[], double[])},
   * so the sign of the relationship is lost. Like that method, this is not an
   * efficient implementation.
   *
   * @param v1
   *            first series
   * @param v2
   *            second series, paired element by element with v1
   * @return covar(v1, v2)^2 / (covar(v1, v1) * covar(v2, v2))
   * @throws IllegalArgumentException
   *             if the arrays differ in length
   */
  public static double correlation2(double[] v1, double[] v2) {
    return sqr(covar(v1, v2)) / (covar(v1, v1) * covar(v2, v2));
  }

  /**
   * Returns the maximum value in the array.
   *
   * @param v
   *            the data; must contain at least one element
   * @return the largest element, as determined by {@link Math#max(double, double)}
   * @throws ArrayIndexOutOfBoundsException
   *             if the array is empty
   */
  public static double max(double[] v) {
    double m = v[0];
    for (int i = 1; i < v.length; i++) {
      m = Math.max(m, v[i]);
    }
    return m;
  }

  /**
   * Returns the minimum value in the array.
   *
   * @param v
   *            the data; must contain at least one element
   * @return the smallest element, as determined by {@link Math#min(double, double)}
   * @throws ArrayIndexOutOfBoundsException
   *             if the array is empty
   */
  public static double min(double[] v) {
    double m = v[0];
    for (int i = 1; i < v.length; i++) {
      m = Math.min(m, v[i]);
    }
    return m;
  }

  /**
   * Prints the mean and standard deviation of the data to the standard
   * output.
   *
   * @param v
   *            contains the data
   */
  public static void analyse(double[] v) {
    analyse(v, System.out);
  }

  /**
   * Prints the mean and standard deviation of the data to the specified
   * PrintStream
   *
   * @param v
   *            contains the data
   * @param s
   *            is the corresponding PrintStream
   */
  public static void analyse(double[] v, PrintStream s) {
    s.println("Average = " + mean(v) + "  sd = " + sdev(v));
  }

  /**
   * Builds a one-line summary of the data.
   *
   * @param v
   *            contains the data; must contain at least one element because
   *            the minimum and maximum are included
   * @return A String summary with the mean, standard deviation, minimum and
   *         maximum of the data.
   * @throws ArrayIndexOutOfBoundsException
   *             if the array is empty
   */
  public static String analysisString(double[] v) {
    return "Average = " + mean(v) + "  sd = " + sdev(v) + "  min = "
        + min(v) + "  max = " + max(v);
  }

  /**
   * Returns a string that compares the root mean square of the data with the
   * standard deviation of the data. This is probably too specialised to be of
   * much general use.
   *
   * @param v
   *            contains the data
   * @return rms = <...> sd = <...>, terminated by a newline
   */
  public static String rmsString(double[] v) {
    double[] tv = new double[v.length];
    for (int i = 0; i < v.length; i++) {
      tv[i] = v[i] * v[i];
    }
    // The square root is what turns the mean of the squares into the root
    // mean square, which is the quantity comparable with the standard
    // deviation.
    double rms = Math.sqrt(mean(tv));
    return "rms = " + rms + " sd = " + sdev(v) + "\n";
  }

  /**
   * Small demonstration: prints the mean of an empty array together with
   * whether it is NaN, then the mean, standard error and standard deviation
   * of zero-filled arrays of length 0, 1 and 2.
   *
   * @param args
   *            ignored
   * @throws java.io.IOException
   *             declared for compatibility with existing callers
   */
  public static void main(String[] args) throws IOException {

    double[] d = new double[0];

    double dd = mean(d);

    System.out.println(dd + "\t" + Double.isNaN(dd));

    for (int i = 0; i < 3; i++) {
      double[] x = new double[i];
      System.out.println(mean(x) + "\t " + stderr(x) + "\t " + sdev(x));
    }
  }

}

Related examples in the same category

1.	Absolute value
2.	Find absolute value of float, int, double and long using Math.abs
3.	Find ceiling value of a number using Math.ceil
4.	Find exponential value of a number using Math.exp
5.	Find floor value of a number using Math.floor
6.	Find minimum of two numbers using Math.min
7.	Find power using Math.pow
8.	Find square root of a number using Math.sqrt
9.	Find natural logarithm value of a number using Math.log
10.	Find maximum of two numbers using Math.max
11.	Get the power value
12.	Using the Math Trig Methods
13.	Using BigDecimal for Precision
14.	Demonstrate our own version round()
15.	Demonstrate a few of the Math functions for Trigonometry
16.	Exponential Demo
17.	Min Demo
18.	Basic Math Demo
19.	Using strict math in applications
20.	Conversion between polar and rectangular coordinates
21.	Using the pow() function
22.	Using strict math at the method level
23.	Calculating hyperbolic functions
24.	Calculating trigonometric functions
25.	Weighted floating-point comparisons
26.	Solving right triangles
27.	Applying the quadratic formula
28.	Calculate the floor of the log, base 2
29.	Greatest Common Divisor (GCD) of positive integer numbers
30.	Least Common Multiple (LCM) of two strictly positive integer numbers
31.	Moving Average
32.	Make Exponention
33.	Calculate the factorial of N
34.	Trigonometric Demo
35.	Complex Number Demo
36.	sqrt(a^2 + b^2) without under/overflow
37.	Returns an integer hash code representing the given double array value.
38.	Returns an integer hash code representing the given double value.
39.	Returns n!. Shorthand for n Factorial, the product of the numbers 1,...,n as a double.
40.	Returns n!. Shorthand for n Factorial, the product of the numbers 1,...,n.
41.	Returns the hyperbolic sine of x.
42.	Contains static definition for matrix math methods.
43.	For a double precision value x, this method returns +1.0 if x >= 0 and -1.0 if x < 0. Returns NaN if x is NaN.
44.	For a float value x, this method returns +1.0F if x >= 0 and -1.0F if x < 0. Returns NaN if x is NaN.
45.	Normalize an angle in a 2π-wide interval around a center value.
46.	Normalizes an angle to a relative angle.
47.	Normalizes an angle to an absolute angle
48.	Normalizes an angle to be near an absolute angle
49.	Returns the natural logarithm of n!.
50.	Returns the least common multiple between two integer values.
51.	Gets the greatest common divisor of the absolute value of two numbers
52.	Matrix manipulation
53.	Returns exact (http://mathworld.wolfram.com/BinomialCoefficient.html) Binomial Coefficient
54.	Returns a double representation of the (http://mathworld.wolfram.com/BinomialCoefficient.html) Binomial Coefficient
55.	Returns the natural log of the (http://mathworld.wolfram.com/BinomialCoefficient.html) Binomial Coefficient
56.	Returns the hyperbolic cosine of x.
57.	Math Utils
58.	Implements the methods which are in the standard J2SE's Math class, but are not in J2ME's.
59.	Utility methods for mathematical problems.
60.	A math utility class with static methods.
61.	Computes the binomial coefficient "n over k"
62.	Log Gamma
63.	Log Beta
64.	Beta
65.	Gamma
66.	Factorial
67.	Computes p(x;n,p) where x~B(n,p)
68.	Returns the sum of two doubles expressed in log space
69.	sigmoid
70.	sigmoid rev
71.	Numbers that are closer than this are considered equal
72.	Returns the KL divergence, K(p1 || p2).
73.	Returns the sum of two doubles expressed in log space
74.	Returns the difference of two doubles expressed in log space
75.	Is Prime
76.	This class calculates the Factorial of a number passed into the program through command line arguments.
77.	Calculates the Greatest Common Divisor of two numbers passed into the program through command line arguments.
78.	Variance: the square of the standard deviation.
79.	Population Standard Deviation
80.	Returns from a static prime table the least prime that is greater than or equal to a specified value.

Statistical functions on arrays of numbers, namely, the mean, variance, standard deviation, covariance, min and max : Math « Development Class « Java

Related examples in the same category