Free cookie consent management tool by TermsFeed Policy Generator

source: trunk/sources/HeuristicLab.DataAnalysis/3.2/Statistics.cs @ 2535

Last change on this file since 2535 was 2535, checked in by mkommend, 14 years ago

corrected median implementation (ticket #808)

File size: 7.5 KB
RevLine 
#region License Information
/* HeuristicLab
 * Copyright (C) 2002-2008 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
 *
 * This file is part of HeuristicLab.
 *
 * HeuristicLab is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * HeuristicLab is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
 */
#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Text;
25
namespace HeuristicLab.DataAnalysis {
  /// <summary>
  /// Static helper methods for basic descriptive statistics: minimum, maximum, range,
  /// mean, median, standard deviation and variance.
  /// </summary>
  public class Statistics {

    /// <summary>
    /// Returns the smallest entry of <paramref name="values"/>.
    /// </summary>
    /// <typeparam name="T">Comparable value type of the entries.</typeparam>
    /// <param name="values">Sequence to search; must contain at least one entry.</param>
    /// <returns>The entry that compares lowest according to <c>CompareTo</c>.</returns>
    /// <exception cref="InvalidOperationException">Thrown if <paramref name="values"/> is empty.</exception>
    public static T Minimum<T>(IEnumerable<T> values) where T : struct, IComparable, IComparable<T> {
      using (IEnumerator<T> enumerator = values.GetEnumerator()) {
        // Current is undefined after MoveNext() returned false; some enumerators
        // (e.g. the one of List<T>) hand back default(T) instead of throwing.
        // Reject the empty case explicitly so the documented contract always holds.
        if (!enumerator.MoveNext()) {
          throw new InvalidOperationException("Values is empty.");
        }

        T minimum = enumerator.Current;
        while (enumerator.MoveNext()) {
          T current = enumerator.Current;
          if (current.CompareTo(minimum) < 0) {
            minimum = current;
          }
        }
        return minimum;
      }
    }

    /// <summary>
    /// Returns the largest entry of <paramref name="values"/>.
    /// </summary>
    /// <typeparam name="T">Comparable value type of the entries.</typeparam>
    /// <param name="values">Sequence to search; must contain at least one entry.</param>
    /// <returns>The entry that compares highest according to <c>CompareTo</c>.</returns>
    /// <exception cref="InvalidOperationException">Thrown if <paramref name="values"/> is empty.</exception>
    public static T Maximum<T>(IEnumerable<T> values) where T : struct, IComparable, IComparable<T> {
      using (IEnumerator<T> enumerator = values.GetEnumerator()) {
        // See Minimum: reading Current after a failed MoveNext() is undefined,
        // so an empty sequence has to be detected here.
        if (!enumerator.MoveNext()) {
          throw new InvalidOperationException("Values is empty.");
        }

        T maximum = enumerator.Current;
        while (enumerator.MoveNext()) {
          T current = enumerator.Current;
          if (current.CompareTo(maximum) > 0) {
            maximum = current;
          }
        }
        return maximum;
      }
    }

    /// <summary>
    /// Calculates the difference between the largest and the smallest entry of values.
    /// NaN entries are ignored.
    /// </summary>
    /// <param name="values">Array of values.</param>
    /// <returns>Largest minus smallest non-NaN entry.</returns>
    public static double Range(double[] values) {
      return Range(values, 0, values.Length);
    }

    /// <summary>
    /// Calculates the difference between the largest and the smallest entry of values.
    /// NaN entries are ignored.
    /// </summary>
    /// <param name="values">List of values; it is copied into an array first.</param>
    /// <returns>Largest minus smallest non-NaN entry.</returns>
    public static double Range(List<double> values) {
      return Range(values.ToArray(), 0, values.Count);
    }

    /// <summary>
    /// Calculates the difference between the largest and the smallest entry of values
    /// between start and end. NaN entries are ignored.
    /// </summary>
    /// <param name="values">collection of values</param>
    /// <param name="start">start index (inclusive)</param>
    /// <param name="end">end index (exclusive)</param>
    /// <returns>
    /// Largest minus smallest non-NaN entry in the index range. If the range holds no
    /// non-NaN entry the result is negative infinity (the initial bounds are subtracted).
    /// </returns>
    /// <exception cref="InvalidOperationException">
    /// Thrown if start or end lie outside of [0, values.Length] or if start is larger than end.
    /// </exception>
    public static double Range(double[] values, int start, int end) {
      if (start < 0 || start > values.Length || end < 0 || end > values.Length || start > end) {
        throw new InvalidOperationException();
      }

      // Start with inverted bounds so that the first non-NaN entry replaces both of them.
      double minimum = double.PositiveInfinity;
      double maximum = double.NegativeInfinity;
      for (int i = start; i < end; i++) {
        if (!double.IsNaN(values[i])) {
          if (values[i] > maximum) {
            maximum = values[i];
          }
          if (values[i] < minimum) {
            minimum = values[i];
          }
        }
      }
      return (maximum - minimum);
    }

    /// <summary>
    /// Calculates the mean of all values. NaN entries are ignored.
    /// </summary>
    /// <param name="values">List of values; it is copied into an array first.</param>
    /// <returns>Arithmetic mean of the non-NaN entries.</returns>
    public static double Mean(List<double> values) {
      return Mean(values.ToArray(), 0, values.Count);
    }

    /// <summary>
    /// Calculates the mean of all values. NaN entries are ignored.
    /// </summary>
    /// <param name="values">Array of values.</param>
    /// <returns>Arithmetic mean of the non-NaN entries.</returns>
    public static double Mean(double[] values) {
      return Mean(values, 0, values.Length);
    }

    /// <summary>
    /// Calculates the mean of the values between start and end. NaN entries are ignored.
    /// </summary>
    /// <param name="values">Array of values.</param>
    /// <param name="start">start index (inclusive)</param>
    /// <param name="end">end index (exclusive)</param>
    /// <returns>Arithmetic mean of the non-NaN entries in the index range.</returns>
    /// <exception cref="ArgumentException">
    /// Thrown if values is empty, if end is not larger than start,
    /// or if the index range contains only NaN entries.
    /// </exception>
    public static double Mean(double[] values, int start, int end) {
      if (values.Length == 0) throw new ArgumentException("Values is empty.");
      if (end <= start) throw new ArgumentException("End is smaller or equal start");
      double sum = 0.0;
      int n = 0; // number of non-NaN entries that contributed to sum
      for (int i = start; i < end; i++) {
        if (!double.IsNaN(values[i])) {
          sum += values[i];
          n++;
        }
      }
      if (n > 0)
        return sum / n;
      else throw new ArgumentException("Only NaN elements in values");
    }

    /// <summary>
    /// Calculates the median of the values. The input array is not modified; a sorted
    /// copy is used. Unlike Mean, Range and Variance this method does not filter NaN
    /// entries, they take part in the sort like any other entry.
    /// </summary>
    /// <param name="values">Array of values; must not be empty.</param>
    /// <returns>
    /// The middle element of the sorted values if their number is odd,
    /// otherwise the average of the two middle elements.
    /// </returns>
    /// <exception cref="InvalidOperationException">Thrown if values is empty.</exception>
    public static double Median(double[] values) {
      if (values.Length == 0) throw new InvalidOperationException();
      int n = values.Length;
      double[] sortedValues = new double[n];

      Array.Copy(values, sortedValues, n);
      Array.Sort(sortedValues);

      // return the middle element (if n is odd) or the average of the two middle elements if n is even.
      if (n % 2 == 1) {
        return sortedValues[n / 2];
      } else {
        return (sortedValues[(n / 2) - 1] + sortedValues[n / 2]) / 2.0;
      }
    }

    /// <summary>
    /// Calculates the standard deviation of values as the square root of Variance.
    /// </summary>
    /// <param name="values">Array of values.</param>
    /// <returns>Square root of the variance of values.</returns>
    public static double StandardDeviation(double[] values) {
      return Math.Sqrt(Variance(values));
    }

    /// <summary>
    /// Calculates the variance of values. NaN entries are ignored.
    /// </summary>
    /// <param name="values">Array of values.</param>
    /// <returns>Variance of the non-NaN entries (divisor n - 1).</returns>
    public static double Variance(double[] values) {
      return Variance(values, 0, values.Length);
    }

    /// <summary>
    /// Calculates the variance of the entries of values between start and end.
    /// NaN entries are ignored; the sum of squared deviations is divided by n - 1,
    /// where n is the number of non-NaN entries.
    /// </summary>
    /// <param name="values">Array of values.</param>
    /// <param name="start">start index (inclusive)</param>
    /// <param name="end">end index (exclusive)</param>
    /// <returns>
    /// 0.0 if the index range covers exactly one entry, otherwise the variance of the
    /// non-NaN entries in the index range.
    /// </returns>
    /// <exception cref="ArgumentException">
    /// Thrown if values is empty, if end is not larger than start, or if a range of
    /// more than one entry contains fewer than two non-NaN entries.
    /// </exception>
    public static double Variance(double[] values, int start, int end) {
      if (values.Length == 0) throw new ArgumentException("Values is empty.");
      if (end <= start) throw new ArgumentException("End is smaller or equal start");
      if (end - start == 1)
        return 0.0;

      // Mean throws if the range contains only NaN entries.
      double mean = Mean(values, start, end);
      double squaredErrorsSum = 0.0;

      int n = 0; // number of non-NaN entries
      for (int i = start; i < end; i++) {
        if (!double.IsNaN(values[i])) {
          double d = values[i] - mean;
          squaredErrorsSum += d * d;
          n++;
        }
      }
      if (n < 2) {
        throw new ArgumentException("Only one non-NaN element in values");
      }
      return squaredErrorsSum / (n - 1);
    }
  }
}
Note: See TracBrowser for help on using the repository browser.