Free cookie consent management tool by TermsFeed Policy Generator

source: branches/crossvalidation-2434/HeuristicLab.Analysis.Statistics.Views/3.3/StatisticalTestsView.cs @ 14029

Last change on this file since 14029 was 12869, checked in by gkronber, 9 years ago

#2434: merged r12835:12868 from trunk to cross-validation branch

File size: 19.5 KB
RevLine 
[9353]1#region License Information
2/* HeuristicLab
[12012]3 * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
[9353]4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Linq;
[9913]25using System.Threading.Tasks;
[9353]26using System.Windows.Forms;
[9937]27using HeuristicLab.Collections;
[11693]28using HeuristicLab.Common;
[12684]29using HeuristicLab.Common.Resources;
[9353]30using HeuristicLab.Core.Views;
31using HeuristicLab.Data;
32using HeuristicLab.MainForm;
33using HeuristicLab.Optimization;
34using HeuristicLab.Optimization.Views;
35
[11705]36namespace HeuristicLab.Analysis.Statistics.Views {
37  [View("Statistical Tests", "HeuristicLab.Analysis.Statistics.Views.InfoResources.StatisticalTestsInfo.rtf")]
[9353]38  [Content(typeof(RunCollection), false)]
[11693]39  public sealed partial class StatisticalTestsView : ItemView, IConfigureableView {
40    private double significanceLevel = 0.05;
[11612]41    private const int requiredSampleSize = 5;
[9353]42    private double[][] data;
[12684]43    private bool suppressUpdates;
44    private bool initializing;
[9353]45
[11693]46    public double SignificanceLevel {
47      get { return significanceLevel; }
48      set {
49        if (!significanceLevel.IsAlmost(value)) {
50          significanceLevel = value;
51          ResetUI();
52          CalculateValues();
53        }
54      }
[9353]55    }
56
57    public new RunCollection Content {
58      get { return (RunCollection)base.Content; }
59      set { base.Content = value; }
60    }
61
62    public override bool ReadOnly {
63      get { return true; }
64      set { /*not needed because results are always readonly */}
65    }
66
[11693]67    public StatisticalTestsView() {
68      InitializeComponent();
69    }
70
71    public void ShowConfiguration() {
72      using (StatisticalTestsConfigurationDialog dlg = new StatisticalTestsConfigurationDialog(this)) {
73        dlg.ShowDialog(this);
74      }
75    }
76
[9353]77    protected override void OnContentChanged() {
78      base.OnContentChanged();
79
80      if (Content != null) {
[12684]81        UpdateUI();
82      } else {
[12613]83        ResetUI();
[9353]84      }
[9911]85      UpdateCaption();
[9353]86    }
87
[12684]88    private void UpdateUI() {
89      initializing = true;
90      UpdateResultComboBox();
91      UpdateGroupsComboBox();
92      RebuildDataTable();
93      FillCompComboBox();
94      ResetUI();
95      CalculateValues();
96      initializing = false;
97    }
98
[9911]99    private void UpdateCaption() {
[9913]100      Caption = Content != null ? Content.OptimizerName + " Statistical Tests" : ViewAttribute.GetViewName(GetType());
[9911]101    }
102
[9353]103    #region events
104    protected override void RegisterContentEvents() {
105      base.RegisterContentEvents();
[11696]106      Content.ColumnsChanged += Content_ColumnsChanged;
107      Content.RowsChanged += Content_RowsChanged;
[12684]108      Content.CollectionReset += Content_CollectionReset;
[9911]109      Content.UpdateOfRunsInProgressChanged += Content_UpdateOfRunsInProgressChanged;
[9353]110    }
111
112    protected override void DeregisterContentEvents() {
113      base.DeregisterContentEvents();
[11696]114      Content.ColumnsChanged -= Content_ColumnsChanged;
115      Content.RowsChanged -= Content_RowsChanged;
[12684]116      Content.CollectionReset -= Content_CollectionReset;
[9911]117      Content.UpdateOfRunsInProgressChanged -= Content_UpdateOfRunsInProgressChanged;
[9353]118    }
[9911]119
[11696]120    void Content_RowsChanged(object sender, EventArgs e) {
[12599]121      if (suppressUpdates) return;
122      if (InvokeRequired) Invoke((Action<object, EventArgs>)Content_RowsChanged, sender, e);
123      else {
[12684]124        UpdateUI();
[12599]125      }
[9911]126    }
127
[11696]128    void Content_ColumnsChanged(object sender, EventArgs e) {
[12599]129      if (suppressUpdates) return;
130      if (InvokeRequired) Invoke((Action<object, EventArgs>)Content_ColumnsChanged, sender, e);
131      else {
[12684]132        UpdateUI();
[12116]133      }
[9911]134    }
135
[11696]136    private void Content_CollectionReset(object sender, CollectionItemsChangedEventArgs<IRun> e) {
[12599]137      if (suppressUpdates) return;
138      if (InvokeRequired) Invoke((Action<object, CollectionItemsChangedEventArgs<IRun>>)Content_CollectionReset, sender, e);
139      else {
[12684]140        UpdateUI();
[12599]141      }
[9911]142    }
143
144    void Content_UpdateOfRunsInProgressChanged(object sender, EventArgs e) {
[12599]145      if (InvokeRequired) Invoke((Action<object, EventArgs>)Content_UpdateOfRunsInProgressChanged, sender, e);
146      else {
147        suppressUpdates = Content.UpdateOfRunsInProgress;
[12684]148        if (!suppressUpdates) UpdateUI();
[9911]149      }
150    }
[12613]151
152    private void openBoxPlotToolStripMenuItem_Click(object sender, EventArgs e) {
153      RunCollectionBoxPlotView boxplotView = new RunCollectionBoxPlotView();
154      boxplotView.Content = Content;
155      boxplotView.SetXAxis(groupComboBox.SelectedItem.ToString());
156      boxplotView.SetYAxis(resultComboBox.SelectedItem.ToString());
157
158      boxplotView.Show();
159    }
160
161    private void groupCompComboBox_SelectedValueChanged(object sender, EventArgs e) {
[12684]162      if (initializing || suppressUpdates) return;
[12613]163      string curItem = (string)groupCompComboBox.SelectedItem;
164      CalculatePairwise(curItem);
165    }
166
167    private void resultComboBox_SelectedValueChanged(object sender, EventArgs e) {
[12684]168      if (initializing || suppressUpdates) return;
[12613]169      RebuildDataTable();
170      ResetUI();
171      CalculateValues();
172    }
173
174    private void groupComboBox_SelectedValueChanged(object sender, EventArgs e) {
[12684]175      if (initializing || suppressUpdates) return;
[12613]176      RebuildDataTable();
177      FillCompComboBox();
178      ResetUI();
179      CalculateValues();
180    }
[9353]181    #endregion
182
183    private void UpdateGroupsComboBox() {
[12684]184      string selectedItem = (string)groupComboBox.SelectedItem;
185
[9353]186      groupComboBox.Items.Clear();
187      var parameters = (from run in Content
188                        where run.Visible
189                        from param in run.Parameters
190                        select param.Key).Distinct().ToArray();
191
192      foreach (var p in parameters) {
193        var variations = (from run in Content
194                          where run.Visible && run.Parameters.ContainsKey(p) &&
195                          (run.Parameters[p] is IntValue || run.Parameters[p] is DoubleValue ||
196                          run.Parameters[p] is StringValue || run.Parameters[p] is BoolValue)
197                          select ((dynamic)run.Parameters[p]).Value).Distinct();
198
199        if (variations.Count() > 1) {
200          groupComboBox.Items.Add(p);
201        }
202      }
203
204      if (groupComboBox.Items.Count > 0) {
205        //try to select something different than "Seed" or "Algorithm Name" as this makes no sense
206        //and takes a long time to group
207        List<int> possibleIndizes = new List<int>();
208        for (int i = 0; i < groupComboBox.Items.Count; i++) {
209          if (groupComboBox.Items[i].ToString() != "Seed"
210            && groupComboBox.Items[i].ToString() != "Algorithm Name") {
211            possibleIndizes.Add(i);
212          }
213        }
214
[12684]215        if (selectedItem != null && groupComboBox.Items.Contains(selectedItem)) {
216          groupComboBox.SelectedItem = selectedItem;
217        } else if (possibleIndizes.Count > 0) {
[9353]218          groupComboBox.SelectedItem = groupComboBox.Items[possibleIndizes.First()];
219        }
220      }
221    }
222
223    private string[] GetColumnNames(IEnumerable<IRun> runs) {
224      string parameterName = (string)groupComboBox.SelectedItem;
225      var r = runs.Where(x => x.Parameters.ContainsKey(parameterName));
226      return r.Select(x => ((dynamic)x.Parameters[parameterName]).Value).Distinct().Select(x => (string)x.ToString()).ToArray();
227    }
228
229    private void UpdateResultComboBox() {
[12684]230      string selectedItem = (string)resultComboBox.SelectedItem;
231
[9353]232      resultComboBox.Items.Clear();
233      var results = (from run in Content
234                     where run.Visible
235                     from result in run.Results
236                     where result.Value is IntValue || result.Value is DoubleValue
237                     select result.Key).Distinct().ToArray();
238
239      resultComboBox.Items.AddRange(results);
[12684]240
241      if (selectedItem != null && resultComboBox.Items.Contains(selectedItem)) {
242        resultComboBox.SelectedItem = selectedItem;
243      } else if (resultComboBox.Items.Count > 0) {
244        resultComboBox.SelectedItem = resultComboBox.Items[0];
245      }
[9353]246    }
247
[9389]248    private void FillCompComboBox() {
[12684]249      string selectedItem = (string)groupCompComboBox.SelectedItem;
[9389]250      string parameterName = (string)groupComboBox.SelectedItem;
251      if (parameterName != null) {
252        string resultName = (string)resultComboBox.SelectedItem;
253        if (resultName != null) {
254          var runs = Content.Where(x => x.Results.ContainsKey(resultName) && x.Visible);
255          var columnNames = GetColumnNames(runs).ToList();
256          groupCompComboBox.Items.Clear();
257          columnNames.ForEach(x => groupCompComboBox.Items.Add(x));
[12684]258          if (selectedItem != null && groupCompComboBox.Items.Contains(selectedItem)) {
259            groupCompComboBox.SelectedItem = selectedItem;
260          } else if (groupCompComboBox.Items.Count > 0) {
261            groupCompComboBox.SelectedItem = groupCompComboBox.Items[0];
262          }
[9389]263        }
264      }
265    }
266
[9353]267    private void RebuildDataTable() {
268      string parameterName = (string)groupComboBox.SelectedItem;
269      if (parameterName != null) {
270        string resultName = (string)resultComboBox.SelectedItem;
271
272        var runs = Content.Where(x => x.Results.ContainsKey(resultName) && x.Visible);
273        var columnNames = GetColumnNames(runs);
274        var groups = GetGroups(columnNames, runs);
275        data = new double[columnNames.Count()][];
276
[12869]277        if (!groups.Any() || !columnNames.Any()) {
278          return;
279        }
280
[9353]281        DoubleMatrix dt = new DoubleMatrix(groups.Select(x => x.Count()).Max(), columnNames.Count());
282        dt.ColumnNames = columnNames;
[9937]283        DataTable histogramDataTable = new DataTable(resultName);
[9353]284
[9937]285        for (int i = 0; i < columnNames.Count(); i++) {
286          int j = 0;
[9353]287          data[i] = new double[groups[i].Count()];
[9937]288          DataRow row = new DataRow(columnNames[i]);
289          row.VisualProperties.ChartType = DataRowVisualProperties.DataRowChartType.Histogram;
290          histogramDataTable.Rows.Add(row);
291
[9353]292          foreach (IRun run in groups[i]) {
293            dt[j, i] = (double)((dynamic)run.Results[resultName]).Value;
294            data[i][j] = dt[j, i];
[9937]295            row.Values.Add(dt[j, i]);
[9353]296            j++;
297          }
298        }
299
[11611]300        GenerateChart(histogramDataTable);
[9353]301        stringConvertibleMatrixView.Content = dt;
302      }
303    }
304
[11611]305    private void GenerateChart(DataTable histogramTable) {
[11837]306      histogramControl.ClearPoints();
[11611]307      foreach (var row in histogramTable.Rows) {
[11612]308        histogramControl.AddPoints(row.Name, row.Values, true);
[11611]309      }
310    }
311
[9353]312    private List<IEnumerable<IRun>> GetGroups(string[] columnNames, IEnumerable<IRun> runs) {
313      List<IEnumerable<IRun>> runCols = new List<IEnumerable<IRun>>();
314      string parameterName = (string)groupComboBox.SelectedItem;
315
316      foreach (string cn in columnNames) {
[12869]317        var tmpRuns = runs.Where(x =>
318        x.Parameters.ContainsKey(parameterName) &&
319        (((string)((dynamic)x.Parameters[parameterName]).Value.ToString()) == cn));
[9353]320        runCols.Add(tmpRuns);
321      }
322
323      return runCols;
324    }
325
[9389]326    private void ResetUI() {
327      normalityLabel.Image = null;
[11695]328      normalityTextLabel.Text = string.Empty;
[9389]329      groupCompLabel.Image = null;
[11695]330      groupComTextLabel.Text = string.Empty;
[9749]331      pairwiseLabel.Image = null;
[11695]332      pairwiseTextLabel.Text = string.Empty;
333
[9389]334      pValTextBox.Text = string.Empty;
335      equalDistsTextBox.Text = string.Empty;
336    }
337
[9937]338    private bool VerifyDataLength(bool showMessage) {
[12869]339      if (data == null || data.Length < 2)
[9937]340        return false;
341
342      //alglib needs at least 5 samples for computation
[12131]343      if (data.Any(x => x.Length < requiredSampleSize)) {
[9937]344        if (showMessage)
[11695]345          MessageBox.Show(this, "You need at least " + requiredSampleSize
346            + " samples per group for computing hypothesis tests.", "HeuristicLab", MessageBoxButtons.OK,
[9937]347            MessageBoxIcon.Error);
348        return false;
349      }
350      return true;
351    }
352
[9913]353    private void CalculateValues() {
[9937]354      if (!VerifyDataLength(true))
355        return;
356
[12116]357      if (data != null && data.All(x => x != null)) {
[12684]358        MainFormManager.GetMainForm<MainForm.WindowsForms.MainForm>()
[9922]359          .AddOperationProgressToView(this, "Calculating...");
[9923]360
361        string curItem = (string)groupCompComboBox.SelectedItem;
362        Task.Factory.StartNew(() => CalculateValuesAsync(curItem));
[9922]363      }
[9913]364    }
365
[9923]366    private void CalculateValuesAsync(string groupName) {
[11696]367      CalculateAllGroupsTest();
368      CalculateNormalityTest();
[9923]369      CalculatePairwiseTest(groupName);
[9913]370
[12684]371      MainFormManager.GetMainForm<MainForm.WindowsForms.MainForm>().RemoveOperationProgressFromView(this);
[9913]372    }
373
[9923]374    private void CalculatePairwise(string groupName) {
[12684]375      if (groupName == null) return;
[9937]376      if (!VerifyDataLength(false))
377        return;
378
[12684]379      MainFormManager.GetMainForm<MainForm.WindowsForms.MainForm>().AddOperationProgressToView(pairwiseTestGroupBox, "Calculating...");
[9923]380      Task.Factory.StartNew(() => CalculatePairwiseAsync(groupName));
[9913]381    }
382
[9923]383    private void CalculatePairwiseAsync(string groupName) {
384      CalculatePairwiseTest(groupName);
[9913]385
[12684]386      MainFormManager.GetMainForm<MainForm.WindowsForms.MainForm>().RemoveOperationProgressFromView(pairwiseTestGroupBox);
[9913]387    }
388
[11696]389    private void CalculateAllGroupsTest() {
[11692]390      double pval = KruskalWallisTest.Test(data);
[12690]391      DisplayAllGroupsTextResults(pval);
392    }
393
394    private void DisplayAllGroupsTextResults(double pval) {
395      if (InvokeRequired) {
396        Invoke((Action<double>)DisplayAllGroupsTextResults, pval);
397      } else {
398        pValTextBox.Text = pval.ToString();
399        if (pval < significanceLevel) {
[12684]400          groupCompLabel.Image = VSImageLibrary.Default;
[11695]401          groupComTextLabel.Text = "There are groups with different distributions";
[12690]402        } else {
[12684]403          groupCompLabel.Image = VSImageLibrary.Warning;
[11695]404          groupComTextLabel.Text = "Groups have an equal distribution";
[12690]405        }
[9389]406      }
[9353]407    }
408
[11696]409    private void CalculateNormalityTest() {
[9353]410      double val;
411      List<double> res = new List<double>();
[11696]412      DoubleMatrix pValsMatrix = new DoubleMatrix(1, stringConvertibleMatrixView.Content.Columns);
413      pValsMatrix.ColumnNames = stringConvertibleMatrixView.Content.ColumnNames;
[12684]414      pValsMatrix.RowNames = new[] { "p-Value" };
[9353]415
416      for (int i = 0; i < data.Length; i++) {
417        alglib.jarqueberatest(data[i], data[i].Length, out val);
418        res.Add(val);
[11696]419        pValsMatrix[0, i] = val;
[9353]420      }
421
[11696]422      // p-value is below significance level and thus the null hypothesis (data is normally distributed) is rejected
[9950]423      if (res.Any(x => x < significanceLevel)) {
[12684]424        Invoke(new Action(() => {
425          normalityLabel.Image = VSImageLibrary.Warning;
[11695]426          normalityTextLabel.Text = "Some groups may not be normally distributed";
427        }));
[9936]428      } else {
[12684]429        Invoke(new Action(() => {
430          normalityLabel.Image = VSImageLibrary.Default;
[11695]431          normalityTextLabel.Text = "All sample data is normally distributed";
432        }));
[9353]433      }
434
[12684]435      Invoke(new Action(() => {
[11601]436        normalityStringConvertibleMatrixView.Content = pValsMatrix;
437        normalityStringConvertibleMatrixView.DataGridView.AutoResizeColumns(DataGridViewAutoSizeColumnsMode.AllCells);
438      }));
[9353]439    }
440
[11696]441    private void ShowPairwiseResult(int nrOfEqualDistributions) {
442      double ratio = ((double)nrOfEqualDistributions) / (data.Length - 1) * 100.0;
[12684]443      equalDistsTextBox.Text = ratio + " %";
[9913]444
[11696]445      if (nrOfEqualDistributions == 0) {
[12684]446        Invoke(new Action(() => {
447          pairwiseLabel.Image = VSImageLibrary.Default;
[11695]448          pairwiseTextLabel.Text = "All groups have different distributions";
449        }));
[9913]450      } else {
[12684]451        Invoke(new Action(() => {
452          pairwiseLabel.Image = VSImageLibrary.Warning;
[11695]453          pairwiseTextLabel.Text = "Some groups have equal distributions";
454        }));
[9913]455      }
456    }
457
[11696]458    private void CalculatePairwiseTest(string groupName) {
459      var columnNames = stringConvertibleMatrixView.Content.ColumnNames.ToList();
460      int colIndex = columnNames.IndexOf(groupName);
461      columnNames = columnNames.Where(x => x != groupName).ToList();
[9957]462
463      double[][] newData = FilterDataForPairwiseTest(colIndex);
464
[12869]465      var rowNames = new[] { "p-Value of Mann-Whitney U", "Adjusted p-Value of Mann-Whitney U",
[11691]466            "p-Value of T-Test", "Adjusted p-Value of T-Test", "Cohen's d", "Hedges' g" };
[9950]467
[9957]468      DoubleMatrix pValsMatrix = new DoubleMatrix(rowNames.Length, columnNames.Count());
469      pValsMatrix.ColumnNames = columnNames;
[9950]470      pValsMatrix.RowNames = rowNames;
[9353]471
[11696]472      double mwuBothTails;
[11691]473      double tTestBothTails;
[9957]474      double[] mwuPValues = new double[newData.Length];
475      double[] tTestPValues = new double[newData.Length];
[9950]476      bool[] decision = null;
477      double[] adjustedMwuPValues = null;
478      double[] adjustedTtestPValues = null;
[11696]479      int cnt = 0;
[9950]480
[9957]481      for (int i = 0; i < newData.Length; i++) {
[11696]482        mwuBothTails = PairwiseTest.MannWhitneyUTest(data[colIndex], newData[i]);
[11692]483        tTestBothTails = PairwiseTest.TTest(data[colIndex], newData[i]);
[11696]484        mwuPValues[i] = mwuBothTails;
[11692]485        tTestPValues[i] = tTestBothTails;
[11696]486
487        if (mwuBothTails > significanceLevel) {
488          cnt++;
489        }
[9353]490      }
491
[9950]492      adjustedMwuPValues = BonferroniHolm.Calculate(significanceLevel, mwuPValues, out decision);
493      adjustedTtestPValues = BonferroniHolm.Calculate(significanceLevel, tTestPValues, out decision);
494
[9957]495      for (int i = 0; i < newData.Length; i++) {
[11692]496        pValsMatrix[0, i] = mwuPValues[i];
497        pValsMatrix[1, i] = adjustedMwuPValues[i];
498        pValsMatrix[2, i] = tTestPValues[i];
499        pValsMatrix[3, i] = adjustedTtestPValues[i];
500        pValsMatrix[4, i] = SampleSizeDetermination.CalculateCohensD(data[colIndex], newData[i]);
501        pValsMatrix[5, i] = SampleSizeDetermination.CalculateHedgesG(data[colIndex], newData[i]);
[9950]502      }
503
[12684]504      Invoke(new Action(() => {
[11601]505        pairwiseStringConvertibleMatrixView.Content = pValsMatrix;
506        pairwiseStringConvertibleMatrixView.DataGridView.AutoResizeColumns(DataGridViewAutoSizeColumnsMode.AllCells);
507      }));
[11696]508
509      ShowPairwiseResult(cnt);
[9353]510    }
511
[11696]512    private double[][] FilterDataForPairwiseTest(int columnToRemove) {
513      double[][] newData = new double[data.Length - 1][];
514
515      int i = 0;
516      int l = 0;
517      while (i < data.Length) {
518        if (i != columnToRemove) {
519          double[] row = new double[data[i].Length - 1];
520          newData[l] = row;
521
522          int j = 0, k = 0;
523          while (j < row.Length) {
524            if (i != columnToRemove) {
525              newData[l][j] = data[i][k];
526              j++;
527              k++;
528            } else {
529              k++;
530            }
531          }
532          i++;
533          l++;
534        } else {
535          i++;
536        }
537      }
538      return newData;
539    }
[9353]540  }
541}
Note: See TracBrowser for help on using the repository browser.