Free cookie consent management tool by TermsFeed Policy Generator

source: branches/2994-AutoDiffForIntervals/HeuristicLab.Problems.DataAnalysis.Views/3.4/Classification/ClassificationSolutionVariableImpactsView.cs @ 17399

Last change on this file since 17399 was 17312, checked in by gkronber, 5 years ago

#2994: merged r17220:17306 from trunk to branch

File size: 10.4 KB
RevLine 
#region License Information
/* HeuristicLab
 * Copyright (C) Heuristic and Evolutionary Algorithms Laboratory (HEAL)
 *
 * This file is part of HeuristicLab.
 *
 * HeuristicLab is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * HeuristicLab is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
 */
#endregion
[15667]21
[14348]22using System;
[15667]23using System.Collections.Generic;
[14348]24using System.Linq;
[15753]25using System.Threading;
26using System.Threading.Tasks;
[15667]27using HeuristicLab.Common;
[14348]28using HeuristicLab.Data;
29using HeuristicLab.MainForm;
30
namespace HeuristicLab.Problems.DataAnalysis.Views {
  /// <summary>
  /// View that displays the impact of each input variable of an <see cref="IClassificationSolution"/>.
  /// The impacts are calculated on a background task (with a progress indicator) and can be
  /// re-sorted without recalculation.
  /// </summary>
  [View("Variable Impacts")]
  [Content(typeof(IClassificationSolution))]
  public partial class ClassificationSolutionVariableImpactsView : DataAnalysisSolutionEvaluationView {
    /// <summary>Criteria by which the displayed impacts can be ordered.</summary>
    private enum SortingCriteria {
      ImpactValue,
      Occurrence,
      VariableName
    }

    //Cancellation source of the most recently started impact calculation
    private CancellationTokenSource cancellationToken = new CancellationTokenSource();
    //Impacts in the order in which they were calculated; UpdateOrdering derives the displayed order from this list
    private List<Tuple<string, double>> rawVariableImpacts = new List<Tuple<string, double>>();
    //True while a progress shown by this view has not been hidden again
    private bool attachedToProgress = false;

    /// <summary>The classification solution whose variable impacts are shown.</summary>
    public new IClassificationSolution Content {
      get { return (IClassificationSolution)base.Content; }
      set { base.Content = value; }
    }

    /// <summary>Creates the view and selects the default entries of all combo boxes.</summary>
    public ClassificationSolutionVariableImpactsView()
      : base() {
      InitializeComponent();

      //Set the default values
      this.dataPartitionComboBox.SelectedIndex = 0;
      this.replacementComboBox.SelectedIndex = 3;
      this.factorVarReplComboBox.SelectedIndex = 0;
      this.sortByComboBox.SelectedItem = SortingCriteria.ImpactValue;
    }

    protected override void RegisterContentEvents() {
      base.RegisterContentEvents();
      Content.ModelChanged += Content_ModelChanged;
      Content.ProblemDataChanged += Content_ProblemDataChanged;
    }
    protected override void DeregisterContentEvents() {
      base.DeregisterContentEvents();
      Content.ModelChanged -= Content_ModelChanged;
      Content.ProblemDataChanged -= Content_ProblemDataChanged;
    }

    protected virtual void Content_ProblemDataChanged(object sender, EventArgs e) {
      OnContentChanged();
    }
    protected virtual void Content_ModelChanged(object sender, EventArgs e) {
      OnContentChanged();
    }

    /// <summary>
    /// Discards the cached impacts and either clears the view (no content) or starts a new calculation.
    /// </summary>
    protected override void OnContentChanged() {
      base.OnContentChanged();
      rawVariableImpacts.Clear();

      if (Content == null) {
        variableImpactsArrayView.Content = null;
      } else {
        UpdateVariableImpact();
      }
    }

    /// <summary>
    /// Cancels a running calculation and hides the progress when the view is hidden.
    /// </summary>
    protected override void OnHidden(EventArgs e) {
      base.OnHidden(e);
      cancellationToken.Cancel();

      if (attachedToProgress) {
        Progress.Hide(this);
        attachedToProgress = false;
      }
    }

    private void dataPartitionComboBox_SelectedIndexChanged(object sender, EventArgs e) {
      rawVariableImpacts.Clear();
      UpdateVariableImpact();
    }
    private void replacementComboBox_SelectedIndexChanged(object sender, EventArgs e) {
      rawVariableImpacts.Clear();
      UpdateVariableImpact();
    }
    private void sortByComboBox_SelectedIndexChanged(object sender, EventArgs e) {
      //Without a selection there is nothing to sort by; bail out before the handler is detached,
      //otherwise unboxing the null selection would throw and leave the handler detached
      if (sortByComboBox.SelectedItem == null) { return; }

      //Update the default ordering (asc,desc), but remove the eventHandler beforehand (otherwise the data would be ordered twice)
      ascendingCheckBox.CheckedChanged -= ascendingCheckBox_CheckedChanged;
      ascendingCheckBox.Checked = (SortingCriteria)sortByComboBox.SelectedItem != SortingCriteria.ImpactValue;
      ascendingCheckBox.CheckedChanged += ascendingCheckBox_CheckedChanged;

      UpdateOrdering();
    }
    private void ascendingCheckBox_CheckedChanged(object sender, EventArgs e) {
      UpdateOrdering();
    }

    /// <summary>
    /// Starts the calculation of the variable impacts for the current content and combo box
    /// selection on a background task and shows the result once it has finished.
    /// A calculation that is still running is cancelled; its result is discarded.
    /// </summary>
    private async void UpdateVariableImpact() {
      //Check if the selection is valid
      if (Content == null) { return; }
      if (replacementComboBox.SelectedIndex < 0) { return; }
      if (dataPartitionComboBox.SelectedIndex < 0) { return; }
      if (factorVarReplComboBox.SelectedIndex < 0) { return; }

      //Prepare arguments
      var replMethod = (ClassificationSolutionVariableImpactsCalculator.ReplacementMethodEnum)replacementComboBox.Items[replacementComboBox.SelectedIndex];
      var factorReplMethod = (ClassificationSolutionVariableImpactsCalculator.FactorReplacementMethodEnum)factorVarReplComboBox.Items[factorVarReplComboBox.SelectedIndex];
      var dataPartition = (ClassificationSolutionVariableImpactsCalculator.DataPartitionEnum)dataPartitionComboBox.SelectedItem;

      //Capture the content on the UI thread so the background task does not read the view's property
      var solution = Content;

      variableImpactsArrayView.Caption = solution.Name + " Variable Impacts";
      IProgress progress = Progress.Show(this, "Calculating variable impacts for " + solution.Name);
      attachedToProgress = true;

      //Stop a calculation that is still running; its result would belong to outdated settings
      cancellationToken.Cancel();
      var currentRun = new CancellationTokenSource();
      cancellationToken = currentRun;

      try {
        var problemData = solution.ProblemData;
        var inputvariables = new HashSet<string>(problemData.AllowedInputVariables.Union(solution.Model.VariablesUsedForPrediction));
        //Remember the original ordering of the variables
        var originalVariableOrdering = problemData.Dataset.VariableNames
          .Where(v => inputvariables.Contains(v))
          .Where(v => problemData.Dataset.VariableHasType<double>(v) || problemData.Dataset.VariableHasType<string>(v))
          .ToList();

        var impacts = await Task.Run(() => CalculateVariableImpacts(originalVariableOrdering, solution.Model, problemData, solution.EstimatedClassValues, dataPartition, replMethod, factorReplMethod, currentRun.Token, progress));

        //null signals a cancelled calculation; a run that was cancelled just after finishing is dropped as well
        if (impacts == null || currentRun.IsCancellationRequested) { return; }

        rawVariableImpacts.AddRange(impacts);
        UpdateOrdering();
      } finally {
        //A superseded run must not hide the progress that belongs to its successor
        if (attachedToProgress && ReferenceEquals(cancellationToken, currentRun)) {
          Progress.Hide(this);
          attachedToProgress = false;
        }
      }
    }

    /// <summary>
    /// Calculates the impact of every variable in <paramref name="originalVariableOrdering"/> and
    /// reports the advance via <paramref name="progress"/>. Variables that the model does not use
    /// for prediction get an impact of zero.
    /// </summary>
    /// <returns>
    /// One (variable name, impact) tuple per variable in the given order,
    /// or <c>null</c> if cancellation was requested via <paramref name="token"/>.
    /// </returns>
    private List<Tuple<string, double>> CalculateVariableImpacts(List<string> originalVariableOrdering,
      IClassificationModel model,
      IClassificationProblemData problemData,
      IEnumerable<double> estimatedClassValues,
      ClassificationSolutionVariableImpactsCalculator.DataPartitionEnum dataPartition,
      ClassificationSolutionVariableImpactsCalculator.ReplacementMethodEnum replMethod,
      ClassificationSolutionVariableImpactsCalculator.FactorReplacementMethodEnum factorReplMethod,
      CancellationToken token,
      IProgress progress) {
      List<Tuple<string, double>> impacts = new List<Tuple<string, double>>();
      int count = originalVariableOrdering.Count;
      int i = 0;
      var modifiableDataset = ((Dataset)(problemData.Dataset).Clone()).ToModifiable();
      IEnumerable<int> rows = ClassificationSolutionVariableImpactsCalculator.GetPartitionRows(dataPartition, problemData);

      //Calculate the quality of the unmodified model on the selected partition (the measure is defined by the calculator)
      IEnumerable<double> targetValuesPartition = problemData.Dataset.GetDoubleValues(problemData.TargetVariable, rows);
      //NOTE(review): this still reads Content on the worker thread and the estimatedClassValues parameter is unused - confirm whether the estimates can be derived from the arguments instead
      IEnumerable<double> estimatedClassValuesPartition = Content.GetEstimatedClassValues(rows);

      var originalCalculatorValue = ClassificationSolutionVariableImpactsCalculator.CalculateQuality(targetValuesPartition, estimatedClassValuesPartition);
      var clonedModel = (IClassificationModel)model.Clone();
      foreach (var variableName in originalVariableOrdering) {
        //Use the token of this run; the field of the view may already belong to a newer calculation
        if (token.IsCancellationRequested) { return null; }
        progress.ProgressValue = (double)++i / count;
        progress.Message = string.Format("Calculating impact for variable {0} ({1} of {2})", variableName, i, count);

        double impact = 0;
        //If the variable isn't used for prediction, it has zero impact.
        if (model.VariablesUsedForPrediction.Contains(variableName)) {
          impact = ClassificationSolutionVariableImpactsCalculator.CalculateImpact(variableName, clonedModel, problemData, modifiableDataset, rows, replMethod, factorReplMethod, targetValuesPartition, originalCalculatorValue);
        }
        impacts.Add(new Tuple<string, double>(variableName, impact));
      }

      return impacts;
    }

    /// <summary>
    /// Updates the <see cref="variableImpactsArrayView"/> according to the selected ordering <see cref="ascendingCheckBox"/> of the selected Column <see cref="sortByComboBox"/>
    /// The default is "Descending" by "VariableImpact" (as in previous versions)
    /// </summary>
    private void UpdateOrdering() {
      //Check if valid sortingCriteria is selected and data exists
      if (sortByComboBox.SelectedIndex == -1) { return; }
      if (rawVariableImpacts == null) { return; }
      if (rawVariableImpacts.Count == 0) { return; }

      var selectedItem = (SortingCriteria)sortByComboBox.SelectedItem;
      bool ascending = ascendingCheckBox.Checked;

      IEnumerable<Tuple<string, double>> sortedEntries = null;

      //Sort accordingly
      switch (selectedItem) {
        case SortingCriteria.ImpactValue:
          sortedEntries = rawVariableImpacts.OrderBy(v => v.Item2);
          break;
        case SortingCriteria.Occurrence:
          sortedEntries = rawVariableImpacts;
          break;
        case SortingCriteria.VariableName:
          sortedEntries = rawVariableImpacts.OrderBy(v => v.Item1, new NaturalStringComparer());
          break;
        default:
          throw new NotImplementedException("Ordering for selected SortingCriteria not implemented");
      }

      //Materialize once: the entries are read twice below and the copy keeps rawVariableImpacts untouched when reversing
      var orderedEntries = sortedEntries.ToList();
      if (!ascending) { orderedEntries.Reverse(); }

      //Write the data back
      var impactArray = new DoubleArray(orderedEntries.Select(entry => entry.Item2).ToArray()) {
        ElementNames = orderedEntries.Select(entry => entry.Item1).ToList()
      };

      //Could be, if the View was closed
      if (!variableImpactsArrayView.IsDisposed) {
        variableImpactsArrayView.Content = (DoubleArray)impactArray.AsReadOnly();
      }
    }
  }
}
Note: See TracBrowser for help on using the repository browser.