Free cookie consent management tool by TermsFeed Policy Generator

source: branches/HeuristicLab.DataImporter/HeuristicLab.DataImporter.Command/MissingValues/FillMissingValuesWithLinearInterpolation.cs @ 9614

Last change on this file since 9614 was 9614, checked in by mkommend, 11 years ago

#1734: Added StorableConstructor to all storable DataImporter classes.

File size: 4.0 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2012 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System.Collections.Generic;
23using System.Linq;
24using System.Windows.Forms;
25using HeuristicLab.DataImporter.Data;
26using HeuristicLab.DataImporter.Data.CommandBase;
27using HeuristicLab.DataImporter.Data.Model;
28using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
29
namespace HeuristicLab.DataImporter.Command {
  /// <summary>
  /// Command that replaces runs of missing (null) entries in the affected double columns
  /// with values lying on the straight line between the nearest non-null neighbours.
  /// </summary>
  /// <remarks>
  /// Only gaps enclosed by two non-null values are filled; null values before the first
  /// or after the last non-null entry of a column are left as they are.
  /// </remarks>
  [StorableClass]
  [ViewableCommandInfoAttribute("Linear Interpolation", 1, ColumnGroupState.DoubleColumnSelected | ColumnGroupState.AnySelectedColumnContainsNull,
    "Handle Missing Values", Position = 2)]
  public class FillMissingValuesWithLinearInterpolation : FillMissingValueCommandBase {
    /// <summary>
    /// Constructor used by the persistence framework; forwards to the base class.
    /// </summary>
    [StorableConstructor]
    protected FillMissingValuesWithLinearInterpolation(bool deserializing)
      : base(deserializing) {
    }

    /// <summary>
    /// Creates the command for the given columns of a column group.
    /// </summary>
    /// <param name="dataSet">Data set passed through to the base command.</param>
    /// <param name="columnGroupName">Name of the column group passed through to the base command.</param>
    /// <param name="affectedColumns">Indexes of the columns passed through to the base command.</param>
    public FillMissingValuesWithLinearInterpolation(DataSet dataSet, string columnGroupName, int[] affectedColumns)
      : base(dataSet, columnGroupName, affectedColumns) {
    }

    /// <summary>
    /// Short description text of this command.
    /// </summary>
    public override string Description {
      get {
        return "Interpolate missing values";
      }
    }

    /// <summary>
    /// Fills every enclosed gap of null values in each affected double column that contains
    /// null values, and records the row indexes that were filled in <c>nullValues</c>.
    /// </summary>
    public override void Execute() {
      base.Execute();

      // Snapshot the sorting state before any column is touched
      // (presumably consumed by the base class when the command is undone - not visible here).
      oldSortOrder = ColumnGroup.SortOrdersForColumns.ToList();
      oldSortedColumnIndexes = new List<int>(ColumnGroup.SortedColumnIndexes);

      foreach (int col in AffectedColumns) {
        var candidate = ColumnGroup.GetColumn(col);
        if (!(candidate is DoubleColumn) || !candidate.ContainsNullValues) {
          continue;
        }

        DoubleColumn column = (DoubleColumn)ColumnGroup.Columns.ElementAt(col);
        if (column.SortOrder != SortOrder.None) {
          ColumnGroup.ResetSorting();
        }

        List<int> filledRows = new List<int>();
        nullValues.Add(col, filledRows);

        // Walk over consecutive pairs of non-null rows; -1 means "no further non-null row".
        int lower = FindNextNotNullValueIndex(column, -1);
        int upper = FindNextNotNullValueIndex(column, lower);
        while (upper != -1) {
          int missingCount = upper - lower - 1;
          if (missingCount != 0) {
            filledRows.AddRange(Enumerable.Range(lower + 1, missingCount));
            InterpolateValues(column, lower, upper);
          }
          lower = upper;
          upper = FindNextNotNullValueIndex(column, lower);
        }
      }

      ColumnGroup.FireChanged();
      ColumnGroup = null;
    }

    /// <summary>
    /// Searches for the first row after <paramref name="startIndex"/> that holds a non-null value.
    /// </summary>
    /// <param name="column">Column to scan.</param>
    /// <param name="startIndex">Row index after which the search begins; -1 scans from the first row.</param>
    /// <returns>The index of the next non-null row, or -1 if there is none.</returns>
    private int FindNextNotNullValueIndex(DoubleColumn column, int startIndex) {
      for (int row = startIndex + 1; row < column.TotalValuesCount; row++) {
        if (column.GetValue(row) != null) {
          return row;
        }
      }
      return -1;
    }

    /// <summary>
    /// Writes linearly interpolated values into all rows strictly between
    /// <paramref name="startIndex"/> and <paramref name="endIndex"/>.
    /// </summary>
    /// <param name="column">Column whose gap is filled.</param>
    /// <param name="startIndex">Row holding the non-null value that starts the line.</param>
    /// <param name="endIndex">Row holding the non-null value that ends the line.</param>
    /// <exception cref="CommandExecutionException">
    /// Thrown when a row inside the gap already holds a non-null value.
    /// </exception>
    private void InterpolateValues(DoubleColumn column, int startIndex, int endIndex) {
      double first = (double)column.GetValue(startIndex);
      double last = (double)column.GetValue(endIndex);
      int span = endIndex - startIndex;
      double slope = (last - first) / span;

      for (int offset = 1; offset < span; offset++) {
        int row = startIndex + offset;
        if (column.GetValue(row) != null) {
          throw new CommandExecutionException("Tried to manipulate non null value!", this);
        }
        column.ChangeValue(row, first + slope * offset);
      }
    }
  }
}
Note: See TracBrowser for help on using the repository browser.