Free cookie consent management tool by TermsFeed Policy Generator

source: branches/HeuristicLab.DataImporter/HeuristicLab.DataImporter.Command/MissingValues/FillMissingValuesWithLinearInterpolation.cs @ 8614

Last change on this file since 8614 was 7267, checked in by gkronber, 13 years ago

#1734 updated copyright year in all files of the DataImporter branch

File size: 4.0 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2012 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Linq;
25using System.Text;
26using System.Windows.Forms;
27using HeuristicLab.DataImporter.Data;
28using HeuristicLab.DataImporter.Data.CommandBase;
29using HeuristicLab.DataImporter.Data.Model;
30using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
31
namespace HeuristicLab.DataImporter.Command {
  /// <summary>
  /// Command that fills runs of missing (null) values in the affected double columns by
  /// interpolating linearly between the closest non-null values on either side of each run.
  /// </summary>
  /// <remarks>
  /// Only nulls enclosed by two non-null values are filled. Nulls located before the first or
  /// after the last non-null value of a column are left untouched.
  /// </remarks>
  [StorableClass]
  [ViewableCommandInfoAttribute("Linear Interpolation", 1, ColumnGroupState.DoubleColumnSelected | ColumnGroupState.AnySelectedColumnContainsNull,
    "Handle Missing Values", Position = 2)]
  public class FillMissingValuesWithLinearInterpolation : FillMissingValueCommandBase {
    // Parameterless constructor; presumably required by the persistence framework
    // (the class is marked [StorableClass]) - TODO confirm.
    private FillMissingValuesWithLinearInterpolation()
      : base(null, string.Empty, null) {
    }

    /// <summary>
    /// Creates the command for the given data set, column group and column indexes.
    /// All arguments are forwarded unchanged to the base class.
    /// </summary>
    /// <param name="dataSet">Data set passed on to the base command.</param>
    /// <param name="columnGroupName">Name of the column group passed on to the base command.</param>
    /// <param name="affectedColumns">Indexes of the columns this command should process.</param>
    public FillMissingValuesWithLinearInterpolation(DataSet dataSet, string columnGroupName, int[] affectedColumns) :
      base(dataSet, columnGroupName, affectedColumns) {
    }

    /// <summary>Short text describing this command.</summary>
    public override string Description {
      get { return "Interpolate missing values"; }
    }

    /// <summary>
    /// Runs the base command logic, then interpolates every enclosed run of nulls in each
    /// affected column that is a <c>DoubleColumn</c> and reports null values.
    /// </summary>
    /// <remarks>
    /// The current sort order and sorted column indexes are captured before any change is made
    /// (presumably so the base class can restore them on undo - TODO confirm). The row indexes
    /// that get filled are recorded per column in <c>nullValues</c>.
    /// </remarks>
    public override void Execute() {
      base.Execute();
      oldSortOrder = ColumnGroup.SortOrdersForColumns.ToList();
      oldSortedColumnIndexes = new List<int>(ColumnGroup.SortedColumnIndexes);

      foreach (int col in AffectedColumns) {
        // Skip everything that is not a double column containing nulls.
        if (!(ColumnGroup.GetColumn(col) is DoubleColumn)) {
          continue;
        }
        if (!ColumnGroup.GetColumn(col).ContainsNullValues) {
          continue;
        }

        DoubleColumn target = (DoubleColumn)ColumnGroup.Columns.ElementAt(col);
        if (target.SortOrder != SortOrder.None) {
          ColumnGroup.ResetSorting();
        }

        List<int> filledRows = new List<int>();
        nullValues.Add(col, filledRows);

        // Walk over consecutive pairs of non-null rows; whenever the two rows are not
        // adjacent, the rows in between are null and get interpolated.
        int left = FindNextNotNullValueIndex(target, -1);
        for (int right = FindNextNotNullValueIndex(target, left);
             right != -1;
             right = FindNextNotNullValueIndex(target, left)) {
          int gapLength = right - left - 1;
          if (gapLength != 0) {
            filledRows.AddRange(Enumerable.Range(left + 1, gapLength));
            InterpolateValues(target, left, right);
          }
          left = right;
        }
      }

      ColumnGroup.FireChanged();
      ColumnGroup = null;
    }

    /// <summary>
    /// Searches for the first row strictly after <paramref name="startIndex"/> whose value is not null.
    /// </summary>
    /// <param name="column">Column to scan.</param>
    /// <param name="startIndex">Row index after which the scan starts; pass -1 to scan from the first row.</param>
    /// <returns>The index of the next non-null row, or -1 if there is none.</returns>
    private int FindNextNotNullValueIndex(DoubleColumn column, int startIndex) {
      for (int candidate = startIndex + 1; candidate < column.TotalValuesCount; candidate++) {
        if (column.GetValue(candidate) != null) {
          return candidate;
        }
      }
      return -1;
    }

    /// <summary>
    /// Overwrites the rows strictly between <paramref name="startIndex"/> and
    /// <paramref name="endIndex"/> with values lying on the straight line through the values
    /// stored at those two rows.
    /// </summary>
    /// <param name="column">Column whose values are changed.</param>
    /// <param name="startIndex">Row holding the non-null value at the start of the gap.</param>
    /// <param name="endIndex">Row holding the non-null value at the end of the gap.</param>
    /// <exception cref="CommandExecutionException">
    /// Thrown if a row inside the gap already holds a non-null value.
    /// </exception>
    private void InterpolateValues(DoubleColumn column, int startIndex, int endIndex) {
      double lower = (double)column.GetValue(startIndex);
      double upper = (double)column.GetValue(endIndex);
      // Value increment per row along the line from lower to upper.
      double slope = (upper - lower) / (endIndex - startIndex);

      int row = startIndex + 1;
      while (row < endIndex) {
        if (column.GetValue(row) != null) {
          throw new CommandExecutionException("Tried to manipulate non null value!", this);
        }
        column.ChangeValue(row, lower + slope * (row - startIndex));
        row++;
      }
    }
  }
}
Note: See TracBrowser for help on using the repository browser.