Free cookie consent management tool by TermsFeed Policy Generator

source: branches/DataPreprocessing/HeuristicLab.DataPreprocessing/3.3/Implementations/TransformationLogic.cs @ 10671

Last change on this file since 10671 was 10586, checked in by tsteinre, 11 years ago
  • divided/refactored PreprocessingData into TransactionalPreprocessingData and preprocessingData
File size: 2.6 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2013 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23
24namespace HeuristicLab.DataPreprocessing {
25
26  public class TransformationLogic : ITransformationLogic {
27
28    private readonly ITransactionalPreprocessingData preprocessingData;
29    private readonly ISearchLogic searchLogic;
30    private readonly IStatisticsLogic statisticsLogic;
31
32    public TransformationLogic(ITransactionalPreprocessingData thePreprocessingData, ISearchLogic theSearchLogic, IStatisticsLogic theStatisticsLogic) {
33      preprocessingData = thePreprocessingData;
34      searchLogic = theSearchLogic;
35      statisticsLogic = theStatisticsLogic;
36    }
37
38    public void DeleteRowsWithMissingValuesGreater(double percent) {
39      for (int i = 0; i < preprocessingData.Rows; ++i) {
40        int missingCount = statisticsLogic.GetRowMissingValueCount(i);
41        if (100f / preprocessingData.Columns * missingCount >= percent) {
42          preprocessingData.DeleteRow(i);
43          --i;
44        }
45      }
46    }
47
48    public void DeleteColumnsWithMissingValuesGreater(float percent) {
49      for (int i = 0; i < preprocessingData.Columns; ++i) {
50        int missingCount = statisticsLogic.GetMissingValueCount(i);
51        if (100f / preprocessingData.Columns * missingCount >= percent) {
52          preprocessingData.DeleteColumn(i);
53          --i;
54        }
55      }
56    }
57
58    public void DeleteColumnsWithVarianceSmaller(double variance) {
59      for (int i = 0; i < preprocessingData.Columns; ++i) {
60        if (preprocessingData.IsType<double>(i) || preprocessingData.IsType<DateTime>(i)) {
61          double columnVariance = statisticsLogic.GetVariance(i);
62          if (columnVariance < variance) {
63            preprocessingData.DeleteColumn(i);
64            --i;
65          }
66        }
67      }
68    }
69
70  }
71}
Note: See TracBrowser for help on using the repository browser.