#region License Information
/* HeuristicLab
* Copyright (C) Heuristic and Evolutionary Algorithms Laboratory (HEAL)
*
* This file is part of HeuristicLab.
*
* HeuristicLab is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* HeuristicLab is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with HeuristicLab. If not, see .
*/
#endregion
using System;
using System.Collections.Generic;
using HeuristicLab.Core;
using HeuristicLab.Data;
using HeuristicLab.Problems.DataAnalysis;
using HEAL.Attic;
namespace HeuristicLab.DataPreprocessing {
[StorableType("1fd88253-ae07-415f-81df-5b73c61fd495")]
public interface IPreprocessingData : INamedItem {
#region Cells
bool IsCellEmpty(int columnIndex, int rowIndex);
T GetCell(int columnIndex, int rowIndex);
void SetCell(int columnIndex, int rowIndex, T value);
string GetCellAsString(int columnIndex, int rowIndex);
IList GetValues(int columnIndex, bool considerSelection = false);
void SetValues(int columnIndex, IList values);
bool SetValue(string value, int columnIndex, int rowIndex);
int Columns { get; }
int Rows { get; }
#endregion
#region Rows
void InsertRow(int rowIndex);
void DeleteRow(int rowIndex);
void DeleteRowsWithIndices(IEnumerable rows);
void InsertColumn(string variableName, int columnIndex);
void DeleteColumn(int columnIndex);
void RenameColumn(int columnIndex, string name);
void RenameColumns(IList names);
bool AreAllStringColumns(IEnumerable columnIndices);
#endregion
#region Variables
IEnumerable VariableNames { get; }
IEnumerable GetDoubleVariableNames();
string GetVariableName(int columnIndex);
int GetColumnIndex(string variableName);
bool VariableHasType(int columnIndex);
Type GetVariableType(int columnIndex);
IList InputVariables { get; }
string TargetVariable { get; } // optional
#endregion
#region Partitions
IntRange TrainingPartition { get; }
IntRange TestPartition { get; }
#endregion
#region Transformations
IList Transformations { get; }
#endregion
#region Validation
bool Validate(string value, out string errorMessage, int columnIndex);
#endregion
#region Import & Export
void Import(IDataAnalysisProblemData problemData);
Dataset ExportToDataset();
#endregion
#region Selection
IDictionary> Selection { get; set; }
void ClearSelection();
event EventHandler SelectionChanged;
#endregion
#region Transactions
event DataPreprocessingChangedEventHandler Changed;
bool IsUndoAvailable { get; }
void Undo();
void InTransaction(Action action, DataPreprocessingChangedEventType type = DataPreprocessingChangedEventType.Any);
void BeginTransaction(DataPreprocessingChangedEventType type);
void EndTransaction();
#endregion
#region Statistics
T GetMin(int columnIndex, bool considerSelection = false, T emptyValue = default(T));
T GetMax(int columnIndex, bool considerSelection = false, T emptyValue = default(T));
T GetMean(int columnIndex, bool considerSelection = false, T emptyValue = default(T));
T GetMedian(int columnIndex, bool considerSelection = false, T emptyValue = default(T)) where T : IComparable;
T GetMode(int columnIndex, bool considerSelection = false, T emptyValue = default(T)) where T : IEquatable;
T GetStandardDeviation(int columnIndex, bool considerSelection = false, T emptyValue = default(T));
T GetVariance(int columnIndex, bool considerSelection = false, T emptyValue = default(T));
T GetQuantile(double alpha, int columnIndex, bool considerSelection = false, T emptyValue = default(T)) where T : IComparable;
int GetDistinctValues(int columnIndex, bool considerSelection = false);
int GetMissingValueCount();
int GetMissingValueCount(int columnIndex);
int GetRowMissingValueCount(int rowIndex);
#endregion
}
}