Free cookie consent management tool by TermsFeed Policy Generator

source: branches/DataAnalysis Refactoring/HeuristicLab.Problems.DataAnalysis/3.4/RegressionProblemData.cs @ 5559

Last change on this file since 5559 was 5559, checked in by mkommend, 13 years ago

#1418: worked on different ProblemData classes.

File size: 4.5 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2011 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.IO;
25using System.Linq;
26using HeuristicLab.Common;
27using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
28
namespace HeuristicLab.Problems.DataAnalysis {
  /// <summary>
  /// Problem data for regression: the dataset and allowed input variables handled by
  /// <see cref="DataAnalysisProblemData"/> plus the name of the target variable.
  /// </summary>
  [StorableClass]
  public sealed class RegressionProblemData : DataAnalysisProblemData, IRegressionProblemData {

    #region default data
    // Sample rows for the default dataset. The column order is (y, x), matching the
    // variable names passed to the Dataset constructor in the static constructor below.
    private static readonly double[,] kozaF1 = new double[,] {
          {2.017885919, -1.449165046},
          {1.30060506,  -1.344523885},
          {1.147134798, -1.317989331},
          {0.877182504, -1.266142284},
          {0.852562452, -1.261020794},
          {0.431095788, -1.158793317},
          {0.112586002, -1.050908405},
          {0.04594507,  -1.021989402},
          {0.042572879, -1.020438113},
          {-0.074027291,  -0.959859562},
          {-0.109178553,  -0.938094706},
          {-0.259721109,  -0.803635355},
          {-0.272991057,  -0.387519561},
          {-0.161978191,  -0.193611001},
          {-0.102489983,  -0.114215349},
          {-0.01469968, -0.014918985},
          {-0.008863365,  -0.008942626},
          {0.026751057, 0.026054094},
          {0.166922436, 0.14309643},
          {0.176953808, 0.1504144},
          {0.190233418, 0.159916534},
          {0.199800708, 0.166635331},
          {0.261502822, 0.207600348},
          {0.30182879,  0.232370249},
          {0.83763905,  0.468046718}
    };
    // Defaults used by the parameterless constructor; assigned once in the static constructor.
    private static readonly Dataset defaultDataset;
    private static readonly IEnumerable<string> defaultAllowedInputVariables;
    private static readonly string defaultTargetVariable;

    /// <summary>
    /// Builds the default dataset from <see cref="kozaF1"/> with "y" as target and "x" as the only input.
    /// </summary>
    static RegressionProblemData() {
      defaultDataset = new Dataset(new string[] { "y", "x" }, kozaF1);
      defaultDataset.Name = "Fourth-order Polynomial Function Benchmark Dataset";
      defaultDataset.Description = "f(x) = x^4 + x^3 + x^2 + x^1";
      defaultAllowedInputVariables = new List<string>() { "x" };
      defaultTargetVariable = "y";
    }
    #endregion

    #region properties
    [Storable]
    private string targetVariable;
    /// <summary>
    /// Name of the dataset variable that is to be predicted.
    /// </summary>
    /// <exception cref="ArgumentException">
    /// Thrown by the setter when the given name is not one of the dataset's variable names.
    /// </exception>
    public string TargetVariable {
      get { return targetVariable; }
      set {
        if (!Dataset.VariableNames.Contains(value))
          throw new ArgumentException(string.Format("The target variable {0} is not present in the dataset", value));
        // Only notify when the value actually changes.
        if (targetVariable != value) {
          targetVariable = value;
          OnChanged();
        }
      }
    }
    #endregion

    [StorableConstructor]
    private RegressionProblemData(bool deserializing) : base(deserializing) { }

    /// <summary>
    /// Cloning constructor. Copies the target variable in addition to whatever the base class copies.
    /// </summary>
    private RegressionProblemData(RegressionProblemData original, Cloner cloner)
      : base(original, cloner) {
      // The field is declared in this class, so it has to be copied here; otherwise the
      // clone would end up without a target variable. The backing field is assigned
      // directly (not via the property) so that cloning raises no change notification
      // and does not re-validate a value the original already accepted.
      targetVariable = original.targetVariable;
    }

    /// <summary>
    /// Creates a clone of this instance via the cloning constructor.
    /// </summary>
    public override IDeepCloneable Clone(Cloner cloner) { return new RegressionProblemData(this, cloner); }

    /// <summary>
    /// Creates problem data for the built-in default dataset (target "y", input "x").
    /// </summary>
    public RegressionProblemData()
      : this(defaultDataset, defaultAllowedInputVariables, defaultTargetVariable) {
    }

    /// <summary>
    /// Creates problem data for the given dataset.
    /// </summary>
    /// <param name="dataset">The dataset, passed on to the base class.</param>
    /// <param name="allowedInputVariables">The allowed input variables, passed on to the base class.</param>
    /// <param name="targetVariable">Name of the target variable; must be a variable of <paramref name="dataset"/>.</param>
    /// <exception cref="ArgumentException">
    /// Thrown when <paramref name="targetVariable"/> is not present in the dataset.
    /// </exception>
    public RegressionProblemData(Dataset dataset, IEnumerable<string> allowedInputVariables, string targetVariable)
      : base(dataset, allowedInputVariables) {
      // Goes through the property so the name is validated against the dataset.
      TargetVariable = targetVariable;
    }

    /// <summary>
    /// Parses a table file and creates problem data from it. The first variable name of the
    /// parsed table is used as target variable, all remaining variable names as allowed inputs.
    /// </summary>
    /// <param name="fileName">Path of the file to parse.</param>
    /// <returns>Problem data named "Data imported from " followed by the file name without its directory.</returns>
    public static RegressionProblemData ImportFromFile(string fileName) {
      TableFileParser csvFileParser = new TableFileParser();
      csvFileParser.Parse(fileName);

      Dataset dataset = new Dataset(csvFileParser.VariableNames, csvFileParser.Values);
      dataset.Name = Path.GetFileName(fileName);

      RegressionProblemData problemData = new RegressionProblemData(dataset, dataset.VariableNames.Skip(1), dataset.VariableNames.First());
      problemData.Name = "Data imported from " + Path.GetFileName(fileName);
      return problemData;
    }
  }
}
Note: See TracBrowser for help on using the repository browser.