Free cookie consent management tool by TermsFeed Policy Generator

source: trunk/sources/HeuristicLab.Problems.DataAnalysis/3.4/Implementation/Regression/RegressionEnsembleModel.cs @ 13921

Last change on this file since 13921 was 13921, checked in by bburlacu, 8 years ago

#2604: Revert changes to DataAnalysisSolution and IDataAnalysisSolution and implement the desired properties in model classes that implement IDataAnalysisModel, IRegressionModel and IClassificationModel.

File size: 8.3 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Linq;
25using HeuristicLab.Common;
26using HeuristicLab.Core;
27using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
28
29namespace HeuristicLab.Problems.DataAnalysis {
30  /// <summary>
31  /// Represents regression solutions that contain an ensemble of multiple regression models
32  /// </summary>
33  [StorableClass]
34  [Item("RegressionEnsembleModel", "A regression model that contains an ensemble of multiple regression models")]
35  public sealed class RegressionEnsembleModel : NamedItem, IRegressionEnsembleModel {
36    public IEnumerable<string> VariablesUsedForPrediction {
37      get { return models.SelectMany(x => x.VariablesUsedForPrediction).Distinct().OrderBy(x => x); }
38    }
39
40    private List<IRegressionModel> models;
41    public IEnumerable<IRegressionModel> Models {
42      get { return new List<IRegressionModel>(models); }
43    }
44
45    [Storable]
46    private readonly string target;
47    public string TargetVariable {
48      get { return models.First().TargetVariable; }
49    }
50
51    [Storable(Name = "Models")]
52    private IEnumerable<IRegressionModel> StorableModels {
53      get { return models; }
54      set { models = value.ToList(); }
55    }
56
57    private List<double> modelWeights;
58    public IEnumerable<double> ModelWeights {
59      get { return modelWeights; }
60    }
61
62    [Storable(Name = "ModelWeights")]
63    private IEnumerable<double> StorableModelWeights {
64      get { return modelWeights; }
65      set { modelWeights = value.ToList(); }
66    }
67
68    [Storable]
69    private bool averageModelEstimates = true;
70    public bool AverageModelEstimates {
71      get { return averageModelEstimates; }
72      set {
73        if (averageModelEstimates != value) {
74          averageModelEstimates = value;
75          OnChanged();
76        }
77      }
78    }
79
80    #region backwards compatiblity 3.3.5
81    [Storable(Name = "models", AllowOneWay = true)]
82    private List<IRegressionModel> OldStorableModels {
83      set { models = value; }
84    }
85    #endregion
86
87    [StorableHook(HookType.AfterDeserialization)]
88    private void AfterDeserialization() {
89      // BackwardsCompatibility 3.3.14
90      #region Backwards compatible code, remove with 3.4
91      if (modelWeights == null || !modelWeights.Any())
92        modelWeights = new List<double>(models.Select(m => 1.0));
93      #endregion
94    }
95
96    [StorableConstructor]
97    private RegressionEnsembleModel(bool deserializing) : base(deserializing) { }
98    private RegressionEnsembleModel(RegressionEnsembleModel original, Cloner cloner)
99      : base(original, cloner) {
100      this.models = original.Models.Select(cloner.Clone).ToList();
101      this.modelWeights = new List<double>(original.ModelWeights);
102      this.averageModelEstimates = original.averageModelEstimates;
103    }
104    public override IDeepCloneable Clone(Cloner cloner) {
105      return new RegressionEnsembleModel(this, cloner);
106    }
107
108    public RegressionEnsembleModel() : this(Enumerable.Empty<IRegressionModel>()) { }
109    public RegressionEnsembleModel(IEnumerable<IRegressionModel> models) : this(models, models.Select(m => 1.0)) { }
110    public RegressionEnsembleModel(IEnumerable<IRegressionModel> models, IEnumerable<double> modelWeights)
111      : base() {
112      this.name = ItemName;
113      this.description = ItemDescription;
114
115
116      this.models = new List<IRegressionModel>(models);
117      this.modelWeights = new List<double>(modelWeights);
118    }
119
120    public void Add(IRegressionModel model) {
121      Add(model, 1.0);
122    }
123    public void Add(IRegressionModel model, double weight) {
124      models.Add(model);
125      modelWeights.Add(weight);
126      OnChanged();
127    }
128
129    public void AddRange(IEnumerable<IRegressionModel> models) {
130      AddRange(models, models.Select(m => 1.0));
131    }
132    public void AddRange(IEnumerable<IRegressionModel> models, IEnumerable<double> weights) {
133      this.models.AddRange(models);
134      modelWeights.AddRange(weights);
135      OnChanged();
136    }
137
138    public void Remove(IRegressionModel model) {
139      var index = models.IndexOf(model);
140      models.RemoveAt(index);
141      modelWeights.RemoveAt(index);
142      OnChanged();
143    }
144    public void RemoveRange(IEnumerable<IRegressionModel> models) {
145      foreach (var model in models) {
146        var index = this.models.IndexOf(model);
147        this.models.RemoveAt(index);
148        modelWeights.RemoveAt(index);
149      }
150      OnChanged();
151    }
152
153    public double GetModelWeight(IRegressionModel model) {
154      var index = models.IndexOf(model);
155      return modelWeights[index];
156    }
157    public void SetModelWeight(IRegressionModel model, double weight) {
158      var index = models.IndexOf(model);
159      modelWeights[index] = weight;
160      OnChanged();
161    }
162
163    #region evaluation
164    public IEnumerable<IEnumerable<double>> GetEstimatedValueVectors(IDataset dataset, IEnumerable<int> rows) {
165      var estimatedValuesEnumerators = (from model in models
166                                        let weight = GetModelWeight(model)
167                                        select model.GetEstimatedValues(dataset, rows).Select(e => weight * e)
168                                        .GetEnumerator()).ToList();
169
170      while (estimatedValuesEnumerators.All(en => en.MoveNext())) {
171        yield return from enumerator in estimatedValuesEnumerators
172                     select enumerator.Current;
173      }
174    }
175
176    public IEnumerable<double> GetEstimatedValues(IDataset dataset, IEnumerable<int> rows) {
177      double weightsSum = modelWeights.Sum();
178      var summedEstimates = from estimatedValuesVector in GetEstimatedValueVectors(dataset, rows)
179                            select estimatedValuesVector.DefaultIfEmpty(double.NaN).Sum();
180
181      if (AverageModelEstimates)
182        return summedEstimates.Select(v => v / weightsSum);
183      else
184        return summedEstimates;
185
186    }
187
188    public IEnumerable<double> GetEstimatedValues(IDataset dataset, IEnumerable<int> rows, Func<int, IRegressionModel, bool> modelSelectionPredicate) {
189      var estimatedValuesEnumerators = GetEstimatedValueVectors(dataset, rows).GetEnumerator();
190      var rowsEnumerator = rows.GetEnumerator();
191
192      while (rowsEnumerator.MoveNext() & estimatedValuesEnumerators.MoveNext()) {
193        var estimatedValueEnumerator = estimatedValuesEnumerators.Current.GetEnumerator();
194        int currentRow = rowsEnumerator.Current;
195        double weightsSum = 0.0;
196        double filteredEstimatesSum = 0.0;
197
198        for (int m = 0; m < models.Count; m++) {
199          estimatedValueEnumerator.MoveNext();
200          var model = models[m];
201          if (!modelSelectionPredicate(currentRow, model)) continue;
202
203          filteredEstimatesSum += estimatedValueEnumerator.Current;
204          weightsSum += modelWeights[m];
205        }
206
207        if (AverageModelEstimates)
208          yield return filteredEstimatesSum / weightsSum;
209        else
210          yield return filteredEstimatesSum;
211      }
212    }
213
214    #endregion
215
216    public event EventHandler Changed;
217    private void OnChanged() {
218      var handler = Changed;
219      if (handler != null)
220        handler(this, EventArgs.Empty);
221    }
222
223
224    public RegressionEnsembleSolution CreateRegressionSolution(IRegressionProblemData problemData) {
225      return new RegressionEnsembleSolution(this, new RegressionEnsembleProblemData(problemData));
226    }
227    IRegressionSolution IRegressionModel.CreateRegressionSolution(IRegressionProblemData problemData) {
228      return CreateRegressionSolution(problemData);
229    }
230  }
231}
Note: See TracBrowser for help on using the repository browser.