Free cookie consent management tool by TermsFeed Policy Generator

source: branches/DataAnalysis Refactoring/HeuristicLab.Problems.DataAnalysis.Symbolic/3.4/Analyzers/SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer.cs @ 5685

Last change on this file since 5685 was 5685, checked in by gkronber, 13 years ago

#1418 Implemented validation best solution analyzers for symbolic classification and regression, added analyzers to symbolic data analysis problem classes and changed details of parameter wiring in problem classes.

File size: 8.5 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2011 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System.Collections.Generic;
23using System.Linq;
24using HeuristicLab.Common;
25using HeuristicLab.Core;
26using HeuristicLab.Data;
27using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
28using HeuristicLab.Operators;
29using HeuristicLab.Optimization;
30using HeuristicLab.Parameters;
31using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
32
33namespace HeuristicLab.Problems.DataAnalysis.Symbolic {
34  /// <summary>
35  /// An operator that analyzes the validation best symbolic data analysis solution for multi objective symbolic data analysis problems.
36  /// </summary>
37  [Item("SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer", "An operator that analyzes the validation best symbolic data analysis solution for multi objective symbolic data analysis problems.")]
38  [StorableClass]
39  public abstract class SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer<S, T, U> : SymbolicDataAnalysisValidationAnalyzer<T, U>,
40    ISymbolicDataAnalysisMultiObjectiveAnalyzer
41    where S : class, ISymbolicDataAnalysisSolution
42    where T : class, ISymbolicDataAnalysisMultiObjectiveEvaluator<U>
43    where U : class, IDataAnalysisProblemData {
44    private const string QualitiesParameterName = "Qualities";
45    private const string MaximizationParameterName = "Maximization";
46    private const string ValidationBestSolutionsParameterName = "Best validation solutions";
47    private const string ValidationBestSolutionQualitiesParameterName = "Best validation solution qualities";
48    private const string ValidationBestSolutionsResultName = ValidationBestSolutionsParameterName;
49    private const string ValidationBestSolutionQualitiesResultName = ValidationBestSolutionQualitiesParameterName;
50
51    #region parameter properties
52    public IScopeTreeLookupParameter<DoubleArray> QualitiesParameter {
53      get { return (IScopeTreeLookupParameter<DoubleArray>)Parameters[QualitiesParameterName]; }
54    }
55    public ILookupParameter<BoolArray> MaximizationParameter {
56      get { return (ILookupParameter<BoolArray>)Parameters[MaximizationParameterName]; }
57    }
58    public ILookupParameter<ItemList<S>> ValidationBestSolutionsParameter {
59      get { return (ILookupParameter<ItemList<S>>)Parameters[ValidationBestSolutionsParameterName]; }
60    }
61    public ILookupParameter<ItemList<DoubleArray>> ValidationBestSolutionQualitiesParameter {
62      get { return (ILookupParameter<ItemList<DoubleArray>>)Parameters[ValidationBestSolutionQualitiesParameterName]; }
63    }
64    #endregion
65    #region properties
66    public ItemArray<DoubleArray> Qualities {
67      get { return QualitiesParameter.ActualValue; }
68    }
69    public BoolArray Maximization {
70      get { return MaximizationParameter.ActualValue; }
71    }
72    public ItemList<S> ValidationBestSolutions {
73      get { return ValidationBestSolutionsParameter.ActualValue; }
74      set { ValidationBestSolutionsParameter.ActualValue = value; }
75    }
76    public ItemList<DoubleArray> ValidationBestSolutionQualities {
77      get { return ValidationBestSolutionQualitiesParameter.ActualValue; }
78      set { ValidationBestSolutionQualitiesParameter.ActualValue = value; }
79    }
80    #endregion
81
82    [StorableConstructor]
83    protected SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer(bool deserializing) : base(deserializing) { }
84    protected SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer(SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer<S, T, U> original, Cloner cloner) : base(original, cloner) { }
85    public SymbolicDataAnalysisMultiObjectiveValidationBestSolutionAnalyzer()
86      : base() {
87      Parameters.Add(new ScopeTreeLookupParameter<DoubleArray>(QualitiesParameterName, "The qualities of the trees that should be analyzed."));
88      Parameters.Add(new LookupParameter<BoolArray>(MaximizationParameterName, "The directions of optimization for each dimension."));
89      Parameters.Add(new LookupParameter<ItemList<S>>(ValidationBestSolutionsParameterName, "The validation best (Pareto-optimal) symbolic data analysis solutions."));
90      Parameters.Add(new LookupParameter<ItemList<DoubleArray>>(ValidationBestSolutionQualitiesParameterName, "The qualities of the validation best (Pareto-optimal) solutions."));
91    }
92
93    public override IOperation Apply() {
94      var results = ResultCollection;
95      // create empty parameter and result values
96      if (ValidationBestSolutions == null) {
97        ValidationBestSolutions = new ItemList<S>();
98        ValidationBestSolutionQualities = new ItemList<DoubleArray>();
99        results.Add(new Result(ValidationBestSolutionQualitiesResultName, ValidationBestSolutionQualities));
100        results.Add(new Result(ValidationBestSolutionsResultName, ValidationBestSolutions));
101      }
102
103      IList<double[]> trainingBestQualities = ValidationBestSolutionQualities
104        .Select(x => x.ToArray())
105        .ToList();
106
107      #region find best trees
108      IList<int> nonDominatedIndexes = new List<int>();
109      ISymbolicExpressionTree[] tree = SymbolicExpressionTrees.ToArray();
110      List<double[]> qualities = new List<double[]>();
111      bool[] maximization = Maximization.ToArray();
112      List<double[]> newNonDominatedQualities = new List<double[]>();
113      var evaluator = Evaluator;
114      int start = ValidationSamplesStart.Value;
115      int end = ValidationSamplesEnd.Value;
116      IEnumerable<int> rows = Enumerable.Range(start, end - start);
117      for (int i = 0; i < tree.Length; i++) {
118        qualities.Add(evaluator.Evaluate(ExecutionContext, tree[i], ProblemData, rows)); // qualities[i] = ...
119        if (IsNonDominated(qualities[i], trainingBestQualities, maximization) &&
120          IsNonDominated(qualities[i], qualities, maximization)) {
121          newNonDominatedQualities.Add(qualities[i]);
122          nonDominatedIndexes.Add(i);
123        }
124      }
125      #endregion
126      #region update Pareto-optimal solution archive
127      if (nonDominatedIndexes.Count > 0) {
128        ItemList<DoubleArray> nonDominatedQualities = new ItemList<DoubleArray>();
129        ItemList<S> nonDominatedSolutions = new ItemList<S>();
130        // add all new non-dominated solutions to the archive
131        foreach (var index in nonDominatedIndexes) {
132          S solution = CreateSolution(tree[index], qualities[index]);
133          nonDominatedSolutions.Add(solution);
134          nonDominatedQualities.Add(new DoubleArray(qualities[index]));
135        }
136        // add old non-dominated solutions only if they are not dominated by one of the new solutions
137        for (int i = 0; i < trainingBestQualities.Count; i++) {
138          if (IsNonDominated(trainingBestQualities[i], newNonDominatedQualities, maximization)) {
139            nonDominatedSolutions.Add(ValidationBestSolutions[i]);
140            nonDominatedQualities.Add(ValidationBestSolutionQualities[i]);
141          }
142        }
143
144        results[ValidationBestSolutionsResultName].Value = nonDominatedSolutions;
145        results[ValidationBestSolutionQualitiesResultName].Value = nonDominatedQualities;
146      }
147      #endregion
148      return base.Apply();
149    }
150
151    protected abstract S CreateSolution(ISymbolicExpressionTree bestTree, double[] bestQuality);
152
153    private bool IsNonDominated(double[] point, IList<double[]> points, bool[] maximization) {
154      foreach (var refPoint in points) {
155        bool refPointDominatesPoint = true;
156        for (int i = 0; i < point.Length; i++) {
157          refPointDominatesPoint &= IsBetter(refPoint[i], point[i], maximization[i]);
158        }
159        if (refPointDominatesPoint) return false;
160      }
161      return true;
162    }
163    private bool IsBetter(double lhs, double rhs, bool maximization) {
164      if (maximization) return lhs > rhs;
165      else return lhs < rhs;
166    }
167  }
168}
Note: See TracBrowser for help on using the repository browser.