Free cookie consent management tool by TermsFeed Policy Generator

source: trunk/sources/HeuristicLab.Problems.DataAnalysis.Symbolic.Regression/3.4/SymbolicRegressionPruningOperator.cs @ 12222

Last change on this file since 12222 was 12189, checked in by bburlacu, 10 years ago

#2359: Implemented improvements

File size: 4.7 KB
RevLine 
[11025]1#region License Information
2
3/* HeuristicLab
[12012]4 * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
[11025]5 *
6 * This file is part of HeuristicLab.
7 *
8 * HeuristicLab is free software: you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation, either version 3 of the License, or
11 * (at your option) any later version.
12 *
13 * HeuristicLab is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16 * GNU General Public License for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
20 */
21
22#endregion
23
[12189]24using System.Collections.Generic;
[11025]25using System.Linq;
[10469]26using HeuristicLab.Common;
27using HeuristicLab.Core;
[12189]28using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
[10469]29using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
30
namespace HeuristicLab.Problems.DataAnalysis.Symbolic.Regression {
  /// <summary>
  /// Pruning operator specialised for symbolic regression: it builds
  /// <see cref="SymbolicRegressionModel"/> instances and scores them with
  /// Pearson's R² against the target variable of the regression problem data.
  /// </summary>
  [StorableClass]
  [Item("SymbolicRegressionPruningOperator", "An operator which prunes symbolic regression trees.")]
  public class SymbolicRegressionPruningOperator : SymbolicDataAnalysisExpressionPruningOperator {
    /// <summary>Constructor used by the persistence framework.</summary>
    [StorableConstructor]
    protected SymbolicRegressionPruningOperator(bool deserializing)
      : base(deserializing) {
    }

    /// <summary>Cloning constructor; all state is copied by the base class.</summary>
    protected SymbolicRegressionPruningOperator(SymbolicRegressionPruningOperator original, Cloner cloner)
      : base(original, cloner) {
    }

    /// <summary>Creates an operator that uses the given impact values calculator.</summary>
    public SymbolicRegressionPruningOperator(ISymbolicDataAnalysisSolutionImpactValuesCalculator impactValuesCalculator)
      : base(impactValuesCalculator) {
    }

    /// <summary>Returns a copy of this operator produced through the cloning constructor.</summary>
    public override IDeepCloneable Clone(Cloner cloner) {
      return new SymbolicRegressionPruningOperator(this, cloner);
    }

    /// <summary>
    /// Wraps <paramref name="tree"/> in a <see cref="SymbolicRegressionModel"/> bounded by
    /// the lower and upper estimation limits. <paramref name="problemData"/> is not used here.
    /// </summary>
    protected override ISymbolicDataAnalysisModel CreateModel(ISymbolicExpressionTree tree, ISymbolicDataAnalysisExpressionTreeInterpreter interpreter, IDataAnalysisProblemData problemData, DoubleLimit estimationLimits) {
      double lowerLimit = estimationLimits.Lower;
      double upperLimit = estimationLimits.Upper;
      return new SymbolicRegressionModel(tree, interpreter, lowerLimit, upperLimit);
    }

    /// <summary>
    /// Scores <paramref name="model"/> on the rows of the fitness calculation partition.
    /// The model and the operator's problem data are cast to their regression interfaces.
    /// </summary>
    protected override double Evaluate(IDataAnalysisModel model) {
      // Arguments are evaluated left to right: model cast, problem data cast, row range.
      return Evaluate(
        (IRegressionModel)model,
        (IRegressionProblemData)ProblemData,
        Enumerable.Range(FitnessCalculationPartition.Start, FitnessCalculationPartition.Size));
    }

    /// <summary>
    /// Computes Pearson's R² between the target values and the model's estimated values
    /// on <paramref name="rows"/>.
    /// </summary>
    /// <returns>The R² value, or <see cref="double.NaN"/> if the calculator reports an error.</returns>
    private static double Evaluate(IRegressionModel model, IRegressionProblemData problemData,
      IEnumerable<int> rows) {
      // Original author's note: obtaining the estimated values also bounds them.
      var predictions = model.GetEstimatedValues(problemData.Dataset, rows);
      var targets = problemData.Dataset.GetDoubleValues(problemData.TargetVariable, rows);

      OnlineCalculatorError calculatorError;
      var rSquared = OnlinePearsonsRSquaredCalculator.Calculate(targets, predictions, out calculatorError);

      return calculatorError == OnlineCalculatorError.None ? rSquared : double.NaN;
    }

    /// <summary>
    /// Prunes a clone of <paramref name="tree"/>; the tree passed in is not modified by this method.
    /// The clone's nodes are visited in prefix order and every non-constant node that
    /// qualifies is replaced by a constant node holding the replacement value reported by
    /// <paramref name="impactValuesCalculator"/>.
    /// </summary>
    /// <param name="tree">Tree to prune (cloned before any change is made).</param>
    /// <param name="impactValuesCalculator">Supplies the impact and replacement value of each node.</param>
    /// <param name="interpreter">Interpreter handed to the model built around the clone.</param>
    /// <param name="problemData">Regression problem data used for evaluation.</param>
    /// <param name="estimationLimits">Lower and upper limits handed to the model.</param>
    /// <param name="rows">Rows used for the quality and impact calculations.</param>
    /// <param name="nodeImpactThreshold">
    /// Used when <paramref name="pruneOnlyZeroImpactNodes"/> is false: a node is kept only
    /// if the threshold is strictly less than its impact.
    /// </param>
    /// <param name="pruneOnlyZeroImpactNodes">
    /// When true, only nodes whose impact is almost 0.0 are replaced.
    /// </param>
    /// <returns>The symbolic expression tree held by the model after pruning.</returns>
    public static ISymbolicExpressionTree Prune(ISymbolicExpressionTree tree, SymbolicRegressionSolutionImpactValuesCalculator impactValuesCalculator, ISymbolicDataAnalysisExpressionTreeInterpreter interpreter, IRegressionProblemData problemData, DoubleLimit estimationLimits, IEnumerable<int> rows, double nodeImpactThreshold = 0.0, bool pruneOnlyZeroImpactNodes = false) {
      var workingTree = (ISymbolicExpressionTree)tree.Clone();
      var model = new SymbolicRegressionModel(workingTree, interpreter, estimationLimits.Lower, estimationLimits.Upper);
      var prefixNodes = workingTree.IterateNodesPrefix().ToList();
      double currentQuality = Evaluate(model, problemData, rows);

      int index = 0;
      while (index < prefixNodes.Count) {
        var candidate = prefixNodes[index];
        int step = 1; // by default move on to the next node in prefix order

        if (!(candidate is ConstantTreeNode)) {
          double impact, replacement;
          impactValuesCalculator.CalculateImpactAndReplacementValues(model, candidate, problemData, rows, out impact, out replacement, currentQuality);

          // The threshold comparison is deliberately written as "threshold < impact"
          // so that a NaN impact does not count as a reason to keep the node.
          bool keepNode = pruneOnlyZeroImpactNodes
            ? !impact.IsAlmost(0.0)
            : nodeImpactThreshold < impact;

          if (!keepNode) {
            var replacementNode = (ConstantTreeNode)candidate.Grammar.GetSymbol("Constant").CreateTreeNode();
            replacementNode.Value = replacement;

            ReplaceWithConstant(candidate, replacementNode);
            step = candidate.GetLength(); // skip subtrees under the node that was folded

            currentQuality -= impact;
          }
        }

        index += step;
      }

      return model.SymbolicExpressionTree;
    }
  }
}
Note: See TracBrowser for help on using the repository browser.