Free cookie consent management tool by TermsFeed Policy Generator

source: branches/2521_ProblemRefactoring/HeuristicLab.Problems.GeneticProgramming/3.3/BasicSymbolicRegression/Problem.cs @ 17320

Last change on this file since 17320 was 17320, checked in by mkommend, 5 years ago

#2521: Added cancellation token to evaluate function of problems.

File size: 7.9 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Linq;
25using System.Threading;
26using HEAL.Attic;
27using HeuristicLab.Common;
28using HeuristicLab.Core;
29using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
30using HeuristicLab.Parameters;
31using HeuristicLab.Problems.DataAnalysis;
32using HeuristicLab.Problems.Instances;
33
34
35namespace HeuristicLab.Problems.GeneticProgramming.BasicSymbolicRegression {
36  [Item("Koza-style Symbolic Regression", "An implementation of symbolic regression without bells-and-whistles. Use \"Symbolic Regression Problem (single-objective)\" if you want to use all features.")]
37  [Creatable(CreatableAttribute.Categories.GeneticProgrammingProblems, Priority = 900)]
38  [StorableType("72011B73-28C6-4D5E-BEDF-27425BC87B9C")]
39  public sealed class Problem : SymbolicExpressionTreeProblem, IRegressionProblem, IProblemInstanceConsumer<IRegressionProblemData>, IProblemInstanceExporter<IRegressionProblemData> {
40
41    #region parameter names
42    private const string ProblemDataParameterName = "ProblemData";
43    #endregion
44
45    #region Parameter Properties
46    IParameter IDataAnalysisProblem.ProblemDataParameter { get { return ProblemDataParameter; } }
47
48    public IValueParameter<IRegressionProblemData> ProblemDataParameter {
49      get { return (IValueParameter<IRegressionProblemData>)Parameters[ProblemDataParameterName]; }
50    }
51    #endregion
52
53    #region Properties
54    public IRegressionProblemData ProblemData {
55      get { return ProblemDataParameter.Value; }
56      set { ProblemDataParameter.Value = value; }
57    }
58    IDataAnalysisProblemData IDataAnalysisProblem.ProblemData { get { return ProblemData; } }
59    #endregion
60
61    public event EventHandler ProblemDataChanged;
62
63    #region item cloning and persistence
64    // persistence
65    [StorableConstructor]
66    private Problem(StorableConstructorFlag _) : base(_) { }
67    [StorableHook(HookType.AfterDeserialization)]
68    private void AfterDeserialization() {
69      RegisterEventHandlers();
70    }
71
72    // cloning
73    private Problem(Problem original, Cloner cloner)
74      : base(original, cloner) {
75      RegisterEventHandlers();
76    }
77    public override IDeepCloneable Clone(Cloner cloner) { return new Problem(this, cloner); }
78    #endregion
79
80    public Problem() : base(new SymbolicExpressionTreeEncoding()) {
81      Maximization = true;
82      Parameters.Add(new ValueParameter<IRegressionProblemData>(ProblemDataParameterName, "The data for the regression problem", new RegressionProblemData()));
83
84      Encoding.TreeLength = 100;
85      Encoding.TreeDepth = 17;
86
87      UpdateGrammar();
88      RegisterEventHandlers();
89    }
90
91
92    public override double Evaluate(ISymbolicExpressionTree tree, IRandom random, CancellationToken cancellationToken) {
93      // Doesn't use classes from HeuristicLab.Problems.DataAnalysis.Symbolic to make sure that the implementation can be fully understood easily.
94      // HeuristicLab.Problems.DataAnalysis.Symbolic would already provide all the necessary functionality (esp. interpreter) but at a much higher complexity.
95      // Another argument is that we don't need a reference to HeuristicLab.Problems.DataAnalysis.Symbolic
96
97      var problemData = ProblemData;
98      var rows = ProblemData.TrainingIndices.ToArray();
99      var target = problemData.Dataset.GetDoubleValues(problemData.TargetVariable, rows);
100      var predicted = Interpret(tree, problemData.Dataset, rows);
101
102      OnlineCalculatorError errorState;
103      var r = OnlinePearsonsRCalculator.Calculate(target, predicted, out errorState);
104      if (errorState != OnlineCalculatorError.None) r = 0;
105      return r * r;
106    }
107
108    private IEnumerable<double> Interpret(ISymbolicExpressionTree tree, IDataset dataset, IEnumerable<int> rows) {
109      // skip programRoot and startSymbol
110      return InterpretRec(tree.Root.GetSubtree(0).GetSubtree(0), dataset, rows);
111    }
112
113    private IEnumerable<double> InterpretRec(ISymbolicExpressionTreeNode node, IDataset dataset, IEnumerable<int> rows) {
114      Func<ISymbolicExpressionTreeNode, ISymbolicExpressionTreeNode, Func<double, double, double>, IEnumerable<double>> binaryEval =
115        (left, right, f) => InterpretRec(left, dataset, rows).Zip(InterpretRec(right, dataset, rows), f);
116
117      switch (node.Symbol.Name) {
118        case "+": return binaryEval(node.GetSubtree(0), node.GetSubtree(1), (x, y) => x + y);
119        case "*": return binaryEval(node.GetSubtree(0), node.GetSubtree(1), (x, y) => x * y);
120        case "-": return binaryEval(node.GetSubtree(0), node.GetSubtree(1), (x, y) => x - y);
121        case "%": return binaryEval(node.GetSubtree(0), node.GetSubtree(1), (x, y) => y.IsAlmost(0.0) ? 0.0 : x / y); // protected division
122        default: {
123            double erc;
124            if (double.TryParse(node.Symbol.Name, out erc)) {
125              return rows.Select(_ => erc);
126            } else {
127              // assume that this is a variable name
128              return dataset.GetDoubleValues(node.Symbol.Name, rows);
129            }
130          }
131      }
132    }
133
134
135    #region events
136    private void RegisterEventHandlers() {
137      ProblemDataParameter.ValueChanged += new EventHandler(ProblemDataParameter_ValueChanged);
138      if (ProblemDataParameter.Value != null) ProblemDataParameter.Value.Changed += new EventHandler(ProblemData_Changed);
139    }
140
141    private void ProblemDataParameter_ValueChanged(object sender, EventArgs e) {
142      ProblemDataParameter.Value.Changed += new EventHandler(ProblemData_Changed);
143      OnProblemDataChanged();
144      OnReset();
145    }
146
147    private void ProblemData_Changed(object sender, EventArgs e) {
148      OnReset();
149    }
150
151    private void OnProblemDataChanged() {
152      UpdateGrammar();
153
154      var handler = ProblemDataChanged;
155      if (handler != null) handler(this, EventArgs.Empty);
156    }
157
158    private void UpdateGrammar() {
159      // whenever ProblemData is changed we create a new grammar with the necessary symbols
160      var g = new SimpleSymbolicExpressionGrammar();
161      g.AddSymbols(new[] { "+", "*", "%", "-" }, 2, 2); // % is protected division 1/0 := 0
162
163      foreach (var variableName in ProblemData.AllowedInputVariables)
164        g.AddTerminalSymbol(variableName);
165
166      // generate ephemeral random consts in the range [-10..+10[ (2*number of variables)
167      var rand = new System.Random();
168      for (int i = 0; i < ProblemData.AllowedInputVariables.Count() * 2; i++) {
169        string newErcSy;
170        do {
171          newErcSy = string.Format("{0:F2}", rand.NextDouble() * 20 - 10);
172        } while (g.Symbols.Any(sy => sy.Name == newErcSy)); // it might happen that we generate the same constant twice
173        g.AddTerminalSymbol(newErcSy);
174      }
175
176      Encoding.GrammarParameter.ReadOnly = false;
177      Encoding.Grammar = g;
178      Encoding.GrammarParameter.ReadOnly = true;
179    }
180    #endregion
181
182    #region Import & Export
183    public void Load(IRegressionProblemData data) {
184      Name = data.Name;
185      Description = data.Description;
186      ProblemData = data;
187    }
188
189    public IRegressionProblemData Export() {
190      return ProblemData;
191    }
192    #endregion
193  }
194}
Note: See TracBrowser for help on using the repository browser.