Free cookie consent management tool by TermsFeed Policy Generator

source: trunk/sources/HeuristicLab.Problems.DataAnalysis.MultiVariate.Regression/3.3/Symbolic/SymbolicVectorRegressionProblem.cs @ 4068

Last change on this file since 4068 was 4068, checked in by swagner, 14 years ago

Sorted usings and removed unused usings in entire solution (#1094)

File size: 16.9 KB
Line 
#region License Information
/* HeuristicLab
 * Copyright (C) 2002-2010 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
 *
 * This file is part of HeuristicLab.
 *
 * HeuristicLab is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * HeuristicLab is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
 */
#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Linq;
25using HeuristicLab.Common;
26using HeuristicLab.Core;
27using HeuristicLab.Data;
28using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
29using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding.Analyzers;
30using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding.Creators;
31using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding.Interfaces;
32using HeuristicLab.Optimization;
33using HeuristicLab.Parameters;
34using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
35using HeuristicLab.PluginInfrastructure;
36using HeuristicLab.Problems.DataAnalysis.Symbolic;
37
namespace HeuristicLab.Problems.DataAnalysis.MultiVariate.Regression.Symbolic {
  /// <summary>
  /// Problem definition for symbolic regression with several target variables.
  /// It exposes the tree creator, interpreter, grammar, tree size limits and the
  /// per-target estimation limits as parameters, and keeps the symbolic expression
  /// tree operators wired to those parameters.
  /// </summary>
  [StorableClass]
  public class SymbolicVectorRegressionProblem : MultiVariateDataAnalysisProblem, IProblem {

    #region Parameter Properties
    /// <summary>Parameter holding the operator that creates new symbolic expression trees.</summary>
    public new ValueParameter<SymbolicExpressionTreeCreator> SolutionCreatorParameter {
      get { return (ValueParameter<SymbolicExpressionTreeCreator>)Parameters["SolutionCreator"]; }
    }

    /// <summary>Untyped view of <see cref="SolutionCreatorParameter"/> required by <see cref="IProblem"/>.</summary>
    IParameter IProblem.SolutionCreatorParameter {
      get { return SolutionCreatorParameter; }
    }

    /// <summary>Parameter holding the interpreter used to evaluate symbolic expression trees.</summary>
    public ValueParameter<ISymbolicExpressionTreeInterpreter> SymbolicExpressionTreeInterpreterParameter {
      get { return (ValueParameter<ISymbolicExpressionTreeInterpreter>)Parameters["SymbolicExpressionTreeInterpreter"]; }
    }

    /// <summary>Parameter holding the grammar used for the regression models.</summary>
    public ValueParameter<ISymbolicExpressionGrammar> FunctionTreeGrammarParameter {
      get { return (ValueParameter<ISymbolicExpressionGrammar>)Parameters["FunctionTreeGrammar"]; }
    }

    /// <summary>Parameter holding the maximal length of a symbolic expression.</summary>
    public ValueParameter<IntValue> MaxExpressionLengthParameter {
      get { return (ValueParameter<IntValue>)Parameters["MaxExpressionLength"]; }
    }

    /// <summary>Parameter holding the maximal depth of a symbolic expression.</summary>
    public ValueParameter<IntValue> MaxExpressionDepthParameter {
      get { return (ValueParameter<IntValue>)Parameters["MaxExpressionDepth"]; }
    }

    /// <summary>Parameter holding the maximal number of automatically defined functions.</summary>
    public ValueParameter<IntValue> MaxFunctionDefiningBranchesParameter {
      get { return (ValueParameter<IntValue>)Parameters["MaxFunctionDefiningBranches"]; }
    }

    /// <summary>Parameter holding the maximal number of arguments of automatically defined functions.</summary>
    public ValueParameter<IntValue> MaxFunctionArgumentsParameter {
      get { return (ValueParameter<IntValue>)Parameters["MaxFunctionArguments"]; }
    }

    /// <summary>Parameter holding the upper limit of the estimated values, one entry per target component.</summary>
    public ValueParameter<DoubleArray> UpperEstimationLimitParameter {
      get { return (ValueParameter<DoubleArray>)Parameters["UpperEstimationLimit"]; }
    }

    /// <summary>Parameter holding the lower limit of the estimated values, one entry per target component.</summary>
    public ValueParameter<DoubleArray> LowerEstimationLimitParameter {
      get { return (ValueParameter<DoubleArray>)Parameters["LowerEstimationLimit"]; }
    }
    #endregion

    #region Properties
    /// <summary>Value of <see cref="MaxExpressionLengthParameter"/>.</summary>
    public IntValue MaxExpressionLength {
      get { return MaxExpressionLengthParameter.Value; }
      set { MaxExpressionLengthParameter.Value = value; }
    }

    /// <summary>Value of <see cref="MaxExpressionDepthParameter"/>.</summary>
    public IntValue MaxExpressionDepth {
      get { return MaxExpressionDepthParameter.Value; }
      set { MaxExpressionDepthParameter.Value = value; }
    }

    /// <summary>Value of <see cref="MaxFunctionDefiningBranchesParameter"/>.</summary>
    public IntValue MaxFunctionDefiningBranches {
      get { return MaxFunctionDefiningBranchesParameter.Value; }
      set { MaxFunctionDefiningBranchesParameter.Value = value; }
    }

    /// <summary>Value of <see cref="MaxFunctionArgumentsParameter"/>.</summary>
    public IntValue MaxFunctionArguments {
      get { return MaxFunctionArgumentsParameter.Value; }
      set { MaxFunctionArgumentsParameter.Value = value; }
    }

    /// <summary>Value of <see cref="SolutionCreatorParameter"/>.</summary>
    public new SymbolicExpressionTreeCreator SolutionCreator {
      get { return SolutionCreatorParameter.Value; }
      set { SolutionCreatorParameter.Value = value; }
    }

    /// <summary>Value of <see cref="UpperEstimationLimitParameter"/>.</summary>
    public DoubleArray UpperEstimationLimit {
      get { return UpperEstimationLimitParameter.Value; }
      set { UpperEstimationLimitParameter.Value = value; }
    }

    /// <summary>Value of <see cref="LowerEstimationLimitParameter"/>.</summary>
    public DoubleArray LowerEstimationLimit {
      get { return LowerEstimationLimitParameter.Value; }
      set { LowerEstimationLimitParameter.Value = value; }
    }

    /// <summary>Read-only view of the solution creator required by <see cref="IProblem"/>.</summary>
    ISolutionCreator IProblem.SolutionCreator {
      get { return SolutionCreatorParameter.Value; }
    }

    /// <summary>Value of <see cref="SymbolicExpressionTreeInterpreterParameter"/>.</summary>
    public ISymbolicExpressionTreeInterpreter SymbolicExpressionTreeInterpreter {
      get { return SymbolicExpressionTreeInterpreterParameter.Value; }
      set { SymbolicExpressionTreeInterpreterParameter.Value = value; }
    }

    /// <summary>Value of <see cref="FunctionTreeGrammarParameter"/>.</summary>
    public ISymbolicExpressionGrammar FunctionTreeGrammar {
      get { return FunctionTreeGrammarParameter.Value; }
      set { FunctionTreeGrammarParameter.Value = value; }
    }

    // Rebuilt by InitializeOperators(); not marked [Storable].
    private List<IOperator> operators;

    /// <summary>All operators offered by this problem.</summary>
    public override IEnumerable<IOperator> Operators {
      get { return operators; }
    }

    /// <summary>The subset of <see cref="Operators"/> that are analyzers.</summary>
    public IEnumerable<IAnalyzer> Analyzers {
      get { return operators.OfType<IAnalyzer>(); }
    }

    /// <summary>Start of the training partition; a fresh copy of the problem data's training start.</summary>
    public IntValue TrainingSamplesStart {
      get { return new IntValue(MultiVariateDataAnalysisProblemData.TrainingSamplesStart.Value); }
    }

    /// <summary>
    /// End of the training partition: the midpoint (integer division) of the problem data's
    /// training range. The remaining half is exposed as the validation partition.
    /// </summary>
    public IntValue TrainingSamplesEnd {
      get {
        int dataTrainingStart = MultiVariateDataAnalysisProblemData.TrainingSamplesStart.Value;
        int dataTrainingEnd = MultiVariateDataAnalysisProblemData.TrainingSamplesEnd.Value;
        return new IntValue((dataTrainingStart + dataTrainingEnd) / 2);
      }
    }

    /// <summary>Start of the validation partition; identical to <see cref="TrainingSamplesEnd"/>.</summary>
    public IntValue ValidationSamplesStart {
      get { return TrainingSamplesEnd; }
    }

    /// <summary>End of the validation partition; a fresh copy of the problem data's training end.</summary>
    public IntValue ValidationSamplesEnd {
      get { return new IntValue(MultiVariateDataAnalysisProblemData.TrainingSamplesEnd.Value); }
    }

    /// <summary>Start of the test partition, taken directly from the problem data.</summary>
    public IntValue TestSamplesStart {
      get { return MultiVariateDataAnalysisProblemData.TestSamplesStart; }
    }

    /// <summary>End of the test partition, taken directly from the problem data.</summary>
    public IntValue TestSamplesEnd {
      get { return MultiVariateDataAnalysisProblemData.TestSamplesEnd; }
    }

    /// <summary>
    /// Factor (fixed at 10.0) by which the observed target range is multiplied when the
    /// estimation limits are derived in <c>UpdateEstimationLimits</c>.
    /// </summary>
    public DoubleValue PunishmentFactor {
      get { return new DoubleValue(10.0); }
    }
    #endregion

    [Storable]
    private SymbolicVectorRegressionGrammar grammar;

    /// <summary>
    /// Creates the problem with default parameter values, then derives the grammar and the
    /// estimation limits from the current problem data and initializes operators and events.
    /// </summary>
    public SymbolicVectorRegressionProblem()
      : base() {
      SymbolicExpressionTreeCreator creator = new ProbabilisticTreeCreator();
      grammar = new SymbolicVectorRegressionGrammar(MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems.Count());
      var globalGrammar = new GlobalSymbolicExpressionGrammar(grammar);
      var interpreter = new SimpleArithmeticExpressionInterpreter();
      Parameters.Add(new ValueParameter<SymbolicExpressionTreeCreator>("SolutionCreator", "The operator which should be used to create new symbolic regression solutions.", creator));
      Parameters.Add(new ValueParameter<ISymbolicExpressionTreeInterpreter>("SymbolicExpressionTreeInterpreter", "The interpreter that should be used to evaluate the symbolic expression tree.", interpreter));
      Parameters.Add(new ValueParameter<ISymbolicExpressionGrammar>("FunctionTreeGrammar", "The grammar that should be used for symbolic regression models.", globalGrammar));
      Parameters.Add(new ValueParameter<IntValue>("MaxExpressionLength", "Maximal length of the symbolic expression.", new IntValue(100)));
      Parameters.Add(new ValueParameter<IntValue>("MaxExpressionDepth", "Maximal depth of the symbolic expression.", new IntValue(10)));
      Parameters.Add(new ValueParameter<IntValue>("MaxFunctionDefiningBranches", "Maximal number of automatically defined functions.", (IntValue)new IntValue(0).AsReadOnly()));
      Parameters.Add(new ValueParameter<IntValue>("MaxFunctionArguments", "Maximal number of arguments of automatically defined functions.", (IntValue)new IntValue(0).AsReadOnly()));
      // The limit parameters start without a value; UpdateEstimationLimits() below fills them.
      Parameters.Add(new ValueParameter<DoubleArray>("UpperEstimationLimit", "The upper limit for the estimated values for each component."));
      Parameters.Add(new ValueParameter<DoubleArray>("LowerEstimationLimit", "The lower limit for the estimated values for each component."));
      creator.SymbolicExpressionTreeParameter.ActualName = "SymbolicVectorRegressionModel";

      ParameterizeSolutionCreator();
      UpdateGrammar();
      UpdateEstimationLimits();
      Initialize();
    }

    /// <summary>
    /// Constructor marked for the persistence framework. It does no setup of its own;
    /// <see cref="AfterDeserializationHook"/> calls <c>Initialize</c> afterwards.
    /// </summary>
    // NOTE(review): this chains to base() rather than a deserializing base constructor — confirm this is intended.
    [StorableConstructor]
    private SymbolicVectorRegressionProblem(bool deserializing) : base() { }

    /// <summary>Rebuilds the operator list and event registrations after deserialization.</summary>
    [StorableHook(HookType.AfterDeserialization)]
    private void AfterDeserializationHook() {
      Initialize();
    }

    /// <summary>
    /// Clones the problem via the base implementation and re-runs <c>Initialize</c> on the
    /// clone so that it gets its own operator list and event registrations.
    /// </summary>
    public override IDeepCloneable Clone(Cloner cloner) {
      var clone = (SymbolicVectorRegressionProblem)base.Clone(cloner);
      clone.Initialize();
      return clone;
    }

    /// <summary>
    /// Subscribes to the <c>ValueChanged</c> events of the parameters themselves, which are
    /// handled when a parameter receives a new value object.
    /// </summary>
    private void RegisterParameterValueEvents() {
      // Detach before attaching so that calling this more than once never doubles a handler;
      // removing a handler that is not registered is a no-op.
      MaxFunctionArgumentsParameter.ValueChanged -= ArchitectureParameter_ValueChanged;
      MaxFunctionArgumentsParameter.ValueChanged += ArchitectureParameter_ValueChanged;
      MaxFunctionDefiningBranchesParameter.ValueChanged -= ArchitectureParameter_ValueChanged;
      MaxFunctionDefiningBranchesParameter.ValueChanged += ArchitectureParameter_ValueChanged;
      SolutionCreatorParameter.ValueChanged -= SolutionCreatorParameter_ValueChanged;
      SolutionCreatorParameter.ValueChanged += SolutionCreatorParameter_ValueChanged;
    }

    /// <summary>
    /// Subscribes to the events of the objects currently held by the parameters: the
    /// architecture values and the solution creator's tree parameter name.
    /// </summary>
    private void RegisterParameterEvents() {
      AttachArchitectureValueHandlers();
      AttachSolutionCreatorHandlers();
    }

    /// <summary>
    /// Hooks <c>ArchitectureParameterValue_ValueChanged</c> onto the current value objects of
    /// both architecture parameters, exactly once per value object.
    /// </summary>
    private void AttachArchitectureValueHandlers() {
      MaxFunctionArgumentsParameter.Value.ValueChanged -= ArchitectureParameterValue_ValueChanged;
      MaxFunctionArgumentsParameter.Value.ValueChanged += ArchitectureParameterValue_ValueChanged;
      MaxFunctionDefiningBranchesParameter.Value.ValueChanged -= ArchitectureParameterValue_ValueChanged;
      MaxFunctionDefiningBranchesParameter.Value.ValueChanged += ArchitectureParameterValue_ValueChanged;
    }

    /// <summary>
    /// Hooks the name-changed handler onto the current solution creator's tree parameter,
    /// exactly once per creator.
    /// </summary>
    private void AttachSolutionCreatorHandlers() {
      SolutionCreator.SymbolicExpressionTreeParameter.ActualNameChanged -= SolutionCreator_SymbolicExpressionTreeParameter_ActualNameChanged;
      SolutionCreator.SymbolicExpressionTreeParameter.ActualNameChanged += SolutionCreator_SymbolicExpressionTreeParameter_ActualNameChanged;
    }

    #region event handling
    /// <summary>
    /// Reacts to changed problem data by re-parameterizing the analyzers and rebuilding the
    /// grammar and the estimation limits.
    /// </summary>
    protected override void OnMultiVariateDataAnalysisProblemChanged(EventArgs e) {
      base.OnMultiVariateDataAnalysisProblemChanged(e);
      // partitions should be updated
      ParameterizeAnalyzers();
      // input variables should be updated
      UpdateGrammar();
      UpdateEstimationLimits();
    }

    /// <summary>Rebuilds the grammar after one of the architecture parameters changed.</summary>
    protected virtual void OnArchitectureParameterChanged(EventArgs e) {
      UpdateGrammar();
    }

    /// <summary>Extension point for subclasses; does nothing in this class.</summary>
    protected virtual void OnGrammarChanged(EventArgs e) { }

    /// <summary>Forwards to the base class' operators-changed notification.</summary>
    protected virtual void OnOperatorsChanged(EventArgs e) { RaiseOperatorsChanged(e); }

    /// <summary>
    /// Wires up a newly assigned solution creator: subscribes to its tree parameter name,
    /// points it at this problem's parameters, re-parameterizes the dependent operators and
    /// raises the solution-creator-changed notification.
    /// </summary>
    protected virtual void OnSolutionCreatorChanged(EventArgs e) {
      // Detach-then-attach (inside the helper) avoids a duplicate handler if the same
      // creator instance is assigned again.
      AttachSolutionCreatorHandlers();
      ParameterizeSolutionCreator();
      OnSolutionParameterNameChanged(e);
      RaiseSolutionCreatorChanged(e);
    }

    /// <summary>Propagates a changed tree parameter name to the analyzers and operators.</summary>
    protected virtual void OnSolutionParameterNameChanged(EventArgs e) {
      ParameterizeAnalyzers();
      ParameterizeOperators();
    }
    #endregion

    #region event handlers
    private void SolutionCreatorParameter_ValueChanged(object sender, EventArgs e) {
      OnSolutionCreatorChanged(e);
    }

    private void SolutionCreator_SymbolicExpressionTreeParameter_ActualNameChanged(object sender, EventArgs e) {
      OnSolutionParameterNameChanged(e);
    }

    private void ArchitectureParameter_ValueChanged(object sender, EventArgs e) {
      // Only one of the two parameters got a new value object, but both are (re)hooked here.
      // The helper detaches first, so the value object that was NOT replaced does not collect
      // an additional copy of the handler on every change.
      AttachArchitectureValueHandlers();
      OnArchitectureParameterChanged(e);
    }

    private void ArchitectureParameterValue_ValueChanged(object sender, EventArgs e) {
      OnArchitectureParameterChanged(e);
    }
    #endregion

    #region Helpers
    /// <summary>Appends an operator to the operator list.</summary>
    protected void AddOperator(IOperator op) {
      operators.Add(op);
    }

    /// <summary>Creates the operator list and registers all event handlers.</summary>
    private void Initialize() {
      InitializeOperators();
      RegisterParameterEvents();
      RegisterParameterValueEvents();
    }

    /// <summary>
    /// Adjusts the vector regression grammar to the checked target and input variables, then
    /// publishes a new global grammar, built with the current architecture limits, in the
    /// grammar parameter.
    /// </summary>
    private void UpdateGrammar() {
      var selectedTargetVariables = MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems;
      grammar.SetDimension(selectedTargetVariables.Count());
      foreach (var varSymbol in grammar.Symbols.OfType<HeuristicLab.Problems.DataAnalysis.Symbolic.Symbols.Variable>()) {
        varSymbol.VariableNames = MultiVariateDataAnalysisProblemData.InputVariables.CheckedItems.Select(x => x.Value.Value);
      }

      var globalGrammar = new GlobalSymbolicExpressionGrammar(grammar);
      globalGrammar.MaxFunctionArguments = MaxFunctionArguments.Value;
      globalGrammar.MaxFunctionDefinitions = MaxFunctionDefiningBranches.Value;
      FunctionTreeGrammar = globalGrammar;
    }

    /// <summary>
    /// Recomputes the estimation limits for every checked target variable as
    /// mean ± <see cref="PunishmentFactor"/> × (max − min) of its values in the training
    /// partition. Both limits are 0 when the training partition is empty.
    /// </summary>
    private void UpdateEstimationLimits() {
      // Materialize once: the Select(...) query is deferred and would otherwise be
      // re-evaluated for each Count() call and again for the loop.
      List<string> targetVariableNames = MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems
        .Select(x => x.Value.Value)
        .ToList();

      var upperLimits = new DoubleArray(targetVariableNames.Count);
      var lowerLimits = new DoubleArray(targetVariableNames.Count);
      UpperEstimationLimit = upperLimits;
      LowerEstimationLimit = lowerLimits;

      // Loop invariants: each of these property reads allocates a new wrapper object.
      int trainingStart = TrainingSamplesStart.Value;
      int trainingEnd = TrainingSamplesEnd.Value;
      double punishmentFactor = PunishmentFactor.Value;
      bool hasTrainingSamples = trainingStart < trainingEnd;

      for (int i = 0; i < targetVariableNames.Count; i++) {
        if (hasTrainingSamples) {
          var targetValues = MultiVariateDataAnalysisProblemData.Dataset.GetVariableValues(targetVariableNames[i], trainingStart, trainingEnd);
          var mean = targetValues.Average();
          var range = targetValues.Max() - targetValues.Min();
          upperLimits[i] = mean + punishmentFactor * range;
          lowerLimits[i] = mean - punishmentFactor * range;
        } else {
          upperLimits[i] = 0;
          lowerLimits[i] = 0;
        }
      }
    }

    /// <summary>
    /// Builds the operator list from all discoverable symbolic expression tree operators plus
    /// a tree size analyzer, then parameterizes them.
    /// </summary>
    private void InitializeOperators() {
      operators = new List<IOperator>();
      operators.AddRange(ApplicationManager.Manager.GetInstances<ISymbolicExpressionTreeOperator>().OfType<IOperator>());
      operators.Add(new MinAverageMaxSymbolicExpressionTreeSizeAnalyzer());
      // operators.Add(new SymbolicVectorRegressionVariableFrequencyAnalyzer());
      ParameterizeOperators();
      ParameterizeAnalyzers();
    }

    /// <summary>Points the solution creator's lookup names at this problem's parameters.</summary>
    private void ParameterizeSolutionCreator() {
      SymbolicExpressionTreeCreator creator = SolutionCreator;
      creator.SymbolicExpressionGrammarParameter.ActualName = FunctionTreeGrammarParameter.Name;
      creator.MaxTreeHeightParameter.ActualName = MaxExpressionDepthParameter.Name;
      creator.MaxTreeSizeParameter.ActualName = MaxExpressionLengthParameter.Name;
      creator.MaxFunctionArgumentsParameter.ActualName = MaxFunctionArgumentsParameter.Name;
      creator.MaxFunctionDefinitionsParameter.ActualName = MaxFunctionDefiningBranchesParameter.Name;
    }

    /// <summary>Makes every tree analyzer read the tree under the name the solution creator writes it to.</summary>
    private void ParameterizeAnalyzers() {
      string treeName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
      foreach (ISymbolicExpressionTreeAnalyzer analyzer in Analyzers.OfType<ISymbolicExpressionTreeAnalyzer>()) {
        analyzer.SymbolicExpressionTreeParameter.ActualName = treeName;
      }
      //foreach (var analyzer in Analyzers) {
      //  var varFreqAnalyzer = analyzer as SymbolicVectorRegressionVariableFrequencyAnalyzer;
      //  if (varFreqAnalyzer != null) {
      //    varFreqAnalyzer.ProblemDataParameter.ActualName = MultiVariateDataAnalysisProblemDataParameter.Name;
      //    varFreqAnalyzer.SymbolicExpressionTreeParameter.ActualName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
      //  }
      //}
    }

    /// <summary>
    /// Points the lookup names of all tree operators (general, crossover, manipulator and
    /// architecture manipulator) at this problem's parameters and the creator's tree name.
    /// </summary>
    private void ParameterizeOperators() {
      string treeName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;

      foreach (ISymbolicExpressionTreeOperator op in Operators.OfType<ISymbolicExpressionTreeOperator>()) {
        op.MaxTreeHeightParameter.ActualName = MaxExpressionDepthParameter.Name;
        op.MaxTreeSizeParameter.ActualName = MaxExpressionLengthParameter.Name;
        op.SymbolicExpressionGrammarParameter.ActualName = FunctionTreeGrammarParameter.Name;
      }
      foreach (ISymbolicExpressionTreeCrossover op in Operators.OfType<ISymbolicExpressionTreeCrossover>()) {
        op.ParentsParameter.ActualName = treeName;
        op.ChildParameter.ActualName = treeName;
      }
      foreach (ISymbolicExpressionTreeManipulator op in Operators.OfType<ISymbolicExpressionTreeManipulator>()) {
        op.SymbolicExpressionTreeParameter.ActualName = treeName;
      }
      foreach (ISymbolicExpressionTreeArchitectureManipulator op in Operators.OfType<ISymbolicExpressionTreeArchitectureManipulator>()) {
        op.MaxFunctionArgumentsParameter.ActualName = MaxFunctionArgumentsParameter.Name;
        op.MaxFunctionDefinitionsParameter.ActualName = MaxFunctionDefiningBranchesParameter.Name;
      }
    }
    #endregion

  }
}
Note: See TracBrowser for help on using the repository browser.