#region License Information
/* HeuristicLab
* Copyright (C) 2002-2010 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
*
* This file is part of HeuristicLab.
*
* HeuristicLab is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* HeuristicLab is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with HeuristicLab. If not, see .
*/
#endregion
using System;
using System.Collections.Generic;
using System.Linq;
using HeuristicLab.Common;
using HeuristicLab.Core;
using HeuristicLab.Data;
using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding.Analyzers;
using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding.Creators;
using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding.Interfaces;
using HeuristicLab.Optimization;
using HeuristicLab.Parameters;
using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
using HeuristicLab.PluginInfrastructure;
using HeuristicLab.Problems.DataAnalysis.Symbolic;
namespace HeuristicLab.Problems.DataAnalysis.MultiVariate.Regression.Symbolic {
[StorableClass]
public class SymbolicVectorRegressionProblem : MultiVariateDataAnalysisProblem, IProblem {
#region Parameter Properties
public new ValueParameter SolutionCreatorParameter {
get { return (ValueParameter)Parameters["SolutionCreator"]; }
}
IParameter IProblem.SolutionCreatorParameter {
get {
return SolutionCreatorParameter;
}
}
public ValueParameter SymbolicExpressionTreeInterpreterParameter {
get { return (ValueParameter)Parameters["SymbolicExpressionTreeInterpreter"]; }
}
public ValueParameter FunctionTreeGrammarParameter {
get { return (ValueParameter)Parameters["FunctionTreeGrammar"]; }
}
public ValueParameter MaxExpressionLengthParameter {
get { return (ValueParameter)Parameters["MaxExpressionLength"]; }
}
public ValueParameter MaxExpressionDepthParameter {
get { return (ValueParameter)Parameters["MaxExpressionDepth"]; }
}
public ValueParameter MaxFunctionDefiningBranchesParameter {
get { return (ValueParameter)Parameters["MaxFunctionDefiningBranches"]; }
}
public ValueParameter MaxFunctionArgumentsParameter {
get { return (ValueParameter)Parameters["MaxFunctionArguments"]; }
}
public ValueParameter UpperEstimationLimitParameter {
get { return (ValueParameter)Parameters["UpperEstimationLimit"]; }
}
public ValueParameter LowerEstimationLimitParameter {
get { return (ValueParameter)Parameters["LowerEstimationLimit"]; }
}
#endregion
#region Properties
public IntValue MaxExpressionLength {
get { return MaxExpressionLengthParameter.Value; }
set { MaxExpressionLengthParameter.Value = value; }
}
public IntValue MaxExpressionDepth {
get { return MaxExpressionDepthParameter.Value; }
set { MaxExpressionDepthParameter.Value = value; }
}
public IntValue MaxFunctionDefiningBranches {
get { return MaxFunctionDefiningBranchesParameter.Value; }
set { MaxFunctionDefiningBranchesParameter.Value = value; }
}
public IntValue MaxFunctionArguments {
get { return MaxFunctionArgumentsParameter.Value; }
set { MaxFunctionArgumentsParameter.Value = value; }
}
public new SymbolicExpressionTreeCreator SolutionCreator {
get { return SolutionCreatorParameter.Value; }
set { SolutionCreatorParameter.Value = value; }
}
public DoubleArray UpperEstimationLimit {
get { return UpperEstimationLimitParameter.Value; }
set { UpperEstimationLimitParameter.Value = value; }
}
public DoubleArray LowerEstimationLimit {
get { return LowerEstimationLimitParameter.Value; }
set { LowerEstimationLimitParameter.Value = value; }
}
ISolutionCreator IProblem.SolutionCreator {
get { return SolutionCreatorParameter.Value; }
}
public ISymbolicExpressionTreeInterpreter SymbolicExpressionTreeInterpreter {
get { return SymbolicExpressionTreeInterpreterParameter.Value; }
set { SymbolicExpressionTreeInterpreterParameter.Value = value; }
}
public ISymbolicExpressionGrammar FunctionTreeGrammar {
get { return (ISymbolicExpressionGrammar)FunctionTreeGrammarParameter.Value; }
set { FunctionTreeGrammarParameter.Value = value; }
}
public override IEnumerable Operators {
get { return operators; }
}
public IEnumerable Analyzers {
get { return operators.OfType(); }
}
public IntValue TrainingSamplesStart {
get { return new IntValue(MultiVariateDataAnalysisProblemData.TrainingSamplesStart.Value); }
}
public IntValue TrainingSamplesEnd {
get {
return new IntValue((MultiVariateDataAnalysisProblemData.TrainingSamplesStart.Value +
MultiVariateDataAnalysisProblemData.TrainingSamplesEnd.Value) / 2);
}
}
public IntValue ValidationSamplesStart {
get { return TrainingSamplesEnd; }
}
public IntValue ValidationSamplesEnd {
get { return new IntValue(MultiVariateDataAnalysisProblemData.TrainingSamplesEnd.Value); }
}
public IntValue TestSamplesStart {
get { return MultiVariateDataAnalysisProblemData.TestSamplesStart; }
}
public IntValue TestSamplesEnd {
get { return MultiVariateDataAnalysisProblemData.TestSamplesEnd; }
}
public DoubleValue PunishmentFactor {
get { return new DoubleValue(10.0); }
}
#endregion
[Storable]
private SymbolicVectorRegressionGrammar grammar;
[Storable]
private List operators;
[StorableConstructor]
protected SymbolicVectorRegressionProblem(bool deserializing) : base(deserializing) { }
protected SymbolicVectorRegressionProblem(SymbolicVectorRegressionProblem original, Cloner cloner)
: base(original, cloner) {
operators = original.operators.Select(x => (IOperator)cloner.Clone(x)).ToList();
RegisterParameterEvents();
RegisterParameterValueEvents();
}
public SymbolicVectorRegressionProblem()
: base() {
SymbolicExpressionTreeCreator creator = new ProbabilisticTreeCreator();
grammar = new SymbolicVectorRegressionGrammar(MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems.Count());
var globalGrammar = new GlobalSymbolicExpressionGrammar(grammar);
var interpreter = new SimpleArithmeticExpressionInterpreter();
Parameters.Add(new ValueParameter("SolutionCreator", "The operator which should be used to create new symbolic regression solutions.", creator));
Parameters.Add(new ValueParameter("SymbolicExpressionTreeInterpreter", "The interpreter that should be used to evaluate the symbolic expression tree.", interpreter));
Parameters.Add(new ValueParameter("FunctionTreeGrammar", "The grammar that should be used for symbolic regression models.", globalGrammar));
Parameters.Add(new ValueParameter("MaxExpressionLength", "Maximal length of the symbolic expression.", new IntValue(100)));
Parameters.Add(new ValueParameter("MaxExpressionDepth", "Maximal depth of the symbolic expression.", new IntValue(10)));
Parameters.Add(new ValueParameter("MaxFunctionDefiningBranches", "Maximal number of automatically defined functions.", (IntValue)new IntValue(0).AsReadOnly()));
Parameters.Add(new ValueParameter("MaxFunctionArguments", "Maximal number of arguments of automatically defined functions.", (IntValue)new IntValue(0).AsReadOnly()));
Parameters.Add(new ValueParameter("UpperEstimationLimit", "The upper limit for the estimated values for each component."));
Parameters.Add(new ValueParameter("LowerEstimationLimit", "The lower limit for the estimated values for each component."));
creator.SymbolicExpressionTreeParameter.ActualName = "SymbolicVectorRegressionModel";
ParameterizeSolutionCreator();
UpdateGrammar();
UpdateEstimationLimits();
InitializeOperators();
RegisterParameterEvents();
RegisterParameterValueEvents();
}
[StorableHook(HookType.AfterDeserialization)]
private void AfterDeserialization() {
// BackwardsCompatibility3.3
#region Backwards compatible code (remove with 3.4)
if (operators == null) InitializeOperators();
#endregion
RegisterParameterEvents();
RegisterParameterValueEvents();
}
public override IDeepCloneable Clone(Cloner cloner) {
return new SymbolicVectorRegressionProblem(this, cloner);
}
private void RegisterParameterValueEvents() {
MaxFunctionArgumentsParameter.ValueChanged += new EventHandler(ArchitectureParameter_ValueChanged);
MaxFunctionDefiningBranchesParameter.ValueChanged += new EventHandler(ArchitectureParameter_ValueChanged);
SolutionCreatorParameter.ValueChanged += new EventHandler(SolutionCreatorParameter_ValueChanged);
}
private void RegisterParameterEvents() {
MaxFunctionArgumentsParameter.Value.ValueChanged += new EventHandler(ArchitectureParameterValue_ValueChanged);
MaxFunctionDefiningBranchesParameter.Value.ValueChanged += new EventHandler(ArchitectureParameterValue_ValueChanged);
SolutionCreator.SymbolicExpressionTreeParameter.ActualNameChanged += new EventHandler(SolutionCreator_SymbolicExpressionTreeParameter_ActualNameChanged);
}
#region event handling
protected override void OnMultiVariateDataAnalysisProblemChanged(EventArgs e) {
base.OnMultiVariateDataAnalysisProblemChanged(e);
int dimension = MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems.Count();
// paritions should be updated
ParameterizeAnalyzers();
// input variables should be updated
UpdateGrammar();
UpdateEstimationLimits();
}
protected virtual void OnArchitectureParameterChanged(EventArgs e) {
UpdateGrammar();
}
protected virtual void OnGrammarChanged(EventArgs e) { }
protected virtual void OnOperatorsChanged(EventArgs e) { RaiseOperatorsChanged(e); }
protected virtual void OnSolutionCreatorChanged(EventArgs e) {
SolutionCreator.SymbolicExpressionTreeParameter.ActualNameChanged += new EventHandler(SolutionCreator_SymbolicExpressionTreeParameter_ActualNameChanged);
ParameterizeSolutionCreator();
OnSolutionParameterNameChanged(e);
RaiseSolutionCreatorChanged(e);
}
protected virtual void OnSolutionParameterNameChanged(EventArgs e) {
ParameterizeAnalyzers();
ParameterizeOperators();
}
#endregion
#region event handlers
private void SolutionCreatorParameter_ValueChanged(object sender, EventArgs e) {
OnSolutionCreatorChanged(e);
}
private void SolutionCreator_SymbolicExpressionTreeParameter_ActualNameChanged(object sender, EventArgs e) {
OnSolutionParameterNameChanged(e);
}
private void ArchitectureParameter_ValueChanged(object sender, EventArgs e) {
MaxFunctionArgumentsParameter.Value.ValueChanged += new EventHandler(ArchitectureParameterValue_ValueChanged);
MaxFunctionDefiningBranchesParameter.Value.ValueChanged += new EventHandler(ArchitectureParameterValue_ValueChanged);
OnArchitectureParameterChanged(e);
}
private void ArchitectureParameterValue_ValueChanged(object sender, EventArgs e) {
OnArchitectureParameterChanged(e);
}
#endregion
#region Helpers
protected void AddOperator(IOperator op) {
operators.Add(op);
}
private void UpdateGrammar() {
var selectedTargetVariables = MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems;
grammar.SetDimension(selectedTargetVariables.Count());
foreach (var varSymbol in grammar.Symbols.OfType()) {
varSymbol.VariableNames = MultiVariateDataAnalysisProblemData.InputVariables.CheckedItems.Select(x => x.Value.Value);
}
var globalGrammar = new GlobalSymbolicExpressionGrammar(grammar);
globalGrammar.MaxFunctionArguments = MaxFunctionArguments.Value;
globalGrammar.MaxFunctionDefinitions = MaxFunctionDefiningBranches.Value;
FunctionTreeGrammar = globalGrammar;
}
private void UpdateEstimationLimits() {
IEnumerable selectedTargetVariables = MultiVariateDataAnalysisProblemData.TargetVariables.CheckedItems.Select(x => x.Value.Value);
UpperEstimationLimit = new DoubleArray(selectedTargetVariables.Count());
LowerEstimationLimit = new DoubleArray(selectedTargetVariables.Count());
int i = 0;
foreach (string targetVariable in selectedTargetVariables) {
if (TrainingSamplesStart.Value < TrainingSamplesEnd.Value) {
var targetValues = MultiVariateDataAnalysisProblemData.Dataset.GetVariableValues(targetVariable, TrainingSamplesStart.Value, TrainingSamplesEnd.Value);
var mean = targetValues.Average();
var range = targetValues.Max() - targetValues.Min();
UpperEstimationLimit[i] = mean + PunishmentFactor.Value * range;
LowerEstimationLimit[i] = mean - PunishmentFactor.Value * range;
} else {
UpperEstimationLimit[i] = 0;
LowerEstimationLimit[i] = 0;
}
i++;
}
}
private void InitializeOperators() {
operators = new List();
operators.AddRange(ApplicationManager.Manager.GetInstances().OfType());
operators.Add(new MinAverageMaxSymbolicExpressionTreeSizeAnalyzer());
// operators.Add(new SymbolicVectorRegressionVariableFrequencyAnalyzer());
ParameterizeOperators();
ParameterizeAnalyzers();
}
private void ParameterizeSolutionCreator() {
SolutionCreator.SymbolicExpressionGrammarParameter.ActualName = FunctionTreeGrammarParameter.Name;
SolutionCreator.MaxTreeHeightParameter.ActualName = MaxExpressionDepthParameter.Name;
SolutionCreator.MaxTreeSizeParameter.ActualName = MaxExpressionLengthParameter.Name;
SolutionCreator.MaxFunctionArgumentsParameter.ActualName = MaxFunctionArgumentsParameter.Name;
SolutionCreator.MaxFunctionDefinitionsParameter.ActualName = MaxFunctionDefiningBranchesParameter.Name;
}
private void ParameterizeAnalyzers() {
foreach (ISymbolicExpressionTreeAnalyzer analyzer in Analyzers.OfType()) {
analyzer.SymbolicExpressionTreeParameter.ActualName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
}
//foreach (var analyzer in Analyzers) {
// var varFreqAnalyzer = analyzer as SymbolicVectorRegressionVariableFrequencyAnalyzer;
// if (varFreqAnalyzer != null) {
// varFreqAnalyzer.ProblemDataParameter.ActualName = MultiVariateDataAnalysisProblemDataParameter.Name;
// varFreqAnalyzer.SymbolicExpressionTreeParameter.ActualName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
// }
//}
}
private void ParameterizeOperators() {
foreach (ISymbolicExpressionTreeOperator op in Operators.OfType()) {
op.MaxTreeHeightParameter.ActualName = MaxExpressionDepthParameter.Name;
op.MaxTreeSizeParameter.ActualName = MaxExpressionLengthParameter.Name;
op.SymbolicExpressionGrammarParameter.ActualName = FunctionTreeGrammarParameter.Name;
}
foreach (ISymbolicExpressionTreeCrossover op in Operators.OfType()) {
op.ParentsParameter.ActualName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
op.ChildParameter.ActualName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
}
foreach (ISymbolicExpressionTreeManipulator op in Operators.OfType()) {
op.SymbolicExpressionTreeParameter.ActualName = SolutionCreator.SymbolicExpressionTreeParameter.ActualName;
}
foreach (ISymbolicExpressionTreeArchitectureManipulator op in Operators.OfType()) {
op.MaxFunctionArgumentsParameter.ActualName = MaxFunctionArgumentsParameter.Name;
op.MaxFunctionDefinitionsParameter.ActualName = MaxFunctionDefiningBranchesParameter.Name;
}
}
#endregion
}
}