[5717] | 1 | #region License Information
|
---|
| 2 | /* HeuristicLab
|
---|
| 3 | * Copyright (C) 2002-2011 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
|
---|
| 4 | *
|
---|
| 5 | * This file is part of HeuristicLab.
|
---|
| 6 | *
|
---|
| 7 | * HeuristicLab is free software: you can redistribute it and/or modify
|
---|
| 8 | * it under the terms of the GNU General Public License as published by
|
---|
| 9 | * the Free Software Foundation, either version 3 of the License, or
|
---|
| 10 | * (at your option) any later version.
|
---|
| 11 | *
|
---|
| 12 | * HeuristicLab is distributed in the hope that it will be useful,
|
---|
| 13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
---|
| 14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
---|
| 15 | * GNU General Public License for more details.
|
---|
| 16 | *
|
---|
| 17 | * You should have received a copy of the GNU General Public License
|
---|
| 18 | * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
|
---|
| 19 | */
|
---|
| 20 | #endregion
|
---|
| 21 |
|
---|
| 22 | using System;
|
---|
| 23 | using System.Collections.Generic;
|
---|
| 24 | using System.Linq;
|
---|
| 25 | using HeuristicLab.Common;
|
---|
[6256] | 26 | using HeuristicLab.Encodings.SymbolicExpressionTreeEncoding;
|
---|
[5717] | 27 | using HeuristicLab.Problems.DataAnalysis.Symbolic.Views;
|
---|
| 28 |
|
---|
| 29 | namespace HeuristicLab.Problems.DataAnalysis.Symbolic.Classification.Views {
|
---|
| 30 | public partial class InteractiveSymbolicDiscriminantFunctionClassificationSolutionSimplifierView : InteractiveSymbolicDataAnalysisSolutionSimplifierView {
|
---|
| 31 | private readonly ConstantTreeNode constantNode;
|
---|
| 32 | private readonly SymbolicExpressionTree tempTree;
|
---|
| 33 |
|
---|
| 34 | public new SymbolicDiscriminantFunctionClassificationSolution Content {
|
---|
| 35 | get { return (SymbolicDiscriminantFunctionClassificationSolution)base.Content; }
|
---|
| 36 | set { base.Content = value; }
|
---|
| 37 | }
|
---|
| 38 |
|
---|
| 39 | public InteractiveSymbolicDiscriminantFunctionClassificationSolutionSimplifierView()
|
---|
| 40 | : base() {
|
---|
| 41 | InitializeComponent();
|
---|
| 42 | this.Caption = "Interactive Classification Solution Simplifier";
|
---|
| 43 |
|
---|
| 44 | constantNode = ((ConstantTreeNode)new Constant().CreateTreeNode());
|
---|
| 45 | ISymbolicExpressionTreeNode root = new ProgramRootSymbol().CreateTreeNode();
|
---|
| 46 | ISymbolicExpressionTreeNode start = new StartSymbol().CreateTreeNode();
|
---|
[5736] | 47 | root.AddSubtree(start);
|
---|
[5717] | 48 | tempTree = new SymbolicExpressionTree(root);
|
---|
| 49 | }
|
---|
| 50 |
|
---|
| 51 | protected override void UpdateModel(ISymbolicExpressionTree tree) {
|
---|
[5736] | 52 | Content.Model = new SymbolicDiscriminantFunctionClassificationModel(tree, Content.Model.Interpreter);
|
---|
[7027] | 53 | // the default policy for setting thresholds in classification models is the accuarcy maximizing policy.
|
---|
| 54 | // This is rather slow to calculate and can lead to a very laggy UI in the interactive solution simplifier.
|
---|
| 55 | // However, since we automatically prune sub-trees based on the threshold reaching the maximum accuracy we must
|
---|
| 56 | // also use maximum accuracy threshold calculation here in order to prevent incoherent behavior of the simplifier.
|
---|
| 57 | Content.SetAccuracyMaximizingThresholds();
|
---|
[5717] | 58 | }
|
---|
| 59 |
|
---|
| 60 | protected override Dictionary<ISymbolicExpressionTreeNode, double> CalculateReplacementValues(ISymbolicExpressionTree tree) {
|
---|
| 61 | Dictionary<ISymbolicExpressionTreeNode, double> replacementValues = new Dictionary<ISymbolicExpressionTreeNode, double>();
|
---|
[5993] | 62 | foreach (ISymbolicExpressionTreeNode node in tree.Root.GetSubtree(0).GetSubtree(0).IterateNodesPrefix()) {
|
---|
| 63 | replacementValues[node] = CalculateReplacementValue(node, tree);
|
---|
[5717] | 64 | }
|
---|
| 65 | return replacementValues;
|
---|
| 66 | }
|
---|
| 67 |
|
---|
| 68 | protected override Dictionary<ISymbolicExpressionTreeNode, double> CalculateImpactValues(ISymbolicExpressionTree tree) {
|
---|
| 69 | var interpreter = Content.Model.Interpreter;
|
---|
| 70 | var dataset = Content.ProblemData.Dataset;
|
---|
| 71 | var rows = Content.ProblemData.TrainingIndizes;
|
---|
| 72 | string targetVariable = Content.ProblemData.TargetVariable;
|
---|
| 73 | Dictionary<ISymbolicExpressionTreeNode, double> impactValues = new Dictionary<ISymbolicExpressionTreeNode, double>();
|
---|
[5736] | 74 | List<ISymbolicExpressionTreeNode> nodes = tree.Root.GetSubtree(0).GetSubtree(0).IterateNodesPostfix().ToList();
|
---|
[5717] | 75 |
|
---|
[6740] | 76 | var targetClassValues = dataset.GetDoubleValues(targetVariable, rows);
|
---|
[5717] | 77 | var originalOutput = interpreter.GetSymbolicExpressionTreeValues(tree, dataset, rows)
|
---|
[5736] | 78 | .LimitToRange(Content.Model.LowerEstimationLimit, Content.Model.UpperEstimationLimit)
|
---|
[5717] | 79 | .ToArray();
|
---|
| 80 | double[] classValues;
|
---|
| 81 | double[] thresholds;
|
---|
[6438] | 82 | // normal distribution cut points are used as thresholds here because they are a lot faster to calculate than the accuracy maximizing thresholds
|
---|
[5717] | 83 | NormalDistributionCutPointsThresholdCalculator.CalculateThresholds(Content.ProblemData, originalOutput, targetClassValues, out classValues, out thresholds);
|
---|
[5736] | 84 | var classifier = new SymbolicDiscriminantFunctionClassificationModel(tree, interpreter);
|
---|
| 85 | classifier.SetThresholdsAndClassValues(thresholds, classValues);
|
---|
[5942] | 86 | OnlineCalculatorError errorState;
|
---|
| 87 | double originalAccuracy = OnlineAccuracyCalculator.Calculate(targetClassValues, classifier.GetEstimatedClassValues(dataset, rows), out errorState);
|
---|
| 88 | if (errorState != OnlineCalculatorError.None) originalAccuracy = 0.0;
|
---|
[5717] | 89 |
|
---|
| 90 | foreach (ISymbolicExpressionTreeNode node in nodes) {
|
---|
| 91 | var parent = node.Parent;
|
---|
[5993] | 92 | constantNode.Value = CalculateReplacementValue(node, tree);
|
---|
[5717] | 93 | ISymbolicExpressionTreeNode replacementNode = constantNode;
|
---|
| 94 | SwitchNode(parent, node, replacementNode);
|
---|
[5736] | 95 | var newOutput = interpreter.GetSymbolicExpressionTreeValues(tree, dataset, rows)
|
---|
| 96 | .LimitToRange(Content.Model.LowerEstimationLimit, Content.Model.UpperEstimationLimit)
|
---|
| 97 | .ToArray();
|
---|
[5717] | 98 | NormalDistributionCutPointsThresholdCalculator.CalculateThresholds(Content.ProblemData, newOutput, targetClassValues, out classValues, out thresholds);
|
---|
[5736] | 99 | classifier = new SymbolicDiscriminantFunctionClassificationModel(tree, interpreter);
|
---|
| 100 | classifier.SetThresholdsAndClassValues(thresholds, classValues);
|
---|
[5942] | 101 | double newAccuracy = OnlineAccuracyCalculator.Calculate(targetClassValues, classifier.GetEstimatedClassValues(dataset, rows), out errorState);
|
---|
| 102 | if (errorState != OnlineCalculatorError.None) newAccuracy = 0.0;
|
---|
[5717] | 103 |
|
---|
| 104 | // impact = 0 if no change
|
---|
| 105 | // impact < 0 if new solution is better
|
---|
| 106 | // impact > 0 if new solution is worse
|
---|
| 107 | impactValues[node] = originalAccuracy - newAccuracy;
|
---|
| 108 | SwitchNode(parent, replacementNode, node);
|
---|
| 109 | }
|
---|
| 110 | return impactValues;
|
---|
| 111 | }
|
---|
| 112 |
|
---|
[5993] | 113 | private double CalculateReplacementValue(ISymbolicExpressionTreeNode node, ISymbolicExpressionTree sourceTree) {
|
---|
| 114 | // remove old ADFs
|
---|
[6803] | 115 | while (tempTree.Root.SubtreeCount > 1) tempTree.Root.RemoveSubtree(1);
|
---|
[5993] | 116 | // clone ADFs of source tree
|
---|
[6803] | 117 | for (int i = 1; i < sourceTree.Root.SubtreeCount; i++) {
|
---|
[5993] | 118 | tempTree.Root.AddSubtree((ISymbolicExpressionTreeNode)sourceTree.Root.GetSubtree(i).Clone());
|
---|
[6256] | 119 | }
|
---|
[5736] | 120 | var start = tempTree.Root.GetSubtree(0);
|
---|
[6803] | 121 | while (start.SubtreeCount > 0) start.RemoveSubtree(0);
|
---|
[5736] | 122 | start.AddSubtree((ISymbolicExpressionTreeNode)node.Clone());
|
---|
[5717] | 123 | var interpreter = Content.Model.Interpreter;
|
---|
| 124 | var rows = Content.ProblemData.TrainingIndizes;
|
---|
| 125 | return interpreter.GetSymbolicExpressionTreeValues(tempTree, Content.ProblemData.Dataset, rows).Median();
|
---|
| 126 | }
|
---|
| 127 |
|
---|
| 128 |
|
---|
| 129 | private void SwitchNode(ISymbolicExpressionTreeNode root, ISymbolicExpressionTreeNode oldBranch, ISymbolicExpressionTreeNode newBranch) {
|
---|
[6803] | 130 | for (int i = 0; i < root.SubtreeCount; i++) {
|
---|
[5736] | 131 | if (root.GetSubtree(i) == oldBranch) {
|
---|
| 132 | root.RemoveSubtree(i);
|
---|
| 133 | root.InsertSubtree(i, newBranch);
|
---|
[5717] | 134 | return;
|
---|
| 135 | }
|
---|
| 136 | }
|
---|
| 137 | }
|
---|
[6256] | 138 |
|
---|
| 139 | protected override void btnOptimizeConstants_Click(object sender, EventArgs e) {
|
---|
| 140 |
|
---|
| 141 | }
|
---|
[5717] | 142 | }
|
---|
| 143 | }
|
---|