Free cookie consent management tool by TermsFeed Policy Generator

source: branches/DataAnalysis/HeuristicLab.Problems.DataAnalysis/3.3/Operators/WeightedParentsQualityVarianceComparator.cs @ 4631

Last change on this file since 4631 was 4193, checked in by gkronber, 14 years ago

Created a feature/exploration branch for new data analysis features #1142

File size: 7.0 KB
Rev Line
[3378]1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2010 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Linq;
[4044]24using alglib;
[3378]25using HeuristicLab.Core;
26using HeuristicLab.Data;
27using HeuristicLab.Operators;
[4044]28using HeuristicLab.Optimization;
[3378]29using HeuristicLab.Parameters;
30using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
31
namespace HeuristicLab.Problems.DataAnalysis.Operators {
  /// <summary>
  /// Compares the quality of a child (the "left side") against the best of its parents
  /// (the "right side") using a two-sample unpooled (Welch) t-test on the qualities,
  /// their variances and the number of samples they were estimated from.
  /// The result is <c>true</c> unless the child is significantly worse than the best parent.
  /// </summary>
  [Item("WeightedParentsQualityVarianceComparator", "Compares the quality and variance of the quality against that of its parents (assumes the parents are subscopes to the child scope). This operator works with any number of subscopes > 0.")]
  [StorableClass]
  public class WeightedParentsQualityVarianceComparator : SingleSuccessorOperator, ISubScopesQualityComparator {
    /// <summary>True if larger quality values are better, false if smaller values are better.</summary>
    public IValueLookupParameter<BoolValue> MaximizationParameter {
      get { return (IValueLookupParameter<BoolValue>)Parameters["Maximization"]; }
    }
    /// <summary>Receives the outcome of the comparison (written by <see cref="Apply"/>).</summary>
    public ILookupParameter<BoolValue> ResultParameter {
      get { return (ILookupParameter<BoolValue>)Parameters["Result"]; }
    }
    /// <summary>
    /// Threshold the two-tailed p-value is compared against (default 0.05).
    /// </summary>
    public IValueLookupParameter<DoubleValue> ConfidenceIntervalParameter {
      get { return (IValueLookupParameter<DoubleValue>)Parameters["ConfidenceInterval"]; }
    }
    /// <summary>Quality of the child.</summary>
    public ILookupParameter<DoubleValue> LeftSideParameter {
      get { return (ILookupParameter<DoubleValue>)Parameters["LeftSide"]; }
    }
    /// <summary>Variance of the quality of the child.</summary>
    public ILookupParameter<DoubleValue> LeftSideVarianceParameter {
      get { return (ILookupParameter<DoubleValue>)Parameters["LeftSideVariance"]; }
    }
    /// <summary>Number of samples used to calculate the quality of the child.</summary>
    public ILookupParameter<IntValue> LeftSideSamplesParameter {
      get { return (ILookupParameter<IntValue>)Parameters["LeftSideSamples"]; }
    }
    /// <summary>Qualities of the parents.</summary>
    public ILookupParameter<ItemArray<DoubleValue>> RightSideParameter {
      get { return (ILookupParameter<ItemArray<DoubleValue>>)Parameters["RightSide"]; }
    }
    /// <summary>Variances of the qualities of the parents.</summary>
    public ILookupParameter<ItemArray<DoubleValue>> RightSideVariancesParameters {
      get { return (ILookupParameter<ItemArray<DoubleValue>>)Parameters["RightSideVariances"]; }
    }
    /// <summary>Number of samples used to calculate the quality of each parent.</summary>
    public ILookupParameter<ItemArray<IntValue>> RightSideSamplesParameters {
      get { return (ILookupParameter<ItemArray<IntValue>>)Parameters["RightSideSamples"]; }
    }

    /// <summary>
    /// Creates the operator and registers all of its parameters.
    /// </summary>
    public WeightedParentsQualityVarianceComparator()
      : base() {
      Parameters.Add(new ValueLookupParameter<BoolValue>("Maximization", "True if the problem is a maximization problem, false otherwise"));
      Parameters.Add(new LookupParameter<BoolValue>("Result", "The result of the comparison: True means Quality is better, False means it is worse than parents."));
      Parameters.Add(new ValueLookupParameter<DoubleValue>("ConfidenceInterval", "The confidence interval used for the test.", new DoubleValue(0.05)));

      Parameters.Add(new LookupParameter<DoubleValue>("LeftSide", "The quality of the child."));
      Parameters.Add(new LookupParameter<DoubleValue>("LeftSideVariance", "The variances of the quality of the new child."));
      Parameters.Add(new LookupParameter<IntValue>("LeftSideSamples", "The number of samples used to calculate the quality of the new child."));

      Parameters.Add(new ScopeTreeLookupParameter<DoubleValue>("RightSide", "The qualities of the parents."));
      Parameters.Add(new ScopeTreeLookupParameter<DoubleValue>("RightSideVariances", "The variances of the parents."));
      Parameters.Add(new ScopeTreeLookupParameter<IntValue>("RightSideSamples", "The number of samples used to calculate the quality of the parent."));
    }

    /// <summary>
    /// Selects the best parent (maximum or minimum quality, depending on the Maximization
    /// parameter), tests the child against it and stores the outcome in the Result parameter.
    /// </summary>
    /// <returns>The operation returned by the base implementation.</returns>
    /// <exception cref="InvalidOperationException">Thrown when no parent qualities are available.</exception>
    public override IOperation Apply() {
      double leftQuality = LeftSideParameter.ActualValue.Value;
      double leftVariance = LeftSideVarianceParameter.ActualValue.Value;
      int leftSamples = LeftSideSamplesParameter.ActualValue.Value;

      ItemArray<DoubleValue> rightQualities = RightSideParameter.ActualValue;
      ItemArray<DoubleValue> rightVariances = RightSideVariancesParameters.ActualValue;
      ItemArray<IntValue> rightSamples = RightSideSamplesParameters.ActualValue;

      if (rightQualities.Length < 1) throw new InvalidOperationException(Name + ": No subscopes found.");
      bool maximization = MaximizationParameter.ActualValue.Value;
      double threshold = ConfidenceIntervalParameter.ActualValue.Value;

      // The child is only ever compared against the single best parent.
      double bestParentQuality = maximization
        ? rightQualities.Max(x => x.Value)
        : rightQualities.Min(x => x.Value);
      int bestParentIndex = rightQualities.FindIndex(x => x.Value == bestParentQuality);
      double bestParentVariance = rightVariances[bestParentIndex].Value;
      int bestParentSamples = rightSamples[bestParentIndex].Value;

      bool childIsBetter = maximization
        ? leftQuality > bestParentQuality
        : leftQuality < bestParentQuality;

      // Reject only if the child is significantly worse: accept when the difference is
      // not significant, or when it is significant in the child's favour.
      bool result;
      double bothTails;
      if (TryCalculateTwoTailedPValue(leftQuality, leftVariance, leftSamples,
                                      bestParentQuality, bestParentVariance, bestParentSamples,
                                      out bothTails)) {
        result = bothTails > threshold || childIsBetter;
      } else {
        // The test is undefined for these inputs; fall back to the plain quality comparison.
        result = childIsBetter;
      }

      BoolValue resultValue = ResultParameter.ActualValue;
      if (resultValue == null) {
        ResultParameter.ActualValue = new BoolValue(result);
      } else {
        resultValue.Value = result;
      }
      return base.Apply();
    }

    /// <summary>
    /// Calculates the two-tailed p-value of a two-sample unpooled (Welch) t-test.
    /// Adapted from the ALGLIB Student t-test implementation.
    /// </summary>
    /// <param name="xmean">Mean of the first sample.</param>
    /// <param name="xvar">Variance of the first sample.</param>
    /// <param name="n">Size of the first sample.</param>
    /// <param name="ymean">Mean of the second sample.</param>
    /// <param name="yvar">Variance of the second sample.</param>
    /// <param name="m">Size of the second sample.</param>
    /// <param name="bothTails">The two-tailed p-value, or NaN if the test could not be calculated.</param>
    /// <returns>
    /// False if the test is undefined for the given inputs (fewer than two samples on either
    /// side, a combined standard error that is not a positive finite number, or a statistic or
    /// degrees of freedom that are not finite); true otherwise.
    /// </returns>
    private static bool TryCalculateTwoTailedPValue(double xmean, double xvar, int n,
                                                    double ymean, double yvar, int m,
                                                    out double bothTails) {
      bothTails = double.NaN;
      if (n < 2 || m < 2) return false;

      double xSquaredError = xvar / n;
      double ySquaredError = yvar / m;
      double squaredError = xSquaredError + ySquaredError;
      // !(x > 0) is also true for NaN
      if (!(squaredError > 0) || double.IsInfinity(squaredError)) return false;

      double stat = (xmean - ymean) / Math.Sqrt(squaredError);
      double c = xSquaredError / squaredError;
      // Welch-Satterthwaite: 1/df = c^2/(n-1) + (1-c)^2/(m-1)
      double df = (n - 1.0) * (m - 1.0) / ((m - 1.0) * AP.Math.Sqr(c) + (n - 1.0) * AP.Math.Sqr(1 - c));
      if (double.IsNaN(stat) || double.IsInfinity(stat)) return false;
      if (double.IsNaN(df) || double.IsInfinity(df) || df <= 0) return false;

      // Student t CDF at stat, expressed through the regularized incomplete beta function.
      double tail = 0.5 * ibetaf.incompletebeta(df / 2, 0.5, df / (df + AP.Math.Sqr(stat)));
      double p = stat > 0 ? 1 - tail : tail;
      bothTails = 2 * Math.Min(p, 1 - p);
      return true;
    }
  }
}
Note: See TracBrowser for help on using the repository browser.