Changeset 8658 for trunk/sources/HeuristicLab.Problems.DataAnalysis
- Timestamp:
- 09/14/12 18:48:07 (12 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
trunk/sources/HeuristicLab.Problems.DataAnalysis/3.4/Implementation/Classification/ThresholdCalculators/NormalDistributionCutPointsThresholdCalculator.cs
r8638 r8658 93 93 } 94 94 thresholdList.Sort(); 95 thresholdList.Insert(0, double.NegativeInfinity); 95 96 // add small value and large value for the calculation of most influential class in each thresholded section 97 thresholdList.Insert(0, estimatedValues.Min() - 1); 98 thresholdList.Add(estimatedValues.Max() + 1); 96 99 97 100 // determine class values for each partition separated by a threshold by calculating the density of all class distributions 98 101 // all points in the partition are classified as the class with the maximal density in the parition 99 102 List<double> classValuesList = new List<double>(); 100 if (thresholdList.Count == 1) {103 if (thresholdList.Count == 2) { 101 104 // this happens if there are no thresholds (distributions for all classes are exactly the same) 102 105 // -> all samples should be classified as the first class … … 105 108 // at least one reasonable threshold ... 106 109 // find the most likely class for the points between thresholds m 107 for (int i = 0; i < thresholdList.Count; i++) { 108 double m; 109 if (double.IsNegativeInfinity(thresholdList[i])) { 110 m = thresholdList[i + 1] - 1.0; // smaller than the smallest non-infinity threshold 111 } else if (i == thresholdList.Count - 1) { 112 // last threshold 113 m = thresholdList[i] + 1.0; // larger than the last threshold 114 } else { 115 m = thresholdList[i] + (thresholdList[i + 1] - thresholdList[i]) / 2.0; // middle of partition 116 } 117 118 // determine class with maximal probability density in m 119 double maxDensity = LogNormalDensity(m, classMean[originalClasses[0]], classStdDev[originalClasses[0]]); 110 for (int i = 0; i < thresholdList.Count - 1; i++) { 111 112 // determine class with maximal density mass between the thresholds 113 double maxDensity = LogNormalDensityMass(thresholdList[i], thresholdList[i + 1], classMean[originalClasses[0]], classStdDev[originalClasses[0]]); 120 114 double maxDensityClassValue = originalClasses[0]; 121 115 foreach (var classValue in originalClasses.Skip(1)) { 122 double density = LogNormalDensity (m, classMean[classValue], classStdDev[classValue]);116 double density = LogNormalDensityMass(thresholdList[i], thresholdList[i + 1], classMean[classValue], classStdDev[classValue]); 123 117 if (density > maxDensity) { 124 118 maxDensity = density; … … 139 133 // / / /\s \ \ 140 134 // -/---/-/ -\---\-\---- 135 141 136 List<double> filteredThresholds = new List<double>(); 142 137 List<double> filteredClassValues = new List<double>(); 143 filteredThresholds.Add( thresholdList[0]);138 filteredThresholds.Add(double.NegativeInfinity); // the smallest possible threshold for the first class 144 139 filteredClassValues.Add(classValuesList[0]); 140 // do not include the last threshold which was just needed for the previous step 145 141 for (int i = 0; i < classValuesList.Count - 1; i++) { 146 142 if (!classValuesList[i].IsAlmost(classValuesList[i + 1])) { … … 153 149 } 154 150 151 private static double LogNormalDensityMass(double lower, double upper, double mu, double sigma) { 152 if (sigma.IsAlmost(0.0)) { 153 if (lower < mu && mu < upper) return double.PositiveInfinity; // log(1) 154 else return double.NegativeInfinity; // log(0) 155 } 156 157 Func<double, double> f = (x) => 158 x * -0.5 * Math.Log(2.0 * Math.PI * sigma * sigma) - Math.Pow(x - mu, 3) / (3 * 2.0 * sigma * sigma); 159 160 if (double.IsNegativeInfinity(lower)) return f(upper); 161 else return f(upper) - f(lower); 162 } 163 155 164 private static double LogNormalDensity(double x, double mu, double sigma) { 156 if (sigma.IsAlmost(0.0)) 157 if ( mu.IsAlmost(x)) return 0.0; // (log(1))165 if (sigma.IsAlmost(0.0)) { 166 if (x.IsAlmost(mu)) return 0.0; // log(1); 158 167 else return double.NegativeInfinity; 159 return -0.5 * Math.Log(2.0 * Math.PI * sigma * sigma) - ((x - mu) * (x - mu)) / (2.0 * sigma * sigma); 168 } 169 170 return -0.5 * Math.Log(2.0 * Math.PI * sigma * sigma) - Math.Pow(x - mu, 2) / (2.0 * sigma * sigma); 160 171 } 161 172 … … 176 187 x2 = m2; 177 188 } else { 178 // scale s1 and s2 for numeric stability 179 s2 = s2 / s1; 180 s1 = 1.0; 181 double a = (s1 + s2) * (s1 - s2); 182 double g = Math.Sqrt(s1 * s1 * s2 * s2 * ((m1 - m2) * (m1 - m2) + 2.0 * (s1 * s1 + s2 * s2) * Math.Log(s2 / s1))); 183 double m1s2 = m1 * s2 * s2; 184 double m2s1 = m2 * s1 * s1; 185 x1 = -(-m2s1 + m1s2 + g) / a; 186 x2 = (m2s1 - m1s2 + g) / a; 189 if (s2 < s1) { 190 // make sure s2 is the larger std.dev. 191 CalculateCutPoints(m2, s2, m1, s1, out x1, out x2); 192 } else { 193 // scale s1 and s2 for numeric stability 194 //s2 = s2 / s1; 195 //s1 = 1.0; 196 double a = (s1 + s2) * (s1 - s2); 197 double g = Math.Sqrt(s1 * s1 * s2 * s2 * ((m1 - m2) * (m1 - m2) + 2.0 * (s1 * s1 + s2 * s2) * Math.Log(s2 / s1))); 198 double m1s2 = m1 * s2 * s2; 199 double m2s1 = m2 * s1 * s1; 200 x1 = -(-m2s1 + m1s2 + g) / a; 201 x2 = (m2s1 - m1s2 + g) / a; 202 } 187 203 } 188 204 }
Note: See TracChangeset
for help on using the changeset viewer.