Context Navigation

← Previous Change
Next Change →

Changeset 16311 for branches/2845_EnhancedProgress/HeuristicLab.Algorithms.DataAnalysis/3.4/TSNE/TSNEStatic.cs

Timestamp:

11/20/18 15:26:57 (5 years ago)

Author:

pfleck

Message:

#2845 Merged trunk changes into branch (15406-15681, 15683-16308)

Location:

branches/2845_EnhancedProgress

Files:

4 edited

. (modified) (1 prop)
HeuristicLab.Algorithms.DataAnalysis (modified) (1 prop)
HeuristicLab.Algorithms.DataAnalysis/3.4 (modified) (1 prop)
HeuristicLab.Algorithms.DataAnalysis/3.4/TSNE/TSNEStatic.cs (modified) (28 diffs)

Legend:

- Unmodified
- Added
- Removed

branches/2845_EnhancedProgress

Property svn:mergeinfo changed

/branches/2839_HiveProjectManagement (added)	merged: 15761,15767-15768,15777,15792,15813,15819,15908,15913-15914,15920,15922,15925,15933,15953-15956,15966,15969,15978,15992,15995,16040,16043-16044,16050,16057,16060,16062,16064,16066,16068,16072,16089,16091-16095,16116
/branches/2916_IndexedDataTableSerialization (added)	merged: 15918
/branches/HiveProjectManagement (added)	merged: 15377-15380,15399,15401,15411-15412,15422,15496-15497,15500,15503,15508,15523,15526-15528,15530,15540,15546-15547,15552,15557,15559,15567,15576-15577,15580,15627-15628,15630,15641-15644,15658-15659,15666,15671,15715-15716,15737,15742,15760
/stable	merged: 15587-15588
/trunk (added)	merged: 15706-15708,15727-15730,15738-15739,15751-15755,15766,15769,15782-15783,15785-15787,15789-15790,15793,15796-15799,15802,15810,15818,15829,15839,15845,15853-15855,15869,15871,15882,15891,15902,15931-15932,15934,15940,15951-15952,15972,15983,15998-15999,16015,16021,16023-16025,16032-16033,16054,16059,16063,16071,16084-16086,16117-16118,16120,16122,16168-16169,16177,16179,16184-16187,16202-16209,16211,16213,16216,16218-16219,16221,16223-16224,16232,16241-16244,16252,16255,16257-16261,16263-16264,16266-16267,16269-16274,16276-16280,16283-16287,16289-16294,16296-16298,16301-16302,16305
/trunk/sources (added)	merged: 15408-15409,15419,15427,15447-15448,15452,15461,15464,15478,15480-15481,15483,15486,15498-15499,15502,15505,15513,15517-15518,15532,15534,15545,15548,15551,15556,15560,15566,15581,15583,15589-15591,15594,15596,15598,15607,15610-15611,15619,15621-15623,15626,15637-15638,15645,15665,15667,15672-15674

branches/2845_EnhancedProgress/HeuristicLab.Algorithms.DataAnalysis

Property svn:mergeinfo changed

/branches/2839_HiveProjectManagement/HeuristicLab.Algorithms.DataAnalysis (added)	merged: 16057,16092
/stable/HeuristicLab.Algorithms.DataAnalysis	merged: 15587
/trunk/HeuristicLab.Algorithms.DataAnalysis (added)	merged: 15739,15769,15783,15786,15854,15869,16071,16086,16117,16168,16243
/trunk/sources/HeuristicLab.Algorithms.DataAnalysis (added)	merged: 15464,15499,15502,15505,15532,15545,15548,15551,15556,15581,15583,15589

branches/2845_EnhancedProgress/HeuristicLab.Algorithms.DataAnalysis/3.4

Property svn:mergeinfo set to (toggle deleted branches)

/branches/2839_HiveProjectManagement/HeuristicLab.Algorithms.DataAnalysis/3.4	merged	eligible
/stable/HeuristicLab.Algorithms.DataAnalysis/3.4	merged	eligible
/trunk/HeuristicLab.Algorithms.DataAnalysis/3.4	merged	eligible
/branches/1721-RandomForestPersistence/HeuristicLab.Algorithms.DataAnalysis/3.4	10321-10322
/branches/Async/HeuristicLab.Algorithms.DataAnalysis/3.4	13329-15286
/branches/Benchmarking/sources/HeuristicLab.Algorithms.DataAnalysis/3.4	6917-7005
/branches/ClassificationModelComparison/HeuristicLab.Algorithms.DataAnalysis/3.4	9070-13099
/branches/CloningRefactoring/HeuristicLab.Algorithms.DataAnalysis/3.4	4656-4721
/branches/DataAnalysis Refactoring/HeuristicLab.Algorithms.DataAnalysis/3.4	5471-5808
/branches/DataAnalysis SolutionEnsembles/HeuristicLab.Algorithms.DataAnalysis/3.4	5815-6180
/branches/DataAnalysis/HeuristicLab.Algorithms.DataAnalysis/3.4	4458-4459,4462,4464
/branches/DataPreprocessing/HeuristicLab.Algorithms.DataAnalysis/3.4	10085-11101
/branches/GP.Grammar.Editor/HeuristicLab.Algorithms.DataAnalysis/3.4	6284-6795
/branches/GP.Symbols (TimeLag, Diff, Integral)/HeuristicLab.Algorithms.DataAnalysis/3.4	5060
/branches/HeuristicLab.DatasetRefactor/sources/HeuristicLab.Algorithms.DataAnalysis/3.4	11570-12508
/branches/HeuristicLab.Problems.Orienteering/HeuristicLab.Algorithms.DataAnalysis/3.4	11130-12721
/branches/HeuristicLab.RegressionSolutionGradientView/HeuristicLab.Algorithms.DataAnalysis/3.4	13819-14091
/branches/HeuristicLab.TimeSeries/HeuristicLab.Algorithms.DataAnalysis/3.4	8116-8789
/branches/LogResidualEvaluator/HeuristicLab.Algorithms.DataAnalysis/3.4	10202-10483
/branches/NET40/sources/HeuristicLab.Algorithms.DataAnalysis/3.4	5138-5162
/branches/ParallelEngine/HeuristicLab.Algorithms.DataAnalysis/3.4	5175-5192
/branches/ProblemInstancesRegressionAndClassification/HeuristicLab.Algorithms.DataAnalysis/3.4	7773-7810
/branches/QAPAlgorithms/HeuristicLab.Algorithms.DataAnalysis/3.4	6350-6627
/branches/Restructure trunk solution/HeuristicLab.Algorithms.DataAnalysis/3.4	6828
/branches/SpectralKernelForGaussianProcesses/HeuristicLab.Algorithms.DataAnalysis/3.4	10204-10479
/branches/SuccessProgressAnalysis/HeuristicLab.Algorithms.DataAnalysis/3.4	5370-5682
/branches/Trunk/HeuristicLab.Algorithms.DataAnalysis/3.4	6829-6865
/branches/VNS/HeuristicLab.Algorithms.DataAnalysis/3.4	5594-5752
/branches/Weighted TSNE/3.4	15451-15531
/branches/histogram/HeuristicLab.Algorithms.DataAnalysis/3.4	5959-6341
/branches/symbreg-factors-2650/HeuristicLab.Algorithms.DataAnalysis/3.4	14232-14825
/trunk/sources/HeuristicLab.Algorithms.DataAnalysis/3.4	15406-15681

branches/2845_EnhancedProgress/HeuristicLab.Algorithms.DataAnalysis/3.4/TSNE/TSNEStatic.cs

-                      r16308
+                      r16311
 #region License Information
 /* HeuristicLab
  * Copyright (C) 2002-2016 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
+ * Copyright (C) 2002-2018 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
+ *
  * This file is part of HeuristicLab.
 …
   [StorableClass]
   public class TSNEStatic<T> {
     [StorableClass]
     public sealed class TSNEState : DeepCloneable {
 …
       [StorableConstructor]
       public TSNEState(bool deserializing) { }
+      public TSNEState(T[] data, IDistance<T> distance, IRandom random, int newDimensions, double perplexity, double theta, int stopLyingIter, int momSwitchIter, double momentum, double finalMomentum, double eta) {
+      public TSNEState(IReadOnlyList<T> data, IDistance<T> distance, IRandom random, int newDimensions, double perplexity,
+        double theta, int stopLyingIter, int momSwitchIter, double momentum, double finalMomentum, double eta, bool randomInit) {
         this.distance = distance;
         this.random = random;
 …
         // initialize
         noDatapoints = data.Length;
+        noDatapoints = data.Count;
         if (noDatapoints - 1 < 3 * perplexity)
           throw new ArgumentException("Perplexity too large for the number of data points!");
 …
         gains = new double[noDatapoints, newDimensions];
         for (var i = 0; i < noDatapoints; i++)
           for (var j = 0; j < newDimensions; j++)
             gains[i, j] = 1.0;
+        for (var j = 0; j < newDimensions; j++)
+          gains[i, j] = 1.0;
         p = null;
 …
         var rand = new NormalDistributedRandom(random, 0, 1);
         for (var i = 0; i < noDatapoints; i++)
+          for (var j = 0; j < newDimensions; j++)
+            newData[i, j] = rand.NextDouble() * .0001;
+        for (var j = 0; j < newDimensions; j++)
+          newData[i, j] = rand.NextDouble() * .0001;
+        if (!(data[0] is IReadOnlyList<double>) || randomInit) return;
+        for (var i = 0; i < noDatapoints; i++)
+        for (var j = 0; j < newDimensions; j++) {
+          var row = (IReadOnlyList<double>) data[i];
+          newData[i, j] = row[j % row.Count];
+        }
+      }
       #endregion
       public double EvaluateError() {
+        return exact ?
+          EvaluateErrorExact(p, newData, noDatapoints, newDimensions) :
+          EvaluateErrorApproximate(rowP, colP, valP, newData, theta);
+        return exact ? EvaluateErrorExact(p, newData, noDatapoints, newDimensions) : EvaluateErrorApproximate(rowP, colP, valP, newData, theta);
+      }
       #region Helpers
       private static void CalculateApproximateSimilarities(T[] data, IDistance<T> distance, double perplexity, out int[] rowP, out int[] colP, out double[] valP) {
+      private static void CalculateApproximateSimilarities(IReadOnlyList<T> data, IDistance<T> distance, double perplexity, out int[] rowP, out int[] colP, out double[] valP) {
         // Compute asymmetric pairwise input similarities
         ComputeGaussianPerplexity(data, distance, out rowP, out colP, out valP, perplexity, (int)(3 * perplexity));
+        ComputeGaussianPerplexity(data, distance, out rowP, out colP, out valP, perplexity, (int) (3 * perplexity));
         // Symmetrize input similarities
         int[] sRowP, symColP;
 …
         valP = sValP;
         var sumP = .0;
+        for (var i = 0; i < rowP[data.Length]; i++) sumP += valP[i];
+        for (var i = 0; i < rowP[data.Length]; i++) valP[i] /= sumP;
+      }
+      private static double[,] CalculateExactSimilarites(T[] data, IDistance<T> distance, double perplexity) {
+        for (var i = 0; i < rowP[data.Count]; i++) sumP += valP[i];
+        for (var i = 0; i < rowP[data.Count]; i++) valP[i] /= sumP;
+      }
+      private static double[,] CalculateExactSimilarites(IReadOnlyList<T> data, IDistance<T> distance, double perplexity) {
         // Compute similarities
         var p = new double[data.Length, data.Length];
+        var p = new double[data.Count, data.Count];
         ComputeGaussianPerplexity(data, distance, p, perplexity);
         // Symmetrize input similarities
         for (var n = 0; n < data.Length; n++) {
           for (var m = n + 1; m < data.Length; m++) {
+        for (var n = 0; n < data.Count; n++) {
+          for (var m = n + 1; m < data.Count; m++) {
             p[n, m] += p[m, n];
             p[m, n] = p[n, m];
 …
+        }
         var sumP = .0;
+        for (var i = 0; i < data.Length; i++) for (var j = 0; j < data.Length; j++) sumP += p[i, j];
+        for (var i = 0; i < data.Length; i++) for (var j = 0; j < data.Length; j++) p[i, j] /= sumP;
+        for (var i = 0; i < data.Count; i++) {
+          for (var j = 0; j < data.Count; j++) {
+            sumP += p[i, j];
+          }
+        }
+        for (var i = 0; i < data.Count; i++) {
+          for (var j = 0; j < data.Count; j++) {
+            p[i, j] /= sumP;
+          }
+        }
         return p;
+      }
       private static void ComputeGaussianPerplexity(IReadOnlyList<T> x, IDistance<T> distance, out int[] rowP, out int[] colP, out double[] valP, double perplexity, int k) {
         if (perplexity > k) throw new ArgumentException("Perplexity should be lower than k!");
 …
           // Iterate until we found a good perplexity
+          var iter = 0; double sumP = 0;
+          var iter = 0;
+          double sumP = 0;
           while (!found && iter < 200) {
             // Compute Gaussian kernel row
             for (var m = 0; m < k; m++) curP[m] = Math.Exp(-beta * distances[m + 1]);
 …
             if (hdiff < tol && -hdiff < tol) {
               found = true;
+            } else {
+            }
+            else {
               if (hdiff > 0) {
                 minBeta = beta;
 …
                 else
                   beta = (beta + maxBeta) / 2.0;
+              } else {
+              }
+              else {
                 maxBeta = beta;
                 if (minBeta.IsAlmost(double.MinValue) || minBeta.IsAlmost(double.MaxValue))
 …
+        }
+      }
       private static void ComputeGaussianPerplexity(T[] x, IDistance<T> distance, double[,] p, double perplexity) {
+      private static void ComputeGaussianPerplexity(IReadOnlyList<T> x, IDistance<T> distance, double[,] p, double perplexity) {
         // Compute the distance matrix
         var dd = ComputeDistances(x, distance);
         var n = x.Length;
+        var n = x.Count;
         // Compute the Gaussian kernel row by row
         for (var i = 0; i < n; i++) {
 …
           // Iterate until we found a good perplexity
           var iter = 0;
           while (!found && iter < 200) {      // 200 iterations as in tSNE implementation by van der Maarten
+          while (!found && iter < 200) { // 200 iterations as in tSNE implementation by van der Maarten
             // Compute Gaussian kernel row
 …
             if (hdiff < tol && -hdiff < tol) {
               found = true;
+            } else {
+            }
+            else {
               if (hdiff > 0) {
                 minBeta = beta;
 …
                 else
                   beta = (beta + maxBeta) / 2.0;
+              } else {
+              }
+              else {
                 maxBeta = beta;
                 if (minBeta.IsAlmost(double.MinValue) || minBeta.IsAlmost(double.MaxValue))
 …
+        }
+      }
+      private static double[][] ComputeDistances(T[] x, IDistance<T> distance) {
+        var res = new double[x.Length][];
+        for (var r = 0; r < x.Length; r++) {
+          var rowV = new double[x.Length];
+      private static double[][] ComputeDistances(IReadOnlyList<T> x, IDistance<T> distance) {
+        var res = new double[x.Count][];
+        for (var r = 0; r < x.Count; r++) {
+          var rowV = new double[x.Count];
           // all distances must be symmetric
           for (var c = 0; c < r; c++) {
 …
+          }
           rowV[r] = 0.0; // distance to self is zero for all distances
           for (var c = r + 1; c < x.Length; c++) {
+          for (var c = r + 1; c < x.Count; c++) {
             rowV[c] = distance.Get(x[r], x[c]);
+          }
 …
         // return x.Select(m => x.Select(n => distance.Get(m, n)).ToArray()).ToArray();
+      }
       private static double EvaluateErrorExact(double[,] p, double[,] y, int n, int d) {
         // Compute the squared Euclidean distance matrix
 …
               q[n1, m] = 1 / (1 + dd[n1, m]);
               sumQ += q[n1, m];
+            } else q[n1, m] = double.Epsilon;
+            }
+            else q[n1, m] = double.Epsilon;
+          }
+        }
 …
         var c = .0;
         for (var i = 0; i < n; i++)
           for (var j = 0; j < n; j++) {
             c += p[i, j] * Math.Log((p[i, j] + float.Epsilon) / (q[i, j] + float.Epsilon));
+          }
+        for (var j = 0; j < n; j++) {
+          c += p[i, j] * Math.Log((p[i, j] + float.Epsilon) / (q[i, j] + float.Epsilon));
+        }
         return c;
+      }
       private static double EvaluateErrorApproximate(IReadOnlyList<int> rowP, IReadOnlyList<int> colP, IReadOnlyList<double> valP, double[,] y, double theta) {
         // Get estimate of normalization term
 …
+      }
       private static void SymmetrizeMatrix(IReadOnlyList<int> rowP, IReadOnlyList<int> colP, IReadOnlyList<double> valP, out int[] symRowP, out int[] symColP, out double[] symValP) {
         // Count number of elements and row counts of symmetric matrix
         var n = rowP.Count - 1;
 …
         for (var j = 0; j < n; j++) {
           for (var i = rowP[j]; i < rowP[j + 1]; i++) {
             // Check whether element (col_P[i], n) is present
             var present = false;
 …
         var offset = new int[n];
         for (var j = 0; j < n; j++) {
           for (var i = rowP[j]; i < rowP[j + 1]; i++) {                                  // considering element(n, colP[i])
+          for (var i = rowP[j]; i < rowP[j + 1]; i++) { // considering element(n, colP[i])
             // Check whether element (col_P[i], n) is present
 …
     public static double[,] Run(T[] data, IDistance<T> distance, IRandom random,
       int newDimensions = 2, double perplexity = 25, int iterations = 1000,
+      double theta = 0,
+      int stopLyingIter = 0, int momSwitchIter = 0, double momentum = .5,
+      double theta = 0, int stopLyingIter = 0, int momSwitchIter = 0, double momentum = .5,
       double finalMomentum = .8, double eta = 10.0
       ) {
+    ) {
       var state = CreateState(data, distance, random, newDimensions, perplexity,
         theta, stopLyingIter, momSwitchIter, momentum, finalMomentum, eta);
 …
       int newDimensions = 2, double perplexity = 25, double theta = 0,
       int stopLyingIter = 0, int momSwitchIter = 0, double momentum = .5,
       double finalMomentum = .8, double eta = 10.0
       ) {
       return new TSNEState(data, distance, random, newDimensions, perplexity, theta, stopLyingIter, momSwitchIter, momentum, finalMomentum, eta);
+      double finalMomentum = .8, double eta = 10.0, bool randomInit = true
+    ) {
+      return new TSNEState(data, distance, random, newDimensions, perplexity, theta, stopLyingIter, momSwitchIter, momentum, finalMomentum, eta, randomInit);
+    }
 …
         for (var j = 0; j < state.newDimensions; j++) {
           state.gains[i, j] = Math.Sign(state.dY[i, j]) != Math.Sign(state.uY[i, j])
             ? state.gains[i, j] + .2  // +0.2 nd *0.8 are used in two separate implementations of tSNE -> seems to be correct
+            ? state.gains[i, j] + .2 // +0.2 nd *0.8 are used in two separate implementations of tSNE -> seems to be correct
             : state.gains[i, j] * .8;
           if (state.gains[i, j] < .01) state.gains[i, j] = .01;
+        }
+      }
       // Perform gradient update (with momentum and gains)
       for (var i = 0; i < state.noDatapoints; i++)
         for (var j = 0; j < state.newDimensions; j++)
           state.uY[i, j] = state.currentMomentum * state.uY[i, j] - state.eta * state.gains[i, j] * state.dY[i, j];
+      for (var j = 0; j < state.newDimensions; j++)
+        state.uY[i, j] = state.currentMomentum * state.uY[i, j] - state.eta * state.gains[i, j] * state.dY[i, j];
       for (var i = 0; i < state.noDatapoints; i++)
         for (var j = 0; j < state.newDimensions; j++)
           state.newData[i, j] = state.newData[i, j] + state.uY[i, j];
+      for (var j = 0; j < state.newDimensions; j++)
+        state.newData[i, j] = state.newData[i, j] + state.uY[i, j];
       // Make solution zero-mean
 …
         if (state.exact)
           for (var i = 0; i < state.noDatapoints; i++)
             for (var j = 0; j < state.noDatapoints; j++)
               state.p[i, j] /= 12.0;
+          for (var j = 0; j < state.noDatapoints; j++)
+            state.p[i, j] /= 12.0;
         else
           for (var i = 0; i < state.rowP[state.noDatapoints]; i++)
 …
       // Compute final t-SNE gradient
       for (var i = 0; i < n; i++)
         for (var j = 0; j < d; j++) {
           dC[i, j] = posF[i, j] - negF[i, j] / sumQ;
+        }
+      for (var j = 0; j < d; j++) {
+        dC[i, j] = posF[i, j] - negF[i, j] / sumQ;
+      }
+    }

Note: See TracChangeset for help on using the changeset viewer.

Download in other formats:

Update cookies preferences