Free cookie consent management tool by TermsFeed Policy Generator

source: branches/ScatterSearch (trunk integration)/HeuristicLab.Problems.Instances.DataAnalysis/3.3/Clustering/ClusteringInstanceProvider.cs @ 8086

Last change on this file since 8086 was 8086, checked in by jkarder, 13 years ago

#1331:

  • synced branch with trunk
  • added custom interface (ISimilarityBasedOperator) to mark operators that conduct similarity calculation
  • similarity calculators are now parameterized by the algorithm
  • deleted SolutionPool2TierUpdateMethod
  • deleted KnapsackMultipleGuidesPathRelinker
  • moved IImprovementOperator, IPathRelinker and ISimilarityCalculator to HeuristicLab.Optimization
  • added parameter descriptions
  • fixed plugin references
  • fixed count of EvaluatedSolutions
  • fixed check for duplicate solutions
  • minor code improvements
File size: 3.0 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2012 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.IO;
25using System.Text;
26using HeuristicLab.Problems.DataAnalysis;
27
namespace HeuristicLab.Problems.Instances.DataAnalysis {
  /// <summary>
  /// Base class for providers of clustering problem instances. Implements loading an
  /// instance from a table file and saving an instance as semicolon-separated text;
  /// descriptor-based loading and the provider metadata are left to subclasses.
  /// </summary>
  public abstract class ClusteringInstanceProvider : IProblemInstanceProvider<IClusteringProblemData> {
    // Field separator written by SaveData.
    private const char ColumnSeparator = ';';

    // Both separators are accepted so that the instance name is extracted correctly
    // regardless of which one the caller used to build the path.
    private static readonly char[] DirectorySeparators = new[] { '\\', '/' };

    /// <summary>
    /// Parses the table file at <paramref name="path"/> and wraps it in clustering problem data.
    /// The first two thirds of the rows (integer division) become the training partition,
    /// the remaining rows the test partition. The instance name is the part of
    /// <paramref name="path"/> after the last directory separator.
    /// </summary>
    /// <param name="path">Path of the file to parse.</param>
    /// <returns>The problem data built from the parsed file.</returns>
    /// <exception cref="ArgumentNullException"><paramref name="path"/> is null.</exception>
    public IClusteringProblemData LoadData(string path) {
      if (path == null) throw new ArgumentNullException("path");

      var csvFileParser = new TableFileParser();
      csvFileParser.Parse(path);

      var dataset = new Dataset(csvFileParser.VariableNames, csvFileParser.Values);
      var claData = new ClusteringProblemData(dataset, dataset.DoubleVariables);

      int trainingPartEnd = csvFileParser.Rows * 2 / 3;
      claData.TrainingPartition.Start = 0;
      claData.TrainingPartition.End = trainingPartEnd;
      claData.TestPartition.Start = trainingPartEnd;
      claData.TestPartition.End = csvFileParser.Rows;

      // Use the file name (without directories) as instance name; a path without
      // any separator is used as-is.
      int pos = path.LastIndexOfAny(DirectorySeparators);
      claData.Name = pos < 0 ? path : path.Substring(pos + 1);

      return claData;
    }

    /// <summary>
    /// Writes the dataset of <paramref name="instance"/> to <paramref name="path"/> as
    /// semicolon-separated text: one header line with the variable names followed by one
    /// line per dataset row. The whole text is built in memory before the file is opened.
    /// </summary>
    /// <param name="instance">The problem data whose dataset is written.</param>
    /// <param name="path">Path of the file to create or overwrite.</param>
    /// <exception cref="ArgumentNullException">
    /// <paramref name="instance"/> or <paramref name="path"/> is null.
    /// </exception>
    public void SaveData(IClusteringProblemData instance, string path) {
      if (instance == null) throw new ArgumentNullException("instance");
      if (path == null) throw new ArgumentNullException("path");

      var dataset = instance.Dataset;
      var strBuilder = new StringBuilder();

      // The header must describe every column that is written below. The rows contain
      // all dataset columns, so the header lists all dataset variables rather than only
      // the input variables (which may be a subset and would misalign the columns).
      // NOTE(review): assumes Dataset.VariableNames enumerates the variables in the same
      // order as the column index used by GetValue - confirm against Dataset.
      bool first = true;
      foreach (var variable in dataset.VariableNames) {
        // Separator goes before every non-first field, so nothing has to be trimmed
        // afterwards and an empty variable list simply yields an empty header line.
        if (!first) strBuilder.Append(ColumnSeparator);
        strBuilder.Append(variable);
        first = false;
      }
      strBuilder.AppendLine();

      for (int i = 0; i < dataset.Rows; i++) {
        for (int j = 0; j < dataset.Columns; j++) {
          if (j > 0) strBuilder.Append(ColumnSeparator);
          strBuilder.Append(dataset.GetValue(i, j));
        }
        strBuilder.AppendLine();
      }

      using (var writer = new StreamWriter(path)) {
        writer.Write(strBuilder.ToString());
      }
    }

    public abstract IEnumerable<IDataDescriptor> GetDataDescriptors();
    public abstract IClusteringProblemData LoadData(IDataDescriptor descriptor);

    public abstract string Name { get; }
    public abstract string Description { get; }
    public abstract Uri WebLink { get; }
    public abstract string ReferencePublication { get; }
  }
}
Note: See TracBrowser for help on using the repository browser.