Free cookie consent management tool by TermsFeed Policy Generator

source: trunk/sources/HeuristicLab.Problems.Instances.DataAnalysis/3.3/Classification/UCI/UCIInstanceProvider.cs @ 8889

Last change on this file since 8889 was 8889, checked in by sforsten, 10 years ago

#1941: Added IUCIDataDescriptor to attach more information to the datasets, so that different versions of a dataset can be distinguished (as suggested by abeham).

File size: 2.9 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2012 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.IO;
25using System.Linq;
26using ICSharpCode.SharpZipLib.Zip;
27
28namespace HeuristicLab.Problems.Instances.DataAnalysis {
29  public class UCIInstanceProvider : ResourceClassificationInstanceProvider {
30    public override string Name {
31      get { return "UCI Problems"; }
32    }
33    public override string Description {
34      get {
35        return "";
36      }
37    }
38    public override Uri WebLink {
39      get { return new Uri("http://archive.ics.uci.edu/ml/datasets.html"); }
40    }
41    public override string ReferencePublication {
42      get { return ""; }
43    }
44
45    protected override string FileName { get { return "UCI"; } }
46
47    public override IEnumerable<IDataDescriptor> GetDataDescriptors() {
48      List<IUCIDataDescriptor> descriptorList = new List<IUCIDataDescriptor>();
49      descriptorList.Add(new Iris());
50      descriptorList.Add(new Mammography());
51      descriptorList.Add(new Thyroid());
52      descriptorList.Add(new Wine());
53      var solutionsArchiveName = GetResourceName(FileName + @"\.zip");
54      if (!String.IsNullOrEmpty(solutionsArchiveName)) {
55        using (var solutionsZipFile = new ZipInputStream(GetType().Assembly.GetManifestResourceStream(solutionsArchiveName))) {
56          IList<string> entries = new List<string>();
57          ZipEntry curEntry;
58          while ((curEntry = solutionsZipFile.GetNextEntry()) != null) {
59            entries.Add(curEntry.Name);
60          }
61          foreach (var entry in entries.OrderBy(x => x)) {
62            string prettyName = Path.GetFileNameWithoutExtension(entry);
63            IUCIDataDescriptor desc = descriptorList.Where(x => x.Name.Equals(prettyName)).FirstOrDefault();
64            prettyName = String.Format("{0}, {1}, {2}", prettyName, desc.Donor, desc.Year);
65            if (desc != null) {
66              yield return new ResourceClassificationDataDescriptor(prettyName, desc.Description, entry);
67            } else
68              yield return new ResourceClassificationDataDescriptor(prettyName, Description, entry);
69          }
70        }
71      }
72    }
73  }
74}
Note: See TracBrowser for help on using the repository browser.