Changeset 8585 for branches/HeuristicLab.Mono/HeuristicLab.Problems.Instances.DataAnalysis/3.3/Classification/CSV/ClassifiactionCSVInstanceProvider.cs
- Timestamp:
- 09/06/12 09:52:52 (12 years ago)
- Location:
- branches/HeuristicLab.Mono
- Files:
-
- 2 edited
Legend:
- Unmodified
- Added
- Removed
-
branches/HeuristicLab.Mono
-
branches/HeuristicLab.Mono/HeuristicLab.Problems.Instances.DataAnalysis/3.3/Classification/CSV/ClassifiactionCSVInstanceProvider.cs
r8211 r8585 22 22 using System; 23 23 using System.Collections.Generic; 24 using System.Globalization; 24 25 using System.IO; 25 26 using System.Linq; 26 27 using System.Text; 28 using HeuristicLab.Common; 27 29 using HeuristicLab.Problems.DataAnalysis; 28 30 … … 61 63 62 64 Dataset dataset = new Dataset(csvFileParser.VariableNames, csvFileParser.Values); 63 string targetVar = csvFileParser.VariableNames.Where(x => dataset.DoubleVariables.Contains(x)).Last(); 64 IEnumerable<string> allowedInputVars = dataset.DoubleVariables.Where(x => !x.Equals(targetVar)); 65 string targetVar = dataset.DoubleVariables.Last(); 65 66 66 ClassificationProblemData claData = new ClassificationProblemData(dataset, allowedInputVars, targetVar); 67 68 int trainingPartEnd = csvFileParser.Rows * 2 / 3; 69 claData.TrainingPartition.Start = 0; 70 claData.TrainingPartition.End = trainingPartEnd; 71 claData.TestPartition.Start = trainingPartEnd; 72 claData.TestPartition.End = csvFileParser.Rows; 73 int pos = path.LastIndexOf('\\'); 74 if (pos < 0) 75 claData.Name = path; 76 else { 77 pos++; 78 claData.Name = path.Substring(pos, path.Length - pos); 67 // turn of input variables that are constant in the training partition 68 var allowedInputVars = new List<string>(); 69 var trainingIndizes = Enumerable.Range(0, (csvFileParser.Rows * 2) / 3); 70 foreach (var variableName in dataset.DoubleVariables) { 71 if (dataset.GetDoubleValues(variableName, trainingIndizes).Range() > 0 && 72 variableName != targetVar) 73 allowedInputVars.Add(variableName); 79 74 } 80 75 81 return claData; 76 ClassificationProblemData classificationData = new ClassificationProblemData(dataset, allowedInputVars, targetVar); 77 78 int trainingPartEnd = trainingIndizes.Last(); 79 classificationData.TrainingPartition.Start = trainingIndizes.First(); 80 classificationData.TrainingPartition.End = trainingPartEnd; 81 classificationData.TestPartition.Start = trainingPartEnd; 82 classificationData.TestPartition.End = csvFileParser.Rows; 83 84 classificationData.Name = Path.GetFileName(path); 85 86 return classificationData; 82 87 } 83 88 … … 86 91 } 87 92 public override void ExportData(IClassificationProblemData instance, string path) { 88 StringBuilder strBuilder = new StringBuilder();93 var strBuilder = new StringBuilder(); 89 94 90 95 foreach (var variable in instance.InputVariables) { 91 strBuilder.Append(variable + ";");96 strBuilder.Append(variable + CultureInfo.CurrentCulture.TextInfo.ListSeparator); 92 97 } 93 strBuilder.Remove(strBuilder.Length - 1, 1);98 strBuilder.Remove(strBuilder.Length - CultureInfo.CurrentCulture.TextInfo.ListSeparator.Length, CultureInfo.CurrentCulture.TextInfo.ListSeparator.Length); 94 99 strBuilder.AppendLine(); 95 100 96 Datasetdataset = instance.Dataset;101 var dataset = instance.Dataset; 97 102 98 103 for (int i = 0; i < dataset.Rows; i++) { 99 104 for (int j = 0; j < dataset.Columns; j++) { 100 strBuilder.Append(dataset.GetValue(i, j) + ";"); 105 if (j > 0) strBuilder.Append(CultureInfo.CurrentCulture.TextInfo.ListSeparator); 106 strBuilder.Append(dataset.GetValue(i, j)); 101 107 } 102 strBuilder.Remove(strBuilder.Length - 1, 1);103 108 strBuilder.AppendLine(); 104 109 } 105 110 106 using ( StreamWriter writer = new StreamWriter(path)) {111 using (var writer = new StreamWriter(path)) { 107 112 writer.Write(strBuilder); 108 113 }
Note: See TracChangeset
for help on using the changeset viewer.