#region License Information
/* HeuristicLab
* Copyright (C) 2002-2008 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
*
* This file is part of HeuristicLab.
*
* HeuristicLab is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* HeuristicLab is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with HeuristicLab. If not, see .
*/
#endregion
using System;
using System.Collections.Generic;
using System.Text;
using System.Windows.Forms;
using HeuristicLab.PluginInfrastructure;
using System.Net;
using System.ServiceModel;
using System.ServiceModel.Description;
using System.Linq;
using HeuristicLab.Data;
using HeuristicLab.Core;
using HeuristicLab.Modeling;
using HeuristicLab.Modeling.Database;
using HeuristicLab.DataAnalysis;
using HeuristicLab.GP.Interfaces;
using HeuristicLab.GP;
using HeuristicLab.GP.StructureIdentification;
namespace HeuristicLab.CEDMA.Server {
public class SimpleDispatcher : IDispatcher, IViewable {
private class AlgorithmConfiguration {
public string name;
public ProblemSpecification problemSpecification;
}
internal event EventHandler Changed;
private IModelingDatabase database;
public IModelingDatabase Database {
get {
return database;
}
}
private Dataset dataset;
public Dataset Dataset {
get {
return dataset;
}
}
public IEnumerable TargetVariables {
get {
return Enumerable.Range(0, Dataset.Columns).Select(x => Dataset.GetVariableName(x));
}
}
public IEnumerable Variables {
get {
return TargetVariables;
}
}
private HeuristicLab.Modeling.IAlgorithm[] defaultAlgorithms;
public IEnumerable GetAlgorithms(LearningTask task) {
switch (task) {
case LearningTask.Regression: {
return defaultAlgorithms.Where(a => (a as IClassificationAlgorithm) == null && (a as ITimeSeriesAlgorithm) == null);
}
case LearningTask.Classification: {
return defaultAlgorithms.Where(a => (a as IClassificationAlgorithm) != null);
}
case LearningTask.TimeSeries: {
return defaultAlgorithms.Where(a => (a as ITimeSeriesAlgorithm) != null);
}
default: {
return new HeuristicLab.Modeling.IAlgorithm[] { };
}
}
}
private Random random;
private Dictionary problemSpecifications;
private Dictionary> algorithms;
public IEnumerable GetAllowedAlgorithms(string targetVariable) {
if (algorithms.ContainsKey(targetVariable))
return algorithms[targetVariable];
else return new HeuristicLab.Modeling.IAlgorithm[] { };
}
private Dictionary activeVariables;
public IEnumerable AllowedTargetVariables {
get { return activeVariables.Where(x => x.Value).Select(x => x.Key); }
}
private Dictionary> finishedAndDispatchedRuns;
private object locker = new object();
public double TrainingSetPercentageSize {
get;
set;
}
public int SkippedRowsBeginning {
get;
set;
}
public int SkippedRowsEnd {
get;
set;
}
public SimpleDispatcher(IModelingDatabase database, Dataset dataset) {
this.dataset = dataset;
this.database = database;
dataset.Changed += (sender, args) => FireChanged();
random = new Random();
activeVariables = new Dictionary();
problemSpecifications = new Dictionary();
algorithms = new Dictionary>();
finishedAndDispatchedRuns = new Dictionary>();
defaultAlgorithms = ApplicationManager.Manager.GetInstances().ToArray();
TrainingSetPercentageSize = 0.5;
SkippedRowsBeginning = 2;
// PopulateFinishedRuns();
}
public HeuristicLab.Modeling.IAlgorithm GetNextJob() {
lock (locker) {
if (activeVariables.Where(x => x.Value == true).Count() > 0) {
string[] targetVariables = (from pair in activeVariables
where pair.Value == true
select pair.Key).ToArray();
string targetVariable = SelectTargetVariable(targetVariables);
HeuristicLab.Modeling.IAlgorithm selectedAlgorithm = SelectAndConfigureAlgorithm(targetVariable);
return selectedAlgorithm;
} else return null;
}
}
public virtual string SelectTargetVariable(string[] targetVariables) {
return targetVariables[random.Next(targetVariables.Length)];
}
public HeuristicLab.Modeling.IAlgorithm SelectAndConfigureAlgorithm(string targetVariable) {
HeuristicLab.Modeling.IAlgorithm selectedAlgorithm = null;
var possibleAlgos =
algorithms[targetVariable]
.Where(x =>
((x is IStochasticAlgorithm) || !AlgorithmFinishedOrDispatched(problemSpecifications[targetVariable], x.Name)));
if (possibleAlgos.Count() > 0) selectedAlgorithm = possibleAlgos.ElementAt(random.Next(possibleAlgos.Count()));
if (selectedAlgorithm != null) {
// create a clone of the algorithm template before setting the parameters
selectedAlgorithm = (HeuristicLab.Modeling.IAlgorithm)selectedAlgorithm.Clone();
SetProblemParameters(selectedAlgorithm, problemSpecifications[targetVariable]);
if (!(selectedAlgorithm is IStochasticAlgorithm))
AddDispatchedRun(problemSpecifications[targetVariable], selectedAlgorithm.Name);
}
return selectedAlgorithm;
}
//private void PopulateFinishedRuns() {
// var dispatchedAlgos = from model in Database.GetAllModels()
// select new {
// TargetVariable = model.TargetVariable.Name,
// Algorithm = model.Algorithm.Name,
// InputVariables = Database.GetInputVariableResults(model).Select(x => x.Variable.Name).Distinct(),
// };
// foreach (var algo in dispatchedAlgos) {
// ProblemSpecification spec = new ProblemSpecification();
// spec.TargetVariable = algo.TargetVariable;
// foreach (string variable in algo.InputVariables) spec.AddInputVariable(variable);
// AddDispatchedRun(spec, algo.Algorithm);
// }
//}
private void SetProblemParameters(HeuristicLab.Modeling.IAlgorithm algo, ProblemSpecification spec) {
algo.Dataset = spec.Dataset;
algo.TargetVariable = spec.TargetVariable;
algo.TrainingSamplesStart = spec.TrainingSamplesStart;
algo.TrainingSamplesEnd = spec.TrainingSamplesEnd;
algo.ValidationSamplesStart = spec.ValidationSamplesStart;
algo.ValidationSamplesEnd = spec.ValidationSamplesEnd;
algo.TestSamplesStart = spec.TestSamplesStart;
algo.TestSamplesEnd = spec.TestSamplesEnd;
List allowedFeatures = new List();
foreach (string inputVariable in spec.InputVariables) {
if (inputVariable != spec.TargetVariable) {
allowedFeatures.Add(inputVariable);
}
}
if (spec.LearningTask == LearningTask.TimeSeries) {
algo.TrainingSamplesStart = spec.TrainingSamplesStart + 1; // first possible index is 1 because of differential symbol
if (spec.AutoRegressive) {
allowedFeatures.Add(spec.TargetVariable);
}
}
algo.AllowedVariables = allowedFeatures;
}
private void AddDispatchedRun(ProblemSpecification specification, string algorithm) {
AlgorithmConfiguration conf = new AlgorithmConfiguration();
conf.name = algorithm;
conf.problemSpecification = new ProblemSpecification(specification);
if (!finishedAndDispatchedRuns.ContainsKey(specification.TargetVariable))
finishedAndDispatchedRuns.Add(specification.TargetVariable, new List());
finishedAndDispatchedRuns[specification.TargetVariable].Add(conf);
}
private bool AlgorithmFinishedOrDispatched(ProblemSpecification specification, string algoName) {
return
finishedAndDispatchedRuns.ContainsKey(specification.TargetVariable) &&
finishedAndDispatchedRuns[specification.TargetVariable].Any(x =>
algoName == x.name &&
specification.Equals(x.problemSpecification));
}
internal void EnableTargetVariable(string name) {
activeVariables[name] = true;
}
internal void DisableTargetVariable(string name) {
activeVariables[name] = false;
}
public void EnableAlgorithm(string targetVariable, HeuristicLab.Modeling.IAlgorithm algo) {
if (!algorithms.ContainsKey(targetVariable)) algorithms.Add(targetVariable, new List());
if (!algorithms[targetVariable].Contains(algo))
algorithms[targetVariable].Add(algo);
}
public void DisableAlgorithm(string targetVariable, HeuristicLab.Modeling.IAlgorithm algo) {
algorithms[targetVariable].Remove(algo);
}
public ProblemSpecification GetProblemSpecification(string targetVariable) {
if (!problemSpecifications.ContainsKey(targetVariable))
problemSpecifications[targetVariable] = CreateDefaultProblemSpecification(targetVariable);
return problemSpecifications[targetVariable];
}
private ProblemSpecification CreateDefaultProblemSpecification(string targetVariable) {
ProblemSpecification spec = new ProblemSpecification();
spec.Dataset = dataset;
spec.TargetVariable = targetVariable;
spec.LearningTask = LearningTask.Regression;
int targetColumn = dataset.GetVariableIndex(targetVariable);
// find index of first correct target value
int firstValueIndex;
for (firstValueIndex = 0; firstValueIndex < dataset.Rows; firstValueIndex++) {
double x = dataset.GetValue(firstValueIndex, targetColumn);
if (!(double.IsNaN(x) || double.IsInfinity(x))) break;
}
firstValueIndex += SkippedRowsBeginning;
// find index of last correct target value
int lastValueIndex;
for (lastValueIndex = dataset.Rows - 1; lastValueIndex > firstValueIndex; lastValueIndex--) {
double x = dataset.GetValue(lastValueIndex, targetColumn);
if (!(double.IsNaN(x) || double.IsInfinity(x))) break;
}
lastValueIndex -= SkippedRowsEnd;
int validTargetRange = lastValueIndex - firstValueIndex;
spec.TrainingSamplesStart = firstValueIndex;
spec.TrainingSamplesEnd = firstValueIndex + (int)Math.Floor(validTargetRange * TrainingSetPercentageSize);
spec.ValidationSamplesStart = spec.TrainingSamplesEnd;
spec.ValidationSamplesEnd = spec.TrainingSamplesEnd + (int)Math.Floor(validTargetRange * (1 - TrainingSetPercentageSize) / 2.0);
spec.TestSamplesStart = spec.ValidationSamplesEnd;
spec.TestSamplesEnd = lastValueIndex;
return spec;
}
public void FireChanged() {
if (Changed != null) Changed(this, new EventArgs());
}
#region IViewable Members
public virtual IView CreateView() {
return new DispatcherView(this);
}
#endregion
}
}