#region License Information
/* HeuristicLab
* Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
*
* This file is part of HeuristicLab.
*
* HeuristicLab is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* HeuristicLab is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with HeuristicLab. If not, see .
*/
#endregion
using System;
using System.Collections.Generic;
using System.Linq;
using HeuristicLab.Common;
using HeuristicLab.Core;
using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
namespace HeuristicLab.Encodings.SymbolicExpressionTreeEncoding {
///
/// The default symbolic expression grammar stores symbols and syntactic constraints for symbols.
/// Symbols are treated as equvivalent if they have the same name.
/// Syntactic constraints limit the number of allowed sub trees for a node with a symbol and which symbols are allowed
/// in the sub-trees of a symbol (can be specified for each sub-tree index separately).
///
[StorableClass]
public abstract class SymbolicExpressionGrammarBase : NamedItem, ISymbolicExpressionGrammarBase {
#region properties for separation between implementation and persistence
[Storable(Name = "Symbols")]
private IEnumerable StorableSymbols {
get { return symbols.Values.ToArray(); }
set { foreach (var s in value) symbols.Add(s.Name, s); }
}
[Storable(Name = "SymbolSubtreeCount")]
private IEnumerable>> StorableSymbolSubtreeCount {
get { return symbolSubtreeCount.Select(x => new KeyValuePair>(GetSymbol(x.Key), x.Value)).ToArray(); }
set { foreach (var pair in value) symbolSubtreeCount.Add(pair.Key.Name, pair.Value); }
}
[Storable(Name = "AllowedChildSymbols")]
private IEnumerable>> StorableAllowedChildSymbols {
get { return allowedChildSymbols.Select(x => new KeyValuePair>(GetSymbol(x.Key), x.Value.Select(GetSymbol).ToArray())).ToArray(); }
set { foreach (var pair in value) allowedChildSymbols.Add(pair.Key.Name, pair.Value.Select(y => y.Name).ToList()); }
}
[Storable(Name = "AllowedChildSymbolsPerIndex")]
private IEnumerable, IEnumerable>> StorableAllowedChildSymbolsPerIndex {
get { return allowedChildSymbolsPerIndex.Select(x => new KeyValuePair, IEnumerable>(Tuple.Create(GetSymbol(x.Key.Item1), x.Key.Item2), x.Value.Select(GetSymbol).ToArray())).ToArray(); }
set {
foreach (var pair in value)
allowedChildSymbolsPerIndex.Add(Tuple.Create(pair.Key.Item1.Name, pair.Key.Item2), pair.Value.Select(y => y.Name).ToList());
}
}
#endregion
private bool suppressEvents;
protected readonly Dictionary symbols;
protected readonly Dictionary> symbolSubtreeCount;
protected readonly Dictionary> allowedChildSymbols;
protected readonly Dictionary, List> allowedChildSymbolsPerIndex;
public override bool CanChangeName {
get { return false; }
}
public override bool CanChangeDescription {
get { return false; }
}
[StorableConstructor]
protected SymbolicExpressionGrammarBase(bool deserializing)
: base(deserializing) {
cachedMinExpressionLength = new Dictionary();
cachedMaxExpressionLength = new Dictionary, int>();
cachedMinExpressionDepth = new Dictionary();
cachedMaxExpressionDepth = new Dictionary();
cachedIsAllowedChildSymbol = new Dictionary, bool>();
cachedIsAllowedChildSymbolIndex = new Dictionary, bool>();
symbols = new Dictionary();
symbolSubtreeCount = new Dictionary>();
allowedChildSymbols = new Dictionary>();
allowedChildSymbolsPerIndex = new Dictionary, List>();
suppressEvents = false;
}
protected SymbolicExpressionGrammarBase(SymbolicExpressionGrammarBase original, Cloner cloner)
: base(original, cloner) {
cachedMinExpressionLength = new Dictionary();
cachedMaxExpressionLength = new Dictionary, int>();
cachedMinExpressionDepth = new Dictionary();
cachedMaxExpressionDepth = new Dictionary();
cachedIsAllowedChildSymbol = new Dictionary, bool>();
cachedIsAllowedChildSymbolIndex = new Dictionary, bool>();
symbols = original.symbols.ToDictionary(x => x.Key, y => cloner.Clone(y.Value));
symbolSubtreeCount = new Dictionary>(original.symbolSubtreeCount);
allowedChildSymbols = new Dictionary>();
foreach (var element in original.allowedChildSymbols)
allowedChildSymbols.Add(element.Key, new List(element.Value));
allowedChildSymbolsPerIndex = new Dictionary, List>();
foreach (var element in original.allowedChildSymbolsPerIndex)
allowedChildSymbolsPerIndex.Add(element.Key, new List(element.Value));
suppressEvents = false;
}
protected SymbolicExpressionGrammarBase(string name, string description)
: base(name, description) {
cachedMinExpressionLength = new Dictionary();
cachedMaxExpressionLength = new Dictionary, int>();
cachedMinExpressionDepth = new Dictionary();
cachedMaxExpressionDepth = new Dictionary();
cachedIsAllowedChildSymbol = new Dictionary, bool>();
cachedIsAllowedChildSymbolIndex = new Dictionary, bool>();
symbols = new Dictionary();
symbolSubtreeCount = new Dictionary>();
allowedChildSymbols = new Dictionary>();
allowedChildSymbolsPerIndex = new Dictionary, List>();
suppressEvents = false;
}
#region protected grammar manipulation methods
public virtual void AddSymbol(ISymbol symbol) {
if (ContainsSymbol(symbol)) throw new ArgumentException("Symbol " + symbol + " is already defined.");
foreach (var s in symbol.Flatten()) {
symbols.Add(s.Name, s);
int maxSubTreeCount = Math.Min(s.MinimumArity + 1, s.MaximumArity);
symbolSubtreeCount.Add(s.Name, Tuple.Create(s.MinimumArity, maxSubTreeCount));
}
ClearCaches();
}
public virtual void RemoveSymbol(ISymbol symbol) {
foreach (var s in symbol.Flatten()) {
symbols.Remove(s.Name);
allowedChildSymbols.Remove(s.Name);
for (int i = 0; i < GetMaximumSubtreeCount(s); i++)
allowedChildSymbolsPerIndex.Remove(Tuple.Create(s.Name, i));
symbolSubtreeCount.Remove(s.Name);
foreach (var parent in Symbols) {
List allowedChilds;
if (allowedChildSymbols.TryGetValue(parent.Name, out allowedChilds))
allowedChilds.Remove(s.Name);
for (int i = 0; i < GetMaximumSubtreeCount(parent); i++) {
if (allowedChildSymbolsPerIndex.TryGetValue(Tuple.Create(parent.Name, i), out allowedChilds))
allowedChilds.Remove(s.Name);
}
}
suppressEvents = true;
foreach (var groupSymbol in Symbols.OfType())
groupSymbol.SymbolsCollection.Remove(symbol);
suppressEvents = false;
}
ClearCaches();
}
public virtual ISymbol GetSymbol(string symbolName) {
ISymbol symbol;
if (symbols.TryGetValue(symbolName, out symbol)) return symbol;
return null;
}
public virtual void AddAllowedChildSymbol(ISymbol parent, ISymbol child) {
bool changed = false;
foreach (ISymbol p in parent.Flatten().Where(p => !(p is GroupSymbol)))
changed |= AddAllowedChildSymbolToDictionaries(p, child);
if (changed) {
ClearCaches();
OnChanged();
}
}
private bool AddAllowedChildSymbolToDictionaries(ISymbol parent, ISymbol child) {
List childSymbols;
if (!allowedChildSymbols.TryGetValue(parent.Name, out childSymbols)) {
childSymbols = new List();
allowedChildSymbols.Add(parent.Name, childSymbols);
}
if (childSymbols.Contains(child.Name)) return false;
suppressEvents = true;
for (int argumentIndex = 0; argumentIndex < GetMaximumSubtreeCount(parent); argumentIndex++)
RemoveAllowedChildSymbol(parent, child, argumentIndex);
suppressEvents = false;
childSymbols.Add(child.Name);
return true;
}
public virtual void AddAllowedChildSymbol(ISymbol parent, ISymbol child, int argumentIndex) {
bool changed = false;
foreach (ISymbol p in parent.Flatten().Where(p => !(p is GroupSymbol)))
changed |= AddAllowedChildSymbolToDictionaries(p, child, argumentIndex);
if (changed) {
ClearCaches();
OnChanged();
}
}
private bool AddAllowedChildSymbolToDictionaries(ISymbol parent, ISymbol child, int argumentIndex) {
List childSymbols;
if (!allowedChildSymbols.TryGetValue(parent.Name, out childSymbols)) {
childSymbols = new List();
allowedChildSymbols.Add(parent.Name, childSymbols);
}
if (childSymbols.Contains(child.Name)) return false;
var key = Tuple.Create(parent.Name, argumentIndex);
if (!allowedChildSymbolsPerIndex.TryGetValue(key, out childSymbols)) {
childSymbols = new List();
allowedChildSymbolsPerIndex.Add(key, childSymbols);
}
if (childSymbols.Contains(child.Name)) return false;
childSymbols.Add(child.Name);
return true;
}
public virtual void RemoveAllowedChildSymbol(ISymbol parent, ISymbol child) {
bool changed = false;
List childSymbols;
if (allowedChildSymbols.TryGetValue(child.Name, out childSymbols)) {
changed |= childSymbols.Remove(child.Name);
}
for (int argumentIndex = 0; argumentIndex < GetMaximumSubtreeCount(parent); argumentIndex++) {
var key = Tuple.Create(parent.Name, argumentIndex);
if (allowedChildSymbolsPerIndex.TryGetValue(key, out childSymbols))
changed |= childSymbols.Remove(child.Name);
}
if (changed) {
ClearCaches();
OnChanged();
}
}
public virtual void RemoveAllowedChildSymbol(ISymbol parent, ISymbol child, int argumentIndex) {
bool changed = false;
suppressEvents = true;
List childSymbols;
if (allowedChildSymbols.TryGetValue(parent.Name, out childSymbols)) {
if (childSymbols.Remove(child.Name)) {
for (int i = 0; i < GetMaximumSubtreeCount(parent); i++) {
if (i != argumentIndex) AddAllowedChildSymbol(parent, child, i);
}
changed = true;
}
}
suppressEvents = false;
var key = Tuple.Create(parent.Name, argumentIndex);
if (allowedChildSymbolsPerIndex.TryGetValue(key, out childSymbols))
changed |= childSymbols.Remove(child.Name);
if (changed) {
ClearCaches();
OnChanged();
}
}
public virtual void SetSubtreeCount(ISymbol symbol, int minimumSubtreeCount, int maximumSubtreeCount) {
var symbols = symbol.Flatten().Where(s => !(s is GroupSymbol));
if (symbols.Any(s => s.MinimumArity > minimumSubtreeCount)) throw new ArgumentException("Invalid minimum subtree count " + minimumSubtreeCount + " for " + symbol);
if (symbols.Any(s => s.MaximumArity < maximumSubtreeCount)) throw new ArgumentException("Invalid maximum subtree count " + maximumSubtreeCount + " for " + symbol);
foreach (ISymbol s in symbols)
SetSubTreeCountInDictionaries(s, minimumSubtreeCount, maximumSubtreeCount);
ClearCaches();
OnChanged();
}
private void SetSubTreeCountInDictionaries(ISymbol symbol, int minimumSubtreeCount, int maximumSubtreeCount) {
for (int i = maximumSubtreeCount; i < GetMaximumSubtreeCount(symbol); i++) {
var key = Tuple.Create(symbol.Name, i);
allowedChildSymbolsPerIndex.Remove(key);
}
symbolSubtreeCount[symbol.Name] = Tuple.Create(minimumSubtreeCount, maximumSubtreeCount);
}
#endregion
public virtual IEnumerable Symbols {
get { return symbols.Values; }
}
public virtual IEnumerable AllowedSymbols {
get { return Symbols.Where(s => s.Enabled); }
}
public virtual bool ContainsSymbol(ISymbol symbol) {
return symbols.ContainsKey(symbol.Name);
}
private readonly Dictionary, bool> cachedIsAllowedChildSymbol;
public virtual bool IsAllowedChildSymbol(ISymbol parent, ISymbol child) {
if (allowedChildSymbols.Count == 0) return false;
if (!child.Enabled) return false;
bool result;
var key = Tuple.Create(parent.Name, child.Name);
if (cachedIsAllowedChildSymbol.TryGetValue(key, out result)) return result;
// value has to be calculated and cached make sure this is done in only one thread
lock (cachedIsAllowedChildSymbol) {
// in case the value has been calculated on another thread in the meanwhile
if (cachedIsAllowedChildSymbol.TryGetValue(key, out result)) return result;
List temp;
if (allowedChildSymbols.TryGetValue(parent.Name, out temp)) {
if (temp.SelectMany(s => GetSymbol(s).Flatten()).Any(s => s.Name == child.Name)) {
cachedIsAllowedChildSymbol.Add(key, true);
return true;
}
}
cachedIsAllowedChildSymbol.Add(key, false);
return false;
}
}
private readonly Dictionary, bool> cachedIsAllowedChildSymbolIndex;
public virtual bool IsAllowedChildSymbol(ISymbol parent, ISymbol child, int argumentIndex) {
if (!child.Enabled) return false;
if (IsAllowedChildSymbol(parent, child)) return true;
if (allowedChildSymbolsPerIndex.Count == 0) return false;
bool result;
var key = Tuple.Create(parent.Name, child.Name, argumentIndex);
if (cachedIsAllowedChildSymbolIndex.TryGetValue(key, out result)) return result;
// value has to be calculated and cached make sure this is done in only one thread
lock (cachedIsAllowedChildSymbolIndex) {
// in case the value has been calculated on another thread in the meanwhile
if (cachedIsAllowedChildSymbolIndex.TryGetValue(key, out result)) return result;
List temp;
if (allowedChildSymbolsPerIndex.TryGetValue(Tuple.Create(parent.Name, argumentIndex), out temp)) {
if (temp.SelectMany(s => GetSymbol(s).Flatten()).Any(s => s.Name == child.Name)) {
cachedIsAllowedChildSymbolIndex.Add(key, true);
return true;
}
}
cachedIsAllowedChildSymbolIndex.Add(key, false);
return false;
}
}
public IEnumerable GetAllowedChildSymbols(ISymbol parent) {
foreach (ISymbol child in AllowedSymbols) {
if (IsAllowedChildSymbol(parent, child)) yield return child;
}
}
public IEnumerable GetAllowedChildSymbols(ISymbol parent, int argumentIndex) {
foreach (ISymbol child in AllowedSymbols) {
if (IsAllowedChildSymbol(parent, child, argumentIndex)) yield return child;
}
}
public virtual int GetMinimumSubtreeCount(ISymbol symbol) {
return symbolSubtreeCount[symbol.Name].Item1;
}
public virtual int GetMaximumSubtreeCount(ISymbol symbol) {
return symbolSubtreeCount[symbol.Name].Item2;
}
protected void ClearCaches() {
cachedMinExpressionLength.Clear();
cachedMaxExpressionLength.Clear();
cachedMinExpressionDepth.Clear();
cachedMaxExpressionDepth.Clear();
cachedIsAllowedChildSymbol.Clear();
cachedIsAllowedChildSymbolIndex.Clear();
}
private readonly Dictionary cachedMinExpressionLength;
public int GetMinimumExpressionLength(ISymbol symbol) {
int res;
if (cachedMinExpressionLength.TryGetValue(symbol.Name, out res))
return res;
// value has to be calculated and cached make sure this is done in only one thread
lock (cachedMinExpressionLength) {
// in case the value has been calculated on another thread in the meanwhile
if (cachedMinExpressionLength.TryGetValue(symbol.Name, out res)) return res;
res = GetMinimumExpressionLengthRec(symbol);
foreach (var entry in cachedMinExpressionLength.Where(e => e.Value >= int.MaxValue).ToList()) {
if (entry.Key != symbol.Name) cachedMinExpressionLength.Remove(entry.Key);
}
return res;
}
}
private int GetMinimumExpressionLengthRec(ISymbol symbol) {
int temp;
if (!cachedMinExpressionLength.TryGetValue(symbol.Name, out temp)) {
cachedMinExpressionLength[symbol.Name] = int.MaxValue; // prevent infinite recursion
long sumOfMinExpressionLengths = 1 + (from argIndex in Enumerable.Range(0, GetMinimumSubtreeCount(symbol))
let minForSlot = (long)(from s in GetAllowedChildSymbols(symbol, argIndex)
where s.InitialFrequency > 0.0
select GetMinimumExpressionLengthRec(s)).DefaultIfEmpty(0).Min()
select minForSlot).DefaultIfEmpty(0).Sum();
cachedMinExpressionLength[symbol.Name] = (int)Math.Min(sumOfMinExpressionLengths, int.MaxValue);
return cachedMinExpressionLength[symbol.Name];
}
return temp;
}
private readonly Dictionary, int> cachedMaxExpressionLength;
public int GetMaximumExpressionLength(ISymbol symbol, int maxDepth) {
int temp;
var key = Tuple.Create(symbol.Name, maxDepth);
if (cachedMaxExpressionLength.TryGetValue(key, out temp)) return temp;
// value has to be calculated and cached make sure this is done in only one thread
lock (cachedMaxExpressionLength) {
// in case the value has been calculated on another thread in the meanwhile
if (cachedMaxExpressionLength.TryGetValue(key, out temp)) return temp;
cachedMaxExpressionLength[key] = int.MaxValue; // prevent infinite recursion
long sumOfMaxTrees = 1 + (from argIndex in Enumerable.Range(0, GetMaximumSubtreeCount(symbol))
let maxForSlot = (long)(from s in GetAllowedChildSymbols(symbol, argIndex)
where s.InitialFrequency > 0.0
where GetMinimumExpressionDepth(s) < maxDepth
select GetMaximumExpressionLength(s, maxDepth - 1)).DefaultIfEmpty(0).Max()
select maxForSlot).DefaultIfEmpty(0).Sum();
cachedMaxExpressionLength[key] = (int)Math.Min(sumOfMaxTrees, int.MaxValue);
return cachedMaxExpressionLength[key];
}
}
private readonly Dictionary cachedMinExpressionDepth;
public int GetMinimumExpressionDepth(ISymbol symbol) {
int res;
if (cachedMinExpressionDepth.TryGetValue(symbol.Name, out res))
return res;
// value has to be calculated and cached make sure this is done in only one thread
lock (cachedMinExpressionDepth) {
// in case the value has been calculated on another thread in the meanwhile
if (cachedMinExpressionDepth.TryGetValue(symbol.Name, out res)) return res;
res = GetMinimumExpressionDepthRec(symbol);
foreach (var entry in cachedMinExpressionDepth.Where(e => e.Value >= int.MaxValue).ToList()) {
if (entry.Key != symbol.Name) cachedMinExpressionDepth.Remove(entry.Key);
}
return res;
}
}
private int GetMinimumExpressionDepthRec(ISymbol symbol) {
int temp;
if (!cachedMinExpressionDepth.TryGetValue(symbol.Name, out temp)) {
cachedMinExpressionDepth[symbol.Name] = int.MaxValue; // prevent infinite recursion
long minDepth = 1 + (from argIndex in Enumerable.Range(0, GetMinimumSubtreeCount(symbol))
let minForSlot = (long)(from s in GetAllowedChildSymbols(symbol, argIndex)
where s.InitialFrequency > 0.0
select GetMinimumExpressionDepthRec(s)).DefaultIfEmpty(0).Min()
select minForSlot).DefaultIfEmpty(0).Max();
cachedMinExpressionDepth[symbol.Name] = (int)Math.Min(minDepth, int.MaxValue);
return cachedMinExpressionDepth[symbol.Name];
}
return temp;
}
private readonly Dictionary cachedMaxExpressionDepth;
public int GetMaximumExpressionDepth(ISymbol symbol) {
int temp;
if (cachedMaxExpressionDepth.TryGetValue(symbol.Name, out temp)) return temp;
// value has to be calculated and cached make sure this is done in only one thread
lock (cachedMaxExpressionDepth) {
// in case the value has been calculated on another thread in the meanwhile
if (cachedMaxExpressionDepth.TryGetValue(symbol.Name, out temp)) return temp;
cachedMaxExpressionDepth[symbol.Name] = int.MaxValue;
long maxDepth = 1 + (from argIndex in Enumerable.Range(0, GetMaximumSubtreeCount(symbol))
let maxForSlot = (long)(from s in GetAllowedChildSymbols(symbol, argIndex)
where s.InitialFrequency > 0.0
select GetMaximumExpressionDepth(s)).DefaultIfEmpty(0).Max()
select maxForSlot).DefaultIfEmpty(0).Max();
cachedMaxExpressionDepth[symbol.Name] = (int)Math.Min(maxDepth, int.MaxValue);
return cachedMaxExpressionDepth[symbol.Name];
}
}
public event EventHandler Changed;
protected virtual void OnChanged() {
if (suppressEvents) return;
var handler = Changed;
if (handler != null) handler(this, EventArgs.Empty);
}
}
}