Free cookie consent management tool by TermsFeed Policy Generator

source: branches/plugins/HeuristicLab.StructureIdentification/3.2/Recombination/LangdonHomologousCrossOver.cs @ 3494

Last change on this file since 3494 was 619, checked in by gkronber, 16 years ago

added a homologous crossover operator for GP as described by Langdon. (ticket #108)

File size: 14.8 KB
Line 
1#region License Information
2/* HeuristicLab
3 * Copyright (C) 2002-2008 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4 *
5 * This file is part of HeuristicLab.
6 *
7 * HeuristicLab is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
11 *
12 * HeuristicLab is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 * GNU General Public License for more details.
16 *
17 * You should have received a copy of the GNU General Public License
18 * along with HeuristicLab. If not, see <http://www.gnu.org/licenses/>.
19 */
20#endregion
21
22using System;
23using System.Collections.Generic;
24using System.Linq;
25using System.Text;
26using HeuristicLab.Core;
27using HeuristicLab.Operators;
28using HeuristicLab.Random;
29using HeuristicLab.Data;
30using HeuristicLab.Constraints;
31using HeuristicLab.Functions;
32using System.Diagnostics;
33
34namespace HeuristicLab.StructureIdentification {
35  /// <summary>
36  /// Implementation of a homologous crossover operator as described in:
37  /// William B. Langdon
38  /// Size Fair and Homologous Tree Genetic Programming Crossovers,
39  /// Genetic Programming and Evolvable Machines, Vol. 1, Number 1/2, pp. 95-119, April 2000
40  /// </summary>
41  public class LangdonHomologousCrossOver : OperatorBase {
42    private const int MAX_RECOMBINATION_TRIES = 20;
43    public override string Description {
44      get {
45        return @"";
46      }
47    }
48    public LangdonHomologousCrossOver()
49      : base() {
50      AddVariableInfo(new VariableInfo("Random", "Pseudo random number generator", typeof(MersenneTwister), VariableKind.In));
51      AddVariableInfo(new VariableInfo("OperatorLibrary", "The operator library containing all available operators", typeof(GPOperatorLibrary), VariableKind.In));
52      AddVariableInfo(new VariableInfo("MaxTreeHeight", "The maximal allowed height of the tree", typeof(IntData), VariableKind.In));
53      AddVariableInfo(new VariableInfo("MaxTreeSize", "The maximal allowed size (number of nodes) of the tree", typeof(IntData), VariableKind.In));
54      AddVariableInfo(new VariableInfo("FunctionTree", "The tree to mutate", typeof(IFunctionTree), VariableKind.In | VariableKind.New));
55      AddVariableInfo(new VariableInfo("TreeSize", "The size (number of nodes) of the tree", typeof(IntData), VariableKind.New));
56      AddVariableInfo(new VariableInfo("TreeHeight", "The height of the tree", typeof(IntData), VariableKind.New));
57    }
58
59    public override IOperation Apply(IScope scope) {
60      MersenneTwister random = GetVariableValue<MersenneTwister>("Random", scope, true);
61      GPOperatorLibrary opLibrary = GetVariableValue<GPOperatorLibrary>("OperatorLibrary", scope, true);
62      int maxTreeHeight = GetVariableValue<IntData>("MaxTreeHeight", scope, true).Data;
63      int maxTreeSize = GetVariableValue<IntData>("MaxTreeSize", scope, true).Data;
64
65      TreeGardener gardener = new TreeGardener(random, opLibrary);
66
67      if((scope.SubScopes.Count % 2) != 0)
68        throw new InvalidOperationException("Number of parents is not even");
69
70      CompositeOperation initOperations = new CompositeOperation();
71
72      int children = scope.SubScopes.Count / 2;
73      for(int i = 0; i < children; i++) {
74        IScope parent1 = scope.SubScopes[0];
75        scope.RemoveSubScope(parent1);
76        IScope parent2 = scope.SubScopes[0];
77        scope.RemoveSubScope(parent2);
78        IScope child = new Scope(i.ToString());
79        IOperation childInitOperation = Cross(gardener, maxTreeSize, maxTreeHeight, scope, random, parent1, parent2, child);
80        initOperations.AddOperation(childInitOperation);
81        scope.AddSubScope(child);
82      }
83
84      return initOperations;
85    }
86
87    private IOperation Cross(TreeGardener gardener, int maxTreeSize, int maxTreeHeight,
88      IScope scope, MersenneTwister random, IScope parent1, IScope parent2, IScope child) {
89      List<IFunctionTree> newBranches;
90      IFunctionTree newTree = Cross(gardener, parent1, parent2,
91        random, maxTreeSize, maxTreeHeight, out newBranches);
92
93
94      int newTreeSize = newTree.Size;
95      int newTreeHeight = newTree.Height;
96      child.AddVariable(new HeuristicLab.Core.Variable(scope.TranslateName("FunctionTree"), newTree));
97      child.AddVariable(new HeuristicLab.Core.Variable(scope.TranslateName("TreeSize"), new IntData(newTreeSize)));
98      child.AddVariable(new HeuristicLab.Core.Variable(scope.TranslateName("TreeHeight"), new IntData(newTreeHeight)));
99
100      // check if the new tree is valid and if the height of is still in the allowed bounds (we are not so strict for the max-size)
101      Debug.Assert(gardener.IsValidTree(newTree) && newTreeHeight <= maxTreeHeight && newTreeSize <= maxTreeSize);
102      return gardener.CreateInitializationOperation(newBranches, child);
103    }
104
105
106    private IFunctionTree Cross(TreeGardener gardener, IScope f, IScope g, MersenneTwister random, int maxTreeSize, int maxTreeHeight, out List<IFunctionTree> newBranches) {
107      IFunctionTree tree0 = f.GetVariableValue<IFunctionTree>("FunctionTree", false);
108      int tree0Height = f.GetVariableValue<IntData>("TreeHeight", false).Data;
109      int tree0Size = f.GetVariableValue<IntData>("TreeSize", false).Data;
110
111      IFunctionTree tree1 = g.GetVariableValue<IFunctionTree>("FunctionTree", false);
112      int tree1Height = g.GetVariableValue<IntData>("TreeHeight", false).Data;
113      int tree1Size = g.GetVariableValue<IntData>("TreeSize", false).Data;
114
115      if(tree0Size == 1 && tree1Size == 1) {
116        return CombineTerminals(gardener, tree0, tree1, random, maxTreeHeight, out newBranches);
117      } else {
118        newBranches = new List<IFunctionTree>();
119
120        // we are going to insert tree1 into tree0 at a random place so we have to make sure that tree0 is not a terminal
121        // in case both trees are higher than 1 we swap the trees with probability 50%
122        if(tree0Height == 1 || (tree1Height > 1 && random.Next(2) == 0)) {
123          IFunctionTree tmp = tree0; tree0 = tree1; tree1 = tmp;
124          int tmpHeight = tree0Height; tree0Height = tree1Height; tree1Height = tmpHeight;
125          int tmpSize = tree0Size; tree0Size = tree1Size; tree1Size = tmpSize;
126        }
127
128        // select a random suboperator of the 'receiving' tree
129        IFunctionTree crossoverPoint = gardener.GetRandomParentNode(tree0);
130        int removedBranchIndex;
131        IFunctionTree removedBranch;
132        IList<IFunction> allowedFunctions;
133        if(crossoverPoint == null) {
134          removedBranchIndex = 0;
135          removedBranch = tree0;
136          allowedFunctions = gardener.GetAllowedSubFunctions(null, 0);
137        } else {
138          removedBranchIndex = random.Next(crossoverPoint.SubTrees.Count);
139          removedBranch = crossoverPoint.SubTrees[removedBranchIndex];
140          allowedFunctions = gardener.GetAllowedSubFunctions(crossoverPoint.Function, removedBranchIndex);
141        }
142        int removedBranchSize = removedBranch.Size;
143        int maxBranchSize = maxTreeSize - (tree0.Size - removedBranchSize);
144        int maxBranchHeight = maxTreeHeight - gardener.GetBranchLevel(tree0, removedBranch);
145        List<int> removedBranchThread = GetThread(removedBranch, tree0);
146        IFunctionTree insertedBranch = GetReplacementBranch(random, gardener, allowedFunctions, tree1, removedBranchThread, removedBranchSize, maxBranchSize, maxBranchHeight);
147
148        int tries = 0;
149        while(insertedBranch == null) {
150          if(tries++ > MAX_RECOMBINATION_TRIES) {
151            if(random.Next() > 0.5) return tree1;
152            else return tree0;
153          }
154
155          // retry with a different crossoverPoint       
156          crossoverPoint = gardener.GetRandomParentNode(tree0);
157          if(crossoverPoint == null) {
158            removedBranchIndex = 0;
159            removedBranch = tree0;
160            allowedFunctions = gardener.GetAllowedSubFunctions(null, 0);
161          } else {
162            removedBranchIndex = random.Next(crossoverPoint.SubTrees.Count);
163            removedBranch = crossoverPoint.SubTrees[removedBranchIndex];
164            allowedFunctions = gardener.GetAllowedSubFunctions(crossoverPoint.Function, removedBranchIndex);
165          }
166          removedBranchSize = removedBranch.Size;
167          maxBranchSize = maxTreeSize - (tree0.Size - removedBranchSize);
168          maxBranchHeight = maxTreeHeight - gardener.GetBranchLevel(tree0, removedBranch) + 1;
169          removedBranchThread = GetThread(removedBranch, tree0);
170          insertedBranch = GetReplacementBranch(random, gardener, allowedFunctions, tree1, removedBranchThread, removedBranchSize, maxBranchSize, maxBranchHeight);
171        }
172        if(crossoverPoint != null) {
173          // replace the branch below the crossoverpoint with the selected branch from root1
174          crossoverPoint.RemoveSubTree(removedBranchIndex);
175          crossoverPoint.InsertSubTree(removedBranchIndex, insertedBranch);
176          return tree0;
177        } else {
178          return insertedBranch;
179        }
180      }
181    }
182
183    private IFunctionTree GetReplacementBranch(IRandom random, TreeGardener gardener, IList<IFunction> allowedFunctions, IFunctionTree tree, List<int> removedBranchThread, int removedBranchSize, int maxBranchSize, int maxBranchHeight) {
184      var branches = gardener.GetAllSubTrees(tree).Where(t => allowedFunctions.Contains(t.Function) && t.Size < maxBranchSize && t.Height < maxBranchHeight)
185        .Select(t => new { Tree = t, Size = t.Size, Thread = GetThread(t, tree) }).Where(s => s.Size < 2 * removedBranchSize + 1);
186
187      var shorterBranches = branches.Where(t => t.Size < removedBranchSize);
188      var longerBranches = branches.Where(t => t.Size > removedBranchSize);
189      var equalLengthBranches = branches.Where(t => t.Size == removedBranchSize);
190
191      if(shorterBranches.Count() == 0 || longerBranches.Count() == 0) {
192        if(equalLengthBranches.Count() == 0) {
193          return null;
194        } else {
195          return equalLengthBranches.OrderBy(t => MatchingSteps(removedBranchThread, t.Thread)).Last().Tree;
196        }
197      } else {
198        // invariant: |shorterBranches| > 0  and |longerBranches| > 0
199        double pEqualLength = equalLengthBranches.Count() > 0 ? 1.0 / removedBranchSize : 0.0;
200        double pLonger = (1.0 - pEqualLength) / (longerBranches.Count() * (1.0 + longerBranches.Average(t => t.Size) / shorterBranches.Average(t => t.Size)));
201        double pShorter = (1.0 - pEqualLength - pLonger);
202
203        double r = random.NextDouble();
204        if(r < pLonger) {
205          return longerBranches.OrderBy(t => MatchingSteps(removedBranchThread, t.Thread)).Last().Tree;
206        } else if(r < pLonger + pShorter) {
207          return shorterBranches.OrderBy(t => MatchingSteps(removedBranchThread, t.Thread)).Last().Tree;
208        } else {
209          return equalLengthBranches.OrderBy(t => MatchingSteps(removedBranchThread, t.Thread)).Last().Tree;
210        }
211      }
212    }
213
214    private int MatchingSteps(List<int> removedBranchThread, List<int> list) {
215      int n = Math.Min(removedBranchThread.Count, list.Count);
216      for(int i = 0; i < n; i++) if(removedBranchThread[i] != list[i]) return i;
217      return n;
218    }
219
220    private List<int> GetThread(IFunctionTree t, IFunctionTree tree) {
221      List<int> thread = new List<int>();
222      for(int i = 0; i < tree.SubTrees.Count; i++) {
223        if(t == tree.SubTrees[i]) {
224          thread.Add(i);
225          return thread;
226        } else {
227          thread.AddRange(GetThread(t, tree.SubTrees[i]));
228          if(thread.Count > 0) {
229            thread.Insert(0, i);
230            return thread;
231          }
232        }
233      }
234      return thread;
235    }
236
237
238    // take f and g and create a tree that has f and g as sub-trees
239    // example
240    //       O
241    //      /|\
242    //     g 2 f
243    //
244    private IFunctionTree CombineTerminals(TreeGardener gardener, IFunctionTree f, IFunctionTree g, MersenneTwister random, int maxTreeHeight, out List<IFunctionTree> newBranches) {
245      newBranches = new List<IFunctionTree>();
246      // determine the set of possible parent functions
247      ICollection<IFunction> possibleParents = gardener.GetPossibleParents(new List<IFunction>() { f.Function, g.Function });
248      if(possibleParents.Count == 0) throw new InvalidProgramException();
249      // and select a random one
250      IFunctionTree parent = possibleParents.ElementAt(random.Next(possibleParents.Count())).GetTreeNode();
251
252      int nSlots = Math.Max(2, parent.Function.MinArity);
253      // determine which slot can take which sub-trees
254      List<IFunctionTree>[] slots = new List<IFunctionTree>[nSlots];
255      for(int slot = 0; slot < nSlots; slot++) {
256        ICollection<IFunction> allowedSubFunctions = gardener.GetAllowedSubFunctions(parent.Function, slot);
257        List<IFunctionTree> allowedTrees = new List<IFunctionTree>();
258        if(allowedSubFunctions.Contains(f.Function)) allowedTrees.Add(f);
259        if(allowedSubFunctions.Contains(g.Function)) allowedTrees.Add(g);
260        slots[slot] = allowedTrees;
261      }
262      // fill the slots in the order of degrees of freedom
263      int[] slotSequence = Enumerable.Range(0, slots.Count()).OrderBy(slot => slots[slot].Count()).ToArray();
264
265      // tmp arry to store the tree for each sub-tree slot of the parent
266      IFunctionTree[] selectedFunctionTrees = new IFunctionTree[nSlots];
267
268      // fill the sub-tree slots of the parent starting with the slots that can take potentially both functions (f and g)
269      for(int i = 0; i < slotSequence.Length; i++) {
270        int slot = slotSequence[i];
271        List<IFunctionTree> allowedTrees = slots[slot];
272        // when neither f nor g fit into the slot => create a new random tree
273        if(allowedTrees.Count() == 0) {
274          var allowedFunctions = gardener.GetAllowedSubFunctions(parent.Function, slot);
275          selectedFunctionTrees[slot] = gardener.CreateRandomTree(allowedFunctions, 1, 1);
276          newBranches.AddRange(gardener.GetAllSubTrees(selectedFunctionTrees[slot]));
277        } else {
278          // select randomly which tree to insert into this slot
279          IFunctionTree selectedTree = allowedTrees[random.Next(allowedTrees.Count())];
280          selectedFunctionTrees[slot] = selectedTree;
281          // remove the tree that we used in this slot from following function-sets
282          for(int j = i + 1; j < slotSequence.Length; j++) {
283            int otherSlot = slotSequence[j];
284            slots[otherSlot].Remove(selectedTree);
285          }
286        }
287      }
288      // actually append the sub-trees to the parent tree
289      for(int i = 0; i < selectedFunctionTrees.Length; i++) {
290        parent.InsertSubTree(i, selectedFunctionTrees[i]);
291      }
292
293      return parent;
294    }
295  }
296}
Note: See TracBrowser for help on using the repository browser.