Changeset 15060

-                      r14116
+                      r15060
     <Compile Include="Linear\MultinomialLogitClassificationSolution.cs" />
     <Compile Include="Linear\MultinomialLogitModel.cs" />
+    <Compile Include="MctsSymbolicRegression\Automaton.cs" />
+    <Compile Include="MctsSymbolicRegression\CodeGenerator.cs" />
+    <Compile Include="MctsSymbolicRegression\ConstraintHandler.cs" />
+    <Compile Include="MctsSymbolicRegression\Disassembler.cs" />
+    <Compile Include="MctsSymbolicRegression\ExpressionEvaluator.cs" />
+    <Compile Include="MctsSymbolicRegression\MctsSymbolicRegressionAlgorithm.cs" />
+    <Compile Include="MctsSymbolicRegression\MctsSymbolicRegressionStatic.cs" />
+    <Compile Include="MctsSymbolicRegression\OpCodes.cs" />
+    <Compile Include="MctsSymbolicRegression\Policies\EpsGreedy.cs" />
+    <Compile Include="MctsSymbolicRegression\Policies\UcbTuned.cs" />
+    <Compile Include="MctsSymbolicRegression\Policies\IActionStatistics.cs" />
+    <Compile Include="MctsSymbolicRegression\Policies\IPolicy.cs" />
+    <Compile Include="MctsSymbolicRegression\Policies\PolicyBase.cs" />
+    <Compile Include="MctsSymbolicRegression\Policies\Ucb.cs" />
+    <Compile Include="MctsSymbolicRegression\SymbolicExpressionGenerator.cs" />
+    <Compile Include="MctsSymbolicRegression\Tree.cs" />
     <Compile Include="Nca\Initialization\INcaInitializer.cs" />
     <Compile Include="Nca\Initialization\LdaInitializer.cs" />

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Automaton.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression {
   // this is the core class for generating expressions.
+  // the automaton determines which expressions are allowed
+  // it represents a finite state automaton, each state transition can be associated with an action (e.g. to produce code).
+  // the automaton determines the possible structures for expressions.
+  //
+  // to understand this code it is worthwhile to generate a graphical visualization of the automaton (see PrintAutomaton).
+  // If the code is compiled in debug mode the automaton produces a Graphviz file into the folder of the application
+  // whenever an instance of the automaton is constructed.
+  //
+  // This class relies on two other classes:
+  // - CodeGenerator to produce code for a stack-based evaluator and
+  // - ConstraintHandler to restrict the allowed set of expressions.
+  //
+  // The ConstraintHandler extends the automaton and adds semantic restrictions for expressions produced by the automaton.
+  //
+  //
   internal class Automaton {
     public const int StateExpr = 1;
 …
     public const int StateInvTFStart = 23;
     public const int StateInvTFEnd = 24;
+    private const int FirstDynamicState = 25;
+    public const int FirstDynamicState = 25;
+    // more states for individual variables are created dynamically
     private const int StartState = StateExpr;
 …
         () => {
           codeGenerator.Emit1(OpCodes.LoadConst0);
+        },
+        "0");
+          constraintHandler.StartNewTermInPoly();
+        },
+        "0, StartTermInPoly");
       AddTransition(StateLogTEnd, StateLogFactorEnd,
         () => {
 …
         () => {
           codeGenerator.Emit1(OpCodes.LoadConst1);
+        },
+        "c");
+          constraintHandler.StartNewTermInPoly();
+        },
+        "c, StartTermInPoly");
       AddTransition(StateInvTEnd, StateInvFactorEnd,
         () => {
 …
     private readonly int[] followStatesBuf = new int[1000];
     public void FollowStates(int state, out int[] buf, out int nElements) {
-      // return followStates[state]
-      //   .Where(s => s < FirstDynamicState || s >= minVarIdx) // for variables we only allow non-decreasing state sequences
-      //   // the following states imply an additional variable being added to the expression
-      //   // F, Sum, Prod
-      //   .Where(s => (s != StateF && s != StateSum && s != StateProd) || variablesRemaining > 0);
       // for loop instead of where iterator
       var fs = followStates[state];
       int j = 0;
-      //Console.Write(stateNames[CurrentState] + " allowed: ");
       for (int i = 0; i < fs.Count; i++) {
         var s = fs[i];
         if (constraintHandler.IsAllowedFollowState(state, s)) {
-          //Console.Write(s + " ");
           followStatesBuf[j++] = s;
+        }
+      }
-      //Console.WriteLine();
       buf = followStatesBuf;
       nElements = j;
 …
     public void Goto(int targetState) {
-      //Console.WriteLine("->{0}", stateNames[targetState]);
-      // Contract.Assert(FollowStates(CurrentState).Contains(targetState));
       if (actions[CurrentState, targetState] != null)
         actions[CurrentState, targetState].ForEach(a => a()); // execute all actions
 …
     public bool IsFinalState(int s) {
       return s == StateExprEnd;
+      return s == StateExprEnd && !constraintHandler.IsInvalidExpression;
+    }
 …
         writer.WriteLine("digraph {");
         // writer.WriteLine("rankdir=LR");
-        int[] fs;
-        int nFs;
         for (int s = StartState; s < stateNames.Count; s++) {
           for (int i = 0; i < followStates[s].Count; i++) {

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/CodeGenerator.cs

r13645	r15060
2	2	/* HeuristicLab
3	3	* Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4		* and the BEACON Center for the Study of Evolution in Action.
5	4	*
6	5	* This file is part of HeuristicLab.

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/ConstraintHandler.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
 #endregion
+using System;
+using System.Collections.Generic;
 using System.Diagnostics.Contracts;
+using System.Linq;
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression {
+  // more states for individual variables are created dynamically
+  // This class restricts the set of allowed transitions of the automaton to prevent exploration of duplicate expressions.
+  // It would be possible to implement this class in such a way that the search never visits a duplicate expression. However,
+  // it seems very intricate to detect this robustly and in all cases while generating an expression because
+  // some form of lookahead is necessary.
+  // Instead the constraint handler only catches the obvious duplicates directly, but does not guarantee that the search always produces a valid expression.
+  // The ratio of the number of unsuccessful searches, that need backtracking should be tracked in the MCTS alg (MctsSymbolicRegressionStatic)
+  // All changes to this class should be tested through unit tests. It is important that the ConstraintHandler is not too restrictive.
+  // the constraints are derived from a canonical form for expressions.
+  // overall we can enforce a limited number of variable references
+  //
+  // an expression is a sum of terms t_1 ... t_n where terms are ordered according to a relation t_i (<=)_term t_j for each pair t_i, t_j and i <= j
+  // a term is a product of factors where factors are ordered according to relation f_i (<=)_factor f_j for each pair f_i,f_j and i <= j
+  // we want to enforce lower-order terms before higher-order terms in expressions (based on number of variable references)
+  // factors can have different types (variable, exp, log, inverse)
+  // (<=)_term  [IsSmallerOrEqualTerm(t_i, t_j)]
+  //   1.  NumberOfVarRefs(t_i) < NumberOfVarRefs(t_j)  --> true           enforce terms with non-decreasing number of var refs
+  //   2.  NumberOfVarRefs(t_i) > NumberOfVarRefs(t_j)  --> false
+  //   3.  NumFactors(t_i) > NumFactors(t_j)            --> true           enforce terms with non-increasing number of factors
+  //   4.  NumFactors(t_i) < NumFactors(t_j)            --> false
+  //   5.  for all k factors: Factor(k, t_i) (<=)_factor  Factor(k, t_j) --> true // factors must be non-decreasing
+  //   6.  all factors are (=)_factor                   --> true
+  //   7.  else false
+  // (<=)_factor  [IsSmallerOrEqualFactor(f_i, f_j)]
+  //   1.  FactorType(f_i) < FactorType(f_j)  --> true           enforce factors with non-decreasing factor type (var < exp < log < inv)
+  //   2.  FactorType(f_i) > FactorType(f_j)  --> false
+  //   3.  Compare the two factors specifically
+  //     - variables: varIdx_i <= varIdx_j (only one var reference)
+  //     - exp: number of variable references and then varIdx_i <= varIdx_j for each position
+  //     - log: number of variable references and ...
+  //     - inv: number of variable references and ...
+  //
+  // for log and inverse factors we allow all polynomials as argument
+  // a polynomial is a sum of terms t_1 ... t_n where terms are ordered according to a relation t_i (<=)_poly t_j for each pair t_i, t_j and i <= j
+  // (<=)_poly  [IsSmallerOrEqualPoly(t_i, t_j)]
+  //  1. NumberOfVarRefs(t_i) < NumberOfVarRefs(t_j)         --> true // enforce non-decreasing number of var refs
+  //  2. NumberOfVarRefs(t_i) > NumberOfVarRefs(t_j)         --> false // enforce non-decreasing number of var refs
+  //  3. for all k variables: VarIdx(k,t_i) > VarIdx(k, t_j) --> false // enforce non-decreasing variable idx
+  // we store the following to make comparisons:
+  // - prevTerm (complete & containing all factors)
+  // - curTerm  (incomplete & containing all completed factors)
+  // - curFactor (incomplete)
   internal class ConstraintHandler {
     private int nVars;
     private readonly int maxVariables;
+    public int prevTermFirstVariableState;
+    public int curTermFirstVariableState;
+    public int prevTermFirstFactorType;
+    public int curTermFirstFactorType;
+    public int prevFactorType;
+    public int curFactorType;
+    public int prevFactorFirstVariableState;
+    public int curFactorFirstVariableState;
+    public int prevVariableRef;
+    private bool invalidExpression;
+    public bool IsInvalidExpression {
+      get { return invalidExpression; }
+    }
+    private TermInformation prevTerm;
+    private TermInformation curTerm;
+    private FactorInformation curFactor;
+    private class TermInformation {
+      // the factors that make up this term
+      public List<FactorInformation> factors = new List<FactorInformation>();
+      // total number of variable references, summed over all factors of the term
+      public int numVarReferences {
+        get {
+          var total = 0;
+          foreach (var factor in factors) total = checked(total + factor.numVarReferences);
+          return total;
+        }
+      }
+    }
+    private class FactorInformation {
+      public int numVarReferences = 0; // number of variable references counted for this factor
+      public int factorType; // use the state number to represent types
+      // for variable factors: state of the referenced variable (-1 while not set)
+      public int variableState = -1;
+      // for exp factors: the variable states added to the factor, in insertion order
+      public List<int> expVariableStates = new List<int>();
+      // for log and inv factors: one list of variable states per term of the polynomial argument
+      public List<List<int>> polyVariableStates = new List<List<int>>();
+    }
 …
+    }
+    // 1) an expression is a sum of terms t_1 ... t_n
+    //    FirstFactorType(t_i) <= FirstFactorType(t_j) for each pair t_i, t_j where i < j
+    //    FirstVarReference(t_i) <= FirstVarReference(t_j) for each pair t_i, t_j where i < j and FirstFactorType(t_i) = FirstFactorType(t_j)
+    // 2) a term is a product of factors, each factor is either a variable factor, an exp factor, a log factor or an inverse factor
+    //    FactorType(f_i) <= FactorType(f_j) for each pair of factors f_i, f_j and i < j
+    //    FirstVarReference(f_i) <= FirstVarReference(f_j) for each pair of factors f_i, f_j and i < j and FactorType(f_i) = FactorType(f_j)
+    // 3) a variable factor is a product of variable references v1...vn
+    //    VarIdx(v_i) <= VarIdx(v_j) for each pair of variable references v_i, v_j and i < j
+    //    (IMPLICIT) FirstVarReference(t) <= VarIdx(v_i) for each variable reference v_i in term t
+    // 4) an exponential factor is the exponential of a product of variables v1...vn
+    //    VarIdx(v_i) <= VarIdx(v_j) for each pair of variable references v_i, v_j and i < j
+    //    (IMPLICIT) FirstVarReference(t) <= VarIdx(v_i) for each variable reference v_i in term t
+    // 5) a log factor is a sum of terms t_i where each term is a product of variables
+    //    FirstVarReference(t_i) <= FirstVarReference(t_j) for each pair of terms t_i, t_j and i < j
+    //    for each term t: VarIdx(v_i) <= VarIdx(v_j) for each pair of variable references v_i, v_j and i < j in t
+    // the order relations for terms and factors
+    private static int CompareTerms(TermInformation a, TermInformation b) {
+      // primary key: total number of variable references (fewer sorts first)
+      var aVarRefs = a.numVarReferences;
+      var bVarRefs = b.numVarReferences;
+      if (aVarRefs != bVarRefs) return aVarRefs < bVarRefs ? -1 : 1;
+      // secondary key: number of factors, where the term with MORE factors sorts first
+      var nFactors = a.factors.Count;
+      if (nFactors != b.factors.Count) return nFactors > b.factors.Count ? -1 : +1;
+      // both terms have the same number of factors => compare them position by position
+      for (int k = 0; k < nFactors; k++) {
+        var c = CompareFactors(a.factors[k], b.factors[k]);
+        if (c != 0) return c < 0 ? -1 : 1;
+      }
+      // no position differs => the terms are considered equal
+      return 0;
+    }
+    private static int CompareFactors(FactorInformation a, FactorInformation b) {
+      // factors of different types are ordered by their type (state number)
+      if (a.factorType != b.factorType) return a.factorType < b.factorType ? -1 : +1;
+      var type = a.factorType;
+      // variable factors: ordered by the state of the referenced variable
+      if (type == Automaton.StateVariableFactorStart) return a.variableState.CompareTo(b.variableState);
+      // exp factors: ordered by their lists of variable states
+      if (type == Automaton.StateExpFactorStart) return CompareStateLists(a.expVariableStates, b.expVariableStates);
+      // all remaining types (log and inv): fewer variable references sort first
+      if (a.numVarReferences != b.numVarReferences) return a.numVarReferences < b.numVarReferences ? -1 : +1;
+      // a polynomial with MORE terms sorts first
+      var nTerms = a.polyVariableStates.Count;
+      if (nTerms != b.polyVariableStates.Count) return nTerms > b.polyVariableStates.Count ? -1 : +1;
+      // same number of terms => the first differing term decides
+      for (int k = 0; k < nTerms; k++) {
+        var c = CompareStateLists(a.polyVariableStates[k], b.polyVariableStates[k]);
+        if (c != 0) return c;
+      }
+      return 0; // all terms of the polynomial are the same
+    }
+    private static int CompareStateLists(List<int> a, List<int> b) {
+      // the shorter list is always the smaller one
+      if (a.Count != b.Count) return a.Count < b.Count ? -1 : +1;
+      // equal length => the first position with different states decides
+      var pos = 0;
+      while (pos < a.Count) {
+        if (a[pos] != b[pos]) return a[pos] < b[pos] ? -1 : +1;
+        pos++;
+      }
+      return 0; // identical lists
+    }
+    private bool IsNewTermAllowed() {
+      // without a previous term there is nothing to compare with
+      if (prevTerm == null) return true;
+      // a later term needs room for at least as many variable references as the previous term has
+      var required = prevTerm.numVarReferences;
+      return nVars + required <= maxVariables;
+    }
+    private bool IsNewFactorAllowed() {
+      // the first factor of a term has no predecessor to compare with
+      var completed = curTerm.factors;
+      if (completed.Count == 0) return true;
+      // otherwise there must be room for as many variable references as the previous factor has
+      var prevFactor = completed[completed.Count - 1];
+      return nVars + prevFactor.numVarReferences <= maxVariables;
+    }
+    private bool IsAllowedAsNextFactorType(int followState) { // followState is the factor-type state that would be entered next; returns false if it must be rejected
+      // IsNewTermAllowed already ensures that we can add a term with enough variable references
+      // enforce constraints within terms (compare to prev factor)
+      if (curTerm.factors.Any()) {
+        // enforce non-decreasing factor types
+        if (curTerm.factors.Last().factorType > followState) return false;
+        // when the factor type is the same, starting a new factor is only allowed if we can add at least the number of variables of the prev factor
+        if (curTerm.factors.Last().factorType == followState && nVars + curTerm.factors.Last().numVarReferences > maxVariables) return false;
+      }
+      // enforce constraints on terms (compare to prev term)
+      // meaning that we must ensure non-decreasing terms
+      if (prevTerm != null) {
+        // a factor type is only allowed if we can then produce a term that is larger or equal to the prev term
+        // (1) if the number of variable references still remaining is larger than the number of variable references in the prev term
+        //     then it is always possible to build a larger term
+        // (2) otherwise we try to build the largest possible term starting from the current factors in the term.
+        //
+        var numVarRefsRemaining = maxVariables - nVars;
+        Contract.Assert(!curTerm.factors.Any() || curTerm.factors.Last().numVarReferences <= numVarRefsRemaining);
+        if (prevTerm.numVarReferences < numVarRefsRemaining) return true; // case (1)
+        // variable factors must be handled differently because they can only contain one variable reference
+        if (followState == Automaton.StateVariableFactorStart) {
+          // append a maximal variable factor plus a maximal factor of the largest factor type found in the prev term,
+          // the latter using all remaining variable references but one
+          var varF = CreateLargestPossibleFactor(Automaton.StateVariableFactorStart, 1);
+          var maxF = CreateLargestPossibleFactor(prevTerm.factors.Max(f => f.factorType), numVarRefsRemaining - 1);
+          var origFactorCount = curTerm.factors.Count;
+          // temporarily add both factors to the current term
+          curTerm.factors.Add(varF);
+          curTerm.factors.Add(maxF);
+          var c = CompareTerms(prevTerm, curTerm);
+          // restore term (remove the two temporary factors again)
+          curTerm.factors.RemoveRange(origFactorCount, 2);
+          // if the prev term is still larger then this followstate is not allowed
+          if (c > 0) {
+            return false;
+          }
+        } else {
+          var newF = CreateLargestPossibleFactor(followState, numVarRefsRemaining); // maximal factor of the requested type using all remaining references
+          var origFactorCount = curTerm.factors.Count;
+          // temporarily add this factor to the current term
+          curTerm.factors.Add(newF);
+          var c = CompareTerms(prevTerm, curTerm);
+          // restore term (remove the temporary factor again)
+          curTerm.factors.RemoveAt(origFactorCount);
+          // if the prev term is still larger then this followstate is not allowed
+          if (c > 0) {
+            return false;
+          }
+        }
+      }
+      return true;
+    }
+    // builds the largest possible factor of the given kind; every variable state is set to int.MaxValue
+    private FactorInformation CreateLargestPossibleFactor(int factorType, int numVarRefs) {
+      var largest = new FactorInformation { factorType = factorType };
+      if (factorType == Automaton.StateVariableFactorStart) {
+        // a variable factor always holds exactly one reference, numVarRefs is not used here
+        largest.numVarReferences = 1;
+        largest.variableState = int.MaxValue;
+        return largest;
+      }
+      if (factorType == Automaton.StateExpFactorStart) {
+        // exp factor: numVarRefs references, each to the largest possible state
+        largest.numVarReferences = numVarRefs;
+        var remaining = numVarRefs;
+        while (remaining-- > 0) largest.expVariableStates.Add(int.MaxValue);
+        return largest;
+      }
+      if (factorType == Automaton.StateLogFactorStart || factorType == Automaton.StateInvFactorStart) {
+        // log / inv factor: numVarRefs terms, each holding a single maximal variable state
+        largest.numVarReferences = numVarRefs;
+        for (int t = 0; t < numVarRefs; t++)
+          largest.polyVariableStates.Add(new List<int> { int.MaxValue });
+      }
+      // any other factor type yields a factor that only has its type set
+      return largest;
+    }
+    private bool IsAllowedAsNextVariableFactor(int variableState) {
+      Contract.Assert(variableState >= Automaton.FirstDynamicState);
+      var completed = curTerm.factors;
+      // without a previous factor every variable is allowed
+      if (completed.Count == 0) return true;
+      // otherwise the variable state must not be smaller than the one stored in the previous factor
+      return completed[completed.Count - 1].variableState <= variableState;
+    }
+    private bool IsAllowedAsNextInExp(int variableState) { // may variableState be appended to the exp factor currently being built?
+      Contract.Assert(variableState >= Automaton.FirstDynamicState);
+      if (curFactor.expVariableStates.Any() && curFactor.expVariableStates.Last() > variableState) return false; // variable states within the factor must not decrease
+      if (curTerm.factors.Any()) {
+        // try and compare with prev factor: tentatively append the variable ...
+        curFactor.numVarReferences++;
+        curFactor.expVariableStates.Add(variableState);
+        var c = CompareFactors(curTerm.factors.Last(), curFactor);
+        curFactor.numVarReferences--; // ... and undo the tentative change again
+        curFactor.expVariableStates.RemoveAt(curFactor.expVariableStates.Count - 1);
+        return c <= 0; // allowed only if the prev factor is not larger than the extended factor
+      }
+      return true;
+    }
+    // a new term in the polynomial of the current factor may only be started if nVars plus the
+    // number of variable states in the most recently added term does not exceed maxVariables
+    private bool IsNewTermAllowedInPoly() {
+      // read List<int>.Count directly instead of going through LINQ's Count() extension
+      var lastTerm = curFactor.polyVariableStates.Last();
+      return nVars + lastTerm.Count <= maxVariables;
+    }
+    private bool IsAllowedAsNextInPoly(int variableState) {
+      Contract.Assert(variableState >= Automaton.FirstDynamicState);
+      var terms = curFactor.polyVariableStates;
+      // no term has been added yet => nothing to compare with
+      if (terms.Count == 0) return true;
+      var lastTerm = terms[terms.Count - 1];
+      // the last term is still empty => any variable may come first
+      if (lastTerm.Count == 0) return true;
+      // within a term the variable states must be non-decreasing
+      return lastTerm[lastTerm.Count - 1] <= variableState;
+    }
+    private bool IsTermCompleteInPoly() {
+      var terms = curFactor.polyVariableStates;
+      var last = terms.Count - 1;
+      // a single term has no predecessor to compare with
+      if (last == 0) return true;
+      // otherwise the last term must hold at least as many variable states as the term before it
+      return terms[last - 1].Count <= terms[last].Count;
+    }
+    private bool IsCompleteExp() {
+      var completed = curTerm.factors;
+      if (completed.Count == 0) return true; // no previous factor in this term to compare with
+      // the exp factor built so far must not be smaller than the previous factor
+      var prevFactor = completed[completed.Count - 1];
+      return CompareFactors(prevFactor, curFactor) <= 0;
+    }
     public bool IsAllowedFollowState(int currentState, int followState) {
+      // the following states are always allowed
+      // an invalid action was taken earlier on => nothing can be done anymore
+      if (invalidExpression) return false;
+      // states that have no alternative are always allowed
+      // some ending states are only allowed if enough variables have been used in the term
       if (
+        followState == Automaton.StateVariableFactorEnd ||
+        followState == Automaton.StateExpFEnd ||
+        followState == Automaton.StateExpFactorEnd ||
+        followState == Automaton.StateLogTFEnd ||
+        followState == Automaton.StateLogTEnd ||
+        followState == Automaton.StateLogFactorEnd ||
+        followState == Automaton.StateInvTFEnd ||
+        followState == Automaton.StateInvTEnd ||
+        followState == Automaton.StateInvFactorEnd ||
+        followState == Automaton.StateFactorEnd ||
+        followState == Automaton.StateTermEnd ||
+        followState == Automaton.StateExprEnd
+        currentState == Automaton.StateTermStart ||           // no alternative
+        currentState == Automaton.StateExpFactorStart ||
+        currentState == Automaton.StateLogFactorStart ||
+        currentState == Automaton.StateInvFactorStart ||
+        followState == Automaton.StateVariableFactorEnd ||    // no alternative
+        followState == Automaton.StateExpFEnd ||              // no alternative
+        followState == Automaton.StateLogTFEnd ||             // no alternative
+        followState == Automaton.StateInvTFEnd ||             // no alternative
+        followState == Automaton.StateFactorEnd ||            // always allowed because no alternative
+        followState == Automaton.StateExprEnd                 // we could also constrain the minimum number of terms here
       ) return true;
+      // all other states are only allowed if we can add more variables
+      if (nVars >= maxVariables) return false;
+      // the following states are always allowed when we can add more variables
+      // starting a new term is only allowed if we can add a term with at least the number of variables of the prev term
+      if (followState == Automaton.StateTermStart && !IsNewTermAllowed()) return false;
+      if (followState == Automaton.StateFactorStart && !IsNewFactorAllowed()) return false;
+      if (currentState == Automaton.StateFactorStart && !IsAllowedAsNextFactorType(followState)) return false;
+      if (followState == Automaton.StateTermEnd && prevTerm != null && CompareTerms(prevTerm, curTerm) > 0) return false;
+      // all of these states add at least one variable
       if (
+        followState == Automaton.StateTermStart ||
+        followState == Automaton.StateFactorStart ||
+        followState == Automaton.StateExpFStart ||
+        followState == Automaton.StateLogTStart ||
+        followState == Automaton.StateLogTFStart ||
+        followState == Automaton.StateInvTStart ||
+        followState == Automaton.StateInvTFStart
+        ) return true;
+      // enforce non-decreasing factor types
+      if (currentState == Automaton.StateFactorStart) {
+        if (curFactorType < 0) {
+          //    FirstFactorType(t_i) <= FirstFactorType(t_j) for each pair t_i, t_j where i < j
+          return prevTermFirstFactorType <= followState;
+        } else {
+          // FactorType(f_i) <= FactorType(f_j) for each pair of factors f_i, f_j and i < j
+          return curFactorType <= followState;
+        }
+      }
+      // enforce non-decreasing variables references in variable and exp factors
+      if (currentState == Automaton.StateVariableFactorStart || currentState == Automaton.StateExpFStart || currentState == Automaton.StateLogTFStart || currentState == Automaton.StateInvTFStart) {
+        if (prevVariableRef > followState) return false; // never allow decreasing variables
+        if (prevFactorType < 0) {
+          // FirstVarReference(t_i) <= FirstVarReference(t_j) for each pair t_i, t_j where i < j
+          return prevTermFirstVariableState <= followState;
+        } else if (prevFactorType == curFactorType) {
+          // (FirstVarReference(f_i) <= FirstVarReference(f_j) for each pair of factors f_i, f_j and i < j and FactorType(f_i) = FactorType(f_j)
+          return prevFactorFirstVariableState <= followState;
+        }
+      }
+      return true;
+          followState == Automaton.StateVariableFactorStart ||
+          followState == Automaton.StateExpFactorStart || followState == Automaton.StateExpFStart ||
+          followState == Automaton.StateLogFactorStart || followState == Automaton.StateLogTStart ||
+          followState == Automaton.StateLogTFStart ||
+          followState == Automaton.StateInvFactorStart || followState == Automaton.StateInvTStart ||
+          followState == Automaton.StateInvTFStart) {
+        if (nVars + 1 > maxVariables) return false;
+      }
+      if (currentState == Automaton.StateVariableFactorStart && !IsAllowedAsNextVariableFactor(followState)) return false;
+      else if (currentState == Automaton.StateExpFStart && !IsAllowedAsNextInExp(followState)) return false;
+      else if (followState == Automaton.StateLogTStart && !IsNewTermAllowedInPoly()) return false;
+      else if (currentState == Automaton.StateLogTFStart && !IsAllowedAsNextInPoly(followState)) return false;
+      else if (followState == Automaton.StateInvTStart && !IsNewTermAllowedInPoly()) return false;
+      else if (currentState == Automaton.StateInvTFStart && !IsAllowedAsNextInPoly(followState)) return false;
+      // finishing an exponential factor is only allowed when the number of variable references is large enough
+      else if (followState == Automaton.StateExpFactorEnd && !IsCompleteExp()) return false;
+      // finishing a polynomial (in log or inv) is only allowed when the number of variable references is large enough
+      else if (followState == Automaton.StateInvTEnd && !IsTermCompleteInPoly()) return false;
+      else if (followState == Automaton.StateLogTEnd && !IsTermCompleteInPoly()) return false;
+      else if (nVars > maxVariables) return false;
+      else return true;
+    }
 …
     public void Reset() { // restores the initial state: no variable references counted, no term or factor in progress
       nVars = 0;
+      prevTermFirstVariableState = -1; // -1 is the "not set" value of the markers below (they are tested with < 0 elsewhere)
+      curTermFirstVariableState = -1;
+      prevTermFirstFactorType = -1;
+      curTermFirstFactorType = -1;
+      prevVariableRef = -1;
+      prevFactorType = -1;
+      curFactorType = -1;
+      curFactorFirstVariableState = -1;
+      prevFactorFirstVariableState = -1;
+      prevTerm = null; // no completed term yet
+      curTerm = null;
+      curFactor = null;
+      invalidExpression = false; // the expression starts out valid
+    }
     public void StartTerm() { // begins a new term: current-term markers move to the prev-term slots, per-factor markers are cleared
+      // reset factor type. in each term we can start with each type of factor
+      prevTermFirstVariableState = curTermFirstVariableState;
+      curTermFirstVariableState = -1;
+      prevTermFirstFactorType = curTermFirstFactorType;
+      curTermFirstFactorType = -1;
+      prevFactorType = -1;
+      curFactorType = -1;
+      curFactorFirstVariableState = -1;
+      prevFactorFirstVariableState = -1;
+      curTerm = new TermInformation(); // completed factors of the new term are appended here by EndFactor
+    }
     public void StartFactor(int state) { // begins a new factor; state is stored as the factor's type
+      prevFactorType = curFactorType; // remember type and first variable of the factor before this one
+      curFactorType = -1;
+      prevFactorFirstVariableState = curFactorFirstVariableState;
+      curFactorFirstVariableState = -1;
+      // store the first factor type
+      if (curTermFirstFactorType < 0) {
+        curTermFirstFactorType = state;
+      }
+      curFactorType = state;
+      // reset variable references. in each factor we can start with each variable reference
+      prevVariableRef = -1;
+      curFactor = new FactorInformation(); // information about the factor that is now being built
+      curFactor.factorType = state;
+    }
     public void AddVarToCurrentFactor(int state) { // records one more variable reference (given by its state) in the current factor
+      Contract.Assert(prevVariableRef <= state);
+      // store the first variable reference for each factor
+      if (curFactorFirstVariableState < 0) {
+        curFactorFirstVariableState = state;
+        // store the first variable reference for each term
+        if (curTermFirstVariableState < 0) {
+          curTermFirstVariableState = state;
+        }
+      }
+      prevVariableRef = state;
+      Contract.Assert(Automaton.FirstDynamicState <= state);
+      Contract.Assert(curTerm != null);
+      Contract.Assert(curFactor != null);
       nVars++;
+      curFactor.numVarReferences++;
+      if (curFactor.factorType == Automaton.StateVariableFactorStart) { // where the state is stored depends on the factor type
+        Contract.Assert(curFactor.variableState < 0); // not set before
+        curFactor.variableState = state;
+      } else if (curFactor.factorType == Automaton.StateExpFactorStart) {
+        curFactor.expVariableStates.Add(state);
+      } else if (curFactor.factorType == Automaton.StateLogFactorStart ||
+                 curFactor.factorType == Automaton.StateInvFactorStart) {
+        curFactor.polyVariableStates.Last().Add(state); // goes into the most recently started term of the polynomial
+      } else throw new InvalidProgramException(); // any other factor type is not handled here
+    }
+    public void StartNewTermInPoly() { // opens a new, initially empty term in the polynomial of the current factor
+      curFactor.polyVariableStates.Add(new List<int>());
+    }
     public void EndFactor() { // completes the current factor and appends it to the current term
+      Contract.Assert(prevFactorFirstVariableState <= curFactorFirstVariableState);
+      Contract.Assert(prevFactorType <= curFactorType);
+      // enforce non-decreasing factors: a factor smaller than its predecessor marks the whole expression as invalid
+      if (curTerm.factors.Any() && CompareFactors(curTerm.factors.Last(), curFactor) > 0)
+        invalidExpression = true;
+      curTerm.factors.Add(curFactor); // the factor is appended even when the expression was marked invalid
+      curFactor = null; // no factor in progress anymore
+    }
     public void EndTerm() { // completes the current term, which then becomes the previous term
+      Contract.Assert(prevFactorType <= curFactorType);
+      Contract.Assert(prevTermFirstVariableState <= curTermFirstVariableState);
+      // enforce non-decreasing terms (TODO: equal terms should not be allowed)
+      if (prevTerm != null && CompareTerms(prevTerm, curTerm) > 0)
+        invalidExpression = true; // a term smaller than its predecessor marks the whole expression as invalid
+      prevTerm = curTerm;
+      curTerm = null; // no term in progress anymore
+    }
+  }

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Disassembler.cs

r13645	r15060
2	2	/* HeuristicLab
3	3	* Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4		* and the BEACON Center for the Study of Evolution in Action.
5	4	*
6	5	* This file is part of HeuristicLab.
…	…
24	23
25	24	namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression {
26		~~#if DEBUG~~
27	25	internal class Disassembler {
28	26	public static string CodeToString(byte[] code, double[] consts) {
…	…
40	38	case (byte)OpCodes.LoadVar:
41	39	{
42		short arg = (short)((~~(short)code[pc] << 8) \| (short)~~code[pc + 1]);
	40	short arg = (short)((code[pc] << 8) \| code[pc + 1]);
43	41	pc += 2;
44	42	sb.AppendFormat(" var{0} ", arg); break;
…	…
52	50	}
53	51	}
54		~~#endif~~
55	52	}

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/ExpressionEvaluator.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
   internal class ExpressionEvaluator {
     // manages its own vector buffers
+    private readonly List<double[]> vectorBuffers = new List<double[]>();
+    private readonly List<double[]> scalarBuffers = new List<double[]>(); // scalars are vectors of length 1 (to allow mixing scalars and vectors on the same stack)
+    private readonly double[][] vectorBuffers;
+    private readonly double[][] scalarBuffers; // scalars are vectors of length 1 (to allow mixing scalars and vectors on the same stack)
+    private int lastVecBufIdx;
+    private int lastScalarBufIdx;
     private double[] GetVectorBuffer() {
+      var v = vectorBuffers[vectorBuffers.Count - 1];
+      vectorBuffers.RemoveAt(vectorBuffers.Count - 1);
+      return v;
+      return vectorBuffers[--lastVecBufIdx];
+    }
     private double[] GetScalarBuffer() {
+      var v = scalarBuffers[scalarBuffers.Count - 1];
+      scalarBuffers.RemoveAt(scalarBuffers.Count - 1);
+      return v;
+      return scalarBuffers[--lastScalarBufIdx];
+    }
     private void ReleaseBuffer(double[] buf) {
+      (buf.Length == 1 ? scalarBuffers : vectorBuffers).Add(buf);
+      if (buf.Length == 1) {
+        scalarBuffers[lastScalarBufIdx++] = buf;
+      } else {
+        vectorBuffers[lastVecBufIdx++] = buf;
+      }
+    }
 …
       // preallocate buffers
+      vectorBuffers = new double[MaxStackSize * (1 + MaxParams)][];
+      scalarBuffers = new double[MaxStackSize * (1 + MaxParams)][];
       for (int i = 0; i < MaxStackSize; i++) {
         ReleaseBuffer(new double[vLen]);
 …
       short arg;
       // checked at the end to make sure we do not leak buffers
       int initialScalarCount = scalarBuffers.Count;
       int initialVectorCount = vectorBuffers.Count;
+      int initialScalarCount = lastScalarBufIdx;
+      int initialVectorCount = lastVecBufIdx;
       while (true) {
 …
                 var f = 1.0 / (maxFx * consts[curParamIdx]);
                 // adjust c so that maxFx*c = 1
+                // adjust c so that maxFx*c = 1 TODO: this is not ideal as it enforces positive arguments to exp()
                 consts[curParamIdx] *= f;
 …
+            }
             ReleaseBuffer(r);
             Contract.Assert(vectorBuffers.Count == initialVectorCount);
             Contract.Assert(scalarBuffers.Count == initialScalarCount);
+            Contract.Assert(lastVecBufIdx == initialVectorCount);
+            Contract.Assert(lastScalarBufIdx == initialScalarCount);
             return;
+        }
 …
       // checked at the end to make sure we do not leak buffers
       int initialScalarCount = scalarBuffers.Count;
       int initialVectorCount = vectorBuffers.Count;
+      int initialScalarCount = lastScalarBufIdx;
+      int initialVectorCount = lastVecBufIdx;
       while (true) {
 …
+            }
             Contract.Assert(vectorBuffers.Count == initialVectorCount);
             Contract.Assert(scalarBuffers.Count == initialScalarCount);
+            Contract.Assert(lastVecBufIdx == initialVectorCount);
+            Contract.Assert(lastScalarBufIdx == initialScalarCount);
             return; // break loop
+        }
 …
       s = 0;
       if (op == (byte)OpCodes.LoadVar) {
         s = (short)(((short)code[pc] << 8) | (short)code[pc + 1]);
+        s = (short)((code[pc] << 8) | code[pc + 1]);
         pc += 2;
+      }

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/MctsSymbolicRegressionAlgorithm.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
 using System.Runtime.CompilerServices;
 using System.Threading;
+using HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies;
 using HeuristicLab.Analysis;
 using HeuristicLab.Common;
 …
     private const string AllowedFactorsParameterName = "Allowed factors";
     private const string ConstantOptimizationIterationsParameterName = "Iterations (constant optimization)";
     private const string CParameterName = "C";
+    private const string PolicyParameterName = "Policy";
     private const string SeedParameterName = "Seed";
     private const string SetSeedRandomlyParameterName = "SetSeedRandomly";
 …
       get { return (IFixedValueParameter<IntValue>)Parameters[IterationsParameterName]; }
+    }
     public IFixedValueParameter<IntValue> MaxSizeParameter {
+    public IFixedValueParameter<IntValue> MaxVariableReferencesParameter {
       get { return (IFixedValueParameter<IntValue>)Parameters[MaxVariablesParameterName]; }
+    }
 …
       get { return (IFixedValueParameter<IntValue>)Parameters[ConstantOptimizationIterationsParameterName]; }
+    }
     public IFixedValueParameter<DoubleValue> CParameter {
       get { return (IFixedValueParameter<DoubleValue>)Parameters[CParameterName]; }
+    public IValueParameter<IPolicy> PolicyParameter {
+      get { return (IValueParameter<IPolicy>)Parameters[PolicyParameterName]; }
+    }
     public IFixedValueParameter<DoubleValue> PunishmentFactorParameter {
 …
       set { SetSeedRandomlyParameter.Value.Value = value; }
+    }
+    public int MaxSize {
+      get { return MaxSizeParameter.Value.Value; }
+      set { MaxSizeParameter.Value.Value = value; }
+    }
+    public double C {
+      get { return CParameter.Value.Value; }
+      set { CParameter.Value.Value = value; }
+    }
+    public int MaxVariableReferences {
+      get { return MaxVariableReferencesParameter.Value.Value; }
+      set { MaxVariableReferencesParameter.Value.Value = value; }
+    }
+    public IPolicy Policy {
+      get { return PolicyParameter.Value; }
+      set { PolicyParameter.Value = value; }
+    }
     public double PunishmentFactor {
       get { return PunishmentFactorParameter.Value.Value; }
 …
       Parameters.Add(new FixedValueParameter<IntValue>(MaxVariablesParameterName,
         "Maximal number of variables references in the symbolic regression models (multiple usages of the same variable are counted)", new IntValue(5)));
+      Parameters.Add(new FixedValueParameter<DoubleValue>(CParameterName,
+        "Balancing parameter in UCT formula (0 < c < 1000). Small values: greedy search. Large values: enumeration. Default: 1.0", new DoubleValue(1.0)));
+      // Parameters.Add(new FixedValueParameter<DoubleValue>(CParameterName,
+      //   "Balancing parameter in UCT formula (0 < c < 1000). Small values: greedy search. Large values: enumeration. Default: 1.0", new DoubleValue(1.0)));
+      Parameters.Add(new ValueParameter<IPolicy>(PolicyParameterName,
+        "The policy to use for selecting nodes in MCTS (e.g. Ucb)", new Ucb()));
+      PolicyParameter.Hidden = true;
       Parameters.Add(new ValueParameter<ICheckedItemList<StringValue>>(AllowedFactorsParameterName,
         "Choose which expressions are allowed as factors in the model.", defaultFactorsList));
 …
       Results.Add(new Result("Iterations", iterations));
+      var bestSolutionIteration = new IntValue(0);
+      Results.Add(new Result("Best solution iteration", bestSolutionIteration));
       var table = new DataTable("Qualities");
       table.Rows.Add(new DataRow("Best quality"));
 …
       var avgQuality = new DoubleValue();
       Results.Add(new Result("Average quality", avgQuality));
+      var totalRollouts = new IntValue();
+      Results.Add(new Result("Total rollouts", totalRollouts));
+      var effRollouts = new IntValue();
+      Results.Add(new Result("Effective rollouts", effRollouts));
+      var funcEvals = new IntValue();
+      Results.Add(new Result("Function evaluations", funcEvals));
+      var gradEvals = new IntValue();
+      Results.Add(new Result("Gradient evaluations", gradEvals));
       // same as in SymbolicRegressionSingleObjectiveProblem
 …
       var problemData = (IRegressionProblemData)Problem.ProblemData.Clone();
       if (!AllowedFactors.CheckedItems.Any()) throw new ArgumentException("At least on type of factor must be allowed");
+      var state = MctsSymbolicRegressionStatic.CreateState(problemData, (uint)Seed, MaxSize, C, ScaleVariables, ConstantOptimizationIterations,
+      var state = MctsSymbolicRegressionStatic.CreateState(problemData, (uint)Seed, MaxVariableReferences, ScaleVariables, ConstantOptimizationIterations,
+        Policy,
         lowerLimit, upperLimit,
         allowProdOfVars: AllowedFactors.CheckedItems.Any(s => s.Value.Value == VariableProductFactorName),
 …
       double bestQ = 0.0;
       double curBestQ = 0.0;
-      double q = 0.0;
       int n = 0;
       // Loop until iteration limit reached or canceled.
 …
         cancellationToken.ThrowIfCancellationRequested();
         q = MctsSymbolicRegressionStatic.MakeStep(state);
+        var q = MctsSymbolicRegressionStatic.MakeStep(state);
         sumQ += q; // sum of qs in the last updateinterval iterations
         curBestQ = Math.Max(q, curBestQ); // the best q in the last updateinterval iterations
 …
         // iteration results
         if (n == updateInterval) {
+          if (bestQ > bestQuality.Value) {
+            bestSolutionIteration.Value = i;
+          }
           bestQuality.Value = bestQ;
           curQuality.Value = curBestQ;
 …
           sumQ = 0.0;
           curBestQ = 0.0;
+          funcEvals.Value = state.FuncEvaluations;
+          gradEvals.Value = state.GradEvaluations;
+          effRollouts.Value = state.EffectiveRollouts;
+          totalRollouts.Value = state.TotalRollouts;
           table.Rows["Best quality"].Values.Add(bestQuality.Value);
 …
       // final results
       if (n > 0) {
+        if (bestQ > bestQuality.Value) {
+          bestSolutionIteration.Value = iterations.Value + n;
+        }
         bestQuality.Value = bestQ;
         curQuality.Value = curBestQ;
         avgQuality.Value = sumQ / n;
+        funcEvals.Value = state.FuncEvaluations;
+        gradEvals.Value = state.GradEvaluations;
+        effRollouts.Value = state.EffectiveRollouts;
+        totalRollouts.Value = state.TotalRollouts;
         table.Rows["Best quality"].Values.Add(bestQuality.Value);
 …
         table.Rows["Average quality"].Values.Add(avgQuality.Value);
         iterations.Value = iterations.Value + n;
+      }
 …
       Results.Add(new Result("Best solution quality (train)", new DoubleValue(state.BestSolutionTrainingQuality)));
       Results.Add(new Result("Best solution quality (test)", new DoubleValue(state.BestSolutionTestQuality)));
       // produce solution

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/MctsSymbolicRegressionStatic.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
 using System.Diagnostics.Contracts;
 using System.Linq;
+using HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies;
 using HeuristicLab.Common;
 using HeuristicLab.Core;
 …
       double BestSolutionTrainingQuality { get; }
       double BestSolutionTestQuality { get; }
+      int TotalRollouts { get; }
+      int EffectiveRollouts { get; }
+      int FuncEvaluations { get; }
+      int GradEvaluations { get; } // number of gradient evaluations (* num parameters) to get a value representative of the effort comparable to the number of function evaluations
+      // TODO other stats on LM optimizer might be interesting here
+    }
 …
       internal readonly Automaton automaton;
       internal IRandom random { get; private set; }
-      internal readonly double c;
       internal readonly Tree tree;
-      internal readonly List<Tree> bestChildrenBuf;
       internal readonly Func<byte[], int, double> evalFun;
+      internal readonly IPolicy treePolicy;
+      // MCTS might get stuck. Track statistics on the number of effective rollouts
+      internal int totalRollouts;
+      internal int effectiveRollouts;
 …
       private double[] bestConsts;
+      // stats
+      private int funcEvaluations;
+      private int gradEvaluations;
       // buffers
       private readonly double[] ones; // vector of ones (as default params)
 …
       private readonly double[][] gradBuf;
+      public State(IRegressionProblemData problemData, uint randSeed, int maxVariables, double c, bool scaleVariables, int constOptIterations,
+      public State(IRegressionProblemData problemData, uint randSeed, int maxVariables, bool scaleVariables, int constOptIterations,
+        IPolicy treePolicy = null,
         double lowerEstimationLimit = double.MinValue, double upperEstimationLimit = double.MaxValue,
         bool allowProdOfVars = true,
 …
         this.problemData = problemData;
-        this.c = c;
         this.constOptIterations = constOptIterations;
         this.evalFun = this.Eval;
 …
         this.automaton = new Automaton(x, maxVariables, allowProdOfVars, allowExp, allowLog, allowInv, allowMultipleTerms);
+        this.tree = new Tree() { state = automaton.CurrentState };
+        this.treePolicy = treePolicy ?? new Ucb();
+        this.tree = new Tree() { state = automaton.CurrentState, actionStatistics = treePolicy.CreateActionStatistics() };
         // reset best solution
 …
         this.ones = Enumerable.Repeat(1.0, MaxParams).ToArray();
         constsBuf = new double[MaxParams];
-        this.bestChildrenBuf = new List<Tree>(2 * x.Length); // the number of follow states in the automaton is O(number of variables) 2 * number of variables should be sufficient (capacity is increased if necessary anyway)
         this.predBuf = new double[y.Length];
         this.testPredBuf = new double[testY.Length];
 …
       #region IState inferface
       public bool Done { get { return tree != null && tree.done; } }
+      public bool Done { get { return tree != null && tree.Done; } }
       public double BestSolutionTrainingQuality {
 …
           var treeGen = new SymbolicExpressionTreeGenerator(problemData.AllowedInputVariables.ToArray());
           var interpreter = new SymbolicDataAnalysisExpressionTreeLinearInterpreter();
-          var simplifier = new SymbolicDataAnalysisExpressionTreeSimplifier();
           var t = new SymbolicExpressionTree(treeGen.Exec(bestCode, bestConsts, bestNParams, scalingFactor, scalingOffset));
+          var simpleT = simplifier.Simplify(t);
+          var model = new SymbolicRegressionModel(simpleT, interpreter, lowerEstimationLimit, upperEstimationLimit);
+          var model = new SymbolicRegressionModel(t, interpreter, lowerEstimationLimit, upperEstimationLimit);
           // model has already been scaled linearly in Eval
 …
+        }
+      }
+      public int TotalRollouts { get { return totalRollouts; } }
+      public int EffectiveRollouts { get { return effectiveRollouts; } }
+      public int FuncEvaluations { get { return funcEvaluations; } }
+      public int GradEvaluations { get { return gradEvaluations; } } // number of gradient evaluations (* num parameters) to get a value representative of the effort comparable to the number of function evaluations
       #endregion
 …
         Array.Copy(ones, constsBuf, nParams);
         evaluator.Exec(code, x, constsBuf, predBuf, adjustOffsetForLogAndExp: true);
+        funcEvaluations++;
         // calc opt scaling (alpha*f(x) + beta)
 …
           // optimize constants using the starting point calculated above
           OptimizeConstsLm(code, constsBuf, nParams, 0.0, nIters: constOptIterations);
           evaluator.Exec(code, x, constsBuf, predBuf);
+          funcEvaluations++;
           rsq = RSq(y, predBuf);
           optConsts = constsBuf;
 …
       private void OptimizeConstsLm(byte[] code, double[] consts, int nParams, double epsF = 0.0, int nIters = 100) {
         double[] optConsts = new double[nParams]; // allocate a smaller buffer for constants opt
+        double[] optConsts = new double[nParams]; // allocate a smaller buffer for constants opt (TODO perf?)
         Array.Copy(consts, optConsts, nParams);
 …
         alglib.minlmoptimize(state, Func, FuncAndJacobian, null, code);
         alglib.minlmresults(state, out optConsts, out rep);
+        funcEvaluations += rep.nfunc;
+        gradEvaluations += rep.njac * nParams;
         if (rep.terminationtype < 0) throw new ArgumentException("lm failed: termination type = " + rep.terminationtype);
 …
       private void Func(double[] arg, double[] fi, object obj) {
-        // 0.5 * MSE and gradient
         var code = (byte[])obj;
         evaluator.Exec(code, x, arg, predBuf); // gradients are nParams x vLen
 …
+    }
+    public static IState CreateState(IRegressionProblemData problemData, uint randSeed, int maxVariables = 3, double c = 1.0,
+      bool scaleVariables = true, int constOptIterations = 0, double lowerEstimationLimit = double.MinValue, double upperEstimationLimit = double.MaxValue,
+    public static IState CreateState(IRegressionProblemData problemData, uint randSeed, int maxVariables = 3,
+      bool scaleVariables = true, int constOptIterations = 0,
+      IPolicy policy = null,
+      double lowerEstimationLimit = double.MinValue, double upperEstimationLimit = double.MaxValue,
       bool allowProdOfVars = true,
       bool allowExp = true,
 …
       bool allowMultipleTerms = false
       ) {
+      return new State(problemData, randSeed, maxVariables, c, scaleVariables, constOptIterations,
+      return new State(problemData, randSeed, maxVariables, scaleVariables, constOptIterations,
+        policy,
         lowerEstimationLimit, upperEstimationLimit,
         allowProdOfVars, allowExp, allowLog, allowInv, allowMultipleTerms);
 …
       var tree = mctsState.tree;
       var eval = mctsState.evalFun;
-      var bestChildrenBuf = mctsState.bestChildrenBuf;
       var rand = mctsState.random;
+      double c = mctsState.c;
+      automaton.Reset();
+      return TreeSearchRec(rand, tree, c, automaton, eval, bestChildrenBuf);
+    }
+    private static double TreeSearchRec(IRandom rand, Tree tree, double c, Automaton automaton, Func<byte[], int, double> eval, List<Tree> bestChildrenBuf) {
+      var treePolicy = mctsState.treePolicy;
+      double q = 0;
+      bool success = false;
+      do {
+        automaton.Reset();
+        success = TryTreeSearchRec(rand, tree, automaton, eval, treePolicy, out q);
+        mctsState.totalRollouts++;
+      } while (!success && !tree.Done);
+      mctsState.effectiveRollouts++;
+      return q;
+    }
+    // tree search might fail because of constraints on expressions;
+    // if we get stuck in such a case we just restart
+    // see ConstraintHandler.cs for more info
+    private static bool TryTreeSearchRec(IRandom rand, Tree tree, Automaton automaton, Func<byte[], int, double> eval, IPolicy treePolicy,
+      out double q) {
       Tree selectedChild = null;
-      double q;
       Contract.Assert(tree.state == automaton.CurrentState);
       Contract.Assert(!tree.done);
+      Contract.Assert(!tree.Done);
       if (tree.children == null) {
         if (automaton.IsFinalState(tree.state)) {
           // final state
           tree.done = true;
+          tree.Done = true;
           // EVALUATE
 …
           automaton.GetCode(out code, out nParams);
           q = eval(code, nParams);
+          tree.visits++;
           tree.sumQuality += q;
           return q;
+          treePolicy.Update(tree.actionStatistics, q);
+          return true; // we reached a final state
         } else {
           // EXPAND
 …
           int nFs;
           automaton.FollowStates(automaton.CurrentState, out possibleFollowStates, out nFs);
+          if (nFs == 0) {
+            // stuck in a dead end (no final state and no allowed follow states)
+            q = 0;
+            tree.Done = true;
+            tree.children = null;
+            return false;
+          }
           tree.children = new Tree[nFs];
+          for (int i = 0; i < tree.children.Length; i++) tree.children[i] = new Tree() { children = null, done = false, state = possibleFollowStates[i], visits = 0 };
+          selectedChild = SelectFinalOrRandom(automaton, tree, rand);
+          for (int i = 0; i < tree.children.Length; i++)
+            tree.children[i] = new Tree() { children = null, state = possibleFollowStates[i], actionStatistics = treePolicy.CreateActionStatistics() };
+          selectedChild = nFs > 1 ? SelectFinalOrRandom(automaton, tree, rand) : tree.children[0];
+        }
       } else {
         // tree.children != null
         // UCT selection within tree
+        selectedChild = SelectUct(tree, rand, c, bestChildrenBuf);
+        int selectedIdx = 0;
+        if (tree.children.Length > 1) {
+          selectedIdx = treePolicy.Select(tree.children.Select(ch => ch.actionStatistics), rand);
+        }
+        selectedChild = tree.children[selectedIdx];
+      }
       // make selected step and recurse
       automaton.Goto(selectedChild.state);
+      q = TreeSearchRec(rand, selectedChild, c, automaton, eval, bestChildrenBuf);
+      tree.sumQuality += q;
+      tree.visits++;
+      // tree.done = tree.children.All(ch => ch.done);
+      tree.done = true; for (int i = 0; i < tree.children.Length && tree.done; i++) tree.done = tree.children[i].done;
+      if (tree.done) {
+        tree.children = null; // cut of the sub-branch if it has been fully explored
+        // TODO: update all qualities and visits to remove the information gained from this whole branch
+      }
+      return q;
+    }
+    private static Tree SelectUct(Tree tree, IRandom rand, double c, List<Tree> bestChildrenBuf) {
+      // determine total tries of still active children
+      int totalTries = 0;
+      bestChildrenBuf.Clear();
+      for (int i = 0; i < tree.children.Length; i++) {
+        var ch = tree.children[i];
+        if (ch.done) continue;
+        if (ch.visits == 0) bestChildrenBuf.Add(ch);
+        else totalTries += tree.children[i].visits;
+      }
+      // if there are unvisited children select a random child
+      if (bestChildrenBuf.Any()) {
+        return bestChildrenBuf[rand.Next(bestChildrenBuf.Count)];
+      }
+      Contract.Assert(totalTries > 0); // the tree is not done yet so there is at least on child that is not done
+      double logTotalTries = Math.Log(totalTries);
+      var bestQ = double.NegativeInfinity;
+      for (int i = 0; i < tree.children.Length; i++) {
+        var ch = tree.children[i];
+        if (ch.done) continue;
+        var childQ = ch.AverageQuality + c * Math.Sqrt(logTotalTries / ch.visits);
+        if (childQ > bestQ) {
+          bestChildrenBuf.Clear();
+          bestChildrenBuf.Add(ch);
+          bestQ = childQ;
+        } else if (childQ >= bestQ) {
+          bestChildrenBuf.Add(ch);
+        }
+      }
+      return bestChildrenBuf.Count > 0 ? bestChildrenBuf[rand.Next(bestChildrenBuf.Count)] : bestChildrenBuf[0];
+      var success = TryTreeSearchRec(rand, selectedChild, automaton, eval, treePolicy, out q);
+      if (success) {
+        // only update if successful
+        treePolicy.Update(tree.actionStatistics, q);
+      }
+      tree.Done = tree.children.All(ch => ch.Done);
+      if (tree.Done) {
+        tree.children = null; // cut off the sub-branch if it has been fully explored
+      }
+      return success;
+    }
 …
+        }
+      }
       // no final state -> select a random child
+      // no final state -> select the first child
       if (selectedChildIdx == -1) {
         selectedChildIdx = rand.Next(tree.children.Length);
+        selectedChildIdx = 0;
+      }
       return tree.children[selectedChildIdx];

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/OpCodes.cs

r13645	r15060
2	2	/* HeuristicLab
3	3	* Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
4		* and the BEACON Center for the Study of Evolution in Action.
5	4	*
6	5	* This file is part of HeuristicLab.

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/EpsGreedy.cs

-                      r13659
+                      r15060
 using HeuristicLab.Data;
 using HeuristicLab.Parameters;
+using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies {
+  [StorableClass]
   [Item("EpsilonGreedy", "Epsilon greedy policy with parameter eps to balance between exploitation and exploration")]
   internal class EpsilonGreedy : PolicyBase {
+  public class EpsilonGreedy : PolicyBase {
     private class ActionStatistics : IActionStatistics {
       public double SumQuality { get; set; }
 …
+    }
+    private EpsilonGreedy(EpsilonGreedy original, Cloner cloner)
+    [StorableConstructor]
+    protected EpsilonGreedy(bool deserializing) : base(deserializing) { }
+    protected EpsilonGreedy(EpsilonGreedy original, Cloner cloner)
       : base(original, cloner) {
+    }

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/PolicyBase.cs

-                      r13659
+                      r15060
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies {
   [StorableClass]
   internal abstract class PolicyBase : Item, IParameterizedItem, IPolicy {
+  public abstract class PolicyBase : Item, IParameterizedItem, IPolicy {
     [Storable]
     public IKeyedItemCollection<string, IParameter> Parameters { get; private set; }
     [StorableConstructor]
     private PolicyBase(bool deserializing) : base(deserializing) { }
+    protected PolicyBase(bool deserializing) : base(deserializing) { }
     protected PolicyBase(PolicyBase original, Cloner cloner)
       : base(original, cloner) {

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/Ucb.cs

-                      r13659
+                      r15060
 using HeuristicLab.Data;
 using HeuristicLab.Parameters;
+using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies {
+  [StorableClass]
   [Item("Ucb Policy", "Ucb with parameter c to balance between exploitation and exploration")]
   internal class Ucb : PolicyBase {
+  public class Ucb : PolicyBase {
     private class ActionStatistics : IActionStatistics {
       public double SumQuality { get; set; }
 …
+    }
+    private Ucb(Ucb original, Cloner cloner)
+    [StorableConstructor]
+    protected Ucb(bool deserializing) : base(deserializing) { }
+    protected Ucb(Ucb original, Cloner cloner)
       : base(original, cloner) {
+    }

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/UcbTuned.cs

-                      r13659
+                      r15060
 using HeuristicLab.Data;
 using HeuristicLab.Parameters;
+using HeuristicLab.Persistence.Default.CompositeSerializers.Storable;
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies {
+  [StorableClass]
   [Item("UcbTuned Policy", "UcbTuned is similar to Ucb but tracks empirical variance. Use parameter c to balance between exploitation and exploration")]
   internal class UcbTuned : PolicyBase {
+  public class UcbTuned : PolicyBase {
     private class ActionStatistics : IActionStatistics {
       public double SumQuality { get; set; }
 …
+    }
+    private UcbTuned(UcbTuned original, Cloner cloner)
+    [StorableConstructor]
+    protected UcbTuned(bool deserializing) : base(deserializing) { }
+    protected UcbTuned(UcbTuned original, Cloner cloner)
       : base(original, cloner) {
+    }

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/SymbolicExpressionGenerator.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
             break;
           case OpCodes.Add: {
               var t1 = stack[topOfStack];
               var t2 = stack[topOfStack - 1];
+              var t1 = stack[topOfStack - 1];
+              var t2 = stack[topOfStack];
               topOfStack--;
               if (t2.Symbol is Addition) {
                 t2.AddSubtree(t1);
+              if (t1.Symbol is Addition) {
+                t1.AddSubtree(t2);
               } else {
                 var addNode = addSy.CreateTreeNode();
 …
+            }
           case OpCodes.Mul: {
               var t1 = stack[topOfStack];
               var t2 = stack[topOfStack - 1];
+              var t1 = stack[topOfStack - 1];
+              var t2 = stack[topOfStack];
               topOfStack--;
               if (t2.Symbol is Multiplication) {
                 t2.AddSubtree(t1);
+              if (t1.Symbol is Multiplication) {
+                t1.AddSubtree(t2);
               } else {
                 var mulNode = mulSy.CreateTreeNode();
 …
       s = 0;
       if (op == OpCodes.LoadVar) {
         s = (short)(((short)code[pc] << 8) | (short)code[pc + 1]);
+        s = (short)((code[pc] << 8) | code[pc + 1]);
         pc += 2;
+      }

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Tree.cs

-                      r13645
+                      r15060
 /* HeuristicLab
  * Copyright (C) 2002-2015 Heuristic and Evolutionary Algorithms Laboratory (HEAL)
- * and the BEACON Center for the Study of Evolution in Action.
+ *
  * This file is part of HeuristicLab.
 …
 #endregion
+using HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies;
 namespace HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression {
   // represents tree nodes for the search tree in MCTS
   internal class Tree {
     public int state;
+    public int visits;
+    public double sumQuality;
+    public double AverageQuality { get { return sumQuality / (double)visits; } }
+    public bool done;
+    public bool Done {
+      get { return actionStatistics.Done; }
+      set { actionStatistics.Done = value; }
+    }
+    public IActionStatistics actionStatistics;
     public Tree[] children;
+  }

stable/HeuristicLab.Tests

Property svn:mergeinfo changed
/trunk/sources/HeuristicLab.Tests merged: 13648,13651,13654,13661,13708

stable/HeuristicLab.Tests/HeuristicLab.Algorithms.DataAnalysis-3.4/MctsSymbolicRegressionTest.cs

-                      r13648
+                      r15060
 using System;
+using System.Diagnostics.Contracts;
 using System.Linq;
 using System.Threading;
 using HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression;
+using HeuristicLab.Algorithms.DataAnalysis.MctsSymbolicRegression.Policies;
 using HeuristicLab.Data;
 using HeuristicLab.Optimization;
 …
+      {
         // possible solutions with max two variable references:
+        // TODO: equal terms should not be allowed (see ConstraintHandler)
         // x
         // log(x)
 …
         // x * exp(x)
         // x * 1/x
         // x + x
+        // x + x                                        ?
         // x + log(x)
         // x + exp(x)
 …
         // log(x) * exp(x)
         // log(x) * 1/x
         // log(x) + log(x)
         // log(x) + exp(x)
+        // log(x) + log(x)                              ?
+        // log(x) + exp(x)                              ?
         // log(x) + 1/x
         //              -- 6
         // exp(x) * exp(x)
         // exp(x) * 1/x
         // exp(x) + exp(x)
+        // exp(x) + exp(x)                              ?
         // exp(x) + 1/x
         //              -- 4
         // 1/x * 1/x
         // 1/x + 1/x
+        // 1/x + 1/x                                    ?
         //              -- 2
         // log(x+x)
+        // log(x+x)                                     ?
         // log(x*x)
         // exp(x*x)
         // 1/(x+x)
+        // 1/(x+x)                                      ?
         // 1/(x*x)
         //              -- 5
         TestMctsNumberOfSolutions(regProblem, 2, 29);
+      }
 …
         //              -- 2
         // x * x
         // x + x
+        // x + x                                            ?
         // x * exp(x)
         // x + exp(x)
         // exp(x) * exp(x)
         // exp(x) + exp(x)
+        // exp(x) + exp(x)                                  ?
         // exp(x*x)
         //              -- 7
         // x * x * x
+        // x + x * x
+        // x * x + x                                        !!
+        // x + x + x
+        // x + x * x
+        // x + x + x                                        ?
         // x * x * exp(x)
+        // x + x * exp(x)
+        // x * x + exp(x)
+        // x + x + exp(x)
+        // x * exp(x) + x                                   !!
+        // x * exp(x) + exp(x)
+        // x + exp(x) * exp(x)
+        // x + exp(x) + exp(x)
+        // x + x * exp(x)
+        // x + x + exp(x)                                   ?
+        // exp(x) + x*x
+        // exp(x) + x*exp(x)
+        // x + exp(x) * exp(x)
+        // x + exp(x) + exp(x)                              ?
         // x * exp(x) * exp(x)
         // x * exp(x*x)
         // x + exp(x*x)
         //              -- 15
+        //              -- 13
         // exp(x) * exp(x) * exp(x)
+        // exp(x) + exp(x) * exp(x)
+        // exp(x) * exp(x) + exp(x)                         !!
+        // exp(x) + exp(x) + exp(x)
+        //              -- 4
+        // exp(x) + exp(x) * exp(x)
+        // exp(x) + exp(x) + exp(x)                         ?
+        //              -- 3
         // exp(x)   * exp(x*x)
         // exp(x)   + exp(x*x)
+        // exp(x*x) * exp(x)                                !!
+        // exp(x*x) + exp(x)                                !!
+        //              -- 4
+        //              -- 2
         // exp(x*x*x)
         //              -- 1
+        TestMctsNumberOfSolutions(regProblem, 3, 2 + 7 + 15 + 4 + 4 + 1, allowLog: false, allowInv: false);
+        TestMctsNumberOfSolutions(regProblem, 3, 2 + 7 + 13 + 3 + 2 + 1, allowLog: false, allowInv: false);
+      }
+      {
+        // possible solutions with max 4 variable references:
+        // without exp, log and inv
+        // x
+        // x*x
+        // x+x                                             ?
+        // x*x*x
+        // x+x*x
+        // x+x+x                                           ?
+        // x*x*x*x
+        // x+x*x*x
+        // x*x+x*x                                         ?
+        // x+x+x*x                                         ?
+        // x+x+x+x                                         ?
+        TestMctsNumberOfSolutions(regProblem, 4, 11, allowLog: false, allowInv: false, allowExp: false);
+      }
+      {
+        // possible solutions with max 5 variable references:
+        // without exp, log and inv
+        // x
+        // xx
+        // x+x                                             ?
+        // xxx
+        // x+xx
+        // x+x+x                                           ?
+        // xxxx
+        // x+xxx
+        // xx+xx                                           ?
+        // x+x+xx                                          ?
+        // x+x+x+x                                         ?
+        // xxxxx
+        // x+xxxx
+        // xx+xxx
+        // x+x+xxx                                         ?
+        // x+xx+xx                                         ?
+        // x+x+x+xx                                        ?
+        // x+x+x+x+x                                       ?
+        TestMctsNumberOfSolutions(regProblem, 5, 18, allowLog: false, allowInv: false, allowExp: false);
+      }
+    }
 …
     #endregion
     #region Nguyen
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem, successThreshold: 0.99);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem, successThreshold: 0.99);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem, iterations: 10000);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem, 10000, 0.95); // cannot solve exactly in 10000 iterations
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
     #region keijzer
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "long")]
 …
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
+    }
+    // [TestMethod]
+    [TestCategory("Algorithms.DataAnalysis")]
+    [TestProperty("Time", "short")]
+    public void MctsSymbRegBenchmarkKeijzer7() {
+      var provider = new HeuristicLab.Problems.Instances.DataAnalysis.KeijzerInstanceProvider();
+      var regProblem = provider.LoadData(provider.GetDataDescriptors().Single(x => x.Name.Contains("Keijzer 7 f(")));
+      // some Keijzer problem instances have very large test partitions (here we are not concerned about test performance)
+      if (regProblem.TestPartition.End - regProblem.TestPartition.Start > 1000) regProblem.TestPartition.End = regProblem.TestPartition.Start + 1000;
+      TestMcts(regProblem);
+    }
     [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
     public void MctsSymbRegBenchmarkKeijzer7() {
       var provider = new HeuristicLab.Problems.Instances.DataAnalysis.KeijzerInstanceProvider();
       var regProblem = provider.LoadData(provider.GetDataDescriptors().Single(x => x.Name.Contains("Keijzer 7 f(")));
+    // [TestCategory("Algorithms.DataAnalysis")]
+    [TestProperty("Time", "short")]
+    public void MctsSymbRegBenchmarkKeijzer8() {
+      var provider = new HeuristicLab.Problems.Instances.DataAnalysis.KeijzerInstanceProvider();
+      var regProblem = provider.LoadData(provider.GetDataDescriptors().Single(x => x.Name.Contains("Keijzer 8 f(")));
       // some Keijzer problem instances have very large test partitions (here we are not concerned about test performance)
       if (regProblem.TestPartition.End - regProblem.TestPartition.Start > 1000) regProblem.TestPartition.End = regProblem.TestPartition.Start + 1000;
 …
     [TestMethod]
+    [TestCategory("Algorithms.DataAnalysis")]
+    [TestProperty("Time", "short")]
+    public void MctsSymbRegBenchmarkKeijzer8() {
+      var provider = new HeuristicLab.Problems.Instances.DataAnalysis.KeijzerInstanceProvider();
+      var regProblem = provider.LoadData(provider.GetDataDescriptors().Single(x => x.Name.Contains("Keijzer 8 f(")));
+      // some Keijzer problem instances have very large test partitions (here we are not concerned about test performance)
+      if (regProblem.TestPartition.End - regProblem.TestPartition.Start > 1000) regProblem.TestPartition.End = regProblem.TestPartition.Start + 1000;
+      TestMcts(regProblem);
+    }
+    [TestMethod]
+    [TestCategory("Algorithms.DataAnalysis")]
+    // [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
     public void MctsSymbRegBenchmarkKeijzer9() {
 …
+    }
      */
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem, iterations: 10000, allowLog: false, allowExp: false, allowInv: false, successThreshold: 0.99); // cannot solve exactly in 10000 iterations
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       TestMcts(regProblem);
+    }
     [TestMethod]
+    // [TestMethod]
     [TestCategory("Algorithms.DataAnalysis")]
     [TestProperty("Time", "short")]
 …
       mctsSymbReg.Problem = regProblem;
       mctsSymbReg.Iterations = iterations;
+      mctsSymbReg.MaxSize = 10;
+      mctsSymbReg.C = 2; // less greedy
+      mctsSymbReg.MaxVariableReferences = 10;
+      var ucbPolicy = new Ucb();
+      ucbPolicy.C = 2;
+      mctsSymbReg.Policy = ucbPolicy;
       mctsSymbReg.SetSeedRandomly = false;
       mctsSymbReg.Seed = 1234;
 …
     private void TestMctsNumberOfSolutions(IRegressionProblemData problemData, int maxNumberOfVariables, int expectedNumberOfSolutions,
+      bool allowProd = true,
       bool allowExp = true,
       bool allowLog = true,
 …
       regProblem.ProblemDataParameter.Value = problemData;
       #region Algorithm Configuration
+      mctsSymbReg.SetSeedRandomly = false;
+      mctsSymbReg.Seed = 1234;
       mctsSymbReg.Problem = regProblem;
       mctsSymbReg.Iterations = int.MaxValue; // stopping when all solutions have been enumerated
+      mctsSymbReg.MaxSize = maxNumberOfVariables;
+      mctsSymbReg.C = 1000; // essentially breadth first search
+      mctsSymbReg.MaxVariableReferences = maxNumberOfVariables;
+      var ucbPolicy = new Ucb();
+      ucbPolicy.C = 1000; // essentially breadth first search
+      mctsSymbReg.Policy = ucbPolicy;
+      mctsSymbReg.AllowedFactors.SetItemCheckedState(mctsSymbReg.AllowedFactors.Single(s => s.Value.StartsWith("prod")), allowProd);
       mctsSymbReg.AllowedFactors.SetItemCheckedState(mctsSymbReg.AllowedFactors.Single(s => s.Value.Contains("exp")), allowExp);
       mctsSymbReg.AllowedFactors.SetItemCheckedState(mctsSymbReg.AllowedFactors.Single(s => s.Value.Contains("log")), allowLog);

stable/HeuristicLab.Tests/HeuristicLab.Tests.csproj

r14967	r15060
478	478	<Compile Include="HeuristicLab-3.3\ThreadSafeLogTest.cs" />
479	479	<Compile Include="HeuristicLab-3.3\ToStringTest.cs" />
	480	<Compile Include="HeuristicLab.Algorithms.DataAnalysis-3.4\MctsSymbolicRegressionTest.cs" />
480	481	<Compile Include="HeuristicLab.Algorithms.DataAnalysis-3.4\GradientBoostingTest.cs" />
481	482	<Compile Include="HeuristicLab.Algorithms.DataAnalysis-3.4\SupportVectorMachineTest.cs" />

Context Navigation

Legend:

stable

stable/HeuristicLab.Algorithms.DataAnalysis

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/HeuristicLab.Algorithms.DataAnalysis-3.4.csproj

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Automaton.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/CodeGenerator.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/ConstraintHandler.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Disassembler.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/ExpressionEvaluator.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/MctsSymbolicRegressionAlgorithm.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/MctsSymbolicRegressionStatic.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/OpCodes.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/EpsGreedy.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/PolicyBase.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/Ucb.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Policies/UcbTuned.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/SymbolicExpressionGenerator.cs

stable/HeuristicLab.Algorithms.DataAnalysis/3.4/MctsSymbolicRegression/Tree.cs

stable/HeuristicLab.Tests

stable/HeuristicLab.Tests/HeuristicLab.Algorithms.DataAnalysis-3.4/MctsSymbolicRegressionTest.cs

stable/HeuristicLab.Tests/HeuristicLab.Tests.csproj

Download in other formats: