Context Navigation

← Previous Change
Next Change →

GenericPolicy.cs

Timestamp:

08/24/15 13:56:27 (9 years ago)

Author:

gkronber

Message:

#2283: experiments on grammatical optimization algorithms (maxreward instead of avg reward, ...)

File:

1 edited

branches/HeuristicLab.Problems.GrammaticalOptimization-gkr/HeuristicLab.Algorithms.GrammaticalOptimization/SequentialDecisionPolicies/GenericPolicy.cs (modified) (5 diffs)

Legend:

- Unmodified
- Added
- Removed

branches/HeuristicLab.Problems.GrammaticalOptimization-gkr/HeuristicLab.Algorithms.GrammaticalOptimization/SequentialDecisionPolicies/GenericPolicy.cs

-                      r12298
+                      r12893
     private int[] actionIndexMap; // don't allocate each time
     public bool TrySelect(Random random, string curState, IEnumerable<string> afterStates, out int selectedStateIdx) {
+    public bool TrySelect(System.Random random, string curState, IEnumerable<string> afterStates, out int selectedStateIdx) {
       // fail if all states are done (corresponding state infos are disabled)
       if (afterStates.All(s => Done(s))) {
 …
     private int SelectBoltzmann(Random random, IEnumerable<double> qs, double beta = 10) {
+    private int SelectBoltzmann(System.Random random, IEnumerable<double> qs, double beta = 10) {
       // select best
 …
+    }
     private int SelectEpsGreedy(Random random, IEnumerable<double> qs, double eps = 0.2) {
+    private int SelectEpsGreedy(System.Random random, IEnumerable<double> qs, double eps = 0.2) {
       if (random.NextDouble() >= eps) { // eps == 0 should be equivalent to pure exploitation, eps == 1 is pure exploration
         // select best
 …
             bestActions.Add(aIdx);
             bestQ = q;
           } else if (q.IsAlmost(bestQ)) {
+          } else if (HeuristicLab.Common.Extensions.IsAlmost(q,bestQ)) {
             bestActions.Add(aIdx);
+          }
 …
+    }
     private int SelectRandom(Random random, IEnumerable<double> qs) {
+    private int SelectRandom(System.Random random, IEnumerable<double> qs) {
       return qs
          .Select((aInfo, idx) => Tuple.Create(aInfo, idx))

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 12893 for branches/HeuristicLab.Problems.GrammaticalOptimization-gkr/HeuristicLab.Algorithms.GrammaticalOptimization/SequentialDecisionPolicies/GenericPolicy.cs

Legend:

branches/HeuristicLab.Problems.GrammaticalOptimization-gkr/HeuristicLab.Algorithms.GrammaticalOptimization/SequentialDecisionPolicies/GenericPolicy.cs

Download in other formats: