Free cookie consent management tool by TermsFeed Policy Generator

Ignore:
Timestamp:
02/11/15 13:06:02 (9 years ago)
Author:
gkronber
Message:

#2283: commit before cleanup after EuroCAST

File:
1 edited

Legend:

Unmodified
Added
Removed
  • branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.GrammaticalOptimization/SequentialDecisionPolicies/GenericFunctionApproximationGrammarPolicy.cs

    r11977 r11980  
    61 61      }
    62 62
    63 
    64      
    65       const double beta = 20;
     63     
     64      /*
     65      const double beta = 10;
    66 66      var w = from idx in Enumerable.Range(0, maxIdx)
    67 67              let afterStateQ = activeAfterStates[idx]
     
    71 71      selectedStateIdx = actionIndexMap[bestAction];
    72 72      Debug.Assert(selectedStateIdx >= 0);
    73      
    74 
    75       /*
    76       if (random.NextDouble() < 0.2) {
     73      */
     74     
     75     
     76      if (random.NextDouble() < 0.5) {
    77 77        selectedStateIdx = actionIndexMap[random.Next(maxIdx)];
    78 78      } else {
     
    91 91        selectedStateIdx = actionIndexMap[bestIdxs[random.Next(bestIdxs.Count)]];
    92 92      }
    93       */
     93     
    94 94      return true;
    95 95    }
     
    140 140      double delta = reward - GetValue(state);
    141 141      // delta /= problem.GetFeatures(state).Count();
    142       //const double alpha = 0.01;
     142      //const double alpha = 0.001;
    143 143      foreach (var feature in problem.GetFeatures(state)) {
    144 144        featureTries[feature.Id] = GetFeatureTries(feature.Id) + 1;
Note: See TracChangeset for help on using the changeset viewer.