Context Navigation

GenericFunctionApproximationGrammarPolicy.cs

Timestamp:

02/11/15 20:11:35 (10 years ago)

Author:

gkronber

Message:

#2283: cleaned up the code and included the HeuristicLab DLLs to create a self-contained branch

File:

-                      r11980
+                      r11981
         originalIdx++;
+      }
-      /*
-      const double beta = 10;
-      var w = from idx in Enumerable.Range(0, maxIdx)
-              let afterStateQ = activeAfterStates[idx]
-              select Math.Exp(beta * afterStateQ);
-      var bestAction = Enumerable.Range(0, maxIdx).SampleProportional(random, w);
-      selectedStateIdx = actionIndexMap[bestAction];
-      Debug.Assert(selectedStateIdx >= 0);
-      */
+      if (random.NextDouble() < 0.5) {
+      // TODO: policy should be a parameter of the function approximation policy
+      if (random.NextDouble() < 0.2) {
         selectedStateIdx = actionIndexMap[random.Next(maxIdx)];
       } else {
 …
     private void UpdateWeights(string state, double reward) {
       double delta = reward - GetValue(state);
-      // delta /= problem.GetFeatures(state).Count();
-      //const double alpha = 0.001;
       foreach (var feature in problem.GetFeatures(state)) {
         featureTries[feature.Id] = GetFeatureTries(feature.Id) + 1;

Note: See TracChangeset for help on using the changeset viewer.