Changeset 11730 for branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.Bandits/Policies/EpsGreedyPolicy.cs
- Timestamp:
- 01/02/15 16:08:21 (10 years ago)
- File:
-
- 1 edited
Legend:
- Unmodified
- Added
- Removed
-
branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.Bandits/Policies/EpsGreedyPolicy.cs
r11727 r11730
  27   27          if (random.NextDouble() > eps) {
  28   28            // select best
  29      -          var maxReward= double.NegativeInfinity;
       29 +          var bestQ = double.NegativeInfinity;
  30   30            int bestAction = -1;
  31   31            foreach (var a in Actions) {
  32   32              if (tries[a] == 0) return a;
  33      -            var avgReward= sumReward[a] / tries[a];
  34      -            if ( maxReward < avgReward) {
  35      -              maxReward = avgReward;
       33 +            var q = sumReward[a] / tries[a];
       34 +            if (bestQ < q) {
       35 +              bestQ = q;
  36   36                bestAction = a;
  37   37              }
   …    …
  65   65          Array.Clear(sumReward, 0, sumReward.Length);
  66   66        }
       67 +      public override void PrintStats() {
       68 +        for (int i = 0; i < sumReward.Length; i++) {
       69 +          if (tries[i] >= 0) {
       70 +            Console.Write(" {0,5:F2} {1}", sumReward[i] / tries[i], tries[i]);
       71 +          } else {
       72 +            Console.Write("-", "");
       73 +          }
       74 +        }
       75 +        Console.WriteLine();
       76 +      }
       77 +      public override string ToString() {
       78 +        return string.Format("EpsGreedyPolicy({0:F2})", eps);
       79 +      }
  67   80      }
  68   81    }
Note: See TracChangeset for help on using the changeset viewer.