Context Navigation

UCTPolicy.cs

Timestamp:

01/10/16 17:13:27 (9 years ago)

Author:

aballeit

Message:

#2283 UCT parameter c

File:

-                      r12503
+                      r13492
     private readonly double c;
-    public UCTPolicy(double c = 1.0) {
+      // c = sqrt(2)
+    public UCTPolicy(double c = 1.41421356237)
+    {
       this.c = c;
+    }
 …
           q = double.PositiveInfinity;
         } else {
-            q = aInfo.SumReward / aInfo.Tries + 2.0 * c * Math.Sqrt(Math.Log(totalTries) / aInfo.Tries);
+            q = aInfo.SumReward / aInfo.Tries + c * Math.Sqrt(Math.Log(totalTries) / aInfo.Tries);
+        }
         if (q > bestQ) {

Note: See TracChangeset for help on using the changeset viewer.