Free cookie consent management tool by TermsFeed Policy Generator

Ignore:
Timestamp:
01/10/16 17:13:27 (9 years ago)
Author:
aballeit
Message:

#2283 UCT parameter c

File:
1 edited

Legend:

Unmodified
Added
Removed
  • branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.Bandits/Policies/UCTPolicy.cs

    r12503 r13492
    12 12    private readonly double c;
    13 13
    14       public UCTPolicy(double c = 1.0) {
       14      // c = sqrt(2)
       15    public UCTPolicy(double c = 1.41421356237)
       16    {
    15 17      this.c = c;
    16 18    }
     
    30 32          q = double.PositiveInfinity;
    31 33        } else {
    32             q = aInfo.SumReward / aInfo.Tries + 2.0 * c * Math.Sqrt(Math.Log(totalTries) / aInfo.Tries);
       34          q = aInfo.SumReward / aInfo.Tries + c * Math.Sqrt(Math.Log(totalTries) / aInfo.Tries);
    33 35        }
    34 36        if (q > bestQ) {
Note: See TracChangeset for help on using the changeset viewer.