- Timestamp: 02/17/15 16:04:58 (10 years ago)
- File: 1 edited
Legend:
- Unmodified
- Added
- Removed
-
branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.GrammaticalOptimization/SequentialDecisionPolicies/GenericFunctionApproximationGrammarPolicy.cs
r11981  r12026
   129     129        double delta = reward - GetValue(state);
   130     130        foreach (var feature in problem.GetFeatures(state)) {
   131            -     featureTries[feature.Id] = GetFeatureTries(feature.Id) + 1;
   132            -     Debug.Assert(GetFeatureTries(feature.Id) >= 1);
   133            -     double alpha = 1.0 / GetFeatureTries(feature.Id);
   134            -     alpha = Math.Max(alpha, 0.001);
           131    +     //featureTries[feature.Id] = GetFeatureTries(feature.Id) + 1;
           132    +     //Debug.Assert(GetFeatureTries(feature.Id) >= 1);
           133    +     //double alpha = 1.0 / GetFeatureTries(feature.Id);
           134    +     //alpha = Math.Max(alpha, 0.001);
           135    +     var alpha = 0.01;
   135     136
   136     137          double w;
Note: See TracChangeset for help on using the changeset viewer.