Changeset 11850 for branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.GrammaticalOptimization/ISequentialDecisionPolicy.cs
- Timestamp: 02/01/15 20:14:38 (10 years ago)
- File: 1 moved
Legend:
- Unmodified
- Added
- Removed
-
branches/HeuristicLab.Problems.GrammaticalOptimization/HeuristicLab.Algorithms.GrammaticalOptimization/ISequentialDecisionPolicy.cs
r11849 r11850
11 11   // here we assume that a reward is only received at the end of the episode and the update is done only after an episode is complete
12 12   // we also assume that the policy can fail to select one of the followStates
13    - public interface IPolicy<in TState> {
   13 + public interface ISequentialDecisionPolicy<in TState> {
14 14     bool TrySelect(Random random, TState curState, IEnumerable<TState> afterStates, out int selectedStateIdx); // selectedState \in afterStates
15 15
Note: See TracChangeset for help on using the changeset viewer.