Context Navigation

IPolicy.cs @ 11744

Visit:

Last change on this file since 11744 was 11744, checked in by gkronber, 9 years ago
#2283 worked on TD, and models for MCTS
File size: 805 bytes

Rev	Line
[11744]	1	using System;
	2	using System.Collections.Generic;
	3	using System.Linq;
	4	using System.Text;
	5	using System.Threading.Tasks;
	6	using HeuristicLab.Problems.GrammaticalOptimization;
	7
	8	namespace HeuristicLab.Algorithms.Bandits {
	/// <summary>
	/// Represents a policy for reinforcement learning.
	/// </summary>
	/// <typeparam name="TState">Type of the states the policy is queried with (contravariant).</typeparam>
	/// <typeparam name="TAction">Type of the actions the policy chooses among.</typeparam>
	public interface IPolicy<in TState, TAction> {
		/// <summary>
		/// Chooses one action for the given state.
		/// </summary>
		/// <param name="random">Random number generator supplied by the caller.</param>
		/// <param name="state">State for which an action is requested.</param>
		/// <param name="actions">Candidate actions handed to the policy.</param>
		/// <returns>The selected action.</returns>
		TAction SelectAction(Random random, TState state, IEnumerable<TAction> actions);

		/// <summary>
		/// Reports the reward received after taking <paramref name="action"/> in
		/// <paramref name="state"/> and arriving in <paramref name="newState"/>.
		/// </summary>
		/// <param name="state">State in which the action was taken.</param>
		/// <param name="action">Action that was taken.</param>
		/// <param name="reward">Reward that was received.</param>
		/// <param name="newState">State reached after taking the action.</param>
		void UpdateReward(TState state, TAction action, double reward, TState newState);

		/// <summary>
		/// Intended for deterministic MDPs with deterministic rewards where the goal
		/// is to find a state with maximal reward.
		/// </summary>
		/// <param name="state">State to query.</param>
		/// <returns>
		/// A flag for the given state; presumably <c>true</c> means nothing is left
		/// to explore from that state (the exact meaning is up to the implementation).
		/// </returns>
		bool Done(TState state);
	}
	15
	/// <summary>
	/// Policy whose state type and action type are both <see cref="ReadonlySequence"/>.
	/// Declares no members of its own beyond those inherited from
	/// <see cref="IPolicy{TState, TAction}"/>.
	/// </summary>
	public interface IGrammarPolicy : IPolicy<ReadonlySequence, ReadonlySequence> { }
	19	}

Note: See TracBrowser for help on using the repository browser.