Context Navigation

GenericThompsonSamplingPolicy.cs @ 13042

Visit:

Last change on this file since 13042 was 11974, checked in by gkronber, 10 years ago
#2283: eurocast experiments
File size: 1.3 KB

Line
1	using System;
2	using System.Collections.Generic;
3	using System.Diagnostics;
4	using System.Linq;
5	using System.Text;
6	using System.Threading.Tasks;
7	using HeuristicLab.Common;
8
9	namespace HeuristicLab.Algorithms.Bandits.BanditPolicies {
10	public class GenericThompsonSamplingPolicy : IBanditPolicy {
11	private readonly IModel model;
12
13	public GenericThompsonSamplingPolicy(IModel model) {
14	this.model = model;
15	}
16
17	public int SelectAction(Random random, IEnumerable<IBanditPolicyActionInfo> actionInfos) {
18	var myActionInfos = actionInfos.OfType<ModelPolicyActionInfo>();
19	int bestAction = -1;
20	double bestQ = double.NegativeInfinity;
21	var aIdx = -1;
22	foreach (var aInfo in myActionInfos) {
23	aIdx++;
24	var q = aInfo.SampleExpectedReward(random);
25	// very unlikely to be equal and we don't care
26	if (q > bestQ) {
27	bestQ = q;
28	bestAction = aIdx;
29	}
30	}
31	Debug.Assert(bestAction > -1);
32	return bestAction;
33	}
34
35	public IBanditPolicyActionInfo CreateActionInfo() {
36	return new ModelPolicyActionInfo((IModel)model.Clone());
37	}
38
39	public override string ToString() {
40	return string.Format("GenericThompsonSamplingPolicy({0})", model);
41	}
42	}
43	}

Note: See TracBrowser for help on using the repository browser.