/// <summary>
/// Creates the environment: registers the valid action, observation and reward
/// values from their enums, lets the base class run <c>fill_out_bits</c>, and
/// draws a random initial observation with a reward of zero.
/// </summary>
/// <param name="options">
/// Configuration entries, forwarded unchanged to the base constructor. This
/// constructor does not read them itself.
/// </param>
public CheeseMazeEnvironment(Dictionary<string, string> options)
    : base(options)
{
    // The three valid-value sets are taken directly from the enum definitions.
    ValidActions = (int[])Enum.GetValues(typeof(ActionsEnum));
    ValidObservations = (int[])Enum.GetValues(typeof(ObservationsEnum));
    ValidRewards = (int[])Enum.GetValues(typeof(RewardEnum));

    // Invoked only after the sets above are assigned (presumably it derives
    // bit widths from them - confirm against the base class).
    base.fill_out_bits();

    // TODO: read the probability from options; for now the default is always used.
    _probability = _defaultProbability;
    Debug.Assert(_probability >= 0 && _probability <= 1, "probability is set outside [0,1]");

    // Initial observation: OHead when the random draw falls below the
    // probability, OTail otherwise.
    // NOTE(review): OHead/OTail read like coin-flip names inside a cheese-maze
    // environment - confirm this initialisation is intended here.
    Observation = _rnd.NextDouble() < _probability ? OHead : OTail;

    Reward = 0;
}