/// <summary>
/// Feeds the learning agent with the world's current state and the
/// reward value currently reported by <c>CurrentReward()</c>.
/// </summary>
/// <param name="world">World whose state is sampled via <c>GetState()</c>.</param>
public override void Learn(GridWorld world)
{
    // Sample the state first, then the reward, so the order of the
    // calls matches what the agent is handed below.
    float[] observedState = world.GetState();
    float observedReward = CurrentReward();

    learningAgent.Learn(observedState, observedReward);
}
/// <summary>
/// Chooses the next action: applies a reward of -1, asks the learning
/// agent for an action index given the world's current state, and maps
/// that index to a <c>WorldAction</c> via <c>IndexToAction</c>.
/// </summary>
/// <param name="world">World whose state is sampled via <c>GetState()</c>.</param>
/// <returns>The action corresponding to the index picked by the learning agent.</returns>
public override WorldAction Process(GridWorld world)
{
    // NOTE(review): presumably a fixed per-step penalty - confirm against Reward().
    Reward(-1);

    float[] observedState = world.GetState();
    int actionIndex = learningAgent.Process(observedState);

    return IndexToAction(actionIndex);
}