/// <summary>
/// Handles an environment-step request: reads an action from the RL-Glue
/// connection, passes it to <c>environment.EnvironmentStep</c>, and writes
/// the resulting terminal flag, reward and observation back to the connection.
/// </summary>
protected internal virtual void onEnvStep()
{
    // Read the action sent by the peer and advance the environment with it.
    Action receivedAction = rlGlueConnection.Receive().Action();
    RewardObservationTerminal stepResult = environment.EnvironmentStep(receivedAction);

    rlGlueConnection
        .Send()
        // Reply is tagged with the EnvironmentStep connection state.
        .State(RlGlueConnection.ConnectionState.EnvironmentStep)
        .And()
        // Size section: state + integer + double + observation.
        // NOTE(review): presumably this is the byte length of the payload
        // written below (terminal, reward, observation) - confirm against
        // the connection builder.
        .SizeOfState()
        .AndSizeOfInteger()
        .AndSizeOfDouble()
        .AndSizeOfObservation(stepResult.Observation)
        .And()
        // Payload, in the order the original sends it.
        .Terminal(stepResult.Terminal)
        .And()
        .Double(stepResult.Reward)
        .And()
        .Observation(stepResult.Observation)
        .Flush();
}
/// <summary>
/// Handles an agent-initialisation request: reads a string from the RL-Glue
/// connection, hands it to <c>agent.AgentInit</c>, and then replies with the
/// AgentInitialize connection state.
/// </summary>
protected internal virtual void onAgentInit()
{
    // The string read here is forwarded unchanged to the agent.
    string receivedTaskSpec;
    rlGlueConnection
        .Receive()
        .String(out receivedTaskSpec);

    agent.AgentInit(receivedTaskSpec);

    // Acknowledge: state tag followed by the size-of-state entry, no payload.
    rlGlueConnection
        .Send()
        .State(RlGlueConnection.ConnectionState.AgentInitialize)
        .And()
        .SizeOfState()
        .Flush();
}
/// <summary>
/// Sends the RLInit connection state, checks via
/// <c>ReceiveAndVerifyState</c> that the reply carries the same state, and
/// then reads a string from the connection.
/// </summary>
/// <returns>
/// The string received from the connection after the RLInit state has been
/// verified.
/// </returns>
public virtual string RLInit()
{
    // Request: state tag followed by the size-of-state entry, no payload.
    rlGlueConnection
        .Send()
        .State(RlGlueConnection.ConnectionState.RLInit)
        .And()
        .SizeOfState()
        .Flush();

    // The reply must carry the RLInit state before its string is read.
    ReceiveAndVerifyState(RlGlueConnection.ConnectionState.RLInit);

    string initResponse = rlGlueConnection.Receive().String();
    return initResponse;
}