/// <summary>
/// Builds the description of this environment: a nine-dimensional state space,
/// a one-dimensional integer action space and a reward dimension.
/// </summary>
/// <returns>A newly constructed environment description.</returns>
public override Core.EnvironmentDescription<double, int> GetEnvironmentDescription()
{
    // Two nine-element vectors handed to the state space description.
    // NOTE(review): presumably per-dimension minimum and maximum values - confirm
    // against the Core.SpaceDescription constructor.
    double[] stateLow = { 0.0, 0.0, -1.0, -1.0, 0.0, 0.0, 0.0, 0.0, 0.0 };
    double[] stateHigh = { 10.0, 10.0, 1.0, 1.0, 20.0, 10.0, 100.0, 3.17, 3.17 };

    Core.SpaceDescription<double> stateSpace =
        new Core.SpaceDescription<double>(stateLow, stateHigh);

    // Single integer action dimension described by the pair (0, 3).
    Core.SpaceDescription<int> actionSpace =
        Core.SpaceDescription<int>.CreateOneDimensionalSpaceDescription(0, 3);

    // Reward dimension described by the pair (-5, 10).
    Core.DimensionDescription<double> rewardRange =
        new Core.DimensionDescription<double>(-5, 10);

    // NOTE(review): the trailing 0.9 looks like a discount factor - confirm.
    return new Core.EnvironmentDescription<double, int>(
        stateSpace,
        actionSpace,
        rewardRange,
        0.9);
}
/// <summary>
/// Builds the description of this environment: a two-dimensional state space
/// (position, velocity), a one-dimensional integer action space and a reward
/// dimension.
/// </summary>
/// <returns>A newly constructed environment description.</returns>
public override Core.EnvironmentDescription<double, int> GetEnvironmentDescription()
{
    // Position/velocity limits taken from the members declared on this class.
    var lowerLimits = new[] { MinPosition, minVelocity };
    var upperLimits = new[] { MaxPosition, maxVelocity };

    // Midpoint of each dimension's limits.
    var midpoints = new[]
    {
        (MinPosition + MaxPosition) / 2,
        (minVelocity + maxVelocity) / 2
    };

    // NOTE(review): fourth constructor argument; presumably a per-dimension
    // spread/standard deviation - confirm against Core.SpaceDescription.
    var spreads = new[] { 0.1, 0.1 };

    var states = new Core.SpaceDescription<double>(
        lowerLimits,
        upperLimits,
        midpoints,
        spreads);

    // One integer action dimension described by the pair (0, 2).
    var actions = new Core.SpaceDescription<int>(new[] { 0 }, new[] { 2 });

    // Reward dimension described by the pair (-1, 0).
    var rewards = new Core.DimensionDescription<double>(-1, 0);

    // NOTE(review): the trailing 0.9 looks like a discount factor - confirm.
    return new Core.EnvironmentDescription<double, int>(states, actions, rewards, 0.9);
}
/// <summary>
/// Builds the description of this environment: a four-dimensional state space,
/// a one-dimensional integer action space and a reward dimension.
/// </summary>
/// <returns>A newly constructed environment description.</returns>
public override Core.EnvironmentDescription<double, int> GetEnvironmentDescription()
{
    // The whole description is assembled in one expression; the arguments are
    // constant literals, so no intermediate locals are needed.
    // NOTE(review): the four state arrays are presumably minimum, maximum,
    // average and standard deviation per dimension, and 0.95 a discount
    // factor - confirm against the Core constructors.
    return new Core.EnvironmentDescription<double, int>(
        new Core.SpaceDescription<double>(
            new[] { 0.0, 0.0, -1.0, -1.0 },
            new[] { 1.0, 1.0, 1.0, 1.0 },
            new[] { 0.5, 0.5, 0.0, 0.0 },
            new[] { 0.1, 0.1, 0.1, 0.1 }),
        // One integer action dimension described by the pair (0, 3).
        new Core.SpaceDescription<int>(
            new[] { 0 },
            new[] { 3 }),
        // Reward dimension described by the pair (-5, 10000).
        new Core.DimensionDescription<double>(-5, 10000),
        0.95);
}
/// <summary>
/// Builds the description of this environment: an eight-dimensional state
/// space given by an average state and a standard deviation per dimension,
/// a one-dimensional real-valued action space and a reward dimension.
/// </summary>
/// <returns>A newly constructed environment description.</returns>
public override Core.EnvironmentDescription<double, double> GetEnvironmentDescription()
{
    // Average state: eight zeros (a freshly allocated double[] is all 0.0).
    double[] stateMean = new double[8];

    // Standard deviation for each of the eight state dimensions.
    double[] stateDeviation = { 2, 0.1, 0.1, 0.1, 1, 1, 1, 1 };

    // The first two constructor arguments are deliberately passed as null here.
    var states = new Core.SpaceDescription<double>(null, null, stateMean, stateDeviation);

    // Single action dimension described by the pair (-10, 10).
    var actions = Core.SpaceDescription<double>.CreateOneDimensionalSpaceDescription(-10, 10);

    // Reinforcement (reward) dimension described by the pair (-4, 4).
    var reinforcement = new Core.DimensionDescription<double>(-4, 4);

    // NOTE(review): the trailing 0.9 looks like a discount factor - confirm.
    return new Core.EnvironmentDescription<double, double>(
        states,
        actions,
        reinforcement,
        0.9);
}