Beispiel #1
0
        /// <summary>
        /// Builds the description of this environment: a nine-dimensional state space of
        /// doubles, a one-dimensional integer action space, and a reward dimension.
        /// </summary>
        /// <returns>
        /// A new <c>Core.EnvironmentDescription&lt;double, int&gt;</c> assembled from the
        /// state, action and reward descriptions created here.
        /// </returns>
        public override Core.EnvironmentDescription<double, int> GetEnvironmentDescription()
        {
            // NOTE(review): the two arrays are presumably per-dimension lower and upper
            // bounds of the state space — confirm against Core.SpaceDescription.
            var stateLower = new[] { 0.0, 0.0, -1.0, -1.0, 0.0, 0.0, 0.0, 0.0, 0.0 };
            var stateUpper = new[] { 10.0, 10.0, 1.0, 1.0, 20.0, 10.0, 100.0, 3.17, 3.17 };
            var states = new Core.SpaceDescription<double>(stateLower, stateUpper);

            var actions = Core.SpaceDescription<int>.CreateOneDimensionalSpaceDescription(0, 3);

            // NOTE(review): presumably the minimum and maximum reward — confirm.
            var rewards = new Core.DimensionDescription<double>(-5, 10);

            // NOTE(review): the trailing 0.9 looks like a discount factor — confirm
            // against the Core.EnvironmentDescription constructor.
            return new Core.EnvironmentDescription<double, int>(states, actions, rewards, 0.9);
        }
        /// <summary>
        /// Builds the description of this environment from the position and velocity limits
        /// (<c>MinPosition</c>/<c>MaxPosition</c>, <c>minVelocity</c>/<c>maxVelocity</c>),
        /// a one-dimensional integer action space, and a reinforcement dimension.
        /// </summary>
        /// <returns>
        /// A new <c>Core.EnvironmentDescription&lt;double, int&gt;</c> assembled from the
        /// state, action and reinforcement descriptions created here.
        /// </returns>
        public override Core.EnvironmentDescription<double, int> GetEnvironmentDescription()
        {
            // Per-dimension arrays, ordered as { position, velocity }.
            var lowerLimits = new[] { MinPosition, minVelocity };
            var upperLimits = new[] { MaxPosition, maxVelocity };

            // Midpoint of each [min, max] interval.
            var midpoints = new[] { (MinPosition + MaxPosition) / 2, (minVelocity + maxVelocity) / 2 };

            // NOTE(review): the fourth array is presumably a per-dimension standard
            // deviation / scale — confirm against Core.SpaceDescription.
            var spreads = new[] { 0.1, 0.1 };

            var states = new Core.SpaceDescription<double>(lowerLimits, upperLimits, midpoints, spreads);
            var actions = new Core.SpaceDescription<int>(new[] { 0 }, new[] { 2 });
            var reinforcement = new Core.DimensionDescription<double>(-1, 0);

            // NOTE(review): the trailing 0.9 looks like a discount factor — confirm.
            return new Core.EnvironmentDescription<double, int>(states, actions, reinforcement, 0.9);
        }
Beispiel #3
0
        /// <summary>
        /// Builds the description of this environment: a four-dimensional state space of
        /// doubles, a one-dimensional integer action space, and a reinforcement dimension.
        /// </summary>
        /// <returns>
        /// A new <c>Core.EnvironmentDescription&lt;double, int&gt;</c> assembled from the
        /// state, action and reinforcement descriptions created here.
        /// </returns>
        public override Core.EnvironmentDescription<double, int> GetEnvironmentDescription()
        {
            // NOTE(review): the four arrays are presumably per-dimension minimum, maximum,
            // average and standard deviation — confirm against Core.SpaceDescription.
            var stateFirst = new[] { 0.0, 0.0, -1.0, -1.0 };
            var stateSecond = new[] { 1.0, 1.0, 1.0, 1.0 };
            var stateThird = new[] { 0.5, 0.5, 0.0, 0.0 };
            var stateFourth = new[] { 0.1, 0.1, 0.1, 0.1 };
            var states = new Core.SpaceDescription<double>(stateFirst, stateSecond, stateThird, stateFourth);

            var actions = new Core.SpaceDescription<int>(new[] { 0 }, new[] { 3 });
            var reinforcement = new Core.DimensionDescription<double>(-5, 10000);

            // NOTE(review): the trailing 0.95 looks like a discount factor — confirm.
            return new Core.EnvironmentDescription<double, int>(states, actions, reinforcement, 0.95);
        }
        /// <summary>
        /// Builds the description of this environment: an eight-dimensional state space
        /// described only by an average and a standard deviation per dimension, a
        /// one-dimensional action space of doubles, and a reinforcement dimension.
        /// </summary>
        /// <returns>
        /// A new <c>Core.EnvironmentDescription&lt;double, double&gt;</c> assembled from the
        /// state, action and reinforcement descriptions created here.
        /// </returns>
        public override Core.EnvironmentDescription<double, double> GetEnvironmentDescription()
        {
            // Eight zeros: a freshly allocated double[] is default-initialized to 0.0.
            var averageState = new double[8];
            var standardDeviation = new double[] { 2, 0.1, 0.1, 0.1, 1, 1, 1, 1 };

            // The first two constructor arguments are passed as null.
            // NOTE(review): presumably these are the min/max bound arrays, i.e. the state
            // space is left unbounded — confirm against Core.SpaceDescription.
            var states = new Core.SpaceDescription<double>(null, null, averageState, standardDeviation);
            var actions = Core.SpaceDescription<double>.CreateOneDimensionalSpaceDescription(-10, 10);
            var reinforcement = new Core.DimensionDescription<double>(-4, 4);

            // NOTE(review): the trailing 0.9 looks like a discount factor — confirm.
            return new Core.EnvironmentDescription<double, double>(states, actions, reinforcement, 0.9);
        }