Beispiel #1
0
        // Checks that ValueEstimateApplier.Apply copies the entries of a 2x1
        // tensor (0.5 and 8) into the action values of the first two agents.
        public void ApplyValueEstimate()
        {
            // Arrange: a 2x1 tensor holding the two values the test reads back.
            var inputTensor = new TensorProxy()
            {
                shape = new long[] { 2, 1 },
                data  = new Tensor(2, 1, new[] { 0.5f, 8f })
            };
            var agentInfos = GetFakeAgentInfos();
            var applier = new ValueEstimateApplier();

            // Act
            applier.Apply(inputTensor, agentInfos);

            // Assert: expected value goes first so a failure message reports
            // "expected"/"actual" the right way round (NUnit-style Assert assumed).
            var agent = agentInfos[0] as TestAgent;
            Assert.NotNull(agent);
            Assert.AreEqual(0.5f, agent.GetAction().value);

            agent = agentInfos[1] as TestAgent;
            Assert.NotNull(agent);
            // Float literal keeps both sides of the comparison the same type.
            Assert.AreEqual(8f, agent.GetAction().value);
        }
Beispiel #2
0
        // Checks that ValueEstimateApplier.Apply copies the entries of a 2x1
        // tensor (0.5 and 8) into the action values of the first two agents.
        public void ApplyValueEstimate()
        {
            // Arrange: a 2x1 tensor holding the two values the test reads back.
            var inputTensor = new Tensor()
            {
                Shape = new long[] { 2, 1 },
                Data  = new float[, ] {
                    { 0.5f }, { 8f }
                }
            };
            var agentInfos = GetFakeAgentInfos();
            var applier = new ValueEstimateApplier();

            // Act
            applier.Apply(inputTensor, agentInfos);

            // NOTE(review): this relies on the enumeration order of
            // agentInfos.Keys matching the tensor row order - confirm that the
            // collection returned by GetFakeAgentInfos guarantees it.
            var agents = agentInfos.Keys.ToList();

            // Assert: guard each "as" cast so a wrong key type fails with a
            // clear assertion instead of a NullReferenceException. Expected
            // value goes first (NUnit-style Assert assumed).
            var agent = agents[0] as TestAgent;
            Assert.NotNull(agent);
            Assert.AreEqual(0.5f, agent.GetAction().value);

            agent = agents[1] as TestAgent;
            Assert.NotNull(agent);
            // Float literal keeps both sides of the comparison the same type.
            Assert.AreEqual(8f, agent.GetAction().value);
        }