C# (CSharp) AIXI Agent.GeneratePerceptAndUpdateの例

プログラミング言語: C# (CSharp)

名前空間/パッケージ名: AIXI

クラス/型: Agent

メソッド/関数: GeneratePerceptAndUpdate

hotexamples.comのコード掲載数: 2

C# (CSharp) AIXI Agent.GeneratePerceptAndUpdate - 2件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたC# (CSharp)のAIXI.Agent.GeneratePerceptAndUpdateの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

ModelUpdateAction(2)

AverageReward(1)

GeneratePerceptAndUpdate(1)

GenerateRandomAction(1)

MaximumReward(1)

ModelSize(1)

ModelUpdatePercept(1)

Playout(1)

Search(1)

GeneratePerceptAndUpdate() public abstract method

public abstract GeneratePerceptAndUpdate ( ) : Tuple<int, int>
return	Tuple<int, int>

Agent Class Documentation

コード例 #1

ファイルを表示

        /// <summary>
        /// Samples one path through the search tree starting at this node, folds the
        /// sampled reward into this node's running <c>Mean</c> and increments <c>Visits</c>.
        /// </summary>
        /// <param name="agent">
        /// Agent used to generate percepts (<c>GeneratePerceptAndUpdate</c>), to record the
        /// selected action (<c>ModelUpdateAction</c>) and to run playouts (<c>Playout</c>).
        /// </param>
        /// <param name="horizon">
        /// Remaining search depth. When it is 0 the method returns immediately and leaves
        /// this node's <c>Mean</c> and <c>Visits</c> untouched.
        /// </param>
        /// <returns>
        /// The reward sampled along the path; 0 when <paramref name="horizon"/> is 0.
        /// </returns>
        public double Sample(Agent agent, int horizon)
        {
            // Guard: nothing left to sample, and node statistics are deliberately not updated.
            if (horizon == 0)
            {
                return 0.0;
            }

            double reward;

            if (this.Type == ChanceNode)
            {
                var percept      = agent.GeneratePerceptAndUpdate();
                int observation  = percept.Item1;
                int randomReward = percept.Item2;

                // Single lookup; a previously unseen observation becomes a new decision node.
                MonteCarloSearchNode observationChild;
                if (!this.Children.TryGetValue(observation, out observationChild))
                {
                    observationChild           = new MonteCarloSearchNode(DecisionNode);
                    this.Children[observation] = observationChild;
                }

                // The horizon is decremented only here, once per generated percept.
                reward = randomReward + observationChild.Sample(agent, horizon - 1);
            }
            else if (this.Visits == 0) // unvisited decision node or we have exceeded maximum tree depth
            {
                reward = agent.Playout(horizon);
            }
            else // previously visited decision node
            {
                int action = this.SelectAction(agent);

                agent.ModelUpdateAction(action);

                // Single lookup; a previously untried action becomes a new chance node.
                MonteCarloSearchNode actionChild;
                if (!this.Children.TryGetValue(action, out actionChild))
                {
                    actionChild           = new MonteCarloSearchNode(ChanceNode);
                    this.Children[action] = actionChild;
                }

                // The horizon is passed through unchanged; the chance-node branch performs the
                // decrement. NOTE(review): the original author was unsure whether this should
                // be horizon - 1 -- confirm against the pyaixi reference implementation.
                reward = actionChild.Sample(agent, horizon);
            }

            // Incremental mean: fold the new sample into the average of the previous visits.
            double visitsDouble = this.Visits;

            this.Mean   = (reward + (visitsDouble * this.Mean)) / (1.0 + visitsDouble);
            this.Visits = this.Visits + 1;

            return reward;
        }

コード例 #2

ファイルを表示

ファイル: MonteCarloSearchTree.cs プロジェクト: GoodAI/SummerCamp

        /// <summary>
        /// Draws one sample path through the search tree rooted at this node and updates
        /// this node's running <c>Mean</c> and <c>Visits</c> with the sampled reward.
        /// </summary>
        /// <param name="agent">
        /// Agent that supplies percepts (<c>GeneratePerceptAndUpdate</c>), receives the chosen
        /// action (<c>ModelUpdateAction</c>) and performs playouts (<c>Playout</c>).
        /// </param>
        /// <param name="horizon">
        /// Remaining search depth. A value of 0 returns immediately without changing
        /// <c>Mean</c> or <c>Visits</c>.
        /// </param>
        /// <returns>
        /// The sampled reward for this path; 0 when <paramref name="horizon"/> is 0.
        /// </returns>
        public double Sample(Agent agent, int horizon)
        {
            // Depth exhausted: return before any statistics are touched.
            if (horizon == 0) {
                return 0.0;
            }

            double reward;

            if (this.Type == ChanceNode) {
                var percept = agent.GeneratePerceptAndUpdate();
                int observation = percept.Item1;
                int randomReward = percept.Item2;

                // One dictionary lookup; an unseen observation is added as a decision node.
                MonteCarloSearchNode observationChild;
                if (!this.Children.TryGetValue(observation, out observationChild)) {
                    observationChild = new MonteCarloSearchNode(DecisionNode);
                    this.Children[observation] = observationChild;
                }

                // This is the only branch that decrements the horizon.
                reward = randomReward + observationChild.Sample(agent, horizon - 1);
            }
            else if (this.Visits == 0) { // unvisited decision node or we have exceeded maximum tree depth
                reward = agent.Playout(horizon);
            }
            else { // previously visited decision node
                int action = this.SelectAction(agent);

                agent.ModelUpdateAction(action);

                // One dictionary lookup; an untried action is added as a chance node.
                MonteCarloSearchNode actionChild;
                if (!this.Children.TryGetValue(action, out actionChild)) {
                    actionChild = new MonteCarloSearchNode(ChanceNode);
                    this.Children[action] = actionChild;
                }

                // Horizon is forwarded as-is; the chance-node branch does the decrement.
                // NOTE(review): the original author was unsure whether this should be
                // horizon - 1 -- confirm against the pyaixi reference implementation.
                reward = actionChild.Sample(agent, horizon);
            }

            // Incremental mean over all visits, including this one.
            double visitsDouble = this.Visits;
            this.Mean = (reward + (visitsDouble * this.Mean)) / (1.0 + visitsDouble);
            this.Visits = this.Visits + 1;

            return reward;
        }