C# (CSharp) QAgent.tick 예제들

프로그래밍 언어: C# (CSharp)

클래스/타입: QAgent

메소드/함수: tick

hotexamples.com에서의 예제들: 3

C# (CSharp) QAgent.tick - 3개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 C# (CSharp) QAgent.tick의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

GetAction(4)

tick(3)

GetState(3)

startlearn(3)

UpdateState(3)

Load(3)

Reinitialize(3)

TurnOffExploration(2)

draw_world(2)

Deserialize(2)

TurnOffLearning(2)

Save(2)

Serialize(2)

goveryfast(2)

GetType(2)

goslow(1)

getTickCount(1)

gonormal(1)

stoplearn(1)

gofast(1)

AI_ID(1)

getProcessedItemCount(1)

getAvgReward(1)

getAvgLoss(1)

TurnOnLearning(1)

ToQAction(1)

RewardAgent(1)

GetStateMaxScore(1)

GetQActions(1)

TurnOnExploration(1)

예제 #1

파일 보기

        /// <summary>
        /// Worker loop that keeps running until <c>needToStop</c> is set.
        /// On every pass where <c>paused</c> is false it ticks the agent and refreshes
        /// the UI; it then sleeps for <c>interval</c> before checking again.
        /// </summary>
        private void BackgroundThread()
        {
            while (true)
            {
                // Stop request is checked once per pass, before any work is done.
                if (needToStop)
                {
                    break;
                }

                bool running = !paused;
                if (running)
                {
                    qAgent.tick();
                    UpdateUI(canvas);
                }

                // The sleep happens whether or not the agent was ticked this pass.
                Thread.Sleep(interval);
            }
        }

예제 #2

파일 보기

파일: FormAgent.cs 프로젝트: Jason6583/ParallelDeepReinforcementLearning

        /// <summary>
        /// Worker loop that keeps running until <c>needToStop</c> is set.
        /// While not paused, it reads the reward and punish values from the text boxes,
        /// ticks the agent with them, and refreshes the UI; it then sleeps for
        /// <c>interval</c> before the next pass.
        /// </summary>
        /// <remarks>
        /// The agent is only ticked when both text boxes contain a parsable number.
        /// Empty or malformed input skips the tick for that pass instead of throwing
        /// a <see cref="System.FormatException"/> out of the worker loop.
        /// </remarks>
        private void BackgroundThread()
        {
            while (!needToStop)
            {
                if (!paused)
                {
                    // NOTE(review): txtReward/txtPunish look like UI controls being read from a
                    // worker thread — confirm whether this needs marshalling to the UI thread.
                    double reward;
                    double punish;

                    // pause when all reward items have been found
                    // TryParse reads each text box exactly once and rejects empty or non-numeric
                    // text; short-circuiting keeps tick() from running unless both values parsed.
                    if (double.TryParse(txtReward.Text, out reward)
                        && double.TryParse(txtPunish.Text, out punish)
                        && qAgent.tick(reward, punish) == 1)
                    {
                        paused = true;
                    }
                    UpdateUI(canvas);
                }

                Thread.Sleep(interval);
            }
        }

예제 #3

파일 보기

        /// <summary>
        /// Console entry point. Restores a previously saved agent from <c>qAgentBrainPath</c>
        /// when that file exists, otherwise builds a fresh agent; then starts learning and
        /// ticks the agent forever on a worker thread, saving it back to disk from time to time.
        /// </summary>
        /// <param name="args">Command-line arguments; not used.</param>
        /// <remarks>
        /// The original author tagged this method as broken; the reason is not visible here.
        /// </remarks>
        static void Main(string[] args)  // b r o k e n
        {
            Console.ForegroundColor = ConsoleColor.DarkMagenta;
            if (File.Exists(qAgentBrainPath))
            {
                // SECURITY NOTE: BinaryFormatter deserialization is unsafe on untrusted input
                // (and the type is removed in recent .NET versions). Only load brain files
                // written by this program; consider migrating to a safer serializer.
                using (FileStream fstream = new FileStream(qAgentBrainPath, FileMode.Open, FileAccess.Read, FileShare.Read)) {
                    // Direct cast: a payload of the wrong type fails with InvalidCastException
                    // here rather than a NullReferenceException on the next line.
                    qAgent = (QAgent)new BinaryFormatter().Deserialize(fstream);
                    qAgent.Reinitialize();
                }
                Console.WriteLine("QAgent loaded");
            }
            else
            {
                qAgent = CreateQAgent();
            }
            qAgent.startlearn();
            new Thread(() => {
                while (true)
                {
                    // Save throttle: only persist on iterations where the current millisecond
                    // count happens to be divisible by 31 (the divisor is arbitrary).
                    if (DateTime.Now.Ticks / TimeSpan.TicksPerMillisecond % 31 /*arbitrary*/ == 0)
                    {
                        SaveQAgent();
                    }
                    qAgent.tick();
                }
            }).Start();
        }

        /// <summary>
        /// Builds a new agent backed by a freshly configured <c>DeepQLearn</c> brain:
        /// an input layer, three 96-neuron fully connected relu layers and a regression
        /// output with one neuron per action.
        /// </summary>
        /// <returns>The newly constructed agent.</returns>
        private static QAgent CreateQAgent()
        {
            // NOTE(review): the inherited comments spoke of "9 eyes, each sees 3 numbers" and
            // "5 possible angles", which do not match the values 6 and 3 used here — confirm
            // the intended sensor/action layout against QAgent.
            var num_inputs      = 6;
            var num_actions     = 3;
            var temporal_window = 1; // amount of temporal memory. 0 = agent lives in-the-moment :)
            var network_size    = num_inputs * temporal_window + num_actions * temporal_window + num_inputs;

            // config brain
            // the value function network computes a value of taking any of the possible actions
            // given an input state. Here we specify one explicitly the hard way
            // but user could also equivalently instead use opt.hidden_layer_sizes = [20,20]
            // to just insert simple relu hidden layers.
            var layer_defs = new List<LayerDefinition>
            {
                new LayerDefinition { type = "input", out_sx = 1, out_sy = 1, out_depth = network_size },
                new LayerDefinition { type = "fc", num_neurons = 96, activation = "relu" },
                new LayerDefinition { type = "fc", num_neurons = 96, activation = "relu" },
                new LayerDefinition { type = "fc", num_neurons = 96, activation = "relu" },
                new LayerDefinition { type = "regression", num_neurons = num_actions }
            };

            // options for the Temporal Difference learner that trains the above net
            // by backpropping the temporal difference learning rule.
            Options opt = new Options {
                method = "adadelta", l2_decay = 0.001, batch_size = 10
            };

            TrainingOptions tdtrainer_options = new TrainingOptions
            {
                temporal_window       = temporal_window,
                experience_size       = 30000,
                start_learn_threshold = 1000,
                gamma                 = 0.7,
                learning_steps_total  = 200000,
                learning_steps_burnin = 3000,
                epsilon_min           = 0.05,
                epsilon_test_time     = 0.00,
                layer_defs            = layer_defs,
                options               = opt
            };

            DeepQLearn brain = new DeepQLearn(num_inputs, num_actions, tdtrainer_options);
            return new QAgent(brain);
        }

        /// <summary>
        /// Serializes the current agent to <c>qAgentBrainPath</c>.
        /// The data is written to a sibling ".tmp" file first and then swapped into place,
        /// so an interrupted save does not truncate the previously saved brain file.
        /// </summary>
        private static void SaveQAgent()
        {
            string tempPath = qAgentBrainPath + ".tmp";
            using (FileStream fstream = new FileStream(tempPath, FileMode.Create, FileAccess.Write, FileShare.None))
            {
                new BinaryFormatter().Serialize(fstream, qAgent);
            }

            // File.Replace needs an existing destination; the very first save uses Move instead.
            if (File.Exists(qAgentBrainPath))
            {
                File.Replace(tempPath, qAgentBrainPath, null);
            }
            else
            {
                File.Move(tempPath, qAgentBrainPath);
            }
        }