예제 #1
0
        /// <summary>
        /// Constructs an A3C instance. The optimizer, network and gamma are handed to the base
        /// constructor; this constructor then prepares a second network/optimizer pair
        /// (<c>_thNetwork</c>, <c>_thOptimizer</c>), the async unit and the stack.
        /// </summary>
        /// <param name="p_optimizer">Forwarded unchanged to the base constructor.</param>
        /// <param name="p_network">
        /// Forwarded to the base constructor, and also passed through
        /// <c>IOUtils.SaveNetwork</c> / <c>IOUtils.LoadNetwork</c> to produce <c>_thNetwork</c>.
        /// </param>
        /// <param name="p_gamma">
        /// Forwarded unchanged to the base constructor (presumably the discount factor; confirm
        /// against the base class).
        /// </param>
        /// <param name="p_asynchUpdate">Passed to <c>AsyncUnit.Init</c>.</param>
        public A3C(
            Optimizer p_optimizer,
            NeuralNetwork p_network,
            float p_gamma,
            int p_asynchUpdate)
            : base(p_optimizer, p_network, p_gamma)
        {
            // Save the supplied network and load it back; presumably this yields an
            // independent copy of p_network (depends on IOUtils; verify).
            var savedNetwork = IOUtils.SaveNetwork(p_network);
            _thNetwork = IOUtils.LoadNetwork(savedNetwork);

            // The second optimizer is always an ADAM bound to _thNetwork,
            // whatever kind of optimizer was passed in as p_optimizer.
            _thOptimizer = new ADAM(_thNetwork);

            // The async unit is created and initialised before asynch mode is
            // switched on for the second optimizer.
            _asyncUnit = new AsyncUnit();
            _asyncUnit.Init(p_asynchUpdate);

            _thOptimizer.InitAsynchMode(true);

            _stack = new Stack();
        }
예제 #2
0
        /// <summary>
        /// Constructs an AsyncQLearning instance: stores the supplied optimizer, both networks
        /// and gamma, creates and initialises the async unit, then enables asynch mode on the
        /// optimizer.
        /// </summary>
        /// <param name="p_optimizer">Stored in <c>_optimizer</c>; <c>InitAsynchMode(true)</c> is called on it.</param>
        /// <param name="p_networkQ">Stored in <c>_networkQ</c>.</param>
        /// <param name="p_networkQt">
        /// Stored in <c>_networkQt</c> (presumably the target network; confirm against its usage).
        /// </param>
        /// <param name="p_gamma">
        /// Stored in <c>_gamma</c> (presumably the discount factor; confirm against its usage).
        /// </param>
        /// <param name="p_asynchUpdate">Passed to <c>AsyncUnit.Init</c>.</param>
        public AsyncQLearning(
            Optimizer p_optimizer,
            NeuralNetwork p_networkQ,
            NeuralNetwork p_networkQt,
            float p_gamma,
            int p_asynchUpdate)
        {
            // Plain captures of the constructor arguments.
            _gamma = p_gamma;
            _networkQ = p_networkQ;
            _networkQt = p_networkQt;
            _optimizer = p_optimizer;

            // The async unit is created and initialised before asynch mode is
            // switched on for the optimizer.
            _asyncUnit = new AsyncUnit();
            _asyncUnit.Init(p_asynchUpdate);

            _optimizer.InitAsynchMode(true);
        }