C# (CSharp) SparseMatrix.getStateList Examples

Programming Language: C# (CSharp)

Class/Type: SparseMatrix

Method/Function: getStateList

Examples at hotexamples.com: 2

C# (CSharp) SparseMatrix.getStateList - 2 examples found. These are the top rated real world C# (CSharp) examples of SparseMatrix.getStateList extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

At(17)

Clone(12)

Clear(5)

Add(3)

ColCount(3)

AddValueTo(3)

AppendCols(2)

AddElement(2)

getActionList(2)

ComputeEigenPair(2)

getStateList(2)

CheckSymmetricalMatrixRules(2)

ClearColumn(1)

ContainsAt(1)

getPolicy(1)

Ax(1)

addState(1)

addAction(1)

Last(1)

ComputeNormAgainst(1)

Contains(1)

ClearRow(1)

CheckCount(1)

ColumnSums(1)

ColInd(1)

AddConstant(1)

AddValue(1)

ColumnEnumerator(1)

Example #1

Show file

File: RapportManager.cs Project: hanshan3290/AndroidStudioApp

        //TODO: FOR DEBUG ONLY
        public void printPolicy(SparseMatrix<DialogueState, DialogueAction> policy)
        {
            Console.Write("       ");
            //Print actions
            foreach (DialogueAction act in policy.getActionList())
            {
                Console.Write(act.getCommunicativeAct().getCommActType() + " ");
            } Console.WriteLine();

            //Print State and values
            foreach (DialogueState st in policy.getStateList())
            {
                Console.Write(st.CurrentUtterance + "   ");
                double[] values = policy[st];

                for (int a = 0; a < policy.getActionList().Count; a++)
                {
                    Console.Write(values[a].ToString("#.000") + "    ");    //#.000 - 3 decimal points
                } Console.WriteLine();
            } Console.WriteLine();
        }

Example #2

Show file

File: RapportManager.cs Project: hanshan3290/AndroidStudioApp

        public void runRL()
        {
            //CODE BELOW IS ONLY FOR TESTING RL
            int NStates = 5, NActions = (int)COMMUNICATIVE_ACT.COMM_ITEMS, NEpisodes = 50, NIterations = 20;
            Random rand = new Random();

            SparseMatrix<DialogueState, DialogueAction> policy = new SparseMatrix<DialogueState, DialogueAction>();

            for (int s = 0; s < NStates; s++)
            {
                //Create new State
                DialogueState ds = new DialogueState();
                ds.CurrentUtterance = "state" + s;
                policy.addState(ds);
            }

            for (int a = 0; a < NActions; a++)
            {
                DialogueAction da = new DialogueAction();
                da.setVerbalAct(new CommunicativeAct((COMMUNICATIVE_ACT)(a % (int)COMMUNICATIVE_ACT.COMM_ITEMS)));
                policy.addAction(da);
            }

            DialogueState currState = policy.getStateList()[0];
            DialogueAction currAct = policy.getActionList()[0];

            //QLearner<DialogueState, DialogueAction> RLearner = new QLearner<DialogueState, DialogueAction>(0.95, 0.7, 0.15, policy, rewardFunction);
            QLambdaLearner<DialogueState, DialogueAction> RLearner = new QLambdaLearner<DialogueState, DialogueAction>(0.95, 0.9, 0.15, 0.8, policy, rewardFunction);
            //SARSALearner<DialogueState, DialogueAction> RLearner = new SARSALearner<DialogueState, DialogueAction>(0.95, 0.9, 0.15, 0.8, policy, rewardFunction);

            RLearner.setStartState(currState);

            //Iterate
            for (int episode = 0; episode < NEpisodes; episode++)
            {
                currState = policy.getStateList()[0];
                currAct = policy.getActionList()[0];
                int stateIndex = 0;

                for (int iteration = 0; (iteration < NIterations) && (currState.CurrentUtterance != "state4"); iteration++)
                {
                    currAct = RLearner.nextAction();

                    //Observe new state
                    if (currAct.getCommunicativeAct().getCommActType() == COMMUNICATIVE_ACT.NO_COMM)
                    {
                        currState = policy.getStateList()[(++stateIndex) % NStates];
                    }

                    //Update (and observe reward)
                    RLearner.update(currState, currAct);
                }

                //Final update to get final reward
                //qLearner.update(currState, currAct);

                RLearner.newEpisode();

                Console.WriteLine("EPISODE " + episode + ": " + RLearner.getEpisodeReward(episode));
            }

            Console.WriteLine("\nPolicy items: " + policy.getPolicy().Count + "\n");

            foreach (Tuple<DialogueState, DialogueAction> t in policy.getPolicy().Keys)
            {
                Console.WriteLine("State: " + t.Item1.CurrentUtterance + ", Action: " + t.Item2.getCommunicativeAct().getCommActType() + "\n");
            }

            printPolicy(policy);
        }