C# (CSharp) POMDP BeliefState.AddBelief 예제들

프로그래밍 언어: C# (CSharp)

네임스페이스/패키지 이름: POMDP

클래스/타입: BeliefState

메소드/함수: AddBelief

hotexamples.com에서의 예제들: 3

C# (CSharp) POMDP BeliefState.AddBelief - 3개의 예제를 찾았습니다. 아래는 오픈소스 프로젝트에서 추출한 C# (CSharp) POMDP.BeliefState.AddBelief 메서드의 실제 사용 예제 가운데 평가가 가장 높은 것들입니다. 각 예제를 평가하면 예제의 품질을 높이는 데 도움이 됩니다.

자주 사용되는 메소드들

보기 숨기기

Next(6)

AddBelief(3)

RandomState(3)

Reward(2)

Validate(2)

sampleState(2)

Beliefs(1)

RandomObservation(1)

예제 #1

파일 보기

파일: BeliefState.cs 프로젝트: abadied/AI_POMDP

        /// <summary>
        /// Computes the belief state that follows this one after executing action
        /// <paramref name="a"/> and receiving observation <paramref name="o"/>.
        /// </summary>
        /// <remarks>
        /// For every state s' in the domain the unnormalized weight is
        /// ObservationProbability(s', a, o) * sum over s of TransitionProbability(s, a, s') * b(s),
        /// where only states s whose Successors(a) contain s' contribute. The weights are
        /// recorded through AddBelief and then every entry of the new belief map is divided
        /// by the sum of the weights.
        /// If the weights sum to 0 (the observation cannot occur after this action from the
        /// current belief) the division yields NaN entries; debug builds flag this case.
        /// </remarks>
        /// <param name="a">The action that was executed.</param>
        /// <param name="o">The observation that was received after the action.</param>
        /// <returns>A newly created belief state over the same domain.</returns>
        public BeliefState Next(Action a, Observation o)
        {
            BeliefState bsNext = new BeliefState(m_dDomain);
            double normalizationFactor = 0.0;

            foreach (State stateTag in m_dDomain.States)
            {
                double updateProbabilityForState = 0.0;
                foreach (State state in m_dDomain.States)
                {
                    // A state that is absent from the belief map, or stored with exactly
                    // zero mass, contributes nothing to the sum, so skip it before paying
                    // for the successor lookup (and instead of throwing on a missing key).
                    double beliefOfState;
                    if (!m_dBeliefs.TryGetValue(state, out beliefOfState) || beliefOfState == 0.0)
                    {
                        continue;
                    }

                    if (state.Successors(a).Contains(stateTag))
                    {
                        double transitionProbability = state.TransitionProbability(a: a, sTag: stateTag);
                        updateProbabilityForState += transitionProbability * beliefOfState;
                    }
                }

                updateProbabilityForState *= stateTag.ObservationProbability(a: a, o: o);
                bsNext.AddBelief(stateTag, updateProbabilityForState);
                normalizationFactor += updateProbabilityForState;
            }

            Debug.Assert(normalizationFactor > 0.0, "Observation has zero probability under this belief and action; normalization would produce NaN.");

            // Snapshot the keys once: this avoids re-enumerating the key collection for
            // every index (quadratic) and avoids writing to the map while enumerating it.
            foreach (State stateToNormalize in bsNext.m_dBeliefs.Keys.ToList())
            {
                bsNext.m_dBeliefs[stateToNormalize] /= normalizationFactor;
            }

            Debug.Assert(bsNext.Validate());
            return bsNext;
        }

예제 #2

파일 보기

        /// <summary>
        /// Builds the belief state reached from this one after executing action
        /// <paramref name="a"/> and receiving observation <paramref name="o"/>.
        /// </summary>
        /// <remarks>
        /// Each state s' in the domain is added to the result with the value
        /// ObservationProbability(s', a, o) * transitionProbabilityForEachState(s', a)
        /// / probabilityOfObservationGivenAB(a, o).
        /// Related identity noted by the original author (lecture 13, page 3):
        /// t(b,a,b') = pr(b'|a,b) = sum over all o in omega of pr(b'|a,o,b) * pr(o|a,b).
        /// The result is not validated here.
        /// NOTE(review): if probabilityOfObservationGivenAB returns 0 the division produces
        /// NaN or Infinity - confirm callers never pass an impossible observation.
        /// </remarks>
        /// <param name="a">The action that was executed.</param>
        /// <param name="o">The observation that was received after the action.</param>
        /// <returns>A newly created belief state over the same domain.</returns>
        public BeliefState Next(Action a, Observation o)
        {
            BeliefState bsNext = new BeliefState(m_dDomain);

            // The denominator depends only on (a, o), so evaluate it once instead of once
            // per state. Assumes the helper is side-effect free - TODO confirm.
            double observationProbability = probabilityOfObservationGivenAB(a, o);

            foreach (State sTag in m_dDomain.States)
            {
                double stateProbabilityInBtag = sTag.ObservationProbability(a, o) * transitionProbabilityForEachState(sTag, a) / observationProbability;
                bsNext.AddBelief(sTag, stateProbabilityInBtag);
            }

            return bsNext;
        }

예제 #3

파일 보기

        /// <summary>
        /// Computes the belief state that follows this one after executing action
        /// <paramref name="a"/> and receiving observation <paramref name="o"/>.
        /// </summary>
        /// <remarks>
        /// Only successors of states that currently hold positive belief are considered.
        /// The result is normalized by the sum of the unnormalized values rather than by
        /// computing Pr(o | a, b) separately.
        /// </remarks>
        /// <param name="a">The action that was executed.</param>
        /// <param name="o">The observation that was received after the action.</param>
        /// <returns>A newly created belief state over the same domain.</returns>
        public BeliefState Next(Action a, Observation o)
        {
            BeliefState bsNext = new BeliefState(m_dDomain);
            HashSet<State> successors = new HashSet<State>();

            // Pass 1: walk every positively weighted state and push its belief, scaled by
            // the transition probability, onto each of its successors. The successor set
            // is collected in the same sweep so no separate predecessor search is needed.
            foreach (KeyValuePair<State, double> belief in m_dBeliefs)
            {
                if (!(belief.Value > 0))
                {
                    continue;
                }

                State source = belief.Key;
                double mass = belief.Value;
                foreach (State target in source.Successors(a))
                {
                    successors.Add(target);
                    bsNext.AddBelief(target, mass * source.TransitionProbability(a, target));
                }
            }

            // Pass 2: weight each collected successor by the observation probability and
            // accumulate the total that will serve as the normalizer.
            double total = 0;
            foreach (State target in successors)
            {
                double observationLikelihood = target.ObservationProbability(a, o);
                double weighted = bsNext[target] * observationLikelihood;
                total += weighted;
                bsNext[target] = weighted;
            }

            // Pass 3: divide by the total so the stored values form a distribution.
            foreach (State target in successors)
            {
                bsNext[target] = bsNext[target] / total;
            }

            Debug.Assert(bsNext.Validate());
            return bsNext;
        }