C# (CSharp) WebmindBrowser.BayesClassifier ExcludedWordsの例

プログラミング言語: C# (CSharp)

名前空間/パッケージ名: WebmindBrowser.BayesClassifier

クラス/型: ExcludedWords

hotexamples.comのコード掲載数: 6

C# (CSharp) WebmindBrowser.BayesClassifier ExcludedWords - 6件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたC# (CSharp)のWebmindBrowser.BayesClassifier.ExcludedWordsの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示 / 非表示

InitDefault(2)

IsExcluded(1)

コード例 #1

ファイルを表示

ファイル: testClassifier.cs プロジェクト: SihangZhou/webbrowser

        /// <summary>
        /// Computes a naive-Bayes log score for each category in <paramref name="sd"/>
        /// against the text in <paramref name="fileContent"/>.
        /// </summary>
        /// <param name="fileContent">Text to classify; it is fed to a temporary
        /// <c>EnumerableCategory</c> whose enumerated keys are used as the feature words.</param>
        /// <param name="sd">Trained categories keyed by name.</param>
        /// <returns>
        /// One entry per key of <paramref name="sd"/>. Each value is the sum of the
        /// per-word log likelihoods plus the log prior of the category; scores are
        /// not normalised.
        /// </returns>
        private Dictionary <string, double> makePrediction(String fileContent, SortedDictionary <string, ICategory> sd)
        {
            ExcludedWords excludedWords = new ExcludedWords();

            excludedWords.InitDefault();
            EnumerableCategory words_in_file = new EnumerableCategory("", excludedWords);

            // Per the original author's note: this extracts the features (attribute
            // words) of the text that is about to be classified.
            words_in_file.TeachCategory(fileContent);

            // Everything is prepared; only the computation remains.
            Dictionary <string, double> score = new Dictionary <string, double>();

            foreach (KeyValuePair <string, ICategory> entry in sd)
            {
                score.Add(entry.Key, 0.0);
            }

            foreach (KeyValuePair <string, int> kvp1 in words_in_file)
            {
                // Compute P(f1 = x1 | s = si), where words_in_predictionfile is x1.
                // Only the key is used, so each distinct word contributes once.
                String words_in_predictionfile = kvp1.Key;
                foreach (KeyValuePair <string, ICategory> kvp in sd)
                {
                    ICategory cat = kvp.Value;

                    // How often the current feature word occurs in this category.
                    int count = cat.GetPhraseCount(words_in_predictionfile);
                    if (0 < count)
                    {
                        // Summing logs is the product of P(f = x | s = si) per category.
                        score[kvp.Key] += System.Math.Log((double)count / (double)cat.TotalWords);
                    }
                    else
                    {
                        // count == 0: use 0.01 in place of 0 so the logarithm stays defined.
                        score[kvp.Key] += System.Math.Log(0.01 / (double)cat.TotalWords);
                    }
                    System.Diagnostics.Trace.WriteLine(words_in_predictionfile + "(" +
                                                       kvp.Key + ")" + score[kvp.Key]);
                }
            }

            // Sum the sizes of all categories. Iterate as ICategory: the previous
            // `foreach (Category ...)` hid an explicit downcast that throws
            // InvalidCastException for any other ICategory implementation.
            int total = 0;

            foreach (ICategory cat in sd.Values)
            {
                total += cat.TotalWords;
            }

            // Add the log prior of each category: its share of all counted words.
            // NOTE(review): a category with TotalWords == 0 makes the divisions above
            // and below produce infinities/NaN - confirm whether empty categories can occur.
            foreach (KeyValuePair <string, ICategory> kvp in sd)
            {
                ICategory cat = kvp.Value;
                score[kvp.Key] += System.Math.Log((double)cat.TotalWords / (double)total);
            }
            return(score);
        }

コード例 #2

ファイルを表示

 /// <summary>
 /// Creates a classifier with an empty category map and an excluded-words
 /// list that has been set up through <c>InitDefault()</c>.
 /// </summary>
 public Classifier()
 {
     // Build and initialise the excluded-words list before publishing it to the field.
     ExcludedWords defaults = new ExcludedWords();
     defaults.InitDefault();

     m_ExcludedWords = defaults;
     m_Categories    = new SortedDictionary <string, ICategory>();
 }

コード例 #3

ファイルを表示

ファイル: Classifier.cs プロジェクト: ginobilinie/webbrowser

 /// <summary>
 /// Initialises the classifier: an empty, name-sorted category map and an
 /// excluded-words list populated by <c>InitDefault()</c>.
 /// </summary>
 public Classifier()
 {
     // Excluded words first; the two fields are initialised independently.
     this.m_ExcludedWords = new ExcludedWords();
     this.m_ExcludedWords.InitDefault();

     this.m_Categories = new SortedDictionary<string, ICategory>();
 }

コード例 #4

ファイルを表示

ファイル: testClassifier.cs プロジェクト: ginobilinie/webbrowser

        /// <summary>
        /// Scores the text in <paramref name="fileContent"/> against every category in
        /// <paramref name="sd"/> using summed log probabilities (naive Bayes).
        /// </summary>
        /// <param name="fileContent">Text to classify; it is taught to a temporary
        /// <c>EnumerableCategory</c> and the enumerated keys serve as feature words.</param>
        /// <param name="sd">Trained categories keyed by name.</param>
        /// <returns>
        /// A dictionary with one entry per key of <paramref name="sd"/>: the sum of the
        /// per-word log likelihoods plus the log prior of that category (not normalised).
        /// </returns>
        private Dictionary<string, double> makePrediction(String fileContent, SortedDictionary<string, ICategory> sd)
        {
            ExcludedWords excludedWords = new ExcludedWords();
            excludedWords.InitDefault();
            EnumerableCategory words_in_file = new EnumerableCategory("", excludedWords);

            // Per the original author's note: this extracts the features (attribute
            // words) of the text that is about to be classified.
            words_in_file.TeachCategory(fileContent);

            // Everything is prepared; only the computation remains.
            Dictionary<string, double> score = new Dictionary<string, double>();
            foreach (KeyValuePair<string, ICategory> entry in sd)
            {
                score.Add(entry.Key, 0.0);
            }

            foreach (KeyValuePair<string, int> kvp1 in words_in_file)
            {
                // Compute P(f1 = x1 | s = si), where words_in_predictionfile is x1.
                // Only the key is used, so each distinct word contributes once.
                String words_in_predictionfile = kvp1.Key;
                foreach (KeyValuePair<string, ICategory> kvp in sd)
                {
                    ICategory cat = kvp.Value;

                    // How often the current feature word occurs in this category.
                    int count = cat.GetPhraseCount(words_in_predictionfile);
                    if (0 < count)
                    {
                        // Summing logs is the product of P(f = x | s = si) per category.
                        score[kvp.Key] += System.Math.Log((double)count / (double)cat.TotalWords);
                    }
                    else
                    {
                        // count == 0: use 0.01 in place of 0 so the logarithm stays defined.
                        score[kvp.Key] += System.Math.Log(0.01 / (double)cat.TotalWords);
                    }
                    System.Diagnostics.Trace.WriteLine(words_in_predictionfile + "(" +
                        kvp.Key + ")" + score[kvp.Key]);
                }

            }

            // Total word count over all categories. Enumerate as ICategory: the earlier
            // `foreach (Category ...)` performed a hidden downcast that throws
            // InvalidCastException when a value is some other ICategory implementation.
            int total = 0;
            foreach (ICategory cat in sd.Values)
            {
                total += cat.TotalWords;
            }

            // Add the log prior of each category: its share of all counted words.
            // NOTE(review): a category with TotalWords == 0 makes the divisions above
            // and below produce infinities/NaN - confirm whether empty categories can occur.
            foreach (KeyValuePair<string, ICategory> kvp in sd)
            {
                ICategory cat = kvp.Value;
                score[kvp.Key] += System.Math.Log((double)cat.TotalWords / (double)total);
            }
            return score;
        }

コード例 #5

ファイルを表示

 /// <summary>
 /// Creates a category with the given name, the supplied excluded-words
 /// instance, and an empty phrase-count dictionary.
 /// </summary>
 /// <param name="cat">Value stored as the category name.</param>
 /// <param name="excluded">Excluded-words instance stored for this category.</param>
 public Category(string cat, ExcludedWords excluded)
 {
     this.m_Name     = cat;
     this.m_Excluded = excluded;

     // Phrase counts start out empty.
     this.m_Phrases  = new Dictionary<string, int>();
 }

コード例 #6

ファイルを表示

 /// <summary>
 /// Creates the category by forwarding both arguments unchanged to the
 /// base-class constructor; no additional initialisation is performed here.
 /// </summary>
 /// <param name="Cat">Passed through to the base constructor.</param>
 /// <param name="Excluded">Passed through to the base constructor.</param>
 public EnumerableCategory(string Cat, ExcludedWords Excluded)
     : base(Cat, Excluded)
 {
     // Intentionally empty: the base constructor does all the work.
 }