C# (CSharp) webis.naiveBayes.processing DocumentSource示例

编程语言: C# (CSharp)

命名空间/包名称: webis.naiveBayes.processing

类/类型: DocumentSource

hotexamples.com的示例: 3

C# (CSharp) webis.naiveBayes.processing DocumentSource - 共找到 3 个示例。这些是从开源项目中提取的、评价最高的 webis.naiveBayes.processing.DocumentSource 真实 C# (CSharp) 代码示例。您可以为示例评分，帮助我们提高示例质量。

示例#1

显示文件

文件： WordLevelProcessor.cs 项目： pombredanne/peng04

        /// <summary>
        /// Builds a <see cref="TextSource"/> containing one <see cref="DocumentSource"/> per
        /// input document, with each document split into word-level segments.
        /// </summary>
        /// <remarks>
        /// Periods, commas and line breaks ("\r\n" or a bare "\n") are emitted as segments of
        /// their own. Everything else is split on the space character only.
        /// </remarks>
        /// <param name="documents">Raw document texts to tokenize.</param>
        /// <param name="name">Value assigned to the <c>Name</c> of the returned source.</param>
        /// <returns>The populated <see cref="TextSource"/>.</returns>
        public TextSource Process(IEnumerable<string> documents, string name)
        {
            TextSource result = new TextSource();

            foreach (var item in documents)
            {
                var doc = new DocumentSource();

                // Cut the text at every "\r\n" first, so the bare "\n" padding below can never
                // tear a Windows line ending apart. This replaces an in-band "##n" placeholder,
                // which corrupted any document that literally contained "##n".
                var pieces = item.Split(new[] { "\r\n" }, StringSplitOptions.None);

                for (int i = 0; i < pieces.Length; i++)
                {
                    // Consider punctuation marks and new lines as separate words.
                    pieces[i] = pieces[i].Replace(".", " . ")
                                         .Replace(",", " , ")
                                         .Replace("\n", " \n ");
                }

                // Re-insert each "\r\n" surrounded by spaces so it becomes a single segment.
                var sItem = string.Join(" \r\n ", pieces);

                foreach (var segment in sItem.Split(new[] { ' ' }, StringSplitOptions.RemoveEmptyEntries))
                {
                    doc.LanguageSegments.Add(segment);
                }

                result.Documents.Add(doc);
            }

            result.Name = name;
            return result;
        }

示例#2

显示文件

文件： BayesTextClassifier.cs 项目： pombredanne/peng04

        /// <summary>
        /// Computes a base-10 log score for <paramref name="testData"/>: the log of
        /// <paramref name="prob_c"/> plus the log of the probability that
        /// <paramref name="trainingDistribution"/> reports for every window of
        /// <paramref name="n"/> consecutive language segments.
        /// </summary>
        /// <param name="trainingDistribution">Distribution queried once per n-gram via <c>GetProbability</c>.</param>
        /// <param name="testData">Document whose <c>LanguageSegments</c> are scanned.</param>
        /// <param name="n">Number of segments per n-gram window.</param>
        /// <param name="prob_c">Probability whose log seeds the sum.</param>
        /// <returns>The accumulated log10 score.</returns>
        public double P_c(CategoryProbabilityDistribution trainingDistribution, DocumentSource testData, int n, double prob_c)
        {
            double logScore = Math.Log10(prob_c);
            int start = 0;

            // Slide a window of n segments across the document, one position at a time.
            while (start <= testData.LanguageSegments.Count - n)
            {
                IEnumerable<string> ngram = testData.LanguageSegments.Skip(start).Take(n).ToArray();
                double logProbability = Math.Log10(trainingDistribution.GetProbability(ngram));

                // Floor each term at -1000 so that e.g. Log10(0) (negative infinity) cannot
                // swamp the sum. NaN passes through unchanged, as with a plain '<' check.
                logScore += Math.Max(logProbability, -1000.0);

                start++;
            }

            return logScore;
        }

示例#3

显示文件

文件： CharacterLevelProcessor.cs 项目： pombredanne/peng04

        /// <summary>
        /// Builds a <see cref="TextSource"/> containing one <see cref="DocumentSource"/> per
        /// input document, where every single character of a document becomes its own
        /// language segment.
        /// </summary>
        /// <param name="documents">Raw document texts to split into characters.</param>
        /// <param name="name">Value assigned to the <c>Name</c> of the returned source.</param>
        /// <returns>The populated <see cref="TextSource"/>.</returns>
        public TextSource Process(IEnumerable<string> documents, string name)
        {
            var textSource = new TextSource();

            foreach (string text in documents)
            {
                var document = new DocumentSource();

                // One segment per character, in original order.
                for (int index = 0; index < text.Length; index++)
                {
                    document.LanguageSegments.Add(text[index].ToString());
                }

                textSource.Documents.Add(document);
            }

            textSource.Name = name;
            return textSource;
        }